diff --git a/public/img/serotype_capsular_structure/capsular_structure_legend.svg b/public/img/serotype_capsular_structure/capsular_structure_legend.svg new file mode 100644 index 0000000..1926b17 --- /dev/null +++ b/public/img/serotype_capsular_structure/capsular_structure_legend.svg @@ -0,0 +1,1695 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + 
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_10A_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_10A_capsular_structure.svg new file mode 100644 index 0000000..f7f1f24 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_10A_capsular_structure.svg 
@@ -0,0 +1,160 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_10B_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_10B_capsular_structure.svg new file mode 100644 index 0000000..6277e68 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_10B_capsular_structure.svg @@ -0,0 +1,139 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_10C_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_10C_capsular_structure.svg new file mode 100644 index 0000000..e202683 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_10C_capsular_structure.svg @@ -0,0 +1,141 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_10D_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_10D_capsular_structure.svg new file mode 100644 index 0000000..6a46f84 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_10D_capsular_structure.svg @@ -0,0 +1,155 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + 
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_10F_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_10F_capsular_structure.svg new file mode 100644 index 0000000..35ac94c --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_10F_capsular_structure.svg @@ -0,0 +1,144 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_11A_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_11A_capsular_structure.svg new file mode 100644 index 0000000..8b562b6 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_11A_capsular_structure.svg @@ -0,0 +1,215 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_11B_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_11B_capsular_structure.svg new file mode 100644 index 0000000..a96a723 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_11B_capsular_structure.svg @@ -0,0 +1,165 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + 
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_11C_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_11C_capsular_structure.svg new file mode 100644 index 0000000..6022177 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_11C_capsular_structure.svg @@ -0,0 +1,167 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_11D_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_11D_capsular_structure.svg new file mode 100644 index 0000000..057be70 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_11D_capsular_structure.svg @@ -0,0 +1,398 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git 
a/public/img/serotype_capsular_structure/serotype_11E_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_11E_capsular_structure.svg new file mode 100644 index 0000000..729e20d --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_11E_capsular_structure.svg @@ -0,0 +1,189 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_11F_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_11F_capsular_structure.svg new file mode 100644 index 0000000..ea5b872 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_11F_capsular_structure.svg @@ -0,0 +1,172 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_12A_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_12A_capsular_structure.svg new file mode 100644 index 0000000..7e7cb97 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_12A_capsular_structure.svg @@ -0,0 +1,131 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git 
a/public/img/serotype_capsular_structure/serotype_12F_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_12F_capsular_structure.svg new file mode 100644 index 0000000..48cb504 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_12F_capsular_structure.svg @@ -0,0 +1,275 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_13_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_13_capsular_structure.svg new file mode 100644 index 0000000..36e9846 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_13_capsular_structure.svg @@ -0,0 +1,135 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_14_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_14_capsular_structure.svg new file mode 100644 index 0000000..ee57388 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_14_capsular_structure.svg @@ -0,0 +1,94 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git 
a/public/img/serotype_capsular_structure/serotype_15A_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_15A_capsular_structure.svg new file mode 100644 index 0000000..2de0a05 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_15A_capsular_structure.svg @@ -0,0 +1,130 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_15B_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_15B_capsular_structure.svg new file mode 100644 index 0000000..42244a1 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_15B_capsular_structure.svg @@ -0,0 +1,234 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_15C_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_15C_capsular_structure.svg new file mode 100644 index 0000000..c8215f6 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_15C_capsular_structure.svg @@ -0,0 +1,131 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git 
a/public/img/serotype_capsular_structure/serotype_15D_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_15D_capsular_structure.svg new file mode 100644 index 0000000..d943f68 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_15D_capsular_structure.svg @@ -0,0 +1,139 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_15F_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_15F_capsular_structure.svg new file mode 100644 index 0000000..d28ea98 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_15F_capsular_structure.svg @@ -0,0 +1,148 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_16A_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_16A_capsular_structure.svg new file mode 100644 index 0000000..47790b3 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_16A_capsular_structure.svg @@ -0,0 +1,170 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_16F_capsular_structure.svg 
b/public/img/serotype_capsular_structure/serotype_16F_capsular_structure.svg new file mode 100644 index 0000000..7d8fa97 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_16F_capsular_structure.svg @@ -0,0 +1,137 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_17A_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_17A_capsular_structure.svg new file mode 100644 index 0000000..c4aa96c --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_17A_capsular_structure.svg @@ -0,0 +1,176 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_17F_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_17F_capsular_structure.svg new file mode 100644 index 0000000..91e8446 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_17F_capsular_structure.svg @@ -0,0 +1,155 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_18A_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_18A_capsular_structure.svg new file mode 100644 
index 0000000..8f82571 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_18A_capsular_structure.svg @@ -0,0 +1,135 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_18B_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_18B_capsular_structure.svg new file mode 100644 index 0000000..94ac690 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_18B_capsular_structure.svg @@ -0,0 +1,133 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_18C_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_18C_capsular_structure.svg new file mode 100644 index 0000000..981e364 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_18C_capsular_structure.svg @@ -0,0 +1,139 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_18F_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_18F_capsular_structure.svg new file mode 100644 index 0000000..e265083 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_18F_capsular_structure.svg @@ -0,0 +1,153 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + 
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_19A_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_19A_capsular_structure.svg new file mode 100644 index 0000000..4a9b679 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_19A_capsular_structure.svg @@ -0,0 +1,80 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_19B_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_19B_capsular_structure.svg new file mode 100644 index 0000000..9dde6fd --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_19B_capsular_structure.svg @@ -0,0 +1,131 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_19C_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_19C_capsular_structure.svg new file mode 100644 index 0000000..f9890e8 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_19C_capsular_structure.svg @@ -0,0 +1,152 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git 
a/public/img/serotype_capsular_structure/serotype_19F_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_19F_capsular_structure.svg new file mode 100644 index 0000000..510826a --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_19F_capsular_structure.svg @@ -0,0 +1,80 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_1_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_1_capsular_structure.svg new file mode 100644 index 0000000..f487e13 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_1_capsular_structure.svg @@ -0,0 +1,124 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_20A_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_20A_capsular_structure.svg new file mode 100644 index 0000000..c28bc5c --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_20A_capsular_structure.svg @@ -0,0 +1,220 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_20B_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_20B_capsular_structure.svg new file mode 100644 index 
0000000..805b1dd --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_20B_capsular_structure.svg @@ -0,0 +1,238 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_20C_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_20C_capsular_structure.svg new file mode 100644 index 0000000..170ee6d --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_20C_capsular_structure.svg @@ -0,0 +1,214 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_22A_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_22A_capsular_structure.svg new file mode 100644 index 0000000..e9da923 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_22A_capsular_structure.svg @@ -0,0 +1,156 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff 
--git a/public/img/serotype_capsular_structure/serotype_22F_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_22F_capsular_structure.svg new file mode 100644 index 0000000..0a8bcee --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_22F_capsular_structure.svg @@ -0,0 +1,156 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_23A_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_23A_capsular_structure.svg new file mode 100644 index 0000000..05af83a --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_23A_capsular_structure.svg @@ -0,0 +1,110 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_23B_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_23B_capsular_structure.svg new file mode 100644 index 0000000..d53551e --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_23B_capsular_structure.svg @@ -0,0 +1,92 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_23F_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_23F_capsular_structure.svg new file mode 100644 index 0000000..69b709c --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_23F_capsular_structure.svg @@ -0,0 +1,107 @@ + 
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_24A_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_24A_capsular_structure.svg new file mode 100644 index 0000000..4090e48 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_24A_capsular_structure.svg @@ -0,0 +1,133 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_24B_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_24B_capsular_structure.svg new file mode 100644 index 0000000..0b0d634 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_24B_capsular_structure.svg @@ -0,0 +1,132 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_24F_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_24F_capsular_structure.svg new file mode 100644 index 0000000..2f797ac --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_24F_capsular_structure.svg @@ -0,0 +1,135 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git 
a/public/img/serotype_capsular_structure/serotype_27_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_27_capsular_structure.svg new file mode 100644 index 0000000..f90a68f --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_27_capsular_structure.svg @@ -0,0 +1,134 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_28A_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_28A_capsular_structure.svg new file mode 100644 index 0000000..144cfb6 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_28A_capsular_structure.svg @@ -0,0 +1,139 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_28F_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_28F_capsular_structure.svg new file mode 100644 index 0000000..50ef62c --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_28F_capsular_structure.svg @@ -0,0 +1,142 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_29_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_29_capsular_structure.svg new file mode 100644 index 0000000..9d8cb83 --- 
/dev/null +++ b/public/img/serotype_capsular_structure/serotype_29_capsular_structure.svg @@ -0,0 +1,118 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_2_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_2_capsular_structure.svg new file mode 100644 index 0000000..bae4271 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_2_capsular_structure.svg @@ -0,0 +1,122 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_31_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_31_capsular_structure.svg new file mode 100644 index 0000000..110d284 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_31_capsular_structure.svg @@ -0,0 +1,136 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_32A_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_32A_capsular_structure.svg new file mode 100644 index 0000000..89fde32 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_32A_capsular_structure.svg @@ -0,0 +1,142 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + 
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_32F_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_32F_capsular_structure.svg new file mode 100644 index 0000000..6113468 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_32F_capsular_structure.svg @@ -0,0 +1,138 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_33A_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_33A_capsular_structure.svg new file mode 100644 index 0000000..2503048 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_33A_capsular_structure.svg @@ -0,0 +1,168 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_33B_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_33B_capsular_structure.svg new file mode 100644 index 0000000..9a84db6 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_33B_capsular_structure.svg @@ -0,0 +1,165 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + 
+ + + + + diff --git a/public/img/serotype_capsular_structure/serotype_33C_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_33C_capsular_structure.svg new file mode 100644 index 0000000..654ec32 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_33C_capsular_structure.svg @@ -0,0 +1,165 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_33D_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_33D_capsular_structure.svg new file mode 100644 index 0000000..2cce2f2 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_33D_capsular_structure.svg @@ -0,0 +1,165 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_33E_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_33E_capsular_structure.svg new file mode 100644 index 0000000..6919dac --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_33E_capsular_structure.svg @@ -0,0 +1,127 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_33F_capsular_structure.svg 
b/public/img/serotype_capsular_structure/serotype_33F_capsular_structure.svg new file mode 100644 index 0000000..e08d983 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_33F_capsular_structure.svg @@ -0,0 +1,148 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_33G_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_33G_capsular_structure.svg new file mode 100644 index 0000000..2a4d868 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_33G_capsular_structure.svg @@ -0,0 +1,147 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_34_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_34_capsular_structure.svg new file mode 100644 index 0000000..14177c2 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_34_capsular_structure.svg @@ -0,0 +1,145 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_35A_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_35A_capsular_structure.svg new file mode 100644 index 0000000..84b9b3c --- /dev/null +++ 
b/public/img/serotype_capsular_structure/serotype_35A_capsular_structure.svg @@ -0,0 +1,160 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_35B_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_35B_capsular_structure.svg new file mode 100644 index 0000000..2bcd041 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_35B_capsular_structure.svg @@ -0,0 +1,131 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_35C_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_35C_capsular_structure.svg new file mode 100644 index 0000000..f5e05f1 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_35C_capsular_structure.svg @@ -0,0 +1,176 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_35D_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_35D_capsular_structure.svg new file mode 100644 index 0000000..20d60ce --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_35D_capsular_structure.svg @@ -0,0 +1,122 @@ + + 
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_35F_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_35F_capsular_structure.svg new file mode 100644 index 0000000..487ee9d --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_35F_capsular_structure.svg @@ -0,0 +1,132 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_36A_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_36A_capsular_structure.svg new file mode 100644 index 0000000..db90deb --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_36A_capsular_structure.svg @@ -0,0 +1,139 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_36B_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_36B_capsular_structure.svg new file mode 100644 index 0000000..b391d7c --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_36B_capsular_structure.svg @@ -0,0 +1,139 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + 
+ + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_37_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_37_capsular_structure.svg new file mode 100644 index 0000000..e8c34df --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_37_capsular_structure.svg @@ -0,0 +1,59 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_38_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_38_capsular_structure.svg new file mode 100644 index 0000000..c4968a3 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_38_capsular_structure.svg @@ -0,0 +1,134 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_39_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_39_capsular_structure.svg new file mode 100644 index 0000000..3ad41d5 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_39_capsular_structure.svg @@ -0,0 +1,210 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_3_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_3_capsular_structure.svg new file mode 100644 index 0000000..1366017 --- 
/dev/null +++ b/public/img/serotype_capsular_structure/serotype_3_capsular_structure.svg @@ -0,0 +1,56 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_41A_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_41A_capsular_structure.svg new file mode 100644 index 0000000..f8b528d --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_41A_capsular_structure.svg @@ -0,0 +1,151 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_41F_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_41F_capsular_structure.svg new file mode 100644 index 0000000..3a4f261 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_41F_capsular_structure.svg @@ -0,0 +1,225 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_42_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_42_capsular_structure.svg new file mode 100644 index 0000000..fc5fe17 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_42_capsular_structure.svg @@ -0,0 +1,162 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + 
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_45_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_45_capsular_structure.svg new file mode 100644 index 0000000..6f2e10e --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_45_capsular_structure.svg @@ -0,0 +1,146 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_47A_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_47A_capsular_structure.svg new file mode 100644 index 0000000..0ba6f34 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_47A_capsular_structure.svg @@ -0,0 +1,177 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_47F_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_47F_capsular_structure.svg new file mode 100644 index 0000000..b9ec9c9 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_47F_capsular_structure.svg @@ -0,0 +1,152 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + 
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_4_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_4_capsular_structure.svg new file mode 100644 index 0000000..f7e6b95 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_4_capsular_structure.svg @@ -0,0 +1,115 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_5_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_5_capsular_structure.svg new file mode 100644 index 0000000..0bf4428 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_5_capsular_structure.svg @@ -0,0 +1,113 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_6A_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_6A_capsular_structure.svg new file mode 100644 index 0000000..8a3cc7f --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_6A_capsular_structure.svg @@ -0,0 +1,92 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_6B_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_6B_capsular_structure.svg new file mode 100644 index 0000000..3b2851b --- /dev/null +++ 
b/public/img/serotype_capsular_structure/serotype_6B_capsular_structure.svg @@ -0,0 +1,92 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_6C_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_6C_capsular_structure.svg new file mode 100644 index 0000000..f30e6f4 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_6C_capsular_structure.svg @@ -0,0 +1,92 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_6D_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_6D_capsular_structure.svg new file mode 100644 index 0000000..64e0def --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_6D_capsular_structure.svg @@ -0,0 +1,92 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_7A_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_7A_capsular_structure.svg new file mode 100644 index 0000000..5c0bbc2 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_7A_capsular_structure.svg @@ -0,0 +1,128 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_7B_capsular_structure.svg 
b/public/img/serotype_capsular_structure/serotype_7B_capsular_structure.svg new file mode 100644 index 0000000..bde083a --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_7B_capsular_structure.svg @@ -0,0 +1,149 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_7C_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_7C_capsular_structure.svg new file mode 100644 index 0000000..6e0f86b --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_7C_capsular_structure.svg @@ -0,0 +1,146 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_7F_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_7F_capsular_structure.svg new file mode 100644 index 0000000..881faa7 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_7F_capsular_structure.svg @@ -0,0 +1,149 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_8_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_8_capsular_structure.svg new file mode 100644 index 0000000..e77a596 --- /dev/null +++ 
b/public/img/serotype_capsular_structure/serotype_8_capsular_structure.svg @@ -0,0 +1,92 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_9A_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_9A_capsular_structure.svg new file mode 100644 index 0000000..0db1ae7 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_9A_capsular_structure.svg @@ -0,0 +1,178 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_9L_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_9L_capsular_structure.svg new file mode 100644 index 0000000..325bb37 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_9L_capsular_structure.svg @@ -0,0 +1,104 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_capsular_structure/serotype_9N_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_9N_capsular_structure.svg new file mode 100644 index 0000000..c9ad6e4 --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_9N_capsular_structure.svg @@ -0,0 +1,104 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + 
+ + + diff --git a/public/img/serotype_capsular_structure/serotype_9V_capsular_structure.svg b/public/img/serotype_capsular_structure/serotype_9V_capsular_structure.svg new file mode 100644 index 0000000..643f96a --- /dev/null +++ b/public/img/serotype_capsular_structure/serotype_9V_capsular_structure.svg @@ -0,0 +1,207 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_cps/cps_legend.svg b/public/img/serotype_cps/cps_legend.svg index 6f6af97..c647b84 100644 --- a/public/img/serotype_cps/cps_legend.svg +++ b/public/img/serotype_cps/cps_legend.svg @@ -1,724 +1,1944 @@ - - - - + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + 
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + - - - - - - - - - - - - - - + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - 
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + 
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_cps/group_II_nonencapsulated-NCC1_pspK.svg b/public/img/serotype_cps/group_II_nonencapsulated-NCC1_pspK.svg new file mode 100644 index 0000000..d5eddf9 --- /dev/null +++ b/public/img/serotype_cps/group_II_nonencapsulated-NCC1_pspK.svg @@ -0,0 +1,94 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_cps/group_II_nonencapsulated-NCC2_S_mitis_aliC_aliD.svg b/public/img/serotype_cps/group_II_nonencapsulated-NCC2_S_mitis_aliC_aliD.svg new file mode 100644 index 0000000..759f913 --- /dev/null +++ b/public/img/serotype_cps/group_II_nonencapsulated-NCC2_S_mitis_aliC_aliD.svg @@ -0,0 +1,115 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_cps/group_II_nonencapsulated-NCC2_aliC_aliD.svg b/public/img/serotype_cps/group_II_nonencapsulated-NCC2_aliC_aliD.svg new file mode 100644 index 0000000..4eb4a63 --- /dev/null +++ b/public/img/serotype_cps/group_II_nonencapsulated-NCC2_aliC_aliD.svg @@ -0,0 +1,141 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_cps/group_II_nonencapsulated-NCC3_aliD.svg 
b/public/img/serotype_cps/group_II_nonencapsulated-NCC3_aliD.svg new file mode 100644 index 0000000..4361e3c --- /dev/null +++ b/public/img/serotype_cps/group_II_nonencapsulated-NCC3_aliD.svg @@ -0,0 +1,76 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_cps/serotype_10D_cps.svg b/public/img/serotype_cps/serotype_10D_cps.svg index 492f2ab..70466eb 100644 --- a/public/img/serotype_cps/serotype_10D_cps.svg +++ b/public/img/serotype_cps/serotype_10D_cps.svg @@ -1,196 +1,316 @@ - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + - diff --git a/public/img/serotype_cps/serotype_11F_like_cps.svg b/public/img/serotype_cps/serotype_11F-like_cps.svg similarity index 100% rename from public/img/serotype_cps/serotype_11F_like_cps.svg rename to public/img/serotype_cps/serotype_11F-like_cps.svg diff --git a/public/img/serotype_cps/serotype_11X_cps.svg b/public/img/serotype_cps/serotype_11X_cps.svg index 
3cc057f..449d0a0 100644 --- a/public/img/serotype_cps/serotype_11X_cps.svg +++ b/public/img/serotype_cps/serotype_11X_cps.svg @@ -1,287 +1,404 @@ - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_cps/serotype_16X_cps.svg b/public/img/serotype_cps/serotype_16X_cps.svg index a43bab1..4a35205 100644 --- a/public/img/serotype_cps/serotype_16X_cps.svg +++ b/public/img/serotype_cps/serotype_16X_cps.svg @@ -1,282 +1,453 @@ - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - 
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_cps/serotype_18X1_cps.svg b/public/img/serotype_cps/serotype_18X1_cps.svg index 84c0701..bd77fc6 100644 --- a/public/img/serotype_cps/serotype_18X1_cps.svg +++ b/public/img/serotype_cps/serotype_18X1_cps.svg @@ -1,325 +1,540 @@ - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - 
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_cps/serotype_18X2_cps.svg b/public/img/serotype_cps/serotype_18X2_cps.svg index d2185c0..afa1df4 100644 --- a/public/img/serotype_cps/serotype_18X2_cps.svg +++ b/public/img/serotype_cps/serotype_18X2_cps.svg @@ -1,284 +1,435 @@ - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - 
- - - - + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_cps/serotype_18X3_cps.svg b/public/img/serotype_cps/serotype_18X3_cps.svg index 10ba0e6..cd1ac16 100644 --- a/public/img/serotype_cps/serotype_18X3_cps.svg +++ b/public/img/serotype_cps/serotype_18X3_cps.svg @@ -1,301 +1,479 @@ - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + 
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_cps/serotype_1_cps.svg b/public/img/serotype_cps/serotype_1_cps.svg index e7df78b..b089d39 100644 --- a/public/img/serotype_cps/serotype_1_cps.svg +++ b/public/img/serotype_cps/serotype_1_cps.svg @@ -1 +1,141 @@ - \ No newline at end of file + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_cps/serotype_33X_cps.svg b/public/img/serotype_cps/serotype_20C_cps.svg similarity index 63% rename from public/img/serotype_cps/serotype_33X_cps.svg rename to public/img/serotype_cps/serotype_20C_cps.svg index 77864d7..5d5ce26 100644 --- a/public/img/serotype_cps/serotype_33X_cps.svg +++ b/public/img/serotype_cps/serotype_20C_cps.svg @@ -1,38 +1,9 @@ - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - + + + + @@ -43,8 +14,8 @@ - - + + @@ -55,8 +26,8 @@ - - + + @@ -67,8 +38,8 @@ - - + + @@ -79,8 +50,8 @@ - - + + @@ -88,14 +59,14 @@ - + - - + + - - + + @@ -106,27 +77,38 @@ - + - - - + + - + + + + - + - + + + + + + + + + + - - + + - - + + @@ -134,41 +116,59 @@ - + - - + + - - + + - + - + + + + + + + + + + + + + - + + 
+ + - - + + - + - - + + + + + - - + + @@ -179,48 +179,59 @@ - - + + - + - + - - + + - - + + - + - - - - + + - + - - + + - - + + - - + + + + + + + + + + + + + + + diff --git a/public/img/serotype_cps/serotype_29X_cps.svg b/public/img/serotype_cps/serotype_29X_cps.svg index 45c0050..7fb1469 100644 --- a/public/img/serotype_cps/serotype_29X_cps.svg +++ b/public/img/serotype_cps/serotype_29X_cps.svg @@ -1,222 +1,331 @@ - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_cps/serotype_36X_cps.svg b/public/img/serotype_cps/serotype_36X_cps.svg deleted file mode 100644 index 43b427a..0000000 --- a/public/img/serotype_cps/serotype_36X_cps.svg +++ /dev/null @@ -1,249 +0,0 @@ - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - 
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - diff --git a/public/img/serotype_cps/serotype_3_cps.svg b/public/img/serotype_cps/serotype_3_cps.svg index d17a337..3e6b936 100644 --- a/public/img/serotype_cps/serotype_3_cps.svg +++ b/public/img/serotype_cps/serotype_3_cps.svg @@ -1 +1,75 @@ - \ No newline at end of file + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_cps/serotype_4_cps.svg b/public/img/serotype_cps/serotype_4_cps.svg index 363e5a7..1af9397 100644 --- a/public/img/serotype_cps/serotype_4_cps.svg +++ b/public/img/serotype_cps/serotype_4_cps.svg @@ -1 +1,135 @@ - \ No newline at end of file + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_cps/serotype_6C_cps.svg b/public/img/serotype_cps/serotype_6C_cps.svg index b63a9c2..ebd2b7c 100644 --- a/public/img/serotype_cps/serotype_6C_cps.svg +++ b/public/img/serotype_cps/serotype_6C_cps.svg @@ -1,209 +1,290 @@ - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + 
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_cps/serotype_6F_cps.svg b/public/img/serotype_cps/serotype_6F_cps.svg new file mode 100644 index 0000000..981397c --- /dev/null +++ b/public/img/serotype_cps/serotype_6F_cps.svg @@ -0,0 +1,331 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_cps/serotype_6G_cps.svg b/public/img/serotype_cps/serotype_6G_cps.svg new file mode 100644 index 0000000..f59e23b --- /dev/null +++ b/public/img/serotype_cps/serotype_6G_cps.svg @@ -0,0 +1,287 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + 
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/img/serotype_cps/serotype_9X_cps.svg b/public/img/serotype_cps/serotype_9X_cps.svg index bd7dd0f..4ddd02f 100644 --- a/public/img/serotype_cps/serotype_9X_cps.svg +++ b/public/img/serotype_cps/serotype_9X_cps.svg @@ -1,249 +1,377 @@ - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/public/res/serotype_genbank/serotype_1.gb b/public/res/serotype_genbank/serotype_1.gb new file mode 100644 index 0000000..28420eb --- /dev/null +++ b/public/res/serotype_genbank/serotype_1.gb @@ -0,0 +1,1022 @@ +LOCUS CR931632 22182 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 519/43 (serotype 1). 
+ACCESSION CR931632 +VERSION CR931632.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 22182) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 22182) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..22182 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="519/43" + /db_xref="taxon:1313" + gene <1..163 + /gene="dexB" + /locus_tag="SPC01_0001" + CDS <1..163 + /gene="dexB" + /locus_tag="SPC01_0001" + /codon_start=2 + /transl_table=11 + /protein_id="CAI32694.1" + /db_xref="GOA:Q4K2R1" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K2R1" + /translation="DRRFLVVANLSNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVP + WDAFCVELL" + gene 321..494 + /gene="aliB" + /locus_tag="SPC01_0002" + /pseudo + CDS 321..494 + /gene="aliB" + /locus_tag="SPC01_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + /db_xref="PSEUDO:CAI32695.1" + gene complement(order(490..630,2097..2279,2281..2826)) + /gene="tnp" + /locus_tag="SPC01_0003" + /pseudo + CDS complement(join(490..630,2097..2279,2281..2826)) + /gene="tnp" + /locus_tag="SPC01_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + gene complement(order(665..1249,1306..1971)) + /gene="tnp" + /locus_tag="SPC01_0004" + /pseudo + CDS complement(join(665..1249,1306..1971)) + /gene="tnp" + /locus_tag="SPC01_0004" + /note="member of homology group 13" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1167 transposase" + misc_feature complement(join(1169..1249,1306..1515)) + /gene="tnp" + /locus_tag="SPC01_0004" + /note="HMMPfam hit to PF01610, Transposase, score 6.6e-42" + /pseudo + misc_feature complement(2437..2808) + /gene="tnp" + /locus_tag="SPC01_0003" + /note="HMMPfam hit to PF01710, Transposase, score 4.1e-23" + /pseudo + gene 3061..4506 + /gene="wzg" + /locus_tag="SPC01_0005" + CDS 3061..4506 + /gene="wzg" + /locus_tag="SPC01_0005" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI32698.1" + 
/db_xref="GOA:Q4K384" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K384" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLICFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLLFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSKIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADS + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLTDGDRDRGRNQQKVIVAIIQKLTST + EVLKNYSSILQGLQDSLQTNIPIETMIDLVNTQLESGGNYKVNSQDLKGTGRMDLPSY + AMPDSNLYVMEIDDSSLTVVKAAIQDVMEGR" + misc_feature 3061..3177 + /gene="wzg" + /locus_tag="SPC01_0005" + /note="Signal peptide predicted for SPC0007 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 39 and 40" + misc_feature 3265..3612 + /gene="wzg" + /locus_tag="SPC01_0005" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 2.1e-62" + misc_feature 3790..4233 + /gene="wzg" + /locus_tag="SPC01_0005" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 1.3e-68" + gene 4508..5239 + /gene="wzh" + /locus_tag="SPC01_0006" + CDS 4508..5239 + /gene="wzh" + /locus_tag="SPC01_0006" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI32699.1" + /db_xref="GOA:Q4K383" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K383" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTLDALEKLEKKEIPTLNDS + RYALIEFSMHTSYRQIHTGLSNILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QINSYHVSKPKFFGEKYKFMKKRARYFLERDLVHVVASDMHNLDSRPPYMQQAYDIIA + KKYGAKKAKELFVDNPRKIIMDQLI" + misc_feature 4511..5119 + /gene="wzh" + /locus_tag="SPC01_0006" + /note="HMMPfam hit to PF02811, PHP domain, score 1.3e-37" 
+ gene 5248..5940 + /gene="wzd" + /locus_tag="SPC01_0007" + CDS 5248..5940 + /gene="wzd" + /locus_tag="SPC01_0007" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI32700.1" + /db_xref="GOA:Q4K382" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K382" + /translation="MKEQNTLEIDVLQLFRALWKRKLVILLVAIITSSVAFAYSTFVI + KPEFTSTTRIYVVNRNQGEKPGLTNQDLQAGAYLVKDYREIVLSQDVLEEVISDLKLD + LVPKGLANKIKVTVPVDTRIVSVSVSDRVPEEASRIANSLREVAAQKIISITRVSDVT + TLEEARPAISPSSPNIKRNTLIGFLAGVIGTSVIVLLLELLDTRVKRPEDIENALQMT + LLGVVPNLGKLK" + misc_feature 5266..5682 + /gene="wzd" + /locus_tag="SPC01_0007" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 1.6e-50" + misc_feature 5788..5865 + /gene="wzd" + /locus_tag="SPC01_0007" + /note="PS00217 Sugar transport proteins signature 2." + gene 5950..6615 + /gene="wze" + /locus_tag="SPC01_0008" + CDS 5950..6615 + /gene="wze" + /locus_tag="SPC01_0008" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI32701.1" + /db_xref="GOA:P96475" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:P96475" + /translation="MPTLEIAQKKLEFIKKAEEYYNTLCTNIQLSGDKLKVISVTSVN + PGEGKTTTSVNIAMSFARAGYKTLLFDGDIRNSVMSGFFKSREKITGLTEFLSGTADL + SHGLCDTNIENLFVVQSGSVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTPPIGIVI + DAAIITQKCDASILITATGEANKRDVQKAKQQLEQTGELFLGVVLNKLDISVDKYGVY + GRK" + gene 6756..7892 + /gene="wchB" + /locus_tag="SPC01_0009" + CDS 6756..7892 + /gene="wchB" + /locus_tag="SPC01_0009" + /note="member of homology group 206" + /codon_start=1 + /transl_table=11 + /product="galacturonosyl transferase" + /protein_id="CAI32702.1" + /db_xref="GOA:Q4K392" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K392" + 
/translation="MNLQKKKIMLITNHDDDIYCFRKEVIESLVEYGYEVLVSCPYGD + KIELMKSIQFEYEDITIDRRGINPLKDIRLFLSYIRLLRKYRPDVVLTYTVKPNVYAS + LAATILGIKYINNVTGLGSVLTMGSCVRSLVLLLFRISFRKSNCVFFQNEYNMKMLKT + LGLILGDSKLIPGSGVNIEKYPVQQYPNGGNGIQGETIVFNFIGRILKEKGIDTYLAA + AQIIKSRYPKTEFNIIGFIEPTESNYELKICDLEKKGIVYYLGQQKDVIPHITRSHAI + IHPSVYGEGMSNVLLENASSGRVLITTDNPGCKEIVKDRETGYIFQGGNVEELVSILE + VFLGLENEKRKEMGLQGRMYIEQYFSRQIIIDAYLDKIKGALDE" + misc_feature 7305..7817 + /gene="wchB" + /locus_tag="SPC01_0009" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 2e-40" + gene 7885..8436 + /gene="wchC" + /locus_tag="SPC01_0010" + CDS 7885..8436 + /gene="wchC" + /locus_tag="SPC01_0010" + /note="member of homology group 207" + /codon_start=1 + /transl_table=11 + /product="galacturonic acid acetyl transferase" + /protein_id="CAI32703.1" + /db_xref="GOA:P96477" + /db_xref="HSSP:1MR9" + /db_xref="InterPro:IPR011004" + /db_xref="InterPro:IPR018357" + /db_xref="UniProtKB/TrEMBL:P96477" + /translation="MNRIIKNIVGLLRANICLILLKVCRNKDLTFHYFLKFGKNVTVE + QESNAKLILGKKIRVNAGGVLKVRKGAKLKISDDVFLSNNCMIACRKYIDIKSGVKCG + PGVLIYDHDYDVSVPGGLKAKKFKTAPVMIGENVWIGANSIVLKGVSIGENSVVAAGS + VVTKDIPADTIFIQKRLSREMKL" + misc_feature 8098..8151 + /gene="wchC" + /locus_tag="SPC01_0010" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 81" + misc_feature 8269..8322 + /gene="wchC" + /locus_tag="SPC01_0010" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 6.8" + misc_feature 8296..8382 + /gene="wchC" + /locus_tag="SPC01_0010" + /note="PS00101 Hexapeptide-repeat containing-transferases + signature." 
+ misc_feature 8323..8376 + /gene="wchC" + /locus_tag="SPC01_0010" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 1.7" + gene 8433..9587 + /gene="wchD" + /locus_tag="SPC01_0011" + CDS 8433..9587 + /gene="wchD" + /locus_tag="SPC01_0011" + /note="member of homology group 208" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI32704.1" + /db_xref="GOA:P96478" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:P96478" + /translation="MKVFIATEFRCTIYKNEIYLKPKAYFIYERYAKAFGEIVLCSRY + EKVESYPEGYHKANFINKFIPIEGLHQVLFGQNKNKIIEGMIDSDLIVVRIPSIIGSK + TADYALKIGKPYLTEIMGDAWDSYWYHSLKGKLLAPYIYAKTKSIVKNANYCIYVTEK + YLQDRYPNIKSNIVASNVNITSVENRSLKSRLYKLKKFNPQKISIMTTASVNVRAKGH + RFVLEAMKRLEIQGILLDYYLAGDGDQSFLKKKAEELGVANRIHFLGELTTSQIYEYL + DKVDLYIQPSLQEGLPRAVIEAMSRACPCIGSNKAGIPELLGPHCLFTPSSSQAIAGS + IIDFISMDKEKMVIKQFEFSKKFLSSVLNKRRSDYFAQIRRELNNSDGLD" + misc_feature 8997..9503 + /gene="wchD" + /locus_tag="SPC01_0011" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 8.5e-22" + gene 9704..11008 + /gene="wzy" + /locus_tag="SPC01_0012" + CDS 9704..11008 + /gene="wzy" + /locus_tag="SPC01_0012" + /note="member of homology group 209" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI32705.1" + /db_xref="UniProtKB/TrEMBL:P96479" + /translation="MKFSLQSNDIKNKIILLVGVVFSGTLILCSENNDVTIPLFSMIF + LSFMAMIIVKFNIFHPYVWYSSFFTIYSISYPLLYRMEYINYGYTKDLIFMQWLALAT + LLLTLPSKAIVLSERKINLNNNNYLLFLNNMNTFITTVAIIYLLGSGFRNKGEIYSGA + NIVIMLVFSLVYFMILIHTYQLFIQLSTKKWRLLNCNTNTAIVICLFSIVTGERDYMF + TLFILDVIILFYFHKIKRFYLVMLVPLAALLIPLSAVFKYTLLSGQVSSINTNNIWFD + LLDGEFVSASRNLQILILHNMGNYFEGRSFFNDIVRIFYNTGYSNQTWFMDTFFPNVH + STKYGFTLVGEGYVNGGYFGIVMIFMLTGFLMRFLYINAQRNIYGMLIYLYMIPIFIY + STRADFANILSPLLKYAILGTLVIVFINRMVLISPLDEMGGE" + misc_feature 9704..9799 + /gene="wzy" + /locus_tag="SPC01_0012" + /note="Signal peptide predicted for SPC0014 by SignalP 2.0 + HMM 
(Signal peptide probability 0.933) with cleavage site + probability 0.413 between residues 32 and 33" + gene 11323..12363 + /gene="wzx" + /locus_tag="SPC01_0013" + CDS 11323..12363 + /gene="wzx" + /locus_tag="SPC01_0013" + /note="member of homology group 210" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI32706.1" + /db_xref="GOA:Q4K388" + /db_xref="InterPro:IPR002797" + /db_xref="InterPro:IPR004268" + /db_xref="UniProtKB/TrEMBL:Q4K388" + /translation="MNLVEIFYILGGVGLGQAYSTFKRNHSNEYQNKFVFLTFIQGLL + FGIIGLIIVLADVPIDYGGVIIVLSSLSIMRTNLTMIAVIENSIKRNKIVLGVSVVYS + VMLVLLLLFHLVSIEMVFLVYAINEFLRIILFLYYYNMFPVFEHISIKEFFTIYKFGF + LSMILTLLITFNYSIDIIMLKQMSSSYNVGIYSVAVTFSNMFLMVPDSFKEILFGDSA + KRTFEKNKAINAIKVSFLFMILLIIGFLSFGEFAITLLYGSSYIKAFPITLVIFLGSL + SMIFFKILQPIYISQGKQSVAIKILSVSALINISLNWYLIPNYQITGAAIASAISYTV + CGLFFIIDYLRN" + gene 12431..13501 + /gene="gla" + /locus_tag="SPC01_0014" + CDS 12431..13501 + /gene="gla" + /locus_tag="SPC01_0014" + /note="member of homology group 96" + /codon_start=1 + /transl_table=11 + /product="putative epimerase" + /protein_id="CAI32707.1" + /db_xref="GOA:P96481" + /db_xref="HSSP:1ORR" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR008089" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:P96481" + /translation="MRGKTILITGVAGFIGSNLVRKLLELEGTMTIIGLDNLNDYYDI + ALKDYRLLQLNKLIQDYPEKNWIFIKGDIADKMLINKIFKSYHPQIVVNLAAQAGVRY + SITNPDVYIESNIVGFHNVLEACRHSYEIYDGGVEHLVYASSSSVYGGNKKIPFATED + KVDNPISLYAATKKTNELQAYAYSKIYNIPSTGLRFFTVYGPAGRPDMAYFGFTDKLR + SGSDIEIYNHGNCKRDFTYIDDIVEGIVRVMQSAPKKLVGSDNLPLAPYKVYNIGNSK + PENLLDFVDVLQQELIKAGVLPENYDFDSHKKLVPMQPGDVPVTYADTSDLERDFGFK + PKTSLREGLRKFAEWYKDYYNV" + misc_feature 12443..13486 + /gene="gla" + /locus_tag="SPC01_0014" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 3.1e-05" + misc_feature 12446..13255 + /gene="gla" + /locus_tag="SPC01_0014" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 3.7e-06" + misc_feature 
12446..13249 + /gene="gla" + /locus_tag="SPC01_0014" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 5.3e-58" + misc_feature 12449..13327 + /gene="gla" + /locus_tag="SPC01_0014" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 3.6e-09" + gene 13530..14762 + /gene="ugd" + /locus_tag="SPC01_0015" + CDS 13530..14762 + /gene="ugd" + /locus_tag="SPC01_0015" + /note="member of homology group 20" + /codon_start=1 + /transl_table=11 + /product="UDP-glucose 6-dehydrogenase Ugd" + /protein_id="CAI32708.1" + /db_xref="GOA:Q4K386" + /db_xref="InterPro:IPR001732" + /db_xref="InterPro:IPR008927" + /db_xref="InterPro:IPR013328" + /db_xref="InterPro:IPR014026" + /db_xref="InterPro:IPR014027" + /db_xref="InterPro:IPR014028" + /db_xref="InterPro:IPR016040" + /db_xref="InterPro:IPR017476" + /db_xref="UniProtKB/TrEMBL:Q4K386" + /translation="MKIAVAGTGYVGLSIAILLAQHHQVVAVDIIPEKVELINKKKSP + IQDDYIEKYLAEKELNLVATLNAEEAYENADFIVIAAPTNYDPKKNFFDTSSVEAVIE + AVMKYNPDAIIIIKSTVPVGYTKSVRRKFLTDNIMFSPEFLRESKALYDNLYPSRIII + GTDKDDKDLVKSAEIFVKMLQEGAVKENIETLYMDFTEAEAVKLFANTYLALRVSYFN + ELDTYSEMKGLDTQAIIDGVCLDPRIGSHYNNPSFGYGGYCLPKDTKQLLANYSDVPQ + EMITAIVQSNRTRKDYIADRILDLAGSYVGNDFYKPDKEKEIVVGIYRLTMKSNSDNF + RQSSIQGIMKRLKAKGVTIIIYEPTLESGTTFYGSQVVNDFEIFKKSSQVIVANRFDE + TLEDVRGKVYTRDIFKRD" + misc_feature 13530..14063 + /gene="ugd" + /locus_tag="SPC01_0015" + /note="HMMPfam hit to PF03721, UDP-glucose/GDP-mannose + dehydrogenase, score 9.3e-50" + misc_feature 13530..14042 + /gene="ugd" + /locus_tag="SPC01_0015" + /note="HMMPfam hit to PF01210, NAD-dependent + glycerol-3-phosphate deh, score 0.00016" + misc_feature 13530..13946 + /gene="ugd" + /locus_tag="SPC01_0015" + /note="HMMPfam hit to PF00056, lactate/malate + dehydrogenase, NAD bind, score 0.0013" + misc_feature 13530..13610 + /gene="ugd" + /locus_tag="SPC01_0015" + /note="Signal peptide predicted for SPC0017 by SignalP 2.0 + HMM (Signal peptide probability 0.752) with cleavage site + 
probability 0.397 between residues 27 and 28" + misc_feature 14115..14396 + /gene="ugd" + /locus_tag="SPC01_0015" + /note="HMMPfam hit to PF00984, UDP-glucose/GDP-mannose + dehydrogenase, score 1.3e-36" + misc_feature 14490..14741 + /gene="ugd" + /locus_tag="SPC01_0015" + /note="HMMPfam hit to PF03720, UDP-glucose/GDP-mannose + dehydrogenase, score 9e-05" + gene complement(order(15448..15825,15829..16032,16086..16754)) + /gene="tnp" + /locus_tag="SPC01_0016" + /pseudo + CDS complement(join(15448..15825,15829..16032,16086..16754)) + /gene="tnp" + /locus_tag="SPC01_0016" + /note="member of homology group 13" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1167 transposase" + /db_xref="PSEUDO:CAI32709.1" + misc_feature complement(join(15952..16032,16086..16298)) + /gene="tnp" + /locus_tag="SPC01_0016" + /note="HMMPfam hit to PF01610, Transposase, score 7.2e-43" + /pseudo + gene 16968..17825 + /gene="rmlA" + /locus_tag="SPC01_0017" + CDS 16968..17825 + /gene="rmlA" + /locus_tag="SPC01_0017" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI32710.1" + /db_xref="GOA:O08434" + /db_xref="HSSP:1FXO" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:O08434" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLHRFQELLQDGSEFGIKLSYAEQPSTDGLAIGEEFISDDSVALIL + GDNIYHGPGLSTMLQKAAKKEKGATVFGYQVKDPERFGVVEFDTDMNAISIEEKPEYP + RSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVELMGRGFAWL + NTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLALAQPLKKNEYGQ + YLLRLIGEA" + misc_feature 16971..17675 + /gene="rmlA" + /locus_tag="SPC01_0017" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 6.2e-111" + gene 17826..18422 + /gene="rmlC" + /locus_tag="SPC01_0018" + CDS 17826..18422 + /gene="rmlC" + /locus_tag="SPC01_0018" + /EC_number="5.1.3.13" + /note="member of homology group 
11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI32711.1" + /db_xref="GOA:O08435" + /db_xref="HSSP:1NZC" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:O08435" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + VLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENLEEADVSEADKHHPLLKDVKPLKKEDLE" + misc_feature 17862..18392 + /gene="rmlC" + /locus_tag="SPC01_0018" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 1.7e-15" + gene 18432..19481 + /gene="rmlB" + /locus_tag="SPC01_0019" + CDS 18432..19481 + /gene="rmlB" + /locus_tag="SPC01_0019" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI32712.1" + /db_xref="GOA:O08436" + /db_xref="HSSP:1KEP" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:O08436" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPDVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLVAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGIYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQATD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 18447..19403 + /gene="rmlB" + /locus_tag="SPC01_0019" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 8.7e-05" + misc_feature 18450..19190 + /gene="rmlB" + /locus_tag="SPC01_0019" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 7.5e-76" + misc_feature 18453..19265 + /gene="rmlB" + /locus_tag="SPC01_0019" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/iso, score 5.1e-05" + 
gene 19547..20398 + /gene="rmlD" + /locus_tag="SPC01_0020" + /pseudo + CDS 19547..20398 + /gene="rmlD" + /locus_tag="SPC01_0020" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /pseudo + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + misc_feature 19547..20392 + /gene="rmlD" + /locus_tag="SPC01_0020" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 1.2e-142" + /pseudo + misc_feature 19550..20188 + /gene="rmlD" + /locus_tag="SPC01_0020" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 6e-05" + /pseudo + misc_feature 19550..20176 + /gene="rmlD" + /locus_tag="SPC01_0020" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 1.4e-16" + /pseudo + misc_feature 19553..20278 + /gene="rmlD" + /locus_tag="SPC01_0020" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 6.3e-08" + /pseudo + gene order(20522..21427,21438..21624) + /gene="tnp" + /locus_tag="SPC01_0021" + /pseudo + CDS join(20522..21427,21438..21479,21517..21624) + /gene="tnp" + /locus_tag="SPC01_0021" + /note="member of homology group 12" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1670 transposase" + misc_feature 20522..20923 + /gene="tnp" + /locus_tag="SPC01_0021" + /note="HMMPfam hit to PF03050, Transposase IS66 family, + score 0.0093" + /pseudo + gene 21826..>22182 + /gene="aliA" + /locus_tag="SPC01_0022" + CDS 21826..>22182 + /gene="aliA" + /locus_tag="SPC01_0022" + /codon_start=1 + /transl_table=11 + /protein_id="CAI32715.1" + /db_xref="GOA:Q4K378" + /db_xref="InterPro:IPR000914" + /db_xref="UniProtKB/TrEMBL:Q4K378" + /translation="MKSSKLLALAGVTLLAATTLAAWSGSGSSTKGEKTFSYIYETDP + DNLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKDA + KWYTSEGEEYAAVKAQD" + misc_feature 21826..21897 + /gene="aliA" + /locus_tag="SPC01_0022" + /note="Signal peptide predicted for SPC0028 by SignalP 2.0 + HMM (Signal peptide probability 1.000) 
with cleavage site + probability 0.207 between residues 24 and 25" + misc_feature 22069..22137 + /gene="aliA" + /locus_tag="SPC01_0022" + /note="PS01040 Bacterial extracellular solute-binding + proteins, family 5 signature." +ORIGIN + 1 cgaccgtcgc ttcctagttg tggctaactt gtccaatgaa gagcaagact tgacagtaga + 61 aggaaaagtc aaatctgtct tgattgaaaa caccctagct caagaagtct ttgaaaaaca + 121 aatcttagtt ccatgggatg ctttctgtgt ggaattacta taaatatttt ttgcagaaaa + 181 atttaaaatt gaaatcatat aaaaacaagg gaggactgta taaaagcaga aatcctttgt + 241 tttttataac caaggtttat aaactttcat tctcgaaatt caattaactt tacaaattcc + 301 cactattaag gagaaagaag atgaacataa agaagcgtgt ccttagtgca ggcctgactt + 361 ttgcatctgt tttgctttta gctgcttgcg gccaatcagg ttcagataca aaaacttact + 421 catcaacctt tagtggaaat ccaactacat ttaactatct attagactat tacactgata + 481 atatagtcaa ttgaaacaag aacaagacaa aagagcctca taaaaggtat tgcaacttgg + 541 taataccttt ttgaggtgct ttttgatatg agcccatgtt ttctcaatag gattgtactc + 601 aggtgagtag ggaggaagag gtaaaagctt aggctctttg tcaactgtag tgggttgaag + 661 tcagctaagc tcgagaaagg acaaatttcg tcctttcttt tttgatgttc agagcgatga + 721 aaatccgttt tttgaagttt tcaaagtttc gaaaaccaaa ggcattgcgc ttgataagtt + 781 tgatgagatt attggtcgct tccagtttgg cgttagaata gtgtagttga agggcgttga + 841 caatcttttc tttatctttg aggaaggttt taaagacagt ctgaaaaata ggatgaacct + 901 gcttaagatt gtcctcaata agtccgaaaa atttctctgg ttccttattc tggaaatgaa + 961 aaagcaagag ctgatagagt tgatagtggt gtttcaagtc ttccgaataa ctcaaaagct + 1021 tgtttaaaat ctctttattg gttcaatgca tacgaaaagt aggacgataa aaatgtttat + 1081 cactcagttt acgactatcc tgttgaatga gtttccagta gcgcttgata gccttgtatt + 1141 catgggattt tcgatgaaac tgatttatga tttgaacacg cacacgactc atagcacggc + 1201 taagatgttg tacaatgtga aagcgatcca acacgatttt agcattcggg agtgaaacag + 1261 tctgggagac tgtttcagcc tgagcctaga aatttgaaag cgaaactgtt tagccaagtc + 1321 atagtaaggg ctaaacatat ccatagtaat gattttgacg cgacatcgga caactctatc + 1381 gtagcgaaga aagtgatttc gaatgatagc ttgtgttcta ccctcaagaa cagtgatgat + 1441 attgagattg ttaaaatctt 
gcgcaatgaa gctcatcttt ccctttgtaa aagcatactc + 1501 atcccaagac ataatctcag gaagacaaga aaaatcatgt ttaaagtgaa aatcattgag + 1561 cttacgaata acagttgaag ttgagatgga aagctgatgg gcaatatcag tcatagaaat + 1621 cttttcaatt aacttttgag caatcttttg gttgatgata cgagggattt ggtgattctt + 1681 cttgacgata gaagtttcag cgaccatcat ttttgaacag tgatagcact tgaatcgacg + 1741 ctttctaagg agaattctag taggcatacc agtcgtttca agataaggga tcttagacgg + 1801 tttttgaaag tcatatttct tcattagact tccacaatca gggcaagatg gagcctcata + 1861 atccagctta gcgataattt ctttgtgggt atccatattg atgatatcta gaatcttgat + 1921 gtttgggtct ttgatatcga gtagttttgt gataaaatgt aattgtccca tatgaatctt + 1981 tctaatgagt tgtttggtcg cttttcatta taggtcatat gggacttttt ttctacaata + 2041 aaataggctc cataatatct ataagggatt tacccactac aaatattata gagccaaagt + 2101 ttatacccaa actcctcgca taaaagttct aacttaccca ttctatggaa tcttgcatta + 2161 tccataataa taaccgatgg tgtggttaat gttggtaaga gaaacttctg aaaccaagct + 2221 tcaaaaaagt cgctcgtcat cgtctcttcg taagtcattg gagcgattaa ctcaccattc + 2281 atttgttaga cctgcaacca aagaaattct ctgatatctt cttccagata ctttgcctct + 2341 tcttaactga ccttttaatg agcgaccata ttctcgataa aaataagtat cgaatcctgt + 2401 ttcgtcaatc taaacaggtg ctaggtgctt taaactatta aaattcttaa gaaataaggc + 2461 tactttttct gggtcttgtt catagtaggt gtggttcttt tttcgagtgt agcccatagc + 2521 tttgagcgca tagtggatgg tagttggatg acagccaaag tcagaagcta tttcagtcaa + 2581 ataagcgtct ggattgtcag taagatagtt tttaagtcta tctctatcaa cttttcttgg + 2641 ttttgttcct tttacttggt ggtttagctc tcctgttttc tcttttagct ttaaccagcc + 2701 ataaatggta ttacgtgaga tttggaaaac gtgtgatgct tctgttatac tacctgttcg + 2761 ctcacaataa gagagaactt ttttacgaaa atctattgaa tatgccataa gaagattata + 2821 ccacattgtg tactatatta tattgaaact agaatagtac acatctgatt ctaaaacatt + 2881 gttagaaatc gatttgactg tcctgattga tttgtcctat tcttatttca ttttactata + 2941 tttttggttc gcgggaagtc tactaagata cttaaagatg cagatagtga aaataaaggt + 3001 gtagacatta ccgtaaaaaa gtgatataat tgtatgatgt tcaaggtata ggtgttaatc + 3061 atgagtagac gttttaaaaa atcacgttca cagaaagtga 
agcgaagtgt taatatcgtt + 3121 ttgctgacta tttatttatt gttaatttgt tttttattgt tcttaatctt taagtacaat + 3181 atccttgctt ttagatatct taacctagtg gtaactgcgt tagtcctact agttgccttg + 3241 gtagggctac tcttgattat ctataaaaaa gctgaaaagt ttactatttt tctgttgctg + 3301 ttctctatcc ttgtcagctc agtgtcgctc tttgcagtac agcagtttgt tggactgacc + 3361 aatcgtttaa atgcgacttc taattactca gaatattcaa tcagtgtcgc tgttttagca + 3421 gatagtaaga tcgaaaatgt tacgcaactg acgagtgtga cagcaccgac tgggactgat + 3481 aatgaaaata ttcaaaaact actagctgat atcaagtcaa gtcagaatac cgatttgacg + 3541 gtcaaccaga gttcgtctta cttggcagct tacaagagtt tgattgcagg ggagactaag + 3601 gccattgtcc taaatagtgt ctttgaaaat atcatcgagt cagagtatcc agactacgca + 3661 tcgaagataa aaaagattta taccaaggga ttcactaaaa aagtagaggc tcctaagacg + 3721 tctaagaatc agtctttcaa tatctatgtt agtggaattg acacctatgg tcctattagt + 3781 tcggtgtcgc gatcagatgt caatatccta atgactgtca atcgagatac caagaaaatc + 3841 ctcttgacca caacgccacg tgatgcctat gtaccaatcg cagatagtgg aaataatcaa + 3901 aaagataaat taacccatgc gggcatttat ggagttgatt cgtccattca caccttagaa + 3961 aatctctatg gagtggatat caattactat gtgcgattga acttcacttc tttcttgaaa + 4021 atgattgact tattgggagg ggtagatgtt cataatgatc aagagttttc agctctacat + 4081 gggaagttcc atttcccagt agggaatgtc catctagact ctgagcaagc tttaggtttt + 4141 gtacgtgaac gctactcact aaccgatgga gaccgtgacc gtggtcgcaa ccaacaaaag + 4201 gtcattgtag caattattca gaagttaact tctacagagg ttttgaaaaa ctatagtagt + 4261 attcttcaag gattgcagga ttctcttcaa acaaatatac cgattgagac tatgatagat + 4321 ttagtgaata ctcagttgga aagtggaggg aattataaag taaattctca agatttaaaa + 4381 gggacaggtc ggatggatct tccttcttat gcaatgccag acagtaacct ctatgtgatg + 4441 gaaatagatg atagtagttt aactgtagtt aaagcagcta tacaggatgt gatggagggt + 4501 agataaaatg atagacatcc attcgcacat cgtctttgat gtagatgatg gtcccaagtc + 4561 aagagaggaa agcaaggctc tcttggcaga atcctacagg cagggggtga gaaccattgt + 4621 ctctacctct caccgtcgca agggcatgtt tgaaactccg gaagagaaga tagcagaaaa + 4681 ctttcttcag gttcgggaaa ttgcaaaaga agtagcagat gatttagtca ttgcttatgg + 4741 
cgcagagata tactatactc tggatgctct agaaaagcta gaaaaaaaag aaattcctac + 4801 ccttaatgat agtcgttatg ccttgattga gtttagcatg catacttcct atcgtcagat + 4861 tcatacggga ttgagcaata ttttgatgtt gggaatcacg ccagtaattg ctcatattga + 4921 acgttatgat gctttagaga ataacgaaaa acgtgttcgt gaactgattg atatggggtg + 4981 ctatactcag ataaatagtt atcatgtttc aaaacctaag ttctttggtg aaaaatataa + 5041 attcatgaaa aagagagctc ggtatttttt ggaacgtgat ttagttcatg tagttgcaag + 5101 tgacatgcac aatttagaca gtagacctcc atatatgcaa caggcatatg atatcattgc + 5161 taagaaatat ggagcgaaaa aagcgaaaga actttttgta gataatccca gaaaaattat + 5221 aatggatcaa ttaatttagg agaaaatatg aaggaacaaa acactttgga aatcgatgta + 5281 ttgcaactat tcagagcttt atggaaaaga aagttggtca ttttattagt ggcaattata + 5341 acttcttcag ttgcttttgc ctacagtact tttgttatca aacctgagtt tactagtacg + 5401 actcggattt atgtagttaa ccgtaatcag ggagagaagc ctggtttaac caatcaagac + 5461 ttgcaggcag gagcatactt ggttaaagac tatcgtgaaa ttgtcctatc gcaggatgtt + 5521 ttggaggaag ttatttctga tttgaaacta gatttggtgc caaaaggttt ggctaataaa + 5581 attaaagtaa cagtaccagt tgatacccgt attgtctctg tttcagttag tgatcgagtt + 5641 cctgaagagg caagccgtat cgctaactct ttaagagaag tagctgctca aaaaattatc + 5701 agtattactc gtgtttctga tgtgacaaca ctggaggagg caagaccggc gatatcaccg + 5761 tcttcgccaa atattaaacg caatacacta attggttttt tggcaggggt gattggaact + 5821 agtgttatag ttcttcttct tgaacttttg gacactcgtg tgaaacgtcc ggaagatatc + 5881 gaaaatgcac tgcagatgac acttttggga gttgtaccaa acttgggtaa gttgaaatag + 5941 gagagagaga tgccgacatt agaaatagca caaaaaaaac tggagttcat taagaaggca + 6001 gaagaatatt acaatacctt gtgtacaaat atacagttga gcggagataa actaaaagta + 6061 atttccgtta cttctgttaa tccgggggaa ggaaaaacaa ctacttccgt aaatatagca + 6121 atgtcatttg cgcgtgcagg ctataaaact cttttgttcg atggcgatat tcgaaattca + 6181 gttatgtcag gattttttaa atctcgtgaa aaaattacag ggctaacaga atttttatct + 6241 gggacagctg atttatctca cggtttatgt gatacaaata ttgaaaattt atttgtagtt + 6301 caatcgggat ctgtatcacc aaaccctaca gccttgttac aaagtaaaaa ttttaatgat + 6361 atgattgaaa cattgcgtaa 
atattttgat tatatcattg ttgatacacc acctattgga + 6421 attgttattg atgcggcaat tatcactcaa aagtgtgatg cgtccatctt gataacagca + 6481 acaggtgagg cgaataaacg tgatgtccaa aaagcgaaac aacaattaga acaaacaggg + 6541 gaactgttcc tgggagttgt tttaaataaa ttggatatct cggttgataa gtatggagtt + 6601 tacggtcgta aatagtttgt aagttctata tgtgtataga attttaaagt gtcacaattt + 6661 ggaaacaatt acttatagaa aattactatt tttaaaatga tagttgtaaa ggataatgga + 6721 gtagcggtta attatatttt aggaagatta ttttgatgaa tttacaaaag aaaaaaatta + 6781 tgttaataac taatcatgac gatgatatct attgttttcg aaaagaagtt atagagtcac + 6841 tagttgagta tgggtatgaa gtgctagtgt catgtcctta tggagataag atagagttga + 6901 tgaagtctat tcaatttgag tatgaagata ttactattga tagaagagga ataaaccctt + 6961 taaaagatat tcgtctattt cttagttata taagattatt gagaaaatat agaccggatg + 7021 tagtcttgac atataccgtg aaaccaaatg tatatgctag cctagctgca acaattttag + 7081 gaataaaata tataaataac gtaacaggtt taggtagtgt cttaacaatg ggttcttgtg + 7141 taagaagcct ggtgttatta ctgtttagaa tttcttttag gaaatcaaat tgtgtttttt + 7201 ttcaaaatga atataatatg aaaatgttaa aaactcttgg cttgattttg ggtgactcta + 7261 agctgatacc tgggtcagga gtgaacattg aaaagtatcc tgtgcaacag tatccaaatg + 7321 gtggaaatgg aattcaagga gaaacaatcg tttttaattt tattggtagg atattaaaag + 7381 aaaaaggtat agatacttat ctggctgctg cccaaattat taagagtcga tatcccaaaa + 7441 cagagtttaa tattattggc tttatagaac cgacagagag taattatgaa cttaaaattt + 7501 gtgacttaga aaaaaaagga atcgtttatt atttgggaca acaaaaagat gtgatacctc + 7561 atattacccg ttcccatgca attatccatc ccagtgtgta tggtgaagga atgagcaatg + 7621 tattactaga aaacgctagt tcaggacgtg ttttaattac gacagataat ccaggttgca + 7681 aagaaattgt taaagataga gagacaggct atatatttca agggggaaat gttgaggaac + 7741 tagtctctat attggaagtt tttttaggtc tagaaaatga aaaacgaaaa gagatgggac + 7801 ttcaagggag aatgtatata gagcaatatt tttctcgtca aattattata gatgcttatt + 7861 tagataaaat aaaaggagct ttagatgaat aggattataa aaaatattgt tggtttactt + 7921 cgtgcaaata tttgcttgat attattaaaa gtgtgtcgaa acaaggatct tacttttcat + 7981 tattttttaa aatttggaaa gaatgtaact gtcgaacagg 
aatctaatgc taaattaatc + 8041 ttaggaaaaa agattagagt aaacgccggg ggagtattga aagttagaaa aggagcaaaa + 8101 ctcaagattt ctgatgatgt atttttgagt aataattgta tgatagcttg tcgtaaatac + 8161 atagatatta aatctggagt aaaatgtggt cctggagtac ttatatatga tcatgactat + 8221 gatgttagtg ttccaggtgg attgaaagca aaaaaattta agacggcccc agttatgatt + 8281 ggagaaaatg tttggattgg agctaacagc attgtcttga agggagtgag tattggtgag + 8341 aatagtgtgg ttgcagcagg aagtgttgta acaaaggata ttccagctga tactatattt + 8401 attcagaaac gtttatcaag ggagatgaaa ttatgaaagt atttatagcg actgaattta + 8461 gatgtacaat ctataaaaat gaaatatatt taaaaccgaa agcttatttt atttatgagc + 8521 gctatgctaa agcatttgga gagattgtac tatgtagtcg ttatgagaag gtggaatcat + 8581 accctgaagg atatcataaa gcgaacttta ttaataaatt tatccctata gaaggtctac + 8641 atcaggttct atttggtcaa aataaaaata agattattga aggaatgatt gatagcgact + 8701 taatagttgt tcgtattccg tctataattg gatcaaaaac tgcagactac gcattgaaga + 8761 taggtaagcc gtatctgaca gaaataatgg gggatgcttg ggattcttac tggtatcata + 8821 gtttaaaggg aaaattatta gctccatata tatacgccaa aactaaatca attgtaaaaa + 8881 acgctaatta ttgcatatac gtgacagaaa aatatttaca agatagatat cctaatatta + 8941 aatctaatat cgttgcttca aatgttaata ttacctctgt agagaataga tctttgaaga + 9001 gccgtcttta taagttgaaa aaatttaatc ctcaaaaaat ttcaataatg acaacagcat + 9061 ctgtgaatgt acgagccaag ggccatagat ttgtattgga agcaatgaag agattagaaa + 9121 tacaaggtat tttgttggat tattatttag caggtgatgg tgatcaaagt ttcttaaaaa + 9181 agaaagcaga ggaattggga gtagcgaata gaatccattt tttaggggaa ttgactacat + 9241 cacaaattta tgagtatttg gataaagttg atttatatat acaaccaagt ttacaagaag + 9301 ggttacctcg tgcggtaatt gaagctatga gccgtgcttg cccttgtata gggtctaata + 9361 aagcaggaat tccagagttg ctggggccac attgtctatt tactccatcc tcttcacaag + 9421 cgattgcggg atctattata gattttatta gtatggataa ggaaaagatg gtgataaaac + 9481 agtttgaatt ctcaaaaaaa tttctttcga gtgtattaaa taaacgcaga agtgactatt + 9541 ttgctcaaat tagaagagaa ttaaataatt ctgatggttt agattaaaat gcgatggaaa + 9601 atccgtttcg atatattaaa tatgctataa aaactgacta catagccaat caaatttttg + 9661 
aatacgcatt acgtttaaat tattagttaa aggaaaaaag taaatgaagt ttagtctaca + 9721 atcaaatgat ataaaaaata aaataatact tctagtaggt gtagtttttt cagggacttt + 9781 aattttatgc agtgaaaata atgatgttac aattccatta ttttcaatga tttttttaag + 9841 ttttatggca atgataattg tgaaatttaa tatttttcat ccctatgtgt ggtatagtag + 9901 cttctttact atttattcta tttcttaccc gctactctat agaatggagt atataaacta + 9961 tggttataca aaagatttga ttttcatgca atggctggct ttggcaactt tgttgttaac + 10021 tctaccttct aaagccattg tgttaagcga aaggaaaata aacctaaata acaataacta + 10081 tttattattt ctcaataata tgaatacgtt tatcacaaca gtagcaatta tatatctatt + 10141 aggaagtggt tttagaaata aaggggaaat atattcaggt gccaatattg tgataatgtt + 10201 agtattttct ttggtttatt ttatgattct cattcataca tatcagctat ttatacagtt + 10261 gagtactaaa aaatggagac tactaaattg taatactaac acagcgatag ttatctgtct + 10321 cttctctatc gttacagggg aaagagatta tatgtttact ttattcatcc ttgatgtgat + 10381 tatattattt tactttcaca aaataaaacg tttttatctt gtaatgttag ttccgcttgc + 10441 ggcactactg attccgttat ctgcagtttt taaatatact ttattaagtg ggcaagtttc + 10501 atctataaat acaaataata tttggtttga tttgctagat ggtgagtttg tatcagctag + 10561 tcgtaattta cagattctga tattacataa tatgggcaat tatttcgaag gtcgttcttt + 10621 ttttaatgac atagtaagaa ttttttataa tacggggtat tctaatcaaa cttggtttat + 10681 ggacaccttt tttccaaacg tacattcaac caaatatggt tttactcttg tgggagaggg + 10741 atatgtgaat ggaggatact ttggaattgt aatgattttt atgctaacag gctttttgat + 10801 gagatttctt tatataaacg ctcaaagaaa tatatacggg atgctgatat atctgtatat + 10861 gatacctatt tttatttatt ctactcgtgc tgattttgct aacatattat ctccattact + 10921 taaatatgct atattgggaa cattggttat tgtttttatc aatagaatgg tgttgatatc + 10981 accattggat gaaatgggtg gtgagtagtt tatttaaaaa ggtggggtat actttttgat + 11041 actatagtgg tttgaagttg gagtagtaca atgcagcttc taaagaattt ttataaatta + 11101 ctttaaattc cctaatcgtt ttgttcatat tctatttcaa tatactataa ttttaaattt + 11161 actgttataa aatttaacat acggagaaaa taagtgagac tatctaagaa atattggttt + 11221 gctttaacga gtaaattttt gttaatctta ttaacacttt tatcctcaat tataattaat + 11281 
aggggattag gtgttgaaaa aaaaggagat tatgcctatg taatgaactt agtagaaatt + 11341 ttttatattt taggtggagt tggtttaggt caggcttact cgacctttaa aaggaatcat + 11401 tctaatgagt atcagaataa atttgttttt ttaactttta ttcaaggatt attgtttgga + 11461 ataataggtt taataatagt tttagctgat gttccgatag attatggtgg ggtaataata + 11521 gttttgtcca gtctatctat tatgagaaca aatcttacta tgattgcagt aatagaaaat + 11581 agtataaaga ggaataagat tgtattagga gtaagcgtag tatattccgt tatgctagta + 11641 ttgttgttac tatttcattt agtttctata gagatggtat ttttggtata tgctattaat + 11701 gaatttttac gtatcatttt atttttatac tattacaata tgttcccagt ttttgaacat + 11761 attagtatta aagaattttt cactatatat aagtttggat ttctttctat gattcttact + 11821 ctattaatta catttaatta tagtattgat atcataatgt tgaagcaaat gtctagtagt + 11881 tataatgtag gtatatacag tgtcgcagtt acgttttcta atatgttttt gatggttcca + 11941 gactcattta aagagatttt atttggtgat tcggctaaaa gaacttttga gaaaaataaa + 12001 gcaataaatg caataaaagt atcatttcta tttatgattt tattaattat tggatttctt + 12061 tcttttggag aatttgcgat tacgctcctt tatggttcca gttatataaa ggcatttcct + 12121 ataacattag tcattttttt aggaagctta tcgatgattt tctttaaaat tttacaacca + 12181 atttatatat ctcagggtaa acagagtgta gctataaaaa ttttatctgt gtcggctttg + 12241 ataaatataa gtttaaactg gtacttaatt cctaactacc aaattacagg agctgcgata + 12301 gcatcagcaa tctcttatac tgtatgtggt ttgtttttta ttatagatta tcttagaaat + 12361 tgattataat agttgttaaa gaatgtgtat tagtggatga aaatataaaa ataacaagag + 12421 gtattatgat atgagaggaa aaacaattct aattacagga gtagctggtt ttattggatc + 12481 aaatctggtt aggaaattat tggaattaga aggaacgatg acaatcattg gtttggacaa + 12541 tttgaatgat tactatgata ttgcacttaa agattatcga ttgcttcaac ttaataagct + 12601 aattcaggat tatccagaaa aaaactggat atttatcaag ggtgatattg cagataaaat + 12661 gcttattaat aagattttta agagttatca tcctcagatt gttgttaatc tagctgccca + 12721 ggcaggagta cgctactcca ttacaaatcc agatgtatat atagaaagta atatcgttgg + 12781 ctttcataat gtgttggaag cttgtcgtca ttcgtatgag atatatgatg gtggtgtgga + 12841 acacttagtt tatgcatcgt cctcatcggt atatggtgga aataaaaaaa tcccgtttgc + 12901 
aacagaagat aaggtagaca atcctatttc actatatgct gcgactaaaa aaacaaatga + 12961 acttcaagcg tatgcttatt caaagattta caatattcct tcgacaggct tacgcttttt + 13021 tacagtttat ggtcctgctg ggcgcccaga tatggcctat tttggattta cagataaatt + 13081 gcgaagtggt tccgatattg agatttataa tcatggtaat tgtaaacgag attttactta + 13141 tatagatgat atcgttgagg ggatagtaag ggtcatgcaa tcagctccga agaaactagt + 13201 gggatctgat aatttaccgt tagccccata taaagtgtac aatattggga atagtaaacc + 13261 cgaaaatttg ttagattttg tggatgttct tcaacaggag ctaatcaagg caggagtttt + 13321 gccggaaaat tatgattttg atagtcataa aaaattagtt cctatgcaac caggcgatgt + 13381 tcctgttact tatgcagata caagtgattt agagagagat tttggtttta aaccaaaaac + 13441 ttctttacga gaaggtttga gaaagtttgc agagtggtat aaagactact ataatgtata + 13501 acgagagtgt tttgagaaag gaaaaaatta tgaaaatagc agtagcaggt acaggatatg + 13561 ttggattatc tattgcaatc ttactggctc aacatcatca agttgttgcc gtagatatca + 13621 ttcctgagaa agttgagtta atcaataaaa agaagtcccc tatccaagac gattatatag + 13681 aaaaatatct cgcggaaaaa gaattgaatc tcgtagctac attgaatgca gaggaagcat + 13741 atgagaatgc ggattttata gttattgcgg ctccaactaa ttatgatccg aaaaaaaatt + 13801 ttttcgatac atcttcagtc gaggctgtca ttgaagcagt tatgaaatat aatcctgatg + 13861 caattataat aattaaaagt actgttcctg ttggatatac aaagtcagta cggaggaaat + 13921 ttcttacaga caatattatg tttagtcctg agtttttacg ggagtcaaaa gcgttatatg + 13981 ataacctata tccgagtcga attattatag gtacagataa agatgataaa gatttggtaa + 14041 agtctgctga aatttttgta aaaatgcttc aggaaggtgc agtgaaagaa aatattgaaa + 14101 cattgtatat ggattttaca gaagctgaag cagtaaaact ttttgctaat acctatcttg + 14161 ccctccgggt ttcctatttt aacgagttag atacttattc tgagatgaaa ggactagata + 14221 ctcaagcgat tattgatgga gtttgtttag atccgagaat aggttctcac tacaataatc + 14281 cttcttttgg ttatgggggt tactgtcttc ctaaagatac caagcaactt cttgcaaatt + 14341 attctgacgt tccacaagaa atgataacag ctatagtaca aagtaatcgg acaagaaaag + 14401 attatattgc agatcgtatt ttagatcttg ctggatctta tgtaggcaat gatttctata + 14461 aaccagataa agaaaaagag attgttgtag gaatttatcg tttaacaatg aaaagtaatt + 14521 
cagataattt tagacaatct tctattcaag gtattatgaa gcgtttgaaa gcaaaaggtg + 14581 ttactattat tatttacgaa ccaactcttg aaagtggtac tactttctat ggtagtcaag + 14641 tagttaatga ttttgaaata tttaagaaat ctagtcaagt gattgttgca aatcgttttg + 14701 atgagacttt agaagatgtg aggggtaaag tttatactag ggatattttt aagagagatt + 14761 aaatcaattt gtatatttct agtccctaat aatctatatc atttgaatga tagaatagtt + 14821 aaaaactagc tggaggatag cgacaactca tctaaaacaa taaagatatt tctatattct + 14881 cgctcgcact tagtgaagta aatatacttc ttttgtcagt agagattgac ttaataggat + 14941 atagttgcat atattccttc gaagtgaggt gctgataatg gcagtaattt ttaaaaatgt + 15001 gcttattgaa gagaagactg aagaagaaaa acaacatatt ctatctattc taaatggtga + 15061 gtatgactta tctgatgatg taagttgtag attacgacga ctgaatgagg aaagtaaacg + 15121 cttggaagtg tttgttaagg agacgaactc acttgtctag ttcgtattct gttaatgaat + 15181 tgaaatcaat aagtatctca ttgtcatttt ttaactatga ggaagttaga gatttctaat + 15241 agctctccag ttactatgta atttagcatt gaaaaactaa gaaatggtga aattatgcct + 15301 tttacacagt tatttaaaac atccttagga attgattttt aattgtatgc aaacaaagta + 15361 gaattcgctt atttcatttc atgctaaatg taatatgaag taagtgaatt tttaggctct + 15421 ttgtcaactg tagtgggttg aagtcagcta agctcgagaa aggacaaatt tcgtcctttc + 15481 ttttttgatg ttcagagcga tgaaaatccg ttttttgaag ttttcaaagt ttcgaaaacc + 15541 aaaggcattg cgcttgataa gtttgatgag attattggtc gcttccagtt tggcgttaga + 15601 atagtgtagt tgaagggcgt tgacaatctt ttctttatct ttgaggaagg ttttaaagac + 15661 agtctgaaaa ataggatgaa cctgcttaag attgtcctca ataagtccga aaaatttctc + 15721 tggttcctta ttctggaaat gaaaaagcaa gagctgatag agttgatagt ggtgtttcaa + 15781 gtcttccgaa taactcaaaa gcttgtttaa aatctcttta ttggttcaat gcatacgaaa + 15841 agtaggacga taaaaatgtt tatcactcag tttacgacta tcctgttgaa tgagtttcca + 15901 gtagcgcttg atagccttgt attcatggga ttttcgatga aactgattta tgatttgaac + 15961 acgcacacga ctcatagcac ggctaagatg ttgtacaatg tgaaagcgat ccaacacgat + 16021 tttagcattc gggagtgaaa cagtctggga gactgtttca gcctgagcct agaaatttga + 16081 aagcgaagct gtttagccaa gtcatagtaa gggctaaaca tatccatagt aatgattttg + 16141 
acgcgacatc ggacaactct atcgtagcga agaaagtgat ttcgaatgat agcttgtgtt + 16201 ctaccctcaa gaacagtgat gatattgaga ttgttaaaat cttgcgcaat gaagctcatc + 16261 tttccctttg taaaagcata ctcatcccaa gacataatct caggaagaca agaaaaatca + 16321 tgtttaaagt gaaaatcatt gagcttacga atagcagttg aagttgagat ggaaagctgc + 16381 tgggcaatat cagtcataga aatcttttca attaactttt gagcaatctt ttggttgatg + 16441 atacgaggga tttggtgatt cttcttgacg atagaagttt cagcgaccat catttttgaa + 16501 cagtgatagc acttgaatcg acgctttcta aggagaattc tagtaggcat accagtcgtt + 16561 tcaagataag gaattttaga aggtttttga aagtcatatt tcttcaattg acttccgcac + 16621 tcagggcaag atggagcctc ataatccagc ttagcgataa tttctttgtg ggtatccata + 16681 ttgatgatat ctagaatctt gatgtttggg tctttgatat cgagtagttt tgtgataaaa + 16741 tgtaattgtc ccatatgaat ctttctaatg agttgtttgg tcgcttttca ttatagatct + 16801 tatgggactt tttttctaca ataaaatagg ctccataata tctatagtgg atttacccac + 16861 tacaaatatt atagagccat ataaaacatg ggatgattgt tttcttttta gagcagtaca + 16921 caattaatag taattgactc taaaataaca aagaaaggta ccctactatg aaaggtatta + 16981 ttctagcagg tggttcgggg acacgtttat atcctttgac tcgcgctgcg tcaaaacaac + 17041 ttatgccggt ttatgataaa ccgatgattt actacccact ttcaacattg atgttggctg + 17101 ggattaggga tattttgatt atttccactc cacaggattt acatcgattt caagagcttc + 17161 ttcaagacgg atctgagttt gggatcaaac tttcttatgc agagcaacca agtacagatg + 17221 gtttggcaat tggggaagag tttatttctg acgatagcgt tgccttgatt ttaggcgaca + 17281 atatctacca tggtcctggt ctgagcacaa tgcttcaaaa agcagccaag aaagagaaag + 17341 gtgcgactgt ttttggctac caagtgaagg atccagagcg ttttggtgtg gttgagtttg + 17401 atacagacat gaatgctatt tccatagaag aaaaaccgga gtatcctcgc tccaactatg + 17461 cagtgacagg actgtatttc tatgataacg atgttgtcga aattgccaag agtattaaac + 17521 caagccctcg tggtgaactg gaaattacag atgtaaacaa ggcttaccta gatcgtggtg + 17581 atttgtctgt tgagcttatg ggacgtggct ttgcttggct gaatactgga actcatgaaa + 17641 gtttactaga ggcttcacag tacatcgaaa cagtgcaacg gatgcaaaat gttcaggtag + 17701 caaacttaga agaaattgct taccgtatgg gctatatcag tcgagaagat gtattggcct + 17761 
tagcccaacc acttaagaaa aatgaatacg gacagtatct gctccgtttg attggagaag + 17821 catagatgac agataatttt ttcggtaaga cgcttgcggc acgcaaggtt gaagctattc + 17881 caggcatgtt ggagtttgat atccccgttc atggagataa tcgtggctgg tttaaagaaa + 17941 atttccaaaa ggaaaaagtg cttccacttg gatttccaga gtctttcttt gcagaaggaa + 18001 aattgcaaaa caatgtatcc ttctcacgta aaaatgtcct tcgaggcctc cacgcagagc + 18061 cttgggataa gtacatctct gtagcagatg gagggaaagt tctgggttct tgggttgatc + 18121 tacgcgaggg tgaaaccttt gggaatacct atcagacagt aattgatgca agcaagggaa + 18181 tctttgttcc tcgaggcgta gctaatggct tccaagtttt atcagataca gtgtcatata + 18241 gctatctggt caatgattac tgggctcttg aactcaaacc caagtatgcc tttgtgaact + 18301 acgctgatcc aagccttggt attgaatggg aaaatctgga agaagcagac gtatctgaag + 18361 cagacaaaca tcatccccta cttaaggacg tgaagccttt gaaaaaagaa gatttggaat + 18421 aaggaaagaa tatgactgaa tacaaaaata ttatcgtgac aggtggagct ggctttatcg + 18481 gttctaactt tgtccattat gtttacgaga actttccaga tgttcacgtg acagtcctag + 18541 ataagttgac ttatgctgga aaccgcgcga atattgagga aattttaggc aatcgtgttg + 18601 agttagttgt tggtgacatt gctgatgcgg agttggtaga caagttggtt gctcaagcag + 18661 atgctatcgt tcattatgca gcggaaagcc acaatgataa ttcgctcaat gatccatcgc + 18721 catttattca tactaacttc attggaatct atactctttt agaagctgct cgtaagtatg + 18781 atattcgctt ccaccatgta tcgacagatg aagtttatgg ggatctccct ttacgagaag + 18841 atttgccagg tcatggtgaa ggaccaggtg agaaatttac tgctgaaaca aaatacaacc + 18901 caagctctcc gtactcatca accaaggccg catcagactt gattgtcaaa gcctgggtgc + 18961 gttcttttgg agtcaaggca acgatttcca actgttcaaa taactacggt ccttatcaac + 19021 atatcgaaaa attcatccca cgtcagatta ctaacatcct aagtggaatt aagccaaaac + 19081 tttacggtga aggtaagaac gttcgtgact ggattcatac caatgaccat tcttcaggag + 19141 tttggacaat cttgacaaaa gggcaaatcg gtgaaaccta cttgattggg gctgatggtg + 19201 agaagaacaa taaggaagtt ttggaactta tccttaagga aatgggacaa gctacggatg + 19261 cctatgatca tgtgactgac cgtgcaggac atgaccttcg ctatgcgatt gatgccagca + 19321 agctccgtga tgagttgggg tggaaacctg aatttaccaa ctttgaagct gggctcaagg + 19381 
caacaatcaa gtggtataca gataaccaag aatggtggaa agcagaaaaa gaagctgttg + 19441 aagccaatta tgctaagact caggagatta ttacagtata aaaagcagga aatcgctgct + 19501 ttttattgct atattgggaa gagttacata ttagaaaggt ctagagatga ttttaattac + 19561 aggggcaaat ggccaattag gaacggaact tcgctattta ttggatgaac gtaatgaaga + 19621 atacgtggca gtagatgtgg ctgagatgga cattaccaat gaagaaatgg ttgagaaagt + 19681 ttttgaagag gtgaaaccga ctttagtcta ccattgtgca gcctacaccg ctgttgatgc + 19741 agcagaggat gaaggaaaag agttggactt cgccatcaat gtgatgggga caaaaaatgt + 19801 cgcaaaagca tctgaaaagc atggtgcaac tctagtttat atttctacgg actaggtctt + 19861 tgacggtaag aaaccagttg gacaagagtg ggaagttgat gaccgaccag atccacagac + 19921 agaatatgga cgcactaagc gtatggggga agagttagtt gagaagcatg tgtctaattt + 19981 ctatattatc cgtactgcct gggtatttgg aaattatggc aaaaacttcg tttttaccat + 20041 gcaaaatctt gcgaaaactc ataagacttt aacagttgta aatgaccagt acggtcgtcc + 20101 gacttggact cgtaccttgg ctgaattcat gatctaccta gctgaaaatc gtaaggaatt + 20161 tggttattat catttgtcaa atgatgcgac agaagacaca acatggtatg attttgcagt + 20221 tgaaattttg aaagatacag atgtcgaagt caagccagta gattccagtc aatttccagc + 20281 caaagctcaa cgtccgctaa actcaacgat gagcctggcc aaagccaaag ctactggatt + 20341 tgttattcca acttggcaag atgcattgca agaattttac aaacaagaag tgagataagt + 20401 agtagaatga ttttctagtc taataaaaga ggcagataat gaactccaaa ggagcttaag + 20461 atgtacaatt atcttgttgt tggtgctggt ctctttggtg catagctttg gctcagtttc + 20521 tattatcgct cacaccatcc atcagaagtt taatctgaag gtacccaatt atcgccaaga + 20581 agaagattgg gctaggatgg gtttaccaat cacacgtaag gaaatctcta attggcatat + 20641 caaggcaagt caatactatt tagagtccct ttataagctt ttacgagaaa agttgttaga + 20701 acaacctctt cttcatgcgg atgaaacctc ttatcgggtt ctagagagtg atagccatct + 20761 gacctactat tggacttttt tgtctgggaa agctgagaat caagcaatca cgctgtacca + 20821 ccatgatcag cgtcggagtg gtttagtagt acaagaattc ctaggagatt attctggcta + 20881 tgtgcattgt gatatgttgc ggcagtaact taggacttta gtcctctagt tctgcctatg + 20941 cgatagcagt ccaaggttta ggagcaaggc gacgctaagc ttggtaaact gcgaaccgct + 21001 
agaagcttat cgtcaactgg aagaagctga acttgttgga tgttgggcac atgtgagaag + 21061 gaagtttttt gaagcgcccc ccaagcaaac ggataaatca tccttaggag ctaaaggttt + 21121 agcttattgt gatcagttat tttccctgga aagagactgg gaggctttgc cagctgatga + 21181 acgactacag aaacgtcaag aacatctcca gcccctaatg gaagacttct ttgcttggtg + 21241 ccggcgtcag tcagttttag caggttcaaa actaggaagg gcaattgaat acagcctcaa + 21301 gtatgaagaa acctttaaga ctattttgaa agacggacat ctggtccttt ccaataatct + 21361 agctgaatgc gccattaaat cattggttat gggacggagt aaaagagtcc agtggactct + 21421 tttagcctaa gctcagttta aaaaagcgag ggtggttatt ttctcaaagt tttgaaggag + 21481 ctaaagcaag agctattata attaaatagc gagaaatatc tatcctatct tctagaatgt + 21541 cttccaaacg aggaaactct cgtaaacaaa gagattttag aggcctattt accgtggact + 21601 aaagttgtac aagaaaagtg caaataagaa atctccagat taggaactat ccgtgagttc + 21661 tctagtctgg agatttttca atagacttcg ttattgggcg gttacgatat tcatattttt + 21721 tgcaaagatg ttatttgaaa aataattttc aaaaattctg aaaattctgt tgacaacttt + 21781 ctgaaaagag tctataatgg agagaaagtt ttaaaggaga aaaggatgaa aagttcaaaa + 21841 ctacttgccc ttgcgggcgt gacattattg gcggcgacta ctttagctgc atggtctgga + 21901 tcaggttcaa gcactaaagg tgagaagaca ttctcataca tttatgagac agaccctgat + 21961 aacctcaact atttgacaac tgctaaggct gcgacagcaa atattaccag taacgtggtt + 22021 gatggtttgc tagaaaatga tcgctacggg aactttgtgc cgtctatggc tgaggattgg + 22081 tctgtatcca aggatggatt gacttacact tatactatcc gtaaggatgc aaaatggtat + 22141 acttctgaag gtgaagaata cgcggcagtc aaagctcaag ac +// + diff --git a/public/res/serotype_genbank/serotype_10A.gb b/public/res/serotype_genbank/serotype_10A.gb new file mode 100644 index 0000000..c48e687 --- /dev/null +++ b/public/res/serotype_genbank/serotype_10A.gb @@ -0,0 +1,763 @@ +LOCUS CR931649 17290 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 10061/38 (serotype 10a). +ACCESSION CR931649 +VERSION CR931649.1 +KEYWORDS . 
+SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 17290) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 17290) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..17290 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="10061/38" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC10A_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC10A_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI33039.1" + /db_xref="UniProtKB/TrEMBL:Q4JZI8" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVELL" + gene 293..458 + /gene="aliB" + /locus_tag="SPC10A_0002" + /pseudo + CDS 293..458 + /gene="aliB" + /locus_tag="SPC10A_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(order(462..938,940..1266)) + /gene="tnp" + /locus_tag="SPC10A_0003" + /pseudo + CDS complement(join(462..938,940..1266)) + /gene="tnp" + /locus_tag="SPC10A_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(join(876..938,940..1248)) + /gene="tnp" + /locus_tag="SPC10A_0003" + /note="HMMPfam hit to PF01710, Transposase, score 1.3e-22" + /pseudo + gene 1501..2946 + /gene="wzg" + /locus_tag="SPC10A_0004" + CDS 1501..2946 + /gene="wzg" + /locus_tag="SPC10A_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33042.1" + /db_xref="GOA:Q4K2G0" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K2G0" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKSQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGIDVYNDQ + EFTAHTNGKYYPAGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTLT + 
EALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRMDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1501..1617 + /gene="wzg" + /locus_tag="SPC10A_0004" + /note="Signal peptide predicted for SPC0362 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 39 and 40" + misc_feature 1705..2052 + /gene="wzg" + /locus_tag="SPC10A_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 2.3e-64" + misc_feature 2230..2673 + /gene="wzg" + /locus_tag="SPC10A_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 2e-67" + gene 2948..3679 + /gene="wzh" + /locus_tag="SPC10A_0005" + CDS 2948..3679 + /gene="wzh" + /locus_tag="SPC10A_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33043.1" + /db_xref="GOA:Q4K2F9" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K2F9" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKISENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEHDLVHVIASDMHNLDGRPPHMFEAYSIVA + KKYGEEKARELFEENPRQIVMNQLI" + misc_feature 2951..3559 + /gene="wzh" + /locus_tag="SPC10A_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 9.2e-37" + gene 3685..4380 + /gene="wzd" + /locus_tag="SPC10A_0006" + CDS 3685..4380 + /gene="wzd" + /locus_tag="SPC10A_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33044.1" + /db_xref="GOA:Q4K2F8" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K2F8" + /translation="MMKEQNTMEIDVFQLLNTLWKRKLIIALVAIVTGAIAFSYSSFI + IKPEYTSTTRIYVVNRNQGDKSGLTNQDLQAGSYLVKDYREIILSQDVLEKVVTDLQL + 
DMPTKNLASKIQVTVPVDTRIVSISVKDKQPEEASRIANSLRKIAAKKIISVTRVSDV + TTLEEARPATSPSSPNIRRNTLIGFLGGLGVVVMVVLLVELLDVRVKRPEDIEDDMQI + PLLGVIPNLDKLK" + misc_feature 3706..4122 + /gene="wzd" + /locus_tag="SPC10A_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 3.3e-52" + misc_feature 4228..4305 + /gene="wzd" + /locus_tag="SPC10A_0006" + /note="PS00217 Sugar transport proteins signature 2." + gene 4390..5073 + /gene="wze" + /locus_tag="SPC10A_0007" + CDS 4390..5073 + /gene="wze" + /locus_tag="SPC10A_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33045.1" + /db_xref="GOA:Q4K2F7" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K2F7" + /translation="MPTLEITQKKLEIVKKAEEYYNALRTNIQLSGDNLKVISITSVK + PGEGKSTTSTNIAWAFAHAGYKTLLIDADIRNSVMSGVFRSSEKITGLTEFLSGTTDL + SQGLCDTNVENLFVIQAGSISPNPTALLQSENFRTMIDTLRKYFDYIIVDTAPIGIVI + DAVIVTQKCDASVLITAVGEVHRRDVQKAKEHLEQTGKPFLGVVLSKLNTSIEKYSSY + GGYGNYGNK" + gene 5127..5762 + /gene="wcjG" + /locus_tag="SPC10A_0008" + CDS 5127..5762 + /gene="wcjG" + /locus_tag="SPC10A_0008" + /note="member of homology group 50" + /codon_start=1 + /transl_table=11 + /product="putative initial sugar transferase" + /protein_id="CAI33046.1" + /db_xref="GOA:Q4K2E0" + /db_xref="InterPro:IPR003362" + /db_xref="UniProtKB/TrEMBL:Q4K2E0" + /translation="MIQNGIIYIGFKRVMDVFIGLFGTIFIVLPSSLIIYIIYKIKGY + KGSIFFTQYRVGLKGKKFKIIKFRSMVENAEELLTANKALYEKYINNSYKLPPNEDPR + LTNIGDFIRKTSIDEIPQFINLMLGDMSLIGPRPILENELEEYSKEEQQVLLSVRPGI + TGMWQVSGRSEVYYPERCEMELYYPRNQSFLLDVKIFFLTIKKVLSGEGAH" + misc_feature 5160..5759 + /gene="wcjG" + /locus_tag="SPC10A_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 2.9e-56" + gene 5979..6773 + /gene="wciB" + /locus_tag="SPC10A_0009" + CDS 5979..6773 + /gene="wciB" + /locus_tag="SPC10A_0009" + /note="member of homology group 16" + /codon_start=1 + 
/transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33047.1" + /db_xref="GOA:Q4K2D9" + /db_xref="UniProtKB/TrEMBL:Q4K2D9" + /translation="MSKKYKIIVATHKKFQMPEDKDLYIPVQVGSEGKENLGYQRDDQ + GNHISHLNPYYCELTGLYWAWKNLDCDYLGLVHYRRYFTDRNRPYHDKINMNEVILSA + DQVKEFMSEVDVVVPKKRKYYIETLYSHYAHTHNSSHLDVTREIIKEVSPEYLATFDK + VMDCRSGYMFNMFIMSKENVSSYCEWLFPIIDELYRRLDITGYSTFDARLFGRISERL + FNVWLDYQNLRVKEVPFMYMEKVNLFEKGKSFLKAKYFGKKYGQSF" + gene 6777..8027 + /gene="wzy" + /locus_tag="SPC10A_0010" + CDS 6777..8027 + /gene="wzy" + /locus_tag="SPC10A_0010" + /note="member of homology group 67" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33048.1" + /db_xref="UniProtKB/TrEMBL:Q4K2F4" + /translation="MVLLLLTFAFFLVFPVLSISLSVIGLVNDKKRSKIYLLLISFAI + SIVALRYIPHPMDDGAFHFRATTTLIRYDSIFEMFKAFSNGWRVGNYDYGSIPIFTSL + MYLVRNTHHYSLLSFISAFITYFSFGYVVVELFKDLGKVSKLSYATVLIAVLCLNNYR + YTTSGMRFCMAVALMMLLLYLESKKGYTSLKTTIWYLLPVGIHSAVIYFIGLRFLFPL + IKKVTLAKSLFVLLGFPVLFNLVPWLANLIGWTYLQSFIRKIEVYSDNSSYSQFFNTT + LTMRLYVGIVLMVLFVLLYLGIVNSLKTTDDWRFSFVTMTYYVTLLSMGSIPFRNIYD + RNLFLLLPMIVVSTYILFTYRYQLKILTNRNIVYGLTMGILCLSCAVGAFYNNNFPFT + FIDFSKTDLLLKNIFQFFSNLPFT" + misc_feature 6777..6857 + /gene="wzy" + /locus_tag="SPC10A_0010" + /note="Signal peptide predicted for SPC0368 by SignalP 2.0 + HMM (Signal peptide probability 0.900) with cleavage site + probability 0.260 between residues 27 and 28" + gene 8037..8972 + /gene="wcrB" + /locus_tag="SPC10A_0011" + CDS 8037..8972 + /gene="wcrB" + /locus_tag="SPC10A_0011" + /note="member of homology group 87" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="CAI33049.1" + /db_xref="GOA:Q4K2F3" + /db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4K2F3" + /translation="MLLFYFLEDYMGLSTVTLFKNLKFTDSKFIKLEGELLLKYQEYL + LKIMEDIVTVCEEEGLYYSLSGGSALGAYRHKGFIPWDDDMDIFMLGSEREIFFQKFS + QKFSDKYWIHNSQTPNYGMPIGRIRQKGTVLRGREDVGVEECGFFIDIFWLENVPNSK + 
ILRQLHGFLCMAIGLLLSCRNFYKNRQLMLEIMKEHKEIRLVFRIKLILGFLTSFISL + RQFTRLTERIYSLCKNNESRYLSVPSGRKHYFGEMFIREDMQLTRKLNFEGHKWNVPN + NIEHYLTVMYGDYMKIPAVEDRESHIILEISFPSD" + misc_feature 8199..8897 + /gene="wcrB" + /locus_tag="SPC10A_0011" + /note="HMMPfam hit to PF04991, LICD Protein Family, score + 4.8e-25" + gene 9010..10095 + /gene="wcrC" + /locus_tag="SPC10A_0012" + CDS 9010..10095 + /gene="wcrC" + /locus_tag="SPC10A_0012" + /note="member of homology group 24" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33050.1" + /db_xref="GOA:Q4K2F2" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K2F2" + /translation="MKKIALVKWILDDSGGGERVAVSLANELTKKYEVHLIGITTKQS + DLFFGINSQVKYSNFFDHRVRLSKNILKISKMLKKYFLDNEIEVAFGIGIFSNIFLSL + SGIGISTKVVLCDHTNSITANRELSKKVQRYVGTKLADKIITLTQEDRKNYIRKYGIS + ENRIAYIYNWKENRLSNIPYNDESTKIVTVGRFDYQKGYDYLIQVAKKVLAKMPDWTW + EIYGSGKQDEVDKIRDLITENDLQDKLVIKGLEKNQDLIYGDKGIYVMTSRYEGLPLV + LLEAQQYNLPIVSFRCPTGPSEIVEDGVNGYLIDCYDTDKMSEKLLELMKNDDLRQSF + SDHAKDTMDKFDKNKILNQWIELIETI" + misc_feature 9520..10032 + /gene="wcrC" + /locus_tag="SPC10A_0012" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 1.5e-39" + gene 10104..11108 + /gene="wcrD" + /locus_tag="SPC10A_0013" + CDS 10104..11108 + /gene="wcrD" + /locus_tag="SPC10A_0013" + /note="member of homology group 32" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33051.1" + /db_xref="GOA:Q4K2F1" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K2F1" + /translation="MQECLLTIVMPSYNIQDYISRGIESFQQVHPDYKQKFEVLIVND + GSTDDTAKVAEEALRKDSFLNGRIITKENGGHGSTINRGIQEAKGKFFKVIDGDDWVI + PSEFEKFLDTLSVAGVDMVLTDFTEQHVYNNTTVRNDFIEKYEVGEEYSGIPERRIPM + HSVTYRTSILVDNRIRLSEKTFYVDIQYTLFPLEYVHSFGYWNYDVYQYYIGRPEQSM + NIESMKRNVRHHLIVTNSVLGFFSKISGDPVLKKVVADTLGYLISLQIDLSWMVEDSK + TLSEELYRQIEQSSYEYIPTKKFDRLSYLNYKFHYFLDFVFNPVLKKYSKKKEKERGI + " + misc_feature 10122..10649 + /gene="wcrD" + 
/locus_tag="SPC10A_0013" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 4.8e-29" + gene 11110..12063 + /gene="wciF" + /locus_tag="SPC10A_0014" + CDS 11110..12063 + /gene="wciF" + /locus_tag="SPC10A_0014" + /note="member of homology group 25" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33052.1" + /db_xref="GOA:Q4K2F0" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K2F0" + /translation="MLISVVVPVYNVSDYLHFAMDSLIKQTYQNFEVILVNDGSTDNS + PQLCEEYAKQYENVSVFHKENGGLSDARNFGVSKASSDWIFFLDPDDYLEDYTLELIV + KIQQEHQANLISTKVKATSKYNDYNPYQLEKSDYKDLCVFTKEKALELMLDDKIATVS + ACAKLYHKNILEKVPFPVGKIYEDFYVVADHLALADKIVISPLETYNYYRREGSIVRS + TFTEKRYDFFDAVSKNEEVIKKEYTQSLELQQFLQAKKLRGGFVVIGAKADSGLTDFS + KDRNLLKVDFKTMLLNKKISWKLKLKYTIFMLSSKVYLRLR" + misc_feature 11119..11634 + /gene="wciF" + /locus_tag="SPC10A_0014" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 8.2e-44" + gene 12120..13076 + /gene="wcrG" + /locus_tag="SPC10A_0015" + CDS 12120..13076 + /gene="wcrG" + /locus_tag="SPC10A_0015" + /note="member of homology group 102" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33053.1" + /db_xref="GOA:Q4K2E9" + /db_xref="InterPro:IPR003406" + /db_xref="UniProtKB/TrEMBL:Q4K2E9" + /translation="MKRGNMKQAYIIIAHNKFEQLKFLISLLDYKEHDIFIIVGSKVN + VGESTITSLKSSAIHSNVILVDRVPIYWGNYSLSSAEMLGFRYAYNYDNYSMFHLLSG + VDLPLVSADKLFKFFDQNKSNNFLSMVSDEILKSNKVYERVKFRYLFPRFLARNIQNK + YVRKFVAYYRKLEIKIQRLMKIDCFKKYNMRLGYASNWVSINQDLVRIILEEEKNIEK + IFKYSIVNDELFIPTIMYKYNLMESLYSSSPITDAPNDFQGNLRYINWWDGDPHTWTD + SEHDIEQLKRGKALGHKFSRKFDLEKYPNLKEEILIIINRTD" + misc_feature 12141..12734 + /gene="wcrG" + /locus_tag="SPC10A_0015" + /note="HMMPfam hit to PF02485, Core-2/I-Branching enzyme, + score 0.019" + gene 13078..14490 + /gene="wzx" + /locus_tag="SPC10A_0016" + CDS 13078..14490 + /gene="wzx" + /locus_tag="SPC10A_0016" + /note="member of homology group 7" + /codon_start=1 + 
/transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33054.1" + /db_xref="GOA:Q4K2E8" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K2E8" + /translation="MKVLKNYAYNLSYQLLLIILPIITTPYVTRVFSLNDLGTYGYFN + SIVTYFILLATLGVANYGTKVISGHRKEIEKNFWGIYSLQLGATVLSMFLYLVLCLIL + PFMQNPFAYILGLSLVSKGLDISWLFQGLEDFRKITARNIIVKLVGVSSIFLFIKSAS + DLYLYVFLLTIFELLGQLSMWLPAREFIGKPYFDLSYAKQHLKPIVLLFLPQVAISLY + VTLERTMLGALSSTKDVGIYDQALKLVNILLTLVTSLGSVMLPRVANLLATGDYKAVN + KMHEMSFLIYNLVIFPIMAGILIVNDDFVQFFLGQDFQDARYAIAIMIFRMFFIGWTN + IMGIQILIPHNKNKEFMISTTASAIISVGLNMLFLPKLGYIGAAIVSVLTEALVWAIQ + LFYTRRYLKEVPIIVSMTKIVLASVIMYGILLGSKIFIHFSPTINVLAFAVLGGIIYL + FAILSMKVIDVKELKQIIKK" + misc_feature 13084..13878 + /gene="wzx" + /locus_tag="SPC10A_0016" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 3.3e-66" + gene 14490..15602 + /gene="glf" + /locus_tag="SPC10A_0017" + CDS 14490..15602 + /gene="glf" + /locus_tag="SPC10A_0017" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI33055.1" + /db_xref="GOA:Q4K2E7" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR006076" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K2E7" + /translation="MECNMYDYLIVGAGLSGAIFAHEATKRGKKVKVIDKRDHIGGNI + YCENVEGINVHKYGAHIFHTSNKKVWDYVNQFAEFNNYINSPVANYKGSLYNLPFNMN + TFYAMWGTKTPQEVKDKIAEQTADMKDVEPKNLEEQAIKLIGPDIYEKLIKGYTEKQW + GRFATELPPFIIKRLPVRLTFDNNYFNDRYQGIPIGGYNVIIENMLKDVEVELGVDFF + AHREELEASAEKVVFTGMIDQYFDYKHGELEYRSLRFEHETLDEENYQGNAVVNYTEC + EIPYTRIIEHKHFEYGTQDKTVITREYPADWKRGDEPYYPINDEKNNAMFAKYQEEAA + QNDKVIFCGRLADYKYYDMHVVIERALEVVEKELGN" + misc_feature 14937..15539 + /gene="glf" + /locus_tag="SPC10A_0017" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 1.9e-137" + gene complement(15640..16916) + /gene="tnp" + /locus_tag="SPC10A_0018" + /pseudo + CDS complement(join(15640..16404,16404..16916)) + 
/gene="tnp" + /locus_tag="SPC10A_0018" + /note="member of homology group 13" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1167 transposase" + /db_xref="PSEUDO:CAI33056.1" + misc_feature complement(join(16144..16404,16404..16424)) + /gene="tnp" + /locus_tag="SPC10A_0018" + /note="HMMPfam hit to PF01610, Transposase, score 3.3e-37" + /pseudo + gene 17243..>17290 + /gene="aliA" + /locus_tag="SPC10A_0019" + CDS 17243..>17290 + /gene="aliA" + /locus_tag="SPC10A_0019" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33057.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ89" + /translation="MMKSSKLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcgta taaaaacaag + 181 ggaggactgt ataaaaggca gaaatccttt gttttttata accaaggttt ataaaccttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga agacgaacat + 301 aaagaagcgt atccttagtg caggcctgac ttttacatct gctttgcttt tagctgcttg + 361 cgaccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaactat ctattagact attacgctga taatatagtc aattgaaaca agaacaagac + 481 aaaagagccc atgttttctc aataggattg tactcaggtg aatagggagg aagaggtaaa + 541 agtttatgcc caaactcttc acacaagagt tctagcttcc ccattctatg gaatcttgca + 601 ttatccataa taataaccga tggtgtggtt aatgttggta agagaaattt ctgaaaccaa + 661 gcttcaaaaa agtcgctcgt catcgtctct tcgtaagtca ttggaacgat taactcacca + 721 tttgttagac ctgcaaccaa agaaatcctc tgatatcttc ttccagatac tttacctctt + 781 attaactgac cttttaatga gcgaccatat tctcgataaa aataagtatc gaatcctgtt + 841 tcatcaatct aaacaggtgc taggtgcttt aaactattaa aattcttaag aaataaggct + 901 actttttctg ggtcttgttc atagtaggtg tggttctttt tttcgagtgt agcccatagc + 961 tttgagcgca tagtggatgg tagttggatg acagccaaag tcagaagcta tttcagtcaa + 1021 ataagcgtcg ggattgtcag taagatagtt tttaagtcta tctctatcaa cttttcttgg + 1081 ttttgttcct tttacttggt ggtttagctc tcctgttttc tcttttagct ttaaccagcc 
+ 1141 ataaatggta ttacgtgaga tttggaaaac gtgtgatgct tctgttatac tacctattcg + 1201 ctcacaataa gagagaactt ttttacgaaa atctattgaa tatgccataa gaagattata + 1261 ccacattgtg tactatatta gattgaaact agaatagtac atctctgctt ctaaaacatt + 1321 gttagaaatc gatttgactg tcctgaacga tttgttctgt tcttatttca ttttactata + 1381 tttttgtttc gcgggaagtc tactaagata cttaaagatg cagatagtaa aaataaaggt + 1441 gtagacatta ccgtaaaaaa gtgatataat cgtgtaatgt tcaatgtata ggtattaatc + 1501 atgagtagac gttttaaaaa atcacgttca cagaaagtga agcgaagtgt taatatagtt + 1561 ttgctgacta tttatttatt gttagtttgt tttttattgt tcttaatctt taagtacaat + 1621 atccttgctt ttagatatct taatctagtg gtaactgcgt tagtcctact agttgccttg + 1681 gtagggttac tcttgattat ctataaaaaa gctgaaaaat ttactatttt tctgttggtg + 1741 ttctctatcc ttgtcagctc tgtgtcgctc tttgcagtac agcagtttgt tggactgacc + 1801 aatcgtttaa atgcgacttc taattactca gaatattcaa tcagtgtcgc tgttttagca + 1861 gatagtgaga tcgaaaatgt tacgcaactg acgagtgtga cagcaccgac tgggactgat + 1921 aatgaaaata ttcagaaatt actagctgat atcaagtcaa gtcagaatac cgatttgacg + 1981 gtcaaccaga gttcgtctta cttggcagct tacaagagtt tgattgcagg ggagactaag + 2041 gccattgtcc taaatagtgt ctttgaaaac atcatcgagt cagagtatcc agactacgca + 2101 tcgaagataa aaaagattta taccaaggga ttcactaaaa aagtagaagc tcctaagacg + 2161 tctaagagtc agtctttcaa tatctatgtt agtggaattg acacctatgg tcctattagt + 2221 tcggtgtcgc gatcagatgt caacatcctg atgactgtca atcgagatac caagaaaatc + 2281 ctcttgacca caacgccacg tgatgcctat gtaccaatcg cagatggtgg aaataatcaa + 2341 aaagataaat tgactcatgc gggcatttat ggagttgatt cgtccattca caccttagaa + 2401 aatctctatg gggtggatat caattactat gtgcgattga acttcacttc gtttttgaaa + 2461 ttgattgatt tgttgggtgg aattgatgtt tataatgatc aagaatttac tgcccatacg + 2521 aatggaaagt attaccctgc aggcaatgtt catcttgatt cagaacaggc tctcggtttt + 2581 gttcgtgagc gctactccct agcagatggc gatcgtgacc gcgggcgcaa tcaacaaaag + 2641 gtgattgtgg ctatccttca aaaattaacg ttaaccgaag cgctgaaaaa ttatagtacg + 2701 atcattaata gcttgcaaga ttctatccaa acaaatatgc cacttgagac catgataaat + 2761 ttggtcaatg ctcagttaga 
aagtggaggg aattataaag taaattctca agatttaaaa + 2821 gggacaggtc ggatggatct tccttcttat gcaatgccag acagtaacct ctatgtgatg + 2881 gaaatagatg atagtagttt agctgtagtt aaagcagcta tacaggatgt gatggagggt + 2941 agatgaaatg atagacatcc attcgcatat cgtttttgat gtagatgacg gtcccaagtc + 3001 aagagaggaa agcaaggctc tcttggcaga atcctacagg cagggggtgc gaaccattgt + 3061 ctctacctct caccgtcgca agggcatgtt tgaaactccg gaagagaaga tatcagaaaa + 3121 ctttcttcag gttcgggaaa tagctaagga agtggcgagt gacttggtca ttgcttacgg + 3181 ggctgaaatt tactacacac cagatgttct ggataagctg gaaaaaaagc ggattccgac + 3241 cctcaatgat agtcgttatg ccttgataga gtttagtatg aacactcctt atcgcgatat + 3301 tcatagcgcc ttgagcaaga tcttgatgtt gggaattact ccagtcattg cccacattga + 3361 gcgctatgat gctcttgaaa ataatgaaaa acgagttcga gaactgatcg atatgggctg + 3421 ttacacgcaa gtaaatagtt cacatgtcct caaacccaaa ctttttggcg aacgttataa + 3481 attcatgaaa aaaagagctc agtatttttt ggagcatgat ctggttcatg tgattgcaag + 3541 tgatatgcac aatctagacg gtagacctcc tcacatgttc gaagcttata gcatagttgc + 3601 caaaaagtac ggggaagaga aggcgagaga actctttgaa gaaaatcctc gacaaattgt + 3661 aatgaatcaa ctaatttagg agaaatgatg aaagaacaaa atactatgga gattgatgta + 3721 tttcaattgt taaatacctt gtggaaacgg aaattgatta ttgctttggt tgctatcgta + 3781 acgggagcga ttgccttttc atatagtagc tttattataa aaccagagta taccagtaca + 3841 acgcgtattt atgtagtcaa ccgtaaccaa ggggataaat caggtttgac aaatcaggac + 3901 ttgcaggcag gttcatatct tgttaaagac tatcgtgaga tcattctttc ccaagatgta + 3961 ttagagaagg ttgtcacaga cttgcaactc gatatgccga ccaaaaatct tgctagtaaa + 4021 atacaagtaa ctgtaccagt tgatacacgt attgtttcta tttctgtcaa ggacaaacag + 4081 ccagaggaag caagtcgtat cgctaactcc ttgcgcaaga ttgcagctaa aaaaatcatt + 4141 agcgtaacgc gtgtgtctga tgtaacaaca ctcgaagaag cgcgaccagc cacttcccct + 4201 tcatctccaa atatccgtcg gaatactttg ataggttttc tcggaggatt aggggtggta + 4261 gttatggtcg ttctcttggt tgagttgcta gatgtccgtg tcaaacgacc agaggatatc + 4321 gaagacgata tgcaaattcc actcttagga gtcattccaa atttggataa attgaaatag + 4381 gagagaacga tgccaacatt agaaatcaca cagaaaaaat 
tggagatcgt aaaaaaggca + 4441 gaggagtact acaatgcctt gcgtacaaat atacagttaa gtggagataa tttgaaagtc + 4501 atctctatta cttcagttaa gccgggagaa ggaaagtcta caacctctac taacattgct + 4561 tgggcttttg cgcatgcagg ctataaaacc ctattaattg atgcggatat tcgtaactcg + 4621 gtcatgtcag gtgtttttag atctagtgag aagattactg gcttaacaga gtttttatca + 4681 ggtacaacag acttgtcaca aggtctatgt gataccaatg ttgaaaatct ctttgtcatt + 4741 caggcgggtt ccatttcacc aaaccccaca gctcttttac aaagtgagaa tttcagaacg + 4801 atgatagata ccctgcgtaa atattttgac tatatcattg tggatactgc tcccataggt + 4861 atcgtgattg atgcagttat tgtgacacag aaatgtgatg cttctgtttt gattacggca + 4921 gttggtgaag tacatcgccg tgatgttcaa aaggcgaaag aacacttgga acaaacaggc + 4981 aagccgtttt taggagttgt gctaagtaaa ctgaatactt caatagagaa atattcttct + 5041 tatgggggat atgggaacta tggaaataaa tagtcttaca gtaccaagat tatttgagat + 5101 gattactatg ggagggggag tttaaggtga tacagaatgg cattatctat attggcttta + 5161 aaagagttat ggatgttttt attggtttat ttggaacaat attcatcgtc ttgcctagtt + 5221 ccttaataat ttatattatc tataaaataa aaggttacaa aggaagtata ttcttcacac + 5281 aatatagagt ggggttgaag gggaaaaaat ttaaaattat taaatttaga tcaatggttg + 5341 aaaatgctga agaacttttg accgcaaata aagcactcta tgaaaaatat ataaataaca + 5401 gttacaaatt acctccaaat gaggatcctc gtcttactaa tatcggagat tttataagaa + 5461 aaacgagtat tgatgaaatt cctcaattta taaatttgat gttaggtgat atgagcctta + 5521 ttggacctag accaattttg gagaatgagt tagaggagta ttctaaggaa gaacagcaag + 5581 ttttgttatc tgtacggcca ggtattacag ggatgtggca agtttctggt aggagtgagg + 5641 tatattatcc tgaacgctgt gaaatggagc tgtattaccc tcggaatcaa tcctttttgt + 5701 tggatgtcaa aatcttcttt ttgacaatca aaaaagttct gtctggagaa ggggctcatt + 5761 gatgtatgaa ttaaatcatc tagcacgaaa tagatagaaa gatgaagttg aatacgaata + 5821 acgtttcttg ggtattcgta ttcatttttt aagcgaagga agcattagga ataagtggag + 5881 ttaatctagt attatttgct tgaaaaaatg aatgggaatt caatctaaag aattgttcag + 5941 tgaggcaaga ttttaggaat tggagttagg atgtagaaat gtcaaaaaag tataaaatta + 6001 tagtagcgac tcataaaaaa tttcaaatgc cagaagataa ggatttatat attcctgttc + 6061 
aggttggcag tgaaggaaag gaaaatttgg gctaccaacg agatgatcaa ggtaatcata + 6121 tctcacacct caatccttat tattgtgaat tgacaggatt atactgggct tggaaaaatt + 6181 tagactgtga ttacctagga ttagttcatt accgacgtta ttttacagac aggaaccgac + 6241 cttatcatga taagattaac atgaatgaag ttatcctatc ggcagatcaa gttaaggaat + 6301 tcatgtctga agtagatgtc gttgttccca aaaagagaaa atattatata gaaactctct + 6361 attctcatta tgctcacact cataattcca gtcatttaga tgtaacgcga gaaattataa + 6421 aagaggtttc gccagaatat ttagcaacat ttgacaaggt gatggactgt cgtagtggct + 6481 acatgttcaa tatgtttatc atgtccaaag aaaatgtatc atcttattgt gagtggttat + 6541 tccctatcat tgatgagttg tacagaagat tggatataac agggtactct acttttgatg + 6601 caagactatt tggacgtatt agtgagcgtc tctttaatgt ttggttagac taccaaaatc + 6661 tacgtgttaa agaagtaccg tttatgtata tggaaaaagt gaatttattt gagaagggca + 6721 aatccttctt gaaagccaag tatttcggaa aaaaatatgg acagagtttt taagttatgg + 6781 ttttgttatt acttactttt gcattctttt tagttttccc tgtgctgtca ataagtttaa + 6841 gtgttatagg gctagtaaat gacaaaaagc gttcaaaaat ctatttactt ctaattagtt + 6901 ttgcaatatc aattgttgcg ctgcgctata ttcctcatcc tatggatgat ggcgcttttc + 6961 attttcgtgc gactacgacc cttattcgct atgatagtat tttcgaaatg tttaaagcgt + 7021 tttctaatgg atggagagta gggaactatg actatggttc cataccaatt tttacttcat + 7081 taatgtatct tgttcgaaat actcatcact atagtttact gagttttatt tcagctttta + 7141 taacttactt tagttttggt tacgtagttg ttgagctatt taaggacctg ggcaaggttt + 7201 ctaaactatc gtatgctaca gtattaattg ctgtactatg tttaaataat tatagatata + 7261 caactagtgg aatgagattt tgtatggcag ttgccttgat gatgctttta ctatatttgg + 7321 agtcaaaaaa aggctatact agtttaaaaa caaccatatg gtatttgttg cctgtaggta + 7381 tccattcagc ggttatttat tttattggtt taaggttctt atttccatta atcaagaaag + 7441 tgacgcttgc taaaagttta tttgtattat taggttttcc tgttttgttc aacctagttc + 7501 catggttagc aaatttgatt ggttggactt acttacaatc atttattcgg aaaattgaag + 7561 tctactctga caattcatcc tattcccagt tttttaatac cacattaaca atgaggctat + 7621 atgttggaat agtgctgatg gttttatttg tattgttata tttgggaata gtaaattcat + 7681 tgaaaacaac tgatgattgg 
cgttttagtt ttgttacaat gacttattat gtaactctgt + 7741 tatctatggg ttcaatacca tttcgtaata tttatgatag aaatcttttc ttgctccttc + 7801 ctatgattgt agtttcaacc tacatattgt ttacatatag atatcaattg aaaattctta + 7861 ctaatcgtaa tattgtttat ggattaacga tgggtattct ttgtctatcc tgtgcagttg + 7921 gtgcatttta taataataat ttccctttta cttttattga ttttagtaag acagacttac + 7981 tcctaaaaaa tatttttcaa ttcttttcaa atttaccttt tacataataa gactatgtgc + 8041 tattatttta tttcttggag gattatatgg gactatctac agtaacattg tttaaaaatt + 8101 taaagttcac agatagtaaa tttattaaat tggaaggaga gctccttctt aaatatcaag + 8161 agtatttatt aaaaatcatg gaagatattg taacagtgtg tgaggaagaa gggttatact + 8221 attcactttc tggtgggagt gcgttaggag catatcgaca caaagggttt attccatggg + 8281 atgatgatat ggatatattt atgctaggaa gtgaacggga aattttcttt caaaaatttt + 8341 ctcagaaatt ctctgataag tattggatac ataattcaca aacaccaaac tatggcatgc + 8401 cgattggtcg tatcagacaa aaaggaacag ttctacgtgg tcgagaggat gtcggagttg + 8461 aagaatgtgg attttttatt gatatttttt ggcttgaaaa tgttcctaat tcaaaaatct + 8521 tgagacaact tcacggcttt ctctgcatgg cgattggatt gttactatca tgtagaaatt + 8581 tttataaaaa tcgtcagttg atgctggaga ttatgaagga acataaagaa ataaggcttg + 8641 tttttcgaat aaaactaatt ttagggtttc taactagctt tatatctttg agacaattta + 8701 caagacttac ggaaaggatc tattcattgt gcaagaataa tgaatcaaga taccttagtg + 8761 ttccttcagg aagaaaacat tattttggcg agatgtttat aagagaagat atgcagttaa + 8821 ctaggaaact aaattttgaa ggacataagt ggaatgttcc aaataatatt gagcattatt + 8881 taactgtaat gtacggtgat tatatgaaaa tacctgcagt tgaagatagg gaatcacata + 8941 tcattttaga aatctccttc cctagcgact aaacagactt tcatttttta tatgtaagga + 9001 attaatttaa tgaaaaaaat agctttagtg aaatggattt tggatgattc tggtggcggt + 9061 gagcgagttg ctgtatcttt ggcaaacgaa cttacaaaaa agtatgaagt tcatttgatt + 9121 ggaattacaa caaagcaatc ggatttattc tttggaatca attctcaagt aaaatactcc + 9181 aatttttttg accatcgagt acgcttgtct aagaatattc taaaaatctc aaaaatgtta + 9241 aaaaaatatt tcctagataa tgagatagag gttgcctttg ggatagggat attctctaat + 9301 atatttttat ccttgtcggg aataggaatt tctactaaag 
tagttttgtg tgatcatacc + 9361 aattcaatta cggctaatag agaactttct aagaaagtcc aaagatatgt tgggacaaag + 9421 ctagcagaca agattattac tcttacgcaa gaggatcgta aaaattatat acgaaaatac + 9481 ggcatttctg agaataggat tgcttacatc tataattgga aagaaaatcg tctttccaat + 9541 ataccttata atgatgagtc tactaaaatt gtaactgttg gtcgttttga ttatcaaaaa + 9601 ggatatgatt atcttatcca agtcgcgaaa aaagtgttag ctaaaatgcc tgactggact + 9661 tgggaaatct acggttccgg aaaacaagat gaagtagaca aaatcagaga tttaatcacc + 9721 gaaaatgatt tacaggataa gttagtcata aaaggacttg aaaaaaatca ggatctgatt + 9781 tatggagata aagggattta tgtcatgact tctcgttacg aaggtttacc gttggtattg + 9841 ttagaagctc aacaatacaa tcttcctatt gttagcttca gatgtccaac gggacctagt + 9901 gagattgttg aagatggggt caatggttat ctgatagatt gttatgatac cgataagatg + 9961 agtgagaaat tgcttgaatt gatgaaaaat gatgatttgc gacaatcttt ctcagatcat + 10021 gcaaaagata ctatggataa atttgataaa aataaaattc ttaatcagtg gatagagttg + 10081 attgagacaa tttaggagat aagatgcaag agtgtttatt gacaattgta atgcctagtt + 10141 ataatattca ggactacatt tccagaggaa tcgaatcatt ccagcaagta catccagatt + 10201 acaaacaaaa atttgaggtc ttaattgtga atgatggaag tacggacgac acagccaaag + 10261 tagcagaaga ggccctaaga aaagattcgt ttctgaatgg tcgtattatc acaaaggaaa + 10321 atggaggtca tggctcaaca attaatcgtg gtatccagga agcaaagggg aagttcttta + 10381 aagttattga tggggatgac tgggttatcc cgtcagagtt tgaaaagttt ttagataccc + 10441 tatcagttgc tggtgtggat atggttctta cggattttac agaacaacat gtttataaca + 10501 atactactgt tcgaaatgat tttattgaaa agtatgaggt tggtgaggaa tattctggaa + 10561 ttccagagag acggatccca atgcactcag taacctatag aacatctatc ctagtcgaca + 10621 atagaattcg tttaagtgaa aagacgtttt atgttgacat tcagtacact ctatttcctt + 10681 tagagtatgt tcatagtttc ggttattgga attatgatgt ttaccaatac tatatcggac + 10741 gacccgagca gagtatgaat attgagagta tgaaacgaaa tgttcgtcat catttgattg + 10801 taacaaattc tgtgctaggt tttttttcaa aaatttcagg ggatcctgtt ttaaagaaag + 10861 tggttgcaga tactttgggc tatcttatta gtttacagat tgatttgtca tggatggttg + 10921 aggattcaaa gacactatca gaagaattat acagacaaat tgagcagagt 
tcttatgagt + 10981 atatccctac gaaaaaattt gatagattgt cttatttgaa ctataagttt cactattttc + 11041 tagactttgt tttcaatcca gtattgaaaa aatattctaa aaagaaagaa aaagagagag + 11101 gaatttagaa tgctcattag tgttgttgtt ccggtttata atgtttctga ctatttacac + 11161 tttgccatgg atagtctgat aaagcaaaca tatcaaaatt ttgaagtaat ccttgtaaat + 11221 gatggttcaa cagataactc tcctcagtta tgtgaagagt atgctaagca atatgaaaac + 11281 gtctctgttt ttcataaaga aaatggaggg ttgtctgatg ctcgtaattt tggagtttca + 11341 aaagcatcat cagattggat tttctttcta gatccagatg attatttgga agattatact + 11401 ctagaattga tagtgaaaat tcaacaggaa catcaagcaa acttgatttc aactaaagta + 11461 aaggcaactt ctaaatataa tgattataat ccttatcaac ttgagaagtc agattataag + 11521 gatttgtgtg tttttacaaa agagaaggct cttgagctaa tgctagacga caagattgcg + 11581 acagtttctg cttgtgctaa gctttatcac aagaatatct tggaaaaagt tccatttcca + 11641 gttggaaaaa tctatgaaga cttttatgtg gtagcggatc accttgcctt agcggataaa + 11701 attgtgatta gtccacttga aacatataac tattaccgta gagaaggtag tattgtccgt + 11761 tcgactttta ctgagaaaag atatgatttt tttgatgctg tttcgaaaaa cgaagaagtt + 11821 ataaagaaag aatacacaca aagtctagaa ttacagcaat ttctgcaagc gaaaaaatta + 11881 cgaggaggct ttgttgtaat tggtgcaaag gctgactctg gtttaacaga tttttcgaaa + 11941 gatcgaaacc tattaaaagt tgattttaaa accatgttat taaataaaaa aatatcgtgg + 12001 aaactaaaat taaaatatac aatatttatg ctgtcatcta aagtatattt aagattaagg + 12061 tagtatagta gattaatgta tttgataaga atatcgagta ttttaagaaa cgaggaaata + 12121 tgaaacgagg aaatatgaaa caggcttata taataattgc acataataag tttgaacagt + 12181 tgaaattttt aatttctctg ttggattata aggaacatga tatttttatt attgtaggca + 12241 gcaaagttaa tgtgggggag tctacaatta cttcgcttaa gtccagtgca atacattcca + 12301 atgtcattct cgtagataga gttcctattt attggggaaa ttattcacta agttctgcag + 12361 agatgttagg atttcgttat gcatataatt acgataacta tagtatgttc catttgttat + 12421 caggtgtaga tttaccatta gtgtcggcag acaaattatt taaattcttt gatcagaaca + 12481 aatcaaataa ttttttgagc atggtctctg atgagatttt gaaatcaaat aaagtgtatg + 12541 agcgtgtaaa atttagatac ttatttccta gattcttagc tagaaatatt 
cagaacaaat + 12601 atgttcgtaa atttgtagca tattaccgta agctagagat taaaattcaa cgtttaatga + 12661 aaatagattg ttttaaaaaa tataacatga gattgggtta tgcatctaac tgggtatcta + 12721 ttaatcagga tttagttaga ataatactag aagaagagaa aaatattgaa aaaatattta + 12781 aatattcgat agtaaatgat gaactgttca ttcctacgat aatgtataaa tacaatttga + 12841 tggaatcgtt atattcatct tcaccgataa cagatgcccc aaatgatttt caaggaaatc + 12901 taagatatat caattggtgg gatggagatc ctcatacctg gactgactct gagcatgata + 12961 tagaacaatt gaagcgtggt aaagctttag gtcataagtt ttctagaaaa tttgatttag + 13021 agaaatatcc gaatcttaaa gaagaaattc taattatcat aaataggaca gattgatatg + 13081 aaagtactaa aaaattacgc ctataacctc tcctatcaac tattactcat tatactacct + 13141 atcattacaa ctccctatgt gacacgggtc ttttctttga atgatctagg gacttatggt + 13201 tattttaact ccatcgttac ttattttatt cttttagcaa ctttaggagt tgctaactat + 13261 gggaccaagg tcatttcagg gcatcgcaag gaaattgaaa aaaatttttg ggggatttac + 13321 tccctgcaat tgggtgcgac agttctttct atgtttttgt accttgttct ttgtctaatt + 13381 cttcctttta tgcaaaatcc attcgcctat attctaggct tgagtttggt ttctaaaggc + 13441 ttagatattt cctggctctt tcaaggatta gaggattttc gtaagattac agcaagaaat + 13501 atcattgtga aactcgtagg tgtaagttcg atttttttat ttataaaatc agctagtgac + 13561 ctttaccttt acgtatttct tttgacaata tttgagttgt tgggacagtt aagcatgtgg + 13621 ttacccgctc gggaatttat tgggaaacca tattttgatt taagctatgc aaagcagcat + 13681 ctgaagccaa ttgttttatt attccttcct caggtagcga tctccttata tgttactcta + 13741 gaacgtacga tgcttggtgc tttatcttct acaaaagatg taggaattta tgatcaggct + 13801 cttaaattgg taaatatttt attaacattg gtaacatcgc ttgggagtgt tatgttacct + 13861 cgagttgcta atttattagc aacaggtgat tacaaagctg ttaataagat gcatgaaatg + 13921 tccttcctca tttataattt agtgattttt ccaattatgg ctggaatttt gattgtgaat + 13981 gatgattttg ttcagttttt ccttggtcaa gattttcagg atgcacgtta tgcaatcgcc + 14041 attatgatct tccgtatgtt cttcatcggt tggaccaata taatgggaat tcagatttta + 14101 attccccata ataaaaataa agaattcatg atttcaacaa cagcttctgc aattatcagt + 14161 gtaggattaa acatgctttt cctaccaaag cttggctata ttggagcagc 
cattgtttct + 14221 gtattaacag aagcacttgt atgggcaatt caattgttct atactcgcag atatctcaaa + 14281 gaagttccta tcatagtatc tatgacaaaa attgttctag catcagttat catgtatggc + 14341 attttgctag gttcaaaaat atttatacat ttttccccga ctataaatgt tctagcattt + 14401 gcagtacttg gtggaatcat ttaccttttt gcaattttat ctatgaaagt aatagatgtg + 14461 aaagaattaa aacaaatcat aaaaaaataa tggagtgtaa tatgtacgac tatttaatcg + 14521 ttggagctgg tttgtctgga gcaatcttcg cgcacgaagc cacaaaacgt ggtaaaaaag + 14581 taaaagtgat tgataaacgt gatcacatag gtgggaacat ctactgtgag aacgtagaag + 14641 ggatcaatgt tcataaatat ggtgcccata tcttccatac ttctaataaa aaagtttggg + 14701 actatgtcaa tcaattcgct gagtttaaca actatatcaa ctcacctgtc gcaaactata + 14761 aaggaagtct ctataatctt cctttcaata tgaatacttt ctatgctatg tgggggacaa + 14821 aaactccaca ggaagtgaaa gataagattg ctgagcagac agctgatatg aaggatgttg + 14881 aaccgaaaaa tctggaagaa caagccatca agttgattgg tccagatatc tatgaaaagt + 14941 tgatcaaggg atatactgaa aagcaatggg gacgcttcgc gacagaactt cctccattta + 15001 tcattaaacg ccttccagtt cgtctaacct ttgataataa ctattttaac gaccgttacc + 15061 aaggaattcc tattggtggt tacaatgtca ttatcgaaaa catgcttaaa gacgttgaag + 15121 ttgagcttgg tgttgatttc tttgctcacc gtgaagagtt agaagcatca gctgaaaaag + 15181 ttgtcttcac aggaatgatc gaccagtatt ttgactacaa gcacggcgag ttagaatacc + 15241 gtagtcttcg ttttgagcat gaaactttgg acgaggagaa ttatcaagga aatgctgtag + 15301 tgaactatac agagtgtgaa atcccttata ctcgcattat tgagcataaa cattttgagt + 15361 acggtacaca agataaaacg gttattactc gtgaatatcc agctgattgg aagcgtgggg + 15421 acgagcccta ctatccgatc aacgatgaga aaaataatgc tatgtttgct aagtaccaag + 15481 aggaagcagc gcagaatgat aaagttatct tttgtgggcg tttagcagat tataaatatt + 15541 acgatatgca tgtggtgatt gaacgggcgc ttgaggttgt ggagaaagag ttaggtaact + 15601 aaagatgcct ctttgtcaac tgcagtgggt tgaagtcggc taagctcgag aaaggacaaa + 15661 attcgtcctt tcttttttga tgttcagagc gataaaaatc ctttttttga agttttcaaa + 15721 gttccgaaat ccaaaggcgt ttcgtttgat aagtttgatg agattattgg tcgcttccaa + 15781 ttttgcgttg gaataaggta attgaagagc gttgacgatt ttttctttgt 
tctttagaaa + 15841 ggttttaaag acagtctgaa aaataggatg aacctgcttc agattgtcct caatgagtcc + 15901 gaaaaatttc tccggttcct tattctgaaa gtgaaaaagt aagagttgat agatctgata + 15961 gtggtgtttc aagtcttctg aatagcttaa aatcttgtca agaatttctt tatttgttaa + 16021 gtgcatgcga aaagtagggc gataaaaacg tttatcgctc aatttacgac tatcctgttg + 16081 gatgagtttc cagtaacgtt tgatagcctt gtattcatga gattttcgtt caaactgatt + 16141 cataatttga acacgaaaac gactcatggc acggctgaga tgttggataa tatggaaacg + 16201 atctagaacg attttagcac acggaaaaag ctgtttagcc aagtcatagt aaggactaaa + 16261 catatccatc gtaatgattt tcacttgaca acgaacggct ctatcgtagc gaagaaagtg + 16321 atttcggatg acagcttgtg ttctgccttc aagaacagtg ataatattaa gattatcaaa + 16381 atcttgcgca atgaagctca tctccatctc ccgattgaaa cagtcactcc ccggactgtt + 16441 tcaacctccc aagacataat ctcaggcaga tttctaaaat tacactcaaa gtggaagtca + 16501 ttgagcttgc gaatgacagt tgaagttgaa atggccagct gatgggcaat atcagtcata + 16561 gaaatttttt caattaactt ttgagcaatt ttttggttga tgatacgagg gatttggtga + 16621 tttttcttta ccaggggagt ctcagcaacc atcatttttg aacagtgata gcacttgaaa + 16681 cggcgttttc taaggagaat tctagaaggc ataccagttg tttcgaggta agggatctta + 16741 gacggttttt gaaagtcata tttcttcatt agacttccac aatcagggca agatggagcc + 16801 tcataatcca gcttagcgat aatttctttg tgggtatcca tattgatgat atctagaatc + 16861 ttgatgtttg ggtctttaat atcgagcagt tttgtgataa aatgtaattg ttccatatga + 16921 atctttctaa tgagttgttt tgtcgctttt cattataggt catatgggac tttttttcta + 16981 cacaaaaata ggctccataa tatctataag ggatttaccc actacaaata ttatagagcc + 17041 ataagaaatc tccagattag gaactatccg tgagttctct agtctggaga tttttcaata + 17101 gacttcgtta ttgggcggtt acaatgatat tcatattttt tgcaaagatg ttgtttgaaa + 17161 aataattttc aaaaattctg aaaattctgt tgacaacttt ctgaaaagag tctataatgg + 17221 agagaaagtt ttaaaggaga aaatgatgaa aagttcaaaa ctacttgccc ttgcgggcgt + 17281 gacattattg +// + diff --git a/public/res/serotype_genbank/serotype_10B.gb b/public/res/serotype_genbank/serotype_10B.gb new file mode 100644 index 0000000..45839ff --- /dev/null +++ 
b/public/res/serotype_genbank/serotype_10B.gb @@ -0,0 +1,749 @@ +LOCUS CR931650 16991 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 423/82 (serotype 10b). +ACCESSION CR931650 +VERSION CR931650.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 16991) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 16991) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..16991 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="423/82" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC10B_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC10B_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI34724.1" + /db_xref="UniProtKB/TrEMBL:Q4JZI8" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVELL" + gene 293..445 + /gene="aliB" + /locus_tag="SPC10B_0002" + /pseudo + CDS 293..445 + /gene="aliB" + /locus_tag="SPC10B_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + /db_xref="PSEUDO:CAI34725.1" + gene complement(459..968) + /gene="tnp" + /locus_tag="SPC10B_0003" + /pseudo + CDS complement(459..968) + /gene="tnp" + /locus_tag="SPC10B_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase (fragment)" + gene 1204..2649 + /gene="wzg" + /locus_tag="SPC10B_0004" + CDS 1204..2649 + /gene="wzg" + /locus_tag="SPC10B_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI34727.1" + /db_xref="GOA:Q4K2E4" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K2E4" + /translation="MSRRFKKSSSQKVKRNVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTVLVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLVDSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLM + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYHVRLNFTSFLKLIDLLGGIDVYNDQ + EFTAHTNGKYYPAGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1204..1320 + /gene="wzg" + /locus_tag="SPC10B_0004" + /note="Signal peptide 
predicted for SPC0381 by SignalP 2.0 + HMM (Signal peptide probability 0.997) with cleavage site + probability 0.550 between residues 39 and 40" + misc_feature 1408..1755 + /gene="wzg" + /locus_tag="SPC10B_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 8.8e-63" + misc_feature 1933..2376 + /gene="wzg" + /locus_tag="SPC10B_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 4.1e-68" + gene 2651..3382 + /gene="wzh" + /locus_tag="SPC10B_0005" + CDS 2651..3382 + /gene="wzh" + /locus_tag="SPC10B_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34728.1" + /db_xref="GOA:Q4K2E3" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K2E3" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAEAYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMDTPYRDIHSALSKILMLGITPVIAHIERYDALEQNEKRVRELIAMGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEHDLVHVIASDMHNLDGRPPHMFEAYSIVA + KKYGEEKARELFEENPRQIVMNQLI" + misc_feature 2654..3262 + /gene="wzh" + /locus_tag="SPC10B_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 1.5e-39" + gene 3388..4083 + /gene="wzd" + /locus_tag="SPC10B_0006" + CDS 3388..4083 + /gene="wzd" + /locus_tag="SPC10B_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34729.1" + /db_xref="GOA:Q4K2E2" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K2E2" + /translation="MMKEQNTMEIDVIQLLNTLWKRKLIIALVAIVTGAIAFAYSSFI + IKPEYTSTTRIYVVNRNQGDKSGLTNQDLQAGSYLVKDYREIILSQDVLEKVVTDLQL + DMPTKNLASKIQVTVPVDTRIVSISVKDKQPEEASRIANSLRKIAAKKIISVTRVSDV + TTLEEARPATSPSSPNIRRNTLIGFLGGLGVVVMVVLLLELLDVRVKRPEDIEDVMQI + PLLGVIPNLDKLK" + misc_feature 3409..3825 + /gene="wzd" + 
/locus_tag="SPC10B_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 1.5e-53" + misc_feature 3931..4008 + /gene="wzd" + /locus_tag="SPC10B_0006" + /note="PS00217 Sugar transport proteins signature 2." + gene 4093..4776 + /gene="wze" + /locus_tag="SPC10B_0007" + CDS 4093..4776 + /gene="wze" + /locus_tag="SPC10B_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34730.1" + /db_xref="GOA:Q4K2E1" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K2E1" + /translation="MPTLKITQKKLEIVKKAEEYYNALRTNIQLSGDNLKVISITSVK + PGEGKSTTSTNIAWAFAHAGYKTLLIDADIRNSVMSGVFRSSEKITGLTEFLSGTTDL + SQGLCDTNVENLFVIQAGSISPNPTALLQSENFRTMIDTLRKYFDYIIVDTAPIGIVI + DAVIVTQKCDASVLITAVGEVHRRDVQKAKEHLEQTGKPFLGVVLSKLNTSIEKYSSY + GGYGNYGNK" + gene 4830..5465 + /gene="wcjG" + /locus_tag="SPC10B_0008" + CDS 4830..5465 + /gene="wcjG" + /locus_tag="SPC10B_0008" + /note="member of homology group 50" + /codon_start=1 + /transl_table=11 + /product="putative initial sugar transferase" + /protein_id="CAI34731.1" + /db_xref="GOA:Q4K2E0" + /db_xref="InterPro:IPR003362" + /db_xref="UniProtKB/TrEMBL:Q4K2E0" + /translation="MIQNGIIYIGFKRVMDVFIGLFGTIFIVLPSSLIIYIIYKIKGY + KGSIFFTQYRVGLKGKKFKIIKFRSMVENAEELLTANKALYEKYINNSYKLPPNEDPR + LTNIGDFIRKTSIDEIPQFINLMLGDMSLIGPRPILENELEEYSKEEQQVLLSVRPGI + TGMWQVSGRSEVYYPERCEMELYYPRNQSFLLDVKIFFLTIKKVLSGEGAH" + misc_feature 4863..5462 + /gene="wcjG" + /locus_tag="SPC10B_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 2.9e-56" + gene 5682..6476 + /gene="wciB" + /locus_tag="SPC10B_0009" + CDS 5682..6476 + /gene="wciB" + /locus_tag="SPC10B_0009" + /note="member of homology group 16" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34732.1" + /db_xref="GOA:Q4K2D9" + /db_xref="UniProtKB/TrEMBL:Q4K2D9" + 
/translation="MSKKYKIIVATHKKFQMPEDKDLYIPVQVGSEGKENLGYQRDDQ + GNHISHLNPYYCELTGLYWAWKNLDCDYLGLVHYRRYFTDRNRPYHDKINMNEVILSA + DQVKEFMSEVDVVVPKKRKYYIETLYSHYAHTHNSSHLDVTREIIKEVSPEYLATFDK + VMDCRSGYMFNMFIMSKENVSSYCEWLFPIIDELYRRLDITGYSTFDARLFGRISERL + FNVWLDYQNLRVKEVPFMYMEKVNLFEKGKSFLKAKYFGKKYGQSF" + gene 6480..7730 + /gene="wzy" + /locus_tag="SPC10B_0010" + CDS 6480..7730 + /gene="wzy" + /locus_tag="SPC10B_0010" + /note="member of homology group 67" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI34733.1" + /db_xref="UniProtKB/TrEMBL:Q4K2D8" + /translation="MVLLLLTFAFFLVFPVLSISLSVIGLVNDKKRSKIYLLLISFAI + SIVALRYIPHPMDDGAFHFRATTALIRYDSIFEMFKAFSNGWRVGNYDYGSIPIFTSL + MYLVRNTHHYSLLSFISAFITYFSFGYVVVELFKDLGKVSKLSYATVLIAVLCLNNYR + YTTSGMRFCMAVALMMLLLYLESKKGYTSLKTTIWYLLPVGIHSAVIYFIGLRFLFPL + IKKVTLAKSLFVLLGFPVLFNLVPWLANLIGWTYLQSFIRKIEVYSDNSSYSQFFNTT + LTMRLYVGIVLMVLFVLLYLGIVNSLKTTDDWRFSFVTMTYYVTLLSMGSIPFRNIYD + RNLFLLLPMIVVSTYILFTYRHQLKILTNRNIVYGLTMGILCLSCAVGAFYNNNFPFA + FIDFSKTDLLLKNIFQFFSNLPFT" + misc_feature 6480..6560 + /gene="wzy" + /locus_tag="SPC10B_0010" + /note="Signal peptide predicted for SPC0387 by SignalP 2.0 + HMM (Signal peptide probability 0.900) with cleavage site + probability 0.260 between residues 27 and 28" + gene 7740..8675 + /gene="wcrB" + /locus_tag="SPC10B_0011" + CDS 7740..8675 + /gene="wcrB" + /locus_tag="SPC10B_0011" + /note="member of homology group 87" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="CAI34734.1" + /db_xref="GOA:Q4K2D7" + /db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4K2D7" + /translation="MLLFYFLEDYMGLSTVTLFKNLKFTDSKFIKLEGELLLKYQEYL + LKIMEDIVTVCEEEGLYYSLSGGSALGAYRHKGFIPWDDDMDIFMLGSERKIFFQKFS + QKFSDKYWIHNSQTPNYGMPIGRIRQKGTVLRGREDVGVEECGFFIDIFWLENVPNSK + ILRQLHGFLCMGIGLLLSCRNFYKNRQLMLEIMKEHKEVRLVFRIKLVLGFLTSFISL + RQFTRLTESIYSLCKNNKSRYLSVPSGRKHYFGEMFIREDMQLTRKLSFEGHKWNVPN + 
NIEHYLTVMYGDYMQIPAVEDRESHIILEISFPNE" + misc_feature 7902..8600 + /gene="wcrB" + /locus_tag="SPC10B_0011" + /note="HMMPfam hit to PF04991, LICD Protein Family, score + 1.7e-24" + gene 8714..9802 + /gene="wcrC" + /locus_tag="SPC10B_0012" + CDS 8714..9802 + /gene="wcrC" + /locus_tag="SPC10B_0012" + /note="member of homology group 24" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34735.1" + /db_xref="GOA:Q4K2D6" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K2D6" + /translation="MKKIAIVRYNLSKIGGAEKVAINMANELSQYYDVKLLSILLDED + GFINYDINPNVTLINFHKGDLRIRTATLKLTGKLREYIKREKIEVIFSITPLTNTMVR + LATLGLNVKIVFCDHHSLEFRDFRSREVQRFVGAKFFDKIVTLTEEDRIKYSDKYNIP + INKVNAIYNWIDEEDSENTPFDNKTNKIITVGRFHSQKGYDYLAEVAIKVLSQHPDWQ + WDIYGSGDKLIEQELKRKLEEGYVSSQVNFKENVKGTENIYPNHSIYVMTSRYEGLPL + VLLEAQQYNLPIVSFRCPTGPSEIVEDRINGFLIDCYDVDQMSEKLLELMKNDDLRQS + FSEHAKDNMDKFDKNKILNQWIELIETI" + misc_feature 9227..9739 + /gene="wcrC" + /locus_tag="SPC10B_0012" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 1.5e-37" + gene 9811..10815 + /gene="wcrD" + /locus_tag="SPC10B_0013" + CDS 9811..10815 + /gene="wcrD" + /locus_tag="SPC10B_0013" + /note="member of homology group 32" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34736.1" + /db_xref="GOA:Q4K2D5" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K2D5" + /translation="MQECLLTIVMPSYNIQDYISKGIESFQQVHPDYKQKFEILIVND + GSTDDTAKVAEEVLRKDSLLNGRIITKENGGHGSTINRGIQEAKGKFFKVIDGDDWVI + PSEFEKFLDALTVTEVDMILTDFTEQHVYNNTTVRNDFVEKYEIGKEYSGIPEKRIPM + HSVTYRTSILVENGIRLSEKTFYVDIQYTLFPLEYVHSFCYWNYDVYQYYIGRPEQSM + NIESMKRNVRHHLTVTNSVLTYFSKIADDPVLKKVVADTLVYLISLQVDLSWMVEDSK + TLSEELYRQIEQSSYEYIPTKKFDRLSYLNYKSHYFLGFIFNSILKKYSKKKEKERGV + " + misc_feature 9829..10332 + /gene="wcrD" + /locus_tag="SPC10B_0013" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 9.7e-29" + gene 10817..11770 + /gene="wciF" + 
/locus_tag="SPC10B_0014" + CDS 10817..11770 + /gene="wciF" + /locus_tag="SPC10B_0014" + /note="member of homology group 25" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34737.1" + /db_xref="GOA:Q4K2D4" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K2D4" + /translation="MFISVVVPVYNVSDYLHFAMDSLIKQTYQNFEIILVNDGSTDNS + PQLCEEYAKRYENVSVFHKENGGLSDARNLGVSKASSEWIFFLDPDDYLEDYTLELIV + KIQQEHQADLISTKVKATSKYNDYSPYQLEESDYKALCVVTKEKALELMLDDKIATVS + ACAKLYHKSILEKIPYPVGKIYEDFYVVADHLALAHKIVISPLETYNYYRREGSIVRS + TFTEKRYDFFDAVSKNEQVINKEYTQSLELQQSLQAKKLRGGFVVIGAKADSGLTDFS + KDRDLLKVDFKNMLLNKKISWKLKLKYTIFMLSSKMYLRLR" + misc_feature 10826..11341 + /gene="wciF" + /locus_tag="SPC10B_0014" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 4.5e-44" + gene 11829..12770 + /gene="wcrG" + /locus_tag="SPC10B_0015" + CDS 11829..12770 + /gene="wcrG" + /locus_tag="SPC10B_0015" + /note="member of homology group 102" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34738.1" + /db_xref="GOA:Q4K2D3" + /db_xref="InterPro:IPR003406" + /db_xref="UniProtKB/TrEMBL:Q4K2D3" + /translation="MKQAYIIIAHNKFEQLKFLISLLDYKEHDIFIIIDSKVNVGEST + ITSLKSSAIHSNVILVDSVPIYWGSNSQISAEMLGFRYAYNYDNYSMFHLLSGVDLSL + VQADKLFKFFDQNKSRNFLSTVSDEILKSNKVYERVQFRYLFPRFLARNIQNKYVRKF + VAYYRKLEIKIQSSMKIDCFKKYNMRLSYASNGGSINQDLVRIILEEEKNIEKIFKHS + IVNDELFIPTIMYKYNLMESLYSSSPITDDPDDFQGNLRYINWWDGNPHIWTDSEHDI + EQLKRGKSLGHKFSRKFDLERYPSLKEEILIIINRTD" + gene 12772..14184 + /gene="wzx" + /locus_tag="SPC10B_0016" + CDS 12772..14184 + /gene="wzx" + /locus_tag="SPC10B_0016" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI34739.1" + /db_xref="GOA:Q4K2D2" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K2D2" + /translation="MKVLKNYAYNLSYQLLLIILPIITTPYVTRVFSLNDLGTYGYFN + SIVTYFILLATLGVANYGTKVISGHRKEIEKNFWGIYSLQLGATVLSMFLYLVLCLTL + 
PFMQNPVAYILGLSLVSKGLDISWLFQGLEDFRKITARNIIVKLVGVSSIFLFIKSAS + DLYLYVFLLTIFELLGQLSMWLPAREFIGKPHFDLSYAKQHLKPIVLLFLPQVAISLY + VTLNRTMLGALSSTKDVGIYDQALKLVNILLTLVTSLGSVMLPRVANLLATGDYKAVN + KMHEMSFLIYNLVIFPIMAGILIVNDDFVQFFLGQDFQDARYAIAIMIFRMFFIGWTN + IMGIQILIPHNKNKEFMISTTVSAIISVGLNMLFLPKLGYIGAAIVSVLTEALVWAIQ + LFYTRRYLKEVPIIVSMTKIVLASVIMYGILLGSKIFIHFSPTINVLAFAVLGGIIYL + FAILSMKVIDVKELKQIIKK" + misc_feature 12778..13572 + /gene="wzx" + /locus_tag="SPC10B_0016" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 5.5e-67" + gene 14184..15296 + /gene="glf" + /locus_tag="SPC10B_0017" + CDS 14184..15296 + /gene="glf" + /locus_tag="SPC10B_0017" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI34740.1" + /db_xref="GOA:Q4K2D1" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR006076" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K2D1" + /translation="MECNMYDYLIVGAGLSGAIFAHEATKRGKKVKVIDKRDHIGGNI + YCENVEGINVHKYGAHIFHTSNKKVWDYVNQFAEFNNYINSPVANYKGSLYNLPFNMN + TFYAMWGTKTPQEVKDKIAEQTADMKDVAPKNLEEQAIKLIGPDIYEKLIKGYTEKQW + GRFATELPPFIIKRLPVRLTFDNNYFNDRYQGIPIGGYNVIIENMLKDVEVELGVDFF + AHREELEASAEKVVFTGMIDQYFDYKHGELEYRSLRFEHETLNEENYQGNAVVNYTER + EIPYTRIIEHKHFEYGTQDKTVITREYPADWKRGDEPYYPINDEKNNAMFAKYQEEAA + QNDKVIFCGRLADYKYYDMHVVIERALEVVEKELGN" + misc_feature 14631..15233 + /gene="glf" + /locus_tag="SPC10B_0017" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 2.3e-137" + gene complement(order(15335..15919,15973..16641)) + /gene="tnp" + /locus_tag="SPC10B_0018" + /pseudo + CDS complement(join(15335..15919,15973..16641)) + /gene="tnp" + /locus_tag="SPC10B_0018" + /note="member of homology group 13" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1167 transposase" + /db_xref="PSEUDO:CAI34741.1" + misc_feature complement(join(15839..15919,15973..16185)) + /gene="tnp" 
+ /locus_tag="SPC10B_0018" + /note="HMMPfam hit to PF01610, Transposase, score 4.3e-43" + /pseudo + gene 16944..>16991 + /gene="aliA" + /locus_tag="SPC10B_0019" + CDS 16944..>16991 + /gene="aliA" + /locus_tag="SPC10B_0019" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34742.1" + /db_xref="UniProtKB/TrEMBL:Q4K2C2" + /translation="MMKSSRLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcgta taaaaacaag + 181 ggaggactgt ataaaagaca gaaatccttt gttttttata accaaggttt ataaactttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga agatgaacat + 301 aaagaagcgt gtccttagtg caggtctgac ttttgcatct gctttgcttt tagctgcttg + 361 cggccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaattac ctgttagact attaagctga taatatagtc aatcgaaaca agaacaagac + 481 aaaagagcct tgtaaaaggt attgcaactt ggtaatacct ttttgaggtg ctttttgata + 541 tgagcccatg ttttctcaat aggattgtac tcaggtgagt agggaggaag aggtaacagt + 601 ttatgcccaa actcctcgca taaaagttct agcttcccca ttctatggaa tcttgcatta + 661 tccataataa taaccgatgg tgtggttaat gttggtaaga gaaacttctg aaaccaagct + 721 tcaaaaaagt cgctcgtcat cgtctcttcg taagtcattg gagcaattaa ctcaccattt + 781 gttagctctg caaccaaaga aatcctctga tatcttcttc cagatacttt gcctcttctt + 841 aactgacctt ttaatgagcg accatattct cgataaaaat aagtatcgaa tcctgtttcg + 901 tcaatctaaa caggtgctag gtgctttaaa ctattaaaat tcttaagaaa taaggctact + 961 tttctgggtc ttgttcataa ttggattgaa actagaatag tacacctctg cttctaaaac + 1021 attgttagaa atcgatttga ctgtcctgat cgttttgtca tgttcttatt tcattttact + 1081 atatttttgg ttcgcgggaa gtctactaag atacttaaag atgcagatag tgaaaataaa + 1141 ggtgtagaca ttaccgtaaa aaagtgatat aatcgtatga tgttcaatgt ataggtgtta + 1201 atcatgagta gacgttttaa aaaatcaagt tcacagaaag tgaagcgaaa tgttaatata + 1261 gttttgctga ctatttattt attgttagtt tgttttttat tgttcttaat ctttaagtac + 1321 aatatccttg cttttagata tcttaatcta 
gtggtaactg tgttagtcct actagttgcc + 1381 ttggtagggt tactcttgat tatctataaa aaagctgaaa agtttactat ttttctgttg + 1441 gtgttctcta tccttgtcag ctctgtgtcg ctctttgcag tacagcagtt tgttggactg + 1501 accaatcgtt taaatgcgac ttctaattac tcagaatatt caatcagtgt cgctgtttta + 1561 gtagatagtg agatcgaaaa tgttacgcaa ctgacgagtg tgacagcacc gactgggact + 1621 gataatgaaa atattcagaa actactagct gatatcaagt caagtcagaa taccgatttg + 1681 atggtcaacc agagttcgtc ttacttggca gcttacaaga gtttgattgc aggggagact + 1741 aaggccattg tcctaaatag tgtctttgaa aatatcatcg agtcagagta tccagactac + 1801 gcatcgaaga taaaaaagat ttataccaag ggattcacta aaaaagtaga agctcctaag + 1861 acgtctaaga atcagtcttt caatatctat gttagtggaa ttgacaccta tggtcctatt + 1921 agttcggtgt cgcgatcaga tgtcaatatc ctgatgactg tcaatcgaga taccaagaaa + 1981 atcctcttga ccacaacgcc acgtgatgcc tatgtaccaa tcgcagatgg tggaaataat + 2041 caaaaagata aattgactca tgcgggcatt tatggagttg attcgtccat tcacacctta + 2101 gaaaatctct atggagtgga tatcaattac catgtgcgat tgaacttcac ttcgtttttg + 2161 aaattgattg atttgttggg tggaattgat gtttataatg atcaagaatt tactgcccat + 2221 acgaatggaa agtattatcc tgcaggcaat gttcatcttg attcagaaca ggctctcggt + 2281 tttgttcgtg agcgctactc cctagcagat ggcgatcgtg accgtggtcg caaccaacaa + 2341 aaggtgattg tggctatcct tcaaaaatta acgtcaaccg aagcactgaa aaattatagt + 2401 acgatcatta atagcttgca agattctatc caaacaaata tgccacttga gactatgata + 2461 aatttggtca atgctcagtt agaaagtgga gggaattata aagtaaattc tcaagattta + 2521 aaaggtacag gtcggacgga tcttccttct tatgcaatgc cagacagtaa cctctatgtg + 2581 atggaaatag atgatagtag tttagctgta gttaaagcag ctatacagga tgtgatggag + 2641 ggtagatgaa atgatagaca tccattcgca catcgtcttt gatgtagatg atggtcccaa + 2701 gtcaagggag gaaagcaagg ctctcttggc agaagcctac agacaggggg tgcgaaccat + 2761 tgtctctacc tctcaccgtc gcaagggcat gtttgaaact ccggaagaga agatagcaga + 2821 aaactttctt caggttcggg aaatagctaa ggaagtggcg agtgacttgg tcattgctta + 2881 cggggctgaa atttactaca caccagatgt tctggataag ctggaaaaaa agcggattcc + 2941 gaccctcaat gatagtcgtt atgctctcat tgagtttagt atggatacac 
catatcgtga + 3001 cattcatagt gcattaagca aaatcttgat gttgggtatt accccagtca ttgcccatat + 3061 cgagcgctac gatgctcttg aacaaaatga aaagcgtgtt cgtgagctga ttgcaatggg + 3121 gtgttacaca caagtaaata gttcacacgt cctcaaaccc aagctatttg gagaacgcta + 3181 caagttcatg aaaaaaagag ctcagtattt tttggagcat gatctggttc atgtgattgc + 3241 aagtgatatg cacaatctag acggtagacc tcctcacatg ttcgaagctt atagcatagt + 3301 tgccaaaaag tacggggaag agaaggcgag agaactcttt gaagaaaatc ctcgacaaat + 3361 tgtaatgaat caactaattt aggagaaatg atgaaagaac aaaatactat ggagattgat + 3421 gtaattcaat tgttaaatac cttgtggaaa cggaaattga ttattgcttt ggttgctatc + 3481 gtaacgggag cgattgcctt tgcatatagt agctttatta taaaaccaga gtataccagt + 3541 acaacgcgta tttatgtagt caaccgtaac caaggggata aatcaggttt gacaaatcag + 3601 gacttgcagg caggttcata tcttgttaaa gactatcgtg agatcattct ttcccaagat + 3661 gtattagaga aggttgtcac agacttgcaa ctcgatatgc cgaccaaaaa tcttgctagt + 3721 aaaatacaag taactgtacc agttgataca cgtattgttt ctatttctgt caaggacaaa + 3781 cagccagagg aagcaagtcg tatcgctaac tccttgcgca agattgcagc taaaaaaatc + 3841 attagcgtaa cgcgtgtgtc tgatgtaaca acactcgaag aagcgcgacc agccacttcc + 3901 ccttcatctc caaatatccg tcggaatact ttgataggtt ttctcggagg attaggggtg + 3961 gtagttatgg tcgttctctt gcttgagttg ctagatgtcc gtgtcaaacg accagaggat + 4021 atcgaagacg ttatgcaaat tccactctta ggagtcattc caaatttgga taaattgaaa + 4081 taggagagaa cgatgccaac attaaaaatc acacagaaaa aattggagat cgtaaaaaag + 4141 gcagaggagt actacaatgc cttgcgtaca aatatacagt taagtggaga taatttgaaa + 4201 gtcatctcta ttacttcagt taagccggga gaaggaaagt ctacaacatc tactaacatt + 4261 gcttgggctt ttgcgcatgc aggctataaa accctattaa ttgatgcgga tattcgtaac + 4321 tcggtcatgt caggtgtttt tagatctagt gagaagatta ctggcttaac agagttttta + 4381 tcaggtacaa cagacttgtc acaaggtcta tgtgatacca atgttgaaaa tctctttgtc + 4441 attcaggcgg gttccatttc accaaacccc acagctcttt tacaaagtga gaatttcaga + 4501 acgatgatag ataccctgcg taaatatttt gactatatca ttgtggatac tgctcccata + 4561 ggtatcgtga ttgatgcagt tattgtgaca cagaaatgtg atgcttctgt tttgattacg + 4621 gcagttggtg 
aagtacatcg ccgtgatgtt caaaaggcga aagaacactt ggaacaaaca + 4681 ggcaagccgt ttttaggagt tgtgctaagt aaactgaata cttcaataga gaaatattct + 4741 tcttatgggg gatatgggaa ctatggaaat aaatagtctt acagtaccaa gattatttga + 4801 gatgattact atgggagggg gagtttaagg tgatacagaa tggcattatc tatattggct + 4861 ttaaaagagt tatggatgtt tttattggtt tatttggaac aatattcatc gtcttgccta + 4921 gttccttaat aatttatatt atctataaaa taaaaggtta caaaggaagt atattcttca + 4981 cacaatatag agtggggttg aaggggaaaa aatttaaaat tattaaattt agatcaatgg + 5041 ttgaaaatgc tgaagaactt ttgaccgcaa ataaagcact ctatgaaaaa tatataaata + 5101 acagttacaa attacctcca aatgaggatc ctcgtcttac taatatcgga gattttataa + 5161 gaaaaacgag tattgatgaa attcctcaat ttataaattt aatgttaggt gatatgagcc + 5221 ttattggacc tagaccaatt ttggagaatg agttagagga gtattctaag gaagaacagc + 5281 aagttttgtt atctgtacgg ccaggtatta cagggatgtg gcaagtttct ggtaggagtg + 5341 aggtatatta tcctgaacgc tgtgaaatgg agctgtatta ccctcggaat caatcctttt + 5401 tgttggatgt caaaatcttc tttttgacaa tcaaaaaagt tctgtctgga gaaggggctc + 5461 attgatgtat gaattaaatc atctagcacg aaatagatag aaagatgaag ttgaatacga + 5521 ataacgtttc ttgggtattc gtattcattt tttaagcgaa ggaagcatta ggaataagtg + 5581 gagttaatct agtattattt gcttgaaaaa atgaatggga attcaatcta aagaattgtc + 5641 cagtgaggca agattttagg aattggagtt aggatgtaga aatgtcaaaa aagtataaaa + 5701 ttatagtagc gactcataaa aaatttcaaa tgccagaaga taaggattta tatattcctg + 5761 ttcaagttgg cagtgaagga aaggaaaatt tgggctacca acgagatgat caaggtaatc + 5821 atatctcaca cctcaatcct tattattgtg aattgacagg attatactgg gcttggaaaa + 5881 atttagactg tgattaccta ggattagttc attaccgacg ttattttaca gacaggaacc + 5941 gaccttatca tgataagatt aacatgaatg aagttatcct atcggcagat caagttaagg + 6001 aattcatgtc tgaagtagat gtcgttgttc ccaaaaagag aaaatattat atagaaactc + 6061 tctattctca ttatgctcac actcataatt ccagtcattt agatgtaacg cgagaaatta + 6121 taaaagaggt ttcgccagaa tatttagcaa catttgacaa ggtgatggac tgtcgtagtg + 6181 gctacatgtt caatatgttt atcatgtcca aagaaaatgt atcatcttat tgtgagtggt + 6241 tattccctat cattgatgag ttgtacagaa 
gattggatat aacagggtac tctacttttg + 6301 atgcaagact atttggacgt attagtgagc gtctctttaa tgtttggtta gactaccaaa + 6361 atctacgtgt taaagaagta ccgtttatgt atatggaaaa agtgaattta tttgagaagg + 6421 gcaaatcctt cttgaaagcc aagtatttcg gaaaaaaata tggacagagt ttttaagtta + 6481 tggttttgtt attacttact tttgcattct ttttagtttt ccctgtgctg tcaataagtt + 6541 taagtgttat agggctagta aatgacaaaa agcgttcaaa aatctattta cttctaatta + 6601 gttttgcaat atcaattgtt gcgctgcgct atattcctca tcctatggat gatggcgctt + 6661 ttcattttcg tgcgactacg gcccttattc gctatgatag tattttcgaa atgtttaaag + 6721 cgttttctaa tggatggaga gtagggaact atgactatgg ttccatacca atttttactt + 6781 cattaatgta tcttgttcga aatactcatc actatagttt actgagtttt atttcagctt + 6841 ttataactta ctttagtttt ggttacgtag ttgttgagct atttaaggac ctgggcaagg + 6901 tttctaaact atcgtatgct acagtattaa ttgctgtact atgtttaaat aattatagat + 6961 atacaactag tggaatgaga ttttgtatgg cagttgcctt gatgatgctt ttactatatt + 7021 tggagtcaaa aaaaggctat actagtttaa aaacaaccat atggtatttg ttgcctgtag + 7081 gtatccattc agcggttatt tattttattg gtttaaggtt cttatttcca ttaatcaaga + 7141 aagtgacgct tgctaaaagt ttatttgtat tattaggttt tcctgttttg ttcaacctag + 7201 ttccatggtt agcaaatctg attggttgga cttacttaca atcatttatt cggaaaattg + 7261 aagtctactc tgacaattca tcctattccc agttttttaa taccacatta acaatgaggc + 7321 tatatgttgg aatagtgctg atggttttat ttgtattgtt atatttggga atagtaaatt + 7381 cattgaaaac aactgatgat tggcgtttta gttttgttac aatgacttat tatgtaactc + 7441 tgttatctat gggttcaata ccatttcgta atatttatga tagaaatctt ttcttgctcc + 7501 ttcctatgat tgtagtttca acctacatat tgtttacata tagacatcaa ttgaaaattc + 7561 ttactaatcg taatattgtt tatggattaa cgatgggtat tctttgtcta tcctgtgcag + 7621 ttggtgcatt ttataataat aatttccctt ttgcttttat tgattttagt aagacagact + 7681 tactcctaaa aaatattttt caattctttt caaatttacc ttttacataa taagactatg + 7741 tgctattatt ttatttcttg gaggattata tgggactatc tacagtaaca ttgtttaaaa + 7801 atttaaagtt cacagatagt aaatttatta aattggaagg agagctcctt cttaaatatc + 7861 aagagtattt attaaaaatc atggaagata ttgtaacagt gtgtgaggaa 
gaagggttat + 7921 actattcact ttctggtggg agtgcgttag gagcatatcg acacaaaggg tttattccat + 7981 gggatgatga tatggatata tttatgctag gaagtgaacg gaaaattttc tttcaaaaat + 8041 tttctcagaa attctctgat aagtattgga tacataattc acaaacacca aactatggca + 8101 tgccgattgg tcgtatcaga caaaaaggaa cagttctacg tggtcgagag gatgttggag + 8161 ttgaagaatg tggatttttt attgatattt tttggcttga aaatgttcct aattcaaaaa + 8221 ttttgagaca acttcatggt tttctatgta tgggaattgg attgttgcta tcatgtagaa + 8281 atttttataa aaatcgtcag ctgatgctgg agattatgaa ggagcataaa gaagtaaggc + 8341 ttgtttttcg aataaaatta gttttgggat ttctaactag ttttatatct ttgagacaat + 8401 ttacaagact tacggaaagc atctactcat tgtgcaagaa taataagtcg agatacctta + 8461 gcgttccttc aggtagaaaa cattattttg gtgagatgtt tataagggaa gatatgcagt + 8521 taactaggaa actaagtttt gaaggacata agtggaatgt tccaaataat attgagcact + 8581 atttaactgt aatgtatggt gactatatgc aaatacctgc agttgaagat agggaatcac + 8641 atatcatttt agaaatctcc ttccctaatg agtaagcaat actttcattt tttatatgta + 8701 aggaattaat ttaatgaaaa aaatagcaat tgttagatat aatctaagta aaattggtgg + 8761 agcggaaaaa gtggctatta atatggctaa tgaattgtca caatactatg atgtaaaact + 8821 attatctatt ctattggatg aagatggttt tataaattat gatattaatc ctaatgtgac + 8881 attaataaat tttcacaagg gtgatcttag aattagaact gctacattaa aattaacggg + 8941 taaattaaga gaatatatta aaagagaaaa aattgaagtg attttttcta ttaccccatt + 9001 aacaaatact atggttagat tagctactct gggattaaat gtgaaaatag ttttctgtga + 9061 tcatcatagt ttagaatttc gtgattttag aagtagagaa gtgcagagat ttgtaggagc + 9121 taaatttttt gacaagattg tcactttaac agaagaagat agaataaaat attcagataa + 9181 atataatata cctataaata aagtgaatgc tatttataat tggattgatg aggaagattc + 9241 tgaaaatact ccatttgata ataagacaaa taaaataata acggtagggc gatttcacag + 9301 tcaaaaggga tatgattatc tcgccgaagt agctataaaa gtattatcac aacatccaga + 9361 ctggcagtgg gatatatatg gttcagggga taagcttatt gaacaggagc taaaaagaaa + 9421 actagaagaa ggttatgttt cttcacaagt taattttaaa gaaaatgtaa agggaactga + 9481 aaatatttat cccaatcata gtatctatgt catgacttct cgctatgagg gtttgccttt + 9541 agtcctatta 
gaagctcaac aatacaacct cccaattgtt agtttcagat gtccgacggg + 9601 acctagtgaa attgttgaag atagaatcaa cggatttctg attgattgct atgatgtgga + 9661 tcagatgagt gagaaattgc ttgaattgat gaaaaatgat gatttgcgac aatctttctc + 9721 agaacatgcc aaagacaata tggataaatt tgataaaaat aaaattctta atcagtggat + 9781 agagttgatt gagacaattt aggagataag atgcaagagt gtttattgac aattgtaatg + 9841 cctagttata atattcagga ctatatttcc aaaggaatcg agtcattcca gcaagtacac + 9901 ccagattaca aacaaaaatt tgagatctta attgtgaatg atggaagtac ggacgacaca + 9961 gccaaagtag cagaagaggt cctaagaaaa gattcattgt tgaatggtcg tattatcaca + 10021 aaggaaaatg gaggccatgg ctcaactatt aatcgtggta tccaggaagc aaaggggaaa + 10081 ttctttaaag ttattgatgg ggatgactgg gttatcccat cagagtttga aaaattttta + 10141 gatgccctta cagttactga agtggatatg attttgacag attttacaga acagcatgtt + 10201 tacaacaata ctactgttcg aaatgatttt gttgaaaaat atgagattgg taaggaatat + 10261 tctggaattc cagagaaacg gattccaatg cactcggtaa cttatagaac atctatccta + 10321 gttgagaatg gaattcgttt aagtgaaaag acattttatg ttgacattca gtacactctt + 10381 tttcctttag agtatgttca tagtttctgt tattggaatt atgatgtata ccaatactat + 10441 atcggacgac ccgagcagag tatgaatatt gagagtatga aacgaaatgt tcgtcaccat + 10501 ttgactgtaa caaattctgt gctgacttat ttctcaaaaa ttgcggatga tcctgtctta + 10561 aagaaagtgg ttgcagatac tttagtttat cttatcagtt tgcaggtaga tttgtcatgg + 10621 atggttgagg actcaaagac actatcagaa gaattataca gacaaattga gcagagttct + 10681 tatgagtata tccctacgaa aaaatttgat agattgtctt atttgaacta taaatctcac + 10741 tattttctag gctttatctt caattcaata ttgaaaaaat attctaaaaa gaaagaaaaa + 10801 gagagaggag tttaggatgt ttattagtgt tgttgttccg gtttataatg tttctgatta + 10861 cttacacttt gccatggata gtctgataaa acaaacgtat caaaattttg aaataatcct + 10921 tgtaaatgat ggttcaacag ataactcccc tcagttatgt gaagagtatg ctaagcgata + 10981 tgaaaatgtc tctgtttttc ataaagaaaa tggaggattg tctgatgccc gtaatttagg + 11041 agtttcgaaa gcatcatcag agtggatttt ctttttagat ccagatgatt atttggaaga + 11101 ttatactcta gaattgatag tgaaaattca gcaggaacat caagcagact tgatttctac + 11161 caaagtgaag 
gcaacgtcta agtataatga ttatagtcct tatcaacttg aggagtcaga + 11221 ttataaggct ttgtgtgttg ttacaaaaga gaaggctctt gagctaatgc tagacgataa + 11281 gattgcgaca gtttctgctt gtgctaagtt gtatcacaaa agtatcttgg aaaaaattcc + 11341 atatcctgtt ggaaaaatct atgaagactt ttatgtggta gcggatcacc ttgccttagc + 11401 gcataaaatt gtgattagtc cacttgaaac atataactat taccgtagag aaggtagtat + 11461 tgttcgttcg acttttactg agaaaagata tgattttttt gatgctgttt cgaaaaacga + 11521 acaagttata aataaagaat acacacaaag tttagaatta caacaatctc tgcaagcgaa + 11581 aaaattacga ggaggttttg ttgtaattgg tgcgaaagct gactctggtt taacagattt + 11641 ttcgaaagat agagacctat taaaagttga ttttaaaaac atgttattaa ataaaaaaat + 11701 atcatggaaa ttaaaattaa aatatacaat atttatgcta tcatctaaaa tgtatttaag + 11761 attaagatag tgtagtaaat tgatttattt gaataagaat atcgactatt tttaagaaat + 11821 gaggaattat gaaacaagct tatattataa ttgcacataa taagtttgaa cagttgaaat + 11881 ttttaatttc tctgttggat tataaggaac atgatatttt tattattata gatagcaaag + 11941 ttaatgtggg ggagtctaca attacttcac ttaaatctag tgcgatacat tcaaatgtta + 12001 ttctcgtaga tagtgttcct atttattggg gaagcaattc tcagatttct gcagagatgt + 12061 taggattccg ttatgcatat aattatgata attatagtat gttccatttg ttgtcaggtg + 12121 tagatttatc attagtgcag gccgataaat tatttaaatt ctttgatcag aacaaatcaa + 12181 ggaattttct gagtactgtc tctgatgaga ttttaaaatc caataaagta tatgagcgtg + 12241 tacaatttag atatttgttc cctagattct tagctagaaa tattcagaac aaatatgttc + 12301 gtaaatttgt agcatattac cgtaagctag agattaaaat tcaaagttcg atgaaaatag + 12361 attgttttaa aaaatataac atgagattga gttatgcatc taacggggga tctattaatc + 12421 aggatttagt tagaataata ctagaagaag agaaaaatat tgaaaaaata tttaaacatt + 12481 cgatagtgaa tgatgaacta tttattccta cgataatgta taaatacaat ttgatggaat + 12541 cgttatattc atcttcaccg attacagatg atccagatga ttttcaagga aatctaagat + 12601 atatcaattg gtgggatgga aatcctcata tatggactga ttctgagcat gatatagaac + 12661 aattgaaacg tggtaaatct ttaggtcata agttttctag aaaatttgat ttagaaagat + 12721 atccgagtct taaagaagaa attctaatta tcataaatag gacagattga tatgaaagta + 12781 ctaaaaaatt 
acgcctataa cctctcctat caactattac tcattatact acctatcatt + 12841 acaactccct atgtgacacg ggtcttttct ttgaatgatc tagggactta tggttatttt + 12901 aactccatcg ttacttattt tattctttta gcaactttag gagttgctaa ctatgggacc + 12961 aaggtcattt cagggcatcg caaggaaatt gaaaaaaatt tttgggggat ttactccctg + 13021 caattgggtg cgacagttct ttctatgttc ttgtaccttg ttctttgtct aactcttcct + 13081 tttatgcaaa atccagtcgc ctatattcta ggcttgagtt tggtttctaa aggcttagat + 13141 atttcctggc tctttcaagg attagaggat tttcgtaaga ttacagcaag aaatatcatt + 13201 gtgaaactcg taggtgtaag ttcgattttt ttatttataa aatcagctag tgacctttac + 13261 ctttatgtat ttcttttgac aatatttgag ttgttgggac agttaagcat gtggttaccc + 13321 gctcgggaat ttattgggaa accacatttt gatttaagct atgcaaagca gcatctgaag + 13381 ccaattgttt tattattcct tcctcaggta gcgatctcct tatatgttac tctaaatcgt + 13441 acgatgcttg gtgctttatc ttctacaaaa gatgtaggaa tttatgatca ggctcttaaa + 13501 ttggtaaata ttttattaac attggtaaca tcgcttggga gtgttatgtt acctcgagtt + 13561 gctaatttat tagcaacagg tgattacaaa gctgttaata agatgcatga aatgtccttc + 13621 ctcatttata atttagtgat ttttccaatt atggctggaa ttttgattgt gaatgatgat + 13681 tttgttcagt ttttccttgg tcaagatttt caggatgcac gttatgcaat cgccattatg + 13741 atcttccgta tgttcttcat cggttggacc aatataatgg gaattcagat tttaattccc + 13801 cataataaaa ataaagaatt catgatttca acaacagttt ctgcaattat cagtgtagga + 13861 ttaaacatgc ttttcctacc aaagcttggc tatattggag cagccattgt ttctgtatta + 13921 acagaagcac ttgtatgggc aattcaattg ttctatactc gcagatatct caaagaagtt + 13981 cctatcatag tatctatgac aaaaattgtt ctagcatcag ttatcatgta tggcattttg + 14041 ctaggttcaa aaatatttat acatttttcc ccgactataa atgttctagc atttgcagta + 14101 cttggtggaa tcatttacct ttttgcaatt ttatctatga aagtaataga tgtgaaagaa + 14161 ttaaaacaaa tcataaaaaa ataatggagt gtaatatgta cgactattta atcgttggag + 14221 ctggtttgtc tggagcaatc ttcgcgcacg aagccacaaa acgtggtaaa aaagtaaaag + 14281 tgattgataa acgtgatcac ataggtggga acatctactg tgagaacgta gaagggatca + 14341 atgttcataa atatggtgcc catatcttcc atacttctaa taaaaaagtt tgggactatg + 14401 tcaatcaatt 
cgctgagttt aacaactata tcaactcacc tgtcgcaaac tataaaggaa + 14461 gtctctataa tcttcctttc aatatgaata ctttctatgc tatgtggggg acaaaaactc + 14521 cacaggaagt gaaagataag attgctgagc agacagctga tatgaaggat gttgcaccga + 14581 aaaatctgga agaacaagcc atcaagttga ttggtccaga tatctatgaa aagttgatca + 14641 agggatatac tgaaaagcaa tggggacgct tcgcgacaga acttcctcca tttatcatta + 14701 aacgccttcc agttcgtcta acctttgata ataactattt taacgaccgt taccaaggaa + 14761 ttcctattgg tggttacaat gtcattatcg aaaacatgct taaagacgtt gaagttgagc + 14821 ttggtgttga tttctttgct caccgtgaag agttagaagc atcagctgaa aaagttgtct + 14881 tcacaggaat gatcgaccag tattttgact acaagcacgg cgagttggaa taccgtagtc + 14941 ttcgttttga gcatgaaact ttgaacgagg agaattatca aggaaatgct gtagtgaact + 15001 atacagagcg tgaaatccct tatactcgca ttattgagca taaacatttt gagtacggta + 15061 cacaagataa aacggttatt actcgtgaat atccagctga ttggaagcgt ggggacgagc + 15121 cctactatcc gatcaacgat gagaaaaata atgctatgtt tgctaagtac caagaggaag + 15181 cagcgcagaa tgataaagtt atcttttgtg ggcgtttagc agattataaa tattacgata + 15241 tgcatgtggt gattgaacgg gcgcttgagg ttgtggagaa agagttaggt aactaaagat + 15301 ggctctttgt caactgtagt gggttgaaaa aaagctaagc tcgagaaagg acaaatttcg + 15361 tcctttcttt tttgatgttc aaagcgataa aaatccgttt tttgaagttt tcaaagtttc + 15421 gaaaaccaaa ggcattgcgc ttgataagtt tgatgagatt attggtcgct tccagtttgg + 15481 cattagaata gtgtagttga agggcgttga caatcttttc tttatctttg aggaaggttt + 15541 taaagacagt ctgaaaaata ggatgaacct gcttaagatt gtcctcaata agtccgaaaa + 15601 atttctctgg ttccttattc tgaaagtgaa acagcaagag ttgatagagc tgatagtgat + 15661 gtttcaagtc ttgtgaatag ctcaaaagct tgtctaaaat ctctttattg gttaaatgca + 15721 tacgaaaagt agggcgataa aaatgtttat cgctgagttt acgactatcc tgttgtatga + 15781 gcttccagta gcgcttgata gccttgtatt catgggattt tcgatgaaac tgattcatga + 15841 tttgaacacg cacacgactc atagcacggc taagatgttg tacaatatga aagcgatcaa + 15901 gaacgatttt agcattcggg agtgaaacag tctgggagac tgtttcagcc tgagcctaga + 15961 aatttgaaag cgaagctgtt tagctaagtc atagtaagga ctaaacatat ccatagtaat + 16021 aattttgacg 
cgacatcgga cagctctatc gtagcgaaga aagtgatttc gaatgatagc + 16081 ttgtgttcta ccctcaagaa cagtgatgat attgagattg ttaaaatctt gcgcaatgaa + 16141 gctcatcttt ccctttgtaa aagcatactc atcccaagac ataatctcag gaagacaaga + 16201 aaaatcatgt ttaaagtgaa aatcattgag cttacgaata acagttgaag ttgagatgga + 16261 aagctgatgg gcaatatcag tcatagaaat cttttcaatt aacttttgag caatcttttg + 16321 gttgatgata cgagggattt ggtgattttt ctttaccagg ggagtctcag caaccatcat + 16381 ttttgaacag tgatagcact tgaaacgacg ctttctaagg agaattctag taggcatacc + 16441 agttgtctca aggtaaggaa tcttagacgg tttttgaaag tcatatttct tcaattggtt + 16501 tccgcactca gggcaagatg gggcgtcgta gtccagtttg gcgatgattt ctttgtgtga + 16561 atccctattg acgacatcta taatttggat atttgtgtct ttgatatcga gtagttttgt + 16621 gataaaatgt aattgttcca tatgaatctt tctaatgagt tgtttaatcg cttttcatta + 16681 tagatcttat gggacttttt ttctacacaa aaataggctc cataatatcc ataggggatt + 16741 tacccactac aaatattata gagccttatt tagaaatagt attaaaaatt ccttgactat + 16801 gtgatatagt tgagggattt ttaaatgata ttcatatttt ttgcaaagat gttgtttgaa + 16861 aaataatttt caaaaattct gaaaattctg ttgacaactt tctgaaaaga gtctataatg + 16921 gagagaaagt tttaaaggag aaaatgatga aaagttcaag actacttgcc cttgcgggcg + 16981 tgacattatt g +// + diff --git a/public/res/serotype_genbank/serotype_10C.gb b/public/res/serotype_genbank/serotype_10C.gb new file mode 100644 index 0000000..a0eed66 --- /dev/null +++ b/public/res/serotype_genbank/serotype_10C.gb @@ -0,0 +1,796 @@ +LOCUS CR931651 18126 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain Gro Norge (serotype 10c). +ACCESSION CR931651 +VERSION CR931651.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. 
+REFERENCE 1 (bases 1 to 18126) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 18126) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..18126 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="Gro Norge" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC10C_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC10C_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI33075.1" + /db_xref="UniProtKB/TrEMBL:Q4JZI8" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVELL" + gene 293..466 + /gene="aliB" + /locus_tag="SPC10C_0002" + /pseudo + CDS 293..466 + /gene="aliB" + /locus_tag="SPC10C_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(459..923) + /gene="tnp" + /locus_tag="SPC10C_0003" + /pseudo + CDS complement(459..923) + /gene="tnp" + /locus_tag="SPC10C_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + gene 1145..2590 + /gene="wzg" + /locus_tag="SPC10C_0004" + CDS 
1145..2590 + /gene="wzg" + /locus_tag="SPC10C_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33078.1" + /db_xref="GOA:Q4K2B1" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K2B1" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSIGVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGIDINYYVRLNFTSFLKLIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESRGNYKVNSQDLKGTGRMDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1145..1261 + /gene="wzg" + /locus_tag="SPC10C_0004" + /note="Signal peptide predicted for SPC0400 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 39 and 40" + misc_feature 1349..1696 + /gene="wzg" + /locus_tag="SPC10C_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 2.5e-63" + misc_feature 1874..2317 + /gene="wzg" + /locus_tag="SPC10C_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 6.6e-70" + gene 2592..3323 + /gene="wzh" + /locus_tag="SPC10C_0005" + CDS 2592..3323 + /gene="wzh" + /locus_tag="SPC10C_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33079.1" + /db_xref="GOA:Q4K2B0" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K2B0" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTSDVLDKLENNRIPTLNNS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + 
QVNSSHVLKSKLFGERYKFMKKRAQYFLERDLVHVIASDMHNVDDRPPHMAEAYDLVS + QKYGEAKAQELFIENPRKIVMDQLI" + misc_feature 2595..3203 + /gene="wzh" + /locus_tag="SPC10C_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 2.4e-37" + gene 3329..4024 + /gene="wzd" + /locus_tag="SPC10C_0006" + CDS 3329..4024 + /gene="wzd" + /locus_tag="SPC10C_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33080.1" + /db_xref="GOA:Q4K2A9" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K2A9" + /translation="MMKEQNTIEIDVFQLLKTLWKHKLIILLVALVTGAGAFAYSTFI + VKPEYTSTTRIYVVNRNQGDKPGLTNQDLQAGTYLVKDYREIILSQDVLEKVAINLKL + DMPAKALTSKVQVIVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIIAVTRVSDV + TTLEEARPATTPSSPNVRLNTLVAFLGGTVVTVITVLLIELLDTRVKRPEEIEDVLQM + PLLGVVPDLDKMK" + misc_feature 3350..3766 + /gene="wzd" + /locus_tag="SPC10C_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 6.7e-55" + gene 4034..4717 + /gene="wze" + /locus_tag="SPC10C_0007" + CDS 4034..4717 + /gene="wze" + /locus_tag="SPC10C_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33081.1" + /db_xref="GOA:Q4K2A8" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K2A8" + /translation="MPTLEISQVKLELAKKAEEYYNALCTNLQLSGDDLKVFSITSVK + PGEGKTTTSTNIAWAFARAGYKTLLIDADMRNSVMSGVFKPRERITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPIALLQSRNFSTMLETLRKYFDYIVVDTAPVGVVI + DAAIIMQKCDASILVTKAGETKRRDIQKAKEQLEQTGKPCLGVVLNKFDTSVDKYGSY + GSYGNDRKK" + gene 4772..5407 + /gene="wcjG" + /locus_tag="SPC10C_0008" + CDS 4772..5407 + /gene="wcjG" + /locus_tag="SPC10C_0008" + /note="member of homology group 50" + /codon_start=1 + /transl_table=11 + /product="putative initial sugar transferase" + /protein_id="CAI33082.1" + /db_xref="GOA:Q4K2B6" + 
/db_xref="InterPro:IPR003362" + /db_xref="UniProtKB/TrEMBL:Q4K2B6" + /translation="MKRNSIIYISLKRVMDVLIGLFGTIFTVLPCSLIIYIIYKTKGY + KGSIFFTQYRVGLGGKKFKIIKFRSMVENAEEVLTANKALYEKYINNSYKLPPNEDPR + LTNIGDFIRKTSIDEIPQFINLLFGDMSLIGPRPILENELKEYSKEEQPVLLSVRPGI + TGVWQVSGRSEVYYPERCEMELYYPRNQSFLLDVKIFFLTIKKVLSGEGAH" + misc_feature 4805..5404 + /gene="wcjG" + /locus_tag="SPC10C_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 7.1e-55" + gene 5624..6418 + /gene="wciB" + /locus_tag="SPC10C_0009" + CDS 5624..6418 + /gene="wciB" + /locus_tag="SPC10C_0009" + /note="member of homology group 16" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33083.1" + /db_xref="GOA:Q4K2B5" + /db_xref="UniProtKB/TrEMBL:Q4K2B5" + /translation="MPKKYKIIVATHKRFQMPEDKGLYIPVQVGSEGKENLGYQRDDQ + GNHISHLNPYYCELTGLYWAWKNLECDYLGLVHYRRYFTDRNRPYHDKINMNEVILSA + DQVKKLMSEVDVVVPKKRKYYIETLYSHYAHTHDSSHLDVTREIIKEVSPEYLATFDK + VMDCRSGYMFNMFIMDKENVSSYCEWLFPIIDELYRRLDITGYSAFDARLFGRVSERL + FNVWLDCQNLRVKEVPFMYMEKVNLFEKGKSFLKAKYFGKKYGQSF" + gene 6422..7672 + /gene="wzy" + /locus_tag="SPC10C_0010" + CDS 6422..7672 + /gene="wzy" + /locus_tag="SPC10C_0010" + /note="member of homology group 67" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33084.1" + /db_xref="UniProtKB/TrEMBL:Q4K2B4" + /translation="MVLLLLAFAFFLVFPVLSISLSVIGLVNDKKRSKIYLLLISFAI + SIIALRYIPHPTDDGAFHFRATTALIRYDSIFEMFKAFSNGWIVGIYDYGSIPIFTSL + MYFVRNTHHYSLLSFISAFITYFSFGYVVVDLFKDLGKFSKLSYATVFIAVLCLNNYR + YTTSGMRFCMAVALMMLLLYLESKKGYTRLKTTIWYLLPLGIHSAVIYFIGLRFLFPL + IRKVTLAKSLFVLLGFPVLFNLVPWLANLIGWTYLQFFIRKIEVYSDNSSYSQFFNTT + LTMRLYVGIVLMVLFVLLYLGIVNSLKISDDWRFSFVTMTYYVTLLSMSSIPFRNIYD + RNLFLLLPMIVVSTYILFTYRRQLKILTNRNIVYGLTIGILCLSCAVGVFYNNNFPFG + FIDFSKTDLLLKNIFQFFSNLPFT" + misc_feature 6422..6502 + /gene="wzy" + /locus_tag="SPC10C_0010" + /note="Signal peptide predicted for SPC0406 by SignalP 2.0 + HMM (Signal peptide probability 
0.934) with cleavage site + probability 0.262 between residues 27 and 28" + gene 7682..8617 + /gene="wcrB" + /locus_tag="SPC10C_0011" + CDS 7682..8617 + /gene="wcrB" + /locus_tag="SPC10C_0011" + /note="member of homology group 87" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="CAI33085.1" + /db_xref="GOA:Q4K2B3" + /db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4K2B3" + /translation="MLLFYFLEDYMGLSTVTLFKNLKFIDSKFIKLEGELLLKYQEYL + LKIMEDIVTVCEEEGLYYSLSGGSALGAYRHKGFIPWDDDMDIFMLGSEREIFFQKFY + QKFSDKYWIHNSQTPNYGMPIGRVRQKGTVLRGREDVGVEECGFFIDIFWLENVPNSK + FLRQLHGFLCMAIGLLLSCRNFYKNRQLMLEIMKEHKEIRLVFRIKLILGFLTSFISL + RQFTRLTERIYSLCKNNESRYLSVPSGRKHYFGEMFIREDMQLTRKLNFEGHKWNVPN + NVEHYLTVMYGDYMKIPAVEDRESHIILEISFPSE" + misc_feature 7844..8542 + /gene="wcrB" + /locus_tag="SPC10C_0011" + /note="HMMPfam hit to PF04991, LICD Protein Family, score + 5.1e-25" + gene 8655..9740 + /gene="wcrC" + /locus_tag="SPC10C_0012" + CDS 8655..9740 + /gene="wcrC" + /locus_tag="SPC10C_0012" + /note="member of homology group 24" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33086.1" + /db_xref="GOA:Q4K2C9" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K2C9" + /translation="MKKIALVKWILDDSGGGERVAVSLANELTKKYEVHLIGITTKQS + DLFFGINSQVKYSNFFDHRVRLSKNILKISKMLKKYFLDNEIEVAFGIGIFANVFLSL + SGIGISTKVVLCDHTNSITANRELSQKVQRYVGTKLADKIITLTQEDRKNYIRKYGIS + ENRIAYIYNWKENRLSNIPYNDESTKIVTVGRFDYQKGYDYLIQVAKKVLAKMPDWTW + EIYGSGKQDKVDKIRDLITENDLQDKLVIKGLEKNQDLIYGDKGIYVMTSRYEGLPLV + LLEAQQYNLPIVSFRCPTGPSEIVEDGVNGYLIDCYDTDKMSEKLLELMKNDDLRQSF + SEHAKDTMDKFDKNKILNQWIELIETI" + misc_feature 9165..9677 + /gene="wcrC" + /locus_tag="SPC10C_0012" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 4.8e-40" + gene 9749..10553 + /gene="wcrD" + /locus_tag="SPC10C_0013" + CDS join(9749..10057,10056..10553) + /gene="wcrD" + /locus_tag="SPC10C_0013" + /note="member of homology group 
32" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33087.1" + /db_xref="GOA:Q4K2C8" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K2C8" + /translation="MQECLLTIVMPSYNIQDYISKGIESFQQVHPDYKNKFEVLVVND + RSTDDTALVAEKILAKDSLLDGRVITKENGGHGSTINRGIQEAKGKFFKVIDGDDWVI + PPSEIEKFLDALETVDVDMVITDFTEQHVNNDTTVRSDFIDKYEICRIYKGIPDVRIP + MHSVTYKTSILSANKIRLSEKTFYVDIQYTLFPLEYVHSFSYWNYDIYQYYIGRPEQS + MNIESMKRNVSHHLKVTNSVLDYFSKIENEPVLNRVVSETLVYLISLQVV" + misc_feature order(9767..10056,10057..10295) + /gene="wcrD" + /locus_tag="SPC10C_0013" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 1.6e-28" + gene 10640..11602 + /gene="wciF" + /locus_tag="SPC10C_0014" + CDS 10640..11602 + /gene="wciF" + /locus_tag="SPC10C_0014" + /note="member of homology group 25" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33088.1" + /db_xref="GOA:Q4K2C7" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K2C7" + /translation="MFKMFVSIVVPVYNVADYLHYAIESLIKQTYQNFEVILVNDGST + DDSPLLCEDYAKQYENIHVFHKENGGLSDARNFGVSKASSDWIFFLDPDDYLEEYTLE + LIVKIQETHQADLISTKVKATSKYNAYTSYRLQDSDYKDLASITKEKAMELMLDDKVA + TVSACAKLYRKCILERVPFPVGKIYEDFYVVAEHLALAERIVISPLETYNYYRREGSI + VRSTFTEKRYDFFEAVAKNEEVVKREYIQIPELKQALQAKKLLGGFVVIGAKADSGLK + DFSKDKELLRVEMSELLKNSKLSWKLKLKYLIFMFSPKLYLLLR" + misc_feature 10658..11173 + /gene="wciF" + /locus_tag="SPC10C_0014" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 6.8e-45" + gene 11756..13171 + /gene="wzx" + /locus_tag="SPC10C_0015" + CDS 11756..13171 + /gene="wzx" + /locus_tag="SPC10C_0015" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33089.1" + /db_xref="GOA:Q4K2C6" + /db_xref="InterPro:IPR002528" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K2C6" + /translation="MKVLKNYAYNLSYQLLVIILPIITTPYVTRVFSSDDLGTYGYFN + 
SIVTYFILLATLGVANYGTKVISGHRKEIEKNFWGIYSLQLGATVLSLSLYALLCLTL + PFMQNPVAYILGLSLVSKGLDISWLFQGLEDFRKITVRNITVKLVGVISIFIFVKSAN + DLYLYVFLLTIFELLGQLSMWLPAREFIGSSHFSIEYARHHLKPVILLFLPQVAISLY + ITLDRTMLGALASTKDVGIYDQALKLVNILLILVTSLGSVMLPRVANLLATGDHKAVN + KMHEMSFLIYNLVIFPMMAGILIVNDDFVSFFLGQDFQDARYAIAIMIFRMFFIGWTN + IMGIQILIPHNKNKEFMISTTAPAIISVGLNLLFLPKLGYIGAAIVSVLTEALVWAIQ + LYFTRRYLKEVPIIGSLTKIILASAIMYGILLGLKTVIHFSPIINVIVFAVLGGIIYL + FAILSLKVVDVKELKQIIRKK" + misc_feature 11762..12556 + /gene="wzx" + /locus_tag="SPC10C_0015" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 2.5e-68" + gene 13173..14171 + /gene="wciG" + /locus_tag="SPC10C_0016" + CDS 13173..14171 + /gene="wciG" + /locus_tag="SPC10C_0016" + /note="member of homology group 21" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI33090.1" + /db_xref="GOA:Q4K2C5" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q4K2C5" + /translation="MQKNRDISLDLLKVLACIGVILLHTTMGGFKETGSWNLLAYLYY + LGTYSIPLFFMVNGYLLLGKREITYPYILQKVKWILITVSLWNIIVWLFKRDFAVNPI + KKIVGSLLQKGYFFQFWFFGALILIYLCLPVLKTVINSKRKYVYILSLLVAIGFIVEL + ANIFLQMPIQTHVMQTFRLWTWFFYYLLGGYIAQFNVDNLKYRFKNWMKIVSILLLLI + SPIILFFIAKTTYHNLFAEYFYDTLFVKVSTLGIFLTIFTLTLNENRNKWIVFLSNQT + MGVFIIHTYIMKLWERIFGFNFVGAYLLFALFTLSVSFIIVGMLMKIPYFNRIVKL" + gene 14185..15288 + /gene="glf" + /locus_tag="SPC10C_0017" + CDS 14185..15288 + /gene="glf" + /locus_tag="SPC10C_0017" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI33091.1" + /db_xref="GOA:Q4K2C4" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR006076" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K2C4" + /translation="MYDYLIVGAGLSGAIFAHEATKRGKKVKVIDKRDHIGGNIYCEN + VEGINVHKYGAHIFHTSNKKLWDYVNQFAEFNNYINSPIANYQGHLYNLPFNMNTFYA + LWGTKTPQEVKDKIAEQTTHMQDVEPKNLEEQAIKLIGTDVYEKLIKGYTEKQWGRSA + 
TELPPFIIKRLPVRLTYDNNYFNDRYQGIPIGGYNVIIENMLGDVEVELGVDFFANRE + ELEASAEKVVFTGMIDQFFDYQFGELEYRSLRFEHEILDQENYQGNAVVNYTERDIPY + TRIIEHKHFEFGTQDKTVITREYPADWKRGDEPYYPINDAKNNAIYEQYLAEAKKNGR + VIFCGRLADYKYYDMHVTVERALDVVEEELGSI" + misc_feature 14620..15222 + /gene="glf" + /locus_tag="SPC10C_0017" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 5.1e-134" + gene 15316..16368 + /gene="wcrH" + /locus_tag="SPC10C_0018" + CDS 15316..16368 + /gene="wcrH" + /locus_tag="SPC10C_0018" + /note="member of homology group 51" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33092.1" + /db_xref="GOA:Q4K2C3" + /db_xref="InterPro:IPR016503" + /db_xref="UniProtKB/TrEMBL:Q4K2C3" + /translation="MKYYLKDSFLNNEYEKNAGNKARNDVEAILISEGYKGLELKVEN + WYKMNFFKAQQHKYRATKSVFDQLGSGDELLIQFPIIHHTFFISQLIKQAQKRGVKFY + LLIHDVETVRHVGNSAVKLRHKVRDYFQEKAALTSVDGIIVHNDIMKNALTIQGIPSD + KMVSLEIFDYLIPNFEEKNAPQKEGAIIVAGNLIPTKSGYLYNLPEQPAYNLYGAGYD + ESRALKNTTYFGSFMPDDLPVALQGSFGLVWDGDSSETCQGSFGNYLRINNSHKASLY + LASGFPLVVWKESALAHFVLDKQCGIAVASLYDLQKALDDLTDQDYMELSANARQVGV + AIRSGDYLKSAISKLK" + gene complement(16392..16520) + /gene="tnp" + /locus_tag="SPC10C_0019" + /pseudo + CDS complement(16392..16520) + /gene="tnp" + /locus_tag="SPC10C_0019" + /note="Lone member of homology group 0224" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1239 transposase (fragment)" + /db_xref="PSEUDO:CAI33093.1" + gene complement(order(16542..17126,17180..17848)) + /gene="tnp" + /locus_tag="SPC10C_0020" + /pseudo + CDS complement(join(16542..17126,17180..17848)) + /gene="tnp" + /locus_tag="SPC10C_0020" + /note="member of homology group 13" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1167 transposase" + /db_xref="PSEUDO:CAI33094.1" + misc_feature complement(order(17046..17126,17180..17392)) + /gene="tnp" + /locus_tag="SPC10C_0020" + /note="HMMPfam hit to PF01610, Transposase, score 7.2e-43" + /pseudo + gene 18079..>18126 + /gene="aliA" 
+ /locus_tag="SPC10C_0021" + CDS 18079..>18126 + /gene="aliA" + /locus_tag="SPC10C_0021" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33095.1" + /db_xref="UniProtKB/TrEMBL:Q4K2C2" + /translation="MMKSSRLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcgta taaaaacaag + 181 ggaggactgt ataaaaggca gaaatccttt gttttttata accaaggttt ataaaccttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga agacgaacat + 301 aaagaagcgt atccttagtg caggcctgac ttttacatct gctttgcttt tagctgcttg + 361 cgaccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaactat ctattagact attacgctga taatatagtc aattgaaaca agaacaagac + 481 aaaagagccc atgttttctc aataggattg tactcaggtg aatagggagg aagaggtaaa + 541 agtttatgcc caaactcttc acacaagagt tctagcttcc ccattctatg gaatcttgca + 601 ttatccataa taataaccga tggtgtggtt aatgttggta agagaaattt ctgaaaccaa + 661 gcttcaaaaa agtcgctcgt catcgtctct tcgtaagtca ttggagcgat taactcacca + 721 tttgttagac ctgcaaccaa agaaatcctc tgatatcttc ttccagatac tttgcctctt + 781 cttaactgac cttttaaaga gcgaccatgt tctcgataaa aataagtatc gaatcctgtt + 841 tcgtcaatct aaacaggtgc taggtgcttt aatctattaa aattcttaag aaataaggct + 901 actttttctg ggtcttgttc ataattagat tgaaactaga atagtagacc tctgcttcta + 961 aaacattgtt agaaatcgat ttgactgtcc tgatcgattt gtcatgttct tatttcattt + 1021 tactatattt ttgtttcgcg ggaagtctac taagatactt aaagatgcag atagtaaaaa + 1081 aaatgtagac attaccgtaa aaaagtgata taatcgtatg atgttcaagg tataggtgtt + 1141 aatcatgagt agacgtttta aaaaatcacg ttcacagaaa gtgaagcgaa gtgttaatat + 1201 cgttttgctg actatttatt tattgttagt ttgtttttta ttgttcttaa tctttaagta + 1261 caatatcctt gcttttagat atcttaacct agtggtaact gcgttagtcc tactagttgc + 1321 cttggtaggg ctactcttga ttatctataa aaaagctgaa aagtttacta tttttctgtt + 1381 ggtgttctct atccttgtca gctctgtgtc gctctttgca gtacagcagt ttgttggact + 1441 gaccaatcgt ttaaatgcga 
cttctaatta ctcagaatat tcaatcggtg tcgctgtttt + 1501 agcagatagt gatatcgaaa atgttacgca actgacgagt gtgacagcac cgactgggac + 1561 tgataatgaa aatattcaaa aactactagc tgatattaag tcaagtcaga ataccgattt + 1621 gacggtcaac cagagttcgt cttacttggc agcttacaag agtttgattg caggggagac + 1681 taaggccatt gtcctaaata gtgtctttga aaacatcatc gagtcagagt atccagacta + 1741 cgcatcgaag ataaaaaaga tttataccaa gggattcact aaaaaagtag aagctcctaa + 1801 gacgtctaag aatcagtctt tcaatatcta tgttagtgga attgacacct atggtcctat + 1861 tagttcggtg tcgcgatcag atgtcaatat cctgatgact gtcaatcgag ataccaagaa + 1921 aatcctcttg accacaacgc cgcgtgatgc ctatgtacca atcgcagatg gtggaaataa + 1981 tcaaaaggat aaattgactc atgctggtat atatggggtt gattcatcca ttcatacctt + 2041 agaaaacctt tatggtatag atattaatta ttatgttcgt ttgaatttta cctcattttt + 2101 gaaattgatt gacttattgg gaggggtaga tgttcataat gatcaagagt tttcagctct + 2161 acatgggaag ttccatttcc cagtagggaa tgtccatcta gactctgagc aggctctagg + 2221 ttttgtacgt gaacgctact cactagccga tggagaccgt gaccgtggtc gcaaccaaca + 2281 aaaggtgatt gtggctatcc ttcaaaaatt aacgtcaacc gaagcactga aaaattatag + 2341 tacgatcatt aatagcttgc aagattctat ccaaacaaat atgccacttg agactatgat + 2401 aaatttggtc aatgctcagt tagaaagtag agggaattat aaagtaaatt ctcaagattt + 2461 aaaaggtaca ggtcggatgg atcttccttc ttatgcaatg ccagacagta acctctatgt + 2521 gatggaaata gatgatagta gtttagctgt agttaaagca gctatacagg atgtgatgga + 2581 gggtagatga aatgatagac atccattcgc atatcgtttt tgatgtagat gacggtccca + 2641 agtcaagaga ggaaagcaag gctctcttgg cagaatccta caggcagggg gtgcgaacca + 2701 ttgtctctac ctctcaccgt cgcaagggca tgtttgaaac tccagaagag aagatagcag + 2761 aaaactttct tcaggttcgg gaaatagcta aggaagtcgc gagtgacttg gtcattgctt + 2821 atggggctga aatttactac acatcagatg ttttggataa gctggaaaac aatcggattc + 2881 cgacactcaa taatagtcgt tatgccttaa tagagtttag tatgaacacc ccttatcgcg + 2941 atattcatag tgccttgagt aaaatattga tgttgggaat tactcccgtc attgcccaca + 3001 tcgagcgcta tgatgctctt gaaaataatg aaaaacgcgt tcgagagctg atcgatatgg + 3061 gctgttacac gcaagtaaat agttcacatg tcctcaaatc 
caaacttttt ggagaacggt + 3121 ataaattcat gaaaaaaaga gcgcagtatt tcttggagcg tgatttggtt catgtgattg + 3181 caagtgatat gcataatgtg gacgacagac ctccccatat ggcagaagcg tatgaccttg + 3241 tttcccaaaa atatggagaa gcgaaggctc aggaactttt tatagaaaat cctcgaaaaa + 3301 ttgtaatgga tcaactaatt taggagaaat gatgaaagaa caaaacacga tagaaatcga + 3361 cgtatttcaa ttacttaaaa ccttgtggaa acacaagcta atcattttat tagtggcact + 3421 tgtgacaggg gcgggagctt ttgcatatag cacttttatt gttaagccag aatatacgag + 3481 caccacgcgt atttacgtag tcaaccgtaa tcaaggagat aagccgggac tgacgaatca + 3541 ggacttgcag gcagggactt atctggtaaa agactaccgc gaaattatcc tttcgcagga + 3601 tgtattggaa aaggtagcga taaatttgaa attggatatg ccagcaaaag cgttaactag + 3661 caaagtgcaa gtgattgtac cagccgacac tcgtatcgtc tcaatctctg tcaaggataa + 3721 acaaccagag gaagccagtc gcattgctaa ttctctacga gaagttgcag cagaaaagat + 3781 catcgctgtc acgcgagtat ctgatgtaac gacgcttgaa gaagcgcggc cagctacgac + 3841 tccctcttct cccaatgttc gactcaacac cttagttgct tttcttggag gaaccgtcgt + 3901 aacagtaatt actgttcttt tgattgagtt gctcgatacc cgtgtgaaac gtcctgaaga + 3961 aattgaagat gtactgcaaa tgccacttct aggagtcgtt ccagatttgg ataaaatgaa + 4021 ataggaggaa gttatgccaa cgttagaaat ctcacaggtg aaattagaac ttgcgaaaaa + 4081 ggcagaggaa tattataatg ctttgtgcac gaacctacag ttaagtggag atgatttgaa + 4141 agtgttttct attacttctg tgaaaccagg agaaggaaaa acaacgactt ccaccaatat + 4201 cgcttgggct tttgcgcgtg caggttacaa aacgctgctg attgatgcag acatgcgtaa + 4261 ctccgtgatg tcaggtgtct ttaaaccaag ggaaaggatt actggactaa cagaatttct + 4321 atcagggact acagacctgt cacaggggct ttgcgatacc aatattgaga atctctttgt + 4381 gattcaggct ggctctgtgt caccaaatcc gatagccctt cttcaaagta ggaatttcag + 4441 tacaatgctt gaaaccttgc gtaaatattt tgactatatc gtcgtagaca ctgctcctgt + 4501 cggcgtcgtg attgatgcgg ctatcattat gcagaaatgt gatgcttcta ttttagtgac + 4561 gaaggcaggt gaaacaaaac gacgggatat tcaaaaagcg aaagaacagt tggaacaaac + 4621 tgggaagccg tgtttaggag ttgtgttgaa taaattcgat acttcagtag acaaatacgg + 4681 ttcttatggg agttatggga atgacaggaa aaaataaacc agtttatagt agcgaaacta + 4741 
attgagatac ttatcatgag gaggagttaa ggtgaaaaga aatagcatta tctatattag + 4801 cttaaaacga gttatggatg ttcttattgg cttgtttgga acaatattca cagtcttgcc + 4861 ctgttctcta ataatttata ttatttataa aacaaaaggt tataaaggga gtatattttt + 4921 tacacaatac agagtggggt tgggagggaa aaaatttaaa attattaaat ttagatcaat + 4981 ggttgaaaat gctgaagaag ttttgaccgc aaataaagca ctctatgaaa aatatataaa + 5041 taacagttat aaattacctc caaatgagga tcctcgtctt accaacatcg gagattttat + 5101 aagaaaaacg agtattgatg aaattcctca atttataaac ttgttgtttg gagatatgag + 5161 tcttattgga cctagaccga ttttggagaa tgagttaaag gagtactcta aggaagaaca + 5221 gccagtttta ctatctgtac gaccaggtat tacaggggtg tggcaagttt ctggtaggag + 5281 cgaggtatat tatcctgaac gctgtgaaat ggagctgtat taccctcgga accaatcctt + 5341 tttattagat gtcaaaatct tctttttgac aataaaaaaa gttctgtctg gagaaggggc + 5401 tcattgatgt atgggctaaa tcatctagca aaaaaagata gaaagatgaa gttgaatacg + 5461 cataacgttt cttggatatt cgtatttatt ttctcaagtg aaggaagcat tatgaataag + 5521 tggatttaat ctagtgtttt ttgcttgaaa aaatgaatgg gaattcaatc taaagaattg + 5581 tccagtgagg caagatttta ggaattggag ttaggatgta gaaatgccaa aaaagtataa + 5641 aattatagta gcgactcata aaagatttca aatgccagaa gataagggct tatatattcc + 5701 tgttcaggtt ggcagtgaag gaaaggaaaa tttaggctat caacgagatg atcaaggtaa + 5761 tcatatctca cacctcaatc cttattattg tgaattaaca ggattatact gggcttggaa + 5821 aaatttagaa tgtgattacc taggattagt tcattaccga cgttatttta cagataggaa + 5881 ccgaccttat catgataaga ttaacatgaa tgaagttatc ctatcggcag atcaagttaa + 5941 gaagctcatg tctgaagtag atgtcgttgt tcccaaaaag agaaaatatt atatagaaac + 6001 tctctattct cattatgctc atactcatga ttccagtcat ttagatgtaa cacgagaaat + 6061 tataaaagag gtttcgccag aatatttagc aacatttgac aaggtgatgg actgtcgtag + 6121 tggctacatg ttcaatatgt ttatcatgga caaagaaaat gtatcatctt attgtgagtg + 6181 gttgttccct atcattgatg agttgtacag aagattggat ataacaggat actctgcttt + 6241 tgatgcaaga ctatttggac gtgttagtga gcgtctcttt aatgtttggt tagattgcca + 6301 aaatctacgt gttaaagaag ttccatttat gtatatggaa aaagtgaatt tatttgagaa + 6361 gggcaaatcc ttcttgaaag 
ccaagtattt cggaaaaaaa tatggacaga gtttttaaat + 6421 tatggttttg ttattacttg cttttgcatt ctttttagtt ttccctgtgt tgtcaataag + 6481 tttaagtgtt atagggctag taaatgacaa aaagcgttca aaaatctatt tactactaat + 6541 tagttttgca atatcaatta ttgcgctgcg ttatattcct catcctacgg atgatggcgc + 6601 ttttcatttt cgtgcgacta ctgcccttat tcgctatgat agtattttcg aaatgtttaa + 6661 agcattttct aatgggtgga tagtagggat ctatgactat ggctccatac caatttttac + 6721 ctcattaatg tattttgttc gcaacaccca tcactatagt ttactgagtt ttatttcagc + 6781 tttcataact tactttagtt ttggttacgt agttgttgac ttatttaagg atttgggcaa + 6841 gttttctaaa ctatcgtatg ctacagtatt cattgctgta ctatgtttaa ataattatag + 6901 atatacaact agtggaatga gattttgtat ggcagttgcc ttgatgatgc ttttactata + 6961 tttggagtca aaaaaaggct atactaggtt aaaaacaact atttggtatt tgttaccatt + 7021 aggtatccat tcagcggtta tttattttat tggtttaagg ttcttatttc cattaattag + 7081 gaaagtgaca ctcgctaaaa gtttatttgt attattaggt tttcctgttt tgttcaacct + 7141 agttccatgg ttagcaaatc tgattggttg gacttactta caatttttta ttcgaaaaat + 7201 tgaagtctat tctgacaatt catcctattc ccagtttttt aataccacat taacgatgag + 7261 gctatatgtt ggaatagtac tgatggtttt atttgtattg ttatatttgg gaatagtaaa + 7321 ttcattgaaa ataagtgatg attggcgttt tagttttgtt acaatgacct attatgtaac + 7381 tctgttatct atgagttcaa taccatttcg taatatttat gatagaaatc ttttcttgct + 7441 ccttcctatg attgtagttt caacctacat attatttaca tatagacgtc agttgaaaat + 7501 tcttactaat cgtaatattg tttatggact gacgataggt attctttgtc tatcctgtgc + 7561 agttggtgta ttttataata ataatttccc ttttggtttt attgatttta gtaagacaga + 7621 cttactccta aaaaatattt ttcaattctt ttcaaattta ccttttacat aataagacta + 7681 tgtgctatta ttttatttct tggaggatta tatgggacta tctacagtaa cattgtttaa + 7741 aaatttaaag tttatagata gtaaatttat taaattggaa ggagagctcc ttcttaaata + 7801 tcaagagtat ttattaaaaa tcatggaaga tattgtaaca gtgtgtgagg aagaagggtt + 7861 atactattca ctttctggtg ggagtgcatt aggggcttat cgacacaaag ggtttattcc + 7921 atgggatgat gatatggaca tatttatgct aggaagtgag agggaaattt tctttcaaaa + 7981 attctatcag aaattttctg ataaatattg gatacataat 
tcacaaacac caaactatgg + 8041 catgcctatt ggtcgtgtca gacaaaaagg aacagtttta cgtggccgag aggatgtcgg + 8101 agttgaagaa tgtggatttt ttattgatat tttttggctt gaaaatgttc ctaattcaaa + 8161 attcttgaga caacttcacg gctttctctg catggcgatt ggattgttac tatcatgtag + 8221 aaatttttat aaaaatcgtc agttgatgct ggagattatg aaggaacata aagaaataag + 8281 gcttgttttt cgaataaaac taattttagg gtttctaact agctttatat ctttgagaca + 8341 atttacaaga cttacggaaa ggatctattc attgtgcaag aataatgaat caagatacct + 8401 tagtgttcct tcaggaagaa aacattattt tggcgagatg tttataagag aagatatgca + 8461 gttaactagg aaactaaatt ttgaaggaca taagtggaat gttccaaata atgttgagca + 8521 ttatttaact gtaatgtacg gtgattatat gaaaatacct gcagttgaag atagggaatc + 8581 acatatcatt ttagaaatct ccttccctag cgagtaaaca gactttcatt ttttatatgt + 8641 aaggaattaa tttaatgaaa aaaatagctt tagtgaaatg gattttggat gattctggtg + 8701 gcggtgagcg agttgctgta tctttggcaa acgaacttac aaaaaagtat gaagttcatt + 8761 tgattggaat tacaacaaag caatcggatt tattctttgg aatcaattct caagtaaaat + 8821 actccaattt ttttgaccat cgagtacgct tgtctaagaa tattctaaaa atctcaaaaa + 8881 tgttaaaaaa atatttccta gataatgaga tagaggttgc ctttgggata ggaatattcg + 8941 ctaatgtatt tttatccttg tcgggaatag gaatttctac taaagtagtt ttgtgtgatc + 9001 ataccaattc aattacggct aatagagaac tttctcagaa agtccaaaga tatgttggga + 9061 caaagctagc agacaagatt attactctta cgcaagagga tcgtaaaaat tatatacgaa + 9121 aatacggcat ttctgagaat aggattgctt acatctataa ttggaaagaa aatcgtcttt + 9181 ccaatatacc ttataatgat gagtctacta aaattgtaac tgttggtcgt tttgattatc + 9241 aaaaaggata tgattatctt atccaagtcg cgaaaaaagt gttagctaaa atgcctgact + 9301 ggacttggga aatctacggt tccggaaaac aagataaagt agacaaaatc agagatttaa + 9361 tcaccgaaaa tgatttacag gataagttag tcataaaagg acttgaaaaa aatcaggatc + 9421 tgatttatgg agataaaggg atttatgtca tgacttctcg ttacgaaggt ttaccgttgg + 9481 tattgttaga agctcaacaa tacaatcttc ctattgttag cttcagatgt ccaacgggac + 9541 ctagtgagat tgttgaagat ggggtcaatg gttatctgat agattgttat gataccgata + 9601 agatgagtga gaaattgctt gaattgatga aaaatgatga tttgcgacaa tctttctcag + 9661 
agcatgcaaa agatactatg gataaatttg ataaaaataa aattcttaat cagtggatag + 9721 agttgattga gacaatttag gagataagat gcaagagtgt ttattgacaa ttgtaatgcc + 9781 tagttataat attcaggact atatttccaa aggaatcgag tcattccagc aagtacaccc + 9841 ggattataaa aataaatttg aagtactggt tgtcaatgat agaagtacag acgatacggc + 9901 tttagtagca gaaaaaatat tagccaaaga ttcgttgctg gatggccgtg tcattacaaa + 9961 agaaaacggc ggtcatggtt cgacaatcaa tcgcggtatt caagaagcaa agggaaaatt + 10021 ttttaaagtg attgatgggg atgactgggt tatccccatc agaaattgaa aagttcttag + 10081 atgctcttga aactgttgat gtggatatgg tgattacaga ttttacagag cagcatgtca + 10141 ataacgatac tacagtacga agtgacttta ttgacaagta tgaaatttgt agaatctata + 10201 aggggattcc tgatgtaagg attcccatgc attcagttac atataaaaca tctatcttgt + 10261 cggcgaataa aattcgttta agtgaaaaaa cattttatgt tgacattcag tacacactct + 10321 ttcctttgga gtatgttcat agtttcagtt attggaatta tgatatttat caatactaca + 10381 taggtagacc agagcaaagt atgaatattg agagtatgaa gcgaaatgta agtcatcatc + 10441 taaaggtaac gaattctgta ctagattatt tttcaaaaat tgaaaatgaa cccgttttaa + 10501 accgagtagt ttctgaaacc ttagtttatc tcatcagttt gcaggttgtc taacttaaat + 10561 tataggacta gctttgcttt gggaataaat tttaatccga tttggaataa atactctaaa + 10621 aaaaaagaaa aagagagagg tgtttaagat gtttgtcagc atcgttgttc cggtttataa + 10681 tgttgcagac tatctgcatt atgcgataga aagcttaatt aaacagacct atcaaaactt + 10741 tgaggtaatc cttgtaaatg atggttctac agatgattct cctctattat gcgaagatta + 10801 tgcaaagcaa tatgaaaata tccatgtttt ccacaaagaa aatggtgggt tatctgatgc + 10861 gcgtaacttt ggagtttcta aagcgagttc agattggatt ttctttttag atccggatga + 10921 ttatcttgaa gaatatactc tagagttaat cgtgaaaatt caggaaacac atcaagcaga + 10981 cttgatttca acaaaggtaa aagctacttc aaaatataat gcttatactt cttatcgatt + 11041 gcaagactca gactataaag atttggcttc gattacaaaa gaaaaggcta tggaactaat + 11101 gttggatgac aaagttgcaa cggtttctgc ttgtgctaag ctttatcgga aatgcatctt + 11161 ggaacgcgtt ccatttccag tcgggaagat ctatgaggat ttttatgttg tagcagaaca + 11221 tcttgcctta gctgaaagaa tcgtgatcag tccacttgaa acctacaatt actatcgtag + 11281 
ggaagggagt attgttcgtt caacatttac tgaaaaaaga tatgatttct ttgaagctgt + 11341 tgcaaaaaat gaggaagttg ttaaaagaga gtacattcag attccagaat taaagcaagc + 11401 tttgcaagct aagaaattat taggtggttt tgtagtaatt ggtgcaaaag ctgactcagg + 11461 cttaaaagat ttttcaaaag ataaagagtt gttgagagtc gaaatgagcg agttattaaa + 11521 aaatagtaag ttatcatgga aactaaaact aaaatatctt atttttatgt ttagccctaa + 11581 attgtatttg ttgctacgat agtatgatac atagatccaa tttaatttgc aacaggtgtc + 11641 aaaaaattgt aggaaagagg gaatatgaaa gaagtgttta gaagaattgc ccattataaa + 11701 tctgttcgtt cacgattttt aatgtctctg gttgattata atagggcggg ttgaaatgaa + 11761 agtattaaaa aactacgcct acaatctttc ttatcaattg ttggtgatta tacttccgat + 11821 tattacgact ccctatgtaa cacgggtctt ttcttcggat gatttaggga cgtatggata + 11881 ctttaattcc attgttactt attttatcct cttggcgaca ctaggagttg ctaactatgg + 11941 gaccaaggtc atttcagggc atcgcaagga aattgaaaaa aacttttggg gtatctactc + 12001 tctacaatta ggggcaacag ttctttctct gtctttatat gctcttcttt gtctgaccct + 12061 tccctttatg caaaatccgg tagcctacat tctaggcttg agtttagttt caaaaggttt + 12121 agacatttcc tggctctttc aagggctaga agattttcga aagattactg ttcgaaatat + 12181 cacagttaaa ctcgttggag tcatttcaat ctttatcttt gtcaaatctg caaacgacct + 12241 atatctctat gtttttttgc taaccatatt tgaactttta gggcaactaa gtatgtggtt + 12301 acctgctcgg gagtttatcg gtagttctca ttttagcata gaatatgcta ggcatcattt + 12361 aaagccggtc atattattat tccttcctca agtagctatt tctttgtaca ttacgctgga + 12421 tcgtaccatg cttggagcac tggcgtctac aaaagatgta gggatctatg atcaggcact + 12481 taagttggta aatatccttc tgattttggt aacttccttg ggaagcgtta tgttgcctcg + 12541 tgtcgcgaat ttgttagcga caggtgatca caaagcggtt aacaaaatgc atgagatgtc + 12601 cttcctcatt tataatttag tgattttccc aatgatggca ggaattttga ttgtgaatga + 12661 tgattttgtt agctttttcc ttgggcagga ttttcaggat gcacgttatg caattgccat + 12721 tatgatcttc cgtatgttct ttatcggttg gaccaatatc atgggaattc agattttaat + 12781 tccccataat aaaaataaag aattcatgat ttcaacaaca gctcccgcaa ttatcagtgt + 12841 aggtttgaac ttactattcc ttcctaaact tggatatatc ggagcagcca ttgtttctgt + 12901 
tttgacagag gcgttggtat gggcgataca attatacttt acccgtagat acctaaaaga + 12961 agttccgatt atcggatctt tgacaaaaat tattctagct tcagctatca tgtatggtat + 13021 cttgctaggt ttaaaaacag ttatacattt ttcaccaatc ataaatgtta tagtatttgc + 13081 agtgcttggt ggaatcattt atctttttgc aattctatct ttgaaagtgg tagatgtaaa + 13141 agaattaaaa caaattatta ggaaaaaata aaatgcaaaa aaatagggat attagcctag + 13201 atttattaaa agtgcttgcg tgtattgggg tcattttact ccatacaaca atgggcggat + 13261 ttaaagagac aggatcatgg aatcttttgg catatttata ttatttaggt acctactcca + 13321 ttcccttgtt ttttatggtc aatggttatt tattgttagg caaaagggaa ataacttatc + 13381 cttacatact tcaaaaagtc aaatggattc taataacagt gtcattatgg aacattatcg + 13441 tttggctttt taaaagagac tttgcggtta atccaattaa aaaaattgta ggctctctgt + 13501 tacaaaaagg gtatttcttt cagttttggt ttttcggtgc cttgatactg atttatttat + 13561 gtttgcctgt tttgaaaaca gttataaatt caaaaagaaa atatgtatac attctatctt + 13621 tattggtggc aattgggttt atagttgaat tagcaaatat tttccttcag atgcctatac + 13681 aaactcatgt tatgcaaact tttagattat ggacttggtt tttctactat cttttaggtg + 13741 gttatatagc acaattcaat gtagacaacc tcaaatatag atttaaaaat tggatgaaaa + 13801 tagttagcat acttttgtta ttgatttcac caataatatt attcttcata gcgaagacta + 13861 catatcataa tctatttgct gaatattttt atgatacttt atttgtaaaa gtcagtactc + 13921 taggaatttt tctaactatc ttcacgctta cgttgaatga aaaccgaaac aaatggattg + 13981 ttttcctttc taatcaaaca atgggagttt tcataataca cacttatatt atgaaattgt + 14041 gggaaagaat atttggtttt aattttgtag gagcatattt actttttgct ctatttactt + 14101 tgagtgttag ttttattatt gttggaatgt taatgaagat tccttacttc aatcgaatcg + 14161 tcaaattata aaaaggagaa cactatgtac gattatctta tcgtcggtgc tggtttgtct + 14221 ggagcaatct ttgcacacga agctacaaaa cgtggaaaaa aagttaaagt gattgacaag + 14281 cgtgaccaca tcggtggaaa tatctactgt gaaaatgttg agggcatcaa tgtccacaag + 14341 tatggtgccc acattttcca tacttccaat aaaaaattgt gggactatgt taaccaattc + 14401 gctgagttta acaactatat caattcccct atcgccaact atcaagggca cctttacaat + 14461 ctgcctttca atatgaacac tttctacgcc ttgtggggaa caaagacacc ccaagaagtc + 14521 
aaggacaaga ttgctgagca aacgactcac atgcaagatg ttgagccaaa aaacctagag + 14581 gaacaagcca ttaagttgat tggtacggat gtctatgaaa agctgattaa gggctatact + 14641 gagaaacaat ggggacgttc tgctactgag ctgccaccct ttatcatcaa gcgtttgcca + 14701 gttcgattga cctatgataa caattatttc aacgaccgct accaaggaat tcctattggt + 14761 ggttacaatg tcatcattga aaatatgctt ggcgatgtgg aagttgagct tggtgttgat + 14821 ttctttgcca atcgtgaaga gttagaagca tcagctgaaa aagttgtctt cacagggatg + 14881 attgatcagt tctttgacta tcagtttggt gaactagagt atcgcagtct tcgttttgaa + 14941 catgagattc tggaccaaga aaactatcaa ggaaatgctg tagtcaacta tactgaacgt + 15001 gatataccat atacgcgtat catcgagcac aaacattttg agtttgggac ccaggacaag + 15061 accgttatta ctcgtgaata tccagcagat tggaaaagag gggatgaacc ctactatcca + 15121 atcaatgatg ctaaaaacaa tgcaatctat gaacagtatc tagcagaagc caagaaaaat + 15181 gggcgcgtga tcttttgtgg tcgcttggca gattataaat actatgatat gcatgtgacg + 15241 gttgaacgtg cattggatgt ggtagaagaa gaactaggga gtatctaaga acatcacaga + 15301 taaaggagag aaaaggtgaa atattatctg aaggattcat ttctgaataa tgaatacgaa + 15361 aagaatgcag gaaataaggc acgaaatgac gtggaagcta ttctaatctc agaggggtat + 15421 aagggattgg aactcaaggt tgagaattgg tataagatga atttctttaa agctcagcaa + 15481 cacaaatatc gggcaaccaa gtctgtgttt gatcagttgg gatctggaga tgaattgctg + 15541 attcagttcc cgattatcca ccatacattt ttcatttcgc aactcatcaa gcaggctcaa + 15601 aaaagaggag ttaaattcta tctgttgatc catgatgttg aaaccgtgcg tcatgtagga + 15661 aattcagcag tgaaacttcg tcataaagtg agagattact tccaagagaa ggcagctctt + 15721 acatcagtgg atggcattat cgttcataat gatatcatga aaaatgcctt gacaatccaa + 15781 ggcataccat cagataaaat ggttagcttg gagatttttg actatctgat tcctaacttt + 15841 gaggaaaaaa atgctcccca aaaagaggga gcgattatcg tcgccggaaa tctaattcca + 15901 acaaaatcag gctatcttta taatttgcca gaacagccag cttacaactt gtatggagcg + 15961 ggttacgatg aaagtcgtgc attgaaaaac acgacctact ttggttcctt tatgccagat + 16021 gacctcccag ttgctcttca aggtagtttt ggtttggtgt gggatgggga tagttcagaa + 16081 acttgccaag gttctttcgg aaattaccta cgtattaaca attcgcacaa ggcttctctt + 16141 
tatttggctt cgggctttcc tctggtggtt tggaaagagt ctgcccttgc gcattttgtg + 16201 ctagataagc agtgtggtat agcggttgct tctctatatg acctccaaaa ggcactagac + 16261 gatttgacag atcaagatta catggaactg tcggctaatg ccagacaagt aggagtagcg + 16321 attcgaagtg gagattatct gaaatcggcc atttctaaat tgaagtaaga atgctaaatt + 16381 tcaagttcaa gttagccagc aatcaaaaat tctctgggag acttgtagtc caagcatttt + 16441 ttaggatagt tattgatcca cttttcgatg aaggcggctt ctttaggagt cgttttctta + 16501 gttccttggc tctttgtcaa ctgtagtggg ttgaaaaaaa gctaagctcg agaaaggaca + 16561 aattttgtcc tttctttttt gatattcaga gcgataaaaa tccgtttttt gaagttttca + 16621 aagttccgaa aaccaaaggc attgcgcttg ataagtttga tgagattatt ggtcgcttcc + 16681 aatttggcgt ttgaataggg tagttgaagg gcgttgacga ttttctcttt gtcctttaga + 16741 aaggttttaa agacagtctg aaaaatagga tgaacctgct taagattgtc ctcaatgagt + 16801 ccgaaaaatt tctccggttc cttattctga aagtgaaaca gcaagagttg atagagctga + 16861 tagtgatgtt tcaagtcttg tgaatagctc aaaagcttgt ctaaaatctc tttattggtt + 16921 aaatgtatac gaaaagtagg acgataaaat cgcttatcac tcagtttacg gctatcctgt + 16981 tgtatgagct tccagtagcg cttgatagcc ttgtattcat gggattttcg atgaaactga + 17041 ttcatgatct gaacacgcac acgactcata gcacggctaa gatgttgcac aatgtgaaag + 17101 cgatcaagaa cgattttagc attcgggagt gaaacagtct gggagactgt ttcagcctga + 17161 gcctagaaat ttgaaagcga agctgtttag ctaagtcata gtaagggcta aacatatcca + 17221 tagtaataat tttgacgcga catcggacaa ctctatcgta gcgaagaaag tgatttcgaa + 17281 tgatagcttg tgttcttccc tcaagaacag tgatgatatt gagattgtta aaatcttgcg + 17341 caatgaagct catctttccc tttgtaaaag catactcatc ccaagacata atctcaggaa + 17401 gacaagaaaa atcatgttta aagtgaaaat cattgagctt acgaataaca gttgaagttg + 17461 agatggaaag ctgatgggca atatcagtca tagaaatctt ttcaattaac ttttgagcaa + 17521 tcttttggtt gatgatacga gggatttggt gattcttctt gacgatagaa gtttcagcga + 17581 ccatcatttt tgaacagtga tagcacttga atcgacgctt tctaaggaga attctagtag + 17641 gcataccagt cgtttcaaga taaggaattt tagaaggttt ttgaaagtca tatttcttta + 17701 attggtttcc gcactcaggg caagatggag cctcataatc cagcttagcg ataatttctt + 17761 
tgtgggtatc catattgatg atatctagaa tcttgatgtt tgggtcttta atatcgagca + 17821 gttttgtgat aaaatgtaat tgttccatat gaatctttct aatgatggtt ttgtcgcttt + 17881 tcattatagg tcatatggga ctttttttct acaacaaaat aggctccata atatccatag + 17941 ggaatttacc cactacaaat attatagagc cctttttgtt tttttcagaa tttaccaaat + 18001 taattaaaaa attcagaaaa ttctattgac atctctctga aaagagtcta taatggagag + 18061 aaagttttaa aggagaaaat gatgaaaagt tcaagactac ttgcccttgc gggcgtgaca + 18121 ttattg +// + diff --git a/public/res/serotype_genbank/serotype_10D.gb b/public/res/serotype_genbank/serotype_10D.gb new file mode 100644 index 0000000..70eaf1f --- /dev/null +++ b/public/res/serotype_genbank/serotype_10D.gb @@ -0,0 +1,676 @@ +LOCUS contig_1 15249 bp DNA linear UNK 10-JUN-2024 +DEFINITION contig_1, whole genome shotgun sequence. +ACCESSION contig_1 +VERSION contig_1 +KEYWORDS . +SOURCE None + ORGANISM . + . +COMMENT Annotated with Bakta + Software: v1.9.3 + Database: v5.1, full + DOI: 10.1099/mgen.0.000685 + URL: github.com/oschwengers/bakta + + ##Genome Annotation Summary:## + Annotation Date :: 06/10/2024, 15:54:55 + CDSs :: 16 + tRNAs :: 0 + tmRNAs :: 0 + rRNAs :: 0 + ncRNAs :: 0 + regulatory ncRNAs :: 0 + CRISPR Arrays :: 0 + oriCs/oriVs :: 0 + oriTs :: 0 + gaps :: 0 + pseudogenes :: 0 +FEATURES Location/Qualifiers + source 1..15249 + /mol_type="genomic DNA" + gene 10..1455 + /locus_tag="DFGJAL_00005" + /gene="wzg" + CDS 10..1455 + /db_xref="BlastRules:WP_000091082" + /db_xref="COG:COG1316" + /db_xref="COG:M" + /db_xref="RefSeq:WP_050150272.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0005E42858" + /db_xref="UniRef:UniRef100_UPI0005E42858" + /db_xref="UniRef:UniRef50_G3G7D5" + /db_xref="UniRef:UniRef90_O54604" + /db_xref="UniprotKB:Q4K2G0" + /db_xref="UserProtein:wzg" + /product="""integral membrane regulatory protein Wzg""" + /locus_tag="DFGJAL_00005" + /protein_id="gnl|Bakta|DFGJAL_00005" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAFR + 
YLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNRLN + ATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLTVDQ + SSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAPKTSK + NQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADGGNNQK + DKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQEFSALH + GKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTSTEALKNYS + TIIDSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRMDLPSYAMPDSNLY + VMEIDDSSLAVVKAAIQDVMEGR" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050150272.1" + /gene="wzg" + gene 1457..2188 + /locus_tag="DFGJAL_00010" + /gene="wzh" + CDS 1457..2188 + /db_xref="BlastRules:WP_000565352" + /db_xref="RefSeq:WP_050118577.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0005E77F07" + /db_xref="UniRef:UniRef100_UPI0005E77F07" + /db_xref="UniRef:UniRef90_Q9AHD4" + /db_xref="UniprotKB:Q4K2F9" + /db_xref="UserProtein:wzh" + /product="""protein-tyrosine phosphatase Wzh""" + /locus_tag="DFGJAL_00010" + /protein_id="gnl|Bakta|DFGJAL_00010" + /translation="MIDIHSHIVFDVDDGPKSREESKTLLAEAYRQGVRTIVSTSHRRK + GMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDILDKLEKKRIPTLNDSRY + ALIEFSVNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYTQVN + SSHVLKPKLFGERYKFMKKRAQYFLEQDLVHVIASDMHNLDGRPPHMAEAYDLVTQKYG + EAKAQELFIDNPRKIVMDQLI" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050118577.1" + /gene="wzh" + gene 2197..2889 + /locus_tag="DFGJAL_00015" + /gene="wzd" + CDS 2197..2889 + /db_xref="BlastRules:WP_000664160" + /db_xref="RefSeq:WP_050150275.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0005DC8774" + /db_xref="UniRef:UniRef100_UPI0005DC8774" + /db_xref="UniRef:UniRef50_Q54519" + /db_xref="UniRef:UniRef90_A0A139PG18" + /product="capsular polysaccharide biosynthesis protein + wzd" + /locus_tag="DFGJAL_00015" + /protein_id="gnl|Bakta|DFGJAL_00015" + 
/translation="MKEQNTIEIDVFQLVKTLWKRKLMILIVALVTGAGAFAYSTFIVK + PEYTSTTRIYVVNRNQGDKPGLTNQDLQAGTYLVKDYREIILSQDALEKVATNLKLDMS + AKTLASKVQVAVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDVTTLE + EARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIELLDTRVKRPEDVEDVLQIPLLGV + VPDLDKIK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050150275.1" + /gene="wzd" + gene 2899..3588 + /locus_tag="DFGJAL_00020" + /gene="wze" + CDS 2899..3588 + /db_xref="RefSeq:WP_050150278.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0005E072CE" + /db_xref="UniRef:UniRef100_UPI0005E072CE" + /db_xref="UniRef:UniRef50_Q54520" + /db_xref="UniRef:UniRef90_O84996" + /product="Tyrosine-protein kinase wze" + /locus_tag="DFGJAL_00020" + /protein_id="gnl|Bakta|DFGJAL_00020" + /translation="MPTLEISQAKLDFVKKAEENYNALCTNLQLSGDDLKVFSITSVKL + GEGKSTTSTNIAWAFARAGYKTLLIDGDIRNSVMLGVFKARDKITGLTEFLSGTTDLSQ + GLCDTNIENLFVIQAGSVSPNPTALLQSKNFGTMLETLRKYFDYIIVDTAPVGVVIDAA + IITRKCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGIVLNKFDTSVDKYGSYGNYG + DYGKNKK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050150278.1" + /gene="wze" + gene 3603..4970 + /locus_tag="DFGJAL_00025" + /gene="wchA" + CDS 3603..4970 + /db_xref="RefSeq:WP_050150281.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0005DF6514" + /db_xref="UniRef:UniRef100_UPI0005DF6514" + /db_xref="UniRef:UniRef50_Q8VU30" + /db_xref="UniRef:UniRef90_Q8VU30" + /product="Galactosyl transferase wchA" + /locus_tag="DFGJAL_00025" + /protein_id="gnl|Bakta|DFGJAL_00025" + /translation="MNGKILRSSLAIIQSFFVILLTYLLSAVREAEIVSTTAIALYILH + YFVFYISDYGQAFFKRGYLIELVQTLKYILFFALAISISNFFLEDRFSVSRRGMIYFLT + LHALLVYVLNLFIKWYWKRAYPNFKGSKKILLLTATSRVEKVLDRLIESNEVVGELVAV + SVLDKPDFQHDYLKVVAEGEIVNFATHEVVDEVFINLSSEKYNIGELVSQFETMGIDVT + VNLTAFDCSLARNKQIREMAGLNVVTFSTTFYKTSHVIAKRIIDIVGALVGLILCGLVS + IVLVPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTMQGGMFK + 
VNDDPRITKIGCFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPEQKRRLSF + KPGITGLWQVSGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVLMKDGAK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050150281.1" + /gene="wchA" + gene 4983..6095 + /locus_tag="DFGJAL_00030" + /gene="wciN-beta" + CDS 4983..6095 + /db_xref="RefSeq:WP_224782777.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0005DBB6C6" + /db_xref="UniRef:UniRef100_UPI0005DBB6C6" + /db_xref="UniRef:UniRef50_D1GFD3" + /db_xref="UniRef:UniRef90_D1GFD3" + /product="Glycosyl transferase" + /locus_tag="DFGJAL_00030" + /protein_id="gnl|Bakta|DFGJAL_00030" + /translation="MKLLHFSEVGGGVDRYIKLYLKYSDKEHFKNIVVGSDQLNRQTYE + QEYNVKFYHIDIYRSLSPIKLLRAIKQFRKILYLERPDIVYLHSTFAGVVGRLASMGLS + CKVVYNPHGWSFKMDVSKIKQFVYKKIEKFLSYLTDKYILISKFEYEAAQSLKIPLKKL + TLVYNGVEIDEDFNENQINVLLPTNKYVIGMIGRISEQKNPFFFVEFAKKLSEIYSNLY + FVIVGDGELRGRTEELIEEYGLRSSFFITGWVDNPEDYLAQFNQAVLFSKWEGFGLAVA + EYMKHKKPILITNVDGMSELVIDGESGFKVPLYNLEVAVDRSRSIIENRELANELGSAA + FQRVRSIFEIKEKVSELENIFMSLGGDDNL" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_224782777.1" + /gene="wciN-beta" + gene 6082..6285 + /locus_tag="DFGJAL_00035" + /gene="wciN-alpha" + CDS 6082..6285 + /product="hypothetical protein" + /locus_tag="DFGJAL_00035" + /protein_id="gnl|Bakta|DFGJAL_00035" + /translation="MITFKKKQFNIIQKKKLIRLKGRLFSDILQRVFYQEGRGKRAVKL + HMLRNLDIIIKVSTKSLKMIYF" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /gene="wciN-alpha" + gene 6393..7178 + /locus_tag="DFGJAL_00040" + /gene="wcrO" + CDS 6393..7178 + /db_xref="EC:2.7.8.-" + /db_xref="KEGG:K07271" + /db_xref="RefSeq:WP_050150287.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0005E407F9" + /db_xref="UniRef:UniRef100_UPI0005E407F9" + /db_xref="UniRef:UniRef50_A0A0F2DZV6" + /db_xref="UniRef:UniRef90_A0A0F2DZV6" + /product="LicD family 
protein" + /locus_tag="DFGJAL_00040" + /protein_id="gnl|Bakta|DFGJAL_00040" + /translation="MEKQEILKKIHEEELKLLKRCIDVCEKNNIPYFALGGTLLGAVRH + KGFIPWDDDIDLGVPRSSYSRLIELLNDDNIVIEKNIINLNVLQYKKKDKVIIGDKSYE + IYIDLFPLDGTPNNKFLRNIFLSKFVFYRTLYKLSIVDQLNIVDRGFVGNSIVMFMKMI + GISKLLPTEQIVEKIHSIAEMYDFESSTYVGNILGRYRKKEIVNKKIFGSGIKLDFEDL + QLNCPEVFDSYLKHIYGDYMKLPKEEDRVAHFEELNVQE" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050150287.1" + /gene="wcrO" + gene 7182..8273 + /locus_tag="DFGJAL_00045" + /gene="wcrC" + CDS 7182..8273 + /db_xref="RefSeq:WP_050150290.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0005DC45A8" + /db_xref="UniRef:UniRef100_UPI0005DC45A8" + /db_xref="UniRef:UniRef50_W1Q1W1" + /db_xref="UniRef:UniRef90_UPI0005DC45A8" + /product="glycosyltransferase family 4 protein" + /locus_tag="DFGJAL_00045" + /protein_id="gnl|Bakta|DFGJAL_00045" + /translation="MKKIALVKWIIDGTDGGLKVATNIANELSKKYEVHLISIVSTEEI + FFPLSNEVYYKNLSSKKISIRKNFFKAVKLLRKYIKENDIKLLLGIGMGMNSVGIASTI + GLDTKFISCDHTNSIIDIDTTVKRFQRYVGAKFADKIITLTTADRKNYINKYKIKPDRV + EYIYNWIDSMDIVNKYDIDSKKLITVGRFDSQKGYDYLSKVAINILSSYPDWQWDIYGS + GDEQVKQDLITELNKGGILSQVHFKGNVNGTDNIYPGQAIYVMTSRYEGLPLVLLEAKQ + YGLPIVSFNCPTGPAEIVLDGENGYLIEDFDINQMSQKIIELIKNNDLRLRFSRNAMID + TDKFNKKKIVKQWIELIEKVTGE" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050150290.1" + /gene="wcrC" + gene 8275..9279 + /locus_tag="DFGJAL_00050" + /gene="wcrD" + CDS 8275..9279 + /db_xref="RefSeq:WP_050150293.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0005E5B324" + /db_xref="UniRef:UniRef100_UPI0005E5B324" + /db_xref="UniRef:UniRef50_A0A4V0BMV4" + /db_xref="UniRef:UniRef90_A0A3R9KU69" + /product="Putative glycosyltransferase EpsJ" + /locus_tag="DFGJAL_00050" + /protein_id="gnl|Bakta|DFGJAL_00050" + /translation="MYDKLVTIIVPMYNIEQYITKCIESFKQVNKKYYADFEVIVVNDG + 
STDDSLQVVEDLITNSCLNIRLVNKENGGHGSTINVGIKESKGKFFKVIDGDDWIDVPS + FEKLLEELKGIDVDMIITNYTEQHTYNQTEIEIGFSDILDCNKIYEGIPFKRIPMHALT + YKTSILKESGIKISEKTFYVDMEYTLLPLQYVKSYVYIDLNVYQYFLGRKDQSMNLNVM + KQKADHHNRVTKRILDYYEVIRFDKNLEPVVKDVLTYLINKQCQLFIMNKNIDDASRLF + SYAYKCQYRWKYDHSKKTVSLIYINSRFKNIFNLILKPLINKQHKEWSEMDEY" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050150293.1" + /gene="wcrD" + gene 9269..10231 + /locus_tag="DFGJAL_00055" + /gene="wciF" + CDS 9269..10231 + /db_xref="RefSeq:WP_050150296.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0005E00558" + /db_xref="UniRef:UniRef100_UPI0005E00558" + /db_xref="UniRef:UniRef50_A0A0F2E1M2" + /db_xref="UniRef:UniRef90_A0A0F2E1M2" + /product="Glycosyl transferase family protein" + /locus_tag="DFGJAL_00055" + /protein_id="gnl|Bakta|DFGJAL_00055" + /translation="MNISVVIPVYNVEDCLHYAIESLVNQTYKNFEVLLINDGSTDNSG + KLCDKYAQEYDWIRVFHKENGGLSDARNYGVLKATNEWIFFLDPDDYIEPFTFELLTLI + QEKYQADLISTKVQTTNEYEKFSKEQFNSETAKNVTKEEALELMLEDKVATVSACAKLY + KKQILEMRPFPVGKIYEDFFVVAEHLRLAEQVVISPVVTYHYYRRPGSIVQSKFTDKRF + DFFDAGENNRIQIKQFYDGNSVEKALNLKIVQGSFHISEAAAFTDTKALRNIVKKVSSF + YWSIIFNSKASVKLKLKYNWFLLTPNLYFRIKKMLKRSI" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050150296.1" + /gene="wciF" + gene 10231..11505 + /locus_tag="DFGJAL_00060" + /gene="wzy" + CDS 10231..11505 + /db_xref="RefSeq:WP_050150299.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0005DDBD31" + /db_xref="UniRef:UniRef100_UPI0005DDBD31" + /db_xref="UniRef:UniRef50_A0A0F2E0D2" + /db_xref="UniRef:UniRef90_A0A0F2E0D2" + /product="Polymerase" + /locus_tag="DFGJAL_00060" + /protein_id="gnl|Bakta|DFGJAL_00060" + /translation="MFLVFLMFFCVFLLFPIITTPFLLIPIVYRFKYSRYYLMLFVIGI + SLIALRYIPYFTDDGAYHFKAAYLYQFYDNIFDWFKNLMSKNIPTEYGYYNYPLFALLL + YIFSKTGTYSLISFTVIMIVYFLYTKIIYDVFQRYKISKILFLLALLTMIVIVNVRYTT + 
SGMRYSLAVSLLVFLFYKEINNGFKINKSIFFYLIPVLIHSSTVIFVLMRLMFPWLKDM + KIYKKLLVLFSLPPLIQLSPALQHININYLSFLLEKFDVYQNTTTFITLFRTSDLYNVY + IGVFICFLYIFFYHTNFRFQKNHKVNLFFSFVLYICLLTLSVLPFLTILDRFIWFIYPL + VSISIVLYIASDKSKVEKVRFKGYNNLPFYIILCLCFIGGMIGNKKFFDFLRLLDFNIF + DILTKNVFEYFSDLHHFSLNEVRRR" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050150299.1" + /gene="wzy" + gene 11693..12634 + /locus_tag="DFGJAL_00065" + /gene="wcrG" + CDS 11693..12634 + /db_xref="RefSeq:WP_050150302.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0005E8CB7D" + /db_xref="UniRef:UniRef100_UPI0005E8CB7D" + /db_xref="UniRef:UniRef50_Q4K2E9" + /db_xref="UniRef:UniRef90_Q4JZ27" + /product="Putative glycosyl transferase" + /locus_tag="DFGJAL_00065" + /protein_id="gnl|Bakta|DFGJAL_00065" + /translation="MKQAYLIIAHNKIEQLKFLLSLLDYEKHDIFILFDKKVEITDKQK + NELTQIVTKSNIFFTREIPIYWGDYSLVEAEIELFETANKQENYSMYHLLSGVDLPLDT + AEKIYNFFDSRKEYNFLTMVSDELYIRNKVYERVAFKTILPHLTVRTVNNNFLRSVLKI + YRRFEVELQRIFKVDCFKKFNLELKYASNWCSLNKEAVDILLEEKQLIATIFKNTKVND + ELFIPTVLQKHQLLDTVYSIEPTNDRPTDFQGNLRYINWWDGSPYTWTDSSDDIEQLKR + GKALGHKFSRKFDLERNPNLKEKILTIINRTD" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050150302.1" + /gene="wcrG" + gene 12636..14060 + /locus_tag="DFGJAL_00070" + /gene="wzx" + CDS 12636..14060 + /db_xref="RefSeq:WP_050274613.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0005E121F9" + /db_xref="UniRef:UniRef100_UPI0005E121F9" + /db_xref="UniRef:UniRef50_K8MPI1" + /db_xref="UniRef:UniRef90_Q4JZ26" + /product="Flippase Wzx" + /locus_tag="DFGJAL_00070" + /protein_id="gnl|Bakta|DFGJAL_00070" + /translation="MKVLKNYAYNFSYQLLLIILPIITTPYVTRIFSATDLGTYGYFNS + IVTYFILLATLGVASYGTKEISSNRKNIPKNFWGIYTLQFCAASLSIILYTLLCFGVDV + MRNPVAYILGMSLISKGLDISWLFQGLEDFRKIIVRNILVKLVGVISIFLLIKSADDLY + LYVFLLTIFELLGQLSMWLPAQKFIGKAHFDIDYTKYHLKPILLLFLPQIAISLYATLD + 
RTMLGMISSTNDVGIYDQALKLINILLTVVTSLGSVMLPRVSNLLATGNHKAVNKMHEM + SFLIYNLVIFPIMAGMLIVNDDFVNFFLGKDFQDARYAIAIMIFRMFFIGWTNIMGFQM + LIPHNKNKEYMVSTTVPAVLSVALNLLFLPKLGYIGAAIVSVLTEALVWGIQLFYTRSY + LREVPILGSLFKIIVSSGFMYVILLFVKQVLNVSPMINVGIYAVSGAMIYLVFILIFSV + INPNELKQQLLKNKGA" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050274613.1" + /gene="wzx" + gene 14062..15165 + /locus_tag="DFGJAL_00075" + /gene="glf" + CDS 14062..15165 + /db_xref="EC:5.4.99.9" + /db_xref="GO:0008767" + /db_xref="GO:0009273" + /db_xref="RefSeq:WP_050150308.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0005E4607D" + /db_xref="UniRef:UniRef100_UPI0005E4607D" + /db_xref="UniRef:UniRef50_P37747" + /db_xref="UniRef:UniRef90_A0A0F2DGD0" + /product="UDP-galactopyranose mutase" + /locus_tag="DFGJAL_00075" + /protein_id="gnl|Bakta|DFGJAL_00075" + /translation="MYDYLIVGAGLFGAVFAHEAALKGKKVKVIEKRNHIAGNIYTREE + EGIQVHQYGAHIFHTSDKEIWEYVNQFAEFNRYTNSPVANYKGEIYNLPFNMNTFNKLW + GVVTPAEAQAKIDEQRAILNGKTPENLEEQAISLVGTDIYEKLIKDYTEKQWGKPTTEL + PAFIIRRLPVRLTYDNNYFNDTYQGIPIGGYTQIVEKMLDHENIDVETNVDFFVNKEQY + LKDFPKIVFTGMIDEFFDYKLGELEYRSLRFENETLDMENYQGNAVVNYTDAETPYTRI + IEHKHFEFGSQTKTIITKEHSKTWEKGDEPYYPVNNDRNNHLYKSYKKLADEQGNVIFG + GRLGHYRYYDMHQVIGAALQCVRNELN" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050150308.1" + /gene="glf" + gene 15172..15249 + /locus_tag="DFGJAL_00080" + CDS 15172..15249 + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000990B463" + /db_xref="UniRef:UniRef100_A0A1T0C5L4" + /db_xref="UniRef:UniRef50_A0A1T0C5L4" + /db_xref="UniRef:UniRef90_A0A1T0C5L4" + /product="Chlorohydrolase" + /locus_tag="DFGJAL_00080" + /protein_id="gnl|Bakta|DFGJAL_00080" + /translation="MKIKEQTRKLATGCSKHCFEVADGS" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Bakta:1.9" + /inference="similar to AA + sequence:UniRef:UniRef100_A0A1T0C5L4" 
+ORIGIN + 1 gtgttaatca tgagtagacg ttttaaaaaa tcacgttcac agaaagtgaa gcgaagtgtt + 61 aatatcgttt tgctgactat ttatttattg ttagtttgtt ttttattgtt cttaatcttt + 121 aagtacaata tccttgcttt tagatatctt aacctagtgg taactgcgtt agtcctacta + 181 gttgccttgg tagggctact cttgattatc tataaaaaag ctgaaaagtt tactattttt + 241 ctgttggtgt tctctatcct tgtcagctct gtgtcgctct ttgcagtaca gcagtttgtt + 301 ggactgacca atcgtttaaa tgcgacttct aattactcag aatattcaat cagtgtcgct + 361 gttttagcag atagtgatat cgaaaatgtt acgcaactga cgagtgtgac agcaccgact + 421 gggactgata atgaaaatat tcaaaaacta ctagctgata ttaagtcaag tcagaatacc + 481 gatttgacgg tcgaccagag ttcgtcttac ttggcagctt acaagagttt gattgcaggg + 541 gagactaagg ccattgtctt aaatagtgtc tttgaaaata tcatcgagtc agagtatcca + 601 gactacgcat cgaagataaa aaagatttat accaagggat tcactaaaaa agtagaagct + 661 cctaagacgt ctaagaatca gtctttcaat atctatgtta gtggaattga cacctatggc + 721 cctattagtt cggtgtcgcg atcagatgtc aatatcctga tgactgtcaa tcgagatacc + 781 aagaaaatcc tcttgaccac aacgccacgt gatgcctatg taccaatcgc agatggtgga + 841 aataatcaaa aagataaatt aacccatgcg ggcatttatg gagttgattc gtccattcac + 901 accttagaaa atctctatgg agtggatatc aattactatg tgcgattgaa cttcacttct + 961 ttcttgaaaa tgattgactt attgggaggg gtagatgttc ataatgatca agagttttca + 1021 gctctacatg ggaagttcca tttcccagta gggaatgtcc atctagactc tgagcaagct + 1081 ctaggttttg tacgtgaacg ctactcacta gccgatggag accgtgaccg tggtcgcaac + 1141 caacaaaagg tgattgtggc tatccttcaa aaattaacgt caaccgaagc actgaaaaat + 1201 tatagtacga tcattgatag cttgcaagat tctatccaaa caaatatgcc acttgagaca + 1261 atgataaatt tggtcaatgc tcagttggaa agtggaggga attataaagt aaattctcaa + 1321 gatttaaaag ggacaggtcg gatggatctt ccttcttatg caatgccaga cagtaacctc + 1381 tatgtgatgg aaatagatga tagtagttta gctgtagtta aagcagctat acaggatgtg + 1441 atggagggta gatgaaatga tagacatcca ttcgcacatc gtctttgatg tagatgatgg + 1501 tcccaagtca agggaggaaa gcaagactct cttggcagaa gcctatagac agggggtgcg + 1561 aaccattgtc tctacctctc accgtcgcaa gggcatgttt gaaactccgg aagagaagat + 1621 agcagaaaac tttcttcagg ttcgggaaat 
agctaaggaa gtggcgagtg acttggtcat + 1681 tgcttacggg gctgaaattt actacacacc agatattctg gataagctgg aaaaaaagcg + 1741 gattccgacc ctcaatgata gtcgttatgc cttgatagag tttagtgtga acactcctta + 1801 tcgcgatatt catagcgcct tgagcaagat cttgatgttg ggaattactc cagtcattgc + 1861 ccacattgag cgctatgatg ctcttgaaaa taatgaaaaa cgcgttcgag aactgatcga + 1921 tatgggctgt tacacgcaag taaatagttc acatgtcctc aaacccaaac tttttggcga + 1981 acgttataaa ttcatgaaaa aaagagctca gtatttttta gagcaggatt tggttcatgt + 2041 cattgcaagt gatatgcaca atctagacgg tagacctcct catatggcag aagcatatga + 2101 ccttgttacc caaaaatacg gagaagcgaa ggctcaggaa ctttttatag acaatcctcg + 2161 aaaaattgta atggatcaac taatttagga gaaatgatga aagaacaaaa cacgatagaa + 2221 atcgatgtat ttcaattagt taaaaccttg tggaaacgca agctaatgat tttaatagtg + 2281 gcacttgtga caggtgcggg ggcttttgca tatagcactt ttattgttaa gccagaatat + 2341 acgagtacca cgcgaattta cgtagtgaat cgcaatcaag gagacaagcc ggggctgaca + 2401 aatcaggatt tgcaggcagg aacttatctg gtaaaagact accgtgagat tatcctttcg + 2461 caggatgcat tggaaaaagt agcgacaaat ttgaagttgg atatgtcagc aaaaacgtta + 2521 gccagcaaag ttcaagtggc tgtaccagct gacactcgta tcgtctcaat ctctgtcaag + 2581 gataaacagc cagaggaagc cagtcgtatc gctaattctc tacgagaagt tgctgcagaa + 2641 aagatcgtcg ctgtaacgcg agtatctgat gtaacgacac ttgaagaagc gcgaccagct + 2701 acgactccct cttctccaaa tgttcgacgc aattccttgt ttggttttct tggaggagca + 2761 gtcgtaacag taattgctgt tcttttgatt gagttgctcg acacccgtgt gaaacgtcct + 2821 gaagatgttg aagatgtact gcaaattcca cttttagggg tcgttccaga tttggacaaa + 2881 ataaaatagg aggaagttat gccaacatta gaaatctcac aggcaaaatt ggattttgta + 2941 aaaaaggcag aggaaaatta taacgctttg tgcacgaacc tacagttaag tggagatgat + 3001 ttgaaagtat tttctatcac ttctgtgaaa ctaggagaag gaaaatcaac gacttccacc + 3061 aatatcgctt gggcttttgc gcgtgcaggt tacaaaacgc tgctgattga tggagatatt + 3121 cgcaattctg ttatgttagg tgtctttaaa gcaagggata agattacagg cctgacagaa + 3181 tttttatcag gaactacaga cctatcacaa gggctttgtg ataccaatat cgaaaatctc + 3241 tttgtaattc aggctggctc tgtgtcaccg aatccgacag ctcttcttca 
aagtaagaat + 3301 ttcggtacaa tgcttgaaac cttgcgtaaa tattttgact acatcattgt agatactgct + 3361 cctgtcggtg tcgtgattga tgcggctatt attacgcgaa aatgcgatgc ttctatttta + 3421 gtgacggagg caggtgaaat aaatcgacgg gatattcaaa aagcaaaaga acagttggaa + 3481 cacacaggga agccgttttt gggaattgtg ttgaataaat tcgatacttc agtagacaaa + 3541 tacggttctt atggaaatta tggagattac gggaaaaata aaaaatagtt caggggatag + 3601 agatgaatgg gaaaatatta aggtcttcat tggccataat ccagagtttt tttgttattt + 3661 tattgactta tctacttagt gctgtgagag aagcggagat tgtttcaaca acagctattg + 3721 cactttatat cctccattat tttgtctttt atatcagtga ttatggacag gccttcttta + 3781 aaaggggata tttgattgaa cttgtccaga cattgaaata tatcctattc tttgcactcg + 3841 cgattagtat ttctaatttt ttcttagagg atcgatttag tgtttctaga cgaggcatga + 3901 tttacttcct cacattacat gctctcttag tctatgtgct aaacctattt atcaagtggt + 3961 attggaagcg ggcttatccc aactttaaag gaagtaagaa gattctccta cttacagcaa + 4021 cttctcgtgt cgaaaaggta ctggatagat taatagaatc aaatgaggtt gttggggagt + 4081 tggtagccgt cagtgtctta gataaaccag attttcagca tgattattta aaggtagtag + 4141 cagaggggga gatagtaaac tttgcgactc atgaggtggt cgatgaagtc tttatcaatc + 4201 tttcaagtga aaaatacaat attggagagc ttgtctctca gtttgaaacg atgggaattg + 4261 atgtaacagt caatctaact gcttttgatt gtagtttggc acgtaacaag caaattcgtg + 4321 agatggcagg attaaacgtt gtgacttttt ctacaacatt ttataagact agtcatgtaa + 4381 ttgctaagcg gattattgat atcgtgggtg cattggtagg gctgatatta tgtggtttag + 4441 tcagtattgt actggttcct ttgattcgaa aggatggggg ctctgctatt tttgctcaga + 4501 cgcgtatagg aaaaaatggt cgtcagttca ctttttataa gtttcgctct atgtgtgtag + 4561 atgccgaggc gaaaaaaaga gaactcatgg aacaaaatac catgcagggt ggaatgttta + 4621 aggtgaacga tgatcctcgt atcacgaaaa ttggttgttt tatacggaag actagcttgg + 4681 acgagctacc acagttttac aatgttctaa agggagatat gagcttggta ggtacacgac + 4741 cgccaacagt ggacgagtat gaacactata ccccagaaca aaaacgtcgg ctaagtttta + 4801 aacctggtat aacaggctta tggcaggtca gtggacgaag tgaaatcaaa aatttcgatg + 4861 aagttgtcaa attagatgtg gcttatatag atgattggac aatctggaaa gatattgaaa + 4921 ttttattgaa 
gacagttaag gtagtattga tgaaggatgg agccaaatag ggggatatgt + 4981 tcatgaaatt gcttcatttt agtgaagttg gcggtggagt tgataggtat attaagttat + 5041 atttaaaata ttcagataaa gaacatttta aaaatattgt ggtaggatca gatcagctca + 5101 atagacaaac atatgaacaa gaatataatg taaagtttta tcacattgat atctatagaa + 5161 gcttgtctcc aataaagctt ttacgcgcga ttaaacaatt tagaaaaata ttgtatctag + 5221 aaagacctga tatagtatat ctgcacagta cttttgcagg cgtagtaggc aggttagctt + 5281 ctatgggttt gtcgtgtaaa gtagtataca atcctcacgg atggtctttt aagatggatg + 5341 tttctaagat taagcaattc gtttataaaa agattgaaaa gtttttgtct tatcttacag + 5401 ataagtatat attaatctct aaatttgaat atgaagcggc tcaatcttta aaaatacccc + 5461 ttaagaaatt gactttagtg tataatggag tagagattga tgaagatttt aacgaaaatc + 5521 aaataaacgt tttattaccc acaaataaat atgttattgg aatgattggt cgtattagtg + 5581 aacagaaaaa tcctttcttt tttgttgaat ttgcaaaaaa attatcagag atttatagca + 5641 atttatattt tgttattgtc ggcgatggcg aattgcgtgg gcgaactgaa gaactaattg + 5701 aagagtatgg gcttcgaagc tcatttttta taacagggtg ggtggataat ccagaggatt + 5761 atttagctca gttcaatcag gcagttcttt tctcgaaatg ggagggcttt ggattggcgg + 5821 ttgcggaata tatgaaacat aagaagccaa ttcttataac taatgttgat gggatgtcag + 5881 aattggttat tgatggtgag tcaggtttta aagtcccact atataattta gaagtagctg + 5941 tagatagaag tagaagtatt attgagaata gagaactagc caatgagtta ggtagtgctg + 6001 ctttccaaag agttcgatct atatttgaaa taaaagaaaa agtgtcagaa ttagagaata + 6061 tattcatgag tttaggagga gatgataacc tttaaaaaaa aacaattcaa tattattcaa + 6121 aagaagaaat taatcaggct aaaaggcaga ttgttctcag acattttaca acgagttttt + 6181 tatcaagaag gccgtggcaa gagggcagtg aagttgcaca tgttgaggaa tttagacatt + 6241 attatcaagg tgagtacaaa atcgttaaag atgatatatt tttaaaaatt tttaagataa + 6301 ttcctcgaaa aattgcaatt aaagttgttg gaattataca atcaaaaatc agactaaagg + 6361 tttataaaat attgaggtga aaaactttta taatggaaaa acaagaaatt ttgaaaaaaa + 6421 tacatgaaga agagttgaag cttttaaaaa gatgtattga tgtgtgtgaa aaaaataata + 6481 ttccatactt tgctttaggc ggtactcttt taggagcagt tagacataaa ggatttattc + 6541 cttgggatga tgatattgat ttaggagtac 
ctagaagtag ttacagtcga cttatagagt + 6601 tgttgaatga tgataatatt gttatagaaa agaatattat taatttaaat gtactgcaat + 6661 ataagaaaaa agataaggtt ataattgggg ataaatcata tgaaatttac attgatttat + 6721 tcccattaga tggtactcca aataataaat tcttaagaaa tatattttta tcaaaatttg + 6781 tattctatcg aacattgtat aaattatcaa ttgttgatca attaaatatt gttgatcggg + 6841 gatttgtagg taattctatt gtgatgttta tgaaaatgat tggtatcagt aagcttttac + 6901 caactgaaca aatagttgaa aaaatacata gtattgctga aatgtatgat tttgaaagca + 6961 gtacgtatgt aggtaatatt ttaggccgat atcgtaaaaa agagattgtg aataaaaaga + 7021 tatttggtag cggaataaaa ttagattttg aagatttaca attgaattgc cctgaggttt + 7081 ttgattcata cctaaagcac atttatggag actatatgaa gcttccaaaa gaagaggata + 7141 gagtagcaca ttttgaagaa ttaaatgtac aggagtaatg aatgaaaaaa atagctttag + 7201 ttaagtggat tatagacggt actgacggtg gattaaaagt cgccacaaat attgcaaatg + 7261 aattatcaaa aaaatatgaa gtacatttaa tttcaattgt aagcacagaa gaaatatttt + 7321 ttccattaag taatgaagtt tattataaaa atttatcttc taaaaaaata tcaatacgta + 7381 agaatttttt taaagcagtg aagttattaa gaaaatatat taaagagaat gatattaaat + 7441 tgcttttggg tattggaatg ggaatgaaca gtgtgggtat tgcaagtact ataggattgg + 7501 atactaaatt tatttcttgt gatcacacta actctattat agatatagat actactgtca + 7561 aaagatttca aagatatgta ggagcaaaat ttgcagataa gataattaca ctaactactg + 7621 ctgatagaaa aaattatata aataaatata aaataaaacc cgatagagtt gaatacatct + 7681 acaattggat agattctatg gatatcgtaa acaaatatga tattgattct aaaaaactaa + 7741 ttactgtagg tcggtttgac agccaaaaag gatatgatta tctatctaaa gtagctataa + 7801 acattttatc aagctatccg gattggcaat gggatatata cggatctggt gatgagcaag + 7861 taaaacaaga tttgataact gaactgaata aaggtggcat tttgtcacaa gttcatttta + 7921 aggggaatgt aaatggtaca gataatattt atccaggtca ggccatttat gtaatgactt + 7981 cccgatatga aggacttccc ttagttcttt tagaagctaa acaatatgga ctaccaattg + 8041 ttagttttaa ttgtcctact gggcctgcag aaattgtatt ggatggggaa aatggttatt + 8101 taattgagga ttttgatata aatcaaatga gtcaaaaaat aatagaatta attaaaaata + 8161 atgacttgag attaagattt tcgcgaaatg cgatgataga tactgataaa 
ttcaataaaa + 8221 agaaaattgt taaacaatgg attgaattga tagaaaaagt gacaggagaa tgaaatgtac + 8281 gataaattag taacaatcat agtaccaatg tataatattg aacaatatat tactaagtgt + 8341 atagaatcat ttaaacaagt aaataaaaaa tattatgcag attttgaagt gattgttgtt + 8401 aatgacggta gtacggatga ctcacttcaa gttgtcgaag atttaattac taatagttgt + 8461 cttaatatta gacttgttaa taaagaaaat ggtggacatg gttcaacgat taatgttggt + 8521 ataaaggaat ctaaaggaaa attttttaaa gttattgatg gggatgattg gattgatgta + 8581 cccagttttg aaaaattatt agaagaactt aaaggtatag atgtcgatat gattattaca + 8641 aattatactg aacaacatac ctataatcag actgaaatag agattggctt ttctgatata + 8701 ttagattgca ataaaatata tgagggaata cctttcaaac ggattcccat gcatgctctg + 8761 acatacaaaa catcgatatt gaaagaatct ggaattaaaa taagtgaaaa aaccttttat + 8821 gttgatatgg aatatacttt actaccttta caatacgtaa aaagttatgt ttatattgac + 8881 ttaaatgttt accaatattt tttaggtaga aaagatcaga gtatgaattt aaacgtgatg + 8941 aaacaaaaag cagaccatca caatagagta acaaaaagaa ttctcgatta ttatgaggta + 9001 attcgctttg acaagaactt agaaccagta gtcaaagacg tattgacata cttaatcaac + 9061 aagcaatgtc agttgtttat aatgaataag aatatcgatg acgcgagcag attatttagt + 9121 tacgcttata aatgccaata tagatggaaa tatgatcatt cgaaaaaaac ggtctcacta + 9181 atttatataa attctagatt taaaaatata tttaatctca tcttaaaacc gttaatcaat + 9241 aagcaacaca aagaatggag tgagatggat gaatattagt gtagttattc ctgtttataa + 9301 tgttgaggat tgccttcatt atgctataga aagtttagta aatcaaactt ataaaaattt + 9361 tgaggtcttg ctaatcaatg atggttctac tgataattca ggaaaattat gtgataaata + 9421 tgctcaagaa tatgattgga ttcgagtatt tcacaaagag aatggtggct tatcagatgc + 9481 gcgtaattat ggagtgttaa aagcaactaa tgagtggata ttttttttgg atccggatga + 9541 ttatatagag ccttttacat ttgaattatt gactcttatt caagagaaat atcaagctga + 9601 tttgatttca acaaaagttc aaactacaaa tgagtatgaa aaatttagca aggaacaatt + 9661 taattcagaa actgctaaaa acgttacaaa agaagaagca ctagaattaa tgttagaaga + 9721 taaagttgca acggtatctg catgtgcaaa actttataaa aaacaaattt tagaaatgag + 9781 accatttcct gtaggaaaaa tttacgaaga tttttttgtt gtagccgaac atttaagatt + 9841 agctgaacaa 
gtagttattt cacctgttgt tacttatcat tactatcgtc gtcctggaag + 9901 tattgtacaa tcgaaattta cagataagag atttgatttt tttgatgcag gtgagaataa + 9961 tagaattcag ataaaacaat tttatgatgg taatagtgta gaaaaagcgt taaatttaaa + 10021 aattgttcaa ggttcttttc atatttctga agctgcagct tttacggaca caaaagcttt + 10081 aagaaatatt gttaaaaaag taagttcatt ttactggagt ataatcttta attctaaagc + 10141 ttctgtaaaa ttaaaattga aatataactg gtttttactt actcccaatt tatactttcg + 10201 tataaaaaaa atgttaaaaa ggagtatata atgtttttag tttttttaat gtttttttgt + 10261 gtatttctat tatttccaat tataactacg ccattcttat taattccaat agtttataga + 10321 tttaagtata gcagatatta tttaatgtta tttgttatag gtatttcctt aattgcgtta + 10381 aggtatattc cgtattttac tgatgatgga gcctatcatt ttaaggctgc atatctgtat + 10441 caattctatg ataatatttt tgactggttt aaaaatttga tgtcaaaaaa cattccaact + 10501 gaatatggat actacaatta tccattattt gcactattgt tatatatatt tagtaaaact + 10561 gggacgtatt cattaattag ttttacagtc attatgattg tttatttctt atatactaaa + 10621 ataatatatg atgttttcca gagatataaa atctctaaaa ttttattttt actagctctt + 10681 ttgacaatga ttgttatagt aaatgtacgg tatacaacca gtggaatgag gtatagttta + 10741 gcggtttctc ttttagtttt cttattttat aaagagatta ataatggatt caaaatcaac + 10801 aaatcaattt ttttttatct cattccggtg ctaattcatt ctagtacggt aatatttgtc + 10861 ttaatgagat tgatgtttcc ttggttaaaa gatatgaaaa tatataagaa attattagta + 10921 ctattttcac taccaccttt aattcaattg tctcctgcac ttcagcacat caatattaat + 10981 tacttatctt ttttgttaga aaaatttgat gtgtatcaga atactacgac atttattact + 11041 ttatttcgta cttcagattt atataatgta tatataggtg tatttatttg tttcttatat + 11101 atatttttct atcatactaa ttttcgtttt caaaaaaacc ataaagtaaa cttatttttc + 11161 tcttttgtac tatacatctg cttattaact ttatcagtat tacctttttt aacgatacta + 11221 gataggttta tttggtttat atatccttta gtgtctattt cgatagttct ttatattgct + 11281 agtgataaaa gcaaagttga aaaagttaga tttaaaggat acaataattt accattttat + 11341 ataattttgt gtttatgttt tattggtggt atgattggaa ataagaaatt ttttgatttt + 11401 ttaagattgt tagattttaa tatatttgat atcttaacta aaaatgtatt tgagtatttt + 11461 tctgatttac 
atcatttttc tttaaatgaa gttagaagac gatagacata ggtgtaattt + 11521 tatttttaag tacaataggt tttaatgagg ccacaataaa aaaatattca agattaatga + 11581 ggattgaaca acatgaaagc tagcgtcttt agacgctagc tggtaatttg gatatatagc + 11641 cttggagcga actatccgtt aggcggatgg ttataattta aataggagtc atatgaaaca + 11701 agcttattta atcatagcac acaataaaat agaacagtta aagtttttac tttcattatt + 11761 agattatgaa aaacatgata tttttatttt atttgataaa aaagtagaaa ttactgataa + 11821 acaaaaaaat gaactaactc aaatagtgac gaaatcaaat atattcttca caagggaaat + 11881 accaatttat tggggagatt attctctagt tgaagcagag atagaacttt ttgaaacagc + 11941 aaataaacaa gaaaattaca gtatgtatca tttgttatcg ggtgtagatt tacctttaga + 12001 tactgcagaa aaaatatata atttttttga tagtagaaaa gaatataatt ttttaacaat + 12061 ggtatcagat gaattatata ttcgaaataa ggtctatgag cgtgtagcgt ttaaaacaat + 12121 acttcctcat ttaacggtaa gaactgtaaa taataatttc ttacggtcgg ttttaaaaat + 12181 ttatagaagg tttgaagttg aactgcaaag aatatttaaa gttgattgtt ttaaaaagtt + 12241 taatttagaa ttgaaatatg cttctaattg gtgttctctt aataaggagg cggtagatat + 12301 actgctagaa gaaaagcaat tgattgctac tatttttaaa aataccaaag taaatgacga + 12361 attatttatt cctacagttt tacagaaaca tcagttattg gatacagttt attcgataga + 12421 accgacaaat gataggccta ctgattttca aggcaatctt cgctatatta attggtggga + 12481 tggaagtcca tatacatgga ctgattcttc tgatgatatt gaacaattga aacgtggcaa + 12541 ggctttaggt cataagtttt ctagaaaatt tgatttagag agaaatccga atctaaaaga + 12601 aaaaattcta acgatcataa ataggacaga ttgatatgaa agtactaaaa aattacgctt + 12661 ataacttctc ttatcagttg ttactcatta tacttcccat cattacaact ccctatgtga + 12721 cacggatatt ttctgcaacg gatctaggaa catatggcta ctttaattct attgttacct + 12781 attttatttt gttagctact ttgggggttg ctagctatgg aactaaggag atttcgagta + 12841 atcgaaaaaa catcccgaag aatttctggg gaatatatac tcttcaattt tgtgcagcat + 12901 cattatcaat tatcttatat actttattgt gtttcggagt tgacgtaatg agaaatcctg + 12961 ttgcttatat attaggaatg agtttgattt ctaaaggact agatatatcc tggctttttc + 13021 agggattgga agatttccgt aagattatag tcagaaatat attagtcaaa ctcgttggtg + 13081 taatttcaat 
atttttattg ataaaatcgg cggatgatct ctatctctat gtttttcttt + 13141 taacgatatt tgagttattg ggacaattaa gtatgtggtt acctgctcaa aagtttattg + 13201 gaaaagcaca ttttgatata gattatacta aatatcattt aaagccaatt cttttattat + 13261 tcctccctca gattgctatt tcactatatg caactttaga ccgtacgatg ttaggaatga + 13321 tatcatctac aaatgatgtc gggatctacg atcaagcatt aaaattgatt aatattctat + 13381 tgactgtagt aacttcttta ggaagtgtca tgttgccgag agtatctaat ctcttggcga + 13441 caggaaatca taaagcagtt aataaaatgc atgagatgtc atttctaatt tataatttgg + 13501 ttatttttcc cattatggca ggaatgttaa ttgtaaatga tgattttgtt aactttttcc + 13561 tcggtaaaga ttttcaagat gcacgttatg cgatagcaat tatgattttt agaatgtttt + 13621 ttattgggtg gaccaatatt atggggtttc aaatgctaat cccacataat aagaataaag + 13681 aatatatggt ctcaacaact gtgcctgcag ttctaagtgt tgccttgaat ttgttatttc + 13741 ttcctaaact cggatatata ggagcggcaa ttgtgtctgt tttaacagag gcgttagttt + 13801 gggggataca gttattctat actcgttctt atttgagaga agttcctatt ttaggttcat + 13861 tgtttaaaat tatagtttca tcgggattta tgtatgtcat tttattattt gtaaaacaag + 13921 tcctaaatgt atcaccgatg ataaatgtgg ggatttatgc tgtttcggga gcaatgattt + 13981 atctcgtatt tattttgatt tttagtgtta taaatccaaa tgagttaaaa caacaattat + 14041 taaaaaataa aggagcataa gatgtacgat tatcttatcg ttggtgctgg tctctttggt + 14101 gcagtctttg cccatgaagc agccttaaaa ggaaaaaaag taaaagttat tgaaaaacga + 14161 aatcatatcg cgggtaatat ctatactcgt gaagaggaag gaattcaggt tcatcaatat + 14221 ggtgctcata tcttccatac ttctgataag gagatctggg agtatgtaaa tcagtttgca + 14281 gagtttaacc gttataccaa ttctcctgtt gcaaactata agggagagat ttataactta + 14341 ccttttaata tgaatacctt caataaactc tggggagttg tgacgccagc agaagcacaa + 14401 gctaagattg atgaacaacg tgctatttta aatggtaaaa ctcctgaaaa tttggaagaa + 14461 caagcgattt ctcttgtagg tacagacatc tacgaaaaat taatcaaaga ctatacagag + 14521 aaacagtggg gcaaaccaac tactgaactt ccagccttta ttattcgccg tttgccagta + 14581 cgtctgacct atgataacaa ctattttaac gatacctatc aagggattcc aattggtgga + 14641 tacactcaaa tagttgaaaa aatgttggat catgaaaata ttgatgtaga aacaaatgtt + 14701 gatttctttg 
tgaataaaga gcaatatctg aaagattttc ctaagattgt ctttactggt + 14761 atgattgatg aattctttga ctataagttg ggcgaactag agtaccgtag tcttcgtttt + 14821 gaaaatgaga ccttggatat ggaaaattac caaggaaatg cagttgtgaa ctatacggat + 14881 gcagaaaccc catatactcg cattattgaa cacaaacatt ttgagtttgg gagtcaaaca + 14941 aagactatca ttactaaaga acattctaaa acatgggaaa aaggtgatga gccttattat + 15001 ccagttaata atgatcgtaa taatcatttg tataaatcat ataaaaaact tgctgatgag + 15061 caagggaatg ttatctttgg tggccgctta ggacactatc gttattacga tatgcaccaa + 15121 gtaattggag cagctttgca gtgcgtgaga aatgagttaa attaatactc aatgaaaatt + 15181 aaagagcaaa ctaggaagct agccacaggt tgctcaaaac actgttttga ggttgcagat + 15241 ggtagctga +// diff --git a/public/res/serotype_genbank/serotype_10F.gb b/public/res/serotype_genbank/serotype_10F.gb new file mode 100644 index 0000000..8b944ae --- /dev/null +++ b/public/res/serotype_genbank/serotype_10F.gb @@ -0,0 +1,806 @@ +LOCUS CR931652 18532 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 34355 (serotype 10f). +ACCESSION CR931652 +VERSION CR931652.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 18532) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 18532) + AUTHORS Bentley,S.D. 
+ TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..18532 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="34355" + /db_xref="taxon:1313" + gene <1..163 + /gene="dexB" + /locus_tag="SPC10F_0001" + CDS <1..163 + /gene="dexB" + /locus_tag="SPC10F_0001" + /codon_start=2 + /transl_table=11 + /protein_id="CAI33096.1" + /db_xref="GOA:Q4K2R1" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K2R1" + /translation="DRRFLVVANLSNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVP + WDAFCVELL" + gene 322..490 + /gene="aliB" + /locus_tag="SPC10F_0002" + /pseudo + CDS 322..490 + /gene="aliB" + /locus_tag="SPC10F_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(488..1009) + /gene="tnp" + /locus_tag="SPC10F_0003" + /pseudo + CDS complement(488..1009) + /gene="tnp" + /locus_tag="SPC10F_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase (fragment)" + gene 1231..2676 + /gene="wzg" + /locus_tag="SPC10F_0004" + CDS 1231..2676 + /gene="wzg" + /locus_tag="SPC10F_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33099.1" + /db_xref="GOA:Q4K2B1" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K2B1" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + 
RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSIGVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGIDINYYVRLNFTSFLKLIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESRGNYKVNSQDLKGTGRMDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1231..1347 + /gene="wzg" + /locus_tag="SPC10F_0004" + /note="Signal peptide predicted for SPC0421 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 39 and 40" + misc_feature 1435..1782 + /gene="wzg" + /locus_tag="SPC10F_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 2.5e-63" + misc_feature 1960..2403 + /gene="wzg" + /locus_tag="SPC10F_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 6.6e-70" + gene 2678..3409 + /gene="wzh" + /locus_tag="SPC10F_0005" + CDS 2678..3409 + /gene="wzh" + /locus_tag="SPC10F_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33100.1" + /db_xref="GOA:Q4K2B0" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K2B0" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTSDVLDKLENNRIPTLNNS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKSKLFGERYKFMKKRAQYFLERDLVHVIASDMHNVDDRPPHMAEAYDLVS + QKYGEAKAQELFIENPRKIVMDQLI" + misc_feature 2681..3289 + /gene="wzh" + /locus_tag="SPC10F_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 2.4e-37" + gene 3415..4110 + /gene="wzd" + /locus_tag="SPC10F_0006" + CDS 3415..4110 + /gene="wzd" + /locus_tag="SPC10F_0006" + /note="member of homology group 2" + /codon_start=1 + 
/transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33101.1" + /db_xref="GOA:Q4K2A9" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K2A9" + /translation="MMKEQNTIEIDVFQLLKTLWKHKLIILLVALVTGAGAFAYSTFI + VKPEYTSTTRIYVVNRNQGDKPGLTNQDLQAGTYLVKDYREIILSQDVLEKVAINLKL + DMPAKALTSKVQVIVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIIAVTRVSDV + TTLEEARPATTPSSPNVRLNTLVAFLGGTVVTVITVLLIELLDTRVKRPEEIEDVLQM + PLLGVVPDLDKMK" + misc_feature 3436..3852 + /gene="wzd" + /locus_tag="SPC10F_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 6.7e-55" + gene 4120..4803 + /gene="wze" + /locus_tag="SPC10F_0007" + CDS 4120..4803 + /gene="wze" + /locus_tag="SPC10F_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33102.1" + /db_xref="GOA:Q4K2A8" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K2A8" + /translation="MPTLEISQVKLELAKKAEEYYNALCTNLQLSGDDLKVFSITSVK + PGEGKTTTSTNIAWAFARAGYKTLLIDADMRNSVMSGVFKPRERITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPIALLQSRNFSTMLETLRKYFDYIVVDTAPVGVVI + DAAIIMQKCDASILVTKAGETKRRDIQKAKEQLEQTGKPCLGVVLNKFDTSVDKYGSY + GSYGNDRKK" + gene 4858..5493 + /gene="wcjG" + /locus_tag="SPC10F_0008" + CDS 4858..5493 + /gene="wcjG" + /locus_tag="SPC10F_0008" + /note="member of homology group 50" + /codon_start=1 + /transl_table=11 + /product="putative initial sugar transferase" + /protein_id="CAI33103.1" + /db_xref="GOA:Q4K2A7" + /db_xref="InterPro:IPR003362" + /db_xref="UniProtKB/TrEMBL:Q4K2A7" + /translation="MKRNSIIYISLKRVMDVLIGLFGTIFTVLPCSLIIYIIYKTKGY + KGSIFFTQYRVGLGEKKFKIIKFRSMVENAEEVLTANKALYEKYINNSYKLPPNEDPR + LTNIGDFIRKTSIDEIPQFINLLFGDMSLIGPRPILENELKEYSKEEQPVLLSVRPGI + TGVWQVSGRSEVYYPERCEMELYYPRNQSFLLDVKIFFLTIKKVLSGEGAH" + misc_feature 4891..5490 + /gene="wcjG" + /locus_tag="SPC10F_0008" + /note="HMMPfam hit to 
PF02397, Bacterial sugar + transferase, score 1.7e-53" + gene 5711..6505 + /gene="wciB" + /locus_tag="SPC10F_0009" + CDS 5711..6505 + /gene="wciB" + /locus_tag="SPC10F_0009" + /note="member of homology group 16" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33104.1" + /db_xref="GOA:Q4K2A6" + /db_xref="UniProtKB/TrEMBL:Q4K2A6" + /translation="MPKKYKIIVATHKRFQMPEDKGLYIPVQVGSEGKENLGYQRDDQ + GNHISHLNPYYCELTGLYWAWKNLECDYLGLVHYRRYFTDRNRPYHDKINMNEVILSA + DQVKELMSEVDVVVPKKRKYYIETLYSHYAHTHDSSHLDVTREIIKEVSPEYLATFDK + VMDCRSGYMFNMFIMDKENVSSYCEWLFPIIDELYRRLDITGYSAFDARLFGRVSERL + FNVWLDCQNLRVKEVPFMYMGKVNLFEKGKSFLKAKYFGKKYGQSF" + gene 6509..7759 + /gene="wzy" + /locus_tag="SPC10F_0010" + CDS 6509..7759 + /gene="wzy" + /locus_tag="SPC10F_0010" + /note="member of homology group 67" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33105.1" + /db_xref="UniProtKB/TrEMBL:Q4K2A5" + /translation="MVLLLLAFAFFLVFPVLSISLSVIGLVNDKKRSKIYLLLISFAI + SIIALRYIPHPTDDGAFHFRATTALIRYDSIFEMFKAFSNGWRVGNYDYGSIPIFTSL + MYFVRNTHHYSLLSFISAFITYFSFGYVVVDLFKDLGKFSKLSYATVFIAVLCLNNYR + YTTSGMRFCMAVALMMLLLYLESKKGYTSLKTTIWYLLPLGIHSAVIYFIGLRFLFPL + IRKVTLAKSLFVLLGFPVLFNLVPWLANLIGWTYLQFFIRKIEVYSDNSSYSQFFNTT + LTMRLYVGIVLMVLFVLLYLGIVNSLKITDDWRFSFVTMTYYVTLLSMSSIPFRNIYD + RNLFLLLPMIVVSTYILFTYRRQLKILTNRNIVYGLTIGILCLSCAVGVFYNNNFPFG + FIDFSKTDLLIKNIFQFFSNLPFT" + misc_feature 6509..6589 + /gene="wzy" + /locus_tag="SPC10F_0010" + /note="Signal peptide predicted for SPC0427 by SignalP 2.0 + HMM (Signal peptide probability 0.934) with cleavage site + probability 0.262 between residues 27 and 28" + gene 7769..8704 + /gene="wcrB" + /locus_tag="SPC10F_0011" + CDS 7769..8704 + /gene="wcrB" + /locus_tag="SPC10F_0011" + /note="member of homology group 87" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="CAI33106.1" + /db_xref="GOA:Q4K2A4" + 
/db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4K2A4" + /translation="MLLFYFLEDYMGLSTVTLFKNLKFSDSKFIKLEGELLLKYQEYL + LKIMEDIVTVCEEEGLYYSLSGGSALGAYRHKGFIPWDDDMDIFMLGSEREIFFQKFS + QKFSDKYWIHNSQTPNYGMPIGRIRQKGTVLRGREDVGVEECGFFIDIFWLENVPNSK + ILRQLHGFLCMAIGLLLSCRNFYKNRQLMLEIMKEHKEVRLVFRIKLILGFLTSFMSL + RQFTRLTERIYSLCKNNESRYLSVPSGRKHYFGEMFTREDMQLTRKLNFEGHKWNVPN + NIEHYLTVMYGDYMKIPVVEDRESHIILEISFPNE" + misc_feature 7931..8629 + /gene="wcrB" + /locus_tag="SPC10F_0011" + /note="HMMPfam hit to PF04991, LICD Protein Family, score + 3.7e-27" + gene 8743..9831 + /gene="wcrC" + /locus_tag="SPC10F_0012" + CDS 8743..9831 + /gene="wcrC" + /locus_tag="SPC10F_0012" + /note="member of homology group 24" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33107.1" + /db_xref="GOA:Q4K2A3" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K2A3" + /translation="MKKIAIVRYNLSKIGGAEKVAINMANELSQYYDVKLLSILLDED + GFINYDVNPNVTLINFHKGDLRIRTATLKLTEKLRDYIKREKIKVIFSITPLTNTMVR + LATLGLNVKIVFCDHHSLEFRDFRSREVQRFVGAKFFDKIVTLTEEDRIKYSDKYNIP + INKVNAIYNWIDEEDFENTPFDNEANKIITVGRFHSQKGYDYLAKVAIKVLSQHPDWQ + WDIYGSGDKLIEQELKRKLEEGCVSSQINFKGNVKGTENIYPNHSIYVMTSRYEGLPL + VLLEAQQYNLPIVSFRCPTGPSEIVEDRINGFLIDCYDVDQMSEKLLELMKNDDLRQS + FSEHAQDNMDKFDKNKILNQWIELIETI" + misc_feature 9256..9768 + /gene="wcrC" + /locus_tag="SPC10F_0012" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 1.6e-38" + gene order(9840..10121,10123..10644) + /gene="wcrD" + /locus_tag="SPC10F_0013" + CDS join(9840..10121,10123..10644) + /gene="wcrD" + /locus_tag="SPC10F_0013" + /note="member of homology group 32" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33108.1" + /db_xref="GOA:Q4K2A2" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K2A2" + /translation="MQECLLTIVMPSYNIQDYISKGIESFQQVHPDYKNKFEVLVVND + RSTDDTALVAEKILAKDSLLDGRVITKENGGHGSTINRGIQEAKGKFFKVLMGMTGLS + 
PSEIEKFLDALETVDVDMVITDFTEQHVNNDTTVRNDFIDKYEIGRIYKGIPDVRIPM + HSVTYKTSILSANKIRLSEKTFYVDIQYTLFPLEYVHSFSYWNYDIYQYYIGRPEQSM + NIESMKRNVSHHLKVTNSVLDYFSKIENEPVLNRVVSETLVYLISLQVV" + misc_feature join(9858..10121,10123..10386) + /gene="wcrD" + /locus_tag="SPC10F_0013" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 8.2e-20" + gene 10742..11695 + /gene="wciF" + /locus_tag="SPC10F_0014" + CDS 10742..11695 + /gene="wciF" + /locus_tag="SPC10F_0014" + /note="member of homology group 25" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33109.1" + /db_xref="GOA:Q4K2A1" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K2A1" + /translation="MFVSIVVPVYNVADYLHYAIESLIKQTYQNFEVILVNDGSTDDS + PLLCEDYAKQYENIHVFHKENGGLSDARNFGVSKASSDWIFFLDPDDYLEEYTLELIV + KIQETHQADLISTKVKATSKYNAYTSYRLQDSDYKDLASITKEKALELMLDDKVATVS + ACAKLYRKCILERVPFPVGKIYEDFYVVAEHLALAERIVISPLETYNYYRREGSIVRS + TFTEKRYDFFEAVAKNEEVVKREYIQIPELKQALQAKKLLGGFVVIGAKADSGLKDFS + KDKELLRVEMSELLKNSKLSWKLKLKYLIFMFSPKLYLLLR" + misc_feature 10751..11266 + /gene="wciF" + /locus_tag="SPC10F_0014" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 5e-45" + gene 11849..13264 + /gene="wzx" + /locus_tag="SPC10F_0015" + CDS 11849..13264 + /gene="wzx" + /locus_tag="SPC10F_0015" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33110.1" + /db_xref="GOA:Q4K2A0" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K2A0" + /translation="MKVLKNYAYNLSYQLLVIILPIITTPYVTRVFSSDDLGTYGYFN + SIVTYFILLATLGVANYGTKVISGHRKEIKKNFWGIYSLQLGATVLSLSLYALLCLTL + PFMQNPVAYILGLSLVSKGLDISWLFQGLEDFRKITVRNITVKLVGVISIFIFVKSAN + DLYLYVFLLTIFELLGQLSMWFPAREFIGSAHFSIEYARHHLKPVILLFLPQVAISLY + ITLDRTMLGALASTKDVGIYDQALKLVNILLILVTSLGSVMLPRVANLLATGEHKAVN + KMHEMSFLIYNLVIFSMMAGILIVNDDFVSFFLGQDFQDARYAIAIMIFRMFFIGWTN + IMGIQILIPHNKNKEFMTSTTAPAIISVGLNLLFLPKFGYIGAAIVSVLTEALVWAIQ + 
LYFTRRYLKEVPIIGSLTKIILASAIMYGILLGLKTVIHFSPIINVIVFAVLGGIIYL + FAILSLKVVDVKELKQIIRKK" + misc_feature 11855..12649 + /gene="wzx" + /locus_tag="SPC10F_0015" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 5.3e-67" + gene 13266..14264 + /gene="wciG" + /locus_tag="SPC10F_0016" + CDS 13266..14264 + /gene="wciG" + /locus_tag="SPC10F_0016" + /note="member of homology group 21" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI33111.1" + /db_xref="GOA:Q4K299" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q4K299" + /translation="MQKNRNISLDLLKVLACIGVILLHTTMGGFKETGSWNLLAYLYY + LGTYSIPLFFMVNGYLLLGKREITYPYILQKVKWILITVSLWNIIVWLFKRDFAVNPI + KKIVGSLLQKGYFFQFWFFGALILIYLCLPVLKTVINSKRKYVYILSLLVAIGFIVEL + ANIFLQMPIQTHVMQTFRLWTWFFYYLLGGYIAQFNVGNLKYRFKNWMKIVSILLLLI + SPIILFFIAKTTYHNLFAEYFYDTLFVKVSTLGIFLTIFTLTLNENRNKWIVFLSNQT + MGVFIIHTYIMKLWERIFGFNFVGAYLLFALFTLSVSFIIVGMLMKIPYFNRIVKL" + gene 14278..15381 + /gene="glf" + /locus_tag="SPC10F_0017" + CDS 14278..15381 + /gene="glf" + /locus_tag="SPC10F_0017" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI33112.1" + /db_xref="GOA:Q4K298" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR006076" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K298" + /translation="MYDYLIVGAGLSGAIFAHEATKRGKKVKVIDKRDHIGGNIYCEN + VEGINVHKYGAHIFHTSNKKVWDYVNQFAEFNNYINSPIANYQGHLYNLPFNMNTFYA + LWGTKTPQEVKDKIAEQTTHMQDVEPKNLEEQAIKLIGTDVYEKLIKGYTEKQWGRSA + TELPPFIIKRLPVRLTYDNNYFNDRYQGIPIGGYNVIIENMLGDVEVELGVDFFANRE + ELEASAEKVVFTGMIDQFFDYQFGELEYRSLRFEHEILDQENYQGNAVVNYTERDIPY + TRIIEHKHFEFGTQDKTVITREYPADWKRGDEPYYPINDAKNNAIYEQYLAEAKKNGR + VIFCGRLADYKYYDMHVTVERALDVVEEELGSI" + misc_feature 14713..15315 + /gene="glf" + /locus_tag="SPC10F_0017" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 5.1e-134" + gene 
15409..16461 + /gene="wcrH" + /locus_tag="SPC10F_0018" + CDS 15409..16461 + /gene="wcrH" + /locus_tag="SPC10F_0018" + /note="member of homology group 51" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33113.1" + /db_xref="GOA:Q4K297" + /db_xref="InterPro:IPR016503" + /db_xref="UniProtKB/TrEMBL:Q4K297" + /translation="MKYYLKDSFLNNEYEKNAGNKARNDVEAILISEGYKGLELKVEN + WYKMNFFKAQQHKYRATKSVFDQLGSGDELLIQFPIIHHTFFISQLIKQAQKRGVKFY + LLIHDVETVRHVGNSAVKLRHKVRNYFQEKAALTSVDGIIVHNDIMKNALTIQGIPSD + KMVSLEIFDYLIPNFEEKNAPQKEGAIIVAGNLIPTKSGYLYNLPEQPAYNLYGAGYD + ESRALKNTTYFGSFMPDDLPVALQGSFGLVWDGDSSETCQGSFGNYLRINNSHKASLY + LASGFPLVVWKESALAHFVLDKQCGIAVASLYDLQKALDDLTDQDYMELSANARQVGV + AIRSGDYLKSAISKLK" + gene complement(order(16634..17218,17272..17940)) + /gene="tnp" + /locus_tag="SPC10F_0019" + /pseudo + CDS complement(join(16634..17218,17272..17940)) + /gene="tnp" + /locus_tag="SPC10F_0019" + /note="member of homology group 13" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1167 transposase" + /db_xref="PSEUDO:CAI33114.1" + misc_feature complement(join(17138..17218,17272..17484)) + /gene="tnp" + /locus_tag="SPC10F_0019" + /note="HMMPfam hit to PF01610, Transposase, score 9.7e-45" + /pseudo + gene 18173..>18532 + /gene="aliA" + /locus_tag="SPC10F_0020" + CDS 18173..>18532 + /gene="aliA" + /locus_tag="SPC10F_0020" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33115.1" + /db_xref="GOA:Q4K296" + /db_xref="InterPro:IPR000914" + /db_xref="UniProtKB/TrEMBL:Q4K296" + /translation="MMKSSKLFALAGVTLLAATTLAACSKSGSSAKAEKTFSYIYETD + PDNLNYLTTGKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKD + AKWYTSEGEEYAAVKAQD" + misc_feature 18173..18265 + /gene="aliA" + /locus_tag="SPC10F_0020" + /note="Signal peptide predicted for SPC0437 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.629 between residues 31 and 32" + misc_feature 18419..18487 + /gene="aliA" + /locus_tag="SPC10F_0020" + 
/note="PS01040 Bacterial extracellular solute-binding + proteins, family 5 signature." +ORIGIN + 1 cgaccgtcgc ttcctagttg tggctaactt gtccaatgaa gagcaagact tgacagtaga + 61 aggaaaagtc aaatctgtct tgattgaaaa caccctagct caagaagtct ttgaaaaaca + 121 aatcctagtt ccatgggatg ctttctgtgt ggaattacta taaatatttt ttgcagaaaa + 181 atttaaaatt gaaatcgtat aaaaacaagg gaggactgta taaaagacag aaatcctttg + 241 ttttttataa ccaaggttta taaactttca ttctcgaaat tcaattaact ttacaaattc + 301 ccactattaa ggagaaagaa gatgaacata aagaagcgtg tccttagtgc aggtctgact + 361 tttgcatctg ctttgctttt agctgcttgc gaccaatcag gttcagatac aaaaacttac + 421 tcatcaacct ttagtggaaa tccaactaca tttaactatc tattagacta ttacgctgat + 481 aatatagtca attgaaacaa gagcaggaca aaagagcctc gtaaaaggta ttgcaacttg + 541 gtaatacctt tttgaggtgc tttttgatat gagcccatgt tttctcaata ggattgtact + 601 caggcgagta gggaggaaga ggtaaaagtt tatgcccaaa ctcttcgcat aaaagttcta + 661 gcttccccat tctatggaat cttacattat ccataataat aaccgatggt gtggttaatg + 721 ttggtaagaa aaacttctga aaccaagctt caaaaaagtc gctcgtcatc atctcttcgt + 781 aagtcattgg agcgattaac tcaccatttg ttagacctgc aaccaaagaa atcctctgat + 841 atcttcttcc agatacttta cctcttatta actgaccttt taatgagcga ccatattctc + 901 gataaaaata agtatcaaat cctgtttcgt caatctaaac aggtgctagg tgctttaaac + 961 tattaaaatt cttaagaaat aaggctactt tttctgggtc ttgttcataa ttagattgaa + 1021 actagaatag tagacctctg cttctaaaac attgttagaa atcgatttga ctgtcctgat + 1081 cgatttgtca tgttcttatt tcattttact atatttttgt ttcgcgggaa gtctactaag + 1141 atacttaaag atgcagatag taaaaaaaat gtagacatta ccgtaaaaaa gtgatataat + 1201 cgtatgatgt tcaaggtata ggtgttaatc atgagtagac gttttaaaaa atcacgttca + 1261 cagaaagtga agcgaagtgt taatatcgtt ttgctgacta tttatttatt gttagtttgt + 1321 tttttattgt tcttaatctt taagtacaat atccttgctt ttagatatct taacctagtg + 1381 gtaactgcgt tagtcctact agttgccttg gtagggctac tcttgattat ctataaaaaa + 1441 gctgaaaagt ttactatttt tctgttggtg ttctctatcc ttgtcagctc tgtgtcgctc + 1501 tttgcagtac agcagtttgt tggactgacc aatcgtttaa atgcgacttc taattactca + 1561 gaatattcaa 
tcggtgtcgc tgttttagca gatagtgata tcgaaaatgt tacgcaactg + 1621 acgagtgtga cagcaccgac tgggactgat aatgaaaata ttcaaaaact actagctgat + 1681 attaagtcaa gtcagaatac cgatttgacg gtcaaccaga gttcgtctta cttggcagct + 1741 tacaagagtt tgattgcagg ggagactaag gccattgtcc taaatagtgt ctttgaaaac + 1801 atcatcgagt cagagtatcc agactacgca tcgaagataa aaaagattta taccaaggga + 1861 ttcactaaaa aagtagaagc tcctaagacg tctaagaatc agtctttcaa tatctatgtt + 1921 agtggaattg acacctatgg tcctattagt tcggtgtcgc gatcagatgt caatatcctg + 1981 atgactgtca atcgagatac caagaaaatc ctcttgacca caacgccgcg tgatgcctat + 2041 gtaccaatcg cagatggtgg aaataatcaa aaggataaat tgactcatgc tggtatatat + 2101 ggggttgatt catccattca taccttagaa aacctttatg gtatagatat taattattat + 2161 gttcgtttga attttacctc atttttgaaa ttgattgact tattgggagg ggtagatgtt + 2221 cataatgatc aagagttttc agctctacat gggaagttcc atttcccagt agggaatgtc + 2281 catctagact ctgagcaggc tctaggtttt gtacgtgaac gctactcact agccgatgga + 2341 gaccgtgacc gtggtcgcaa ccaacaaaag gtgattgtgg ctatccttca aaaattaacg + 2401 tcaaccgaag cactgaaaaa ttatagtacg atcattaata gcttgcaaga ttctatccaa + 2461 acaaatatgc cacttgagac tatgataaat ttggtcaatg ctcagttaga aagtagaggg + 2521 aattataaag taaattctca agatttaaaa ggtacaggtc ggatggatct tccttcttat + 2581 gcaatgccag acagtaacct ctatgtgatg gaaatagatg atagtagttt agctgtagtt + 2641 aaagcagcta tacaggatgt gatggagggt agatgaaatg atagacatcc attcgcatat + 2701 cgtttttgat gtagatgacg gtcccaagtc aagagaggaa agcaaggctc tcttggcaga + 2761 atcctacagg cagggggtgc gaaccattgt ctctacctct caccgtcgca agggcatgtt + 2821 tgaaactcca gaagagaaga tagcagaaaa ctttcttcag gttcgggaaa tagctaagga + 2881 agtcgcgagt gacttggtca ttgcttatgg ggctgaaatt tactacacat cagatgtttt + 2941 ggataagctg gaaaacaatc ggattccgac actcaataat agtcgttatg ccttaataga + 3001 gtttagtatg aacacccctt atcgcgatat tcatagtgcc ttgagtaaaa tattgatgtt + 3061 gggaattact cccgtcattg cccacatcga gcgctatgat gctcttgaaa ataatgaaaa + 3121 acgcgttcga gagctgatcg atatgggctg ttacacgcaa gtaaatagtt cacatgtcct + 3181 caaatccaaa ctttttggag aacggtataa 
attcatgaaa aaaagagcgc agtatttctt + 3241 ggagcgtgat ttggttcatg tgattgcaag tgatatgcat aatgtggacg acagacctcc + 3301 ccatatggca gaagcgtatg accttgtttc ccaaaaatat ggagaagcga aggctcagga + 3361 actttttata gaaaatcctc gaaaaattgt aatggatcaa ctaatttagg agaaatgatg + 3421 aaagaacaaa acacgataga aatcgacgta tttcaattac ttaaaacctt gtggaaacac + 3481 aagctaatca ttttattagt ggcacttgtg acaggggcgg gagcttttgc atatagcact + 3541 tttattgtta agccagaata tacgagcacc acgcgtattt acgtagtcaa ccgtaatcaa + 3601 ggagataagc cgggactgac gaatcaggac ttgcaggcag ggacttatct ggtaaaagac + 3661 taccgcgaaa ttatcctttc gcaggatgta ttggaaaagg tagcgataaa tttgaaattg + 3721 gatatgccag caaaagcgtt aactagcaaa gtgcaagtga ttgtaccagc cgacactcgt + 3781 atcgtctcaa tctctgtcaa ggataaacaa ccagaggaag ccagtcgcat tgctaattct + 3841 ctacgagaag ttgcagcaga aaagatcatc gctgtcacgc gagtatctga tgtaacgacg + 3901 cttgaagaag cgcggccagc tacgactccc tcttctccca atgttcgact caacacctta + 3961 gttgcttttc ttggaggaac cgtcgtaaca gtaattactg ttcttttgat tgagttgctc + 4021 gatacccgtg tgaaacgtcc tgaagaaatt gaagatgtac tgcaaatgcc acttctagga + 4081 gtcgttccag atttggataa aatgaaatag gaggaagtta tgccaacgtt agaaatctca + 4141 caggtgaaat tagaacttgc gaaaaaggca gaggaatatt ataatgcttt gtgcacgaac + 4201 ctacagttaa gtggagatga tttgaaagtg ttttctatta cttctgtgaa accaggagaa + 4261 ggaaaaacaa cgacttccac caatatcgct tgggcttttg cgcgtgcagg ttacaaaacg + 4321 ctgctgattg atgcagacat gcgtaactcc gtgatgtcag gtgtctttaa accaagggaa + 4381 aggattactg gactaacaga atttctatca gggactacag acctgtcaca ggggctttgc + 4441 gataccaata ttgagaatct ctttgtgatt caggctggct ctgtgtcacc aaatccgata + 4501 gcccttcttc aaagtaggaa tttcagtaca atgcttgaaa ccttgcgtaa atattttgac + 4561 tatatcgtcg tagacactgc tcctgtcggc gtcgtgattg atgcggctat cattatgcag + 4621 aaatgtgatg cttctatttt agtgacgaag gcaggtgaaa caaaacgacg ggatattcaa + 4681 aaagcgaaag aacagttgga acaaactggg aagccgtgtt taggagttgt gttgaataaa + 4741 ttcgatactt cagtagacaa atacggttct tatgggagtt atgggaatga caggaaaaaa + 4801 taaaccagtt tatagtagcg aaactaattg agatacttat catgaggagg 
agttaaggtg + 4861 aaaagaaata gcattatcta tattagctta aaacgagtta tggatgttct tattggcttg + 4921 tttggaacaa tattcacagt cttgccctgt tctctaataa tttatattat ttataaaaca + 4981 aaaggttata aagggagtat attttttaca caatacagag tggggttggg agagaaaaaa + 5041 tttaaaatta ttaaatttag atcaatggtt gaaaatgctg aagaagtttt gaccgcaaat + 5101 aaagcactct atgaaaaata tataaataac agttataaat tacctccaaa tgaggatcct + 5161 cgtcttacca acatcggaga ttttataaga aaaacgagta ttgatgaaat tcctcaattt + 5221 ataaacttgt tgtttggaga tatgagtctt attggaccta gaccgatttt ggagaatgag + 5281 ttaaaggagt actctaagga agaacagcca gttttactat ctgtacgacc aggtattaca + 5341 ggggtgtggc aagtttctgg taggagcgag gtatattatc ctgaacgctg tgaaatggag + 5401 ctgtattacc ctcggaacca atccttttta ttagatgtca aaatcttctt tttgacaata + 5461 aaaaaagttc tgtctggaga aggggctcat tgatgtatga gctaaatcat ctagcaaaaa + 5521 aaagatagaa agatgaagtt gaatacgcat aacgtttctt ggatattcgt attcattttc + 5581 tcaagtgaag gaagcattat gaataagtgg atttaatcta gtgttttttg cttgaaaaaa + 5641 tgaatgggaa ttcaatctaa agaattgtcc agttaggcaa gattttagga attggagtta + 5701 ggatgtagaa atgccaaaaa agtataaaat tatagtagcg actcataaaa gatttcaaat + 5761 gccagaagat aagggcttat atattcctgt tcaggttggc agtgaaggaa aggaaaattt + 5821 aggttaccaa cgagatgatc aaggtaatca tatctcacac ctcaatcctt attattgtga + 5881 attgacagga ttatactggg cttggaaaaa tttagaatgt gattacctag gattagttca + 5941 ttaccgacgt tattttacag ataggaaccg accttatcat gataagatta acatgaatga + 6001 agttatccta tcggcagatc aagttaagga gctcatgtct gaagtagatg tcgttgttcc + 6061 caaaaagaga aaatattata tagaaactct ctattctcat tatgctcata ctcatgattc + 6121 cagtcattta gatgtaacac gagaaattat aaaagaggtt tcgccagaat atttagcaac + 6181 atttgacaag gtgatggact gtcgtagtgg ctacatgttc aatatgttta tcatggacaa + 6241 agaaaatgta tcatcttatt gtgagtggtt gttccctatc attgatgagt tgtacagaag + 6301 attggatata acaggatact ctgcttttga tgcaagacta tttggacgtg ttagtgagcg + 6361 tctctttaat gtttggttag attgccaaaa tctacgtgtt aaagaagttc cgtttatgta + 6421 tatgggaaaa gtgaatttat ttgagaaggg caaatccttc ttgaaagcta agtatttcgg + 6481 aaaaaaatat 
ggacagagtt tttaaattat ggttttgtta ttacttgctt ttgcattctt + 6541 tttagttttc cctgtgttgt caataagttt aagtgttata gggctagtaa atgacaaaaa + 6601 gcgttcaaaa atctatttac tactaattag ttttgcaata tcaattattg cgctgcgtta + 6661 tattcctcat cctacggatg atggcgcttt tcattttcgt gcgactactg cccttattcg + 6721 ctatgatagt attttcgaaa tgtttaaagc attttctaat gggtggagag tagggaacta + 6781 tgactatggc tccataccaa tttttacctc attaatgtat tttgttcgca acacccatca + 6841 ctatagttta ctgagtttta tttcagcttt cataacttac tttagttttg gttacgtagt + 6901 tgttgactta tttaaggatt tgggcaagtt ttctaaacta tcgtatgcta cagtatttat + 6961 tgctgtacta tgtttaaata attacagata tacaactagt ggaatgagat tttgtatggc + 7021 agttgccttg atgatgcttt tactatattt ggagtcaaaa aaaggctata ctagtttaaa + 7081 aacaactatt tggtatttgt taccattagg tatccattca gcggttattt attttattgg + 7141 tttaaggttc ttatttccat taattaggaa agtgacactc gctaaaagtt tatttgtatt + 7201 attaggtttt cctgttttgt tcaacctagt tccatggtta gcaaatctga ttggttggac + 7261 ttacttacaa ttttttattc gaaaaattga agtctactct gacaattcat cctattccca + 7321 gttttttaat accacattaa caatgaggct atatgttgga atagtactga tggttttatt + 7381 tgtattgtta tatttgggaa tagtaaattc attgaaaata actgatgatt ggcgttttag + 7441 ttttgttaca atgacatatt atgtaactct gttatctatg agttcaatac catttcgtaa + 7501 tatttatgat agaaatcttt tcttgctcct tcctatgatt gtagtttcaa cctacatatt + 7561 atttacatat agacgtcaat tgaaaattct tactaatcgt aatattgttt atggactgac + 7621 gataggtatt ctttgtctat cctgtgcagt tggtgtattt tataataata atttcccttt + 7681 tggttttatt gattttagta aaacggattt actcataaaa aatatttttc aattcttttc + 7741 aaatttacct tttacgtaat aagactatgt gctattattt tattttttgg aggattatat + 7801 gggactatct accgtgacat tatttaaaaa tttaaagttc tcagatagta aatttattaa + 7861 attggaggga gagcttcttc ttaaatatca agagtattta ttaaaaatca tggaagatat + 7921 tgtaacagta tgtgaggaag aaggattata ttattcactt tctggtggta gtgcactagg + 7981 ggcttatcga cacaaaggat ttattccatg ggatgatgat atggacatat ttatgctagg + 8041 aagtgagcgg gagattttct ttcaaaaatt ctctcaaaaa ttttctgata aatattggat + 8101 acataattca caaacaccaa actatggtat 
gcctattggt cgtatcagac aaaaaggaac + 8161 agttttacgt ggtcgagagg atgtcggagt tgaagaatgt ggatttttta ttgatatttt + 8221 ttggcttgaa aatgttccta attcaaaaat attgagacaa cttcacggct ttctctgcat + 8281 ggcgattgga ttgttactat catgtagaaa tttttataaa aatcgtcagc tgatgctgga + 8341 gattatgaag gaacataaag aagtaaggct tgtttttcga ataaaactaa ttttagggtt + 8401 tctaactagt tttatgtctt tgagacaatt tacaagactt acggaaagga tctactcatt + 8461 gtgcaagaat aatgaatcaa gataccttag cgttccttca ggaagaaaac attattttgg + 8521 cgagatgttt acaagagaag atatgcagtt aactaggaaa ctaaattttg aaggacataa + 8581 gtggaatgtt ccaaataata ttgagcatta tttaactgta atgtacggtg attatatgaa + 8641 aatacctgta gttgaagata gggaatcaca tatcatttta gaaatttcct tccctaacga + 8701 gtaaacagta ctttcatttt ttatatgtaa ggaattaatt taatgaaaaa aatagcaatt + 8761 gttagatata atctaagtaa aattggtgga gcggaaaaag tagctattaa tatggctaat + 8821 gaattgtcac aatactatga tgtaaaattg ttatcaattc tattggatga agatggtttt + 8881 ataaattatg atgttaatcc taatgtgaca ttaataaatt ttcacaaggg tgatcttaga + 8941 attagaactg ctacattaaa attaacggag aaattaaggg attatattaa aagagaaaaa + 9001 attaaagtga ttttttctat aaccccatta acaaatacta tggttagatt agctactcta + 9061 ggattaaatg tgaaaatagt tttctgtgat caccatagct tagaatttcg tgattttaga + 9121 agtagggaag tgcagagatt tgtaggagct aaattttttg acaagatcgt cactttaaca + 9181 gaagaagata gaatcaaata ctccgataaa tataatatac ctataaataa agtaaatgct + 9241 atttataatt ggattgatga agaagatttt gaaaatactc catttgataa tgaggcaaat + 9301 aaaataataa cggtaggtcg atttcatagt caaaaggggt atgattatct tgccaaagta + 9361 gctataaaag tattatcaca acatccagac tggcagtggg atatatatgg ttcaggggat + 9421 aaacttattg aacaggagct aaaaagaaaa ctagaagaag gctgtgtttc ttcacaaatt + 9481 aatttcaaag gaaatgtaaa gggaactgaa aatatttatc ccaatcatag tatctacgtc + 9541 atgacttctc gctatgaggg cttaccttta gttctattag aagctcaaca atacaatctt + 9601 cctattgtta gctttagatg tccgacggga cctagtgaga ttgttgaaga tagaatcaac + 9661 ggatttctga ttgattgcta tgacgtggat cagatgagtg agaaattact tgaattgatg + 9721 aaaaatgatg atttgcgaca atctttctca gaacatgccc aagacaatat 
ggataaattt + 9781 gataaaaata aaattctcaa ccagtggata gaattaattg agacaattta ggagacaaga + 9841 tgcaagagtg tttattgaca attgtaatgc ctagttataa tattcaggac tatatttcca + 9901 aaggaatcga gtcattccag caagtacacc cggattataa aaataaattt gaagtactgg + 9961 ttgtcaatga tagaagtaca gacgatacgg ctttagtagc agaaaaaata ttagccaaag + 10021 attcgttgct ggatggccgt gtcattacaa aagaaaacgg cggtcatggt tcgacaatca + 10081 atcgcggtat tcaagaagca aagggaaaat tttttaaagt gattgatggg gatgactggg + 10141 ttatccccat cagaaattga aaagttctta gatgctcttg aaactgttga tgtggatatg + 10201 gtgattacag attttacaga gcagcatgtc aataacgata ctacagtacg aaatgacttt + 10261 attgacaagt atgaaattgg tagaatctat aaggggattc ctgatgtaag aattcccatg + 10321 cattcagtta catataaaac atctatcttg tcggcgaata aaattcgttt aagtgaaaaa + 10381 acattttatg ttgacattca gtacacactc tttcctttgg agtatgttca tagtttcagt + 10441 tattggaatt atgatattta tcaatactac ataggtagac cagagcaaag tatgaatatt + 10501 gagagtatga agcgaaatgt aagtcatcat ctaaaggtaa cgaattctgt actagattat + 10561 ttttcaaaaa ttgaaaatga acccgtttta aaccgagtag tttctgaaac cttagtttat + 10621 ctcatcagtt tgcaggttgt ctaacttaaa ttataggact agctttgctt tgggaataaa + 10681 ttttaatccg atttggaata aatactctaa aaaaaaaaag aaaaagagag aggtatttag + 10741 gatgtttgtc agcatcgttg ttccggttta taatgttgca gactatctgc attatgcgat + 10801 agaaagctta attaaacaga cctatcaaaa ctttgaggta atccttgtaa atgatggttc + 10861 tacagatgat tctcctctat tatgcgaaga ttatgcaaag caatatgaaa atatccatgt + 10921 tttccacaaa gaaaatggtg ggttatctga tgcgcgtaac tttggagttt ctaaagcgag + 10981 ttcagattgg attttctttt tagatccgga tgattatctt gaagaatata ctctagagtt + 11041 aatcgtgaaa attcaggaaa cacatcaagc agacttgatt tcaacaaagg taaaagctac + 11101 ttcaaaatat aatgcttata cttcttatcg attgcaagac tcagactata aagatttggc + 11161 ttcgattaca aaagaaaagg ctctggaact aatgttggat gacaaagttg caacggtttc + 11221 tgcttgtgct aagctttatc ggaaatgcat cttggaacgc gttccatttc cagtcgggaa + 11281 gatctatgag gatttttatg ttgtagcaga acatcttgcc ttagctgaaa gaatcgtgat + 11341 cagtccactt gaaacctaca attactatcg tagggaaggg agtattgttc 
gttcaacatt + 11401 tactgaaaaa agatatgatt tctttgaagc tgttgcaaaa aatgaggaag ttgttaaaag + 11461 agagtacatt cagattccag aattaaagca agctttgcaa gctaagaaat tattaggtgg + 11521 ttttgtagta attggtgcaa aagctgactc aggcttaaaa gatttttcaa aagataaaga + 11581 gttgttgaga gtcgaaatga gcgagttatt aaaaaatagt aagttatcat ggaaactaaa + 11641 actaaaatat cttattttta tgtttagccc taaattgtat ttgttgctac gatagtatga + 11701 tacatagatc caatttaatt tgcaacaggt gtcaaaaaat tgtaggaaag agggaatatg + 11761 aaagaagtgt ttagaagaat tgcccattat aaatctgttc gttcacgatt tttaatgtct + 11821 ctggttgatt ataatagggc gggttgaaat gaaagtatta aaaaactacg cctacaatct + 11881 ttcttatcaa ttgttggtga ttatacttcc gattattacg actccctatg taacacgggt + 11941 cttttcttcg gatgatttag ggacgtatgg atactttaat tccattgtta cttattttat + 12001 cctcttggcg acactaggag ttgctaacta tgggaccaag gtcatttcag ggcatcgcaa + 12061 ggaaattaaa aaaaactttt ggggtatcta ctctctacaa ttaggggcaa cagttctttc + 12121 tctgtcttta tatgctcttc tttgtctgac ccttcccttt atgcaaaatc cggtagccta + 12181 cattctaggc ttgagtttag tttcaaaagg tttagacatt tcctggctct ttcaagggct + 12241 agaagatttt cgaaagatta ctgttcgaaa tatcacagtt aaactcgttg gagtcatttc + 12301 aatctttatc tttgtcaaat ctgcaaatga cctatatctc tatgtttttt tgctaaccat + 12361 atttgaactt ttggggcaac taagtatgtg gttccctgct cgggagttta tcggtagtgc + 12421 tcattttagc atagaatatg ctaggcatca tttaaagccg gtcatattat tattccttcc + 12481 tcaagtagct atttctttgt acattacgct ggatcgtacc atgcttggag cactggcgtc + 12541 tacaaaagat gtagggatct atgatcaggc acttaagttg gtaaatatcc ttctgatttt + 12601 ggtaacttcc ttgggaagcg ttatgttgcc tcgtgttgcg aatttgttag cgacaggtga + 12661 acacaaagcg gttaacaaaa tgcatgagat gtccttcctc atttataatt tagtgatttt + 12721 ctcaatgatg gcaggaattt tgattgtgaa tgatgatttt gttagctttt tccttgggca + 12781 ggattttcag gatgcacgtt atgcaattgc cattatgatc ttccgtatgt tctttatcgg + 12841 ttggaccaat atcatgggaa ttcagatttt aattccccat aataaaaata aagaattcat + 12901 gacttcaaca acagctcccg caattatcag tgtaggtttg aacttactat tccttcctaa + 12961 atttggatat atcggagcag ccattgtttc tgttttgaca gaggcgttgg 
tatgggcgat + 13021 acaattatac tttacccgta gatacctaaa agaagttccg attatcggat ctttgacaaa + 13081 aattattcta gcttcagcta tcatgtatgg tatcttgcta ggtttaaaaa cagttataca + 13141 tttttcacca atcataaatg ttatagtatt tgcagtgctt ggtggaatca tttatctttt + 13201 tgcaattcta tctttgaaag tggtagatgt aaaagaatta aaacaaatta ttaggaaaaa + 13261 atagaatgca aaaaaatagg aatattagcc tagatttatt aaaagtgctt gcgtgtattg + 13321 gggtcatttt actccataca acaatgggtg gatttaaaga gacaggatca tggaatcttt + 13381 tggcatattt atattattta ggtacctact ccattccctt gttttttatg gtcaatggtt + 13441 atttattgtt aggcaaaagg gaaataactt atccttacat acttcaaaaa gtcaaatgga + 13501 ttctaataac agtgtcatta tggaacatta tcgtttggct ttttaaaaga gactttgcgg + 13561 ttaatccaat taaaaaaatt gtaggctctc tgttacaaaa agggtatttc tttcagtttt + 13621 ggtttttcgg tgccttgata ctgatttatt tatgtttgcc tgttttgaaa acagttataa + 13681 attcaaaaag aaaatatgta tacattctat ctttattggt ggcaattggg tttatagttg + 13741 aattagcaaa tattttcctt cagatgccta tacaaactca tgttatgcaa acttttagat + 13801 tatggacttg gtttttctac tatcttttag gtggttatat agcacaattc aatgtaggca + 13861 acctcaaata tagatttaaa aattggatga aaatagttag catacttttg ttattgattt + 13921 caccaataat attattcttc atagcgaaga ctacatatca taatctattt gctgaatatt + 13981 tttatgatac tttatttgta aaagtcagta ctctaggaat ttttctaact atcttcacgc + 14041 ttacgttgaa tgaaaaccga aacaaatgga ttgttttcct ttctaatcaa acaatgggag + 14101 ttttcataat acacacttat attatgaaat tgtgggaaag aatatttggt tttaattttg + 14161 taggagcata tttacttttt gctctattta ctttgagtgt tagttttatt attgttggaa + 14221 tgttaatgaa gattccttac ttcaatcgaa tcgtcaaatt ataaaaagga gaacactatg + 14281 tacgattatc ttatcgtcgg tgctggtttg tctggagcaa tctttgcaca cgaagctaca + 14341 aaacgtggaa aaaaagttaa agtgattgac aagcgtgacc acatcggtgg aaatatctac + 14401 tgtgaaaatg ttgagggcat caatgtccac aagtatggtg cccacatttt ccatacttcc + 14461 aataaaaaag tgtgggacta tgtcaatcaa ttcgctgagt ttaacaacta tatcaattcc + 14521 cctatcgcca actatcaagg gcacctttac aatctgcctt tcaatatgaa cactttctac + 14581 gccttgtggg gaacaaagac accccaagaa gtcaaggaca agattgctga 
gcagacgact + 14641 catatgcaag atgttgagcc aaaaaaccta gaggaacaag ccattaagtt gattggtacg + 14701 gatgtctatg aaaagctgat taagggctat actgagaaac aatggggacg ttctgctact + 14761 gagctgccac cctttatcat caagcgtttg ccagttcgat tgacctatga taacaattat + 14821 ttcaacgacc gctaccaagg aattcctatt ggtggttaca atgtcatcat tgaaaatatg + 14881 cttggcgatg tggaagttga gcttggtgtt gatttctttg ccaatcgtga agagttagaa + 14941 gcatcagctg aaaaagttgt cttcacaggg atgattgatc agttctttga ctatcagttt + 15001 ggtgaactag agtatcgcag tcttcgtttt gaacatgaga ttctggacca agaaaactat + 15061 caaggaaatg ctgtagtcaa ctatactgaa cgtgatatac cttatacgcg tatcatcgag + 15121 cacaaacatt ttgagtttgg gacccaggac aagaccgtta ttactcgtga atatccagca + 15181 gattggaaaa gaggggatga accctactat ccaatcaatg atgctaaaaa caatgcaatc + 15241 tatgaacagt atctagcaga agccaagaaa aatgggcgcg tgatcttttg tggtcgcttg + 15301 gcagattata aatactatga tatgcatgtg acggttgaac gtgcattgga tgtggtagaa + 15361 gaagaactag ggagtatcta agaacatcac agataaagga gagaaaaggt gaaatattat + 15421 ctgaaggatt catttctgaa taatgaatac gaaaagaatg caggaaataa ggcacgaaat + 15481 gacgtggaag ctattctaat ctcagagggg tataagggat tggaactcaa ggttgagaat + 15541 tggtataaga tgaatttctt taaagctcag caacacaaat atcgggcaac caagtctgtg + 15601 tttgatcagt tgggatctgg agatgaattg ctgattcagt tcccgattat ccaccataca + 15661 tttttcattt cgcaactcat caagcaggct caaaaaagag gagttaaatt ctatctgttg + 15721 atccatgatg ttgaaaccgt gcgtcatgta ggaaattcag cagtgaaact tcgtcataaa + 15781 gtgagaaatt acttccaaga gaaggcagct cttacatcag tggatggcat tatcgttcat + 15841 aatgatatca tgaaaaatgc cttgacaatc caaggcatac catcagataa aatggttagc + 15901 ttggagattt ttgactatct gattcctaac tttgaggaaa aaaatgctcc ccaaaaagag + 15961 ggagcgatta tcgtcgccgg aaatctaatt ccaacaaaat caggctatct ttataatttg + 16021 ccagaacagc cagcttacaa cttgtatgga gcgggttacg atgaaagtcg tgcattgaaa + 16081 aacacgacct actttggttc ctttatgcca gatgacctcc cagttgctct tcaaggtagt + 16141 tttggtttgg tgtgggatgg ggatagttca gaaacttgcc aaggttcttt cggaaattac + 16201 ctacgtatta acaattcgca caaggcttct ctttatttgg cttcgggctt 
tcctctggtg + 16261 gtttggaaag agtctgccct tgcgcatttt gtgctagata agcagtgtgg tatagcggtt + 16321 gcttctctat atgacctcca aaaggcacta gacgatttga cagatcaaga ttacatggaa + 16381 ctgtcggcta atgccagaca agtaggagta gcgattcgaa gtggagatta tctgaaatcg + 16441 gccatttcta aattgaagta agaatgctaa atttcaagtt caagttagcc agcaatcaaa + 16501 aattctctgg gagacttgta gtccaagcat tttttaggat agttattgat ccacttttcg + 16561 atgaaggcgg cttctttagg agtcgttttc ttagttcctt ggctctttgt caactgtagt + 16621 gggttgaagt cagctaagct cgagaaagga caaattttgt cctttctttt ttgatattca + 16681 gagcgatgaa aatccgtttt ttgaagtttt caaagtttcg aaaaccaaag gcattgcgct + 16741 tgataagttt gatgagatta ttggtcgctt ccagtttggc attagaatag tgtagttgaa + 16801 gggcgttgac aatcttttct ttatctttga ggaaggtttt aaagacagtc tgaaaaatag + 16861 gatgaacctg cttaagattg tcctcaataa gcccgaaaaa tttctctggt tccttattct + 16921 ggaaatgaaa aagcaagagc tgatagagtt tatagtggtg tttcaagtct tccgaataac + 16981 tcaaaagctt gtttaaaatc tctttattgg ttaagtgcat acgaaaagta ggacgataaa + 17041 atcgcttatc actcagttta cggctatcct gttgaatgag tttccagtag cgcttgatag + 17101 ccttgtattc atgggatttt cgatgaaact gattcatgat ttgaacacgc acacgactca + 17161 tagcacggct aagatgttgt acaatgtgaa agcgatcaag aacgatttta gcattcggga + 17221 gtgaaacagt ctgggagact gtttcagcct gagcctagaa atttgaaagc gaagctgttt + 17281 agccaagtca tagtaaggac taaacatatc catagtaata attttcactt gacatcggac + 17341 ggctctatca tatttaagaa agtgatttcg aatgacagct tgtgttcttc cctcaagaac + 17401 agtgatgata ttgagattgt taaaatcttg cgcaatgaag ctcatctttc cctttgtaaa + 17461 agcatactca tcccaagaca taatctcagg aagacaagaa aaatcatgtt taaagtgaaa + 17521 gtcattgagc ttacgaataa cagttgaagt tgagatggaa agctgatggg caatattagt + 17581 catagaattc ttttcaatta acttttgcgc aatcttttgg ttgatgatac gagggatttg + 17641 gtgattcttc ttgacgatag aagtttcagc gaccatcatt tttgaacagt gatagcactt + 17701 gaatcgacgc tttctaagga gaattctagt aggcatacca gttgtctcaa ggtaaggaat + 17761 cttagacggt ttttgaaagt catatttctt catttgactt ccgcactcag ggcaagatgg + 17821 ggcgtcgtag tccagtttgg cgatgatttc tttgtgtgaa tccctattga 
cgacatctat + 17881 aatttggata tttgtgtctt taatgtctag taattttgtg ataaaatgta attgtttcat + 17941 atgattcttt ctaatgagtt gttttgtcgc ttttcattat aggtcatatg ggactttttt + 18001 tctacacaaa aataggctcc ataatatcca taggggattt acccattaca aatattatag + 18061 agcccttttt gttttttttc agaatttacc aaattaatta aaaaattcag aaaattctat + 18121 tgacatctct ctgaaaagag tctataatag agagaaagtt ttaaaggaga agatgatgaa + 18181 aagttcaaaa ctatttgccc ttgcgggtgt aaccttattg gcggcgacta ctttagctgc + 18241 atgttctaaa tcaggttcga gcgctaaagc tgagaagaca ttctcataca tttatgaaac + 18301 ggatcctgac aacctaaact acttgacaac tggtaaggct gcgacagcaa atattaccag + 18361 taacgtggtt gatggtttgc tagaaaatga tcgctacggg aactttgtgc cgtctatggc + 18421 tgaggattgg tctgtatcca aggatggatt gacttacact tatactatcc gtaaggatgc + 18481 aaaatggtat acttctgaag gtgaagaata cgcggcagtc aaagctcaag ac +// + diff --git a/public/res/serotype_genbank/serotype_11A.gb b/public/res/serotype_genbank/serotype_11A.gb new file mode 100644 index 0000000..4a733aa --- /dev/null +++ b/public/res/serotype_genbank/serotype_11A.gb @@ -0,0 +1,815 @@ +LOCUS CR931653 17948 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 1813/39 (serotype 11a). +ACCESSION CR931653 +VERSION CR931653.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 17948) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 17948) + AUTHORS Bentley,S.D. 
+ TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..17948 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="1813/39" + /db_xref="taxon:1313" + gene <1..137 + /gene="dexB" + /locus_tag="SPC11A_0001" + CDS <1..137 + /gene="dexB" + /locus_tag="SPC11A_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI33116.1" + /db_xref="GOA:Q4K295" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K295" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQVLAPWDAFCVEMTD + " + gene complement(215..2380) + /gene="tnp" + /locus_tag="SPC11A_0002" + /pseudo + CDS complement(215..2380) + /gene="tnp" + /locus_tag="SPC11A_0002" + /note="member of homology group 17; + possible fusion of 2 transposases" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1202/IS663 fusion transposase" + /db_xref="PSEUDO:CAI33117.1" + misc_feature complement(248..946) + /gene="tnp" + /locus_tag="SPC11A_0002" + /note="HMMPfam hit to PF01609, Transposase DDE domain, + score 2.2e-12" + /pseudo + misc_feature complement(1394..1897) + /gene="tnp" + /locus_tag="SPC11A_0002" + /note="HMMPfam hit to PF00665, Integrase core domain, + score 2e-21" + /pseudo + gene 2556..4001 + /gene="wzg" + /locus_tag="SPC11A_0003" + CDS 2556..4001 + /gene="wzg" + /locus_tag="SPC11A_0003" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33118.1" + /db_xref="GOA:Q4K240" + /db_xref="InterPro:IPR004190" + 
/db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K240" + /translation="MSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGIDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIIDSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDLPSY + AMPDSNLYVMEINDSSLASVKTAIQDVLEGR" + misc_feature 2556..2672 + /gene="wzg" + /locus_tag="SPC11A_0003" + /note="Signal peptide predicted for SPC0440 by SignalP 2.0 + HMM (Signal peptide probability 0.993) with cleavage site + probability 0.538 between residues 39 and 40" + misc_feature 2760..3107 + /gene="wzg" + /locus_tag="SPC11A_0003" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 2.3e-64" + misc_feature 3285..3728 + /gene="wzg" + /locus_tag="SPC11A_0003" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 1.1e-69" + gene 4003..4734 + /gene="wzh" + /locus_tag="SPC11A_0004" + CDS 4003..4734 + /gene="wzh" + /locus_tag="SPC11A_0004" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33119.1" + /db_xref="GOA:Q4K239" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K239" + /translation="MIDIHSHIVFDVDDGPKSREESKALLTEAYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKNRIPTLNNS + RYALIEFSMNTPYRDIHSALIKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKSKLFGERYKFMKKRAQYFLERDLVHVIASDMHNVDSRPPHMAEAYDLVS + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 4006..4614 + /gene="wzh" + /locus_tag="SPC11A_0004" + /note="HMMPfam hit to PF02811, PHP domain, score 6.8e-38" + gene 4743..5435 + /gene="wzd" + 
/locus_tag="SPC11A_0005" + CDS 4743..5435 + /gene="wzd" + /locus_tag="SPC11A_0005" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33120.1" + /db_xref="GOA:Q4K238" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K238" + /translation="MKEQNTIEIDVFQSLKTLWKYKLIILLVALVTGAGAFAYSTFIV + KPEYTSTTRIYVVNRNQGDKPGLTNQDLQAGTYLVKDYREIILSQDVLEKVATNLKLD + IPAKTLTSKVQVTVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIIAVTRVSDVT + TLEEARPATTPSSPNVRRNTLVGFLGGAAVTVITVLLIELLDTRVKRPEDVEDVLQMP + LLGVVPDFDKMK" + misc_feature 4761..5177 + /gene="wzd" + /locus_tag="SPC11A_0005" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 4.7e-51" + misc_feature 5283..5360 + /gene="wzd" + /locus_tag="SPC11A_0005" + /note="PS00217 Sugar transport proteins signature 2." + gene 5445..6134 + /gene="wze" + /locus_tag="SPC11A_0006" + CDS 5445..6134 + /gene="wze" + /locus_tag="SPC11A_0006" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33121.1" + /db_xref="GOA:Q4K237" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K237" + /translation="MPTLEISQVKLELAKKAEEYYNALCTNLQLSGDDLKVFSITSVK + AGEGKTTTSTNIAWAFARAGYKTLLIDADMRNSVMSGVFKSRERITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLGTLRKYFDYIVVDTAPIGIVI + DAAIIMQKCDASILVTKAGETKRRDLQKAKEQLEQTGKSCLGVVLNKFDTSVEKYGSY + GSYGNYRKQKK" + gene 6149..7510 + /gene="wchA" + /locus_tag="SPC11A_0007" + CDS 6149..7510 + /gene="wchA" + /locus_tag="SPC11A_0007" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI33122.1" + /db_xref="GOA:Q4K290" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + 
/db_xref="UniProtKB/TrEMBL:Q4K290" + /translation="MSEKLAKPSVAIVQSFLVILLTYLLSAVRETEIVSTTAIVLYIL + HYFVFYISDYGRNFFKRGYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYF + LLLHVFLVYVLNLFIKWYWKRAYPNFKGSKKVFLLTATSHVEKVLDRLIESNEVVGEL + VAVSVLDKPDFQHDYLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + IDVTVNLNAFDWARNKQIREMAGLNVVTFSTTFYKTSHMIAKRIIDIVGSLVGLILCG + LVSIVLVPLIRKDGGSAFFAQTRIGKNGRHFTFYKFRSMCVDAEDKKRELMEQNTMQG + GMFKVDDDPRITKIGHFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPEQK + RRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVLMKD + GAK" + misc_feature 6926..7507 + /gene="wchA" + /locus_tag="SPC11A_0007" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 1.5e-157" + gene 7514..7963 + /gene="wchJ" + /locus_tag="SPC11A_0008" + CDS 7514..7963 + /gene="wchJ" + /locus_tag="SPC11A_0008" + /note="member of homology group 26" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase enhancer" + /protein_id="CAI33123.1" + /db_xref="GOA:Q4K235" + /db_xref="InterPro:IPR013969" + /db_xref="UniProtKB/TrEMBL:Q4K235" + /translation="MKICLVGSSGGHLTHLYLLKPFWKDKERFWVTFDKEDTRSILGN + ETFYPCHYPTNRNLKNLIKNTVLAFNILRKERPDVIISSGAAVAVPFFYLGKLFGAKT + VYIEVFDRIDAPTLTGKIVYPVTDKFIVQWEEMKKVYPKAINLGGIF" + gene 7963..8442 + /gene="wchK" + /locus_tag="SPC11A_0009" + CDS 7963..8442 + /gene="wchK" + /locus_tag="SPC11A_0009" + /note="member of homology group 27" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33124.1" + /db_xref="GOA:Q4K234" + /db_xref="InterPro:IPR007235" + /db_xref="UniProtKB/TrEMBL:Q4K234" + /translation="MIFVTIGTHEQQFNRLIKEVDRLKGEGFIQDDVFIQTGFSDYEP + VYCQWKNLISYDEMNRYIDEANIIITHGGPATFMAVIAKGKIPIVVPRLKKFGEHVND + HQMEFCSKILSEGYELSLINDISELQYSLKQEKKTKFYSNNTCFLKKLSKTIEDLIV" + misc_feature 7963..8433 + /gene="wchK" + /locus_tag="SPC11A_0009" + /note="HMMPfam hit to PF04101, Glycosyltransferase family, + score 8.7e-47" + gene 8684..9781 + /gene="wcyK" + /locus_tag="SPC11A_0010" + CDS 8684..9781 + /gene="wcyK" + 
/locus_tag="SPC11A_0010" + /note="member of homology group 116" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33125.1" + /db_xref="GOA:Q4K233" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K233" + /translation="MKILHIPTGGLFSDGIGTFIYSYLEYMDLNKYDVTILATNSPLK + SDKEKFECLGVKVIEIERKKSNLSKYVYKLKKIIKKEKFDIIHVHGSSALMSIELLTA + KVAGIPVRIAHSHNTTCEHHKLDKLLRPIFYRVYTQACACSVSAGQWLFEEKNYKIIH + NARDVNRYQYDAIKRKKLREELLLSDETIALGHVGRFNTQKNQCFLVSLMEKLVIKNI + DIKLFLVGTGDTLEEIKKLVIQKKLEDNIVFLGQFDDMKSFVSSMDIMLLPSLYEGLP + LVSVEWQINGVESILSDRVTQECIYTGTVQQLSIDSMELWEKEILNLSTSDRERVSLQ + NIQLIKNAGYDISLEVKEIEELYNSLYDIAN" + misc_feature 9206..9697 + /gene="wcyK" + /locus_tag="SPC11A_0010" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 1.1e-18" + gene 9782..10462 + /gene="wcwC" + /locus_tag="SPC11A_0011" + CDS 9782..10462 + /gene="wcwC" + /locus_tag="SPC11A_0011" + /note="member of homology group 48" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI33126.1" + /db_xref="GOA:Q4K286" + /db_xref="InterPro:IPR015037" + /db_xref="UniProtKB/TrEMBL:Q4K286" + /translation="MKGKSFLLKMLQNLKPIKRKLKPIKRTYKRIVYSITKSNMRKRL + KNTDFSIISDNCWGGRVYEELGLPYRTPFIGLYIFSEDYVKLLKNFRKYMEYELTFTN + NSKWNTEYDGEYPIGILKDIELHFLHYANQEEAYEKWNKRKNRINYENIFFKMNDDNK + CSLKLLKEFDTLDLKNKIIFAAFNYKELDNLIHFTNPRGNGNVGTDLFYYDQYFDVVN + WLNGETQT" + gene 10459..11181 + /gene="wcrL" + /locus_tag="SPC11A_0012" + CDS 10459..11181 + /gene="wcrL" + /locus_tag="SPC11A_0012" + /note="member of homology group 54" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33127.1" + /db_xref="GOA:Q4K285" + /db_xref="InterPro:IPR007577" + /db_xref="UniProtKB/TrEMBL:Q4K285" + /translation="MIPKKIHYCWFGGKPLSNDVKRCIASWKKFCPDYEIIEWTEKNF + CIENQNQFVQDAYRDKAWAFVSDYARLKIIYENGGIYLDTDVEVIKNLDKLLENKAFF + GVHQVNHLVNTGLGFGSEKGTSILKELLNLYDEIEFDLSKKDELLCPELNTPVFKRLG + 
YTYSDCVVKNEYFTIYPEEYFDPISLGDGVENILSDKTFSIHHYSASWTSLRNQMKSK + IIRKLGRSNILELKRILKGKTR" + gene 11178..12350 + /gene="wzy" + /locus_tag="SPC11A_0013" + CDS 11178..12350 + /gene="wzy" + /locus_tag="SPC11A_0013" + /note="member of homology group 68" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33128.1" + /db_xref="InterPro:IPR007016" + /db_xref="UniProtKB/TrEMBL:Q4K230" + /translation="MRISPSKLIFAFFSSFYILVILFPRGIFLGHSTLASRLWIIYNG + SLYLSILLGLIYVILKILSRNIAIHQHAFFILQYYFIVIILTFMVSGSIGVGLQSIFY + PIFIYLFFNEVRDKKSIVLIFDIFLYILTPLFVINTIDVFLNFTNIFHITFLGHVQVI + SQYSVIGFLVSAYYLLEEKRNILVAQLLLILTIINCFFSDVSLSKVIALFMIVYIISY + KLRKLFWKRGRKISVVTFIASVVMLALVIFGYFLPYLRYFDFTFNGRYQIWRIVYATI + LQVKWFGYGLFGFQFKLPWQKLGEVGINYTHNQVLQLALDSGIVGIISFFTMIFYMIF + STKNIQNSTISSLFIFAYFCLFIIMFIESVTYYPYYFIIIVLQTLYLKLERERNVK" + misc_feature 11178..11264 + /gene="wzy" + /locus_tag="SPC11A_0013" + /note="Signal peptide predicted for SPC0450 by SignalP 2.0 + HMM (Signal peptide probability 0.862) with cleavage site + probability 0.448 between residues 29 and 30" + misc_feature 11952..12146 + /gene="wzy" + /locus_tag="SPC11A_0013" + /note="HMMPfam hit to PF04932, O-Antigen Polymerase, score + 8e-10" + gene 12340..12840 + /gene="wcwT" + /locus_tag="SPC11A_0014" + CDS 12340..12840 + /gene="wcwT" + /locus_tag="SPC11A_0014" + /note="member of homology group 69" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI33129.1" + /db_xref="GOA:Q4K229" + /db_xref="InterPro:IPR011004" + /db_xref="UniProtKB/TrEMBL:Q4K229" + /translation="MLNRLIRNFNKVYYSYRIKRKAAQCGGRVYTGGKTFVTANTYLD + ENVSFNGMSMYGEGKISIGKNFHSGLNCQIITSFHNYDLGDKIPYDESYIHKDVLIED + NVWVGNNVIILGGAIIEEGAIIQAGSTVIGRIPAGAIAGGHPAKPFRFRNMEHYNQLK + RQKKFH" + misc_feature 12628..12681 + /gene="wcwT" + /locus_tag="SPC11A_0014" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 0.9" + misc_feature 12682..12735 + /gene="wcwT" + 
/locus_tag="SPC11A_0014" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 2.7" + gene 12850..14037 + /gene="wcwU" + /locus_tag="SPC11A_0015" + CDS 12850..14037 + /gene="wcwU" + /locus_tag="SPC11A_0015" + /note="member of homology group 70" + /codon_start=1 + /transl_table=11 + /product="putative glycerol phosphotransferase" + /protein_id="CAI33130.1" + /db_xref="GOA:Q4K228" + /db_xref="InterPro:IPR007554" + /db_xref="UniProtKB/TrEMBL:Q4K228" + /translation="MNIVSYLKKNGITHTLKIINEYKMQELFDSLVSIFTKQKELRNS + IVIECHTDFENNGGAFYDYLINNEYNKKYKIVLLLKDKLVKELPENVDYFYLRKPSLR + KSYVMSLSKFFTFDNDMLRKYRKDQKHFYLTHGCFPLKSTIGKITVPNYVDFVLSPSG + NVDNIIVKQFGLTSKEQCLHTGFPCHDIFYSKPEPLVFLSNYDKKIIWAPTFRKGGGY + NRNDSTASYPLGIPLLETLDELANLNTYLSQRDIALIVKLHPMQDISDLELKQFSHIK + FLTNQDLNRKNTNLYQLLMNSDALLSDYSAISYDYLHLDKPIGYVFSDLNDYKLGLSV + DNVDDYIAGDKILSFNNLLHFIDNIYLEIDKNKEKRKELFNKIFEKQDGESCERLAQI + MEL" + misc_feature 13423..14034 + /gene="wcwU" + /locus_tag="SPC11A_0015" + /note="HMMPfam hit to PF04464, + CDP-Glycerol:Poly(glycerophosphate) gl, score 9.5e-11" + gene 14054..15457 + /gene="wzx" + /locus_tag="SPC11A_0016" + CDS 14054..15457 + /gene="wzx" + /locus_tag="SPC11A_0016" + /note="member of homology group 52" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33131.1" + /db_xref="GOA:Q4K227" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K227" + /translation="MSVGMKAALWYTVANFIQKGFVFLSTPILTRILNVNDYGTLILY + QSWFVLFAIFATLNLSQTAYNKGLVEFENDKDNFTFSLLFLSKTITIIVAFLYFTFNI + LVKDSTGLTPSFMIFLFSDILFNISIEFYLARQRFEFKYRKAVLISTFSSFFIVAIST + TILLAIKNDLFIKIVLDAIIRIIFGLYCFYLLFFSGRRQLKIEKKYIKYGLSYSLPLI + PHFLSHYILNQSDRLMINMFDGKEKLAIYSLAYSVSMIMFLFTNAINQSIMPHTFQAL + KKKDYCGIHGSTKWLFVVVGGITALSILFAPELIVILGGNKYKESIWLVPPIAISVYF + LFVYSMFSNISFYYKMNKLISLVSTGAALSNIILNYIFINIFGYQAAAYTTLLCYILL + AFSHFFLYRFLLKKEEIHEELYNMKMILIISLILLIILFLILVIYNLAIIRYAIIAII + LFLLFTKRNKIITSLKS" + misc_feature 14063..14881 + /gene="wzx" + /locus_tag="SPC11A_0016" + 
/note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 1.4e-16" + gene 15571..15963 + /gene="gct" + /locus_tag="SPC11A_0017" + CDS 15571..15963 + /gene="gct" + /locus_tag="SPC11A_0017" + /note="member of homology group 28" + /codon_start=1 + /transl_table=11 + /product="CDP-glycerol-1-phosphate biosynthetic protein + Gct" + /protein_id="CAI33132.1" + /db_xref="GOA:Q4K226" + /db_xref="InterPro:IPR004820" + /db_xref="InterPro:IPR004821" + /db_xref="InterPro:IPR006409" + /db_xref="InterPro:IPR014729" + /db_xref="UniProtKB/TrEMBL:Q4K226" + /translation="MKRVITYGTFDLLHYGHINLLKRAKQLGDYLIVVVSSDEFNLKE + KNKVCYFNFEHRKNLVEAIRYVDLVISETSWEQKKTDIKEYHIDTFVMGDDWKGKFDY + LKEEGVEVIYLPRTKEISTTKIKEDLAD" + misc_feature 15583..15951 + /gene="gct" + /locus_tag="SPC11A_0017" + /note="HMMPfam hit to PF01467, Cytidylyltransferase, score + 9.7e-29" + gene 16325..17353 + /gene="wcjE" + /locus_tag="SPC11A_0018" + CDS 16325..17353 + /gene="wcjE" + /locus_tag="SPC11A_0018" + /note="member of homology group 18" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI33133.1" + /db_xref="GOA:Q4K279" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q4K279" + /translation="MTKVRINWVDFGKGFAIFLVLVGHVFIGLSESNKFSIANDVLLF + LIAQIYIFHIPVFFALSGYFFRPVSDLKEFWHYAKKKTIILGIPYIFYSIIHFCLQKL + AGASVRVPTTIHNLLNIYRYPLGVSWYLYTLWSILIVYGLLSIVFKNRKSLFLVSVFA + YIFTLFIQIDIFIVQRTLVWGVCFCLGSVLSEVHFNKINLKKFLFFFVLFDFIYMFAW + FLFYEVGSKKDYVSYSNPGLWGIAFIVCVLVAFAIFPKMEKNFPKTFLYFTKYGKDSL + GIYILHAPICSMIRILMLKVGINSVFLHVVVGIVLGWYLSILATYILKKIPFLNIVLL + PQKYIKLK" + misc_feature 16340..17314 + /gene="wcjE" + /locus_tag="SPC11A_0018" + /note="HMMPfam hit to PF01757, Acyltransferase family, + score 4.4e-05" + gene 17517..17636 + /gene="aliA" + /locus_tag="SPC11A_0019" + /pseudo + CDS 17517..17636 + /gene="aliA" + /locus_tag="SPC11A_0019" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliA + (pseudogene)" + gene 
17901..>17948 + /gene="aliA" + /locus_tag="SPC11A_0020" + CDS 17901..>17948 + /gene="aliA" + /locus_tag="SPC11A_0020" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33135.1" + /db_xref="UniProtKB/TrEMBL:Q4K2C2" + /translation="MMKSSRLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aggtcttggc tccatgggat gctttctgtg + 121 tggaaatgac tgactagaat gagcaagagt ctggaacaaa atagttctcg accacaaaaa + 181 agctagagat ttccaattgt ggaactctag ctttttaatt ttgagtcatt ctcttattgt + 241 attttagggg gttattggcc ataagtacca atcccatgtc aattctcact tgacgcttgc + 301 ccctcagatt acatctcttg taacccaaac aagcctttat ctgcccaaag acaggttcca + 361 catcaatctt gcgttgagcg aaaatctgtc taccttgggg agataaaagc gcttgacatt + 421 ctttagcttt caagttttga tagccttcgt tcatatacag tcccttttga ggggctgatt + 481 caggttcgtc ggcgtagtaa accttgattt cctgttgaaa gtctgtctgt gttttctgat + 541 gtttggtatg gtgaaaacga taataccagc catcaggatg tgtatagcta tcctccttgt + 601 cattatagtg ccaattcgct aagtttctag ctgactgttt atagcctctc ttctgttcct + 661 tatcaaacat ggcatattta atcagatggt ttacctcctt ttcatctaaa cgaaggaggt + 721 tctcttcact tccatatcca gcatctgcga caactgtctt caagtcatgc ggataggttt + 781 caaggaatgg cagaagagtc ttggtatctg tcggatttga aaagacatca tagtgaagaa + 841 caaattggtt ttccgtagcg atttgaagat tataagcagc cttgagttga ccatttttca + 901 tatgatcttc cttcatccgc ataaaagtgg catctggatc ggttttggaa aaactgttag + 961 gcccttcaac tgtctcctga tagttctcat atttttcagc acgtactgaa aaatcctcct + 1021 ttaaactctt cataatcctt tttattttta tgaagatatt gtttgaaaga tgtgagtttc + 1081 cacggatggg tttgtggagg gatatacttg cgtctttctt tttttgttct ggttcttgtt + 1141 caaagttttt cgaatagagc tcatgattta gtagctcctt tgtgtgatag attttgtcag + 1201 cgatattgag gtagatgtca ccatcaaatg cttttataac taatgctttt gtctttctga + 1261 tgaaatagac ttcttttcct tgttcggtag gaatatagca acgattttgg aatcggatat + 1321 ggcgtccact atcgacgact ctctccgcca gtctagctag aatgagattt cgttcagaga + 1381 gcttaggagc ctcctcaaag acagagagtt ttgtcttgtt tccaaactgt tcattaaaag + 1441 
tttggatata ggaaagaagg aaaatattgg cttcttccaa ggtatgaatc ttgtttcgtt + 1501 ccagttcgat aggcaggcga gattgtagta tctgattgag tctttcgact ctccctttag + 1561 cttgagggat agaggttgtc tcaaggagaa tccccagttg gtgacaggcg tatccaaatt + 1621 gtgtatgggt gtcgtcctcc attttcttag agttgggggc ttgataggta aagaccgttc + 1681 tcttatctgt tttgatttga agaggaatgc cgtggttggc taagatttgt tcgaggacat + 1741 gatagtaagc attcaaggtc tcttgtttat caaaataagc gcctaggata ttgccagaag + 1801 catcatcaat ggctaggtgt aagttagagg tttctgctcc aaaccaggca tgagggctgg + 1861 tatccatttg aatgagttca ccagcaaatt tctttctggg tctactagga tgtacttttt + 1921 tagggttttc caggaagtct tcagccgtcg gtaagattag attgtctagg ggttgcttgg + 1981 ggttcagttt agcttgtttt cttactctct tctttgtctt tctatgggac ttaggcgaca + 2041 ggatattttt cttatagagt atttttctaa cagttgtatc agagagctga attccttctt + 2101 cttcagctag caattcacag aaatgacgga catttggttt atatgtttca taggagaggt + 2161 atttctttag gatacgttct ttgatttcat cagggattgc atgttttggt tttcgatttc + 2221 tgtttccgtg tctgaaggct tcttttcctt tctgttgaca ggctagtagc agacgattga + 2281 tttgcctttc agaaagattg agcacgacac aggctcgttt ctttgttttc tttccttggg + 2341 ctatagcttt tatcacaaga tattttttcg tttcattcat attcagttgg atcctttaca + 2401 tatgactatt ctaccaaatg ggacattttt acgttcgatt tactaaagac attatcacat + 2461 tcgaattaca caagatgcag atagtgaaaa aaggtgtaga cattaccgta aaaaagtgat + 2521 ataatcgtat gatgttcaat gtataggtgt taatcatgag tagacgtttt aaaaaatcag + 2581 gttcacagaa agtgaagcga agtgttaata tagttttgtt gactatttat ttattgttag + 2641 tttgtttttt attgttctta atctttaagt acaatatcct tgcttttaga tatcttaatc + 2701 tagtggtaac tgcgttagtc ctactagttg ccttggtagg gctactcttg attatctata + 2761 aaaaagctga aaaatttact atttttctgt tggtgttctc tatccttgtc agctctgtgt + 2821 cgctctttgc agtacagcag tttgttggac tgaccaatcg tttaaatgcg acttctaatt + 2881 actcagaata ttcaatcagt gtcgctgttt tagcagatag tgagatcgaa aatgttacgc + 2941 aactgacgag tgtgacagca ccgactggga ctgataatga aaatattcaa aaactactag + 3001 ctgatatcaa gtcaagtcag aataccgatt tgacggtcaa ccagagttcg tcttacttgg + 3061 cagcttacaa gagtttgatt 
gcaggggaga ctaaggccat tgtcctaaat agtgtctttg + 3121 aaaacatcat cgagtcagag tatccagact acgcatcgaa gataaagaag atttatacca + 3181 agggattcac taaaaaagta gaagctccta agacgtctaa gaatcagtct ttcaatatct + 3241 atgttagtgg aattgacacc tatggtccta ttagttcggt gtcgcgatca gatgtcaata + 3301 tcctgatgac tgtcaatcga gataccaaga aaatcctctt gaccacaaca ccacgtgatg + 3361 cctatgtacc aatcgcagat ggtggaaata atcaaaaaga taaattaacc catgcgggca + 3421 tttatggagt tgattcgtcc attcacacct tagaaaatct ctatggagtg gatatcaatt + 3481 actatgtgcg attgaacttc acttctttct tgaaaatgat tgacttattg ggagggatag + 3541 atgttcataa tgatcaagag ttttcagctc tacatgggaa gttccatttc ccagtaggga + 3601 atgtccatct agactctgag caagctttag gttttgttcg tgagcgctac tccctagcag + 3661 atggcgatcg tgaccgtggt cgcaaccaac aaaaggtgat tgtggctatc cttcaaaaat + 3721 taacgtcaac cgaagcgctg aaaaattata gtacgatcat tgatagcttg caagattcta + 3781 tccaaacaaa tatgccactt gagaccatga taaatttggt caatgctcag ttagaaagtg + 3841 gagggaatta taaagtaaat tctcaagatt taaaagggac aggtcggacg gatcttcctt + 3901 cctatgcgat gccagatagt aacctctatg tgatggaaat taacgacagt agccttgcat + 3961 ctgtcaaaac tgctattcag gacgtgttgg agggcagatg aaatgattga tattcattcg + 4021 cacattgtct ttgatgtaga tgatggtccc aagtcaagag aggaaagcaa ggctctcttg + 4081 acagaagcct acaggcaggg ggtgcgaacc attgtctcta cctctcaccg tcgcaagggc + 4141 atgtttgaaa ctccagaaga gaagatagca gaaaactttc ttcaggttcg ggaaatagct + 4201 aaggaagtcg cgagtgactt agtcattgct tatggggctg aaatttacta cacaccagat + 4261 gttttggata agctggaaaa aaatcggatt ccgaccctca ataatagtcg ttatgccttg + 4321 atagagttta gtatgaacac cccttatcgc gatattcata gtgccttgat taaaatattg + 4381 atgttgggaa ttactccagt cattgcccac atcgagcgct atgatgcact tgaaaacaat + 4441 gaaaaacgcg ttcgagagct gatcgatatg ggctgttaca cgcaagtaaa tagttcacat + 4501 gtcctcaaat ccaaactttt tggagaacgg tataaattca tgaaaaaaag agcgcagtat + 4561 ttcttggagc gtgatttggt tcatgtgatt gcaagtgata tgcataatgt ggacagcaga + 4621 cctccccata tggcagaagc atatgacctt gtttctcaaa aatacggaga agcgaaggct + 4681 caggaacttt ttatagataa tcctcgaaaa attgtaatgg 
atcaactaat ttaggagaaa + 4741 taatgaaaga acaaaatacg atagaaatcg atgtatttca atcacttaaa accttatgga + 4801 aatacaagct aatcatttta ttagtggcac ttgtgacagg ggcgggagct tttgcatata + 4861 gcacttttat tgttaagcca gaatatacaa gtaccacgcg tatttacgta gtcaaccgta + 4921 atcaaggaga taagccggga ctgacgaatc aggacttgca ggcaggaact tatctggtaa + 4981 aagactaccg cgaaattatc ctttcgcaag atgtattgga aaaggtagcg acaaatttga + 5041 aattggatat tccagcaaaa acgttaacta gcaaagtgca agtgactgta ccagccgaca + 5101 ctcgtatcgt ctcaatctct gtcaaggata aacaaccaga ggaagccagt cgcattgcta + 5161 attctctacg agaagttgct gcagaaaaga tcatcgctgt aacgcgagta tctgatgtaa + 5221 cgacgcttga agaagcgcga ccagctacga ctccctcttc tccaaatgtt cgacgcaaca + 5281 ccttagttgg ttttcttgga ggagccgccg taacagtaat tactgttctt ttgattgagt + 5341 tgctcgatac ccgtgtaaaa cgtcctgaag atgttgaaga tgtactgcaa atgccacttc + 5401 taggagtcgt tccagatttt gataaaatga aataggagga agttatgcca acgttagaaa + 5461 tctcacaggt gaaattagaa cttgcgaaaa aggcagagga atattataat gctttgtgca + 5521 cgaacctaca gttaagtgga gatgatttga aagtattttc tatcacttct gtgaaagcag + 5581 gagaaggaaa aacaacgact tccaccaata tcgcttgggc ttttgcgcgt gcaggttaca + 5641 aaacgctgct gattgatgca gacatgcgta actccgttat gtcaggtgtc tttaaatcaa + 5701 gggaaaggat tactggacta acagaatttc tatcagggac aacagacctg tcacaggggc + 5761 tttgcgatac caatattgag aatctctttg tgattcaggc tggctctgtg tcaccaaatc + 5821 cgacagccct tcttcaaagt aagaatttca gcacaatgct tggaaccttg cgtaaatatt + 5881 ttgactatat cgtcgtagac actgctccta tcggtatcgt gattgatgcg gctatcatta + 5941 tgcagaaatg tgatgcttct attttagtga cgaaggcagg tgaaacaaaa cgacgggatc + 6001 ttcaaaaagc gaaagaacag ttggaacaaa ctgggaagtc gtgtttagga gttgtgttga + 6061 ataaattcga tacttcagta gagaaatacg gttcttatgg gagttatggg aattacagga + 6121 aacagaaaaa ataggttgag ggatagaaat gagtgaaaaa ctagcaaagc cttcagtagc + 6181 catagtccag agttttcttg ttattttatt gacttatcta cttagcgctg tgagagaaac + 6241 agagattgtt tcaacaacag ctattgtact ttatatcctc cactattttg tcttttatat + 6301 cagtgattat ggacggaatt tctttaaaag gggatatttg attgaacttg tccagacatt + 6361 
gaaatatatc ctattctttg cgctagcgat tagtatttct aattttttct tagaagatcg + 6421 atttagtatt tccagaagag gcatgattta cttcctctta ttacatgttt tcttagtcta + 6481 tgtgctaaac ctatttatca agtggtattg gaagcgggct tatcccaact ttaaaggaag + 6541 taagaaggtt ttcctactta cagcaacttc tcatgtcgaa aaggtactgg atagattaat + 6601 agaatcaaat gaggttgttg gggagttggt agccgtcagt gttttagata aaccagattt + 6661 tcagcatgat tatttaaagg ttgtagcaga gggggagata gtaaactttg cgactcatga + 6721 ggtggtcgat gaagtcttta tcaatcttcc aagtgaaaaa tacaatattg gagagcttgt + 6781 ctctcagttt gaaacgatgg gaattgatgt aacagtcaat ctaaatgctt tcgattgggc + 6841 acgtaacaag caaattcgtg agatggcagg actaaatgtt gtgacttttt ctacaacatt + 6901 ttataagact agccatatga ttgctaagcg gattattgat attgtcggtt ccctggtagg + 6961 tttgatatta tgtggtctag tcagtattgt gctggttcct ttgattcgaa aggatggggg + 7021 ttctgctttt tttgctcaga cgcgtatagg aaaaaatggc cgccatttca ctttttataa + 7081 gtttcgctct atgtgtgtag atgctgagga taaaaagaga gaactcatgg aacaaaatac + 7141 catgcagggt ggaatgttta aggtggacga tgatcctcgt atcacgaaaa ttggtcattt + 7201 tatacggaag acgagcttgg acgagctacc acagttttat aatgttctaa agggagatat + 7261 gagtttggta ggtacacgac caccaacagt ggacgagtat gaacactata ccccagaaca + 7321 aaaacgtcgg ctaagtttta aacctggtat aacaggctta tggcaggtca gtggacgaag + 7381 tgagatcaag aatttcgatg aagttgtcaa gttagatgtg gcctatatag acgattggac + 7441 aatctggaaa gatattgaga ttttattgaa gacagttaaa gttgtattga tgaaggatgg + 7501 agcgaaatag gaaatgaaaa tatgtttagt tgggtctagt ggaggtcatc tgactcattt + 7561 atatctatta aaacctttct ggaaagataa ggaaagattt tgggttactt ttgataaaga + 7621 ggatacaaga agtatcttgg gaaatgagac attttatcct tgtcattatc ctactaatcg + 7681 taatttgaaa aatcttatta aaaatacggt tcttgctttc aatattttga gaaaggaacg + 7741 ccctgatgtt atcatctcat caggggctgc tgtagcagtt cctttctttt acctaggaaa + 7801 actatttggc gctaagacag tctacattga agtttttgat cgtattgatg cgccaacctt + 7861 aacaggaaaa atagtatatc cagtaacaga taagttcata gttcagtggg aggaaatgaa + 7921 aaaagtatat ccaaaagcaa ttaatctcgg agggattttc taatgatttt tgtgacaata + 7981 ggtactcatg agcaacagtt 
taatcgactt attaaagaag ttgatagatt aaaaggtgag + 8041 ggatttattc aggatgatgt ttttattcag actggttttt cagattatga accagtgtat + 8101 tgtcaatgga agaatctgat ttcttatgat gagatgaatc gctatataga tgaagcaaat + 8161 attatcatta cacatggcgg cccagctaca tttatggcag ttattgctaa aggaaaaata + 8221 ccaatagttg ttccgagatt aaagaagttt ggtgagcatg tgaatgatca tcagatggaa + 8281 ttttgttcta aaatactatc cgaagggtat gaattatctc tgattaatga tataagcgaa + 8341 ttgcagtata gtttaaagca agaaaagaaa actaaatttt actctaataa tacatgtttt + 8401 cttaagaaat tatcaaaaac aattgaagat ttaatagtat gaaatgagat tatttattct + 8461 tgttgcagat aaattaaaaa taaatgaaat tttaagtcaa gtagttgtgc taaaatgtat + 8521 ttatgattaa gaataaaata atcactattc ctatatatgg aaatagttct taaagcatag + 8581 tttaaattat ggatgtagat tatttcgtta actcttataa tcaatttata aggccagata + 8641 gtaacattat taaaatcata gctaggagta agggaggatg taaatgaaaa tactacacat + 8701 tccaacaggt ggtttatttt ctgatggtat aggaactttt atttattcat atttagagta + 8761 tatggactta aacaagtatg atgtgacaat tttagccact aattcccctt tgaaaagtga + 8821 taaggaaaaa tttgaatgtt taggggttaa agttattgaa attgaaagaa aaaaatcaaa + 8881 cctttctaaa tatgtataca aattaaaaaa aataataaaa aaagaaaaat ttgacattat + 8941 acatgttcac ggaagtagcg ccttaatgtc aattgaatta ctgactgcta aagttgctgg + 9001 tatcccagtt cgaattgccc atagtcataa cactacttgt gagcatcata aattagataa + 9061 actactacga ccgatatttt atcgagttta tactcaggca tgtgcttgta gtgttagtgc + 9121 tggtcaatgg ctttttgagg aaaaaaatta taagattatc cataacgcta gagatgtaaa + 9181 taggtatcag tatgatgcca taaaaagaaa aaaacttaga gaagaattgt tgctatctga + 9241 tgagactatt gctctaggtc atgttggacg ttttaatact caaaaaaatc aatgttttct + 9301 agtgtctcta atggaaaaat tagtaatcaa aaatatagat ataaaattat ttttagtagg + 9361 gacaggtgat actttggaag aaatcaagaa attagtcatt cagaaaaaac tagaagataa + 9421 cattgttttt ttaggtcaat ttgatgatat gaaatctttt gtgtcatcaa tggatataat + 9481 gttgcttcca agtttatatg aagggttacc actagtatct gttgaatggc aaattaacgg + 9541 agtagaaagt atcctatctg accgtgttac acaagagtgt atctatacag gaactgttca + 9601 acaattatct atcgatagca tggaattatg ggaaaaagaa 
attttgaatt tatctacttc + 9661 agatagagaa agagtgtcat tgcaaaatat tcagttgata aaaaatgcag gttatgatat + 9721 ttctttagaa gttaaagaaa tagaagaatt atataattca ctttatgata ttgcgaattg + 9781 aatgaaaggg aagagttttc ttttgaagat gttacaaaat ttaaaaccaa taaaacggaa + 9841 attaaaacca attaagagaa cttataagag aatcgtttat tctatcacta agtcaaatat + 9901 gaggaagagg ctcaaaaata cagatttttc aattatcagt gataattgct ggggaggacg + 9961 ggtatatgaa gaattgggtc tgccgtatag aacaccattt ataggtctgt atattttttc + 10021 cgaggattat gtgaaactgt tgaaaaactt cagaaagtat atggaatatg agctaacttt + 10081 taccaataat tcaaaatgga acacagaata tgacggggag tatcctatag gcatacttaa + 10141 ggatattgaa cttcattttt tacattatgc taatcaagaa gaggcttatg agaaatggaa + 10201 taaaagaaag aacaggatta attatgaaaa tatctttttt aagatgaatg atgataataa + 10261 atgttctttg aaattgctta aggaatttga tactttagat ttgaaaaata aaattatttt + 10321 tgctgcattc aattataaag aactagataa tcttattcat tttaccaatc ctagagggaa + 10381 tggtaatgta ggtacagact tattttatta tgatcaatat tttgatgttg taaattggct + 10441 gaatggagag acacaaacat gatacctaaa aagattcatt attgttggtt cggtggcaaa + 10501 cctttatcaa atgatgtaaa gcgatgtata gcaagttgga aaaaattttg tcctgattat + 10561 gaaattattg aatggactga aaaaaacttt tgtattgaaa atcaaaatca atttgtgcag + 10621 gatgcatata gagataaagc atgggctttt gtaagcgatt atgcaagact taaaattata + 10681 tatgaaaatg gaggtattta tttagatact gatgttgaag tgattaaaaa tctagataag + 10741 ttgttggaaa ataaagcatt ctttggagtt catcaagtta atcatctagt taatacagga + 10801 ttagggtttg gatcggaaaa gggcacctct attttaaagg agttattaaa tttgtatgat + 10861 gaaatagaat ttgatcttag taagaaagat gaattgttat gtcctgaatt aaatacacct + 10921 gtatttaaac gtcttggtta tacttattct gactgtgttg taaaaaacga atatttcaca + 10981 atctatcctg aagaatattt tgatccgatt tctttgggtg atggcgtaga aaatatttta + 11041 tcagataaaa cattctctat tcatcattat agtgcttctt ggacttcctt aagaaatcag + 11101 atgaagagca aaataattcg taaactaggc agaagtaata tcttggagtt aaaaagaata + 11161 ttaaagggga aaactagatg agaatatcac cttcgaagct gatatttgca ttttttagca + 11221 gcttttatat tcttgtaatc cttttcccaa gaggaatttt 
tctaggacat tctactttag + 11281 cttctcgatt atggattatt tacaatggaa gtttatattt atcaatatta cttggtttaa + 11341 tatatgttat tttaaaaata ttatctcgaa atatcgccat tcatcagcat gcttttttca + 11401 tcttacaata ttattttatt gtaattattt taactttcat ggtaagtggg tcaatcggtg + 11461 ttgggctaca atcgattttc tatccaatat tcatctattt attttttaat gaagttcgag + 11521 ataagaaatc aatagtgtta atttttgata tctttcttta tatacttact cctttattcg + 11581 ttatcaatac gattgatgtt tttctgaatt tcacaaatat ttttcatatt acttttttag + 11641 gacatgttca ggtgatttcc caatatagtg ttatcggatt tctcgtatca gcatattact + 11701 tattagaaga aaagagaaat atattagtgg cacagttgct gttgatttta acgattatca + 11761 attgtttttt ttcagatgtc tctctctcta aagttattgc tttgtttatg attgtttata + 11821 ttatttcata caagttaaga aaactattct ggaaaagagg aaggaagata tctgttgtaa + 11881 cttttattgc atctgttgtg atgttagcat tagtaatttt tggatatttt ttaccatatc + 11941 ttagatattt tgattttact tttaatggtc gataccaaat ttggcgcatt gtgtatgcta + 12001 ccattcttca agtgaaatgg tttggatatg gtttgtttgg ctttcaattt aaacttccgt + 12061 ggcagaaatt gggagaagtt ggaataaatt acactcataa tcaagtttta cagttagcac + 12121 ttgatagtgg tattgttggg attatctcat tctttactat gattttttat atgatctttt + 12181 caactaaaaa tattcaaaat tccacaataa gctctctatt tatttttgcc tatttttgtc + 12241 tatttattat aatgtttata gagagtgtca cttattaccc atactatttt attataatag + 12301 ttcttcagac tttgtactta aaattggaaa gagaaagaaa tgttaaatag attgataaga + 12361 aattttaata aagtatatta tagttatcgt ataaaaagaa aggcagcgca atgcggtggg + 12421 agagtgtata cgggaggcaa aacgtttgtt actgcaaata cgtaccttga tgaaaatgtt + 12481 tcatttaatg gtatgtcaat gtatggtgaa gggaaaataa gcattggtaa aaattttcat + 12541 tcaggattga attgccaaat tatcacttcc tttcataatt atgacttggg cgataaaatt + 12601 ccttatgatg agagttatat acataaagac gtcttaattg aagataacgt ctgggtagga + 12661 aataatgtga taattttagg tggtgcgatt attgaggaag gtgcaatcat tcaagcagga + 12721 agtacagtta ttggaagaat tccagcaggt gcaattgcag gtggacatcc agcaaaacca + 12781 ttcagattta gaaacatgga acattataat caacttaaac ggcaaaaaaa gtttcattag + 12841 aggttaagaa tgaatattgt aagttatcta aaaaaaaacg 
gtattacaca tactttaaaa + 12901 attattaatg aatataaaat gcaagagctg tttgatagtc ttgttagtat ttttacaaag + 12961 cagaaggaac ttcgtaacag tattgtcatt gaatgtcata ctgattttga aaataatggt + 13021 ggtgcgttct atgactatct aatcaataat gagtataata aaaaatataa aattgtctta + 13081 ctattgaagg ataaattagt taaagaatta ccagaaaatg tagattattt ttatttaaga + 13141 aagcccagtt tacgaaaatc ctatgtaatg tcattaagta aattctttac ttttgataat + 13201 gatatgcttc gtaaatatag aaaagatcaa aaacactttt atttaacaca tggatgcttt + 13261 cctttaaaaa gtacaatagg taaaataaca gttccgaatt atgttgattt tgttctatct + 13321 ccctcgggca atgtagataa tattatagtt aagcagtttg gattaacatc taaagagcaa + 13381 tgtcttcaca ctggatttcc gtgtcatgat atcttttatt caaaaccaga acctctagta + 13441 tttttatcta attatgataa aaaaattatc tgggcaccaa cttttagaaa gggtggtggc + 13501 tataatagaa atgatagtac agctagctat cctttaggca ttccgttact tgaaacacta + 13561 gatgaactgg caaacctaaa cacatatcta agccaacggg atattgccct gattgtaaag + 13621 ttacatccaa tgcaagatat ttcagatttg gagttgaaac aatttagtca tattaagttt + 13681 ctgacaaatc aagatttgaa tcgtaaaaat acaaatctgt atcaattgct gatgaattca + 13741 gatgctttac tcagtgacta ttctgcaatc tcgtatgatt atttacacct tgataaacca + 13801 atagggtatg ttttttcgga tctaaatgat tataagttgg ggctttcagt tgataatgta + 13861 gatgattaca tagcaggtga taagatactg tcttttaaca acttgctgca ctttattgat + 13921 aacatttatc tagaaattga taaaaataaa gaaaaacgca aggaattatt taataaaata + 13981 tttgaaaaac aggatggaga atcgtgtgaa agattggcac aaattatgga attataaaag + 14041 ccgttacgaa gaaatgtctg tcgggatgaa agcggcactc tggtatactg ttgcaaattt + 14101 tattcaaaag ggttttgtat ttctttcaac tccgatttta accagaatac ttaatgttaa + 14161 tgattacggt acattgatac tttaccaatc atggtttgta ctatttgcta tttttgcgac + 14221 cttgaatctt tctcaaacag cttataataa gggattggta gaatttgaga atgataaaga + 14281 taattttaca ttttctttgt tgtttttgtc taagactatt actataattg ttgctttttt + 14341 atattttact tttaatatac tggttaaaga tagtactgga ttaactccca gtttcatgat + 14401 atttttattc agtgatatct tatttaatat tagtatagaa ttttatttgg cacgtcagag + 14461 atttgaattc aaatatagaa aagcagttct aatttcaact 
ttttcaagtt tttttattgt + 14521 agctattagt acaactatct tattagcgat taagaatgat ttattcatta aaattgtatt + 14581 ggatgctatt atccgaatta tctttggttt atattgtttt tatctcttgt ttttttcagg + 14641 gagaaggcaa cttaagatag aaaaaaaata tattaaatat ggtttgagtt attcattacc + 14701 tttgataccg catttcttat cgcactatat tttgaatcag tctgaccgtt tgatgattaa + 14761 catgtttgat ggtaaggaga aattagctat atatagtcta gcttattctg tatcaatgat + 14821 tatgtttttg tttactaatg caattaatca atcaataatg ccgcatacat ttcaagcttt + 14881 gaaaaaaaag gattattgtg ggatacatgg gagcaccaaa tggctttttg tagtagttgg + 14941 ggggattaca gctctctcaa ttctatttgc accagaacta attgttattt taggcggcaa + 15001 taaatataag gaatcaattt ggctagtacc tccaattgcc atctcggttt atttcctttt + 15061 tgtatattct atgtttagta atatcagttt ttattataag atgaataagc tgatttcgtt + 15121 agtttccaca ggtgcggctc tttcaaatat tattttaaat tatattttta ttaatatatt + 15181 tgggtatcaa gctgcagctt acactacatt attatgctat atattgttgg cgttttctca + 15241 ttttttctta tatagatttt tattaaaaaa agaggaaatt catgaggaac tttataacat + 15301 gaagatgatt ttaataatat ctttaatatt attaataata ctatttttga tacttgttat + 15361 ttataactta gccattataa gatatgcaat tattgcaatt attttatttc ttttgtttac + 15421 aaagagaaat aaaataatta catcgctaaa aagttgatat tgaaaattta gaatcaaata + 15481 aagaatatag tggatatcaa gccagtatta ataatgaata attgttttta tgtaatttaa + 15541 gattaataaa aaaattgaaa ggaaatatca atgaaaagag taattactta tggaaccttt + 15601 gatttgcttc attatggaca tatcaatttg ttaaagagag caaagcaatt aggagattat + 15661 ctcattgttg tagtttcaag cgatgagttc aatttgaaag aaaaaaataa agtttgttac + 15721 tttaattttg aacatagaaa aaatttggtt gaagcaataa gatatgttga tctggtgatt + 15781 tctgaaacaa gctgggaaca gaaaaaaaca gatattaaag aatatcacat tgatacattt + 15841 gttatggggg atgattggaa gggaaaattt gattatttaa aagaagaagg agtggaagta + 15901 atttatttac caagaactaa agaaatatct acaactaaaa ttaaagaaga tttagcagat + 15961 tagatttttt acaaaaatat tttgagttca gataataaat ttgtttctat aattattaat + 16021 gtcttgacta tttaaatctt attttaaaaa aatctagttt aagatatgaa agaaaatttt + 16081 atccataact atcatattat tggcaatata tattgtgata 
atgtatggga agttagtaga + 16141 tatgaatgtg atatatagct agaattaata ttattcattg ctatttaaaa tgtaggtaag + 16201 aatgtattag atttagcata aaattagaaa acaagctatt ttttctgtga aattaggtag + 16261 atatacaata atatttgtat tgttagagaa agaaatctta atattgtaat gggggcattt + 16321 tgaattgact aaagtaagaa ttaattgggt agattttggg aaaggatttg caatattctt + 16381 agttctagta gggcatgtat ttattggttt atctgaatcc aataagtttt caattgcaaa + 16441 tgatgtgtta ttattcctga tagctcaaat ctatatattt catataccag tgttttttgc + 16501 gttatcagga tactttttca gacctgtatc agatttgaag gaattttggc attatgctaa + 16561 aaagaagaca attattttag gcataccata tattttttat tcaattattc acttttgtct + 16621 tcaaaagctt gctggtgctt ctgtgagagt acccactacg atacataatc tattaaatat + 16681 atatagatat cctttgggag tttcatggta tctatatacg ctatggtcga tattgatagt + 16741 ttatggttta ctatctattg ttttcaaaaa tcgtaagtct ctctttttag ttagtgtttt + 16801 tgcctatatt tttacactat ttattcaaat tgatattttt attgtacaac ggacgttggt + 16861 ttggggtgtt tgcttctgtc taggcagtgt attgagtgaa gttcacttta ataaaattaa + 16921 tttgaaaaaa tttctgtttt tctttgtgct atttgatttt atttatatgt tcgcttggtt + 16981 cttgttttat gaagtagggt ctaaaaagga ttatgtaagc tatagtaacc cagggttgtg + 17041 gggaattgct tttattgttt gtgtattagt tgcttttgcg atttttccta aaatggagaa + 17101 aaatttccct aaaactttcc tatatttcac taaatacggg aaagatagtt taggtatcta + 17161 tattcttcat gcaccaattt gtagcatgat tcggattcta atgttgaaag tgggaataaa + 17221 ctcagttttt cttcacgttg ttgttgggat tgtcttaggc tggtatttat ccatactagc + 17281 aacttatata ttgaaaaaaa ttccattttt gaatattgtt ttattaccac agaagtatat + 17341 taaattaaaa taaattattt tagatttata atgtggctcc ttgtcaatga acatctggag + 17401 aggacaatca ctgtcttctc ctttttgttt tttcagaata taccaaatta acccaaaaat + 17461 tatgttgata actttctgaa agatactata atggagagaa agttttaaag gagaaaatga + 17521 tgaaaagttt aagactactt actcttgcgg gtgtaacctt attggtggct actactttag + 17581 ctgcatgttc tggatcaggt tcgatcgcta aaggagagaa gacattctta tatattagac + 17641 ttcctgcgaa acaaaatggc tctttgtcaa ctgtagtggg ttgaagaaaa gctaagctcg + 17701 agaaaggaca aatttcgtcc tttctttttt gatgttcaaa 
gcgataaaaa tccgttttag + 17761 actaatttcc actttggtta ggcaagtgga agttactttg agaagttacc gtttgaaaaa + 17821 taattttcaa aaattctgaa aattctgttg acatctttct gaaaagagtc tataatggag + 17881 agaaagtttt aaaggagaaa atgatgaaaa gttcaagact acttgccctt gcgggcgtga + 17941 cattattg +// + diff --git a/public/res/serotype_genbank/serotype_11B.gb b/public/res/serotype_genbank/serotype_11B.gb new file mode 100644 index 0000000..f2d8810 --- /dev/null +++ b/public/res/serotype_genbank/serotype_11B.gb @@ -0,0 +1,814 @@ +LOCUS CR931654 17082 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 8087/40 (serotype 11b). +ACCESSION CR931654 +VERSION CR931654.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 17082) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 17082) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..17082 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="8087/40" + /db_xref="taxon:1313" + gene <1..163 + /gene="dexB" + /locus_tag="SPC11B_0001" + CDS <1..163 + /gene="dexB" + /locus_tag="SPC11B_0001" + /codon_start=2 + /transl_table=11 + /protein_id="CAI33136.1" + /db_xref="GOA:Q4JZD8" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4JZD8" + /translation="DRRFLVVANLSNEEQDLTVEGKVKSVLIENTAAKEVLEKQVLAP + WDAFCVELL" + gene 322..495 + /gene="aliB" + /locus_tag="SPC11B_0002" + /pseudo + CDS 322..495 + /gene="aliB" + /locus_tag="SPC11B_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(488..1352) + /gene="tnp" + /locus_tag="SPC11B_0003" + /pseudo + CDS complement(join(488..991,990..1352)) + /gene="tnp" + /locus_tag="SPC11B_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(join(965..991,990..1334)) + /gene="tnp" + /locus_tag="SPC11B_0003" + /note="HMMPfam hit to PF01710, Transposase, score 3.5e-20" + /pseudo + gene 1586..3031 + /gene="wzg" + /locus_tag="SPC11B_0004" + CDS 1586..3031 + /gene="wzg" + /locus_tag="SPC11B_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33139.1" + /db_xref="GOA:Q4K276" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K276" + /translation="MSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVATAFVLLVALVGLLSIIYKKAEKFTIFLLVLSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSLSVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNIDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDHASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDIHYYVRLNFTSFLKLIDLLGGVDVYNDQ + 
EFTALANKKHYSIGNVHLDSEEALAFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EVLKNYSRIIDSLQNSIQTNMPLETMINLVNAQLESGGTYKVNSQDLKGRGRTDLPSY + AMPDSNLYMMEINDSSLASVKTAIQDVLEGR" + misc_feature 1586..1702 + /gene="wzg" + /locus_tag="SPC11B_0004" + /note="Signal peptide predicted for SPC0462 by SignalP 2.0 + HMM (Signal peptide probability 0.994) with cleavage site + probability 0.468 between residues 39 and 40" + misc_feature 1790..2137 + /gene="wzg" + /locus_tag="SPC11B_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 1.2e-63" + misc_feature 2315..2758 + /gene="wzg" + /locus_tag="SPC11B_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 8e-65" + gene 3033..3764 + /gene="wzh" + /locus_tag="SPC11B_0005" + CDS 3033..3764 + /gene="wzh" + /locus_tag="SPC11B_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33140.1" + /db_xref="GOA:Q4K256" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K256" + /translation="MIDIHSHIVFDVDDGPKSREESKALLTEAYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLENNRIPTLNNS + RYALIEFSMNTPYRDIRSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKSKLFGEPDKFMKKRAQYFLERDLVHVIASDMHNVDGRPPYMAEAYDLVS + QKYGEAKAQDLFIDNPQKIVMDQLI" + misc_feature 3036..3644 + /gene="wzh" + /locus_tag="SPC11B_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 1e-38" + gene 3770..4465 + /gene="wzd" + /locus_tag="SPC11B_0006" + CDS 3770..4465 + /gene="wzd" + /locus_tag="SPC11B_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33141.1" + /db_xref="GOA:Q4K255" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K255" + /translation="MMKEQNTIEIDVFQSLKTLWKHKLIILLVALVTGAVAFAYSTFI + 
VKPEYMSTTRIYVVNRNQGDKPGLTNQDLQAGAYLVKDYREIILSQDVLEKVATNLKL + DMPAKTLTSKVQVTVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIIAVTRVSDV + TTLEEARPATTPSSPNVRRNTLVGFLGGAAVTVITVLLIELLDTRVKRPEDVEDVLQM + PLLGVVPDFDKMK" + misc_feature 3791..4207 + /gene="wzd" + /locus_tag="SPC11B_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 3.3e-51" + misc_feature 4313..4390 + /gene="wzd" + /locus_tag="SPC11B_0006" + /note="PS00217 Sugar transport proteins signature 2." + gene 4475..5182 + /gene="wze" + /locus_tag="SPC11B_0007" + CDS 4475..5182 + /gene="wze" + /locus_tag="SPC11B_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33142.1" + /db_xref="GOA:Q4K273" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K273" + /translation="MPTLEISQAKLEPMKKAEEYYNALCTNLQLSGDDLKVFSITSVK + AGEGKTTTSINIAWAFARAGYKTLLIDADMRNSVMSGVFKPRERITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLGTLRKYFDYIVVDTAPIGIVI + DAAIIMQKCDASILVTKAGETKRRDLQKAKEQLEQTGKSCLGVVLNKFDTLVEKYGSY + GNYGNYGNYGNYRKQKK" + gene 5197..6564 + /gene="wchA" + /locus_tag="SPC11B_0008" + CDS 5197..6564 + /gene="wchA" + /locus_tag="SPC11B_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI33143.1" + /db_xref="GOA:Q4K253" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K253" + /translation="MNEKLAKLSVVIAQSFLVILLTVLLSAVRETEIVSTTAIVLYIL + HYFVFYISDYGRNFFKRGYLIELVQTLKYILFFALAISISNFFSEDRFSISRRGMIYF + LLLYVFLVYVLNLFIKWYWRRAYPNFKGSKKFFLLTATSHIEKVLDRLIESDDVVGKL + VAVSVLDKPDFQHDYLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + IDVTVNLNAFDCILAHNKQICEMAGLNVVTFSTTFYKTSHVIAKRVIDIIGSLVGLIL + CSLVSIVLVPLIRKDGGSAIFAQTRIGKNGRHFTFYKFRSMCVDAEEKKRELMEQNTM + 
QGGMFKVHDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVLM + KDGAK" + misc_feature 5197..5283 + /gene="wchA" + /locus_tag="SPC11B_0008" + /note="Signal peptide predicted for SPC0466 by SignalP 2.0 + HMM (Signal peptide probability 0.901) with cleavage site + probability 0.304 between residues 29 and 30" + misc_feature 5980..6561 + /gene="wchA" + /locus_tag="SPC11B_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 2.8e-156" + gene 6568..7017 + /gene="wchJ" + /locus_tag="SPC11B_0009" + CDS 6568..7017 + /gene="wchJ" + /locus_tag="SPC11B_0009" + /note="member of homology group 26" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase enhancer" + /protein_id="CAI33144.1" + /db_xref="GOA:Q4K252" + /db_xref="InterPro:IPR013969" + /db_xref="UniProtKB/TrEMBL:Q4K252" + /translation="MKICLVGSSGGHLTHLYLLKPFWKDKERFWVTFDKEDARSILGN + ETFYPCHYPTNRNLKNLIKNTILAFNILRKERPDVIISSGAAVAVPFFYLGKLFGAKT + VYIEVFDRIDTPTLTGKLVYPVTDKFIVQWDEMKKVYPKAINLGGIF" + gene 7017..7496 + /gene="wchK" + /locus_tag="SPC11B_0010" + CDS 7017..7496 + /gene="wchK" + /locus_tag="SPC11B_0010" + /note="member of homology group 27" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33145.1" + /db_xref="GOA:Q4K251" + /db_xref="InterPro:IPR007235" + /db_xref="UniProtKB/TrEMBL:Q4K251" + /translation="MIFVTVGTHEQQFNRLIKEVDRLKGEGLIQDEVIIQTGFSDYEP + VHCQWKALISYDEMNQYMDEADIVITHGGPATFMGVISKGKRPIVVPRQEKFGEHVND + HQMEFCLKLLGEGYDLVVIDEIDKLNENIKYSKVQQVSSHNSKFTNELSDIIENMFI" + misc_feature 7017..7487 + /gene="wchK" + /locus_tag="SPC11B_0010" + /note="HMMPfam hit to PF04101, Glycosyltransferase family, + score 1.1e-50" + gene 7638..8750 + /gene="wcyK" + /locus_tag="SPC11B_0011" + CDS 7638..8750 + /gene="wcyK" + /locus_tag="SPC11B_0011" + /note="member of homology group 116" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + 
/protein_id="CAI33146.1" + /db_xref="GOA:Q4K250" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K250" + /translation="MKILHIPTGGLFSDGIGTFIYSYLECMNLDKWEVTVLATNIPLL + EDKAKFENLGIQVVVLERKKTAIIHYMCQLYKLIRANKYDIIHVHGSSSLMSIELSVA + KIAGVPVRIAHSHNTTCDHRKLDKVLRPVFHKLYTQAWACGEGAGKWLFTNREYTIIH + NARNIKRYQFSESKRQRFRKKLSLKDTTLALGHVGRFNVQKNHEFLVLLMENLVIQGL + DVKLFLVGEGSTLSKIKNMVSEKSLEDRVFFLGHLNDMKSFVSAMDIMLLPSLYEGLP + LVSVEWQINGIQCILSDTITKECIYTKQVTSLPIRTPLYWEKAIRDFCPEDRLRQSIE + NQRLAREAGYDIELELVKLDTLYNKLIMTIKDRTRK" + misc_feature 8160..8657 + /gene="wcyK" + /locus_tag="SPC11B_0011" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 9.1e-19" + gene 8747..9217 + /gene="wcwR" + /locus_tag="SPC11B_0012" + CDS 8747..9217 + /gene="wcwR" + /locus_tag="SPC11B_0012" + /note="member of homology group 147" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI33147.1" + /db_xref="GOA:Q4K249" + /db_xref="InterPro:IPR001451" + /db_xref="InterPro:IPR005881" + /db_xref="InterPro:IPR011004" + /db_xref="UniProtKB/TrEMBL:Q4K249" + /translation="MKNDRKAQLIITIFKYGKRHVGRSTFYHKLNYKMYQILNAIFVI + GIFNTELPASQNISDNIILFHPYGIIVNGDVTLGNNVVIRQQVTIGNKGMERDVGKSP + IIEAGVDIGAGAKIIGGITIGEGSKVGANAVVTKSFPPGSILVGVPARNIALEK" + misc_feature 8966..9019 + /gene="wcwR" + /locus_tag="SPC11B_0012" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 0.0059" + misc_feature 9047..9100 + /gene="wcwR" + /locus_tag="SPC11B_0012" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 18" + misc_feature 9101..9154 + /gene="wcwR" + /locus_tag="SPC11B_0012" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 0.99" + gene 9482..10201 + /gene="wcrL" + /locus_tag="SPC11B_0013" + CDS 9482..10201 + /gene="wcrL" + /locus_tag="SPC11B_0013" + /note="member of homology group 54" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + 
/protein_id="CAI33148.1" + /db_xref="GOA:Q4K248" + /db_xref="InterPro:IPR007577" + /db_xref="UniProtKB/TrEMBL:Q4K248" + /translation="MIPKKIHYCWFGGGPLPTDVKKCIDSWRKFCPNYEIIRWDESNF + IISDQNNFVQTAYENKAWAFVSDYARLRIIYENGGIYLDTDVELIRNLDELLEHAAFF + GAHQINGLVATGLGFGSKKGTKILKELLRLYDNTDFDPCKKNELACPILNSFVFTDFG + YQPSSNIVQTEYFTIYPAEYFDPIYVGANARNLLSEKTYSIHHYSASWTPVRVRIKNK + IIRYIGRDKILLLKKILERKR" + gene 10201..11370 + /gene="wzy" + /locus_tag="SPC11B_0014" + CDS 10201..11370 + /gene="wzy" + /locus_tag="SPC11B_0014" + /note="member of homology group 68" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33149.1" + /db_xref="InterPro:IPR007016" + /db_xref="UniProtKB/TrEMBL:Q4K247" + /translation="MKISLSKVFFLQFCALYIFTILYPRGITLTYSPSADFFTLIYKF + CLYFTIAASIIYIFIKILYQRLHLASYTFFILQYYIVSIVITLLLTGTIDSGLQSVFY + PICIYLFFNEIQDRVLIIKISDIFLYCLTLLFFINILDLMMNFTNIYHITFLGHVQVI + SQFGIIAFFISSYYLMIGNRNRKIAFLLQILTVLNCLYADVFLSKVIAIFMIIYALSF + NIKRVFWKRGILISFLTFIITILLLFIDIQGYLIRYLQYFDFTFNGRYQIWRIAYQKF + LDSKIYGYGVFSFHFNLPWQDSGAKGINYAHNQLMQLAIDNGVIGIVSFFIMIFYMIF + LTRKIRNFRVASLFLFSYFCLFIVMFIESVTYYPYYFIILIFQILYERLEQVGEC" + misc_feature 10975..11169 + /gene="wzy" + /locus_tag="SPC11B_0014" + /note="HMMPfam hit to PF04932, O-Antigen Polymerase, score + 4.4e-09" + gene 11364..11864 + /gene="wcwT" + /locus_tag="SPC11B_0015" + CDS 11364..11864 + /gene="wcwT" + /locus_tag="SPC11B_0015" + /note="member of homology group 69" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI33150.1" + /db_xref="GOA:Q4K246" + /db_xref="InterPro:IPR001451" + /db_xref="InterPro:IPR011004" + /db_xref="UniProtKB/TrEMBL:Q4K246" + /translation="MLNSLIRRFNQIFYSYRVRRKAAVAKGRVYTGGKTFVTSNTYLS + ENVSFNGMSMFGEGRISIGRNFHSGINCQIITSFHDYDTGTKIPYDNKYIHKDVIIDD + NVWIGNNVIILGGSRIGEGAVIQAGSTVVGEIPPGAIAGGHPARVFKFRNMKHYEELK + RLEQFY" + misc_feature 11652..11705 + /gene="wcwT" + /locus_tag="SPC11B_0015" + /note="HMMPfam hit to PF00132, Bacterial 
transferase + hexapeptide (three rep, score 0.41" + misc_feature 11706..11759 + /gene="wcwT" + /locus_tag="SPC11B_0015" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 2.6" + gene 11874..13061 + /gene="wcwU" + /locus_tag="SPC11B_0016" + CDS 11874..13061 + /gene="wcwU" + /locus_tag="SPC11B_0016" + /note="member of homology group 70" + /codon_start=1 + /transl_table=11 + /product="putative glycerol phosphotransferase" + /protein_id="CAI33151.1" + /db_xref="GOA:Q4K264" + /db_xref="InterPro:IPR007554" + /db_xref="UniProtKB/TrEMBL:Q4K264" + /translation="MNIIRYLKRNGFRYALNVLYQYKIQKILDSIVIRFTKFKKLQNI + IVIECHTDFDNNGGAFYDYLIRNNYNKKYKIILLLKNRLVRTLPENVDYFYLKKPSLR + KSYLLSLSKFFLFDNDILRKYRKDQKHFYLTHGCFGLKNTIGKITVPDYVDFVLSPSG + NVDNIIVKQFGLTSKEQCLHTGFPCHDIFYSKPKPLVFLSDYDKKIIWAPTFRKGGGD + NRNDSTASYPLGIPLLGTLDELAHLNTYLSQRDIVLIVKLHPMQDISDLELKQFSHIK + FLTNQDLKRKNTNVYQLLMNSDALLSDYSAISYDYLHLDKPIGYVFSDLNDYKLGLSV + DNVDDYIAGDKIMFFNDLLHFIDNIYLEIDKNKEKRKELFNKIFEKQDGESCERLAQI + MEL" + misc_feature 12447..13058 + /gene="wcwU" + /locus_tag="SPC11B_0016" + /note="HMMPfam hit to PF04464, + CDP-Glycerol:Poly(glycerophosphate) gl, score 1.8e-10" + gene 13078..14481 + /gene="wzx" + /locus_tag="SPC11B_0017" + CDS 13078..14481 + /gene="wzx" + /locus_tag="SPC11B_0017" + /note="member of homology group 52" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33152.1" + /db_xref="GOA:Q4K209" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K209" + /translation="MSVGMKAALWYTVANFIQKGFVFLSTPILTRILNVNDYGTLMLY + QSWFVLFAIFATLNLSQTAYNKGLVEFENDKDNFTFSLLFLSEIITIIVAFLYFTFNI + LVKDSTGLTPGFMIFLFSDILFNISIEFYLARQRFEFKYRKAVLISISSSFFIVAIST + TILLAIKNDLFIKIVLDAIIRIIFGLYCFYLLFFSGKRQLKIEKKYIKYGLSYSLPLI + PHFLSHYILNQSDRLMINMFDGKEKLAIYSLAYSVSMIMFLFTNAINQSIMPYTFQAL + KKKDYRGIHERTKWLFIIVGGGTVLSILFAPELIVILGGNKYKESIWLVPPIAVSVYF + LFVYSMFSNISFYYKMNKLISLVSTGAALSNIILNYIFINIFGYQAAAYTTLLCYILL + 
AFSHFFLYRFLLKKEEIHEELYNMKMILIISLILLTILFLILVIYNLAFIRYAIIVII + LFLLFTKRNKIITSLKS" + misc_feature 13087..13905 + /gene="wzx" + /locus_tag="SPC11B_0017" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 2e-17" + gene 14594..14985 + /gene="gct" + /locus_tag="SPC11B_0018" + CDS join(14594..14728,14728..14985) + /gene="gct" + /locus_tag="SPC11B_0018" + /note="member of homology group 28" + /codon_start=1 + /transl_table=11 + /product="CDP-glycerol-1-phosphate biosynthetic protein + Gct" + /protein_id="CAI33153.1" + /db_xref="GOA:Q4K262" + /db_xref="InterPro:IPR004820" + /db_xref="InterPro:IPR004821" + /db_xref="InterPro:IPR006409" + /db_xref="InterPro:IPR014729" + /db_xref="UniProtKB/TrEMBL:Q4K262" + /translation="MKRVITYGTFDFLHYGHINLLKRAKQLGDYLIVVVSSDEFNLKE + KNKVCYFNFEHRKNLVEAIRYVDLVIPETSWEQKKTDIKEYHIDTFVMGDDWKGKFDY + LKEEGVEVVYLPRTKEISTTKIKEDLAD" + misc_feature join(14606..14728,14728..14973) + /gene="gct" + /locus_tag="SPC11B_0018" + /note="HMMPfam hit to PF01467, Cytidylyltransferase, score + 1.1e-29" + gene complement(order(15201..15776,15830..16498)) + /gene="tnp" + /locus_tag="SPC11B_0019" + /pseudo + CDS complement(join(15201..15776,15830..16498)) + /gene="tnp" + /locus_tag="SPC11B_0019" + /note="member of homology group 13" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1167 transposase" + /db_xref="PSEUDO:CAI33154.1" + misc_feature complement(join(15696..15776,15830..16042)) + /gene="tnp" + /locus_tag="SPC11B_0019" + /note="HMMPfam hit to PF01610, Transposase, score 3.5e-42" + /pseudo + gene 16723..>17082 + /gene="aliA" + /locus_tag="SPC11B_0020" + CDS 16723..>17082 + /gene="aliA" + /locus_tag="SPC11B_0020" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33155.1" + /db_xref="GOA:Q4K242" + /db_xref="InterPro:IPR000914" + /db_xref="UniProtKB/TrEMBL:Q4K242" + /translation="MMKSSKLFALAGVTLLAATTLAACSKSGSSAKAEKTFSYIYETD + PDNLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKD + AKWYTSEGEEYAAVKAQD" + 
misc_feature 16723..16815 + /gene="aliA" + /locus_tag="SPC11B_0020" + /note="Signal peptide predicted for SPC0479 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.629 between residues 31 and 32" + misc_feature 16969..17037 + /gene="aliA" + /locus_tag="SPC11B_0020" + /note="PS01040 Bacterial extracellular solute-binding + proteins, family 5 signature." +ORIGIN + 1 cgaccgtcgc ttcctagttg tggctaactt gtccaatgaa gagcaagact tgacagtaga + 61 aggaaaagtc aaatctgtct tgattgaaaa cactgcggct aaagaagtac ttgaaaaaca + 121 ggtcttggct ccatgggatg ctttctgtgt ggaattacta taaatatttt ttgcagaaaa + 181 atttaaaatt gaaatcatat aaaaacaagg gaggactgta taaaaggcgg aaatcctttg + 241 ttttttataa ccaaggttta taaactttca ttctcgaaat tcaattaact ttacaaattc + 301 ccactattaa ggagaaagaa gacgaacata aagaagcgta tccttagtgc aggcctgact + 361 tttgcatctg ctttgctttt agctgcttgc gaccaatcag gttcagatac aaaaacttac + 421 tcatcaacct ttagtggaaa tccaactaca tttaactatc tattagacta ttacgctgat + 481 aatatagtca attgaaacaa gagaaagaca aaagagcctc gtaaaaggta ttgcaacttg + 541 gtaatacctt tttgaggtgc tttttgatat gagcccatgt tttctcaata ggattgtact + 601 caggtgagta gggaggaaga ggtaaaagtt tatgcccaaa ctcttcgcat aaaagttcta + 661 gcttccccat tctatggaat cttgcattat ccataataat aaccgatggt gtggttaatg + 721 ttggtaagaa aaacttctga aaccaagctt caaaaaagtc gctcgtcatc gtctcttcgt + 781 aagtcattgg aacgattaac tcaccatttg ttagacctgc aaccaaagaa atcctctgat + 841 atcttcttcc agatactttg cctcttctta actgaccttt taatgagcga ccatattctc + 901 gataaaaata agtatcgaat cctgtttcat caatctaaac aggtgctagg tgctttaaac + 961 tattaaaatt cttaagaaat aaggctactt tttctgggtc ttgttcatag taggtgtggt + 1021 tctttttttc gagtgtagcc catagctttg agcgcatagt ggatggtagt tggatgacag + 1081 ccaaattcag aagctatttc agtcaaataa gcgtctggat tatcagtaag atagttttta + 1141 agtctatctc tatcaacttt tcttggtttt gttcctttta cttggtggtt tagctctcct + 1201 gttttctctt ttagctttaa ccagccataa atggtattac gtgagatttg gaaaacgtgt + 1261 gacgcttctg ttatactacc tgttcgctca caataagaga gaactttttt acgaaaatct + 1321 
attgaatatg ccataagaag attataccac attgtgtact atattatatt gaaactagaa + 1381 tagtacacat ctgcttctaa aatattgtta gaaaacgatt tgactgtcct gatcaatttg + 1441 tcatgttctt atttcatttt actatatttt tggttcgcgg gaagtctact aagatactta + 1501 aagatgcaga tagtgagaaa aaggtgtaga cattaccgta aaaaagtgat ataattgtaa + 1561 gatgttcaat gtataggtgt taatcatgag tagacgtttt aagaaatcag gttcacagaa + 1621 agtgaagcga agtgttaata tagttttgtt gactatttat ttattgttag tttgtttttt + 1681 attgttctta atctttaagt acaatatcct tgcttttaga tatcttaatc tagtggcaac + 1741 tgcctttgtt ctactagttg ccttggtagg gctactctcg attatctata aaaaagctga + 1801 aaagtttacc atttttttgt tggtgctctc tattcttgtc agctcagtgt cgctctttgc + 1861 agtacagcag tttgtgggac tgaccaatcg tttaaatgcg acttctaatt actcagaata + 1921 ttcgctcagt gtcgctgttt tagcagatag tgagattgag aatgttacgc aactgacgag + 1981 tgtgacagca ccgactggga ctgataatga aaacattcaa aaactactag ctgatatcaa + 2041 atcaagtcag aatatcgatt tgacggttaa tcaaagttcg tcttacttgg cagcttacaa + 2101 gagtttgatt gcaggagaga ctaaggccat tgtcttaaat agtgtctttg aaaatatcat + 2161 tgaatcggag tatccagatc acgcatcgaa gataaaaaag atttatacca agggattcac + 2221 taaaaaagta gaagctccta agacttctaa gaatcagtct ttcaatatct atgttagtgg + 2281 aattgatact tatggtccaa ttagttcggt gtcgcgttca gatgtcaata tcttgatgac + 2341 tgtcaatcga gataccaaga aaatcctctt gaccacaacg ccacgtgatg cttatgtacc + 2401 aatcgcagat ggtgggaata atcaaaaaga taaattaacc catgcaggta tttatggagt + 2461 tgattcgtcc atccacacct tagaaaatct atatggagtg gatatccatt actatgtccg + 2521 tttgaacttc acttctttct tgaagttgat cgatttgttg ggtggggtag atgtttataa + 2581 tgatcaggaa ttcacagctc ttgctaataa aaaacactat tctattggta atgtccattt + 2641 agattcagaa gaggcactcg cttttgttcg tgagcgctac tctctagcag atggtgatcg + 2701 tgaccgtggg cgcaatcaac aaaaggtgat tgtggctatc cttcaaaaat taacttcgac + 2761 cgaagtgctg aaaaattata gcagaatcat tgatagcttg caaaattcta tccaaacaaa + 2821 catgcccctt gagactatga taaacttggt caatgctcag ttagaaagtg gtggaacgta + 2881 caaagtaaat tcgcaagact tgaagggtag gggacggacg gatcttcctt cctatgcgat + 2941 gccagatagt aacctctata 
tgatggaaat taacgacagt agccttgcat ctgtcaaaac + 3001 tgctattcag gatgtgttgg aggggagatg aaatgattga tattcattcg cacattgtct + 3061 ttgatgtaga tgatggtccc aagtcaagag aggaaagtaa ggctctcttg acagaagcct + 3121 acaggcaggg ggtgcgaacc attgtctcta cctctcaccg tcgcaagggc atgtttgaaa + 3181 ctccagaaga gaagatagca gaaaactttc ttcaggttcg ggaaatagct aaggaagtcg + 3241 cgagtgactt ggtcattgct tatggggctg aaatttacta cacaccagat gttttggata + 3301 agctggaaaa taatcggatt ccgaccctca ataatagtcg ttatgccttg atagagttta + 3361 gtatgaacac cccttatcgc gatattcgta gtgccttgag taaaatattg atgttgggaa + 3421 ttactccagt cattgcccac atcgagcgct atgatgctct tgaaaataat gaaaaacgcg + 3481 ttcgagagct gatcgatatg ggctgttaca cgcaagtaaa tagttcacat gtcctcaaat + 3541 ccaaactttt tggagaacct gataaattca tgaaaaaaag agcgcagtat ttcttggagc + 3601 gtgatttggt tcatgtgatt gcaagtgata tgcataatgt ggacggcaga cctccttata + 3661 tggcagaagc atatgacctt gtttcccaaa aatacggaga agcgaaggct caggaccttt + 3721 ttatagacaa tcctcaaaaa attgtaatgg atcaactaat ttaggagaaa tgatgaaaga + 3781 acaaaacacg atagaaatcg atgtatttca atcacttaaa accttatgga aacacaagct + 3841 aatcatttta ttagtggcac ttgtgacagg ggcggtagcc tttgcatata gcacttttat + 3901 tgttaagcca gaatatatga gcaccacgcg tatttacgta gtcaaccgta atcaaggaga + 3961 taagccagga ctgacgaatc aggacttgca ggcaggagct tatctggtaa aagactaccg + 4021 cgaaattatc ctttcgcaag atgtattgga aaaggtagcg acaaacttga aattggatat + 4081 gccagcaaaa acgttaacta gcaaagtgca agtgactgta ccagccgaca ctcgtatcgt + 4141 ctcaatctct gtcaaggata aacaaccaga ggaagccagt cgcattgcta attctctacg + 4201 agaagttgct gcagaaaaga tcatcgctgt aacgcgagta tctgatgtaa cgacgcttga + 4261 agaagcgcga ccagctacga ctccctcttc tccaaatgtt cgacgcaaca ccttagttgg + 4321 ttttcttgga ggagccgccg taacagtaat tactgttctt ttgattgagt tgctcgatac + 4381 ccgtgtaaaa cgtcctgaag atgttgaaga tgtactgcaa atgccacttc taggagtcgt + 4441 tccagatttt gataaaatga aataggagga agttatgcca acgttagaaa tctcacaggc + 4501 gaaattagaa cctatgaaaa aggcagagga atattataat gctttgtgca cgaacctaca + 4561 gttaagtgga gatgatttga aagtattttc tatcacttct 
gtgaaagcag gagaaggaaa + 4621 aacaacgact tccatcaata tcgcttgggc ttttgcgcgt gcaggttaca aaacgctgct + 4681 gattgatgca gacatgcgta actccgtgat gtcaggtgtc tttaaaccaa gggaaaggat + 4741 tactggacta acagaatttc tatcagggac aacagacctg tcacaggggc tttgcgatac + 4801 caatattgag aatctctttg tgattcaggc tggttctgtg tcaccaaatc cgacagccct + 4861 tcttcaaagt aagaatttca gtacaatgct tggaaccttg cgtaaatatt ttgactatat + 4921 cgtcgtagac actgctccta tcggtatcgt gattgatgcg gctatcatta tgcagaaatg + 4981 tgatgcttct attttagtga cgaaggcagg tgaaacaaaa cgacgggatc ttcaaaaagc + 5041 gaaagaacag ttggaacaaa ctgggaagtc gtgtttagga gttgtgttga ataaatttga + 5101 tactttagta gagaaatacg gttcttatgg gaattatggg aattatggga attatgggaa + 5161 ttacaggaaa cagaaaaaat aggttgaggg atagagatga atgaaaaatt agcaaagctt + 5221 tcagtagtca tagcccagag ttttcttgtc attctattga ctgttctact tagcgctgtg + 5281 agagaaacag agattgtttc aacaacagct attgtacttt atatcctcca ctattttgtc + 5341 ttttatatca gtgattatgg acggaatttc tttaaaaggg gatatttgat tgaacttgtc + 5401 cagacattga aatatatcct attctttgcg ctagcgatta gtatttctaa ttttttctca + 5461 gaagatcgat ttagtatttc cagaagaggc atgatttact tcctcttatt atatgttttc + 5521 ttagtctatg tgctaaacct atttatcaag tggtattgga ggcgggctta tcccaacttt + 5581 aaaggaagta agaagttttt cctacttaca gcaacttctc atatcgaaaa ggtactggat + 5641 agactaatag aatcagatga tgttgttggg aagttggtag ccgtcagtgt tttagataaa + 5701 ccagattttc agcacgatta tttaaaggtt gtagcagagg gggagatcgt aaactttgcg + 5761 actcatgagg tggtcgatga agtctttatc aatcttccaa gtgaaaaata caatattgga + 5821 gagcttgtct ctcagtttga aacgatggga attgatgtaa cagtcaatct aaatgctttc + 5881 gattgtatct tggcacataa caagcaaatt tgtgagatgg caggattaaa cgttgtgact + 5941 ttttctacaa cattttataa gactagccat gtgattgcta agcgggttat tgatattatc + 6001 ggttccctgg taggtttgat actatgtagt ctagtcagta ttgtgctggt tcctttgatt + 6061 cgaaaggatg ggggctctgc tatttttgct cagacgcgta taggaaaaaa tggccgccat + 6121 ttcacttttt ataagtttcg ctccatgtgt gtagatgctg aggagaaaaa aagagaactc + 6181 atggaacaaa ataccatgca gggtggaatg tttaaggtgc acgatgatcc tcgtatcacg + 6241 
aaaattggtc gttttatacg gaagacgagc ttggacgagc taccacagtt ttataatgtt + 6301 ctaaagggag atatgagttt ggttggcaca cggccaccaa cagtggacga gtatgaacac + 6361 tataccccag aacaaaaacg tcggctaagt tttaaacctg gtataacagg cttatggcag + 6421 gtcagtggac gaagtgaaat caaaaatttc gatgaagttg tcaaattaga tgtggcctat + 6481 atagacgatt ggacaatctg gaaagatatt gagattttat tgaagacagt taaagttgta + 6541 ttgatgaagg atggagctaa ataggaaatg aaaatatgtt tagttggatc tagtggaggt + 6601 catctgactc atttatatct attaaaacct ttctggaaag ataaggaaag attttgggtt + 6661 acttttgata aagaggatgc aagaagtatc ttgggaaatg aaacatttta tccttgtcat + 6721 tatcctacta atcgtaattt gaaaaatctt attaaaaata cgattcttgc tttcaatatt + 6781 ttgagaaagg aacgccctga tgttatcatc tcatcagggg ctgctgtagc agttcctttc + 6841 ttttacctag gaaaactatt tggtgctaag acagtctata ttgaagtttt tgaccgtatt + 6901 gatacgccaa cattaacagg gaaattggta tatccagtga cagataagtt catagttcag + 6961 tgggatgaaa tgaaaaaagt atatccgaaa gcaatcaacc tcggagggat tttctaatga + 7021 tttttgtgac agtaggtact catgagcaac agtttaatcg acttattaaa gaggttgata + 7081 gattaaaagg tgagggactt attcaggatg aagttattat tcagactggt ttttcggatt + 7141 atgaaccagt gcactgccaa tggaaagctt tgatttctta tgatgagatg aatcaatata + 7201 tggatgaagc agatattgtc attacacatg gtggcccagc aacatttatg ggagtgattt + 7261 ctaaggggaa gagaccgatt gtagtaccta gacaagaaaa atttggcgag catgtgaatg + 7321 atcaccaaat ggaattttgc ttaaagttac taggcgaagg atacgatcta gttgtaatcg + 7381 atgaaattga taaacttaat gagaatatta aatattcaaa agttcagcaa gttagttctc + 7441 ataatagtaa gtttactaat gaactgtcag atataattga aaatatgttt atataagata + 7501 tgtgtgactg ccggtttttt gtgttactaa taattgtcat acagtcagag ctttttaaac + 7561 tatatcgtta ttaaatagtg agttttatat tttaatgatt accattcgta tttaataaga + 7621 aataatggag aagatgaatg aagattttgc atattccaac aggtggctta ttttcagatg + 7681 gaatagggac gtttatctat tcttatttag aatgcatgaa tctagataaa tgggaagtga + 7741 cagttttagc tactaatatt ccactgttag aagataaagc aaaatttgag aatttaggta + 7801 tccaggtagt agttctagag cggaaaaaaa ctgcgattat tcactatatg tgtcaattat + 7861 acaaattaat aagagctaat 
aaatatgata taattcatgt tcatggtagt agttctttaa + 7921 tgtcaatcga gctatctgtt gcaaaaattg caggggttcc agtaaggatt gcccatagtc + 7981 ataatactac ttgtgaccat agaaaattag ataaagtatt acggccagta tttcataaat + 8041 tatatacgca ggcgtgggca tgtggtgaag gagctgggaa atggcttttt accaatagag + 8101 aatatactat tattcataat gcaagaaata taaaacgtta tcaatttagt gagtccaaac + 8161 gacaacgatt tagaaaaaaa ctatctctta aagatacaac tcttgcttta ggtcatgttg + 8221 gtcgctttaa tgttcaaaaa aatcatgaat ttcttgtgtt attaatggaa aatttagtaa + 8281 tacaaggact agatgttaaa ttatttttag taggtgaagg gtcaacttta tcaaaaatta + 8341 agaatatggt ttctgaaaaa tctttagaag atagggtctt ctttttaggt catcttaatg + 8401 atatgaaatc atttgtgtct gctatggata taatgcttct cccaagcttg tacgaaggtc + 8461 tccctctggt gtcagtagaa tggcaaataa atggaataca atgtatctta tctgatacta + 8521 taacaaagga gtgtatctac actaaacaag tgacttcttt accaattagg acccctcttt + 8581 attgggaaaa agcgataaga gatttctgtc cagaagatag attgagacaa tcaattgaga + 8641 atcaaagact tgcgagagaa gctggttatg atattgaact ggaattagtt aaattagata + 8701 ctttatacaa taaattgata atgactataa aagataggac aagaaaatga aaaatgatag + 8761 gaaagctcaa ctaataatta caatttttaa atatggtaaa agacatgtag gacggtcaac + 8821 tttttatcat aagttaaatt ataaaatgta tcaaatttta aatgctatat ttgtaattgg + 8881 tattttcaat acagaattac cagcatcaca aaatattagt gataatataa tattgtttca + 8941 tccatatggg ataatagtta atggcgatgt aactttaggg aataatgttg tgataagaca + 9001 gcaggttacc attggtaata aagggatgga aagggacgtg ggaaaatctc ctattatcga + 9061 agcaggtgtt gatattggag caggtgctaa aattatagga gggataacga ttggtgaggg + 9121 ttcaaaagta ggagctaatg ctgttgtaac aaaaagcttt ccacctggtt caattttagt + 9181 aggagttcca gcgaggaata tagcattaga gaagtaattt gggatagaat gcaaataagt + 9241 gtgttaatac actaagatat tggcatcagc gacaatgctg tttgaatatt ttagtgaatc + 9301 aaaaaagaga gaaaaatgat aaaatttaac ttagtaagca ttatatcata tgttcaataa + 9361 gaactgtcga attaatttaa taaatttagt gataaatacg tactagtgag aatttgtttt + 9421 attgtaagag agttcctata attatagata attactaaat agtcagggaa aggaaaaact + 9481 aatgattcca aaaaaaatac attattgctg gtttggtgga 
ggtccattac ctactgatgt + 9541 taaaaaatgt attgacagct ggagaaaatt ttgtccgaac tatgagatta ttagatggga + 9601 tgaaagcaat ttcattatta gtgatcaaaa caattttgtt cagactgcat atgaaaacaa + 9661 agcttgggca tttgttagcg actatgcacg gttaagaatc atatatgaaa atggtggcat + 9721 ctatttggat acagatgttg aattgattag aaatcttgat gaattgcttg agcatgcagc + 9781 tttttttggt gctcaccaga taaatggatt agtagctact ggtctaggtt ttggttcgaa + 9841 aaaggggacg aagatattaa aagaattatt aagactgtat gataatacag attttgatcc + 9901 gtgtaaaaag aatgagttgg catgtcccat acttaattcg tttgtcttta ctgattttgg + 9961 ctatcagcct tcttctaaca ttgttcaaac ggagtatttt actatctatc ctgctgagta + 10021 ttttgatcct atatatgttg gagccaatgc tagaaattta ttatcggaga aaacatattc + 10081 aattcatcat tacagtgcct cttggactcc tgtgagagtt agaataaaaa ataagatcat + 10141 tagatatatt ggtagggata agattctact attaaagaaa attctagaaa ggaaaagata + 10201 atgaaaatat cgctttctaa agtatttttt ttacaatttt gtgcacttta tatctttaca + 10261 attttatatc ctagaggtat tacattaact tattctccat ctgcagattt ttttactctg + 10321 atttataaat tttgtttata tttcaccatc gcagccagta taatatatat atttataaaa + 10381 atattatatc agagactaca cctagcatca tatacttttt ttatattgca gtattatatt + 10441 gtttctatag ttattacatt gcttttaaca ggcacaatag attcgggttt acaatcagtc + 10501 ttttatccga tctgtatata tttatttttt aatgagattc aagatagggt attgattata + 10561 aaaattagtg atatattttt atactgttta actcttttat tctttataaa tattttggat + 10621 cttatgatga attttaccaa tatttatcat ataacctttt tggggcatgt ccaagtgata + 10681 tcacaatttg gaattatagc ttttttcatt tcttcctatt acttaatgat aggaaataga + 10741 aatcgcaaga tagccttcct attacaaatt ttgactgtgc tcaattgtct atatgctgat + 10801 gtttttttat caaaggttat agcaatcttc atgattattt acgcattatc atttaacata + 10861 aagagagtat tttggaagag agggattcta atttctttct tgacatttat tataactatt + 10921 ctgcttcttt tcattgatat tcaaggttat ttgataagat atttacaata ttttgatttt + 10981 acttttaatg gccgctatca aatttggcgt attgcttatc aaaaattttt agattcaaaa + 11041 atatatggct atggagtttt tagctttcat ttcaatcttc cgtggcaaga ttctggtgct + 11101 aaggggatca actatgctca taatcagctt atgcaattag 
caatagataa tggagtaatt + 11161 ggtatcgtct ctttctttat tatgattttt tatatgatat ttttaacaag gaagattaga + 11221 aattttagag tagcttcatt gtttttattt tcgtactttt gtttgtttat agtaatgttt + 11281 attgaaagtg taacctatta cccgtattac tttattatat tgatttttca aatattatat + 11341 gaaaggttag agcaggtggg agaatgctaa atagtttaat tagaagattt aatcagattt + 11401 tctatagtta tcgggttaga agaaaagctg cagttgctaa aggaagagtg tacacgggtg + 11461 gaaaaacatt tgttacttcg aatacctatc tttctgagaa tgtttctttt aatggcatgt + 11521 caatgtttgg agaaggtaga atttcgatag gaagaaattt ccattctggt ataaattgcc + 11581 aaattataac gtcatttcat gactatgata caggaactaa gataccatac gacaataagt + 11641 acatacataa agatgtaatt attgatgata atgtgtggat tgggaataat gttattatcc + 11701 tcggcggatc tcgtatcgga gaaggagcag ttattcaagc agggagtaca gttgtagggg + 11761 aaatacctcc aggagcaatc gcaggtggtc atccagcaag agtatttaaa tttaggaata + 11821 tgaagcatta tgaagaatta aagagactag aacaatttta ttaggagcta tatatgaata + 11881 ttataagata cttgaaaaga aatggatttc gatatgcatt aaatgtcctc tatcaatata + 11941 aaattcaaaa gattttagat tcaattgtta ttagatttac taagtttaaa aagttacaaa + 12001 atattattgt cattgaatgt cacacagact ttgataataa tggaggagct ttttatgatt + 12061 atttgataag aaataattat aataagaaat ataaaattat tttattatta aaaaatcgac + 12121 tagtacgtac tcttcctgaa aatgtagatt atttttactt gaaaaaacct agtttgagga + 12181 agtcatattt gttatcatta agtaaatttt ttcttttcga taatgatata cttcgtaaat + 12241 atagaaaaga tcaaaaacac ttttatttaa cacatggatg ctttggttta aaaaatacaa + 12301 taggtaaaat aacagttccg gattatgttg attttgttct atctccctcg ggcaatgtag + 12361 ataatattat agttaagcag tttggattaa catctaaaga gcaatgtctt cacactggat + 12421 ttccgtgtca tgatatcttt tattcaaaac caaaacctct agtattttta tctgattatg + 12481 ataaaaaaat tatctgggca ccaactttta gaaagggtgg aggcgataat agaaatgata + 12541 gtacagctag ctatccttta ggtattccat tacttggaac actagatgaa cttgcacacc + 12601 taaacacata tctaagccaa cgggatattg tcctgattgt aaagttacat ccaatgcaag + 12661 atatttcaga tttggagttg aaacaattta gtcatattaa gtttctgaca aatcaagatt + 12721 tgaaacgtaa aaatacaaat gtgtatcaat tgctgatgaa 
ttcagatgct ttactcagtg + 12781 actattctgc aatctcgtat gattatttac accttgataa accaataggg tatgtttttt + 12841 cggatctaaa tgattataag ttggggcttt cagttgataa tgtagatgat tacatagcag + 12901 gtgataagat aatgtttttt aacgacttgc tgcactttat tgataacatt tatctagaaa + 12961 ttgataaaaa taaagaaaaa cgcaaggaat tatttaataa aatatttgaa aaacaggatg + 13021 gagaatcgtg tgaaagattg gcccaaatta tggaattata aaagacgtta cgaagaaatg + 13081 tctgtcggga tgaaagcggc actctggtat actgttgcaa attttattca aaagggtttt + 13141 gtatttcttt caactccgat tttaaccaga atacttaatg ttaatgatta cggtacattg + 13201 atgctttacc aatcatggtt tgtactattt gctatttttg ctaccttgaa tctttctcaa + 13261 acagcttata ataagggatt agtagaattt gagaatgata aagataattt tacattttct + 13321 ttgttgtttt tgtctgagat cattacgata attgttgctt ttttgtattt tacttttaat + 13381 atactggtta aagatagtac tggattaact cccggtttca tgatattttt attcagtgat + 13441 attttattta atattagtat agaattttat ttggcacgtc agagatttga attcaaatat + 13501 agaaaagcag ttctaatttc aatttcttca agttttttta ttgtagctat tagtacaact + 13561 atcttattag cgattaagaa tgatttattc attaaaattg tattagatgc tattatccga + 13621 attatctttg gtttatattg tttttatctc ttgttttttt cagggaaaag gcaacttaag + 13681 atagaaaaaa aatatattaa atatggtttg agttattcat tacctttgat accgcatttc + 13741 ttatcgcact atattttgaa tcagtctgac cgtttgatga ttaacatgtt tgatggtaag + 13801 gagaaattag ctatatatag tctagcttat tctgtatcaa tgattatgtt tttgtttact + 13861 aatgcaatta atcaatcaat aatgccgtat acatttcaag ctttgaaaaa aaaggattat + 13921 cgtgggatac atgagagaac caaatggctt tttataatag ttgggggggg cacagttctt + 13981 tcaattctat ttgcaccaga actaattgtt attttaggcg gcaataaata taaggagtca + 14041 atttggctag tacctccaat tgctgtctcg gtttatttcc tttttgtata ttctatgttt + 14101 agtaatatca gtttttatta taagatgaat aagctgattt cgttagtttc cacaggtgca + 14161 gctctttcaa atattatttt aaattatatt tttattaata tatttgggta tcaagctgca + 14221 gcttacacta cattattatg ctatatattg ttagcatttt ctcatttttt cttatataga + 14281 tttttattaa aaaaagagga aattcatgag gaactttata atatgaagat gattttaata + 14341 atatctttaa tattattaac aatattattt ttgatacttg 
ttatttataa cttagccttt + 14401 ataaggtatg caattattgt aattatttta tttcttttgt ttacaaagag aaataaaata + 14461 attacatccc taaaaagttg atattgaaaa tttagattca aattaagaat atagtggata + 14521 tcaaaccagt aataataatg aataattgtt tttatgtaat ttaggattaa taaaaaattg + 14581 aaaggaaata tcaatgaaaa gagtaattac ttatggaacc tttgattttc ttcattatgg + 14641 acatatcaat ttgctaaaga gagcgaagca attaggagat tatctcattg ttgtagtttc + 14701 aagtgatgag ttcaatttga aagaaaaaat aaagtttgtt actttaattt tgaacataga + 14761 aaaaatttag ttgaagcgat aagatatgtt gatttggtga ttcctgaaac aagctgggaa + 14821 cagaaaaaaa cagatattaa agaatatcac attgatacat ttgttatggg ggatgattgg + 14881 aaaggaaaat ttgattattt aaaagaagaa ggagtggaag tagtttattt accaagaact + 14941 aaagaaatat ctacaactaa aattaaagaa gatttagcag attagatttt ttacaaaaat + 15001 attttgagat cagataataa atttgttttc ataattatta atgtctattg ttttattacc + 15061 acagaagtat attaaattaa aataaattat tttagattta taatgtggct ccttgtcaac + 15121 gaacatctgg agaggacaat cactgtcttc tcctttttat ttttttggct ctttgtcaac + 15181 tgtagtgggt tgaaaaaaag ctaagctcga gaaaggacaa attttgtcct ttcttttttg + 15241 atattcagag caataaaaat ccgttttttg aagttttcaa agtttcgaaa accaaaggca + 15301 ttgcgcttga taagtttgat gagattattg gtcgcttcca gtttggcgtt ggaataaggt + 15361 aattgaaggg cgttgataat cttttcttta tctttgagga aggttttaaa gacagtctga + 15421 aaaataggat gaacctgctt aagattgtcc tcaataagtc cgaaaaattt ctctggttcc + 15481 ttattctgga aatgaaaaag caagagctga tagtggtgtt tcaagtcttc cgaatagctc + 15541 aaaagcttgt ttaaaatctc tttattggtt aagtgcatac gaaaagtagg acgataaaaa + 15601 cgtttatcac tcagtttacg gctatcctgt tgaatgagtt tccagtagcg cttgatagcc + 15661 ttgtattcat gggattttcg atgaaactga ttcatgattt gaacacgcac acgactcata + 15721 gcacggctaa gatgttgcac aatgtgaaag cgatcaagaa cgattttagc attcgggagt + 15781 gaaacagtct gggagactgt ttcagcctga gcctagaaat ttgaaagcga agctgtttag + 15841 ctaagtcata gtaagggcta aacatatcca tagtaataat tttgacgcga cataggacaa + 15901 ctctatcgta gcgaagaaag tgatttcgaa tgatagcttg tgttcttccc tcaagaacag + 15961 tgatgatatt gagattgtta aaatcttgcg caatgaagct 
catctttccc tttgtaaaag + 16021 catactcatc ccaagacata atctcaggaa gacaagaaaa atcaagttta aagtgaaaat + 16081 cattgagctt acgaataaca gttgaagttg agatggaaag ctgatgggca atatcagtca + 16141 tagaaatctt ttcaattaac ttttgagcaa tcttttggtt gatgatacga gggatttggt + 16201 gattcttctt gacgatagaa gtttcagcga ccatcatttt tgaacagtga tagcacttga + 16261 aacgacactt tctaaggaga attctagtag gcataccagt cgtttcaaga taaggaattt + 16321 tagaaggttt ttgaaagtca tatttcttca attggtttcc gcactcaggg caagatgggg + 16381 cgtcgtagtc cagtttggcg atgatttcct tgtgtgtatc cttattgatg atgtctaaaa + 16441 tctggatatt agggtcttta atgtctagta attttgtgat aaaatgtaat tgttccatat + 16501 gattctttct aatgagttgt tttgtcgctt ttcattatag gtcatatggg actttttttc + 16561 tacacaaaaa taggctccat aatatctata gtggatttac ccactacaaa tattatagag + 16621 tctttttttc agaatttacc aaattaatta aaaaattcag aaaattatat tgacatctct + 16681 ctgaaaagag tctataatag agagaaagtt ttaaaggaga agatgatgaa aagttcaaaa + 16741 ctatttgccc ttgcgggtgt aaccttattg gcggcgacta ctttagctgc atgttctaaa + 16801 tcaggttcga gcgctaaagc tgagaagaca ttctcataca tttatgaaac ggatcctgac + 16861 aacctaaact acttgacaac tgctaaggct gcgacagcaa atattaccag taacgtggtt + 16921 gatggtttgc tagaaaatga tcgctacggg aactttgtgc cgtctatggc tgaggattgg + 16981 tctgtatcca aggatggatt gacttacact tatactatcc gtaaggatgc aaaatggtat + 17041 acttctgaag gtgaagaata cgcggcagtc aaagctcaag ac +// + diff --git a/public/res/serotype_genbank/serotype_11C.gb b/public/res/serotype_genbank/serotype_11C.gb new file mode 100644 index 0000000..80d213b --- /dev/null +++ b/public/res/serotype_genbank/serotype_11C.gb @@ -0,0 +1,877 @@ +LOCUS CR931655 18532 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain Eddy nr. 53 (serotype 11c). +ACCESSION CR931655 +VERSION CR931655.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. 
+REFERENCE 1 (bases 1 to 18532) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 18532) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..18532 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="Eddy nr. 
53" + /db_xref="taxon:1313" + gene <1..166 + /gene="dexB" + /locus_tag="SPC11C_0001" + CDS <1..166 + /gene="dexB" + /locus_tag="SPC11C_0001" + /codon_start=2 + /transl_table=11 + /protein_id="CAI33156.1" + /db_xref="GOA:Q4K241" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K241" + /translation="DRRFLVVANLSNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVP + WDAFCVEMTD" + gene complement(297..1706) + /gene="tnp" + /locus_tag="SPC11C_0002" + CDS complement(297..1706) + /gene="tnp" + /locus_tag="SPC11C_0002" + /note="member of homology group 17" + /codon_start=1 + /transl_table=11 + /product="putative IS1202 transposase" + /protein_id="CAI33157.1" + /db_xref="GOA:Q4K259" + /db_xref="InterPro:IPR001584" + /db_xref="InterPro:IPR009057" + /db_xref="InterPro:IPR011991" + /db_xref="InterPro:IPR012337" + /db_xref="UniProtKB/TrEMBL:Q4K259" + /translation="MNETKKYLVIKAIAQGKKTKKRACVELNLSERQINRLLLAYQQK + GKEAFRHRNRNRKPKHAIPDEIKERILKKYLSYETYKPNVRHFCELLAEEEGIQLSDT + TVRKILYKKNILSPKSHRKTKKRVRKQAKLNPKQPLDNPILPTAEKFLEDPKKVHPSR + PRKKFAGELIQMDASPHAWFGAETSNLHLAIDDASGNILGSYFDKQETLNAYYHVLEQ + ILANHGIPLQIKTDKRTVFTYQASNSKKMEDDTYTQFGYACHQLGILLETTSIPQAKG + RVERLNQTLQSRLPIELERNNIHTLEEANTFLPSYIQTFNEQFGNKTKLSVFEEAPKP + SERNLILARLSERVVDSGHHIRFQNRCYIPTEQGKEVYFIRKTKALVIKAFDGDIYLN + IADKIYHTKELLNHELYSKNFEQEPEQKKKDASISLHKPIRGNSHLSNNIFIKIKRIM + KSLLVRSLILLNYKYSKMK" + misc_feature complement(720..1223) + /gene="tnp" + /locus_tag="SPC11C_0002" + /note="HMMPfam hit to PF00665, Integrase core domain, + score 6.3e-22" + misc_feature complement(1590..1655) + /gene="tnp" + /locus_tag="SPC11C_0002" + /note="Predicted helix-turn-helix motif with score + 1142.000, SD 3.08 at aa 18-39, sequence + KTKKRACVELNLSERQINRLLL" + gene 2052..3005 + /gene="tnp" + /locus_tag="SPC11C_0003" + CDS 2052..3005 + /gene="tnp" + /locus_tag="SPC11C_0003" + /note="member of homology group 39" + /codon_start=1 + /transl_table=11 + /product="putative IS1239 transposase" + /protein_id="CAI33158.1" + /db_xref="GOA:Q4K0X9" + 
/db_xref="InterPro:IPR001584" + /db_xref="InterPro:IPR012337" + /db_xref="UniProtKB/TrEMBL:Q4K0X9" + /translation="MQEHYTPKGKHLTIDNRRLIERWKNENKSNREIAGLLGKAPQTI + HNEVKRGTTLQQVRKGLYKKVYSADYAQTVYQFNRKRSVKKLILTKEIREKILHYHKQ + KFSPEMMVNKKQVKVGISTIYYWFHNGHLGLTKADMLYPRKRKGVKKQASPNFKPAGK + SIEERPDVINLRLENGHYEIDTVLLTKIKNYCLLVLTDRRSRHQIIRLIPNKTAESVN + QALTLLLGEHRILSITADNGSEFKRLSEVFPEEHIYYAHAYSSWERGSNENHNRLIRR + WLPKGTKKTTPKEVAFIENWINNYPKKCLDYKSPSEFLLGG" + misc_feature 2133..2198 + /gene="tnp" + /locus_tag="SPC11C_0003" + /note="Predicted helix-turn-helix motif with score + 1087.000, SD 2.89 at aa 28-49, sequence + KSNREIAGLLGKAPQTIHNEVK" + misc_feature 2559..2996 + /gene="tnp" + /locus_tag="SPC11C_0003" + /note="HMMPfam hit to PF00665, Integrase core domain, + score 6.6e-23" + gene 3128..4573 + /gene="wzg" + /locus_tag="SPC11C_0004" + CDS 3128..4573 + /gene="wzg" + /locus_tag="SPC11C_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33159.1" + /db_xref="GOA:Q4K257" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K257" + /translation="MSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVATAFVLLVALIGLLSIIYKKAEKFTIFLLVLSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSLSVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNIDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDHASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDIHYYVRLNFTSFLKLIDLLGGVDVYNDQ + EFTALANKKHYSIGNVHLDSEEALAFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EVLKNYSRIIDSLQNSIQTNMPLETMINLVNAQLESGGTYKVNSQDLKGRGRTDLPSY + AMPDSNLYMMEINDSSLASVKTAIQDVLEGR" + misc_feature 3128..3244 + /gene="wzg" + /locus_tag="SPC11C_0004" + /note="Signal peptide predicted for SPC0483 by SignalP 2.0 + HMM (Signal peptide probability 0.994) with cleavage site + probability 0.469 between residues 39 and 40" + misc_feature 3332..3679 + /gene="wzg" + /locus_tag="SPC11C_0004" 
+ /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 1.2e-63" + misc_feature 3857..4300 + /gene="wzg" + /locus_tag="SPC11C_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 8e-65" + gene 4575..5306 + /gene="wzh" + /locus_tag="SPC11C_0005" + CDS 4575..5306 + /gene="wzh" + /locus_tag="SPC11C_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33160.1" + /db_xref="GOA:Q4K256" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K256" + /translation="MIDIHSHIVFDVDDGPKSREESKALLTEAYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLENNRIPTLNNS + RYALIEFSMNTPYRDIRSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKSKLFGEPDKFMKKRAQYFLERDLVHVIASDMHNVDGRPPYMAEAYDLVS + QKYGEAKAQDLFIDNPQKIVMDQLI" + misc_feature 4578..5186 + /gene="wzh" + /locus_tag="SPC11C_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 1e-38" + gene 5312..6007 + /gene="wzd" + /locus_tag="SPC11C_0006" + CDS 5312..6007 + /gene="wzd" + /locus_tag="SPC11C_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33161.1" + /db_xref="GOA:Q4K255" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K255" + /translation="MMKEQNTIEIDVFQSLKTLWKHKLIILLVALVTGAVAFAYSTFI + VKPEYMSTTRIYVVNRNQGDKPGLTNQDLQAGAYLVKDYREIILSQDVLEKVATNLKL + DMPAKTLTSKVQVTVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIIAVTRVSDV + TTLEEARPATTPSSPNVRRNTLVGFLGGAAVTVITVLLIELLDTRVKRPEDVEDVLQM + PLLGVVPDFDKMK" + misc_feature 5333..5749 + /gene="wzd" + /locus_tag="SPC11C_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 3.3e-51" + misc_feature 5855..5932 + /gene="wzd" + /locus_tag="SPC11C_0006" + /note="PS00217 Sugar transport proteins signature 2." 
+ gene 6017..6706 + /gene="wze" + /locus_tag="SPC11C_0007" + CDS 6017..6706 + /gene="wze" + /locus_tag="SPC11C_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33162.1" + /db_xref="GOA:Q4K254" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K254" + /translation="MPTLEISQAKLEPVKKAEEYYNALCTNLQLSGDDLKVFSITSVK + AGEGKTTTSINIAWAFARAGYKTLLIDADMRNSVMSGVFKPRERITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLGTLRKYFDYIVVDTAPIGIVI + DAAIIMQKCDASILVTKAGETKRRDLQKAKEQLEQTGKSCLGVVLNKFDTSVEKYGSY + GNYGNYRKQKK" + gene 6721..8088 + /gene="wchA" + /locus_tag="SPC11C_0008" + CDS 6721..8088 + /gene="wchA" + /locus_tag="SPC11C_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI33163.1" + /db_xref="GOA:Q4K253" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K253" + /translation="MNEKLAKLSVVIAQSFLVILLTVLLSAVRETEIVSTTAIVLYIL + HYFVFYISDYGRNFFKRGYLIELVQTLKYILFFALAISISNFFSEDRFSISRRGMIYF + LLLYVFLVYVLNLFIKWYWRRAYPNFKGSKKFFLLTATSHIEKVLDRLIESDDVVGKL + VAVSVLDKPDFQHDYLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + IDVTVNLNAFDCILAHNKQICEMAGLNVVTFSTTFYKTSHVIAKRVIDIIGSLVGLIL + CSLVSIVLVPLIRKDGGSAIFAQTRIGKNGRHFTFYKFRSMCVDAEEKKRELMEQNTM + QGGMFKVHDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVLM + KDGAK" + misc_feature 6721..6807 + /gene="wchA" + /locus_tag="SPC11C_0008" + /note="Signal peptide predicted for SPC0487 by SignalP 2.0 + HMM (Signal peptide probability 0.901) with cleavage site + probability 0.304 between residues 29 and 30" + misc_feature 7504..8085 + /gene="wchA" + /locus_tag="SPC11C_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 2.8e-156" + gene 
8092..8541 + /gene="wchJ" + /locus_tag="SPC11C_0009" + CDS 8092..8541 + /gene="wchJ" + /locus_tag="SPC11C_0009" + /note="member of homology group 26" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase enhancer" + /protein_id="CAI33164.1" + /db_xref="GOA:Q4K252" + /db_xref="InterPro:IPR013969" + /db_xref="UniProtKB/TrEMBL:Q4K252" + /translation="MKICLVGSSGGHLTHLYLLKPFWKDKERFWVTFDKEDARSILGN + ETFYPCHYPTNRNLKNLIKNTILAFNILRKERPDVIISSGAAVAVPFFYLGKLFGAKT + VYIEVFDRIDTPTLTGKLVYPVTDKFIVQWDEMKKVYPKAINLGGIF" + gene 8541..9020 + /gene="wchK" + /locus_tag="SPC11C_0010" + CDS 8541..9020 + /gene="wchK" + /locus_tag="SPC11C_0010" + /note="member of homology group 27" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33165.1" + /db_xref="GOA:Q4K251" + /db_xref="InterPro:IPR007235" + /db_xref="UniProtKB/TrEMBL:Q4K251" + /translation="MIFVTVGTHEQQFNRLIKEVDRLKGEGLIQDEVIIQTGFSDYEP + VHCQWKALISYDEMNQYMDEADIVITHGGPATFMGVISKGKRPIVVPRQEKFGEHVND + HQMEFCLKLLGEGYDLVVIDEIDKLNENIKYSKVQQVSSHNSKFTNELSDIIENMFI" + misc_feature 8541..9011 + /gene="wchK" + /locus_tag="SPC11C_0010" + /note="HMMPfam hit to PF04101, Glycosyltransferase family, + score 1.1e-50" + gene 9162..10274 + /gene="wcyK" + /locus_tag="SPC11C_0011" + CDS 9162..10274 + /gene="wcyK" + /locus_tag="SPC11C_0011" + /note="member of homology group 116" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33166.1" + /db_xref="GOA:Q4K250" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K250" + /translation="MKILHIPTGGLFSDGIGTFIYSYLECMNLDKWEVTVLATNIPLL + EDKAKFENLGIQVVVLERKKTAIIHYMCQLYKLIRANKYDIIHVHGSSSLMSIELSVA + KIAGVPVRIAHSHNTTCDHRKLDKVLRPVFHKLYTQAWACGEGAGKWLFTNREYTIIH + NARNIKRYQFSESKRQRFRKKLSLKDTTLALGHVGRFNVQKNHEFLVLLMENLVIQGL + DVKLFLVGEGSTLSKIKNMVSEKSLEDRVFFLGHLNDMKSFVSAMDIMLLPSLYEGLP + LVSVEWQINGIQCILSDTITKECIYTKQVTSLPIRTPLYWEKAIRDFCPEDRLRQSIE + NQRLAREAGYDIELELVKLDTLYNKLIMTIKDRTRK" + misc_feature 
9684..10181 + /gene="wcyK" + /locus_tag="SPC11C_0011" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 9.1e-19" + gene 10271..10741 + /gene="wcwR" + /locus_tag="SPC11C_0012" + CDS 10271..10741 + /gene="wcwR" + /locus_tag="SPC11C_0012" + /note="member of homology group 147" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI33167.1" + /db_xref="GOA:Q4K249" + /db_xref="InterPro:IPR001451" + /db_xref="InterPro:IPR005881" + /db_xref="InterPro:IPR011004" + /db_xref="UniProtKB/TrEMBL:Q4K249" + /translation="MKNDRKAQLIITIFKYGKRHVGRSTFYHKLNYKMYQILNAIFVI + GIFNTELPASQNISDNIILFHPYGIIVNGDVTLGNNVVIRQQVTIGNKGMERDVGKSP + IIEAGVDIGAGAKIIGGITIGEGSKVGANAVVTKSFPPGSILVGVPARNIALEK" + misc_feature 10490..10543 + /gene="wcwR" + /locus_tag="SPC11C_0012" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 0.0059" + misc_feature 10571..10624 + /gene="wcwR" + /locus_tag="SPC11C_0012" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 18" + misc_feature 10625..10678 + /gene="wcwR" + /locus_tag="SPC11C_0012" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 0.99" + gene 11006..11725 + /gene="wcrL" + /locus_tag="SPC11C_0013" + CDS 11006..11725 + /gene="wcrL" + /locus_tag="SPC11C_0013" + /note="member of homology group 54" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33168.1" + /db_xref="GOA:Q4K248" + /db_xref="InterPro:IPR007577" + /db_xref="UniProtKB/TrEMBL:Q4K248" + /translation="MIPKKIHYCWFGGGPLPTDVKKCIDSWRKFCPNYEIIRWDESNF + IISDQNNFVQTAYENKAWAFVSDYARLRIIYENGGIYLDTDVELIRNLDELLEHAAFF + GAHQINGLVATGLGFGSKKGTKILKELLRLYDNTDFDPCKKNELACPILNSFVFTDFG + YQPSSNIVQTEYFTIYPAEYFDPIYVGANARNLLSEKTYSIHHYSASWTPVRVRIKNK + IIRYIGRDKILLLKKILERKR" + gene 11725..12894 + /gene="wzy" + /locus_tag="SPC11C_0014" + CDS 11725..12894 + /gene="wzy" + /locus_tag="SPC11C_0014" + /note="member of 
homology group 68" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33169.1" + /db_xref="InterPro:IPR007016" + /db_xref="UniProtKB/TrEMBL:Q4K247" + /translation="MKISLSKVFFLQFCALYIFTILYPRGITLTYSPSADFFTLIYKF + CLYFTIAASIIYIFIKILYQRLHLASYTFFILQYYIVSIVITLLLTGTIDSGLQSVFY + PICIYLFFNEIQDRVLIIKISDIFLYCLTLLFFINILDLMMNFTNIYHITFLGHVQVI + SQFGIIAFFISSYYLMIGNRNRKIAFLLQILTVLNCLYADVFLSKVIAIFMIIYALSF + NIKRVFWKRGILISFLTFIITILLLFIDIQGYLIRYLQYFDFTFNGRYQIWRIAYQKF + LDSKIYGYGVFSFHFNLPWQDSGAKGINYAHNQLMQLAIDNGVIGIVSFFIMIFYMIF + LTRKIRNFRVASLFLFSYFCLFIVMFIESVTYYPYYFIILIFQILYERLEQVGEC" + misc_feature 12499..12693 + /gene="wzy" + /locus_tag="SPC11C_0014" + /note="HMMPfam hit to PF04932, O-Antigen Polymerase, score + 4.4e-09" + gene 12888..13388 + /gene="wcwT" + /locus_tag="SPC11C_0015" + CDS 12888..13388 + /gene="wcwT" + /locus_tag="SPC11C_0015" + /note="member of homology group 69" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI33170.1" + /db_xref="GOA:Q4K246" + /db_xref="InterPro:IPR001451" + /db_xref="InterPro:IPR011004" + /db_xref="UniProtKB/TrEMBL:Q4K246" + /translation="MLNSLIRRFNQIFYSYRVRRKAAVAKGRVYTGGKTFVTSNTYLS + ENVSFNGMSMFGEGRISIGRNFHSGINCQIITSFHDYDTGTKIPYDNKYIHKDVIIDD + NVWIGNNVIILGGSRIGEGAVIQAGSTVVGEIPPGAIAGGHPARVFKFRNMKHYEELK + RLEQFY" + misc_feature 13176..13229 + /gene="wcwT" + /locus_tag="SPC11C_0015" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 0.41" + misc_feature 13230..13283 + /gene="wcwT" + /locus_tag="SPC11C_0015" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 2.6" + gene 13398..14585 + /gene="wcwU" + /locus_tag="SPC11C_0016" + CDS 13398..14585 + /gene="wcwU" + /locus_tag="SPC11C_0016" + /note="member of homology group 70" + /codon_start=1 + /transl_table=11 + /product="putative glycerol phosphotransferase" + /protein_id="CAI33171.1" + /db_xref="GOA:Q4K245" + 
/db_xref="InterPro:IPR007554" + /db_xref="UniProtKB/TrEMBL:Q4K245" + /translation="MNIIRYLKRNGFRYALNVLYQYKIQKILDSIVIRFTKFKKLQNI + IVIECHTDFDNNGGAFYDYLIRNNYNKKYKIILLLKNRLVRTLPENVDYFYLKKPSLR + KSYLLSLSKFFLFDNDILRKYRKDQKHFYLTHGCFPLKNTIGKITVPNYVDFVLSPSG + NVDNIIVKQFGLTSKEQCLHTGFPCHDIFYSKPEPLVFLSDYDKKIIWAPTFRKGGGY + NRNDSTASYPLGIPLLETLDELANLNIYLSQRDIVLIVKLHPMQDISDLELKQFSHIK + FLTNQDLNRKNTNLYQLLMNSDALLSDYSAISYDYLHLDKPIGYVFSDLNDYKLGLSV + DNVDDYIAGDKILSFENLLHFIDNIYLEIDKNKEKRKELFNKIFEKQDGESCERLAQI + MEL" + misc_feature 13971..14582 + /gene="wcwU" + /locus_tag="SPC11C_0016" + /note="HMMPfam hit to PF04464, + CDP-Glycerol:Poly(glycerophosphate) gl, score 6.1e-12" + gene 14602..16005 + /gene="wzx" + /locus_tag="SPC11C_0017" + CDS 14602..16005 + /gene="wzx" + /locus_tag="SPC11C_0017" + /note="member of homology group 52" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33172.1" + /db_xref="GOA:Q4K244" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K244" + /translation="MSVGMKAALWYTVANFIQKGFVFLSTPILTRILNVNDYGTLMLY + QSWFVLFAIFATLNLSQAAYNKGLVEFENDKDNFTFSLLFLSKIITIIVAFLYFTFNI + LVKDSTGLTPSFMIFLFSDILFNISIEFYLARQRFEFKYRKAILISTSSSFFIVAIST + TILLAIKNDLFIKIVLDAIIRIIFGLYCFYLLFFSGRRQLKIEKKYIKYGFSYSLPLM + PHFLSHYILNQSDRLMINMFDGREKLAIYSLAYSVSMIMFLFTSAINQSIMPYTFQAL + KKKDYCGIHGSTKWLFVVVGGITALSILFAPELIVILGGNKYKESIWLVPPIAISVYF + LFVYSMFSNISFYYKMNKLISLVSIGVALSNIILNYIFINIFGYQAAAYTTLLCYILL + AFSHFFLYRFLLKKEEIHEELYNMKMILIISLILLIILFLILVIYNLAIIRYAIIAIV + LFLLFTKRNKIITSLKS" + misc_feature 14611..15429 + /gene="wzx" + /locus_tag="SPC11C_0017" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 2.4e-19" + gene 16119..16511 + /gene="gct" + /locus_tag="SPC11C_0018" + CDS 16119..16511 + /gene="gct" + /locus_tag="SPC11C_0018" + /note="member of homology group 28" + /codon_start=1 + /transl_table=11 + /product="CDP-glycerol-1-phosphate biosynthetic protein + Gct" + /protein_id="CAI33173.1" + /db_xref="GOA:Q4K243" + 
/db_xref="InterPro:IPR004820" + /db_xref="InterPro:IPR004821" + /db_xref="InterPro:IPR006409" + /db_xref="InterPro:IPR014729" + /db_xref="UniProtKB/TrEMBL:Q4K243" + /translation="MKRVITYGTFDLLHYGHINLLKRAKQLGDYLIVVVSSDEFNLKE + KNKVCYFNFEHRKNLVEAIRYVDLVIPETSWEQKKTDIKEYRIDTFVMGDDWKGKFDY + LKEEGVEVVYLPRTKEISTTKIKEDLAD" + misc_feature 16131..16499 + /gene="gct" + /locus_tag="SPC11C_0018" + /note="HMMPfam hit to PF01467, Cytidylyltransferase, score + 3.4e-29" + gene complement(order(16727..17311,17365..17958)) + /gene="tnp" + /locus_tag="SPC11C_0019" + /pseudo + CDS complement(join(16727..17311,17365..17958)) + /gene="tnp" + /locus_tag="SPC11C_0019" + /note="member of homology group 13" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1167 transposase" + misc_feature complement(join(17231..17311,17365..17577)) + /gene="tnp" + /locus_tag="SPC11C_0019" + /note="HMMPfam hit to PF01610, Transposase, score 3.5e-42" + /pseudo + gene 18173..>18532 + /gene="aliA" + /locus_tag="SPC11C_0020" + CDS 18173..>18532 + /gene="aliA" + /locus_tag="SPC11C_0020" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33175.1" + /db_xref="GOA:Q4K242" + /db_xref="InterPro:IPR000914" + /db_xref="UniProtKB/TrEMBL:Q4K242" + /translation="MMKSSKLFALAGVTLLAATTLAACSKSGSSAKAEKTFSYIYETD + PDNLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKD + AKWYTSEGEEYAAVKAQD" + misc_feature 18173..18265 + /gene="aliA" + /locus_tag="SPC11C_0020" + /note="Signal peptide predicted for SPC0500 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.629 between residues 31 and 32" + misc_feature 18419..18487 + /gene="aliA" + /locus_tag="SPC11C_0020" + /note="PS01040 Bacterial extracellular solute-binding + proteins, family 5 signature." 
+ORIGIN + 1 cgaccgtcgc ttcctagttg tggctaactt gtccaatgaa gagcaagact tgacagtaga + 61 aggaaaagtc aaatctgtct tgattgaaaa caccctagct caagaagtct ttgaaaaaca + 121 aatcttagtt ccatgggatg ctttctgtgt ggaaatgact gactagaatg agcaaacctc + 181 aagtttttga agcttgaggt tttttactat agtggattga aactagaata gtgcacctct + 241 gcttctaaaa cattgttaga aatcgatttg actgtcccga tcgatttgtc ctattcttat + 301 ttcattttgc tatacttgta gttgaggaga attaagctcc tcactagtaa actcttcata + 361 atccttttta tttttatgaa gatattgttt gaaagatgtg agtttccacg gatgggtttg + 421 tggagggata tacttgcgtc tttctttttt tgttctggtt cttgttcaaa gtttttcgaa + 481 tagagttcat gatttagtag ctcctttgtg tgatagattt tgtcagcgat attgaggtag + 541 atgtctccgt caaatgcttt tataactaat gctttcgtct ttctgatgaa atagacttct + 601 tttccttgct cggtagggat atagcaacga ttttggaatc ggatatggtg tccactatcg + 661 acgactctct ccgacagtct agctagaatg agatttcgtt cagagggctt aggagcctcc + 721 tcaaagacag agagttttgt cttgtttcca aactgttcat taaaggtttg gatataggaa + 781 ggcagaaagg tattggcttc ttccaaggta tgaatattgt ttcgttccag ttcgataggc + 841 aggcgagatt gtaatgtctg attgagtctt tcgactctcc ctttagcttg agggatagag + 901 gttgtctcaa ggagaattcc cagttggtga caggcgtatc caaattgtgt ataggtgtcg + 961 tcctccattt tcttagagtt ggaggcttga taggtaaaaa cagttctctt atctgtttta + 1021 atttgaagag gaatgccgtg gttggctaag atttgttcga ggacatgata gtaagcattc + 1081 aaggtttctt gtttgtcaaa ataagagcct aggatattgc cagaagcatc atcaatggct + 1141 aggtgtaagt tagaggtttc tgctccaaac caggcatgag ggctggcatc catttggatg + 1201 agttctccag caaatttctt tctgggtcta ctaggatgta cctttttagg gtcttccagg + 1261 aacttttcag ccgtcggtaa gattggattg tctaggggtt gcttggggtt cagtttagct + 1321 tgttttctta ctctcttctt tgtctttctg tgagacttag gcgacaggat atttttctta + 1381 tagagtattt ttctaacagt tgtatcagag agctgaattc cttcttcttc agctagcaat + 1441 tcacagaaat gacggacatt tggtttatat gtttcatagg agaggtattt ctttaggata + 1501 cgttctttga tttcatcagg gattgcatgt tttggttttc gatttctgtt tctgtgtctg + 1561 aaggcttctt ttcctttctg ttgataggct agtagcagac gattgatttg tctttcagaa + 1621 agattgagtt cgacacaggc ccgtttcttt 
gttttctttc cttgggctat agcttttatc + 1681 acaagatatt ttttcgtttc attcatattc agttggatcc ttttcatatg actattctac + 1741 caaatgggac atttttacgt tcgatttact aaagacatta tcacattcga attgaaagtt + 1801 ctataatgaa gttagccacc ttaccttagt caagaattag atgtttcact atgtttgagt + 1861 aagttgatga tttcatttga taacaggttt gaaactgtta ggctaggtgg ccaaggctaa + 1921 tcatagcctt ggtttagctg aaaaaacagg ttcaagggtt cctgttgtca aatgaaatgt + 1981 gatttaaggt ataagaaaac acctctgtgc tatacttgtt gttcaccaca aacacaagga + 2041 aaggcacaga gatgcaagaa cattataccc caaaagggaa acatttgaca atagataacc + 2101 gtcgcttgat tgagcggtgg aagaatgaaa ataagtccaa tcgtgaaatt gcaggcttgt + 2161 taggaaaggc gcctcaaacg attcataatg aagtcaaaag aggtacaact ttacaacaag + 2221 tgagaaaagg gctatacaaa aaggtctatt ctgccgatta cgcacaaact gtttaccaat + 2281 tcaatcgaaa acggtcggtg aaaaagttaa ttttaacaaa ggaaatcaga gagaagatct + 2341 tacactatca taagcaaaaa ttttcgcctg aaatgatggt taacaagaag caagtgaaag + 2401 ttggtatttc aaccatctac tactggtttc ataatggtca tttaggattg acgaaggccg + 2461 acatgcttta tcccagaaaa aggaaaggtg tcaagaagca agctagtccg aactttaagc + 2521 cggcaggtaa atctatcgaa gaacgtcctg acgttattaa tcttcgcttg gaaaatggtc + 2581 attatgaaat tgataccgtc ctactgacta agataaaaaa ttattgcctg ttagtcttaa + 2641 ccgaccggcg gagcagacac caaattataa ggttaattcc aaataaaact gctgaatctg + 2701 tcaatcaggc gcttacgtta ctattagggg agcatcgtat tctgtccatt actgcagata + 2761 atggttcgga gttcaaacga ttgtctgagg tatttcctga ggaacatatc tactacgcac + 2821 atgcttactc ttcatgggag agaggttcaa atgaaaatca taatcgatta attcggagat + 2881 ggttacctaa aggaaccaag aaaacgactc cgaaagaagt agcttttatc gaaaattgga + 2941 ttaacaacta ccctaaaaaa tgcttggact acaagtcgcc aagtgaattt cttttgggtg + 3001 gctaacttca acttgaaatt tgggatcaca ttcgaattac acaagatgca gatagtgaga + 3061 aaaaggtgta gacattaccg taaaaaagtg atataattgt aagatgttca atgtataggt + 3121 gttaatcatg agtagacgtt ttaagaaatc aggttcacag aaagtgaagc gaagtgttaa + 3181 tatagttttg ttgactattt atttattgtt agtttgtttt ttattgttct taatctttaa + 3241 gtacaatatc cttgctttta gatatcttaa tctagtggca actgcctttg 
ttctactagt + 3301 tgccttaata gggctactct cgattatcta taaaaaagct gaaaagttta ccattttttt + 3361 gttggtgctc tctattcttg tcagctcagt gtcgctcttt gcagtacagc agtttgtggg + 3421 actgaccaat cgtttaaatg cgacttctaa ttactcagaa tattcgctca gtgtcgctgt + 3481 tttagcagat agtgagattg agaatgttac gcaactgacg agtgtgacag caccgactgg + 3541 gactgataat gaaaacattc aaaaactact agctgatatc aaatcaagtc agaatatcga + 3601 tttgacggtt aatcaaagtt cgtcttactt ggcagcttac aagagtttga ttgcaggaga + 3661 gactaaggcc attgtcttaa atagtgtctt tgaaaatatc attgaatcgg agtatccaga + 3721 tcacgcatcg aagataaaaa agatttatac caagggattc actaaaaaag tagaagctcc + 3781 taagacttct aagaatcagt ctttcaatat ctatgttagt ggaattgata cttatggtcc + 3841 aattagttcg gtgtcgcgtt cagatgtcaa tatcttgatg actgtcaatc gagataccaa + 3901 gaaaatcctc ttgaccacaa cgccacgtga tgcttatgta ccaatcgcag atggtgggaa + 3961 taatcaaaaa gataaattaa cccatgcagg tatttatgga gttgattcgt ccatccacac + 4021 cttagaaaat ctatatggag tggatatcca ttactatgtc cgtttgaact tcacttcttt + 4081 cttgaagttg atcgatttgt tgggtggggt agatgtttat aatgatcagg aattcacagc + 4141 tcttgctaat aaaaaacact attctattgg taatgtccat ttagattcag aagaggcact + 4201 cgcttttgtt cgtgagcgct actctctagc agatggtgat cgtgaccgtg ggcgcaatca + 4261 acaaaaggtg attgtggcta tccttcaaaa attaacttcg accgaagtgc tgaaaaatta + 4321 tagcagaatc attgatagct tgcaaaattc tatccaaaca aacatgcccc ttgagactat + 4381 gataaacttg gtcaatgctc agttagaaag tggtggaacg tacaaagtaa attcgcaaga + 4441 cttgaagggt aggggacgga cggatcttcc ttcctatgcg atgccagata gtaacctcta + 4501 tatgatggaa attaacgaca gtagccttgc atctgtcaaa actgctattc aggatgtgtt + 4561 ggaggggaga tgaaatgatt gatattcatt cgcacattgt ctttgatgta gatgatggtc + 4621 ccaagtcaag agaggaaagt aaggctctct tgacagaagc ctacaggcag ggggtgcgaa + 4681 ccattgtctc tacctctcac cgtcgcaagg gcatgtttga aactccagaa gagaagatag + 4741 cagaaaactt tcttcaggtt cgggaaatag ctaaggaagt cgcgagtgac ttggtcattg + 4801 cttatggggc tgaaatttac tacacaccag atgttttgga taagctggaa aataatcgga + 4861 ttccgaccct caataatagt cgttatgcct tgatagagtt tagtatgaac accccttatc + 4921 gcgatattcg 
tagtgccttg agtaaaatat tgatgttggg aattactcca gtcattgccc + 4981 acatcgagcg ctatgatgct cttgaaaata atgaaaaacg cgttcgagag ctgatcgata + 5041 tgggctgtta cacgcaagta aatagttcac atgtcctcaa atccaaactt tttggagaac + 5101 ctgataaatt catgaaaaaa agagcgcagt atttcttgga gcgtgatttg gttcatgtga + 5161 ttgcaagtga tatgcataat gtggacggca gacctcctta tatggcagaa gcatatgacc + 5221 ttgtttccca aaaatacgga gaagcgaagg ctcaggacct ttttatagac aatcctcaaa + 5281 aaattgtaat ggatcaacta atttaggaga aatgatgaaa gaacaaaaca cgatagaaat + 5341 cgatgtattt caatcactta aaaccttatg gaaacacaag ctaatcattt tattagtggc + 5401 acttgtgaca ggggcggtag cctttgcata tagcactttt attgttaagc cagaatatat + 5461 gagcaccacg cgtatttacg tagtcaaccg taatcaagga gataagccag gactgacgaa + 5521 tcaggacttg caggcaggag cttatctggt aaaagactac cgcgaaatta tcctttcgca + 5581 agatgtattg gaaaaggtag cgacaaactt gaaattggat atgccagcaa aaacgttaac + 5641 tagcaaagtg caagtgactg taccagccga cactcgtatc gtctcaatct ctgtcaagga + 5701 taaacaacca gaggaagcca gtcgcattgc taattctcta cgagaagttg ctgcagaaaa + 5761 gatcatcgct gtaacgcgag tatctgatgt aacgacgctt gaagaagcgc gaccagctac + 5821 gactccctct tctccaaatg ttcgacgcaa caccttagtt ggttttcttg gaggagccgc + 5881 cgtaacagta attactgttc ttttgattga gttgctcgat acccgtgtaa aacgtcctga + 5941 agatgttgaa gatgtactgc aaatgccact tctaggagtc gttccagatt ttgataaaat + 6001 gaaataggag gaagttatgc caacgttaga aatctcacag gcgaaattag aacctgtgaa + 6061 aaaggcagag gaatattata atgctttgtg cacgaaccta cagttaagtg gagatgattt + 6121 gaaagtattt tctatcactt ctgtgaaagc aggagaagga aaaacaacga cttccatcaa + 6181 tatcgcttgg gcttttgcgc gtgcaggtta caaaacgctg ctgattgatg cagacatgcg + 6241 taactccgtg atgtcaggtg tctttaaacc aagggaaagg attactggac taacagaatt + 6301 tctatcaggg acaacagacc tgtcacaggg gctttgcgat accaatattg agaatctctt + 6361 tgtgattcag gctggttctg tgtcaccaaa tccgacagcc cttcttcaaa gtaagaattt + 6421 cagtacaatg cttggaacct tgcgtaaata ttttgactat atcgtcgtag acactgctcc + 6481 tatcggtatc gtgattgatg cggctatcat tatgcagaaa tgtgatgctt ctattttagt + 6541 gacgaaggca ggtgaaacaa aacgacggga 
tcttcaaaaa gcgaaagaac agttggaaca + 6601 aactgggaag tcgtgtttag gagttgtgtt gaataaattt gatacttcag tagagaaata + 6661 cggttcttat gggaattatg ggaattacag gaaacagaaa aaataggttg agggatagag + 6721 atgaatgaaa aattagcaaa gctttcagta gtcatagccc agagttttct tgttattcta + 6781 ttgactgttc tacttagcgc tgtgagagaa acagagattg tttcaacaac agctattgta + 6841 ctttatatcc tccactattt tgtcttttat atcagtgatt atggacggaa tttctttaaa + 6901 aggggatatt tgattgaact tgtccagaca ttgaaatata tcctattctt tgcgctagcg + 6961 attagtattt ctaatttttt ctcagaagat cgatttagta tttccagaag aggcatgatt + 7021 tacttcctct tattatatgt tttcttagtc tatgtgctaa acctatttat caagtggtat + 7081 tggaggcggg cttatcccaa ctttaaagga agtaagaagt ttttcctact tacagcaact + 7141 tctcatatcg aaaaggtact ggatagacta atagaatcag atgatgttgt tgggaagttg + 7201 gtagccgtca gtgttttaga taaaccagat tttcagcacg attatttaaa ggttgtagca + 7261 gagggggaga tcgtaaactt tgcgactcat gaggtggtcg atgaagtctt tatcaatctt + 7321 ccaagtgaaa aatacaatat tggagagctt gtctctcagt ttgaaacgat gggaattgat + 7381 gtaacagtca atctaaatgc tttcgattgt atcttggcac ataacaagca aatttgtgag + 7441 atggcaggac taaatgttgt gactttttct acaacatttt ataagactag ccatgtgatt + 7501 gctaagcggg ttattgatat tatcggttcc ctggtaggtt tgatactatg tagtctagtc + 7561 agtattgtgc tggttccttt gattcgaaag gatgggggct ctgctatttt tgctcagacg + 7621 cgtataggaa aaaatggccg ccatttcact ttttataagt ttcgctccat gtgtgtagat + 7681 gctgaggaga aaaaaagaga actcatggaa caaaatacca tgcagggtgg aatgtttaag + 7741 gtgcacgatg atcctcgtat cacgaaaatt ggtcgtttta tacggaagac gagcttggac + 7801 gagctaccac agttttataa tgttctaaag ggagatatga gtttggttgg cacacggcca + 7861 ccaacagtgg acgagtatga acactatacc ccagaacaaa aacgtcggct aagttttaaa + 7921 cctggtataa caggcttatg gcaggtcagt ggacgaagtg aaatcaaaaa tttcgatgaa + 7981 gttgtcaaat tagatgtggc ctatatagac gattggacaa tctggaaaga tattgagatt + 8041 ttattgaaga cagttaaagt tgtattgatg aaggatggag ctaaatagga aatgaaaata + 8101 tgtttagttg gatctagtgg aggtcatctg actcatttat atctattaaa acctttctgg + 8161 aaagataagg aaagattttg ggttactttt gataaagagg atgcaagaag 
tatcttggga + 8221 aatgaaacat tttatccttg tcattatcct actaatcgta atttgaaaaa tcttattaaa + 8281 aatacgattc ttgctttcaa tattttgaga aaggaacgcc ctgatgttat catctcatca + 8341 ggggctgctg tagcagttcc tttcttttac ctaggaaaac tatttggtgc taagacagtc + 8401 tatattgaag tttttgaccg tattgatacg ccaacattaa cagggaaatt ggtatatcca + 8461 gtgacagata agttcatagt tcagtgggat gaaatgaaaa aagtatatcc gaaagcaatc + 8521 aacctcggag ggattttcta atgatttttg tgacagtagg tactcatgag caacagttta + 8581 atcgacttat taaagaggtt gatagattaa aaggtgaggg acttattcag gatgaagtta + 8641 ttattcagac tggtttttcg gattatgaac cagtgcactg ccaatggaaa gctttgattt + 8701 cttatgatga gatgaatcaa tatatggatg aagcagatat tgtcattaca catggtggcc + 8761 cagcaacatt tatgggagtg atttctaagg ggaagagacc gattgtagta cctagacaag + 8821 aaaaatttgg cgagcatgtg aatgatcacc aaatggaatt ttgcttaaag ttactaggcg + 8881 aaggatacga tctagttgta atcgatgaaa ttgataaact taatgagaat attaaatatt + 8941 caaaagttca gcaagttagt tctcataata gtaagtttac taatgaactg tcagatataa + 9001 ttgaaaatat gtttatataa gatatgtgtg actgccggtt ttttgtgtta ctaataattg + 9061 tcatacagtc agagcttttt aaactatatc gttattaaat agtgagtttt atattttaat + 9121 gattaccatt cgtatttaat aagaaataat ggagaagatg aatgaagatt ttgcatattc + 9181 caacaggtgg cttattttca gatggaatag ggacgtttat ctattcttat ttagaatgca + 9241 tgaatctaga taaatgggaa gtgacagttt tagctactaa tattccactg ttagaagata + 9301 aagcaaaatt tgagaattta ggtatccagg tagtagttct agagcggaaa aaaactgcga + 9361 ttattcacta tatgtgtcaa ttatacaaat taataagagc taataaatat gatataattc + 9421 atgttcatgg tagtagttct ttaatgtcaa tcgagctatc tgttgcaaaa attgcagggg + 9481 ttccagtaag gattgcccat agtcataata ctacttgtga ccatagaaaa ttagataaag + 9541 tattacggcc agtatttcat aaattatata cgcaggcgtg ggcatgtggt gaaggagctg + 9601 ggaaatggct ttttaccaat agagaatata ctattattca taatgcaaga aatataaaac + 9661 gttatcaatt tagtgagtcc aaacgacaac gatttagaaa aaaactatct cttaaagata + 9721 caactcttgc tttaggtcat gttggtcgct ttaatgttca aaaaaatcat gaatttcttg + 9781 tgttattaat ggaaaattta gtaatacaag gactagatgt taaattattt ttagtaggtg + 9841 aagggtcaac 
tttatcaaaa attaagaata tggtttctga aaaatcttta gaagataggg + 9901 tcttcttttt aggtcatctt aatgatatga aatcatttgt gtctgctatg gatataatgc + 9961 ttctcccaag cttgtacgaa ggtctccctc tggtgtcagt agaatggcaa ataaatggaa + 10021 tacaatgtat cttatctgat actataacaa aggagtgtat ctacactaaa caagtgactt + 10081 ctttaccaat taggacccct ctttattggg aaaaagcgat aagagatttc tgtccagaag + 10141 atagattgag acaatcaatt gagaatcaaa gacttgcgag agaagctggt tatgatattg + 10201 aactggaatt agttaaattg gatactttat acaataaatt gataatgact ataaaagata + 10261 ggacaagaaa atgaaaaatg ataggaaagc tcaactaata attacaattt ttaaatatgg + 10321 taaaagacat gtaggacggt caacttttta tcataagtta aattataaaa tgtatcaaat + 10381 tttaaatgct atatttgtaa ttggtatttt caatacagaa ttaccagcat cacaaaatat + 10441 tagtgataat ataatattgt ttcatccata tgggataata gttaatggcg atgtaacttt + 10501 agggaataat gttgtgataa gacagcaggt taccattggt aataaaggga tggaaaggga + 10561 cgtgggaaaa tctcctatta tcgaagcagg tgttgatatt ggagcaggtg ctaaaattat + 10621 aggagggata acgattggtg agggttcaaa agtaggagct aatgctgttg taacaaaaag + 10681 ctttccacct ggttcaattt tagtaggagt tccagcgagg aatatagcat tagagaagta + 10741 atttgggata gaatgcaaat aagtgtgtta atacactaag atattggcat cagcgacaat + 10801 gctgtttgaa tattttagtg aatcaaaaaa gagagaaaaa tgataaaatt taacttagta + 10861 agcattatat catatgttca ataagaactg tcgaattaat ttaataaatt tagtgataaa + 10921 tacgtactag tgagaatttg ttttattgta agagagttcc tataattata gataattact + 10981 aaatagtcag ggaaaggaaa aactaatgat tccaaaaaaa atacattatt gctggtttgg + 11041 tggaggtcca ttacctactg atgttaaaaa atgtattgac agctggagaa aattttgtcc + 11101 gaactatgag attattagat gggatgaaag caatttcatt attagtgatc aaaacaattt + 11161 tgttcagact gcatatgaaa acaaagcttg ggcatttgtt agcgactatg cacggttaag + 11221 aatcatatat gaaaatggtg gcatctattt ggatacagat gttgaattga ttagaaatct + 11281 tgatgaattg cttgagcatg cagctttttt tggtgctcac cagataaatg gattagtagc + 11341 tactggtcta ggttttggtt cgaaaaaggg gacgaagata ttaaaagaat tattaagact + 11401 gtatgataat acagattttg atccgtgtaa aaagaatgag ttggcatgtc ccatacttaa + 11461 ttcgtttgtc 
tttactgatt ttggctatca gccttcttct aacattgttc aaacggagta + 11521 ttttactatc tatcctgctg agtattttga tcctatatat gttggagcca atgctagaaa + 11581 tttattatcg gagaaaacat attcaattca tcattacagt gcctcttgga ctcctgtgag + 11641 agttagaata aaaaataaga tcattagata tattggtagg gataagattc tactattaaa + 11701 gaaaattcta gaaaggaaaa gataatgaaa atatcgcttt ctaaagtatt ttttttacaa + 11761 ttttgtgcac tttatatctt tacaatttta tatcctagag gtattacatt aacttattct + 11821 ccatctgcag atttttttac tctgatttat aaattttgtt tatatttcac catcgcagcc + 11881 agtataatat atatatttat aaaaatatta tatcagagac tacacctagc atcatatact + 11941 ttttttatat tgcagtatta tattgtttct atagttatta cattgctttt aacaggcaca + 12001 atagattcgg gtttacaatc agtcttttat ccgatctgta tatatttatt ttttaatgag + 12061 attcaagata gggtattgat tataaaaatt agtgatatat ttttatactg tttaactctt + 12121 ttattcttta taaatatttt ggatcttatg atgaatttta ccaatattta tcatataacc + 12181 tttttggggc atgtccaagt gatatcacaa tttggaatta tagctttttt catttcttcc + 12241 tattacttaa tgataggaaa tagaaatcgc aagatagcct tcctattaca aattttgact + 12301 gtgctcaatt gtctatatgc tgatgttttt ttatcaaagg ttatagcaat cttcatgatt + 12361 atttacgcat tatcatttaa cataaagaga gtattttgga agagagggat tctaatttct + 12421 ttcttgacat ttattataac tattctgctt cttttcattg atattcaagg ttatttgata + 12481 agatatttac aatattttga ttttactttt aatggccgct atcaaatttg gcgtattgct + 12541 tatcaaaaat ttttagattc aaaaatatat ggctatggag tttttagctt tcatttcaat + 12601 cttccgtggc aagattctgg tgctaagggg atcaactatg ctcataatca gcttatgcaa + 12661 ttagcaatag ataatggagt aattggtatc gtctctttct ttattatgat tttttatatg + 12721 atatttttaa caaggaagat tagaaatttt agagtagctt cattgttttt attttcgtac + 12781 ttttgtttgt ttatagtaat gtttattgaa agtgtaacct attacccgta ttactttatt + 12841 atattgattt ttcaaatatt atatgaaagg ttagagcagg tgggagaatg ctaaatagtt + 12901 taattagaag atttaatcag attttctata gttatcgggt tagaagaaaa gctgcagttg + 12961 ctaaaggaag agtgtacacg ggtggaaaaa catttgttac ttcgaatacc tatctttctg + 13021 agaatgtttc ttttaatggc atgtcaatgt ttggagaagg tagaatttcg ataggaagaa + 13081 atttccattc 
tggtataaat tgccaaatta taacgtcatt tcatgactat gatacaggaa + 13141 ctaagatacc atacgacaat aagtacatac ataaagatgt aattattgat gataatgtgt + 13201 ggattgggaa taatgttatt atcctcggcg gatctcgtat cggagaagga gcagttattc + 13261 aagcagggag tacagttgta ggggaaatac ctccaggagc aatcgcaggt ggtcatccag + 13321 caagagtatt taaatttagg aatatgaagc attatgaaga attaaagaga ctagaacaat + 13381 tttattagga gctatatatg aatattataa gatacttgaa aagaaatgga tttcgatatg + 13441 cattaaatgt cctctatcaa tataaaattc aaaagatttt agattcaatt gttattagat + 13501 ttactaagtt taaaaagtta caaaatatta ttgtcattga atgtcacaca gactttgata + 13561 ataatggagg agctttttat gattatttga taagaaataa ttataataag aaatataaaa + 13621 ttattttatt attaaaaaat cgactagtac gtactcttcc tgaaaatgta gattattttt + 13681 acttgaaaaa acctagtttg aggaagtcat atttgttatc attaagtaaa ttttttcttt + 13741 tcgataatga tatacttcgt aaatatagaa aagatcaaaa acacttctat ttaacacatg + 13801 gatgctttcc tttaaaaaat acaataggta aaataacagt tccgaattat gttgattttg + 13861 ttctatctcc ctcgggcaat gtagataata ttatagttaa gcagtttgga ttaacatcta + 13921 aagagcaatg tcttcacact ggatttccgt gtcatgatat cttttattca aaaccagaac + 13981 ctctagtatt tttatctgat tatgataaaa aaattatctg ggcaccaact tttagaaagg + 14041 gtggtggcta taatagaaat gatagtacag ctagctatcc tttaggtatt ccgttacttg + 14101 aaacactaga tgaacttgca aacctaaata tatatctaag ccaacgggat attgtcctga + 14161 ttgtaaagtt acatccaatg caagatattt cagatttgga gttgaaacaa tttagtcata + 14221 ttaagtttct gacaaatcaa gatttgaatc gtaaaaatac aaatctgtat caattgctga + 14281 tgaattcaga tgctttactc agtgactatt ctgcaatctc gtatgattat ttacaccttg + 14341 ataaaccaat agggtatgtt ttttcggatc taaatgatta taagttgggg ctttcagttg + 14401 ataatgtaga tgattatata gcaggtgata agatactgtc ttttgaaaac ttgctgcact + 14461 ttattgataa catttatcta gaaattgata aaaataaaga aaaacgcaaa gaattattta + 14521 ataaaatatt tgaaaaacag gatggagaat cgtgtgaaag attggcacaa attatggaat + 14581 tataaaagcc gttacgaaga aatgtctgtc gggatgaaag cggcactctg gtatactgtt + 14641 gcaaatttta ttcaaaaggg ttttgtattt ctttcaactc caattttaac cagaatactt + 14701 aatgttaatg 
attacggtac attgatgctt taccaatcat ggtttgtact atttgctatt + 14761 tttgcgacct tgaatctttc tcaagcagct tataataagg gattagtaga atttgagaat + 14821 gataaagata attttacatt ttctttgttg tttttgtcta agattattac tataattgtt + 14881 gcttttttat attttacttt taatatactg gttaaagata gtactggatt aactcccagt + 14941 ttcatgatat ttttattcag tgatatttta tttaatatca gtatagaatt ttatttggca + 15001 cgtcagagat ttgaattcaa atatagaaaa gcaattctaa tttcaacttc ttcaagtttt + 15061 tttattgtag ctattagtac aactatctta ttagcgatta agaatgattt attcattaaa + 15121 attgtattag atgctattat ccgaattatc tttggtttat attgttttta tctcttgttt + 15181 ttttcaggga gaagacaact taagatagaa aaaaaatata ttaaatatgg ttttagttat + 15241 tcattacctt tgatgccgca tttcttatcg cactatattt tgaatcagtc tgaccgtttg + 15301 atgattaaca tgtttgatgg tagggagaaa ttagctatat atagtctagc ttattctgta + 15361 tcaatgatta tgtttttgtt tactagtgca attaatcaat caataatgcc gtatacattt + 15421 caagctttga aaaaaaagga ttattgtggg atacatggga gcaccaaatg gctttttgta + 15481 gtagttgggg ggatcacagc tctctcaatt ctatttgcac cagaactaat tgttatttta + 15541 ggcggcaata aatataagga atcaatttgg ctagtaccac caattgccat ctcggtttat + 15601 ttcctttttg tatattctat gtttagtaat atcagctttt attataagat gaataagttg + 15661 atttcgttag tttccatagg tgtggctctt tcaaatatta ttttaaatta tatttttatt + 15721 aatatatttg ggtatcaagc tgcagcttac actacattat tatgctatat attgttagcg + 15781 ttttctcatt ttttcttata tagattttta ttaaaaaaag aggaaattca tgaggaactt + 15841 tataatatga agatgatttt aataatatct ttaatattat taataatact atttttgata + 15901 cttgttattt ataacttagc cattataaga tatgcaatta ttgcaattgt tttatttctt + 15961 ttgtttacaa agagaaataa aataattaca tcgctaaaaa gttgatattg aaaatttaga + 16021 atcaaattaa gaatatagtg aatatcaaac tagtattaat aatgaataat tgtttttatg + 16081 taatttagga ttaataaaaa aattgaaagg aaatatcaat gaaaagagta attacttatg + 16141 gaacctttga tttgcttcat tatggacata tcaatttgct aaagagagca aagcaattag + 16201 gagattatct cattgttgta gtttcaagtg atgagttcaa tttgaaagaa aaaaataaag + 16261 tttgttactt taattttgaa catagaaaga atttggttga agcaataaga tatgttgatc + 16321 tggtaattcc 
tgaaacaagc tgggaacaga aaaaaacaga tattaaagaa tatcgcattg + 16381 atacatttgt tatgggggat gattggaaag gaaaatttga ttatttaaaa gaagaaggag + 16441 tggaagtagt ttatttacca agaactaaag aaatatctac aactaaaatt aaagaagatt + 16501 tagcagatta gattttttac aaaaatattt tgagatcaga taataaattt gttttcataa + 16561 ttattaatgt ctattgtttt attaccacag aagtatatta aattaaaata aattatttta + 16621 gatttataat gtggctcctt gtcaacgaac atctggagag gacaatcact gtcttctcct + 16681 ttttattttt ttggctcttt gtcaactgta gtgggttgaa aaaaagctaa gctcgagaaa + 16741 ggacaaattt tgtcctttct tttttgatat tcagagcaat aaaaatccgt tttttgaagt + 16801 tttcaaagtt tcgaaaacca aaggcattgc gcttgataag tttgatgaga ttattggtcg + 16861 cttccagttt ggcgttggaa taaggtaatt gaagggcgtt gataatcttt tctttatctt + 16921 tgaggaaggt tttaaagaca gtctgaaaaa taggatgaac ctgcttaaga ttgtcctcaa + 16981 taagtccgaa aaatttctct ggttccttat tctggaagtg aaaaagcaag agctgataga + 17041 gctgatagtg gtgtttcaag tcttccgaat agctcaaaag cttgtttaaa atctctttat + 17101 tggttaagtg catacgaaaa gtaggacgat aaaaacgttt atcactcagt ttacggctat + 17161 cctgttgaat gagtttccag tagcgcttga tagccttgta ttcatgggat tttcgatgaa + 17221 actgattcat gatttgaaca cgcacacgac tcatagcacg gctaagatgt tgcacaatgt + 17281 gaaagcgatc aagaacgatt ttagcattcg ggagtgaaac agtctgggag actgtttcag + 17341 cctgagccta gaaatttgaa agcgaagctg tttagctaag tcatagtaag ggctaaacat + 17401 atccatagta ataattttga cgcgacatag gacaactcta tcgtagcgaa gaaagtgatt + 17461 tcgaatgata gcttgtgttc ttccctcaag aacagtgatg atattgagat tgttaaaatc + 17521 ttgcgcaatg aagctcatct ttccctttgt aaaagcatac tcatcccaag acataatctc + 17581 aggaagacaa gaaaaatcat gtttaaagtg aaaatcattg agcttacgaa tagcagttga + 17641 agttgagatg gaaagctgat gggcaatatc agtcatagaa atcttttcaa ttaacttttg + 17701 agcaatcttt tggttgatga tacgagggat ttggtgattc ttcttgacga tagaagtttc + 17761 agcgaccatc atttttgaac agtgatagca cttgaaacga cactttctaa ggagaattct + 17821 agtaggcata ccagtcgttt caagataagg aattttagaa ggtttttgaa agtcatattt + 17881 cttcaattgg tttccgcact cagggcaaga tggggcgtcg tagtccagtt tggcgatgat + 17941 ttccttgtgt 
gtatccttct aatgagttgt tttgtcgctt ttcattatag gtcatatggg + 18001 actttttttc tacacaaaaa taggctccat aatatctata gtggatttac ccactacaaa + 18061 tattatagag tctttttttc agaatttacc aaattaatta aaaaattcag aaaattctat + 18121 tgacatctct ctgaaaagag tctataatag agagaaagtt ttaaaggaga agatgatgaa + 18181 aagttcaaaa ctatttgccc ttgcgggtgt aaccttattg gcggcgacta ctttagctgc + 18241 atgttctaaa tcaggttcga gcgctaaagc tgagaagaca ttctcataca tttatgaaac + 18301 ggatcctgac aacctaaact acttgacaac tgctaaggct gcgacagcaa atattaccag + 18361 taacgtggtt gatggtttgc tagaaaatga tcgctacggg aactttgtgc cgtctatggc + 18421 tgaggattgg tctgtatcca aggatggatt gacttacact tatactatcc gtaaggatgc + 18481 aaaatggtat acttctgaag gtgaagaata cgcggcagtc aaagctcaag ac +// + diff --git a/public/res/serotype_genbank/serotype_11D.gb b/public/res/serotype_genbank/serotype_11D.gb new file mode 100644 index 0000000..5083995 --- /dev/null +++ b/public/res/serotype_genbank/serotype_11D.gb @@ -0,0 +1,797 @@ +LOCUS CR931656 17213 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 70/86 (serotype 11d). +ACCESSION CR931656 +VERSION CR931656.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 17213) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 17213) + AUTHORS Bentley,S.D. 
+ TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..17213 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="70/86" + /db_xref="taxon:1313" + gene <1..166 + /gene="dexB" + /locus_tag="SPC11D_0001" + CDS <1..166 + /gene="dexB" + /locus_tag="SPC11D_0001" + /codon_start=2 + /transl_table=11 + /protein_id="CAI33176.1" + /db_xref="GOA:Q4K241" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K241" + /translation="DRRFLVVANLSNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVP + WDAFCVEMTD" + gene complement(313..1706) + /gene="tnp" + /locus_tag="SPC11D_0002" + /pseudo + CDS complement(join(313..447,447..1706)) + /gene="tnp" + /locus_tag="SPC11D_0002" + /note="member of homology group 17" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1202 transposase" + misc_feature complement(720..1223) + /gene="tnp" + /locus_tag="SPC11D_0002" + /note="HMMPfam hit to PF00665, Integrase core domain, + score 3.8e-23" + /pseudo + gene 1882..3327 + /gene="wzg" + /locus_tag="SPC11D_0003" + CDS 1882..3327 + /gene="wzg" + /locus_tag="SPC11D_0003" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33178.1" + /db_xref="GOA:Q4K240" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K240" + /translation="MSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + 
LNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGIDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIIDSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDLPSY + AMPDSNLYVMEINDSSLASVKTAIQDVLEGR" + misc_feature 1882..1998 + /gene="wzg" + /locus_tag="SPC11D_0003" + /note="Signal peptide predicted for SPC0503 by SignalP 2.0 + HMM (Signal peptide probability 0.993) with cleavage site + probability 0.538 between residues 39 and 40" + misc_feature 2086..2433 + /gene="wzg" + /locus_tag="SPC11D_0003" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 2.3e-64" + misc_feature 2611..3054 + /gene="wzg" + /locus_tag="SPC11D_0003" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 1.1e-69" + gene 3329..4060 + /gene="wzh" + /locus_tag="SPC11D_0004" + CDS 3329..4060 + /gene="wzh" + /locus_tag="SPC11D_0004" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33179.1" + /db_xref="GOA:Q4K239" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K239" + /translation="MIDIHSHIVFDVDDGPKSREESKALLTEAYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKNRIPTLNNS + RYALIEFSMNTPYRDIHSALIKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKSKLFGERYKFMKKRAQYFLERDLVHVIASDMHNVDSRPPHMAEAYDLVS + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 3332..3940 + /gene="wzh" + /locus_tag="SPC11D_0004" + /note="HMMPfam hit to PF02811, PHP domain, score 6.8e-38" + gene 4069..4761 + /gene="wzd" + /locus_tag="SPC11D_0005" + CDS 4069..4761 + /gene="wzd" + /locus_tag="SPC11D_0005" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis 
protein + Wzd" + /protein_id="CAI33180.1" + /db_xref="GOA:Q4K238" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K238" + /translation="MKEQNTIEIDVFQSLKTLWKYKLIILLVALVTGAGAFAYSTFIV + KPEYTSTTRIYVVNRNQGDKPGLTNQDLQAGTYLVKDYREIILSQDVLEKVATNLKLD + IPAKTLTSKVQVTVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIIAVTRVSDVT + TLEEARPATTPSSPNVRRNTLVGFLGGAAVTVITVLLIELLDTRVKRPEDVEDVLQMP + LLGVVPDFDKMK" + misc_feature 4087..4503 + /gene="wzd" + /locus_tag="SPC11D_0005" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 4.7e-51" + misc_feature 4609..4686 + /gene="wzd" + /locus_tag="SPC11D_0005" + /note="PS00217 Sugar transport proteins signature 2." + gene 4771..5460 + /gene="wze" + /locus_tag="SPC11D_0006" + CDS 4771..5460 + /gene="wze" + /locus_tag="SPC11D_0006" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33181.1" + /db_xref="GOA:Q4K237" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K237" + /translation="MPTLEISQVKLELAKKAEEYYNALCTNLQLSGDDLKVFSITSVK + AGEGKTTTSTNIAWAFARAGYKTLLIDADMRNSVMSGVFKSRERITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLGTLRKYFDYIVVDTAPIGIVI + DAAIIMQKCDASILVTKAGETKRRDLQKAKEQLEQTGKSCLGVVLNKFDTSVEKYGSY + GSYGNYRKQKK" + gene 5475..6836 + /gene="wchA" + /locus_tag="SPC11D_0007" + CDS 5475..6836 + /gene="wchA" + /locus_tag="SPC11D_0007" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI33182.1" + /db_xref="GOA:Q4K236" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K236" + /translation="MSEKLAKPSVAIVQSFLVILLTYLLSAVRETEIVSTTAIVLYIL + HYFVFYISDYGRNFFKRGYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYF + LLLHVFLVYVLNLFIKWYWKRAYPNFKGSKKVFLLTATSHVEKVLDRLIESNEVVGEL + 
VAVSVLDKPDFQHDYLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + IDVTVNLNAFDWARNKQIREMAGLNVVTFSTTFYKTSHVIAKWIIDIVGSLVGLILCG + LVSIVLVPLIRKDGGSAFFAQTRIGKNGRHFTFYKFRSMCVDAEDKKRELMEQNTMQG + GMFKVDDDPRITKIGHFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPEQK + RRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVLMKD + GAK" + misc_feature 6252..6833 + /gene="wchA" + /locus_tag="SPC11D_0007" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 2.6e-155" + gene 6840..7289 + /gene="wchJ" + /locus_tag="SPC11D_0008" + CDS 6840..7289 + /gene="wchJ" + /locus_tag="SPC11D_0008" + /note="member of homology group 26" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase enhancer" + /protein_id="CAI33183.1" + /db_xref="GOA:Q4K235" + /db_xref="InterPro:IPR013969" + /db_xref="UniProtKB/TrEMBL:Q4K235" + /translation="MKICLVGSSGGHLTHLYLLKPFWKDKERFWVTFDKEDTRSILGN + ETFYPCHYPTNRNLKNLIKNTVLAFNILRKERPDVIISSGAAVAVPFFYLGKLFGAKT + VYIEVFDRIDAPTLTGKIVYPVTDKFIVQWEEMKKVYPKAINLGGIF" + gene 7289..7768 + /gene="wchK" + /locus_tag="SPC11D_0009" + CDS 7289..7768 + /gene="wchK" + /locus_tag="SPC11D_0009" + /note="member of homology group 27" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33184.1" + /db_xref="GOA:Q4K234" + /db_xref="InterPro:IPR007235" + /db_xref="UniProtKB/TrEMBL:Q4K234" + /translation="MIFVTIGTHEQQFNRLIKEVDRLKGEGFIQDDVFIQTGFSDYEP + VYCQWKNLISYDEMNRYIDEANIIITHGGPATFMAVIAKGKIPIVVPRLKKFGEHVND + HQMEFCSKILSEGYELSLINDISELQYSLKQEKKTKFYSNNTCFLKKLSKTIEDLIV" + misc_feature 7289..7759 + /gene="wchK" + /locus_tag="SPC11D_0009" + /note="HMMPfam hit to PF04101, Glycosyltransferase family, + score 8.7e-47" + gene 8010..9107 + /gene="wcyK" + /locus_tag="SPC11D_0010" + CDS 8010..9107 + /gene="wcyK" + /locus_tag="SPC11D_0010" + /note="member of homology group 116" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33185.1" + /db_xref="GOA:Q4K233" + 
/db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K233" + /translation="MKILHIPTGGLFSDGIGTFIYSYLEYMDLNKYDVTILATNSPLK + SDKEKFECLGVKVIEIERKKSNLSKYVYKLKKIIKKEKFDIIHVHGSSALMSIELLTA + KVAGIPVRIAHSHNTTCEHHKLDKLLRPIFYRVYTQACACSVSAGQWLFEEKNYKIIH + NARDVNRYQYDAIKRKKLREELLLSDETIALGHVGRFNTQKNQCFLVSLMEKLVIKNI + DIKLFLVGTGDTLEEIKKLVIQKKLEDNIVFLGQFDDMKSFVSSMDIMLLPSLYEGLP + LVSVEWQINGVESILSDRVTQECIYTGTVQQLSIDSMELWEKEILNLSTSDRERVSLQ + NIQLIKNAGYDISLEVKEIEELYNSLYDIAN" + misc_feature 8532..9023 + /gene="wcyK" + /locus_tag="SPC11D_0010" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 1.1e-18" + gene 9108..9788 + /gene="wcwC" + /locus_tag="SPC11D_0011" + CDS 9108..9788 + /gene="wcwC" + /locus_tag="SPC11D_0011" + /note="member of homology group 48" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI33186.1" + /db_xref="GOA:Q4K232" + /db_xref="InterPro:IPR015037" + /db_xref="UniProtKB/TrEMBL:Q4K232" + /translation="MKGKSFLLKMLQNLKPIKRKLKPIKRTYKRIVYSITKSNMRKRL + KNTDFSIISDNCWGGRVYEELGLPYRTPFIGLYIFSEDYVKLLKNFRKYMEYELTFTN + NSKWNTEYDGEYPIGILKDIELHFLHYANQEEAYEKWNKRKNRINYENIFFKMNDDNK + CSLKLLKEFDTLDLKNKIIFAAFNYKELDNLIHFTDPRGNGNVGTDLFYYDQYFDVVN + WLNGETQT" + gene 9785..10507 + /gene="wcrL" + /locus_tag="SPC11D_0012" + CDS 9785..10507 + /gene="wcrL" + /locus_tag="SPC11D_0012" + /note="member of homology group 54" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33187.1" + /db_xref="GOA:Q4K231" + /db_xref="InterPro:IPR007577" + /db_xref="UniProtKB/TrEMBL:Q4K231" + /translation="MIPKKIHYCWFGGKPLSNDVKRCIASWKKFCPDYEIIEWTEKNF + CIENQNQFVQDAYRDKAWAFVSDYARLKIIYENGGIYLDTDVEVIKNLDKLLENKAFF + GVHQVNHLVSTGLGFGSEKGTSILKELLNLYDEIEFDLSKKDELLCPELNTPVFKRLG + YTYSDCVVKNEYFTIYPEEYFDPISLGDGVENILSDKTFSIHHYSASWTSLRNQMKSK + IIRKLGRSNILELKRILKGKTR" + gene 10504..11676 + /gene="wzy" + /locus_tag="SPC11D_0013" + CDS 10504..11676 + /gene="wzy" + /locus_tag="SPC11D_0013" + /note="member of 
homology group 68" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33188.1" + /db_xref="InterPro:IPR007016" + /db_xref="UniProtKB/TrEMBL:Q4K230" + /translation="MRISPSKLIFAFFSSFYILVILFPRGIFLGHSTLASRLWIIYNG + SLYLSILLGLIYVILKILSRNIAIHQHAFFILQYYFIVIILTFMVSGSIGVGLQSIFY + PIFIYLFFNEVRDKKSIVLIFDIFLYILTPLFVINTIDVFLNFTNIFHITFLGHVQVI + SQYSVIGFLVSAYYLLEEKRNILVAQLLLILTIINCFFSDVSLSKVIALFMIVYIISY + KLRKLFWKRGRKISVVTFIASVVMLALVIFGYFLPYLRYFDFTFNGRYQIWRIVYATI + LQVKWFGYGLFGFQFKLPWQKLGEVGINYTHNQVLQLALDSGIVGIISFFTMIFYMIF + STKNIQNSTISSLFIFAYFCLFIIMFIESVTYYPYYFIIIVLQTLYLKLERERNVK" + misc_feature 10504..10590 + /gene="wzy" + /locus_tag="SPC11D_0013" + /note="Signal peptide predicted for SPC0513 by SignalP 2.0 + HMM (Signal peptide probability 0.862) with cleavage site + probability 0.448 between residues 29 and 30" + misc_feature 11278..11472 + /gene="wzy" + /locus_tag="SPC11D_0013" + /note="HMMPfam hit to PF04932, O-Antigen Polymerase, score + 8e-10" + gene 11666..12166 + /gene="wcwT" + /locus_tag="SPC11D_0014" + CDS 11666..12166 + /gene="wcwT" + /locus_tag="SPC11D_0014" + /note="member of homology group 69" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI33189.1" + /db_xref="GOA:Q4K229" + /db_xref="InterPro:IPR011004" + /db_xref="UniProtKB/TrEMBL:Q4K229" + /translation="MLNRLIRNFNKVYYSYRIKRKAAQCGGRVYTGGKTFVTANTYLD + ENVSFNGMSMYGEGKISIGKNFHSGLNCQIITSFHNYDLGDKIPYDESYIHKDVLIED + NVWVGNNVIILGGAIIEEGAIIQAGSTVIGRIPAGAIAGGHPAKPFRFRNMEHYNQLK + RQKKFH" + misc_feature 11954..12007 + /gene="wcwT" + /locus_tag="SPC11D_0014" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 0.9" + misc_feature 12008..12061 + /gene="wcwT" + /locus_tag="SPC11D_0014" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 2.7" + gene 12176..13363 + /gene="wcwU" + /locus_tag="SPC11D_0015" + CDS 12176..13363 + /gene="wcwU" + 
/locus_tag="SPC11D_0015" + /note="member of homology group 70" + /codon_start=1 + /transl_table=11 + /product="putative glycerol phosphotransferase" + /protein_id="CAI33190.1" + /db_xref="GOA:Q4K228" + /db_xref="InterPro:IPR007554" + /db_xref="UniProtKB/TrEMBL:Q4K228" + /translation="MNIVSYLKKNGITHTLKIINEYKMQELFDSLVSIFTKQKELRNS + IVIECHTDFENNGGAFYDYLINNEYNKKYKIVLLLKDKLVKELPENVDYFYLRKPSLR + KSYVMSLSKFFTFDNDMLRKYRKDQKHFYLTHGCFPLKSTIGKITVPNYVDFVLSPSG + NVDNIIVKQFGLTSKEQCLHTGFPCHDIFYSKPEPLVFLSNYDKKIIWAPTFRKGGGY + NRNDSTASYPLGIPLLETLDELANLNTYLSQRDIALIVKLHPMQDISDLELKQFSHIK + FLTNQDLNRKNTNLYQLLMNSDALLSDYSAISYDYLHLDKPIGYVFSDLNDYKLGLSV + DNVDDYIAGDKILSFNNLLHFIDNIYLEIDKNKEKRKELFNKIFEKQDGESCERLAQI + MEL" + misc_feature 12749..13360 + /gene="wcwU" + /locus_tag="SPC11D_0015" + /note="HMMPfam hit to PF04464, + CDP-Glycerol:Poly(glycerophosphate) gl, score 9.5e-11" + gene 13380..14783 + /gene="wzx" + /locus_tag="SPC11D_0016" + CDS 13380..14783 + /gene="wzx" + /locus_tag="SPC11D_0016" + /note="member of homology group 52" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33191.1" + /db_xref="GOA:Q4K227" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K227" + /translation="MSVGMKAALWYTVANFIQKGFVFLSTPILTRILNVNDYGTLILY + QSWFVLFAIFATLNLSQTAYNKGLVEFENDKDNFTFSLLFLSKTITIIVAFLYFTFNI + LVKDSTGLTPSFMIFLFSDILFNISIEFYLARQRFEFKYRKAVLISTFSSFFIVAIST + TILLAIKNDLFIKIVLDAIIRIIFGLYCFYLLFFSGRRQLKIEKKYIKYGLSYSLPLI + PHFLSHYILNQSDRLMINMFDGKEKLAIYSLAYSVSMIMFLFTNAINQSIMPHTFQAL + KKKDYCGIHGSTKWLFVVVGGITALSILFAPELIVILGGNKYKESIWLVPPIAISVYF + LFVYSMFSNISFYYKMNKLISLVSTGAALSNIILNYIFINIFGYQAAAYTTLLCYILL + AFSHFFLYRFLLKKEEIHEELYNMKMILIISLILLIILFLILVIYNLAIIRYAIIAII + LFLLFTKRNKIITSLKS" + misc_feature 13389..14207 + /gene="wzx" + /locus_tag="SPC11D_0016" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 1.4e-16" + gene 14897..15289 + /gene="gct" + /locus_tag="SPC11D_0017" + CDS 14897..15289 + /gene="gct" + /locus_tag="SPC11D_0017" + 
/note="member of homology group 28" + /codon_start=1 + /transl_table=11 + /product="CDP-glycerol-1-phosphate biosynthetic protein + Gct" + /protein_id="CAI33192.1" + /db_xref="GOA:Q4K226" + /db_xref="InterPro:IPR004820" + /db_xref="InterPro:IPR004821" + /db_xref="InterPro:IPR006409" + /db_xref="InterPro:IPR014729" + /db_xref="UniProtKB/TrEMBL:Q4K226" + /translation="MKRVITYGTFDLLHYGHINLLKRAKQLGDYLIVVVSSDEFNLKE + KNKVCYFNFEHRKNLVEAIRYVDLVISETSWEQKKTDIKEYHIDTFVMGDDWKGKFDY + LKEEGVEVIYLPRTKEISTTKIKEDLAD" + misc_feature 14909..15277 + /gene="gct" + /locus_tag="SPC11D_0017" + /note="HMMPfam hit to PF01467, Cytidylyltransferase, score + 9.7e-29" + gene 15651..16679 + /gene="wcjE" + /locus_tag="SPC11D_0018" + CDS 15651..16679 + /gene="wcjE" + /locus_tag="SPC11D_0018" + /note="member of homology group 18" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI33193.1" + /db_xref="GOA:Q4K225" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q4K225" + /translation="MTKVRINWVDFGKGFAIFLVLVGHVFIGLSESNKFSIANDVLLF + LIAQIYIFHIPVFFALSGYFFRPVSDLKEFWYYAKKKTIILGIPYIFYSIIHFCLQKL + AGASVRVPTTIHNLLNIYRYPLGVSWYLYTLWSILIVYGLLSIVFKNRKSLFLVSVFA + YIFTLFIQIDIFIVQRTLVWGICFFLGSVLSEIHFDKINLKKFLFFFVLFDFIYMFAW + FLFYEVGSKKDYVSYINPGLWGIAFIVCVLVAFAIFPKMEKNFPKTFLYFTKYGKDSL + GIYILHAPICSMIRILMLKVGINSVFLHVVVGIVLGWYLSILATYILKKIPFLNIVLL + PQKYIKLK" + misc_feature 15666..16640 + /gene="wcjE" + /locus_tag="SPC11D_0018" + /note="HMMPfam hit to PF01757, Acyltransferase family, + score 0.00014" + gene 16854..>17213 + /gene="aliA" + /locus_tag="SPC11D_0019" + CDS 16854..>17213 + /gene="aliA" + /locus_tag="SPC11D_0019" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33194.1" + /db_xref="GOA:Q4K2T2" + /db_xref="InterPro:IPR000914" + /db_xref="UniProtKB/TrEMBL:Q4K2T2" + /translation="MMKSSKLFALAGVTLLAATTLAACSGSGSSTKGEKTFSYIYETD + PDNLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKD + AKWYTSEGEEYAAVKAQD" + misc_feature 16854..16940 + /gene="aliA" + 
/locus_tag="SPC11D_0019" + /note="Signal peptide predicted for SPC0519 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.277 between residues 29 and 30" + misc_feature 17100..17168 + /gene="aliA" + /locus_tag="SPC11D_0019" + /note="PS01040 Bacterial extracellular solute-binding + proteins, family 5 signature." +ORIGIN + 1 cgaccgtcgc ttcctagttg tggctaactt gtccaatgaa gagcaagact tgacagtaga + 61 aggaaaagtc aaatctgtct tgattgaaaa caccctagct caagaagtct ttgaaaaaca + 121 aatcttagtt ccatgggatg ctttctgtgt ggaaatgact gactagaatg agcaaacctc + 181 aagtttttga agcttgaggt tttttactat agtggattga aactagaata gtgcacctct + 241 gcttctaaaa cattgttaga aatcgatttg actgtcccga tcgatttgtc ctattcttat + 301 ttcattttgc tatacttgta gttgaggaga attaagctcc tcactagtaa actcttcata + 361 atccttttta tttttatgaa gatattgttt gaaagatgtg agtttccacg gatgggtttg + 421 tggagggata tacttgcgtc tttctttttt tgttctggtt cttgttcaaa gtttttcgaa + 481 tagagttcat gatttagtag ctcctttgtg tgatagattt tgtcagcgat attgaggtag + 541 atgtctccgt caaatgcttt tataactaat gctttcgtct ttctgatgaa atagacttct + 601 tttccttgtt cggtagggat atagtaacga ttttggaatc ggatatggtg tccactatcg + 661 acgactctct ccgccagtct agccagaatg agattccttt cagaggggtt aggaacctcc + 721 tcgaagacag agagttttgt cttgtttcca aactgttcat taaaggtttg aatgtaggaa + 781 agcaggaagg tattggcttc ttccaaggta tgaatattgt tttgttccag ttcgataggc + 841 aggcgagatt gtagtgtctg attgagtctt tcgactctcc ctttagcttg agggatagag + 901 gttgtctcaa ggagaatccc tagttggtga caggcgtatc caaactgtgt atgggtatcg + 961 tcctccattt tcttagagtt ggaggcttga taggtaaaga ccgttctctt atctgtttta + 1021 atttgaaggg gaatgccgtg attggctaag atttgttcga ggacatgata gtaagcattc + 1081 aaggtctctt gtttatcaaa ataagcgcct aggatattgc cagaagcatc atcaatggct + 1141 aggtgtaagt tagaggtttc tgctccaaac caggcatgag ggctggtatc catttgaatg + 1201 agttcaccag caaatttctt tctgggtcta ctaggatgta cttttttagg gttttccagg + 1261 aagtcttcag ccgtcggtaa gattagattg tctaggggtt gcttggggtt cagtttagct + 1321 tgttttctta ctctcttctt tgtctttcta tgggacttag 
gcgacaggat atttttctta + 1381 tagagtattt ttctaacagt tgtatcagag agctgaattc cttcttcttc agctagcaat + 1441 tcacagaaat gacggacatt tggtttatat gtttcatagg agaggtattt ctttaggata + 1501 cgttctttga tttcatcagg gattgcatgt tttggttttc gatttctgtt tccgtgtctg + 1561 aaggcttctt ttcctttctg ttgataggct agtagcagac gattgatttg cctttcagaa + 1621 agattgagca cgacacaggc tcgtttcttt gttttctttc cttgggctat agcttttatc + 1681 acaagatatt ttttcgtttc attcatattc agttggatcc tttacatatg actattctac + 1741 caaatgggac atttttacgt tcgatttact aaagacatta tcacattcga attacacaag + 1801 atgcagatag tgaaaaaagg tgtagacatt accgtaaaaa agtgatataa tcgtatgatg + 1861 ttcaatgtat aggtgttaat catgagtaga cgttttaaaa aatcaggttc acagaaagtg + 1921 aagcgaagtg ttaatatagt tttgttgact atttatttat tgttagtttg ttttttattg + 1981 ttcttaatct ttaagtacaa tatccttgct tttagatatc ttaatctagt ggtaactgcg + 2041 ttagtcctac tagttgcctt ggtagggcta ctcttgatta tctataaaaa agctgaaaaa + 2101 tttactattt ttctgttggt gttctctatc cttgtcagct ctgtgtcgct ctttgcagta + 2161 cagcagtttg ttggactgac caatcgttta aatgcgactt ctaattactc agaatattca + 2221 atcagtgtcg ctgttttagc agatagtgag atcgaaaatg ttacgcaact gacgagtgtg + 2281 acagcaccga ctgggactga taatgaaaat attcaaaaac tactagctga tatcaagtca + 2341 agtcagaata ccgatttgac ggtcaaccag agttcgtctt acttggcagc ttacaagagt + 2401 ttgattgcag gggagactaa ggccattgtc ctaaatagtg tctttgaaaa catcatcgag + 2461 tcagagtatc cagactacgc atcgaagata aagaagattt ataccaaggg attcactaaa + 2521 aaagtagaag ctcctaagac gtctaagaat cagtctttca atatctatgt tagtggaatt + 2581 gacacctatg gtcctattag ttcggtgtcg cgatcagatg tcaatatcct gatgactgtc + 2641 aatcgagata ccaagaaaat cctcttgacc acaacaccac gtgatgccta tgtaccaatc + 2701 gcagatggtg gaaataatca aaaagataaa ttaacccatg cgggcattta tggagttgat + 2761 tcgtccattc acaccttaga aaatctctat ggagtggata tcaattacta tgtgcgattg + 2821 aacttcactt ctttcttgaa aatgattgac ttattgggag ggatagatgt tcataatgat + 2881 caagagtttt cagctctaca tgggaagttc catttcccag tagggaatgt ccatctagac + 2941 tctgagcaag ctttaggttt tgttcgtgag cgctactccc tagcagatgg cgatcgtgac + 3001 
cgtggtcgca accaacaaaa ggtgattgtg gctatccttc aaaaattaac gtcaaccgaa + 3061 gcgctgaaaa attatagtac gatcattgat agcttgcaag attctatcca aacaaatatg + 3121 ccacttgaga ccatgataaa tttggtcaat gctcagttag aaagtggagg gaattataaa + 3181 gtaaattctc aagatttaaa agggacaggt cggacggatc ttccttccta tgcgatgcca + 3241 gatagtaacc tctatgtgat ggaaattaac gacagtagcc ttgcatctgt caaaactgct + 3301 attcaggacg tgttggaggg cagatgaaat gattgatatt cattcgcaca ttgtctttga + 3361 tgtagatgat ggtcccaagt caagagagga aagcaaggct ctcttgacag aagcctacag + 3421 gcagggggtg cgaaccattg tctctacctc tcaccgtcgc aagggcatgt ttgaaactcc + 3481 agaagagaag atagcagaaa actttcttca ggttcgggaa atagctaagg aagtcgcgag + 3541 tgacttagtc attgcttatg gggctgaaat ttactacaca ccagatgttt tggataagct + 3601 ggaaaaaaat cggattccga ccctcaataa tagtcgttat gccttgatag agtttagtat + 3661 gaacacccct tatcgcgata ttcatagtgc cttgattaaa atattgatgt tgggaattac + 3721 tccagtcatt gcccacatcg agcgctatga tgcacttgaa aacaatgaaa aacgcgttcg + 3781 agagctgatc gatatgggct gttacacgca agtaaatagt tcacatgtcc tcaaatccaa + 3841 actttttgga gaacggtata aattcatgaa aaaaagagcg cagtatttct tggagcgtga + 3901 tttggttcat gtgattgcaa gtgatatgca taatgtggac agcagacctc cccatatggc + 3961 agaagcatat gaccttgttt ctcaaaaata cggagaagcg aaggctcagg aactttttat + 4021 agataatcct cgaaaaattg taatggatca actaatttag gagaaataat gaaagaacaa + 4081 aatacgatag aaatcgatgt atttcaatca cttaaaacct tatggaaata caagctaatc + 4141 attttattag tggcacttgt gacaggggcg ggagcttttg catatagcac ttttattgtt + 4201 aagccagaat atacaagtac cacgcgtatt tacgtagtca accgtaatca aggagataag + 4261 ccgggactga cgaatcagga cttgcaggca ggaacttatc tggtaaaaga ctaccgcgaa + 4321 attatccttt cgcaagatgt attggaaaag gtagcgacaa atttgaaatt ggatattcca + 4381 gcaaaaacgt taactagcaa agtgcaagtg actgtaccag ccgacactcg tatcgtctca + 4441 atctctgtca aggataaaca accagaggaa gccagtcgca ttgctaattc tctacgagaa + 4501 gttgctgcag aaaagatcat cgctgtaacg cgagtatctg atgtaacgac gcttgaagaa + 4561 gcgcgaccag ctacgactcc ctcttctcca aatgttcgac gcaacacctt agttggtttt + 4621 cttggaggag ccgccgtaac 
agtaattact gttcttttga ttgagttgct cgatacccgt + 4681 gtaaaacgtc ctgaagatgt tgaagatgta ctgcaaatgc cacttctagg agtcgttcca + 4741 gattttgata aaatgaaata ggaggaagtt atgccaacgt tagaaatctc acaggtgaaa + 4801 ttagaacttg cgaaaaaggc agaggaatat tataatgctt tgtgcacgaa cctacagtta + 4861 agtggagatg atttgaaagt attttctatc acttctgtga aagcaggaga aggaaaaaca + 4921 acgacttcca ccaatatcgc ttgggctttt gcgcgtgcag gttacaaaac gctgctgatt + 4981 gatgcagaca tgcgtaactc cgttatgtca ggtgtcttta aatcaaggga aaggattact + 5041 ggactaacag aatttctatc agggacaaca gacctgtcac aggggctttg cgataccaat + 5101 attgagaatc tctttgtgat tcaggctggc tctgtgtcac caaatccgac agcccttctt + 5161 caaagtaaga atttcagcac aatgcttgga accttgcgta aatattttga ctatatcgtc + 5221 gtagacactg ctcctatcgg tattgtgatt gatgcggcta tcattatgca gaaatgtgat + 5281 gcttctattt tagtgacgaa ggcaggtgaa acaaaacgac gggatcttca aaaagcgaaa + 5341 gaacagttgg aacaaactgg gaagtcgtgt ttaggagttg tgttgaataa attcgatact + 5401 tcagtagaga aatacggttc ttatgggagt tatgggaatt acaggaaaca gaaaaaatag + 5461 gttgagggat agaaatgagt gaaaaactag caaagccttc agtagccata gtccagagtt + 5521 ttcttgttat tttattgact tatctactta gcgctgtgag agaaacagag attgtttcaa + 5581 caacagctat tgtactttat atcctccact attttgtctt ttatatcagt gattatggac + 5641 ggaatttctt taaaagggga tatttgattg aacttgtcca gacattgaaa tatatcctat + 5701 tctttgcgct agcgattagt atttctaatt ttttcttaga agatcgattt agtatttcca + 5761 gaagaggcat gatttacttc ctcttattac atgttttctt agtctatgtg ctaaacctat + 5821 ttatcaagtg gtattggaag cgggcttatc ccaactttaa aggaagtaag aaggttttcc + 5881 tacttacagc aacttctcat gtcgaaaagg tactggatag attaatagaa tcaaatgagg + 5941 ttgttgggga gttggtagcc gtcagtgttt tagataaacc agattttcag catgattatt + 6001 taaaggttgt agcagagggg gagatagtaa actttgcgac tcatgaggtg gtcgatgaag + 6061 tctttatcaa tcttccaagt gaaaaataca atattggaga gcttgtctct cagtttgaaa + 6121 cgatgggaat tgatgtaaca gtcaatctaa atgctttcga ttgggcacgt aacaagcaaa + 6181 ttcgtgagat ggcaggacta aatgttgtga ctttttctac aacattttat aagactagcc + 6241 atgtgattgc taagtggatt attgatattg tcggttccct 
ggtaggtttg atattatgtg + 6301 gtctagtcag tattgtgctg gttcctttga ttcgaaagga tgggggttct gctttttttg + 6361 ctcagacgcg tataggaaaa aatggccgcc atttcacttt ttataagttt cgctctatgt + 6421 gtgtagatgc tgaggataaa aagagagaac tcatggaaca aaataccatg cagggtggaa + 6481 tgtttaaggt ggacgatgat cctcgtatca cgaaaattgg tcattttata cggaagacga + 6541 gcttggacga gctaccacag ttttataatg ttctaaaggg agatatgagt ttggtaggta + 6601 cacgaccacc aacagtggac gagtatgaac actatacccc agaacaaaaa cgtcggctaa + 6661 gttttaaacc tggtataaca ggcttatggc aggtcagtgg acgaagtgag atcaagaatt + 6721 tcgatgaagt tgtcaagtta gatgtggcct atatagatga ttggacaatc tggaaagata + 6781 ttgagatttt attgaagaca gttaaagttg tattgatgaa ggatggagcg aaataggaaa + 6841 tgaaaatatg tttagttggg tctagtggag gtcatctgac tcatttatat ctattaaaac + 6901 ctttctggaa agataaggaa agattttggg ttacttttga taaagaggat acaagaagta + 6961 tcttgggaaa tgagacattt tatccttgtc attatcctac taatcgtaat ttgaaaaatc + 7021 ttattaaaaa tacggttctt gctttcaata ttttgagaaa ggaacgccct gatgttatca + 7081 tctcatcagg ggctgctgta gcagttcctt tcttttacct aggaaaacta tttggcgcta + 7141 agacagtcta cattgaagtt tttgatcgta ttgatgcgcc aaccttaaca ggaaaaatag + 7201 tatatccagt aacagataag ttcatagttc agtgggagga aatgaaaaaa gtatatccaa + 7261 aagcaattaa tctcggaggg attttctaat gatttttgtg acaataggta ctcatgagca + 7321 acagtttaat cgacttatta aagaagttga tagattaaaa ggtgagggat ttattcagga + 7381 tgatgttttt attcagactg gtttttcaga ttatgaacca gtgtattgtc aatggaagaa + 7441 tctgatttct tatgatgaga tgaatcgcta tatagatgaa gcaaatatta tcattacaca + 7501 tggcggccca gctacattta tggcagttat tgctaaagga aaaataccaa tagttgttcc + 7561 gagattaaag aagtttggtg agcatgtgaa tgatcatcag atggaatttt gttctaaaat + 7621 actatccgaa gggtatgaat tatctctgat taatgatata agcgaattgc agtatagttt + 7681 aaagcaagaa aagaaaacta aattttactc taataataca tgttttctta agaaattatc + 7741 aaaaacaatt gaagatttaa tagtatgaaa tgagattatt tattcttgtt gcagataaat + 7801 taaaaataaa tgaaatttta agtcaagtag ttgtgctaaa atgtatttat gattaagaat + 7861 aaaataatca ctattcctat atatggaaat agttcttaaa gcatagttta aattatggat + 7921 
gtagattatt tcgttaactc ttataatcaa tttataaggc cagatagtaa cattattaaa + 7981 atcatagcta ggagtaaggg aggatgtaaa tgaaaatact acacattcca acaggtggtt + 8041 tattttctga tggtatagga acttttattt attcatattt agagtatatg gacttaaaca + 8101 agtatgatgt gacaatttta gccactaatt cccctttgaa aagtgataag gaaaaatttg + 8161 aatgtttagg ggttaaagtt attgaaattg aaagaaaaaa atcaaacctt tctaaatatg + 8221 tatacaaatt aaaaaaaata ataaaaaaag aaaaatttga cattatacat gttcacggaa + 8281 gtagcgcctt aatgtcaatt gaattactga ctgctaaagt tgctggtatc ccagttcgaa + 8341 ttgcccatag tcataacact acttgtgagc atcataaatt agataaacta ctacgaccga + 8401 tattttatcg agtttatact caggcatgtg cttgtagtgt tagtgctggt caatggcttt + 8461 ttgaggaaaa aaattataag attatccata acgctagaga tgtaaatagg tatcagtatg + 8521 atgccataaa acgaaaaaaa cttagagaag aattgttgct atctgatgag actattgctc + 8581 taggtcatgt tggacgtttt aatactcaaa aaaatcaatg ttttctagtg tctctaatgg + 8641 aaaaattagt aatcaaaaat atagatataa aattattttt agtagggaca ggtgatactt + 8701 tggaagaaat caagaaatta gtcattcaga aaaaactaga agataacatt gtttttttag + 8761 gtcaatttga tgatatgaaa tcttttgtgt catcaatgga tataatgttg cttccaagtt + 8821 tatatgaagg gttaccacta gtatctgttg aatggcaaat caacggagta gaaagtatcc + 8881 tatctgaccg tgttacacaa gagtgtatct atacaggaac tgttcaacaa ttatctatcg + 8941 atagcatgga attatgggaa aaagaaattt tgaatttatc tacttcagat agagaaagag + 9001 tgtcattgca aaatattcag ttgataaaaa atgcaggtta tgatatttct ttagaagtta + 9061 aagaaataga agaattatat aattcacttt atgatattgc gaattgaatg aaagggaaga + 9121 gttttctttt gaagatgtta caaaatttaa aaccaataaa acggaaatta aaaccaatta + 9181 agagaactta taagagaatc gtttattcta tcactaagtc aaatatgagg aagaggctca + 9241 aaaatacaga tttttcaatt atcagtgata attgctgggg aggacgggta tatgaagaat + 9301 tgggtctgcc gtatagaaca ccatttatag gtctgtatat tttttccgag gattatgtga + 9361 aactgttgaa aaacttcaga aagtatatgg aatatgagct aacttttacc aataattcaa + 9421 aatggaacac agaatatgac ggggagtatc ctataggcat acttaaggat attgaacttc + 9481 attttttaca ttatgctaat caagaagagg cttatgagaa atggaataaa agaaagaaca + 9541 ggattaatta tgaaaatatc 
ttttttaaga tgaatgatga taataaatgt tctttgaaat + 9601 tgcttaagga atttgatact ttagatttga aaaataaaat tatttttgct gcattcaatt + 9661 ataaagaact agataatctt attcatttta ccgatcctag agggaatggt aatgtaggta + 9721 cagacttatt ttattatgat caatattttg atgttgtaaa ttggctgaat ggagagacac + 9781 aaacatgata cctaaaaaga ttcattattg ttggttcggt ggcaaacctt tatcaaatga + 9841 tgtaaagcga tgtatagcaa gttggaaaaa attttgtcct gattatgaaa ttattgaatg + 9901 gactgaaaaa aacttttgta ttgaaaatca aaatcaattt gttcaggatg catatagaga + 9961 taaagcatgg gcttttgtaa gcgattatgc aagacttaaa attatatatg aaaatggagg + 10021 tatttattta gatactgatg ttgaagtgat taaaaatcta gataagttgt tggaaaataa + 10081 agcattcttt ggagttcatc aagttaatca tctagttagt acaggattag ggtttggatc + 10141 ggaaaagggc acctctattt taaaggagtt attaaatttg tatgatgaaa tagaatttga + 10201 tcttagtaag aaagatgaat tgttatgtcc tgaattaaat acacctgtat ttaaacgtct + 10261 tggttatact tattctgact gtgttgtaaa aaacgaatat ttcacaatct atcctgaaga + 10321 atattttgat ccgatttctt tgggtgatgg cgtagaaaat attttatcag ataaaacatt + 10381 ctctattcat cattatagtg cttcttggac ttccttaaga aatcagatga agagcaaaat + 10441 aattcgtaaa ctaggcagaa gtaatatctt ggagttaaaa agaatattaa aggggaaaac + 10501 tagatgagaa tatcaccttc gaagctgata tttgcatttt ttagcagctt ttatattctt + 10561 gtaatccttt tcccaagagg aatttttcta ggacattcta ctttagcttc tcgattatgg + 10621 attatttaca atggaagttt atatttatca atattacttg gtttaatata tgttatttta + 10681 aaaatattat ctcgaaatat cgccattcat cagcatgctt ttttcatctt acaatattat + 10741 tttattgtaa ttattttaac tttcatggta agtgggtcaa tcggtgttgg gctacaatcg + 10801 attttctatc caatattcat ctatttattt tttaatgaag ttcgagataa gaaatcaata + 10861 gtgttaattt ttgatatctt tctttatata cttactcctt tattcgttat caatacgatt + 10921 gatgtttttc tgaatttcac aaatattttt catattactt ttttaggaca tgttcaggtg + 10981 atttcccaat atagtgttat cggatttctc gtatcagcat attacttatt agaagaaaag + 11041 agaaatatat tagtggcaca gttgctgttg attttaacga ttatcaattg ttttttttca + 11101 gatgtctctc tctctaaagt tattgctttg tttatgattg tttatattat ttcatacaag + 11161 ttaagaaaac tattctggaa 
aagaggaagg aagatatctg ttgtaacttt tattgcatct + 11221 gttgtgatgt tagcattagt aatttttgga tattttttac catatcttag atattttgat + 11281 tttactttta atggtcgata ccaaatttgg cgcattgtgt atgctaccat tcttcaagtg + 11341 aaatggtttg gatatggttt gtttggcttt caatttaaac ttccgtggca gaaattggga + 11401 gaagttggaa taaattacac tcataatcaa gttttacagt tagcacttga tagtggtatt + 11461 gttgggatta tctcattctt tactatgatt ttttatatga tcttttcaac taaaaatatt + 11521 caaaattcca caataagctc tctatttatt tttgcctatt tttgtctatt tattataatg + 11581 tttatagaga gtgtcactta ttacccatac tattttatta taatagttct tcagactttg + 11641 tacttaaaat tggaaagaga aagaaatgtt aaatagattg ataagaaatt ttaataaagt + 11701 atattatagt tatcgtataa aaagaaaggc agcgcaatgc ggtgggagag tgtatacggg + 11761 aggcaaaacg tttgttactg caaatacgta ccttgatgaa aatgtttcat ttaatggtat + 11821 gtcaatgtat ggtgaaggga aaataagcat tggtaaaaat tttcattcag gattgaattg + 11881 ccaaattatc acttcctttc ataattatga cttgggcgat aaaattcctt atgatgagag + 11941 ttatatacat aaagacgtct taattgaaga taacgtctgg gtaggaaata atgtgataat + 12001 tttaggtggt gcgattattg aggaaggtgc aatcattcaa gcaggaagta cagttattgg + 12061 aagaattcca gcaggtgcaa ttgcaggtgg acatccagca aaaccattca gatttagaaa + 12121 catggaacat tataatcaac ttaaacggca aaaaaagttt cattagaggt taagaatgaa + 12181 tattgtaagt tatctaaaaa aaaacggtat tacacatact ttaaaaatta ttaatgaata + 12241 taaaatgcaa gagctgtttg atagtcttgt tagtattttt acaaagcaga aggaacttcg + 12301 taacagtatt gtcattgaat gtcatactga ttttgaaaat aatggtggtg cgttctatga + 12361 ctatctaatc aataatgagt ataataaaaa atataaaatt gtcttactat tgaaggataa + 12421 attagttaaa gaattaccag aaaatgtaga ttatttttat ttaagaaagc ccagtttacg + 12481 aaaatcctat gtaatgtcat taagtaaatt ctttactttt gataatgata tgcttcgtaa + 12541 atatagaaaa gatcaaaaac acttttattt aacacatgga tgctttcctt taaaaagtac + 12601 aataggtaaa ataacagttc cgaattatgt tgattttgtt ctatctccct cgggcaatgt + 12661 agataatatt atagttaagc agtttggatt aacatctaaa gagcaatgtc ttcacactgg + 12721 atttccgtgt catgatatct tttattcaaa accagaacct ctagtatttt tatctaatta + 12781 tgataaaaaa attatctggg 
caccaacttt tagaaagggt ggtggctata atagaaatga + 12841 tagtacagct agctatcctt taggcattcc gttacttgaa acactagatg aactggcaaa + 12901 cctaaacaca tatctaagcc aacgggatat tgccctgatt gtaaagttac atccaatgca + 12961 agatatttca gatttggagt tgaaacaatt tagtcatatt aagtttctga caaatcaaga + 13021 tttgaatcgt aaaaatacaa atctgtatca attgctgatg aattcagatg ctttactcag + 13081 tgactattct gcaatctcgt atgattattt acaccttgat aaaccaatag ggtatgtttt + 13141 ttcggatcta aatgattata agttggggct ttcagttgat aatgtagatg attacatagc + 13201 aggagataag atactgtctt ttaacaactt gctgcacttt attgataaca tttatctaga + 13261 aattgataaa aataaagaaa aacgcaagga attatttaat aaaatatttg aaaaacagga + 13321 tggagaatcg tgtgaaagat tggcacaaat tatggaatta taaaagccgt tacgaagaaa + 13381 tgtctgtcgg gatgaaagcg gcactctggt atactgttgc aaattttatt caaaagggtt + 13441 ttgtatttct ttcaactccg attttaacca gaatacttaa tgttaatgat tacggtacat + 13501 tgatacttta ccaatcatgg tttgtactat ttgctatttt tgcgaccttg aatctttctc + 13561 aaacagctta taataaggga ttggtagaat ttgagaatga taaagataat tttacatttt + 13621 ctttgttgtt tttgtctaag actattacta taattgttgc ttttttatat tttactttta + 13681 atatactggt taaagatagt actggattaa ctcccagttt catgatattt ttattcagtg + 13741 atatcttatt taatattagt atagaatttt atttggcacg tcagagattt gaattcaaat + 13801 atagaaaagc agttctaatt tcaacttttt caagtttttt tattgtagct attagtacaa + 13861 ctatcttatt agcgattaag aatgatttat tcattaaaat tgtattggat gctattatcc + 13921 gaattatctt tggtttatat tgtttttatc tcttgttttt ttcagggaga aggcaactta + 13981 agatagaaaa aaaatatatt aaatatggtt tgagttattc attacctttg ataccgcatt + 14041 tcttatcgca ctatattttg aatcagtctg accgtttgat gattaacatg tttgatggta + 14101 aggagaaatt agctatatat agtctagctt attctgtatc aatgattatg tttttgttta + 14161 ctaatgcaat taatcaatca ataatgccgc atacatttca agctttgaaa aaaaaggatt + 14221 attgtgggat acatgggagc accaaatggc tttttgtagt agttgggggg attacagctc + 14281 tctcaattct atttgcacca gaactaattg ttattttagg cggcaataaa tataaggaat + 14341 caatttggct agtacctcca attgccatct cggtttattt cctttttgta tattctatgt + 14401 ttagtaatat cagtttttat 
tataagatga ataagctgat ttcgttagtt tccacaggtg + 14461 cggctctttc aaatattatt ttaaattata tttttattaa tatatttggg tatcaagctg + 14521 cagcttacac tacattatta tgctatatat tgttggcgtt ttctcatttt ttcttatata + 14581 gatttttatt aaaaaaagag gaaattcatg aggaacttta taacatgaag atgattttaa + 14641 taatatcttt aatattatta ataatactat ttttgatact tgttatttat aacttagcca + 14701 ttataagata tgcaattatt gcaattattt tatttctttt gtttacaaag agaaataaaa + 14761 taattacatc gctaaaaagt tgatattgaa aatttagaat caaataaaga atatagtgga + 14821 tatcaagcca gtattaataa tgaataattg tttttatgta atttaagatt aataaaaaaa + 14881 ttgaaaggaa atatcaatga aaagagtaat tacttatgga acctttgatt tgcttcatta + 14941 tggacatatc aatttgttaa agagagcaaa gcaattagga gattatctca ttgttgtagt + 15001 ttcaagcgat gagttcaatt tgaaagaaaa aaataaagtt tgttacttta attttgaaca + 15061 tagaaaaaat ttggttgaag caataagata tgttgatctg gtgatttctg aaacaagctg + 15121 ggaacagaaa aaaacagata ttaaagaata tcacattgat acatttgtta tgggggatga + 15181 ttggaaggga aaatttgatt atttaaaaga agaaggagtg gaagtaattt atttaccaag + 15241 aactaaagaa atatctacaa ctaaaattaa agaagattta gcagattaga ttttttacaa + 15301 aaatattttg agttcagata ataaatttgt ttctataatt attaatgtct tgactattta + 15361 aatcttattt taaaaaaatc tagtttaaga tatgaaagaa aattttatcc ataactatca + 15421 tattattggc aatatatatt gtgataatgt atgggaagtt agtagatatg aatgtgatat + 15481 atagctagaa ttaatattat tcattgctat ttaaaatgta ggtaagaatg tattagattt + 15541 agcataaaat tagaaaacaa gctatttttt ctgtgaaatt aggtagatat acaataatat + 15601 ttgtattgtt agagaaagaa atcttaatat tgtaatgggg gcattttgaa ttgactaaag + 15661 taagaattaa ttgggtagat tttgggaaag gatttgcaat attcttagtt ctagtagggc + 15721 atgtatttat tggtttatct gaatccaata agttttcaat tgcaaatgat gtgttattat + 15781 tcctgatagc tcaaatctat atatttcata taccagtgtt ttttgcgtta tcaggatact + 15841 ttttcagacc tgtatcagat ttgaaggaat tttggtatta tgctaaaaag aagacaatta + 15901 ttttaggcat accatatatt ttttattcaa ttattcactt ttgtcttcaa aagcttgctg + 15961 gtgcttctgt gagagtaccc actacgatac ataatctatt aaatatatat agatatcctt + 16021 tgggagtttc atggtatcta 
tatacgctat ggtcgatatt gatagtttat ggtttactat + 16081 ctattgtttt caaaaatcgt aagtctctct ttttagttag tgtttttgcc tatattttta + 16141 cactatttat tcaaattgat atttttattg tacaacggac gttggtttgg gggatttgtt + 16201 tctttcttgg cagtgtattg agtgaaattc actttgataa aattaatttg aaaaaatttc + 16261 tttttttctt tgtgttattt gattttattt atatgttcgc ttggttcttg ttttatgaag + 16321 tagggtctaa gaaggattat gtaagctata ttaacccagg tttgtggggg attgctttta + 16381 ttgtctgtgt attagttgct tttgcgattt ttcctaaaat ggagaaaaat tttcctaaaa + 16441 ctttcctata tttcactaaa tacgggaaag atagtttagg gatctatatt cttcatgcac + 16501 caatttgtag catgattcgg attctaatgt tgaaagtggg aataaactca gtttttcttc + 16561 acgttgttgt tgggattgtg ctaggctggt atttatccat actagcaact tatatattga + 16621 aaaaaattcc atttttgaat attgttttat taccacaaaa gtatattaaa ttaaaataaa + 16681 ttattttaga tttataatgt ggctctttgt caactaacat ctggagagga caatcactgt + 16741 cttctctttt tttgtctttt cagaatatac caaattaaca caaaaattct gaaaattctg + 16801 ttgacatctt tctgaaaaga gtttataatg gagagaaagt tttaaaggag aaaatgatga + 16861 aaagttcaaa actatttgcc cttgcgggcg tgacattatt ggcggcgact actttagctg + 16921 catgctctgg atcaggttca agcactaaag gtgagaagac attctcatac atttatgaga + 16981 cagaccctga taacctcaac tatttgacaa ctgctaaggc tgcgacagca aatattacca + 17041 gtaacgtggt tgatggtttg ctagaaaatg atcgctacgg gaactttgtg ccgtctatgg + 17101 ctgaggattg gtctgtatcc aaggatggat tgacttacac ttatactatc cgtaaggatg + 17161 caaaatggta tacttctgaa ggtgaagaat acgcggcagt caaagctcaa gac +// + diff --git a/public/res/serotype_genbank/serotype_11E.gb b/public/res/serotype_genbank/serotype_11E.gb new file mode 100644 index 0000000..f607300 --- /dev/null +++ b/public/res/serotype_genbank/serotype_11E.gb @@ -0,0 +1,706 @@ +LOCUS 11E 14880 bp DNA linear UNK 10-JUN-2024 +DEFINITION 11E, whole genome shotgun sequence. +ACCESSION 11E +VERSION 11E +KEYWORDS . +SOURCE None + ORGANISM . + . 
+COMMENT Annotated with Bakta + Software: v1.9.3 + Database: v5.1, full + DOI: 10.1099/mgen.0.000685 + URL: github.com/oschwengers/bakta + + ##Genome Annotation Summary:## + Annotation Date :: 06/10/2024, 16:47:36 + CDSs :: 17 + tRNAs :: 0 + tmRNAs :: 0 + rRNAs :: 0 + ncRNAs :: 0 + regulatory ncRNAs :: 0 + CRISPR Arrays :: 0 + oriCs/oriVs :: 0 + oriTs :: 0 + gaps :: 0 + pseudogenes :: 0 +FEATURES Location/Qualifiers + source 1..14880 + /mol_type="genomic DNA" + gene 10..1455 + /locus_tag="KBDEHD_00005" + /gene="wzg" + CDS 10..1455 + /db_xref="BlastRules:WP_000091082" + /db_xref="RefSeq:WP_044812598.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000598E649" + /db_xref="UniRef:UniRef100_A0A4P8GBG2" + /db_xref="UniRef:UniRef50_G3G7D5" + /db_xref="UniRef:UniRef90_Q9R928" + /db_xref="UniprotKB:Q4K240" + /db_xref="UserProtein:wzg" + /product="""integral membrane regulatory protein Wzg""" + /locus_tag="KBDEHD_00005" + /protein_id="gnl|Bakta|KBDEHD_00005" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAFR + YLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLLFSILVSSVSLFAVQQFVGLTNRLN + ATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLTVDQ + SSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAPKTSK + NQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADGGNNQK + DKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQEFSALH + GKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTSTEALKNYS + TIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDLPSYAMPDSNLY + VMEIDDSSLAVVKAAIQDVMEGR" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_044812598.1" + /gene="wzg" + gene 1457..2188 + /locus_tag="KBDEHD_00010" + /gene="wzh" + CDS 1457..2188 + /db_xref="BlastRules:WP_000565352" + /db_xref="RefSeq:WP_044812597.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000598FDB7" + /db_xref="UniRef:UniRef100_A0A4P8GCD5" + /db_xref="UniRef:UniRef90_Q9AHD4" + /db_xref="UniprotKB:Q4K239" + /db_xref="UserProtein:wzh" + 
/product="""protein-tyrosine phosphatase Wzh""" + /locus_tag="KBDEHD_00010" + /protein_id="gnl|Bakta|KBDEHD_00010" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAEAYRQGMRTIVSTSHRRK + GMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDSRY + ALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYTQVN + SSHVLKPKLFGERYKFMKKRAQYFLEQDLVHVIASDMHNLDGRPPHMAEAYDLVTQKYG + EAKAQELFIDNPQKIVMDQLI" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_044812597.1" + /gene="wzh" + gene 2197..2889 + /locus_tag="KBDEHD_00015" + /gene="wzd" + CDS 2197..2889 + /db_xref="BlastRules:WP_000664160" + /db_xref="RefSeq:WP_044812595.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000598C59E" + /db_xref="UniRef:UniRef100_A0A222C8Q5" + /db_xref="UniRef:UniRef50_Q54519" + /db_xref="UniRef:UniRef90_A0A139PG18" + /db_xref="UniprotKB:Q4K238" + /db_xref="UserProtein:wzd" + /product="""capsular polysaccharide biosynthesis protein + Wzd""" + /locus_tag="KBDEHD_00015" + /protein_id="gnl|Bakta|KBDEHD_00015" + /translation="MKEQNTIEIDVFQLFKTLWKRKLMILIVALVTGAGAFAYSAFIVK + PEYTSTTRIYVVNRDQGDKPGLTNQDLQAGSYLVKDYREIILSQDVLEKVATNLKLDMP + AKTLASKVQVTVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDVTTLE + EARPATTPSSPNVRRNSLFGFLGGAVVTVSAVLLIELLDTRVKRPEDVEDVLQIPLLGV + VPNLDKMK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_044812595.1" + /gene="wzd" + gene 2899..3579 + /locus_tag="KBDEHD_00020" + /gene="wze" + CDS 2899..3579 + /db_xref="RefSeq:WP_044812593.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000598E5C1" + /db_xref="UniRef:UniRef100_UPI000598E5C1" + /db_xref="UniRef:UniRef50_Q54520" + /db_xref="UniRef:UniRef90_O84996" + /product="Tyrosine-protein kinase wze" + /locus_tag="KBDEHD_00020" + /protein_id="gnl|Bakta|KBDEHD_00020" + /translation="MPTLEISQAKLDFVKKAEEYYNALCTNLQLSGDDLKVFSITSVKL + 
GEGKSTTSTNIAWAFAHAGYKTLLIDGDIRNSVMLGVFKARDKITGLTEFLSGTTDLSQ + GLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVIDAA + IITRKCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGVVLNKFDTSVDKYGSYGDYG + KNKK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_044812593.1" + /gene="wze" + gene 3594..4961 + /locus_tag="KBDEHD_00025" + /gene="wchA" + CDS 3594..4961 + /db_xref="RefSeq:WP_044812591.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000598EC9A" + /db_xref="UniRef:UniRef100_A0A4P8GB07" + /db_xref="UniRef:UniRef50_Q8VU30" + /db_xref="UniRef:UniRef90_Q8VU30" + /db_xref="UniprotKB:Q4K290" + /db_xref="UserProtein:wchA" + /product="""undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)""" + /locus_tag="KBDEHD_00025" + /protein_id="gnl|Bakta|KBDEHD_00025" + /translation="MNGKIVKSSLAIIQSFLVILLTYLLSAVREAEIVSTTAIALYILH + YFVFYISDYGQNFFKRGYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYFLT + VHALLVYVLNLFIKWYWKRAYPNFKGSKKILLLTATSRVEKVLDRLIESNEVVGELVAV + SVLDKPDFQHDCLKVVAEGEIVNFATHEVVDEVFINLPSKKYNIGELVSQFETMGIDVT + VNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHVIAKRIIDIVGALVGLILCGLVS + IVLLPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTMQGGMFK + VDDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPEQKRRLSF + KPGITGLWQISGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVFMRDGAK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_044812591.1" + /gene="wchA" + gene 4965..5414 + /locus_tag="KBDEHD_00030" + /gene="wchJ" + CDS 4965..5414 + /db_xref="GO:0016740" + /db_xref="RefSeq:WP_044812590.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000598C6EA" + /db_xref="UniRef:UniRef100_A0A4P8GCT4" + /db_xref="UniRef:UniRef50_J9W567" + /db_xref="UniRef:UniRef90_Q4K1M2" + /product="PssD/Cps14F family polysaccharide biosynthesis + glycosyltransferase wchJ" + /locus_tag="KBDEHD_00030" + /protein_id="gnl|Bakta|KBDEHD_00030" + 
/translation="MKICLVGSSGGHLTHLYLLKPFWKDKERFWVTFDKADARSVLSEE + VVYPCYYPTNRNIKNLIKNTFLAYKILKKERPDLIISSGAAIAVPFFYIGKLFGSKTVY + IEVFDRIDAPTITGKLVYPVTDRFIVQWEEMKKIYPKAINLGGIF" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_044812590.1" + /gene="wchJ" + gene 5414..5893 + /locus_tag="KBDEHD_00035" + /gene="wchK" + CDS 5414..5893 + /db_xref="KEGG:K25904" + /db_xref="RefSeq:WP_044812589.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000598BC25" + /db_xref="UniRef:UniRef100_A0A4P8GCW3" + /db_xref="UniRef:UniRef50_Q4K216" + /db_xref="UniRef:UniRef90_Q4K216" + /product="Putative glycosyl transferase" + /locus_tag="KBDEHD_00035" + /protein_id="gnl|Bakta|KBDEHD_00035" + /translation="MIFVTVGTHEQQFDRLIKEFDRLKEENLIQEEVFIQTGYSNYVPK + YCKWEKIISYEKMNQFIEEADTIVTHGGPATFMAIIAKGKTPIVVPRQKKFGEHVNDHQ + MNFCSKISSEGYELSLINDISELQYSLKQEKKTKFYSNNANFLKQLSKIIEDLIV" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_044812589.1" + /gene="wchK" + gene 6135..7232 + /locus_tag="KBDEHD_00040" + /gene="wcyK" + CDS 6135..7232 + /db_xref="RefSeq:WP_044812587.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000598DB13" + /db_xref="UniRef:UniRef100_A0A4P8GC17" + /db_xref="UniRef:UniRef50_A0A428BKJ5" + /db_xref="UniRef:UniRef90_Q4K233" + /db_xref="UniprotKB:Q4K233" + /db_xref="UserProtein:wcyK" + /product="""putative glycosyl transferase""" + /locus_tag="KBDEHD_00040" + /protein_id="gnl|Bakta|KBDEHD_00040" + /translation="MKILHIPTGGLFSDGIGTFIYSYLEYMDLNKYDVTILATNPLLKS + DKEKFEYLGVKVIEIERKKSNLSKYIYKLKKLMKKEKFDIIHVHGSSALMSIELLTAKI + AGIPVRIAHSHNTTCEHHKLDKLLRPIFYRVYTQACACSVSAGQWLFEEKNYEIIHNAR + DVNKYQYDAIKRKKLREELLLSDETIALGHVGRFNTQKNQRFLVSLMERLVIKNIDLKL + FLVGTGDTLEEIKKLVIQKKLEDNIVFLGQFDDMKSFVSSMDIMLLPSLYEGLPLVSVE + WQINGVKSILSDRVTQECIYTETVQQLSIDSMELWEKEILNLSTSDRERVSLQNIQLIR + NAGYDISLEVKEIEELYNSLYDIAN" + /codon_start=1 + /transl_table=11 + 
/inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_044812587.1" + /gene="wcyK" + gene 7260..7928 + /locus_tag="KBDEHD_00045" + /gene="wcwC" + CDS 7260..7928 + /db_xref="RefSeq:WP_044812604.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000598E4C8" + /db_xref="UniRef:UniRef100_A0A222C8N3" + /db_xref="UniRef:UniRef50_A0A222C8N3" + /db_xref="UniRef:UniRef90_A0A222C8N3" + /product="Putative acetyl transferase" + /locus_tag="KBDEHD_00045" + /protein_id="gnl|Bakta|KBDEHD_00045" + /translation="MLQNLKLIKRRLKPIKRKLKPIKRTYKKIVYSITKSNMRKRLKNT + DFSIISDNCWGGRVYEELGLPYRTPFIGLYIFSEDYVKLLKNFKKYMEYELTFTNNSKW + NTEYDGEYPIGILNDIEIHFLHYSSMEEAYKKWNKRKKRINYKNIFFKMNDDNKCSLKL + LKEFDTLDLKNKIIFAAFNYKELDNLIHFTNPIGNGNVGADLFYYNKYFDVVNWLNGEY + " + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_044812604.1" + /gene="wcwC" + gene 7931..8653 + /locus_tag="KBDEHD_00050" + /gene="wcrL" + CDS 7931..8653 + /db_xref="RefSeq:WP_044812586.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000598EF0B" + /db_xref="UniRef:UniRef100_A0A4P8GCY9" + /db_xref="UniRef:UniRef50_Q4K285" + /db_xref="UniRef:UniRef90_A0A4P8GCY9" + /product="Putative glycosyltransferase" + /locus_tag="KBDEHD_00050" + /protein_id="gnl|Bakta|KBDEHD_00050" + /translation="MIPKKIHYCWFGGKPLPNDVKRCIASWRKFCPDYEIIEWTEKNFC + IQNQNQFVKDAYKNKAWAFVSDYARLKIVYENGGIYLDTDVEIIKKLDLLLDNTAFFGV + HQVNHLVNTGLGFGAEKGSFILKELLDSYDEVKFDINKKDELLCPELNTQIFKQLGYVY + SNSVIKSQYFTIYPEEYFDPISLGDEVANILSDKTFSIHHYNASWTSLMNRVKRKIIRK + LGRSNVSELKRILKGKTR" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_044812586.1" + /gene="wcrL" + gene 8650..9822 + /locus_tag="KBDEHD_00055" + /gene="wzy" + CDS 8650..9822 + /db_xref="RefSeq:WP_044812585.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000598B141" + /db_xref="UniRef:UniRef100_A0A4P8GBH0" + 
/db_xref="UniRef:UniRef50_Q4K230" + /db_xref="UniRef:UniRef90_Q4K230" + /db_xref="UniprotKB:Q4K230" + /db_xref="UserProtein:wzy" + /product="""oligosaccharide repeat unit polymerase Wzy""" + /locus_tag="KBDEHD_00055" + /protein_id="gnl|Bakta|KBDEHD_00055" + /translation="MRISPSKLIFAFFSSFYILVILFPRGIFLGHSTLASRLWIIYKES + LYLSILLGSIYVILKILSRNIAIHQHAFFILQYYFIVMILTFMLSGSIGDGVQSIFYPI + FIYLFFNEVRDKKSIVLIFDIFLYILTALFVINTIDIFLNFTNIFHVTFLGHVQVISQY + SILGFLVSAYYLLEEKRNILVAQLLLILTIINCFFSDVSLSKAIALFMIIYIISYKLKK + LFWKRGRKISVITFIASVVMLALVIFGYFLPYLRYFDFTFNGRYQIWRIVYATILQVKW + FGYGVFGFQFKLPWQELGEIGINYTHNQILQLALDSGIVGIISFFTMIFYMIFSTKNIQ + NPAIGSLFIFAYFCLFIIMFIESVTYYPYYFIIIVLQTLYLKLERERNVK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_044812585.1" + /gene="wzy" + gene 9812..10312 + /locus_tag="KBDEHD_00060" + /gene="wcwT" + CDS 9812..10312 + /db_xref="RefSeq:WP_044812583.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000598AF11" + /db_xref="UniRef:UniRef100_A0A4P8GCE2" + /db_xref="UniRef:UniRef50_K2QI84" + /db_xref="UniRef:UniRef90_A0A4P8GCE2" + /db_xref="UniprotKB:Q4K229" + /db_xref="UserProtein:wcwT" + /product="""putative acetyl transferase""" + /locus_tag="KBDEHD_00060" + /protein_id="gnl|Bakta|KBDEHD_00060" + /translation="MLNRLIRNFNKVYYSYRIKRKAAQCSGRVYTGGKTFVTANTYLDE + NVSFNGMSMYGEGKISIGKNFHSGLNCQIITSFHNYDLGDKIPYDESYIHKDVLIEDNV + WVGNNVIILGGAIIEEGAIIQAGSTVAGRIPAGAIAGGHPAKPFRFRNMEHYNRLKRQK + KFH" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_044812583.1" + /gene="wcwT" + gene 10322..11509 + /locus_tag="KBDEHD_00065" + /gene="wcwU" + CDS 10322..11509 + /db_xref="RefSeq:WP_044812582.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000598B077" + /db_xref="UniRef:UniRef100_A0A4V1E867" + /db_xref="UniRef:UniRef50_A0A4V1E867" + /db_xref="UniRef:UniRef90_A0A4V1E867" + /db_xref="UniprotKB:Q4K228" + 
/db_xref="UserProtein:wcwU" + /product="""putative glycerol phosphotransferase""" + /locus_tag="KBDEHD_00065" + /protein_id="gnl|Bakta|KBDEHD_00065" + /translation="MNIVSYLKKNGITHTLKIINEYKMQELFDSLVSIFTKQKELRDSI + VIECHTDFENNGGAFYDYLINNEYNKKYKIVLLLKDKLSKELPENVDYFYLRKPSLRKS + YVMSLSKFFTFDNDMLRKYRKDQKHFYLTHGCFPLKNTIGKITVPNYVDFVLSPSGNVD + NIIVKQFGLTSKEQCLHTGFPCHDIFYSKTEPLVFLSDYDKKIIWAPTFRKGGGYNRND + STASYPLGIPLLGTLDELAHLNTYLSQRDIVLIVKLHPMQDISDLELKQFSHIKFLTNQ + NLKRKNINMYQLLMNSDALLSDYSAISYDYLHLDKPIGYVFSDLNDYKLGFSVDNVDDY + IAGDKIMSFNDLLHFIDNIYLEIDKNKEKRKELFNKIFEKQDGESCERLAQIMEL" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_044812582.1" + /gene="wcwU" + gene 11478..12929 + /locus_tag="KBDEHD_00070" + /gene="wzx" + CDS 11478..12929 + /db_xref="RefSeq:WP_226957940.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000598F25F" + /db_xref="UniRef:UniRef100_A0A4P8GDQ5" + /db_xref="UniRef:UniRef50_Q4K244" + /db_xref="UniRef:UniRef90_Q4K244" + /db_xref="UniprotKB:Q4K227" + /db_xref="UserProtein:wzx" + /product="""flippase Wzx""" + /locus_tag="KBDEHD_00070" + /protein_id="gnl|Bakta|KBDEHD_00070" + /translation="MKDWPKLWNYRRRYEEMSVGMKAALWYTVANFIQKGFVFLSTPIL + TRILNVNDYGTLILYQSWFVLFAIFATLNLSQTAYNKGLVEFENDKDNFTFSLLFLSKI + ITIIVAFLYFTFNILVKDSTGLTPGFMIFLFSDILFNISIEFYLARQRFEFKYRKAVLI + SISSSFLIVAISTTILLVIKNDLFIKIVLDAIIRIIFGLYCFYLLFFSGRRQLKIEKKY + IKYGLSYSLPLMPHFLSHYILNQSDRLMINMFDGKEKLAIYSLAYSVSMIMFLFTNAIN + QSIMPYTFQALKKKDYRGIHGSTKWLFITVGGVTVLSILFAPELIVILGGNKYKESIWL + VPPIAISVYFLFVYSMFSNISFYYKMNKLISLVSTGAALSNIILNYIFINIFGYQAASY + TTLLCYILLAFSHFFLYRFLLKKEEIHEELYNMKMILIISLILLTILFLILVIYNLAFI + RYAIIVIIVFLLFTKRNKIITSLKS" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_226957940.1" + /gene="wzx" + gene 13042..13434 + /locus_tag="KBDEHD_00075" + /gene="gct" + CDS 13042..13434 + /db_xref="EC:2.7.7.39" + /db_xref="GO:0047348" + 
/db_xref="RefSeq:WP_044812580.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000599019D" + /db_xref="UniRef:UniRef100_A0A4P8GB25" + /db_xref="UniRef:UniRef50_F9PIZ6" + /db_xref="UniRef:UniRef90_Q9AH85" + /db_xref="UniprotKB:Q4K226" + /db_xref="UserProtein:gct" + /product="""CDP-glycerol-1-phosphate biosynthetic protein + Gct""" + /locus_tag="KBDEHD_00075" + /protein_id="gnl|Bakta|KBDEHD_00075" + /translation="MKRVITYGTFDLLHYGHINLLKRAKQLGDYLIVVVSSDEFNLKEK + NKVCYFNFEHRKNLVEAIRYVDLVIPETSWEQKKTDIKEYHIDTFVMGDDWKGKFDYLK + EEGVEVVYLPRTKEISTTKIKEDLAD" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_044812580.1" + /gene="gct" + gene 13852..14253 + /locus_tag="KBDEHD_00080" + CDS 13852..14253 + /db_xref="RefSeq:WP_226957675.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0005E2493E" + /db_xref="UniRef:UniRef100_A0A4P8GCT8" + /db_xref="UniRef:UniRef50_Q8KWN9" + /db_xref="UniRef:UniRef90_Q8KWN9" + /note="Inactivated wcjE gene" + /product="Putative O-acetyltransferase wcjE" + /locus_tag="KBDEHD_00080" + /protein_id="gnl|Bakta|KBDEHD_00080" + /translation="MTKVRINWVDFGKGFAIFLVLVGHVFIGLYESNKFSIANDVLLFL + IAQIYIFHIPVFFALSGYFFRPVSDLKEFWHYAKKKTIILGIPYIFYSIIHFCLQKVAG + ASVRVPTTIFNLLNIYKFPLGVSWYLYTL" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_226957675.1" + gene 14260..14880 + /locus_tag="KBDEHD_00085" + CDS 14260..14880 + /db_xref="RefSeq:WP_235787786.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0005E795C0" + /db_xref="UniRef:UniRef100_UPI0005E795C0" + /db_xref="UniRef:UniRef50_A0A6C7J428" + /db_xref="UniRef:UniRef90_A0A4J1ZXX5" + /note="Inactivated wcjE gene" + /product="Putative acetyl transferase" + /locus_tag="KBDEHD_00085" + /protein_id="gnl|Bakta|KBDEHD_00085" + /translation="MIVYGLLSVVFKNRKSLLLVSVFAYIFTLFIQTDIFIVQRTLVWG + ICFLLGSVLSEIHFDKINFKKILVFFVLFDFIYMFAWFLFYEVGSKKDYVSYSNPGLWG + 
IAFIVCVLVAFAIFPKMEKNFPKTFLYFTKYGKDSLGIYILHAPICSMIRILMLKVGIN + SVFLHVVVGIVLGWYLSILATYILKKIPFLNIVLLPQKYIKLK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_235787786.1" +ORIGIN + 1 gtgttaatca tgagtagacg ttttaaaaaa tcacgttcac agaaagtgaa gcgaagtgtt + 61 aatatcgttt tgctgactat ttatttattg ttagtttgtt ttttattgtt cttaatcttt + 121 aagtacaata tccttgcttt tagatatctt aacctagtgg taactgcgtt agtcctacta + 181 gttgccttgg tagggctact cttgattatc tataaaaaag ctgaaaaatt tactattttt + 241 ctgttgctgt tctctatcct tgtcagctct gtgtcgctct ttgcagtaca gcagtttgtt + 301 ggactgacca atcgtttaaa tgcgacttct aattactcag aatattcaat cagtgtcgct + 361 gttttagcag atagtgatat cgaaaatgtt acgcaactga cgagtgtgac agcaccgact + 421 gggactgata atgaaaatat tcaaaaatta ctagctgata ttaagtcaag tcagaatacc + 481 gatttgacgg tcgaccagag ttcgtcttac ttggcagctt acaagagttt gattgcaggg + 541 gagactaagg ccattgtctt aaatagtgtc tttgaaaata tcatcgagtc agagtatcca + 601 gactacgcat cgaagataaa aaagatttat accaagggat tcactaaaaa agtagaagct + 661 cctaagacgt ctaagaatca gtctttcaat atctatgtta gtggaattga cacatatggt + 721 cctattagtt cggtgtcgcg atcagatgtc aatatcctga tgactgtcaa tcgagatacc + 781 aagaaaatcc tcttgaccac aacgccacgt gatgcctatg taccaatagc agatggtgga + 841 aataatcaaa aagataaatt aacccatgcg ggcatttatg gagttgattc gtccattcac + 901 accttagaaa atctctatgg agtggatatc aattactatg tgcgattgaa cttcacttct + 961 ttcttgaaaa tgattgactt attgggaggg gtagatgttc ataatgatca agagttttca + 1021 gctctacatg ggaagttcca tttcccagta gggaatgtcc atctagactc tgagcaggct + 1081 ctaggttttg tacgtgaacg ctactcacta gccgatggag accgtgaccg tggtcgcaac + 1141 caacaaaagg tgattgtggc tatccttcaa aaattaacgt caaccgaagc actgaaaaat + 1201 tatagtacga tcattaatag cttgcaagat tctatccaaa caaatatgcc acttgagact + 1261 atgataaatt tggttaatgc tcagttagaa agtggaggga attataaagt aaattctcaa + 1321 gatttaaaag ggacaggtcg gacggatctt ccttcttatg caatgccaga cagtaacctc + 1381 tatgtgatgg aaatagatga tagtagttta gctgtagtta aagcagctat acaggatgtg + 1441 
atggagggta gatgaaatga tagacatcca ttcgcacatc gtctttgatg tagatgatgg + 1501 tcccaagtca agagaggaaa gcaaggctct cttggcagaa gcctacagac aggggatgcg + 1561 aaccattgtc tctacctctc accgtcgcaa gggcatgttt gaaactccgg aagagaagat + 1621 agcagaaaac tttcttcagg ttcgggaaat agctaaggaa gtggcgagtg acttggtcat + 1681 tgcttacggg gctgaaattt actacacacc agatgttctg gataagctgg aaaaaaagcg + 1741 gattccgacc ctcaatgata gtcgttatgc cttgatagag tttagtatga acactcctta + 1801 tcgcgatatt catagcgcct tgagcaagat cttgatgttg ggaattactc cagtcattgc + 1861 ccacattgag cgctatgatg ctcttgaaaa taatgaaaaa cgcgttcgag aactgatcga + 1921 tatgggctgt tacacgcaag taaatagttc acatgtcctc aaacccaaac tttttggcga + 1981 acgttataaa ttcatgaaaa aaagagctca gtatttttta gagcaggatt tggttcatgt + 2041 cattgcaagt gatatgcaca atctagacgg tagacctcct catatggcag aagcatatga + 2101 ccttgttacc caaaaatacg gagaagcgaa ggctcaggaa ctttttatag acaatcctca + 2161 aaaaattgta atggatcaac taatttagga gaaatgatga aagaacaaaa cacgatagaa + 2221 atcgatgtat ttcaattatt taaaaccttg tggaaacgca agctaatgat tttaatagtg + 2281 gcacttgtga caggtgcggg ggcttttgca tatagcgctt ttattgttaa gccagaatat + 2341 acgagtacta cgcgaattta cgtagtgaat cgcgatcaag gagacaagcc ggggctgaca + 2401 aatcaggatt tgcaggcagg atcttatctg gtaaaagact accgtgagat tatcctttcg + 2461 caggatgtat tggaaaaagt agcgacaaat ttgaagttgg atatgccagc aaaaacgtta + 2521 gccagcaaag ttcaagtgac tgtaccagct gacactcgta tcgtctcaat ctctgtcaaa + 2581 gataaacagc cagaagaagc cagtcgtatc gctaattctc tacgagaagt tgctgcagaa + 2641 aagatcgtcg ctgtaacgcg agtatctgat gtaacgacac ttgaagaagc gcgaccagct + 2701 acgactccct cttctccaaa tgttcgacgc aattccttgt ttggttttct tggaggagca + 2761 gtcgtaacag taagtgctgt tcttttgatt gagttgctcg acacccgtgt gaaacgtcct + 2821 gaagatgtcg aagatgtact gcaaattcca cttttagggg tcgttccaaa tttggacaaa + 2881 atgaaatagg aggaagttat gccaacatta gaaatctcac aggcaaaatt ggattttgta + 2941 aaaaaggcag aggaatatta taacgctttg tgcacgaacc tacagttaag tggagatgat + 3001 ttgaaagtat tttctatcac ttctgtgaaa ctaggagaag gaaaatcaac gacttccacc + 3061 aatatcgctt gggcttttgc 
gcatgcaggt tacaaaacgc tgctgattga tggagatatt + 3121 cgcaattctg ttatgttagg tgtctttaaa gcaagggata agattacagg cctgacagaa + 3181 tttttatcag gaactacaga tctatcacaa gggctttgtg ataccaatat cgaaaatctc + 3241 tttgtaattc aggctggctc tgtgtcaccg aatccgacag ctcttcttca aagtaagaat + 3301 ttcagtacaa tgcttgaaac cttgcgtaaa tattttgact acatcattgt agatactgct + 3361 cctgtcggtg tcgtgattga tgcggctatt attacgcgaa aatgcgatgc ttctatttta + 3421 gtgacggagg caggtgaaat aaatcgacgg gatattcaaa aagcaaaaga acagttggaa + 3481 cacacaggga agccgttttt gggagttgtg ttgaataaat tcgatacttc agtagacaaa + 3541 tacggttctt atggagatta cgggaaaaat aaaaaatagg tcggaggaca gagatgaatg + 3601 gaaaaatagt aaagtcttca ttggctataa tccagagttt tcttgttatt ttattgactt + 3661 atctccttag tgctgtgaga gaagcggaga ttgtttcaac aacagctatt gcactttata + 3721 tcctccatta ttttgtcttt tatattagtg attatggaca gaatttcttt aaaaggggat + 3781 atttgattga acttgtccag acattgaaat atatcctatt ctttgcacta gcgattagta + 3841 tttctaattt tttcttagag gatcgattta gtatttccag acgaggcatg atttacttcc + 3901 tcacagtaca tgctctctta gtctatgtgc taaacctatt tatcaagtgg tattggaagc + 3961 gggcttatcc caactttaaa ggaagtaaga agattctcct acttacagca acttctcgtg + 4021 tcgaaaaggt actggataga ttaatagaat caaatgaggt tgttggggag ttggtagctg + 4081 tcagtgtctt agataaacca gattttcagc atgattgttt aaaggtagta gcagaggggg + 4141 agatagtaaa ctttgcgact catgaggtgg tcgatgaagt ctttatcaat cttccaagta + 4201 aaaaatacaa tattggagag cttgtctctc agtttgaaac gatgggaatt gatgtaacag + 4261 ttaatctaaa tgcttttgat cgtagtttgg cacgtaacaa gcaaattcgt gagatggcag + 4321 gattaaacgt tgtgactttt tctacaacat tttataagac tagtcatgta attgctaagc + 4381 ggattattga tatcgtgggt gcattggtag ggctgatact atgtggttta gtcagtattg + 4441 tattgcttcc tttgattcga aaggatgggg gctctgctat ttttgctcag acgcgtatag + 4501 gaaaaaatgg tcgtcagttc actttttata agtttcgctc tatgtgtgta gatgccgagg + 4561 cgaaaaaaag agaactcatg gaacaaaata ccatgcaggg tggaatgttt aaggtggacg + 4621 atgatcctcg tatcacgaaa attggtcgtt ttatacggaa gactagcttg gacgagctac + 4681 cacagtttta taatgttcta aagggagata tgagtttggt 
tggcacacgg ccaccgacag + 4741 tggacgagta tgaacactat accccagaac aaaaacgtcg gctaagtttt aaacctggta + 4801 taacaggctt atggcagatc agtggacgaa gtgagattaa gaattttgat gaagttgtca + 4861 aattagatgt agcctatata gacgattgga caatttggaa agacattgaa attttattga + 4921 agacagttaa agttgtattt atgagagacg gagcgaagta ggaaatgaaa atatgtttag + 4981 ttggatctag tggaggtcat ctgactcatt tatatctttt aaaacctttc tggaaagata + 5041 aagaaagatt ttgggttact tttgataagg cggacgctcg gagtgtactc tctgaggaag + 5101 ttgtatatcc ctgttattat ccaaccaatc gtaatataaa aaatttaata aaaaatactt + 5161 ttctcgccta taaaatttta aaaaaagaga gaccagattt gattatttct tctggtgccg + 5221 ctatcgctgt tcctttcttt tatattggga agttatttgg atcaaagaca gtgtatatag + 5281 aagtgtttga tagaattgat gctccaacaa taacgggaaa acttgtttat ccagtaacgg + 5341 ataggtttat tgttcaatgg gaagaaatga aaaaaattta tccgaaagca attaatctag + 5401 gaggaatatt ctgatgattt ttgttactgt agggacacat gaacaacaat ttgatcgttt + 5461 gataaaagaa tttgatcgtt tgaaagaaga gaatctaatt caagaggaag tatttattca + 5521 aacaggatat tctaattatg tcccaaaata ttgtaaatgg gaaaaaataa tatcttatga + 5581 aaaaatgaat cagtttattg aggaagctga tacaattgtt acccatggtg gtccagcaac + 5641 ttttatggca attattgcta aaggaaaaac tccaatagtt gttccgaggc aaaagaaatt + 5701 tggggagcat gtgaatgatc atcagatgaa tttttgttct aaaatatcct ctgaagggta + 5761 tgaattatct ctgattaacg atataagcga attgcagtat agtttaaagc aagaaaagaa + 5821 aactaaattt tactctaata atgcaaattt tcttaagcag ttatcaaaaa taattgaaga + 5881 tttaatagta taaaatgaga ttgtttcttc ttattgcaga tgaattagaa ataaatcagg + 5941 ttgtgagtaa agcaacagtg ccaaagtgta tttgtaatta agaataaaat aaacaccatt + 6001 tcaatatctg aaaataattc tcaaggcata gtttgaatta tggatataga ttattttgct + 6061 aagtcttcta atcgatttat aagttaaggc agtaacatta ttaaaatcat agatagaagt + 6121 aaggagggaa ctaaatgaaa atactacata ttccaacggg tggtttattt tctgatggta + 6181 taggaacttt tatttattca tatttggagt atatggactt aaacaagtat gatgtgacaa + 6241 ttttagccac taatcctctt ttgaaaagtg ataaggaaaa atttgaatat ttaggggtta + 6301 aagttattga aattgaaagg aaaaaatcaa acctttctaa atatatatac aaattgaaaa + 6361 
aattaatgaa aaaagaaaaa tttgatatta tacatgttca cggaagtagc gctttaatgt + 6421 caattgaatt actgactgct aaaattgctg gtatcccagt tcgaattgcc catagccata + 6481 acactacttg tgagcatcat aaactagata aactactacg accgatattt tatcgagttt + 6541 atactcaggc atgtgcttgc agtgttagtg ctggtcagtg gctttttgag gaaaaaaatt + 6601 atgagattat ccataacgct agagatgtaa ataagtatca gtatgatgcc ataaaacgaa + 6661 aaaaacttag agaagaattg ttactgtctg atgagactat tgctctaggt catgttggac + 6721 gttttaatac tcaaaaaaat caacgttttc tagtgtctct gatggaaaga ttagtgatca + 6781 aaaatataga tttaaaatta tttttagtag ggacgggtga tactttagaa gaaatcaaga + 6841 aattagtcat tcagaaaaaa ctagaagata atattgtttt tttaggtcaa tttgatgata + 6901 tgaaatcttt tgtgtcatca atggatataa tgttacttcc aagtttatat gaagggttac + 6961 cactagtatc tgttgaatgg caaataaacg gagtaaaaag tatcctatct gaccgtgtta + 7021 cacaagagtg tatctataca gaaactgttc aacaattatc tatcgatagt atggaattat + 7081 gggaaaaaga aattttaaat ttatctactt cagatagaga aagagtgtca ttgcaaaata + 7141 ttcagttaat aagaaatgca ggctatgata tttctttaga agttaaagaa atagaagaat + 7201 tatataattc actttatgat attgcgaatt gaatgaaagg aaagagtttt cttttgaaga + 7261 tgttacaaaa tttaaaacta ataaaacgga gattaaaacc aataaaacgg aaattaaaac + 7321 caattaagag aacttataag aaaatagttt attctatcac taagtcaaat atgaggaaga + 7381 ggctcaaaaa tacagatttt tcaattatca gtgataattg ctggggagga cgggtatatg + 7441 aagaattggg tctgccgtat agaacaccat ttataggtct gtatattttt tctgaggatt + 7501 atgtgaagct gttgaaaaac ttcaaaaagt atatggaata tgagctaacg tttaccaata + 7561 attcaaaatg gaacacagaa tatgacgggg agtatcctat aggtattctc aatgatatag + 7621 aaattcattt tttacattat tctagcatgg aagaagcata taaaaaatgg aataaaagaa + 7681 aaaaaagaat taattataaa aatatttttt ttaagatgaa tgatgataat aaatgttctt + 7741 tgaaattgct taaggaattt gatactttgg atttgaaaaa taaaattatt tttgctgcat + 7801 tcaattataa agaactagat aatcttattc attttaccaa tcctataggt aatggaaatg + 7861 taggtgcaga cctattttat tataataaat actttgatgt tgttaattgg ttgaatggag + 7921 agtactaagt atgataccta aaaaaattca ttattgttgg tttggtggca aaccattacc + 7981 aaatgatgtg aaacgatgta 
tagctagttg gagaaagttt tgtcccgact atgaaattat + 8041 tgaatggact gaaaaaaatt tttgtattca aaatcaaaat caatttgtaa aagatgcgta + 8101 taaaaataag gcatgggctt ttgttagcga ctatgctaga ctcaaaattg tttatgaaaa + 8161 tggaggtatc tatttagata ctgatgttga gattattaaa aagctagatt tgttactgga + 8221 taacacagca ttctttggtg ttcatcaagt taatcatcta gttaatacag gattaggttt + 8281 tggggctgaa aaggggtcat tcattttaaa agaattatta gattcttatg atgaagtgaa + 8341 atttgatatt aacaagaaag acgagctatt atgtccagaa ttaaacacgc aaatatttaa + 8401 acaactaggt tatgtttatt ctaattcagt tataaaaagt caatatttca caatctatcc + 8461 cgaagaatac ttcgatccca tttcattggg agatgaagtt gctaatattt tatcagataa + 8521 aacattttct attcatcatt ataatgcatc ttggacttcc ttgatgaatc gggtgaagag + 8581 aaaaataatt cgtaaactag gtagaagtaa tgtctcggag ttaaaaagaa tattaaaggg + 8641 gaaaactaga tgagaatatc accatcgaag ctgatatttg cattttttag cagtttttat + 8701 attcttgtaa tccttttccc gagaggaatt ttcctagggc attctacttt agcttctcgt + 8761 ttatggatta tttacaaaga aagtttatat ctatcaatac tacttggttc aatatatgtt + 8821 attttaaaaa tattatctcg aaatatcgcc attcatcagc atgctttttt tatcttacaa + 8881 tattatttta ttgtaatgat tttaactttt atgttaagtg ggtcaatcgg tgatggggta + 8941 caatcgattt tctatccaat attcatctat ttgtttttta atgaagttcg agataagaaa + 9001 tcaatagtgt taatttttga tatatttctt tatatactta ccgctttatt cgttatcaat + 9061 acgattgata tttttctgaa tttcacaaat atttttcatg ttactttttt aggacatgtt + 9121 caggtgattt cccaatatag tattctcgga tttctcgtat cagcttatta tctattagaa + 9181 gaaaagagga atatattagt cgcacagttg ctgttgattt taacgattat caattgtttt + 9241 ttttcagatg tctctctctc taaagctatt gctttgttta tgattattta tattatttca + 9301 tacaagttaa aaaaactatt ttggaaaaga ggaaggaaga tatctgttat aacttttatt + 9361 gcatctgttg tgatgttagc attagtgatt tttggatatt ttttaccata tcttagatat + 9421 tttgatttta cttttaatgg tcgataccaa atttggcgca ttgtgtatgc caccattctt + 9481 caagtgaaat ggtttggata tggtgtgttt ggctttcaat ttaaacttcc gtggcaggaa + 9541 ttgggagaaa ttggaataaa ttatactcat aatcaaattt tacagttagc acttgatagt + 9601 ggcattgttg ggattatctc attctttact atgatttttt 
atatgatctt ttcaactaaa + 9661 aatattcaaa atcccgcaat aggctcccta tttatttttg cctatttttg tctatttatt + 9721 ataatgttta tagagagtgt tacttattat ccatactatt ttattataat agttcttcaa + 9781 actttgtact taaaattgga aagagaaaga aatgttaaat agattgataa gaaattttaa + 9841 taaagtatat tatagttatc gtataaaaag aaaggccgca caatgcagtg ggagagtgta + 9901 tacgggaggc aaaacgtttg ttactgcaaa tacgtacctt gatgaaaatg tttcatttaa + 9961 tggtatgtca atgtatggtg aagggaaaat aagcattggt aaaaattttc attcaggatt + 10021 aaattgccaa attatcactt cctttcataa ttatgacttg ggtgataaaa ttccttatga + 10081 tgagagttac atacataaag acgtcttaat tgaagataac gtttgggtag ggaataatgt + 10141 gataatttta ggtggtgcga ttattgagga aggtgcaatc attcaagcag gaagtacagt + 10201 tgctggaaga attccagcag gtgcgattgc aggtggacat ccggcaaaac cattcagatt + 10261 tagaaatatg gaacattata atcggcttaa acggcaaaaa aaatttcatt agaggttaag + 10321 aatgaatatt gtaagttatc taaaaaaaaa cggtattaca catactttaa aaattattaa + 10381 tgaatataaa atgcaagagc tgtttgatag tcttgttagt atttttacaa agcagaagga + 10441 acttcgtgac agtattgtca ttgaatgtca tactgatttt gagaataatg gtggtgcgtt + 10501 ctatgactat ctaatcaata atgagtataa caaaaaatat aaaattgtct tactattgaa + 10561 ggataaatta tctaaagaat taccagaaaa tgtagattat ttttatttaa gaaagcccag + 10621 tttacgaaaa tcctacgtaa tgtcattaag taaattcttt acttttgata atgatatgct + 10681 tcgtaaatat agaaaagatc aaaaacactt ttatttaaca catggatgct ttcctttaaa + 10741 aaatacaata ggtaaaataa cagttccgaa ttatgttgat tttgttctat ctccatcggg + 10801 caatgtagat aatattatag ttaagcagtt tggattaaca tctaaagagc aatgtcttca + 10861 cactggattt ccgtgtcatg atatctttta ttcaaaaaca gaacctctag tatttttatc + 10921 tgattatgat aaaaaaatta tctgggcacc aacttttaga aagggtggtg gctataatag + 10981 aaatgatagt acagctagct atcctttagg tattccatta cttggaacac tagatgaact + 11041 tgcacaccta aacacatatc taagccaacg ggatattgtc ctgattgtaa agttacatcc + 11101 aatgcaagat atttcagatt tggagttgaa acaatttagt catattaagt ttctgacaaa + 11161 tcaaaatctg aaacgtaaaa atataaatat gtatcaattg ctgatgaatt cagatgcttt + 11221 acttagtgac tattctgcaa tctcgtatga ttatttacat 
cttgataaac caatagggta + 11281 tgttttttca gatctaaatg attataagtt ggggttttca gttgataatg tagatgatta + 11341 catagcaggt gataagataa tgtcttttaa cgacttgctg cactttattg ataacattta + 11401 tctagaaatt gataaaaata aagaaaaacg caaggaatta tttaataaaa tatttgaaaa + 11461 acaggatgga gaatcgtgtg aaagattggc ccaaattatg gaattatagg agacgttacg + 11521 aagaaatgtc tgttgggatg aaagcggcac tctggtatac tgttgcaaat tttattcaaa + 11581 agggttttgt atttctttca actccgattt taaccagaat acttaatgtt aatgattacg + 11641 gtacattgat actttaccaa tcatggtttg tactatttgc tatttttgct accttgaatc + 11701 tttctcaaac agcttataat aagggattag tagaatttga gaatgataaa gataatttta + 11761 cattttcttt gttgtttttg tctaagatta ttacgataat tgttgctttt ttgtatttta + 11821 cttttaatat actggttaaa gatagtactg gattaactcc cggtttcatg atatttttat + 11881 tcagtgatat tttatttaat attagtatag aattttattt ggcacgtcag agatttgaat + 11941 tcaaatatag aaaagcagtt ctaatttcaa tttcttcaag ttttttaatt gtagctatta + 12001 gtacaactat cttattagtg attaagaatg atttattcat taaaattgta ttagatgcta + 12061 ttatccgaat tatctttggt ttatattgtt tttatctctt gtttttttca gggagaaggc + 12121 aacttaagat agaaaaaaaa tatattaaat atggtttgag ttattcatta cctttgatgc + 12181 cgcatttctt atcgcactat attttgaatc agtctgatcg tttgatgatt aacatgtttg + 12241 atggtaagga gaaattagct atatatagtc tagcttattc tgtatcaatg attatgtttt + 12301 tgtttactaa tgcaattaat caatcaataa tgccgtatac atttcaagct ttgaaaaaaa + 12361 aggattatcg tgggatacat gggagcacca aatggctttt tataacagtt gggggagtca + 12421 cagttctctc aattctattt gcaccagaac taattgttat tttaggcggc aataaatata + 12481 aggaatcaat ttggctagta cctccaattg ctatctcggt ttatttcctt tttgtgtatt + 12541 ctatgtttag taatatcagt ttttattata agatgaataa actgatttcg ttagtttcca + 12601 caggtgcagc tctttcaaat attattttaa attatatttt tattaatata tttgggtatc + 12661 aagctgcatc ttacactaca ttattatgct atatattgtt agcattttct cattttttct + 12721 tatatagatt tttattaaaa aaagaggaaa ttcatgagga actttataat atgaagatga + 12781 ttctaataat atctttaata ttattaacaa tactattttt gatacttgtt atttataact + 12841 tagcctttat aaggtatgca attattgtaa ttattgtatt 
tcttttgttt acaaagagaa + 12901 ataaaataat tacatcccta aaaagttgat attgaaaatt tagattcaaa ttaagaatat + 12961 agtggatatc aaaccagtaa taataatgaa taattgtttt tatgtaattt gggattaata + 13021 aaaaattgaa aggaaatatc aatgaaaaga gtgattactt atggaacctt tgatttgctt + 13081 cattatggac atatcaattt gctaaagaga gcgaagcaat taggagatta tctcattgtt + 13141 gtagtttcaa gtgatgagtt caatttgaaa gaaaaaaata aagtttgtta ctttaatttt + 13201 gaacatagaa aaaatttggt tgaagcgata agatatgttg atttggtgat tcctgaaaca + 13261 agctgggaac agaaaaaaac agatattaaa gaatatcaca ttgatacatt tgttatgggg + 13321 gatgattgga aaggaaaatt tgattattta aaagaagaag gagtggaagt agtttattta + 13381 ccaagaacta aagaaatatc tacaactaaa attaaagaag atttagcaga ttagattttt + 13441 tacaaaaata ttttgagatc agataataaa tttgtttcca taattattaa tgttttgact + 13501 atttaaatct cattttttaa aaaattcgga ttgattaata ataaaaaaat ctagtttaag + 13561 atatgaaaga aaattatatc cataactatt atattgtttg taatatgtat cgtgataatg + 13621 tataagaaat tagtagatat aaatgtgata tatagctaaa actaatatta ttcattgcta + 13681 tttaaaatgt agttagaagt aaagcatcta ataaacttga aggtacataa aaatttagca + 13741 ttaaattata aaacaaggta tttttctgtg aaaattgggt agatatacaa taatatttgt + 13801 attgttagag aaagaattct taatattata ttgtaatgga ggcattttga attgactaaa + 13861 gtaagaatta attgggtaga ttttgggaaa ggatttgcaa tattcttagt tctagtaggg + 13921 catgtattta ttggtttata tgaatccaat aagttttcaa ttgcaaatga tgtgttatta + 13981 ttcctgatag ctcaaatcta tatatttcat ataccagtgt tttttgcgtt atcaggatac + 14041 tttttcagac ctgtatcaga tttgaaggag ttttggcatt atgctaaaaa gaaaaccatt + 14101 attttaggca taccatatat tttttattca attattcact tttgtcttca aaaggttgcg + 14161 ggtgcttctg tccgagtacc cactacgata tttaacctat tgaatatcta taaatttcct + 14221 ctgggagttt catggtatct atatacgtta tgatcgatat tgatagttta tggtttacta + 14281 tctgttgttt tcaaaaatcg taagtccctt ttgttagtta gtgtttttgc ctatattttc + 14341 acactattta ttcaaactga tatttttatt gtgcaacgga cgttggtttg ggggatttgt + 14401 ttccttcttg gcagtgtatt gagtgaaatt cactttgata aaattaattt taaaaaaatt + 14461 cttgttttct ttgtgttatt tgattttatt tatatgttcg 
cttggttctt gttttatgaa + 14521 gtaggatcta agaaggatta tgtaagctat agtaacccag gtttgtgggg gattgctttt + 14581 attgtctgtg tattagttgc ttttgcgatt tttcctaaaa tggagaaaaa ttttcctaaa + 14641 actttcctat atttcactaa atacgggaaa gatagtttag ggatctatat tcttcatgca + 14701 ccaatttgta gcatgattcg gattctaatg ttgaaagtgg gaataaactc agtttttctt + 14761 cacgttgttg ttgggattgt gctaggctgg tatttatcca tactggcaac ttatatattg + 14821 aaaaaaattc catttttgaa tattgtttta ttaccacaaa agtatattaa attaaaataa +// diff --git a/public/res/serotype_genbank/serotype_11F-like.gb b/public/res/serotype_genbank/serotype_11F-like.gb new file mode 100644 index 0000000..626c9b6 --- /dev/null +++ b/public/res/serotype_genbank/serotype_11F-like.gb @@ -0,0 +1,517 @@ +LOCUS MF140334 14871 bp DNA linear BCT 05-AUG-2017 +DEFINITION Streptococcus pneumoniae strain PMP1342 csp gene locus, complete + sequence. +ACCESSION MF140334 +VERSION MF140334.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 14871) + AUTHORS Manna,S., Ortika,B., Dunne,E.M., Holt,K.E., Kama,M., Russell,F.M., + Hinds,J. and Satzke,C. + TITLE A novel genetic variant of Streptococcus pneumoniae serotype 11A + discovered in Fiji + JOURNAL Clin. Microbiol. Infect. (2017) In press + PUBMED 28736074 + REMARK Publication Status: Available-Online prior to print +REFERENCE 2 (bases 1 to 14871) + AUTHORS Manna,S., Ortika,B.D., Dunne,E.M., Holt,K.E., Kama,M., + Russell,F.M., Hinds,J. and Satzke,C. + TITLE Direct Submission + JOURNAL Submitted (21-MAY-2017) Pneumococcal Research, Murdoch Childrens + Research Institute, 50 Flemington road Parkville, Melbourne, VIC + 3052, Australia +COMMENT ##Assembly-Data-START## + Assembly Method :: SPAdes v. 
June 2015 + Sequencing Technology :: Illumina + ##Assembly-Data-END## +FEATURES Location/Qualifiers + source 1..14871 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="PMP1342" + /serotype="11A(11F-like)" + /isolation_source="nasopharynx" + /db_xref="taxon:1313" + /geo_loc_name="Fiji" + misc_feature 1..14871 + /note="csp gene locus" + gene 1..1446 + /gene="wzg" + CDS 1..1446 + /gene="wzg" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="ASO97413.1" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLLFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VDQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + gene 1448..2179 + /gene="wzh" + CDS 1448..2179 + /gene="wzh" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="ASO97414.1" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAEAYRQGMRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEQDLVHVIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPQKIVMDQLI" + gene 2188..2880 + /gene="wzd" + CDS 2188..2880 + /gene="wzd" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="ASO97415.1" + /translation="MKEQNTIEIDVFQLFKTLWKRKLMILIVALVTGAGAFAYSAFIV + KPEYTSTTRIYVVNRDQGDKPGLTNQDLQAGSYLVKDYREIILSQDVLEKVATNLKLD + MPAKTLASKVQVTVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDVT + TLEEARPATTPSSPNVRRNSLFGFLGGAVVTVSAVLLIELLDTRVKRPEDVEDVLQIP + LLGVVPNLDKMK" + gene 2890..3570 + /gene="wze" + CDS 
2890..3570 + /gene="wze" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="ASO97416.1" + /translation="MPTLEISQAKLDFVKKAEEYYNALCTNLQLSGDDLKVFSITSVK + LGEGKSTTSTNIAWAFAHAGYKTLLIDGDIRNSVMLGVFKARDKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRKCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGVVLNKFDTSVDKYGSY + GDYGKNKK" + gene 3585..4952 + /gene="wchA" + CDS 3585..4952 + /gene="wchA" + /note="initial sugar transferase" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA" + /protein_id="ASO97417.1" + /translation="MNGKIVKSSLAIIQSFLVILLTYLLSAVREAEIVSTTAIALYIL + HYFVFYISDYGQNFFKRGYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYF + LTVHALLVYVLNLFIKWYWKRAYPNFKGSKKILLLTATSRVEKVLDRLIESNEVVGEL + VAVSVLDKPDFQHDCLKVVAEGEIVNFATHEVVDEVFINLPSKKYNIGELVSQFETMG + IDVTVNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHVIAKRIIDIVGALVGLIL + CGLVSIVLLPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQISGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVFM + RDGAK" + gene 4956..5405 + /gene="wchJ" + CDS 4956..5405 + /gene="wchJ" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase enhancer" + /protein_id="ASO97418.1" + /translation="MKICLVGSSGGHLTHLYLLKPFWKDKERFWVTFDKADARSVLSE + EVVYPCYYPTNRNIKNLIKNTFLAYKILKKERPDLIISSGAAIAVPFFYIGKLFGSKT + VYIEVFDRIDAPTITGKLVYPVTDRFIVQWEEMKKIYPKAINLGGIF" + gene 5405..5884 + /gene="wchK" + CDS 5405..5884 + /gene="wchK" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="ASO97419.1" + /translation="MIFVTVGTHEQQFDRLIKEFDRLKEENLIQEEVFIQTGYSNYVP + KYCKWEKIISYEKMNQFIEEADTIVTHGGPATFMAIIAKGKTPIVVPRQKKFGEHVND + HQMNFCSKISSEGYELSLINDISELQYSLKQEKKTKFYSNNANFLKQLSKIIEDLIV" + gene 6126..7223 + /gene="wcyK" + CDS 6126..7223 + /gene="wcyK" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="ASO97420.1" + 
/translation="MKILHIPTGGLFSDGIGTFIYSYLEYMDLNKYDVTILATNPLLK + SDKEKFEYLGVKVIEIERKKSNLSKYIYKLKKLMKKEKFDIIHVHGSSALMSIELLTA + KIAGIPVRIAHSHNTTCEHHKLDKLLRPIFYRVYTQACACSVSAGQWLFEEKNYEIIH + NARDVNKYQYDAIKRKKLREELLLSDETIALGHVGRFNTQKNQRFLVSLMERLVIKNI + DLKLFLVGTGDTLEEIKKLVIQKKLEDNIVFLGQFDDMKSFVSSMDIMLLPSLYEGLP + LVSVEWQINGVKSILSDRVTQECIYTETVQQLSIDSMELWEKEILNLSTSDRERVSLQ + NIQLIRNAGYDISLEVKEIEELYNSLYDIAN" + gene 7224..7919 + /gene="wcwC" + CDS 7224..7919 + /gene="wcwC" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="ASO97421.1" + /translation="MKGKSFLLKMLQNLKLIKRRLKPIKRKLKPIKRTYKKIVYSITK + SNMRKRLKNTDFSIISDNCWGGRVYEELGLPYRTPFIGLYIFSEDYVKLLKNFKKYME + YELTFTNNSKWNTEYDGEYPIGILNDIEIHFLHYSSMEEAYKKWNKRKKRINYKNIFF + KMNDDNKCSLKLLKEFDTLDLKNKIIFAAFNYKELDNLIHFTNPIGNGNVGADLFYYN + KYFDVVNWLNGEY" + gene 7922..8644 + /gene="wcrL" + CDS 7922..8644 + /gene="wcrL" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="ASO97422.1" + /translation="MIPKKIHYCWFGGKPLPNDVKRCIASWRKFCPDYEIIEWTEKNF + CIQNQNQFVKDAYKNKAWAFVSDYARLKIVYENGGIYLDTDVEIIKKLDLLLDNTAFF + GVHQVNHLVNTGLGFGAEKGSFILKELLDSYDEVKFDINKKDELLCPELNTQIFKQLG + YVYSNSVIKSQYFTIYPEEYFDPISLGDEVANILSDKTFSIHHYNASWTSLMNRVKRK + IIRKLGRSNVSELKRILKGKTR" + gene 8641..9813 + /gene="wzy" + CDS 8641..9813 + /gene="wzy" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="ASO97423.1" + /translation="MRISPSKLIFAFFSSFYILVILFPRGIFLGHSTLASRLWIIYKE + SLYLSILLGSIYVILKILSRNIAIHQHAFFILQYYFIVMILTFMLSGSIGDGVQSIFY + PIFIYLFFNEVRDKKSIVLIFDIFLYILTALFVINTIDIFLNFTNIFHVTFLGHVQVI + SQYSILGFLVSAYYLLEEKRNILVAQLLLILTIINCFFSDVSLSKAIALFMIIYIISY + KLKKLFWKRGRKISVITFIASVVMLALVIFGYFLPYLRYFDFTFNGRYQIWRIVYATI + LQVKWFGYGVFGFQFKLPWQELGEIGINYTHNQILQLALDSGIVGIISFFTMIFYMIF + STKNIQNPAIGSLFIFAYFCLFIIMFIESVTYYPYYFIIIVLQTLYLKLERERNVK" + gene 9803..10303 + /gene="wcwT" + CDS 9803..10303 + /gene="wcwT" + /codon_start=1 + /transl_table=11 + 
/product="putative acetyl transferase" + /protein_id="ASO97424.1" + /translation="MLNRLIRNFNKVYYSYRIKRKAAQCSGRVYTGGKTFVTANTYLD + ENVSFNGMSMYGEGKISIGKNFHSGLNCQIITSFHNYDLGDKIPYDESYIHKDVLIED + NVWVGNNVIILGGAIIEEGAIIQAGSTVAGRIPAGAIAGGHPAKPFRFRNMEHYNRLK + RQKKFH" + gene 10313..11500 + /gene="wcwU" + CDS 10313..11500 + /gene="wcwU" + /codon_start=1 + /transl_table=11 + /product="putative glycerol phosphotransferase" + /protein_id="ASO97425.1" + /translation="MNIVSYLKKNGITHTLKIINEYKMQELFDSLVSIFTKQKELRDS + IVIECHTDFENNGGAFYDYLINNEYNKKYKIVLLLKDKLSKELPENVDYFYLRKPSLR + KSYVMSLSKFFTFDNDMLRKYRKDQKHFYLTHGCFPLKNTIGKITVPNYVDFVLSPSG + NVDNIIVKQFGLTSKEQCLHTGFPCHDIFYSKTEPLVFLSDYDKKIIWAPTFRKGGGY + NRNDSTASYPLGIPLLGTLDELAHLNTYLSQRDIVLIVKLHPMQDISDLELKQFSHIK + FLTNQNLKRKNINMYQLLMNSDALLSDYSAISYDYLHLDKPIGYVFSDLNDYKLGFSV + DNVDDYIAGDKIMSFNDLLHFIDNIYLEIDKNKEKRKELFNKIFEKQDGESCERLAQI + MEL" + gene 11517..12920 + /gene="wzx" + CDS 11517..12920 + /gene="wzx" + /codon_start=1 + /transl_table=11 + /product="group 52 protein" + /protein_id="ASO97426.1" + /translation="MSVGMKAALWYTVANFIQKGFVFLSTPILTRILNVNDYGTLILY + QSWFVLFAIFATLNLSQTAYNKGLVEFENDKDNFTFSLLFLSKIITIIVAFLYFTFNI + LVKDSTGLTPGFMIFLFSDILFNISIEFYLARQRFEFKYRKAVLISISSSFLIVAIST + TILLVIKNDLFIKIVLDAIIRIIFGLYCFYLLFFSGRRQLKIEKKYIKYGLSYSLPLM + PHFLSHYILNQSDRLMINMFDGKEKLAIYSLAYSVSMIMFLFTNAINQSIMPYTFQAL + KKKDYRGIHGSTKWLFITVGGVTVLSILFAPELIVILGGNKYKESIWLVPPIAISVYF + LFVYSMFSNISFYYKMNKLISLVSTGAALSNIILNYIFINIFGYQAASYTTLLCYILL + AFSHFFLYRFLLKKEEIHEELYNMKMILIISLILLTILFLILVIYNLAFIRYAIIVII + VFLLFTKRNKIITSLKS" + gene 13033..13425 + /gene="gct" + CDS 13033..13425 + /gene="gct" + /codon_start=1 + /transl_table=11 + /product="CDP-glycerol-1-phosphate biosynthetic protein + Gct" + /protein_id="ASO97427.1" + /translation="MKRVITYGTFDLLHYGHINLLKRAKQLGDYLIVVVSSDEFNLKE + KNKVCYFNFEHRKNLVEAIRYVDLVIPETSWEQKKTDIKEYHIDTFVMGDDWKGKFDY + LKEEGVEVVYLPRTKEISTTKIKEDLAD" + gene 13843..14871 + /gene="wcjE" + CDS 13843..14871 + /gene="wcjE" + /codon_start=1 + /transl_table=11 + 
/product="putative acetyl transferase" + /protein_id="ASO97428.1" + /translation="MTKVRINWVDFGKGFAIFLVLVGHVFIGLYESNKFSIANDVLLF + LIAQIYIFHIPVFFALSGYFFRPVSDLKEFWHYAKKKTIILGIPYIFYSIIHFCLQKV + AGASVRVPTTIFNLLNIYKFPLGVSWYLYTLWSILIVYGLLSVVFKNRKSLLLVSVFA + YIFTLFIQTDIFIVQRTLVWGICFLLGSVLSEIHFDKINFKKILVFFVLFDFIYMFAW + FLFYEVGSKKDYVSYSNPGLWGIAFIVCVLVAFAIFPKMEKNFPKTFLYFTKYGKDSL + GIYILHAPICSMIRILMLKVGINSVFLHVVVGIVLGWYLSILATYILKKIPFLNIVLL + PQKYIKLK" +ORIGIN + 1 atgagtagac gttttaaaaa atcacgttca cagaaagtga agcgaagtgt taatatcgtt + 61 ttgctgacta tttatttatt gttagtttgt tttttattgt tcttaatctt taagtacaat + 121 atccttgctt ttagatatct taacctagtg gtaactgcgt tagtcctact agttgccttg + 181 gtagggctac tcttgattat ctataaaaaa gctgaaaaat ttactatttt tctgttgctg + 241 ttctctatcc ttgtcagctc tgtgtcgctc tttgcagtac agcagtttgt tggactgacc + 301 aatcgtttaa atgcgacttc taattactca gaatattcaa tcagtgtcgc tgttttagca + 361 gatagtgata tcgaaaatgt tacgcaactg acgagtgtga cagcaccgac tgggactgat + 421 aatgaaaata ttcaaaaatt actagctgat attaagtcaa gtcagaatac cgatttgacg + 481 gtcgaccaga gttcgtctta cttggcagct tacaagagtt tgattgcagg ggagactaag + 541 gccattgtct taaatagtgt ctttgaaaat atcatcgagt cagagtatcc agactacgca + 601 tcgaagataa aaaagattta taccaaggga ttcactaaaa aagtagaagc tcctaagacg + 661 tctaagaatc agtctttcaa tatctatgtt agtggaattg acacatatgg tcctattagt + 721 tcggtgtcgc gatcagatgt caatatcctg atgactgtca atcgagatac caagaaaatc + 781 ctcttgacca caacgccacg tgatgcctat gtaccaatag cagatggtgg aaataatcaa + 841 aaagataaat taacccatgc gggcatttat ggagttgatt cgtccattca caccttagaa + 901 aatctctatg gagtggatat caattactat gtgcgattga acttcacttc tttcttgaaa + 961 atgattgact tattgggagg ggtagatgtt cataatgatc aagagttttc agctctacat + 1021 gggaagttcc atttcccagt agggaatgtc catctagact ctgagcaggc tctaggtttt + 1081 gtacgtgaac gctactcact agccgatgga gaccgtgacc gtggtcgcaa ccaacaaaag + 1141 gtgattgtgg ctatccttca aaaattaacg tcaaccgaag cactgaaaaa ttatagtacg + 1201 atcattaata gcttgcaaga ttctatccaa acaaatatgc cacttgagac tatgataaat + 1261 ttggttaatg ctcagttaga 
aagtggaggg aattataaag taaattctca agatttaaaa + 1321 gggacaggtc ggacggatct tccttcttat gcaatgccag acagtaacct ctatgtgatg + 1381 gaaatagatg atagtagttt agctgtagtt aaagcagcta tacaggatgt gatggagggt + 1441 agatgaaatg atagacatcc attcgcacat cgtctttgat gtagatgatg gtcccaagtc + 1501 aagagaggaa agcaaggctc tcttggcaga agcctacaga caggggatgc gaaccattgt + 1561 ctctacctct caccgtcgca agggcatgtt tgaaactccg gaagagaaga tagcagaaaa + 1621 ctttcttcag gttcgggaaa tagctaagga agtggcgagt gacttggtca ttgcttacgg + 1681 ggctgaaatt tactacacac cagatgttct ggataagctg gaaaaaaagc ggattccgac + 1741 cctcaatgat agtcgttatg ccttgataga gtttagtatg aacactcctt atcgcgatat + 1801 tcatagcgcc ttgagcaaga tcttgatgtt gggaattact ccagtcattg cccacattga + 1861 gcgctatgat gctcttgaaa ataatgaaaa acgcgttcga gaactgatcg atatgggctg + 1921 ttacacgcaa gtaaatagtt cacatgtcct caaacccaaa ctttttggcg aacgttataa + 1981 attcatgaaa aaaagagctc agtatttttt agagcaggat ttggttcatg tcattgcaag + 2041 tgatatgcac aatctagacg gtagacctcc tcatatggca gaagcatatg accttgttac + 2101 ccaaaaatac ggagaagcga aggctcagga actttttata gacaatcctc aaaaaattgt + 2161 aatggatcaa ctaatttagg agaaatgatg aaagaacaaa acacgataga aatcgatgta + 2221 tttcaattat ttaaaacctt gtggaaacgc aagctaatga ttttaatagt ggcacttgtg + 2281 acaggtgcgg gggcttttgc atatagcgct tttattgtta agccagaata tacgagtact + 2341 acgcgaattt acgtagtgaa tcgcgatcaa ggagacaagc cggggctgac aaatcaggat + 2401 ttgcaggcag gatcttatct ggtaaaagac taccgtgaga ttatcctttc gcaggatgta + 2461 ttggaaaaag tagcgacaaa tttgaagttg gatatgccag caaaaacgtt agccagcaaa + 2521 gttcaagtga ctgtaccagc tgacactcgt atcgtctcaa tctctgtcaa agataaacag + 2581 ccagaagaag ccagtcgtat cgctaattct ctacgagaag ttgctgcaga aaagatcgtc + 2641 gctgtaacgc gagtatctga tgtaacgaca cttgaagaag cgcgaccagc tacgactccc + 2701 tcttctccaa atgttcgacg caattccttg tttggttttc ttggaggagc agtcgtaaca + 2761 gtaagtgctg ttcttttgat tgagttgctc gacacccgtg tgaaacgtcc tgaagatgtc + 2821 gaagatgtac tgcaaattcc acttttaggg gtcgttccaa atttggacaa aatgaaatag + 2881 gaggaagtta tgccaacatt agaaatctca caggcaaaat 
tggattttgt aaaaaaggca + 2941 gaggaatatt ataacgcttt gtgcacgaac ctacagttaa gtggagatga tttgaaagta + 3001 ttttctatca cttctgtgaa actaggagaa ggaaaatcaa cgacttccac caatatcgct + 3061 tgggcttttg cgcatgcagg ttacaaaacg ctgctgattg atggagatat tcgcaattct + 3121 gttatgttag gtgtctttaa agcaagggat aagattacag gcctgacaga atttttatca + 3181 ggaactacag atctatcaca agggctttgt gataccaata tcgaaaatct ctttgtaatt + 3241 caggctggct ctgtgtcacc gaatccgaca gctcttcttc aaagtaagaa tttcagtaca + 3301 atgcttgaaa ccttgcgtaa atattttgac tacatcattg tagatactgc tcctgtcggt + 3361 gtcgtgattg atgcggctat tattacgcga aaatgcgatg cttctatttt agtgacggag + 3421 gcaggtgaaa taaatcgacg ggatattcaa aaagcaaaag aacagttgga acacacaggg + 3481 aagccgtttt tgggagttgt gttgaataaa ttcgatactt cagtagacaa atacggttct + 3541 tatggagatt acgggaaaaa taaaaaatag gtcggaggac agagatgaat ggaaaaatag + 3601 taaagtcttc attggctata atccagagtt ttcttgttat tttattgact tatctcctta + 3661 gtgctgtgag agaagcggag attgtttcaa caacagctat tgcactttat atcctccatt + 3721 attttgtctt ttatattagt gattatggac agaatttctt taaaagggga tatttgattg + 3781 aacttgtcca gacattgaaa tatatcctat tctttgcact agcgattagt atttctaatt + 3841 ttttcttaga ggatcgattt agtatttcca gacgaggcat gatttacttc ctcacagtac + 3901 atgctctctt agtctatgtg ctaaacctat ttatcaagtg gtattggaag cgggcttatc + 3961 ccaactttaa aggaagtaag aagattctcc tacttacagc aacttctcgt gtcgaaaagg + 4021 tactggatag attaatagaa tcaaatgagg ttgttgggga gttggtagct gtcagtgtct + 4081 tagataaacc agattttcag catgattgtt taaaggtagt agcagagggg gagatagtaa + 4141 actttgcgac tcatgaggtg gtcgatgaag tctttatcaa tcttccaagt aaaaaataca + 4201 atattggaga gcttgtctct cagtttgaaa cgatgggaat tgatgtaaca gttaatctaa + 4261 atgcttttga tcgtagtttg gcacgtaaca agcaaattcg tgagatggca ggattaaacg + 4321 ttgtgacttt ttctacaaca ttttataaga ctagtcatgt aattgctaag cggattattg + 4381 atatcgtggg tgcattggta gggctgatac tatgtggttt agtcagtatt gtattgcttc + 4441 ctttgattcg aaaggatggg ggctctgcta tttttgctca gacgcgtata ggaaaaaatg + 4501 gtcgtcagtt cactttttat aagtttcgct ctatgtgtgt agatgccgag gcgaaaaaaa + 4561 
gagaactcat ggaacaaaat accatgcagg gtggaatgtt taaggtggac gatgatcctc + 4621 gtatcacgaa aattggtcgt tttatacgga agactagctt ggacgagcta ccacagtttt + 4681 ataatgttct aaagggagat atgagtttgg ttggcacacg gccaccgaca gtggacgagt + 4741 atgaacacta taccccagaa caaaaacgtc ggctaagttt taaacctggt ataacaggct + 4801 tatggcagat cagtggacga agtgagatta agaattttga tgaagttgtc aaattagatg + 4861 tagcctatat agacgattgg acaatttgga aagacattga aattttattg aagacagtta + 4921 aagttgtatt tatgagagac ggagcgaagt aggaaatgaa aatatgttta gttggatcta + 4981 gtggaggtca tctgactcat ttatatcttt taaaaccttt ctggaaagat aaagaaagat + 5041 tttgggttac ttttgataag gcggacgctc ggagtgtact ctctgaggaa gttgtatatc + 5101 cctgttatta tccaaccaat cgtaatataa aaaatttaat aaaaaatact tttctcgcct + 5161 ataaaatttt aaaaaaagag agaccagatt tgattatttc ttctggtgcc gctatcgctg + 5221 ttcctttctt ttatattggg aagttatttg gatcaaagac agtgtatata gaagtgtttg + 5281 atagaattga tgctccaaca ataacgggaa aacttgttta tccagtaacg gataggttta + 5341 ttgttcaatg ggaagaaatg aaaaaaattt atccgaaagc aattaatcta ggaggaatat + 5401 tctgatgatt tttgttactg tagggacaca tgaacaacaa tttgatcgtt tgataaaaga + 5461 atttgatcgt ttgaaagaag agaatctaat tcaagaggaa gtatttattc aaacaggata + 5521 ttctaattat gtcccaaaat attgtaaatg ggaaaaaata atatcttatg aaaaaatgaa + 5581 tcagtttatt gaggaagctg atacaattgt tacccatggt ggtccagcaa cttttatggc + 5641 aattattgct aaaggaaaaa ctccaatagt tgttccgagg caaaagaaat ttggggagca + 5701 tgtgaatgat catcagatga atttttgttc taaaatatcc tctgaagggt atgaattatc + 5761 tctgattaac gatataagcg aattgcagta tagtttaaag caagaaaaga aaactaaatt + 5821 ttactctaat aatgcaaatt ttcttaagca gttatcaaaa ataattgaag atttaatagt + 5881 ataaaatgag attgtttctt cttattgcag atgaattaga aataaatcag gttgtgagta + 5941 aagcaacagt gccaaagtgt atttgtaatt aagaataaaa taaacaccat ttcaatatct + 6001 gaaaataatt ctcaaggcat agtttgaatt atggatatag attattttgc taagtcttct + 6061 aatcgattta taagttaagg cagtaacatt attaaaatca tagatagaag taaggaggga + 6121 actaaatgaa aatactacat attccaacgg gtggtttatt ttctgatggt ataggaactt + 6181 ttatttattc atatttggag 
tatatggact taaacaagta tgatgtgaca attttagcca + 6241 ctaatcctct tttgaaaagt gataaggaaa aatttgaata tttaggggtt aaagttattg + 6301 aaattgaaag gaaaaaatca aacctttcta aatatatata caaattgaaa aaattaatga + 6361 aaaaagaaaa atttgatatt atacatgttc acggaagtag cgctttaatg tcaattgaat + 6421 tactgactgc taaaattgct ggtatcccag ttcgaattgc ccatagccat aacactactt + 6481 gtgagcatca taaactagat aaactactac gaccgatatt ttatcgagtt tatactcagg + 6541 catgtgcttg cagtgttagt gctggtcagt ggctttttga ggaaaaaaat tatgagatta + 6601 tccataacgc tagagatgta aataagtatc agtatgatgc cataaaacga aaaaaactta + 6661 gagaagaatt gttactgtct gatgagacta ttgctctagg tcatgttgga cgttttaata + 6721 ctcaaaaaaa tcaacgtttt ctagtgtctc tgatggaaag attagtgatc aaaaatatag + 6781 atttaaaatt atttttagta gggacgggtg atactttaga agaaatcaag aaattagtca + 6841 ttcagaaaaa actagaagat aatattgttt ttttaggtca atttgatgat atgaaatctt + 6901 ttgtgtcatc aatggatata atgttacttc caagtttata tgaagggtta ccactagtat + 6961 ctgttgaatg gcaaataaac ggagtaaaaa gtatcctatc tgaccgtgtt acacaagagt + 7021 gtatctatac agaaactgtt caacaattat ctatcgatag tatggaatta tgggaaaaag + 7081 aaattttaaa tttatctact tcagatagag aaagagtgtc attgcaaaat attcagttaa + 7141 taagaaatgc aggctatgat atttctttag aagttaaaga aatagaagaa ttatataatt + 7201 cactttatga tattgcgaat tgaatgaaag gaaagagttt tcttttgaag atgttacaaa + 7261 atttaaaact aataaaacgg agattaaaac caataaaacg gaaattaaaa ccaattaaga + 7321 gaacttataa gaaaatagtt tattctatca ctaagtcaaa tatgaggaag aggctcaaaa + 7381 atacagattt ttcaattatc agtgataatt gctggggagg acgggtatat gaagaattgg + 7441 gtctgccgta tagaacacca tttataggtc tgtatatttt ttctgaggat tatgtgaagc + 7501 tgttgaaaaa cttcaaaaag tatatggaat atgagctaac gtttaccaat aattcaaaat + 7561 ggaacacaga atatgacggg gagtatccta taggtattct caatgatata gaaattcatt + 7621 ttttacatta ttctagcatg gaagaagcat ataaaaaatg gaataaaaga aaaaaaagaa + 7681 ttaattataa aaatattttt tttaagatga atgatgataa taaatgttct ttgaaattgc + 7741 ttaaggaatt tgatactttg gatttgaaaa ataaaattat ttttgctgca ttcaattata + 7801 aagaactaga taatcttatt cattttacca atcctatagg 
taatggaaat gtaggtgcag + 7861 acctatttta ttataataaa tactttgatg ttgttaattg gttgaatgga gagtactaag + 7921 tatgatacct aaaaaaattc attattgttg gtttggtggc aaaccattac caaatgatgt + 7981 gaaacgatgt atagctagtt ggagaaagtt ttgtcccgac tatgaaatta ttgaatggac + 8041 tgaaaaaaat ttttgtattc aaaatcaaaa tcaatttgta aaagatgcgt ataaaaataa + 8101 ggcatgggct tttgttagcg actatgctag actcaaaatt gtttatgaaa atggaggtat + 8161 ctatttagat actgatgttg agattattaa aaagctagat ttgttactgg ataacacagc + 8221 attctttggt gttcatcaag ttaatcatct agttaataca ggattaggtt ttggggctga + 8281 aaaggggtca ttcattttaa aagaattatt agattcttat gatgaagtga aatttgatat + 8341 taacaagaaa gacgagctat tatgtccaga attaaacacg caaatattta aacaactagg + 8401 ttatgtttat tctaattcag ttataaaaag tcaatatttc acaatctatc ccgaagaata + 8461 cttcgatccc atttcattgg gagatgaagt tgctaatatt ttatcagata aaacattttc + 8521 tattcatcat tataatgcat cttggacttc cttgatgaat cgggtgaaga gaaaaataat + 8581 tcgtaaacta ggtagaagta atgtctcgga gttaaaaaga atattaaagg ggaaaactag + 8641 atgagaatat caccatcgaa gctgatattt gcatttttta gcagttttta tattcttgta + 8701 atccttttcc cgagaggaat tttcctaggg cattctactt tagcttctcg tttatggatt + 8761 atttacaaag aaagtttata tctatcaata ctacttggtt caatatatgt tattttaaaa + 8821 atattatctc gaaatatcgc cattcatcag catgcttttt ttatcttaca atattatttt + 8881 attgtaatga ttttaacttt tatgttaagt gggtcaatcg gtgatggggt acaatcgatt + 8941 ttctatccaa tattcatcta tttgtttttt aatgaagttc gagataagaa atcaatagtg + 9001 ttaatttttg atatatttct ttatatactt accgctttat tcgttatcaa tacgattgat + 9061 atttttctga atttcacaaa tatttttcat gttacttttt taggacatgt tcaggtgatt + 9121 tcccaatata gtattctcgg atttctcgta tcagcttatt atctattaga agaaaagagg + 9181 aatatattag tcgcacagtt gctgttgatt ttaacgatta tcaattgttt tttttcagat + 9241 gtctctctct ctaaagctat tgctttgttt atgattattt atattatttc atacaagtta + 9301 aaaaaactat tttggaaaag aggaaggaag atatctgtta taacttttat tgcatctgtt + 9361 gtgatgttag cattagtgat ttttggatat tttttaccat atcttagata ttttgatttt + 9421 acttttaatg gtcgatacca aatttggcgc attgtgtatg ccaccattct tcaagtgaaa + 9481 
tggtttggat atggtgtgtt tggctttcaa tttaaacttc cgtggcagga attgggagaa + 9541 attggaataa attatactca taatcaaatt ttacagttag cacttgatag tggcattgtt + 9601 gggattatct cattctttac tatgattttt tatatgatct tttcaactaa aaatattcaa + 9661 aatcccgcaa taggctccct atttattttt gcctattttt gtctatttat tataatgttt + 9721 atagagagtg ttacttatta tccatactat tttattataa tagttcttca aactttgtac + 9781 ttaaaattgg aaagagaaag aaatgttaaa tagattgata agaaatttta ataaagtata + 9841 ttatagttat cgtataaaaa gaaaggccgc acaatgcagt gggagagtgt atacgggagg + 9901 caaaacgttt gttactgcaa atacgtacct tgatgaaaat gtttcattta atggtatgtc + 9961 aatgtatggt gaagggaaaa taagcattgg taaaaatttt cattcaggat taaattgcca + 10021 aattatcact tcctttcata attatgactt gggtgataaa attccttatg atgagagtta + 10081 catacataaa gacgtcttaa ttgaagataa cgtttgggta gggaataatg tgataatttt + 10141 aggtggtgcg attattgagg aaggtgcaat cattcaagca ggaagtacag ttgctggaag + 10201 aattccagca ggtgcgattg caggtggaca tccggcaaaa ccattcagat ttagaaatat + 10261 ggaacattat aatcggctta aacggcaaaa aaaatttcat tagaggttaa gaatgaatat + 10321 tgtaagttat ctaaaaaaaa acggtattac acatacttta aaaattatta atgaatataa + 10381 aatgcaagag ctgtttgata gtcttgttag tatttttaca aagcagaagg aacttcgtga + 10441 cagtattgtc attgaatgtc atactgattt tgagaataat ggtggtgcgt tctatgacta + 10501 tctaatcaat aatgagtata acaaaaaata taaaattgtc ttactattga aggataaatt + 10561 atctaaagaa ttaccagaaa atgtagatta tttttattta agaaagccca gtttacgaaa + 10621 atcctacgta atgtcattaa gtaaattctt tacttttgat aatgatatgc ttcgtaaata + 10681 tagaaaagat caaaaacact tttatttaac acatggatgc tttcctttaa aaaatacaat + 10741 aggtaaaata acagttccga attatgttga ttttgttcta tctccatcgg gcaatgtaga + 10801 taatattata gttaagcagt ttggattaac atctaaagag caatgtcttc acactggatt + 10861 tccgtgtcat gatatctttt attcaaaaac agaacctcta gtatttttat ctgattatga + 10921 taaaaaaatt atctgggcac caacttttag aaagggtggt ggctataata gaaatgatag + 10981 tacagctagc tatcctttag gtattccatt acttggaaca ctagatgaac ttgcacacct + 11041 aaacacatat ctaagccaac gggatattgt cctgattgta aagttacatc caatgcaaga + 11101 
tatttcagat ttggagttga aacaatttag tcatattaag tttctgacaa atcaaaatct + 11161 gaaacgtaaa aatataaata tgtatcaatt gctgatgaat tcagatgctt tacttagtga + 11221 ctattctgca atctcgtatg attatttaca tcttgataaa ccaatagggt atgttttttc + 11281 agatctaaat gattataagt tggggttttc agttgataat gtagatgatt acatagcagg + 11341 tgataagata atgtctttta acgacttgct gcactttatt gataacattt atctagaaat + 11401 tgataaaaat aaagaaaaac gcaaggaatt atttaataaa atatttgaaa aacaggatgg + 11461 agaatcgtgt gaaagattgg cccaaattat ggaattatag gagacgttac gaagaaatgt + 11521 ctgttgggat gaaagcggca ctctggtata ctgttgcaaa ttttattcaa aagggttttg + 11581 tatttctttc aactccgatt ttaaccagaa tacttaatgt taatgattac ggtacattga + 11641 tactttacca atcatggttt gtactatttg ctatttttgc taccttgaat ctttctcaaa + 11701 cagcttataa taagggatta gtagaatttg agaatgataa agataatttt acattttctt + 11761 tgttgttttt gtctaagatt attacgataa ttgttgcttt tttgtatttt acttttaata + 11821 tactggttaa agatagtact ggattaactc ccggtttcat gatattttta ttcagtgata + 11881 ttttatttaa tattagtata gaattttatt tggcacgtca gagatttgaa ttcaaatata + 11941 gaaaagcagt tctaatttca atttcttcaa gttttttaat tgtagctatt agtacaacta + 12001 tcttattagt gattaagaat gatttattca ttaaaattgt attagatgct attatccgaa + 12061 ttatctttgg tttatattgt ttttatctct tgtttttttc agggagaagg caacttaaga + 12121 tagaaaaaaa atatattaaa tatggtttga gttattcatt acctttgatg ccgcatttct + 12181 tatcgcacta tattttgaat cagtctgatc gtttgatgat taacatgttt gatggtaagg + 12241 agaaattagc tatatatagt ctagcttatt ctgtatcaat gattatgttt ttgtttacta + 12301 atgcaattaa tcaatcaata atgccgtata catttcaagc tttgaaaaaa aaggattatc + 12361 gtgggataca tgggagcacc aaatggcttt ttataacagt tgggggagtc acagttctct + 12421 caattctatt tgcaccagaa ctaattgtta ttttaggcgg caataaatat aaggaatcaa + 12481 tttggctagt acctccaatt gctatctcgg tttatttcct ttttgtgtat tctatgttta + 12541 gtaatatcag tttttattat aagatgaata aactgatttc gttagtttcc acaggtgcag + 12601 ctctttcaaa tattatttta aattatattt ttattaatat atttgggtat caagctgcat + 12661 cttacactac attattatgc tatatattgt tagcattttc tcattttttc ttatatagat + 12721 
ttttattaaa aaaagaggaa attcatgagg aactttataa tatgaagatg attctaataa + 12781 tatctttaat attattaaca atactatttt tgatacttgt tatttataac ttagccttta + 12841 taaggtatgc aattattgta attattgtat ttcttttgtt tacaaagaga aataaaataa + 12901 ttacatccct aaaaagttga tattgaaaat ttagattcaa attaagaata tagtggatat + 12961 caaaccagta ataataatga ataattgttt ttatgtaatt tgggattaat aaaaaattga + 13021 aaggaaatat caatgaaaag agtgattact tatggaacct ttgatttgct tcattatgga + 13081 catatcaatt tgctaaagag agcgaagcaa ttaggagatt atctcattgt tgtagtttca + 13141 agtgatgagt tcaatttgaa agaaaaaaat aaagtttgtt actttaattt tgaacataga + 13201 aaaaatttgg ttgaagcgat aagatatgtt gatttggtga ttcctgaaac aagctgggaa + 13261 cagaaaaaaa cagatattaa agaatatcac attgatacat ttgttatggg ggatgattgg + 13321 aaaggaaaat ttgattattt aaaagaagaa ggagtggaag tagtttattt accaagaact + 13381 aaagaaatat ctacaactaa aattaaagaa gatttagcag attagatttt ttacaaaaat + 13441 attttgagat cagataataa atttgtttcc ataattatta atgttttgac tatttaaatc + 13501 tcatttttta aaaaattcgg attgattaat aataaaaaaa tctagtttaa gatatgaaag + 13561 aaaattatat ccataactat tatattgttt gtaatatgta tcgtgataat gtataagaaa + 13621 ttagtagata taaatgtgat atatagctaa aactaatatt attcattgct atttaaaatg + 13681 tagttagaag taaagcatct aataaacttg aaggtacata aaaatttagc attaaattat + 13741 aaaacaaggt atttttctgt gaaaattggg tagatataca ataatatttg tattgttaga + 13801 gaaagaattc ttaatattat attgtaatgg aggcattttg aattgactaa agtaagaatt + 13861 aattgggtag attttgggaa aggatttgca atattcttag ttctagtagg gcatgtattt + 13921 attggtttat atgaatccaa taagttttca attgcaaatg atgtgttatt attcctgata + 13981 gctcaaatct atatatttca tataccagtg ttttttgcgt tatcaggata ctttttcaga + 14041 cctgtatcag atttgaagga gttttggcat tatgctaaaa agaaaaccat tattttaggc + 14101 ataccatata ttttttattc aattattcac ttttgtcttc aaaaggttgc gggtgcttct + 14161 gtccgagtac ccactacgat atttaaccta ttgaatatct ataaatttcc tctgggagtt + 14221 tcatggtatc tatatacgtt atggtcgata ttgatagttt atggtttact atctgttgtt + 14281 ttcaaaaatc gtaagtccct tttgttagtt agtgtttttg cctatatttt cacactattt + 14341 
attcaaactg atatttttat tgtgcaacgg acgttggttt gggggatttg tttccttctt + 14401 ggcagtgtat tgagtgaaat tcactttgat aaaattaatt ttaaaaaaat tcttgttttc + 14461 tttgtgttat ttgattttat ttatatgttc gcttggttct tgttttatga agtaggatct + 14521 aagaaggatt atgtaagcta tagtaaccca ggtttgtggg ggattgcttt tattgtctgt + 14581 gtattagttg cttttgcgat ttttcctaaa atggagaaaa attttcctaa aactttccta + 14641 tatttcacta aatacgggaa agatagttta gggatctata ttcttcatgc accaatttgt + 14701 agcatgattc ggattctaat gttgaaagtg ggaataaact cagtttttct tcacgttgtt + 14761 gttgggattg tgctaggctg gtatttatcc atactggcaa cttatatatt gaaaaaaatt + 14821 ccatttttga atattgtttt attaccacaa aagtatatta aattaaaata a +// + diff --git a/public/res/serotype_genbank/serotype_11F.gb b/public/res/serotype_genbank/serotype_11F.gb new file mode 100644 index 0000000..293323b --- /dev/null +++ b/public/res/serotype_genbank/serotype_11F.gb @@ -0,0 +1,776 @@ +LOCUS CR931657 16926 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 34356 (serotype 11f). +ACCESSION CR931657 +VERSION CR931657.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 16926) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 16926) + AUTHORS Bentley,S.D. 
+ TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..16926 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="34356" + /db_xref="taxon:1313" + gene <1..137 + /gene="dexB" + /locus_tag="SPC11F_0001" + CDS <1..137 + /gene="dexB" + /locus_tag="SPC11F_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI33195.1" + /db_xref="GOA:Q4K0Y0" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K0Y0" + /translation="SNEEQDLTVEGKVKSVLIENTAAKEVLEKQVLAPWDAFCVEMTD + " + gene complement(268..1679) + /gene="tnp" + /locus_tag="SPC11F_0002" + /pseudo + CDS complement(join(268..963,963..1679)) + /gene="tnp" + /locus_tag="SPC11F_0002" + /note="member of homology group 17" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1202 transposase" + /db_xref="PSEUDO:CAI33196.1" + misc_feature complement(join(691..963,963..1196)) + /gene="tnp" + /locus_tag="SPC11F_0002" + /note="HMMPfam hit to PF00665, Integrase core domain, + score 5.4e-19" + /pseudo + gene 1848..3302 + /gene="wzg" + /locus_tag="SPC11F_0003" + CDS 1848..3302 + /gene="wzg" + /locus_tag="SPC11F_0003" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33197.1" + /db_xref="GOA:Q4K222" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K222" + /translation="MLIMSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNI + LAFRYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLLFSILVSSVSLFTVQQFVGL + 
TNRLNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNT + DLTVNQSSSYLAAYKSLIAGDTKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKV + EAPKTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPI + ADGGNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGVDVH + NDQEFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKL + TSTEALKNYGTIINSLQDSIQTNMPLETMIDLVNTQLESGGKYKVNSQDLKGTGRMDL + PSYAMPDSNLYVLEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1848..1973 + /gene="wzg" + /locus_tag="SPC11F_0003" + /note="Signal peptide predicted for SPC0523 by SignalP 2.0 + HMM (Signal peptide probability 0.991) with cleavage site + probability 0.537 between residues 42 and 43" + misc_feature 2061..2408 + /gene="wzg" + /locus_tag="SPC11F_0003" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 4.7e-62" + misc_feature 2586..3029 + /gene="wzg" + /locus_tag="SPC11F_0003" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 8.4e-70" + gene 3304..4035 + /gene="wzh" + /locus_tag="SPC11F_0004" + CDS 3304..4035 + /gene="wzh" + /locus_tag="SPC11F_0004" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33198.1" + /db_xref="GOA:Q4K221" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K221" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGVTPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKSKLFGERYKFMKKRVQYFLEQDLVHVIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 3307..3915 + /gene="wzh" + /locus_tag="SPC11F_0004" + /note="HMMPfam hit to PF02811, PHP domain, score 9.3e-37" + gene 4041..4736 + /gene="wzd" + /locus_tag="SPC11F_0005" + CDS 4041..4736 + /gene="wzd" + /locus_tag="SPC11F_0005" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis 
protein + Wzd" + /protein_id="CAI33199.1" + /db_xref="GOA:Q4K220" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K220" + /translation="MMKEQNTIEIDVFQLFKTLWKRKLMILIVALVTGAGAFVYSTFI + VKPEYTSTTRIYVVNRNQGDKPGLTNQDLQAGSYLVKDYREIILSQDALEKVATNLKL + DMPAKTLASKVQVAVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGTVVTVIAVLLIELLDTRVKRPEDVEDVLQI + PLLGLVPDLDKIK" + misc_feature 4062..4478 + /gene="wzd" + /locus_tag="SPC11F_0005" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 5.1e-55" + misc_feature 4584..4661 + /gene="wzd" + /locus_tag="SPC11F_0005" + /note="PS00217 Sugar transport proteins signature 2." + gene 4746..5435 + /gene="wze" + /locus_tag="SPC11F_0006" + CDS 4746..5435 + /gene="wze" + /locus_tag="SPC11F_0006" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33200.1" + /db_xref="GOA:O84996" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:O84996" + /translation="MPTLEISQAKLDSVKKAEEYYNALCTNLQLSGDGLKVFSITSVK + IGEGKSTTSANIAWAFARAGYKTLLIDGDIRNSVMLGVFKARNKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFTTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRNCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGIVLNKFDTSVDKYGSY + GNYGNYGKNKK" + gene 5450..6817 + /gene="wchA" + /locus_tag="SPC11F_0007" + CDS 5450..6817 + /gene="wchA" + /locus_tag="SPC11F_0007" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI33201.1" + /db_xref="GOA:Q4K218" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K218" + /translation="MNGKILRSSLAIIQSFLVILLTYLLSAVRETEIVSTTAIALYIL + HYFVFYISDYGQDFFKRRYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYF + LTLYALLVYVLNLFIKWYWKRTYPNFKGSKKILLLTATSRVEKVLHKLIESNEVVGEL + 
VAVSVLDKPDFQHDCLKVVAEGEIVNFATHEVVDEVFINLPSGKYNIGELVSQFETMG + IDVTVNLNTFDRSLARNKQIREMAGLNVVTFSTTFYKTSHVIAKRIIDIVGALVGLIL + CGLVSVVLVPLIRKDGGSAIFAQTRIGKNGRHFTFYKFRSMCVDAEDKKRKLMEQNTM + QGGMFKVDDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVLM + KDGAK" + misc_feature 5450..5536 + /gene="wchA" + /locus_tag="SPC11F_0007" + /note="Signal peptide predicted for SPC0527 by SignalP 2.0 + HMM (Signal peptide probability 0.844) with cleavage site + probability 0.429 between residues 29 and 30" + misc_feature 6233..6814 + /gene="wchA" + /locus_tag="SPC11F_0007" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 1.8e-156" + gene 6821..7270 + /gene="wchJ" + /locus_tag="SPC11F_0008" + CDS 6821..7270 + /gene="wchJ" + /locus_tag="SPC11F_0008" + /note="member of homology group 26" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase enhancer" + /protein_id="CAI33202.1" + /db_xref="GOA:Q4K217" + /db_xref="InterPro:IPR013969" + /db_xref="UniProtKB/TrEMBL:Q4K217" + /translation="MKICLVGSSGGHLTHLYLLKPFWKDKERFWVTFDKADARSVLSE + EVVYPCYYPTNRNIKNLIKNTFLAYKILKKERPDLIISSGAAIAVPFFYIGKLFGSKT + VYIEVFDRIDAPTITGKLVYPVTDKFIVQWEEMKKIYPKAINLGGIF" + gene 7270..7749 + /gene="wchK" + /locus_tag="SPC11F_0009" + CDS 7270..7749 + /gene="wchK" + /locus_tag="SPC11F_0009" + /note="member of homology group 27" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33203.1" + /db_xref="GOA:Q4K216" + /db_xref="InterPro:IPR007235" + /db_xref="UniProtKB/TrEMBL:Q4K216" + /translation="MIFVTVGTHEQQFDRLIKEVDRLKEENLIQEEVFIQTGYSNYVP + KYCKWEKIISYEKMNQFIEESDTIVTHGGPATFMAIIAKGKTPIVVPRQKKFGEHVND + HQMNFCSKISSEGYELSLINDISELQYSLKQEKKTKFYSNNANFLKQLSKIIEDLIV" + misc_feature 7270..7740 + /gene="wchK" + /locus_tag="SPC11F_0009" + /note="HMMPfam hit to PF04101, Glycosyltransferase family, + score 6.8e-45" + gene 7991..9088 + /gene="wcyK" + /locus_tag="SPC11F_0010" + CDS 7991..9088 + 
/gene="wcyK" + /locus_tag="SPC11F_0010" + /note="member of homology group 116" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33204.1" + /db_xref="GOA:Q4K215" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K215" + /translation="MKILHIPTGGLFSDGIGTFIYSYLEYMDLNKYDVTILATNPLLK + SDKEKFEYLGVKVIEIERKKSNLSKYVYRLKKLIKKEKFDIIHVHGSSALMSIELLTA + KIAGIPVRIAHSHNTTCEHHKLDKLLRPIFYRVYTQACACSVSAGQWLFEEKNYKIIH + NARDVNKYQYDAIKRKKLREELLLSDETIALGHVGRFNTQKNQRFLVSLIERLVIKNI + DLKLFLVGTGDTLEEIKKLVIQKKLEDNIVFLGQFDDMKSFVSSMDIMLLPSLYEGLP + LVSVEWQINGVKSILSDRVTQECIYTETVQQLSIDSMELWEKEILNLSTSDRERVSLQ + NIQLIRNAGYDISLEVKEIEELYNSLYDISN" + misc_feature 8513..9004 + /gene="wcyK" + /locus_tag="SPC11F_0010" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 1.2e-19" + gene 9109..9759 + /gene="wcwC" + /locus_tag="SPC11F_0011" + CDS 9109..9759 + /gene="wcwC" + /locus_tag="SPC11F_0011" + /note="member of homology group 48" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI33205.1" + /db_xref="GOA:Q4K214" + /db_xref="InterPro:IPR015037" + /db_xref="UniProtKB/TrEMBL:Q4K214" + /translation="MKTLKSIKRKLKPIKKTYKKIVYSITKSKMRKRLKNRDFSIISD + NCWAGRVYEELGLPYRTPFIGMYIYSEDYVKLLKNFKDYMGYELTFTNVTKWNEEYTG + EYPIGILKDIEIHFLHYVNQEEAYEKWNKRKNRINYENIFFKMNDDNKCSFELLKEFD + NLDFKNKIIFAAFNYKELDNLIHFTNPRGNGNVGTDLFYYDQYFDVVNWLNGETQT" + gene 9756..10478 + /gene="wcrL" + /locus_tag="SPC11F_0012" + CDS 9756..10478 + /gene="wcrL" + /locus_tag="SPC11F_0012" + /note="member of homology group 54" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33206.1" + /db_xref="GOA:Q4K213" + /db_xref="InterPro:IPR007577" + /db_xref="UniProtKB/TrEMBL:Q4K213" + /translation="MIPKKIHYCWFGGKPLSSDVKRCIASWKKFCPDYEIIEWTEKNF + CIENQNQFVQDAYRDKAWAFVSDYARLKIIYENGGIYLDTDVEVIKNLDKLLENKAFF + GVHQVNHLVATGLGFGSEKGTFILKELLNLYDEIEFDLRKKDELLCPELNTPVFKRLG + 
YTYSDCVVKNEYFTIYPEEYFDPISLGYGVENILSDKTFSIHHYSASWTSLRDQMKSK + IIRKFGRGNVLKLKRILKGKTR" + gene 10475..11647 + /gene="wzy" + /locus_tag="SPC11F_0013" + CDS 10475..11647 + /gene="wzy" + /locus_tag="SPC11F_0013" + /note="member of homology group 68" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33207.1" + /db_xref="UniProtKB/TrEMBL:Q4K212" + /translation="MRISPSKLIFAFFSSFYILVILFPRGIFLGHSTLASRLWIIYKE + SLYLSILLGSIYVILKILSRNIAIHQHAFFILQYYFIVMILTFMLSGSIGDGVQSIFY + PIFIYLFFNEVRDKKSIVLIFDIFLYILTALFVINTIDIFLNFTNIFHVTFLGHVQVI + SQYSILGFLVSAYYLLEEKRNILVAQLLLILTIINCFFSDVSLSKPIALFMIIYIMSY + KLRKLFWKRGRKISVITFIASVVMLALVIFEYFLPYLRYFDFTFNGRYQIWRIVYATI + PQVKWFGYGVFGFQFKLPWQELGEIGINYTHNQVLQLALDSGIVGIISFLIMIFYMIF + STKNIQNPTISSLFIFAYFCLFIIMFIESVTYYPYYFIIIVLQTLYLKLERERNVK" + misc_feature 10475..10561 + /gene="wzy" + /locus_tag="SPC11F_0013" + /note="Signal peptide predicted for SPC0533 by SignalP 2.0 + HMM (Signal peptide probability 0.862) with cleavage site + probability 0.448 between residues 29 and 30" + misc_feature 11249..11443 + /gene="wzy" + /locus_tag="SPC11F_0013" + /note="HMMPfam hit to PF04932, O-Antigen Polymerase, score + 6.7e-09" + gene 11637..12137 + /gene="wcwT" + /locus_tag="SPC11F_0014" + CDS 11637..12137 + /gene="wcwT" + /locus_tag="SPC11F_0014" + /note="member of homology group 69" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI33208.1" + /db_xref="GOA:Q4K211" + /db_xref="InterPro:IPR011004" + /db_xref="UniProtKB/TrEMBL:Q4K211" + /translation="MLNRLIRNFNKVYYSYRIKRKAAQCGGRVYTGGKTFVTANTYLD + ENVSFNGMSMYGEGKISIGKNFHSGLNCQIITSFHNYDLGDKIPYDESYIHKDVLIED + NVWVGNNVIILGGAIIEEGAIIQAGSTVVGRIPAGAIAGGHPAKPFRFRNMEHYNRLK + RQKKFH" + misc_feature 11925..11978 + /gene="wcwT" + /locus_tag="SPC11F_0014" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 0.9" + misc_feature 11979..12032 + /gene="wcwT" + /locus_tag="SPC11F_0014" + 
/note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 6.6" + gene 12147..13334 + /gene="wcwU" + /locus_tag="SPC11F_0015" + CDS 12147..13334 + /gene="wcwU" + /locus_tag="SPC11F_0015" + /note="member of homology group 70" + /codon_start=1 + /transl_table=11 + /product="putative glycerol phosphotransferase" + /protein_id="CAI33209.1" + /db_xref="GOA:Q4K210" + /db_xref="InterPro:IPR007554" + /db_xref="UniProtKB/TrEMBL:Q4K210" + /translation="MNIVSYLKKNGITHTLKIINEYKMQELFDSLVSIFTKQKELRDS + IVIECHTDFENNGGAFYDYLINNEYNKKYKIVLLLKDKLAKELPENVDYFYLRKPSLR + KSYVMSLSKFFTFDNDMLRKYRKDQKHFYLTHGCFGLKNTIGKITVPDYVDFVLSPSG + NVDNIIVKQFGLTSKEQCLHTGFPCHDIFYSKPKPLVFLSDYDKKIIWAPTFRKGGGY + NRNDSTASYPLGIPLLGTLDELAHLNTYLSQRDIVLIVKLHPIQDISDLELKQFSHIK + FLTNQDLKRKNTNVYQLLMNSDALLSDYSAISYDYLHLDKPIGYVFSDLNDYKLGLSV + DNVDDYIAGDKIMFFNDLLHFIDNIYLEIDKNKEKRKELFNKIFEKQDGESCERLAQI + MEL" + misc_feature 12720..13331 + /gene="wcwU" + /locus_tag="SPC11F_0015" + /note="HMMPfam hit to PF04464, + CDP-Glycerol:Poly(glycerophosphate) gl, score 7.2e-12" + gene 13351..14754 + /gene="wzx" + /locus_tag="SPC11F_0016" + CDS 13351..14754 + /gene="wzx" + /locus_tag="SPC11F_0016" + /note="member of homology group 52" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33210.1" + /db_xref="GOA:Q4K209" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K209" + /translation="MSVGMKAALWYTVANFIQKGFVFLSTPILTRILNVNDYGTLMLY + QSWFVLFAIFATLNLSQTAYNKGLVEFENDKDNFTFSLLFLSEIITIIVAFLYFTFNI + LVKDSTGLTPGFMIFLFSDILFNISIEFYLARQRFEFKYRKAVLISISSSFFIVAIST + TILLAIKNDLFIKIVLDAIIRIIFGLYCFYLLFFSGKRQLKIEKKYIKYGLSYSLPLI + PHFLSHYILNQSDRLMINMFDGKEKLAIYSLAYSVSMIMFLFTNAINQSIMPYTFQAL + KKKDYRGIHERTKWLFIIVGGGTVLSILFAPELIVILGGNKYKESIWLVPPIAVSVYF + LFVYSMFSNISFYYKMNKLISLVSTGAALSNIILNYIFINIFGYQAAAYTTLLCYILL + AFSHFFLYRFLLKKEEIHEELYNMKMILIISLILLTILFLILVIYNLAFIRYAIIVII + LFLLFTKRNKIITSLKS" + misc_feature 13360..14178 + /gene="wzx" + /locus_tag="SPC11F_0016" + /note="HMMPfam hit to 
PF01943, Polysaccharide biosynthesis + protein, score 2e-17" + gene 14867..15258 + /gene="gct" + /locus_tag="SPC11F_0017" + CDS join(14867..14998,14998..15258) + /gene="gct" + /locus_tag="SPC11F_0017" + /note="member of homology group 28" + /codon_start=1 + /transl_table=11 + /product="CDP-glycerol-1-phosphate biosynthetic protein + Gct" + /protein_id="CAI33211.1" + /db_xref="GOA:Q4K208" + /db_xref="InterPro:IPR004820" + /db_xref="InterPro:IPR004821" + /db_xref="InterPro:IPR006409" + /db_xref="InterPro:IPR014729" + /db_xref="UniProtKB/TrEMBL:Q4K208" + /translation="MKRVITYGTFDFLHYGHINLLKRAKQLGDYLIVVVSSDEFNLKE + KNKVCYFNFEHRKNLVEAIRYVDLVIPETSWEQKKTDIKEYHIDTFVMGDNWKGKFDY + LKEEGVEVVYLPRTKEISTTKIKEDLAD" + misc_feature join(14879..14998,14998..15246) + /gene="gct" + /locus_tag="SPC11F_0017" + /note="HMMPfam hit to PF01467, Cytidylyltransferase, score + 1e-28" + gene 15676..16704 + /gene="wcjE" + /locus_tag="SPC11F_0018" + /pseudo + CDS 15676..16704 + /gene="wcjE" + /locus_tag="SPC11F_0018" + /note="member of homology group 18" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase (pseudogene)" + /db_xref="PSEUDO:CAI33212.1" + misc_feature 15691..16665 + /gene="wcjE" + /locus_tag="SPC11F_0018" + /note="HMMPfam hit to PF01757, Acyltransferase family, + score 0.00018" + /pseudo + gene 16879..>16926 + /gene="aliA" + /locus_tag="SPC11F_0019" + CDS 16879..>16926 + /gene="aliA" + /locus_tag="SPC11F_0019" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33213.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ89" + /translation="MMKSSKLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acactgcggc taaagaagta cttgaaaaac aggtcttggc tccatgggat gctttctgtg + 121 tggaaatgac tgactagaat gagcaaacct caagtttttg aagcttgagg ttttttacta + 181 tagtggattg aaactagaat agtgcacctc tacttctaaa acattgttag aaatcgattt + 241 gactgtcctg actaatttgt cctattctta tttcatttta ctatatttgt agttgaggag + 301 aattaagctc ctcactagta aactcttcat aatccttttt 
atttttatga agatattgtt + 361 tgaaagatgt gagtttccac ggatgggttt gtggagggat atacttgcgt ctttcttttt + 421 ttgttctggt tcttgttcaa agtttttcga atagagttca tgatctagta gctcctttgt + 481 gtgatagatt ttgtcagcga tattgaggta gatgtctccg tcaaatgctt ttataactaa + 541 tgctttcgta tttctgatga aatagacttc ttttccttgt tcggtaggga tatagtaacg + 601 attttggaat cggatatggt gtccactatc gacgactctc tccgccagtc tggccagaat + 661 gagattcctt tcagaggggt taggaacctc ctcgaagaca gagagttttg tcttgtttcc + 721 aaactgttca ttaaaggttt ggatgtagga aagcaggaag gtattggctt cttccaaggt + 781 atgaatattg tttcgttcca gttcgatagg caggcgagat tgtagtgtct gattaagtct + 841 ttcgactctc cctttagctt gagggataga ggttgtctcc agaagaatcc ctagttggtg + 901 acaggcgtat ccaaattgtg tatgggtgtc gtcctccatt ttcttcgagt tggaggcttg + 961 atataggtaa agaccgttct cttatctgtt ttaatttgaa ggggaacgcc gtgattgcct + 1021 aaaatttgtt cgaggacatg atagtaagca ttcaaggtct cttgtttatc aaaataagcg + 1081 cctaggatat tgccagaagc atcatcaatg gctaagtgta agttagatgt ttgggctcca + 1141 aaccatgcat gagggctggc atccatttga atgagttctc cagcaaattt ctttctgggt + 1201 ctactaggat gtactttttt aggggcttca aggaagtttt cagccgtcgg taagattgga + 1261 ttgtctaggg gttgattcag gttcagttta gcttgttttc ttactctctt ctttgtcttt + 1321 ctatgggact taggcgacag gatatttttc ttatagagta tttttctaac agttgtatca + 1381 gagagctgaa ttccttcttc ttcagctagc aattcacaga aatgaaggac atttggttta + 1441 tatgtttcat aggagaggta tttctttagg agacgttctt tgatttcatc agggattgca + 1501 tgttttggtt ttcgatttct gtttccgtgt ctgaaggctt cttttccttt cagttgatag + 1561 gctagtagca gacgattgat ttgtctttca gaaagattga gctcgacaca ggttcgtttc + 1621 tttgttttct ttccttgcgc tatagctttt atcacaagat attttttagt ttcattcata + 1681 ttcagttgga tccttttcat atgactattc taccaaatgg gacattttca cgttcgattt + 1741 actaaagaca ttatcacatt cgaattacac aagatgcaga tagtgaaaat aaaggtgtag + 1801 acattaccgt aaaaaagtga tataatcgta tgatgttcaa ggtataggtg ttaatcatga + 1861 gtagacgttt taaaaaatca ggttcacaga aagtgaagcg aagtgttaat atcgttttgc + 1921 tgactattta tttattatta gtttgttttt tattgttctt aatctttaag tacaatatcc + 1981 ttgcttttag 
atatcttaat ctagtggtaa ctgcgttagt cctactagtt gccttggtag + 2041 ggctactctt gattatctat aaaaaagctg aaaaatttac tatttttctg ttgctgttct + 2101 ctatccttgt cagctctgtg tctctcttta cagtacagca gtttgttgga ctgaccaatc + 2161 gtttaaatgc gacttctaat tactcagaat attcaatcag tgtcgctgtt ttagcagata + 2221 gtgagatcga aaatgttacg caactgacga gtgtgacagc accgactggg actgataatg + 2281 aaaatattca aaaactatta gctgatatca agtcaagtca gaataccgat ttgacggtca + 2341 accagagttc gtcttacttg gcagcttata agagtttgat tgcaggtgac accaaggcca + 2401 ttgtcttaaa tagtgtcttt gaaaatatca tcgagtcaga gtatccagac tacgcatcga + 2461 agataaaaaa gatttatacc aagggattca ctaaaaaagt agaagctcct aagacgtcta + 2521 agaatcagtc tttcaatatc tatgttagtg gaattgacac ctatggtcct attagttcgg + 2581 tgtcgcgatc agatgtcaat atcctgatga ctgtcaatcg agacaccaag aaaatcctct + 2641 tgaccacaac gccgcgtgat gcctatgtac caatcgcaga tggtggaaat aatcaaaaag + 2701 ataaattgac tcatgcgggc atttatggag ttgattcgtc cattcacacc ttagaaaatc + 2761 tctatggagt ggatatcaat tactatgtgc gattgaactt cacttctttc ttgaaattga + 2821 ttgacttatt gggaggggta gatgttcata atgatcaaga gttttcagct ctacatggga + 2881 agttccattt cccagtaggg aatgtccatc tagactctga gcaagctcta ggttttgtac + 2941 gtgaacgcta ctcactagcc gatggagacc gtgaccgtgg tcgcaaccaa caaaaggtga + 3001 ttgtggctat ccttcaaaaa ttaacgtcaa ccgaagcact gaaaaattat ggtacgatca + 3061 ttaatagctt gcaagattct atccaaacaa atatgccact tgagaccatg atagatttag + 3121 tgaatactca gttggaaagt ggagggaagt ataaagtaaa ttctcaagat ttaaaaggga + 3181 caggtcggat ggatcttcct tcttatgcaa tgccagacag taacctctat gtgctggaaa + 3241 tagatgatag tagtttagct gtagttaaag cagctataca ggatgtgatg gagggtagat + 3301 gaaatgatag acatccattc gcatatcgtt tttgatgtag atgacggtcc caagtcaaga + 3361 gaggaaagca aggctctctt ggcagaatcc tacaggcagg gggtgcgaac cattgtctct + 3421 acctctcacc gtcgcaaggg catgtttgaa actccagaag agaagatagc agaaaacttt + 3481 cttcaggttc gggaaatagc taaggaagtg gcgagtgact tggtcattgc ttacggggct + 3541 gaaatttact acacaccaga tgttctggat aagctggaaa aaaagcggat tccgaccctc + 3601 aatgatagtc gttatgcctt gatagagttt 
agtatgaaca ctccttatcg cgatattcat + 3661 agcgccttga gcaagatctt gatgttggga gttactccag tcattgccca cattgagcgc + 3721 tatgatgctc ttgaaaataa tgaaaaacgc gttcgagaac tgatcgatat gggctgttac + 3781 acgcaagtaa atagttcaca tgtcctcaaa tccaaacttt ttggcgaacg ttataaattc + 3841 atgaaaaaaa gagttcagta ttttttagag caggatttgg ttcatgtcat tgcaagtgat + 3901 atgcacaatc tagacggtag acctcctcat atggcagaag catatgacct tgttacccaa + 3961 aaatacggag aagcgaaggc tcaggaactt tttatagaca atcctcgaaa aattgtaatg + 4021 gatcaactaa tttaggagaa atgatgaaag aacaaaacac gatagaaatc gatgtatttc + 4081 aattatttaa aaccttgtgg aaacgcaagc taatgatttt aatagtggca cttgtgacag + 4141 gtgcgggggc ttttgtatat agcactttta ttgttaagcc agaatatacg agtaccacgc + 4201 gaatttacgt agtgaatcgc aatcaaggag acaagccggg gttgacaaat caggatttac + 4261 aggcaggatc ttatctggta aaagactacc gtgagattat cctttcgcag gatgcattgg + 4321 aaaaagtagc gacaaatttg aagttggata tgccagcaaa aacgttagcc agcaaagttc + 4381 aagtagctgt accagctgac actcgtatcg tctcaatctc tgtcaaggat aaacagccag + 4441 aggaagccag tcgtatcgct aattctctac gagaagttgc tgcagaaaag atcgtcgctg + 4501 taacgcgagt atctgatgta acgacacttg aagaagcgcg accagctacg actccctctt + 4561 ctccaaatgt tcgacgcaat tccttgtttg gttttcttgg aggaacagtc gtaacagtaa + 4621 ttgctgttct tttgattgag ttgctggaca cccgtgtgaa acgtcctgaa gatgttgaag + 4681 atgtactgca aattccactt ttagggctcg ttccagattt ggacaaaata aaataggagg + 4741 aagttatgcc aacattagaa atctcacagg caaaattgga ttctgtaaaa aaggcagagg + 4801 aatattataa cgctttgtgc acgaacctac agttaagtgg agatggtttg aaagtatttt + 4861 ctatcacttc tgtgaaaata ggagaaggaa aatcaacgac ttccgccaat atcgcttggg + 4921 cttttgcgcg tgcaggttac aaaacgctgc tgattgatgg agatattcgc aattctgtta + 4981 tgttaggtgt ctttaaagca aggaataaga ttacaggcct gacagaattt ttatcaggaa + 5041 ctacagacct atcacaaggg ctttgtgata ccaatatcga aaatctcttt gtaattcagg + 5101 ctggctctgt gtcaccgaat ccgacagctc ttcttcaaag taagaatttc actacaatgc + 5161 ttgaaacctt gcgtaaatat tttgactaca tcattgtaga tactgctcct gttggtgtcg + 5221 tgattgatgc ggctattatt acgcgaaact gcgatgcttc tattttagtg 
acggaggcag + 5281 gtgaaataaa tcgacgggat attcaaaaag caaaagaaca gttggaacac acaggaaagc + 5341 cgtttttggg aattgtgttg aataaattcg atacttcagt agacaaatac ggttcttatg + 5401 gaaattatgg aaattacggg aaaaataaaa aataggtcag gggatagaga tgaatggaaa + 5461 aatattaagg tcttcattgg ccataatcca gagttttctt gttattttat tgacttatct + 5521 acttagtgct gtgagagaaa cggagattgt ttcaacaaca gctattgcac tttatatcct + 5581 ccattatttt gtcttttata tcagtgatta tggacaggat ttctttaaaa ggagatattt + 5641 gattgaactt gtccagacat tgaaatatat cctattcttt gcactagcga ttagtatttc + 5701 taattttttc ttagaggatc gatttagtat ttccagacga ggcatgattt acttcctcac + 5761 attatatgct ctcttagtct atgtgctaaa cctatttatc aagtggtatt ggaagcggac + 5821 ttatcccaac tttaaaggaa gtaagaagat tctcctactt acagcaactt ctcgtgtcga + 5881 aaaggtactg cataaattaa tagaatcaaa tgaggttgtt ggggagttgg tagccgtcag + 5941 tgtcttagat aaaccagatt ttcagcatga ttgtttaaag gtagtagcag agggggagat + 6001 agtaaacttt gcgactcatg aggtggtcga tgaagtcttt atcaatcttc caagtggaaa + 6061 atacaatatt ggagagcttg tctctcagtt tgaaacgatg ggaattgatg taacagtcaa + 6121 tctaaatact tttgatcgta gtttggcacg taacaagcaa atccgtgaga tggcaggatt + 6181 aaatgttgtg actttttcta caacatttta taagactagt catgtaattg ctaagcggat + 6241 tattgatatt gtgggtgcat tggtagggct gatactatgc ggtctagtca gtgttgtact + 6301 ggttcctttg attcgaaaag atgggggctc tgctattttt gctcagacgc gtattggaaa + 6361 aaatggacga cattttactt tttataagtt tcgctccatg tgtgtagatg ctgaggacaa + 6421 aaaaagaaaa ctcatggaac aaaataccat gcagggtgga atgtttaagg tggatgatga + 6481 cccacgtatc acgaaaattg gtcgttttat acggaagact agcttggacg agctgccaca + 6541 gttttataat gttctaaagg gagatatgag tttggttggc acacggccac caacagtgga + 6601 cgagtatgaa cactataccc cagaacaaaa acgtcggtta agttttaaac ctggtataac + 6661 aggcttatgg caggtcagtg gacgaagtga gattaagaat tttgatgaag ttgtcaaatt + 6721 agatgtagcc tatatagacg attggacaat ttggaaagat attgagattt tattgaagac + 6781 agttaaagtt gtattgatga aggatggagc gaagtaggaa atgaaaatat gtttagttgg + 6841 atctagtgga ggtcatctga ctcatttata tcttttaaaa cctttctgga aagataaaga + 6901 aagattttgg 
gttacttttg ataaggcgga cgctcggagt gtactctctg aggaagttgt + 6961 atatccctgt tattatccaa ccaatcgtaa tataaaaaat ttaataaaaa atacttttct + 7021 cgcctataaa attttaaaaa aagagagacc agatttgatt atttcttctg gtgccgctat + 7081 cgctgttcct ttcttttata ttgggaagtt atttggatca aagacagtgt atatagaagt + 7141 gtttgataga attgatgctc caacaataac gggaaaactt gtttatccag taacggataa + 7201 gtttattgtt caatgggaag aaatgaaaaa aatttatcca aaagcaatta atctaggagg + 7261 aatattctga tgatttttgt tactgtaggg acacatgaac aacaatttga tcgtttgata + 7321 aaagaagttg atcgtttgaa agaagagaat ctaattcaag aggaagtatt tattcaaaca + 7381 ggatattcta attatgtccc aaaatattgt aaatgggaaa aaataatatc ttatgaaaaa + 7441 atgaatcagt ttattgagga atctgataca attgttaccc atggtggtcc agctactttt + 7501 atggcaatta ttgctaaagg aaaaactcca atagttgttc cgaggcaaaa gaaatttggg + 7561 gagcatgtga atgatcatca gatgaatttt tgttctaaaa tatcctctga agggtatgaa + 7621 ttatctctga ttaacgatat aagcgaatta cagtatagtt taaagcaaga aaagaaaact + 7681 aaattttact ctaataatgc aaattttctt aagcagttat caaaaataat tgaagattta + 7741 atagtataaa atgagattgt ttcttcttat tgcagatgaa ttagaaataa atcaggttgt + 7801 aagtaaagca acagtgccaa agtatatttg taattaagaa taaaataatc accatttcaa + 7861 tatctgaaaa taattctcaa ggcatagttt gaattatgga tatagattat ttcgctaagt + 7921 cttctaatct atttataagt taaggcagta acattattaa aatcatagat gggagtaagg + 7981 agggaactaa atgaaaatac tacatattcc aacgggtggt ttattttctg atggtatagg + 8041 aacttttatt tattcatatt tggagtatat ggacttaaac aagtatgatg tgacaatttt + 8101 agccactaat ccccttttga aaagtgataa ggaaaaattt gaatatttag gggttaaagt + 8161 tattgaaatt gaaaggaaaa aatcaaacct atctaaatat gtatacagat tgaaaaaatt + 8221 aataaaaaaa gaaaaatttg atattataca tgttcacgga agtagcgctt taatgtcaat + 8281 tgaattactg actgctaaaa ttgctggtat cccagttcga attgcccata gccacaacac + 8341 tacttgtgag catcataaac tagataaact actacgaccg atattttatc gagtttatac + 8401 tcaggcatgt gcttgcagtg ttagtgctgg tcagtggctt tttgaggaaa aaaattataa + 8461 gattatccat aacgctagag atgtaaataa gtatcagtat gatgccataa aacgaaaaaa + 8521 acttagagaa gaattgttac tgtctgatga 
gactattgct ctaggtcatg ttggacgttt + 8581 taatactcaa aaaaatcaac gttttctagt gtctctgata gaaagattag tgattaaaaa + 8641 tatagattta aaattatttt tagtagggac gggtgatact ttagaagaaa tcaagaaatt + 8701 agtcattcag aaaaaactag aagataatat tgttttttta ggtcaatttg atgatatgaa + 8761 atcttttgtg tcatcaatgg atataatgtt acttccaagt ttatatgaag ggttaccact + 8821 agtatctgtt gaatggcaaa taaacggagt aaaaagtatc ctatctgacc gtgttacaca + 8881 agagtgtatc tatacagaaa ctgttcaaca attatctatc gatagtatgg aattatggga + 8941 aaaagaaatt ttaaatttat ctacttcaga tagagaaaga gtgtcattgc aaaatattca + 9001 gttaataaga aatgcaggct atgatatttc tttagaagtt aaagaaatag aagaattata + 9061 taattcactt tatgatattt caaattaaga gaaaggggag gttatctttt gaagacgtta + 9121 aaatccataa agcggaaatt aaaacctata aagaaaactt ataagaaaat tgtttactct + 9181 attactaagt caaaaatgcg gaaaagacta aaaaatagag atttttcaat tatcagtgat + 9241 aattgctggg caggaagagt atatgaagaa ttaggtctac catatagaac accatttata + 9301 ggtatgtata tttattccga agattatgtt aagctattaa aaaattttaa agattatatg + 9361 ggatatgaac tgacttttac taatgttaca aaatggaatg aagaatatac tggggagtat + 9421 cctataggca tacttaagga tattgaaatt cattttttac attatgttaa tcaagaagag + 9481 gcttatgaga aatggaataa aagaaagaac aggattaatt atgaaaatat cttttttaaa + 9541 atgaatgatg ataataagtg ttcttttgaa ttgcttaaag aatttgataa tttggatttt + 9601 aaaaacaaaa ttatttttgc agcatttaat tataaagaat tagataatct tattcatttt + 9661 accaatccta gagggaatgg gaatgtaggt acagacttat tttattatga tcaatatttt + 9721 gatgttgtaa attggctgaa tggagagaca caaacatgat acctaaaaag attcattatt + 9781 gttggttcgg tggcaaacct ttatcaagtg atgtaaagcg atgcatagca agttggaaaa + 9841 aattttgtcc tgattatgaa attattgaat ggactgaaaa aaatttttgt attgaaaatc + 9901 aaaatcaatt tgtgcaggat gcatatagag ataaagcatg ggcttttgta agcgattatg + 9961 caagacttaa aattatatat gaaaatggag gtatttattt agatactgat gttgaagtaa + 10021 ttaaaaatct agataagttg ttggaaaata aagcattctt tggagttcat caagttaatc + 10081 atcttgttgc tacagggtta ggatttggat cggaaaaggg cacctttatt ttaaaggagt + 10141 tattaaattt gtatgatgaa atagaatttg atcttaggaa gaaagatgaa 
ttgttatgtc + 10201 ctgaattaaa tacacctgta tttaaacgtc ttggttatac ttattctgac tgtgttgtaa + 10261 aaaacgaata tttcacaatc tatcctgaag aatattttga tccgatttct ttgggttatg + 10321 gcgtagaaaa tattttatca gataagacat tctctattca tcattatagt gcttcttgga + 10381 cttccttgag agatcagatg aagagtaaaa taattcgtaa atttggtaga ggtaatgtgt + 10441 tgaagttaaa aagaatatta aaggggaaaa ctagatgaga atatcaccat cgaagctgat + 10501 atttgcattt tttagcagtt tttatattct tgtaatcctt ttcccgagag gaattttcct + 10561 agggcattct actttagctt ctcgtttatg gattatttac aaagaaagtt tatatctatc + 10621 aatactactt ggttcaatat atgttatttt aaaaatatta tctcgaaata tcgccattca + 10681 tcagcatgct ttttttatct tacaatatta ttttattgta atgattttaa cttttatgtt + 10741 aagtgggtca atcggtgatg gggtacaatc gattttctat ccaatattca tctatttgtt + 10801 ttttaatgaa gttcgagata agaaatcaat agtgttaatt tttgatatat ttctttatat + 10861 acttaccgct ttattcgtta tcaatacgat tgatattttt ctgaatttca caaatatttt + 10921 tcatgttact tttttaggac atgttcaggt gatttcccaa tatagtattc tcggatttct + 10981 cgtatcagct tattatctat tagaagaaaa gaggaatata ttagtcgcac agttgctgtt + 11041 gattttaacg attatcaatt gttttttttc agatgtctct ctctctaaac ctattgcttt + 11101 gtttatgatt atttatatta tgtcatacaa gttaagaaaa ctattttgga aaagaggaag + 11161 gaagatatct gtcataactt ttattgcatc tgttgtgatg ttagcattag tgatttttga + 11221 atatttttta ccatatctta gatattttga ttttactttt aatggtcgat accaaatttg + 11281 gcgcattgtg tatgctacca ttcctcaagt gaaatggttt ggatatggtg tgtttggctt + 11341 tcaatttaaa cttccgtggc aggaattggg agaaattgga ataaattata ctcataatca + 11401 agttttacag ttagcacttg atagtggaat tgttgggatt atctcattcc ttattatgat + 11461 tttttatatg atcttttcaa ctaaaaatat tcaaaatccc acaataagct ccctatttat + 11521 ttttgcctat ttttgtctat ttattataat gtttatagag agtgttactt attatccata + 11581 ctattttatt ataatagttc ttcaaacttt gtacttaaaa ttggaaagag aaagaaatgt + 11641 taaatagatt gataagaaat tttaataaag tatattatag ttatcgtata aaaagaaagg + 11701 cagcacaatg cggtgggaga gtgtatacgg gaggcaaaac gtttgttact gcaaatacgt + 11761 accttgatga aaatgtttca tttaatggta tgtcaatgta tggtgaagga 
aaaataagca + 11821 ttggtaaaaa ttttcattca ggattaaatt gccaaattat cacttccttt cataattatg + 11881 acttgggtga taaaattcct tatgatgaga gttacataca taaagacgtc ttaattgaag + 11941 ataacgtttg ggtagggaat aatgtgataa ttttaggtgg tgcgattatt gaggaaggtg + 12001 caatcattca agcaggaagt acagttgttg gaagaattcc agcaggtgcg attgcaggtg + 12061 gacatccggc aaaaccattc agatttagaa acatggaaca ttataatcgg cttaaacggc + 12121 aaaaaaagtt tcattagagg ttaagaatga atattgtaag ttatctaaaa aaaaacggta + 12181 ttacacatac tttaaaaatt attaatgaat ataaaatgca agagctgttt gatagtcttg + 12241 ttagtatttt tacaaagcag aaggaacttc gtgacagtat tgtcattgaa tgtcatactg + 12301 attttgaaaa taatggtggt gcgttctatg actacctaat caataatgag tataacaaaa + 12361 aatataaaat tgtcttacta ttgaaggata aattagctaa agaattacca gaaaatgtag + 12421 attattttta tttaagaaag cccagtttac gaaaatccta tgtaatgtca ttaagtaaat + 12481 tctttacttt tgataatgat atgcttcgta aatatagaaa agatcaaaaa cacttttatt + 12541 taacacatgg atgctttggt ttaaaaaata caataggtaa aataacagtt ccggattatg + 12601 ttgattttgt tctatctccc tcgggcaatg tagataatat tatagttaag cagtttggat + 12661 taacatctaa agagcaatgt cttcacactg gatttccgtg tcatgatatc ttttattcaa + 12721 aaccaaaacc tctagtattt ttatctgatt atgataaaaa aattatctgg gcaccaactt + 12781 ttagaaaggg tggaggctat aatagaaatg atagtacagc tagctatcct ttaggtattc + 12841 cattacttgg aacactagat gaacttgcac acctaaacac atatctaagc caacgggata + 12901 ttgtcctgat tgtaaagtta catccaattc aagatatttc agatttggag ttgaaacaat + 12961 ttagtcatat taagtttctg acaaatcaag atttgaaacg taaaaataca aatgtgtatc + 13021 aattgctgat gaattcagat gctttactca gtgactattc tgcaatctcg tatgattatt + 13081 tacaccttga taaaccaata gggtatgttt tttcggatct aaatgattat aagttggggc + 13141 tttcagttga taatgtagat gattacatag caggtgataa gataatgttt tttaacgact + 13201 tgctgcactt tattgataac atttatctag aaattgataa aaataaagaa aaacgcaagg + 13261 aattatttaa taaaatattt gaaaaacagg atggagaatc gtgtgaaaga ttggcccaaa + 13321 ttatggaatt ataaaagacg ttacgaagaa atgtctgtcg ggatgaaagc ggcactctgg + 13381 tatactgttg caaattttat tcaaaagggt tttgtatttc tttcaactcc 
gattttaacc + 13441 agaatactta atgttaatga ttacggtaca ttgatgcttt accaatcatg gtttgtacta + 13501 tttgctattt ttgctacctt gaatctttct caaacagctt ataataaggg attagtagaa + 13561 tttgagaatg ataaagataa ttttacattt tctttgttgt ttttgtctga gatcattacg + 13621 ataattgttg cttttttgta ttttactttt aatatactgg ttaaagatag tactggatta + 13681 actcccggtt tcatgatatt tttattcagt gatattttat ttaatattag tatagaattt + 13741 tatttggcac gtcagagatt tgaattcaaa tatagaaaag cagttctaat ttcaatttct + 13801 tcaagttttt ttattgtagc tattagtaca actatcttat tagcgattaa gaatgattta + 13861 ttcattaaaa ttgtattaga tgctattatc cgaattatct ttggtttata ttgtttttat + 13921 ctcttgtttt tttcagggaa aaggcaactt aagatagaaa aaaaatatat taaatatggt + 13981 ttgagttatt cattaccttt gataccgcat ttcttatcgc actatatttt gaatcagtct + 14041 gaccgtttga tgattaacat gtttgatggt aaggagaaat tagctatata tagtctagct + 14101 tattctgtat caatgattat gtttttgttt actaatgcaa ttaatcaatc aataatgccg + 14161 tatacatttc aagctttgaa aaaaaaggat tatcgtggga tacatgagag aaccaaatgg + 14221 ctttttataa tagttggggg gggcacagtt ctttcaattc tatttgcacc agaactaatt + 14281 gttattttag gcggcaataa atataaggag tcaatttggc tagtacctcc aattgctgtc + 14341 tcggtttatt tcctttttgt atattctatg tttagtaata tcagttttta ttataagatg + 14401 aataagctga tttcgttagt ttccacaggt gcagctcttt caaatattat tttaaattat + 14461 atttttatta atatatttgg gtatcaagct gcagcttaca ctacattatt atgctatata + 14521 ttgttagcat tttctcattt tttcttatat agatttttat taaaaaaaga ggaaattcat + 14581 gaggaacttt ataatatgaa gatgatttta ataatatctt taatattatt aacaatatta + 14641 tttttgatac ttgttattta taacttagcc tttataaggt atgcaattat tgtaattatt + 14701 ttatttcttt tgtttacaaa gagaaataaa ataattacat ccctaaaaag ttgatattga + 14761 aaatttagat tcaaattaag aatatagtgg atatcaaacc agtaataata atgaataatt + 14821 gtttttatgt aatttaggat taataaaaaa ttgaaaggaa atatcaatga aaagagtaat + 14881 tacttatgga acctttgatt ttcttcatta tggacatatc aatttgctaa agagagcgaa + 14941 gcaattagga gattatctca ttgttgtagt ttcaagtgat gagttcaatt tgaaagaaaa + 15001 aataaagttt gttactttaa ttttgaacat agaaaaaatt tagttgaagc 
gataagatat + 15061 gttgatttgg tgattcctga aacaagctgg gaacagaaaa aaacagatat taaagaatat + 15121 cacattgata catttgttat gggggataat tggaaaggaa aatttgatta tttaaaagaa + 15181 gaaggagtgg aggtagttta tttaccaaga actaaagaaa tatctacaac taaaattaaa + 15241 gaagatttag cagattagat tttttacaaa aatattttga gaccagataa taaatttgtt + 15301 tccataatta ttaatgtttt gactatttaa atctcatttt ttaaaaaatt cggattgatt + 15361 aataattaaa aaatctagtt taagatatga aagaaaatta tatccataac tattatattg + 15421 tttgtaatat gtatcgtgat aatgtataag aaattagtag atataaatgt gatatatagc + 15481 taaaactaat attattcatt gctatttaaa atgtagttag aagtaaagca tctaataaac + 15541 ttgaaggtac ataaaaattt agcattaaat tataaaacaa ggtatttttc tgtgaaaatt + 15601 gggtagatat acaataatat ttgtattgtt agagaaagaa ttcttaatat tatattgtaa + 15661 tggaggcatt ttgaattgac taaagtaaga attaattggg tagattttgg gaaaggattt + 15721 gcaatatttt tagttctagt aggacatgta tttattggtt tatatgaatc caataagttt + 15781 tcaattgcaa atgatgtgtt attattccta atagctcaaa tctatatatt tcatatacca + 15841 gtgttttttg cgttatcagg atactttttc agacctgtat cagatttgaa ggagttttgg + 15901 cattatgcta aaaagaaaac cattatttta ggcataccat atatttttta ttcaattatt + 15961 cacttttgtc ttcaaaaggt tgcgggtgcc tctgtccgag tacccactac gatatttaac + 16021 ctattgaata tctataaatt tcctctggga gtttcatggt atctatatac gttatggtcg + 16081 atattgatag tttatggttt actatctgtt gttttcaaaa atcgtaagtc ccttttgtta + 16141 gttagtgttt ttgcctatat tttcacatta tttattcaaa ctgatatttt tattgtgcaa + 16201 cggacgttgg tttgggggat ttgtttcttt cttggcagtg tattgagtga aattcacttt + 16261 gataaaatta atttaaaaaa aattcttttt ttctttgtgt tatttgattt tatttatatg + 16321 ttcgcttggt tcttgtttta tgaagtaggg tctaagaagg attatgtaag ctatagtaac + 16381 ccaggtttgt gggggattgc ttttattgtc tgtgtattag ctgcttttgc gatttttcct + 16441 aaaatggaga aaaattttcc taaaactttc ctatatttca ctaaatacgg gaaagatagt + 16501 ttagggatct atattcttca tgcaccaatt tgtagcatga ttcggattct aatgttgaaa + 16561 gtgggaataa actcagtttt tcttcacgtt gttgttggga ttgtgctagg ctggtattta + 16621 tccatactgg caacttatat attgaaaaaa attccatttt tgaatattgt 
tttattacca + 16681 caaaagtata ttaaattaaa ataaattatt ttagatttat aatgtggctc tttgtcaact + 16741 aacatctgga gaggacaatc actgtcttct ctttttttgt cttttcagaa tataccaaat + 16801 taacacaaaa attctgaaaa ttctgttgac atctttctga aaagagtcta taatggagag + 16861 aaagttttaa aggagaaaat gatgaaaagt tcaaaactac ttgcccttgc gggcgtgaca + 16921 ttattg +// + diff --git a/public/res/serotype_genbank/serotype_11X.gb b/public/res/serotype_genbank/serotype_11X.gb new file mode 100755 index 0000000..0156981 --- /dev/null +++ b/public/res/serotype_genbank/serotype_11X.gb @@ -0,0 +1,836 @@ +LOCUS MK606429 20356 bp DNA linear BCT 30-SEP-2020 +DEFINITION Streptococcus pneumoniae strain GPS_HK_33 cps gene cluster, + complete sequence. +ACCESSION MK606429 +VERSION MK606429.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 20356) + AUTHORS van Tonder,A.J., Gladstone,R.A., Lo,S.W., Nahm,M.H., du Plessis,M., + Cornick,J., Kwambana-Adams,B., Madhi,S.A., Hawkins,P.A., + Benisty,R., Dagan,R., Everett,D., Antonio,M., Klugman,K.P., von + Gottberg,A., Breiman,R.F., McGee,L., Bentley,S.D. and The Global + Pneumococcal Sequencing,C.O. + TITLE Putative novel cps loci in a large global collection of pneumococci + JOURNAL Microb Genom 5 (7) (2019) + PUBMED 31184299 +REFERENCE 2 (bases 1 to 20356) + AUTHORS van Tonder,A.J. + TITLE Direct Submission + JOURNAL Submitted (06-MAR-2019) Parasites and Microbes, Wellcome Sanger + Institute, Wellcome Genome Campus, Hinxton, Cambridge CB10 1SA, + United Kingdom +COMMENT ##Assembly-Data-START## + Assembly Method :: Velvet v. 
1.2 + Sequencing Technology :: Illumina + ##Assembly-Data-END## +FEATURES Location/Qualifiers + source 1..20356 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="GPS_HK_33" + /isolation_source="nasopharyngeal swab" + /host="Homo sapiens" + /db_xref="taxon:1313" + /geo_loc_name="China" + /collection_date="2000" + misc_feature 1..20356 + /note="cps gene cluster" + gene 1..1611 + /gene="dexB" + CDS 1..1611 + /gene="dexB" + /EC_number="3.2.1.70" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3280" + /inference="protein motif:CLUSTERS:PRK10933" + /inference="protein motif:Pfam:PF00128.18" + /inference="protein motif:TIGRFAMs:TIGR02403" + /inference="similar to AA sequence:RefSeq:YP_004326655.1" + /inference="similar to AA sequence:UniProtKB:Q99040" + /note="trehalose-6-phosphate hydrolase; maltooligosyl + trehalose synthase; alpha,alpha-phosphotrehalase; alpha + amylase catalytic domain protein" + /codon_start=1 + /transl_table=11 + /product="glucan 1,6-alpha-glucosidase" + /protein_id="QCO91862.1" + /translation="MQEKWWHNAVVYQVYPKSFMDSNEDGIGDLPGITSKLDYLAKLG + ITAIWLSPVYDSPMDDNGYDIADYQAIAAIFGTMEDMDQLIAEAEKRDIRIIMDLVVN + HTSDEHAWFVEACENPNSPERDYYIWRDEPNDLDSIFSGSAWEYDEKSGQYYLHFFSK + KQPDLNWENEKLRQKIYEMMNFWIDKGIGGFRMDVIDMIGKIPDEKVVNNGPMLHPYL + KEMNQATFGAKDLLTVGETWGATPEIAKLYSDPKGQELSMVFQFEHIGLQYQEGQPKW + HYQKELNIAKLKEIFNKWQTELGVEDGWNSLFWNNHDLPRIVSIWGNDQEYREKSAKA + FAILLHLMRGTPYIYQGEEIGMTNYPFETLDQVEDIESLNYAREALEKGVPIEEIMDS + IRVIGRDNARTPMQWDESKNAGFSTGQPWLAVNPNYEMINVQEALANPDSIFYTYQKL + VQIRKENSWLIRADFELLDTADKVFAYIRKDGDRRFLVVANLSNEEQDLTVEGKVKSV + LIENTAAKEVLEKQVLAPWDAFCVEMTD" + gene 1742..2881 + /gene="tnp" + CDS complement(1742..2881) + /gene="tnp" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF00665.20" + /inference="similar to AA sequence:RefSeq:YP_006065738.1" + /note="integrase core domain protein" + /codon_start=1 + /transl_table=11 + /product="IS1202 transposase" + 
/protein_id="QCO91863.1" + /translation="MLAEEGIQLSDTTVRKILYKENILSPKAHRKTKKRVRKQAKLNP + KQPLDNPILPTAENFLEDPKKVHPSRPRKKFAGELIQMDASPHAWFGAQTSNLHLAID + DASGNILGAYFDKQETLNTYYHVLEQILGNHGVPLQIKTDKRTVFTYQASNSKKMEDD + THTQFGYACHQLGILLETTSIPQAKGRVERLNQTLQSRLPIELERNKIHTLEEANTFL + LSYIQTFNEQFGNKTKLSVFEEAPKPSERNLILARLAERVVDSGHHIRFQNRYYIPTE + QGKEVYFIRKTKALVIKAFDGDIYLNIADKIYRTKELLDYELYSKNFEQEPEQKKKDT + SISLHKPIRGNSHLSNNIFIKIKRIMKSLLVRSLILLNYKYSKMK" + gene 2958..3149 + /gene="tnp" + CDS complement(2958..3149) + /gene="tnp" + /inference="ab initio prediction:Prodigal:2.60" + /inference="similar to AA sequence:RefSeq:YP_003878591.1" + /codon_start=1 + /transl_table=11 + /product="IS transposase" + /protein_id="QCO91864.1" + /translation="MNEVKKYLVIKAIAQGKKTKKRACAELNLSERQINRLLLAYQLK + RKRSLQTRKQKSKTKTCNP" + gene 3326..4771 + /gene="wzg" + CDS 3326..4771 + /gene="wzg" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK09379" + /inference="protein motif:Pfam:PF03816.8" + /inference="protein motif:TIGRFAMs:TIGR00350" + /inference="similar to AA sequence:RefSeq:YP_001835063.1" + /inference="similar to AA sequence:UniProtKB:Q7WY78" + /note="putative transcriptional regulator ywtF; + membrane-bound transcriptional regulator LytR; cell + envelope-related function transcriptional attenuator + common domain; cell envelope-related transcriptional + attenuator domain protein" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Cps14A" + /protein_id="QCO91865.1" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLLFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VDQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + 
EALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + gene 4773..5504 + /gene="wzh" + CDS 4773..5504 + /gene="wzh" + /EC_number="3.1.3.48" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG4464" + /inference="protein motif:Pfam:PF02811.13" + /inference="similar to AA sequence:RefSeq:YP_003878593.1" + /inference="similar to AA sequence:UniProtKB:Q9AHD4" + /note="capsular polysaccharide biosynthesis protein; PHP + domain protein" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein phosphatase wzh" + /protein_id="QCO91866.1" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAEAYRQGMRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEQDLVHVIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPQKIVMDQLI" + gene 5513..6205 + /gene="wzd" + CDS 5513..6205 + /gene="wzd" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3944" + /inference="protein motif:Pfam:PF02706.9" + /inference="protein motif:TIGRFAMs:TIGR01006" + /inference="similar to AA sequence:RefSeq:YP_003724090.1" + /inference="similar to AA sequence:UniProtKB:P72367" + /note="capsular polysaccharide type 8 biosynthesis protein + cap8A; capsular polysaccharide biosynthesis protein; MPA1 + family polysaccharide export protein; chain length + determinant protein" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + wzd" + /protein_id="QCO91867.1" + /translation="MKEQNTIEIDVFQLFKTLWKRKLMILIVALVTGAGAFAYSAFIV + KPEYTSTTRIYVVNRDQGDKPGLTNQDLQAGSYLVKDYREIILSQDVLEKVATNLKLD + MPAKTLASKVQVTVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDVT + TLEEARPATTPSSPNVRRNSLFGFLGGAVVTVSAVLLIELLDTRVKRPEDVEDVLQIP + LLGVVPNLDKMK" + gene 6215..6895 + /gene="wze" + CDS 6215..6895 + /gene="wze" + /EC_number="2.7.10.1" + /EC_number="2.7.10.2" + /inference="ab initio prediction:Prodigal:2.60" + 
/inference="protein motif:Cdd:COG3944" + /inference="protein motif:CLUSTERS:PRK11519" + /inference="protein motif:Pfam:PF01656.17" + /inference="protein motif:TIGRFAMs:TIGR01007" + /inference="similar to AA sequence:RefSeq:YP_002510377.1" + /inference="similar to AA sequence:UniProtKB:Q54520" + /note="tyrosine-protein kinase CpsD; tyrosine kinase; + capsular polysaccharide biosynthesis protein; capsular + exopolysaccharide family protein; CobQ/CobB/MinD/ParA + nucleotide binding domain" + /codon_start=1 + /transl_table=11 + /product="capsule biosynthesis tyrosine-protein kinase + Wze" + /protein_id="QCO91868.1" + /translation="MPTLEISQAKLDFVKKAEEYYNALCTNLQLSGDDLKVFSITSVK + LGEGKSTISTNIAWAFAHAGYKTLLIDGDIRNSVMLGVFKARDKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRKCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGVVLNKFDTSVDKYGSY + GDYGKNKK" + gene 6910..8277 + /gene="wchA" + CDS 6910..8277 + /gene="wchA" + /EC_number="2.7.8.-" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK15204" + /inference="protein motif:Pfam:PF02397.10" + /inference="protein motif:TIGRFAMs:TIGR03025" + /inference="similar to AA sequence:RefSeq:YP_003878596.1" + /inference="similar to AA sequence:UniProtKB:P71241" + /note="putative colanic biosynthesis UDP-glucose lipid + carrier transferase; undecaprenyl-phosphate galactose + phosphotransferase; exopolysaccharide biosynthesis + polyprenyl glycosylphosphotransferase; bacterial sugar + transferase" + /codon_start=1 + /transl_table=11 + /product="galactosyl transferase wchA" + /protein_id="QCO91869.1" + /translation="MNGKIVKSSLAIIQSFLVILLTYLLSAVREAEIVSTTAIALYIL + HYFVFYISDYGQNFFKRGYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYF + LTVHALLVYVLNLFIKWYWKRAYPNFKGSKKILLLTATSRVEKVLDRLIESNEVVGEL + VAVSVLDKPDFQHDCLKVVAEGEIVNFATHEVVDEVFINLPSKKYNIGELVSQFETMG + IDVTVNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHVIAKRIIDIVGALVGLIL + CGLVSIVLLPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + 
QGGMFKVDDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQISGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVFM + RDGAK" + gene 8281..8730 + /gene="wchJ" + CDS 8281..8730 + /gene="wchJ" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF08660.5" + /inference="similar to AA sequence:RefSeq:YP_003875974.1" + /note="Alg14-like oligosaccharide biosynthesis protein" + /codon_start=1 + /transl_table=11 + /product="putative glycosyltransferase enhancer" + /protein_id="QCO91870.1" + /translation="MKICLVGSSGGHLTHLYLLKPFWKDKERFWVTFDKADARSVLSE + EVVYPCYYPTNRNIKNLIKNTFLAYKILKKERPDLIISSGAAIAVPFFYIGKLFGSKT + VYIEVFDRIDAPTITGKLVYPVTDRFIVQWEEMKKIYPKAINLGGIF" + gene 8730..9209 + /gene="wchK" + CDS 8730..9209 + /gene="wchK" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF04101.10" + /inference="similar to AA sequence:RefSeq:YP_003875975.1" + /note="glycosyltransferase family 28 C-terminal domain + protein" + /codon_start=1 + /transl_table=11 + /product="putative glycosyltransferase" + /protein_id="QCO91871.1" + /translation="MIFVTVGTHEQQFDRLIKEFDRLKEENLIQEEVFIQTGYSNYVP + KYCKWEKIISYEKMNQFIEEADTIVTHGGPATFMAIIAKGKTPIVVPRQKKFGEHVND + HQMNFCSKISSEGYELSLINDISELQYSLKQEKKTKFYSNNANFLKQLSKIIEDLIV" + gene 9451..10548 + /gene="wcyK" + CDS 9451..10548 + /gene="wcyK" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK15179" + /inference="protein motif:Pfam:PF00534.14" + /inference="protein motif:TIGRFAMs:TIGR03088" + /inference="similar to AA sequence:RefSeq:YP_003875976.1" + /inference="similar to AA sequence:UniProtKB:A0QWG6" + /note="GDP-mannose-dependent + alpha-(1-2)-phosphatidylinositol mannosyltransferase; Vi + polysaccharide biosynthesis protein TviE; PEP-CTERM/EpsH1 + system-associated sugar transferase; glycosyl transferase + group 1 protein" + /codon_start=1 + /transl_table=11 + /product="putative glycosyltransferase" + /protein_id="QCO91872.1" + 
/translation="MKILHIPTGGLFSDGIGTFIYSYLEYMDLNKYDVTILATNPLLK + SDKEKFEYLGVKVIEIERKKSNLSKYIYKLKKLMKKEKFDIIHVHGSSALMSIELLTA + KIAGIPVRIAHSHNTTCEHHKLDKLLRPIFYRVYTQACACSVSAGQWLFEEKNYEIIH + NARDVNKYQYDAIKRKKLREELLLSDETIALGHVGRFNTQKNQRFLVSLMERLVIKNI + DLKLFLVGTGDTLEEIKKLVIQKKLEDNIVFLGQFDDMKSFVSSMDIMLLPSLYEGLP + LVSVEWQINGVKSILSDRVTQECIYTETVQQLSIDSMELWEKEILNLSTSDRERVSLQ + NIQLIRNAGYDISLEVKEIEELYNSLYDIAN" + gene 10549..11244 + /gene="wcwC" + CDS 10549..11244 + /gene="wcwC" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3955" + /inference="protein motif:Pfam:PF08942.4" + /inference="similar to AA sequence:RefSeq:YP_003875977.1" + /note="exopolysaccharide biosynthesis protein; DUF1919 + protein" + /codon_start=1 + /transl_table=11 + /product="putative acetyltransferase" + /protein_id="QCO91873.1" + /translation="MKGKSFLLKMLQNLKLIKRRLKPIKRKLKPIKRTYKKIVYSITK + SNMRKRLKNTDFSIISDNCWGGRVYEELGLPYRTPFIGLYIFSEDYVKLLKNFKKYME + YELTFTNNSKWNTEYDGEYPIGILNDIEIHFLHYSSMEEAYKKWNKRKKRINYKNIFF + KMNDDNKCSLKLLKEFDTLDLKNKIIFAAFNYKELDNLIHFTNPIGNGNVGADLFYYN + KYFDVVNWLNGEY" + gene 11247..11969 + /gene="wcrL" + CDS 11247..11969 + /gene="wcrL" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3774" + /inference="protein motif:Pfam:PF04488.9" + /inference="similar to AA sequence:RefSeq:YP_003875978.1" + /note="mannosyltransferase OCH1-related enzyme; + glycosyltransferase sugar-binding region" + /codon_start=1 + /transl_table=11 + /product="putative glycosyltransferase" + /protein_id="QCO91874.1" + /translation="MIPKKIHYCWFGGKPLPNDVKRCIASWRKFCPDYEIIEWTEKNF + CIQNQNQFVKDAYKNKAWAFVSDYARLKIVYENGGIYLDTDVEIIKKLDLLLDNTAFF + GVHQVNHLVNTGLGFGAEKGSFILKELLDSYDEVKFDINKKDELLCPELNTQIFKQLG + YVYSNSVIKSQYFTIYPEEYFDPISLGDEVANILSDKTFSIHHYNASWTSLMNRVKRK + IIRKLGRSNVSELKRILKGKTR" + gene 11966..13138 + /gene="wzy" + CDS 11966..13138 + /gene="wzy" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3307" + 
/inference="protein motif:Pfam:PF04932.9" + /inference="similar to AA sequence:RefSeq:YP_003875979.1" + /note="lipid A core O-antigen ligase-related enzyme; + O-antigen ligase" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="QCO91875.1" + /translation="MRISPSKLIFAFFSSFYILVILFPRGIFLGHSTLASRLWIIYKE + SLYLSILLGSIYVILKILSRNIAIHQHAFFILQYYFIVMILTFMLSGSIGDGVQSIFY + PIFIYLFFNEVRDKKSIVLIFDIFLYILTALFVINTIDIFLNFTNIFHVTFLGHVQVI + SQYSILGFLVSAYYLLEEKRNILVAQLLLILTIINCFFSDVSLSKAIALFMIIYIISY + KLKKLFWKRGRKISVITFIASVVMLALVIFGYFLPYLRYFDFTFNGRYQIWRIVYATI + LQVKWFGYGVFGFQFKLPWQELGEIGINYTHNQILQLALDSGIVGIISFFTMIFYMIF + STKNIQNPAIGSLFIFAYFCLFIIMFIESVTYYPYYFIIIVLQTLYLKLERERNVK" + gene 13128..13628 + /gene="wcwT" + CDS 13128..13628 + /gene="wcwT" + /EC_number="2.3.1.-" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG0110" + /inference="protein motif:CLUSTERS:PRK09677" + /inference="protein motif:Pfam:PF00132.18" + /inference="protein motif:TIGRFAMs:TIGR03570" + /inference="similar to AA sequence:RefSeq:YP_003875980.1" + /inference="similar to AA sequence:UniProtKB:Q7A3E8" + /note="putative acetyltransferase SA2342; putative + lipopolysaccharide biosynthesis O-acetyl transferase WbbJ; + isoleucine patch superfamily acetyltransferase; sugar + O-acyltransferase sialic acid O-acetyltransferase NeuD + family protein; Bacterial transferase hexapeptide (six + repeats)" + /codon_start=1 + /transl_table=11 + /product="putative acetyltransferase" + /protein_id="QCO91876.1" + /translation="MLNRLIRNFNKVYYSYRIKRKAAQCSGRVYTGGKTFVTANTYLD + ENVSFNGMSMYGEGKISIGKNFHSGLNCQIITSFHNYDLGDKIPYDESYIHKDVLIED + NVWVGNNVIILGGAIIEEGAIIQAGSTVAGRIPAGAIAGGHPAKPFRFRNMEHYNRLK + RQKKFH" + gene 13638..14825 + /gene="wcwU" + CDS 13638..14825 + /gene="wcwU" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF04464.8" + /inference="similar to AA sequence:RefSeq:YP_003875981.1" + 
/note="CDP-glycerol:poly(glycerophosphate) + glycerophosphotransferase" + /codon_start=1 + /transl_table=11 + /product="putative glycerol phosphotransferase" + /protein_id="QCO91877.1" + /translation="MNIVSYLKKNGITHTLKIINEYKMQELFDSLVSIFTKQKELRDS + IVIECHTDFENNGGAFYDYLINNEYNKKYKIVLLLKDKLSKELPENVDYFYLRKPSLR + KSYVMSLSKFFTFDNDMLRKYRKDQKHFYLTHGCFPLKNTIGKITVPNYVDFVLSPSG + NVDNIIVKQFGLTSKEQCLHTGFPCHDIFYSKTEPLVFLSDYDKKIIWAPTFRKGGGY + NRNDSTASYPLGIPLLGTLDELAHLNTYLSQRDIVLIVKLHPMQDISDLELKQFSHIK + FLTNQNLKRKNINMYQLLMNSDALLSDYSAISYDYLHLDKPIGYVFSDLNDYKLGFSV + DNVDDYIAGDKIMSFNDLLHFIDNIYLEIDKNKEKRKELFNKIFEKQDGESCERLAQI + MEL" + gene 14794..16245 + /gene="wzx" + CDS 14794..16245 + /gene="wzx" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF01943.11" + /inference="similar to AA sequence:RefSeq:YP_003875982.1" + /note="polysaccharide biosynthesis protein" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="QCO91878.1" + /translation="MKDWPKLWNYRRRYEEMSVGMKAALWYTVANFIQKGFVFLSTPI + LTRILNVNDYGTLILYQSWFVLFAIFATLNLSQTAYNKGLVEFENDKDNFTFSLLFLS + KIITIIVAFLYFTFNILVKDSTGLTPGFMIFLFSDILFNISIEFYLARQRFEFKYRKA + VLISISSSFLIVAISTTILLVIKNDLFIKIVLDAIIRIIFGLYCFYLLFFSGRRQLKI + EKKYIKYGLSYSLPLMPHFLSHYILNQSDRLMINMFDGKEKLAIYSLAYSVSMIMFLF + TNAINQSIMPYTFQALKKKDYRGIHGSTKWLFITVGGVTVLSILFAPELIVILGGNKY + KESIWLVPPIAISVYFLFVYSMFSNISFYYKMNKLISLVSTGAALSNIILNYIFINIF + GYQAASYTTLLCYILLAFSHFFLYRFLLKKEEIHEELYNMKMILIISLILLTILFLIL + VIYNLAFIRYAIIVIIVFLLFTKRNKIITSLKS" + gene 16358..16750 + /gene="gct" + CDS 16358..16750 + /gene="gct" + /EC_number="2.7.7.39" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG0615" + /inference="protein motif:CLUSTERS:PRK11316" + /inference="protein motif:Pfam:PF01467.1" + /inference="protein motif:TIGRFAMs:TIGR01518" + /inference="similar to AA sequence:RefSeq:YP_003875983.1" + /inference="similar to AA sequence:UniProtKB:P27623" + /note="glycerol-3-phosphate cytidylyltransferase; + 
bifunctional heptose 7-phosphate kinase/heptose + 1-phosphate adenyltransferase; cytidylyltransferase" + /codon_start=1 + /transl_table=11 + /product="CDP-glycerol-1-phosphate biosynthetic protein + Gct" + /protein_id="QCO91879.1" + /translation="MKRVITYGTFDLLHYGHINLLKRAKQLGDYLIVVVSSDEFNLKE + KNKVCYFNFEHRKNLVEAIRYVDLVIPETSWEQKKTDIKEYHIDTFVMGDDWKGKFDY + LKEEGVEVVYLPRTKEISTTKIKEDLAD" + gene 17168..18196 + /gene="wcjE" + CDS 17168..18196 + /gene="wcjE" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3594" + /inference="protein motif:Pfam:PF01757.16" + /inference="similar to AA sequence:RefSeq:YP_003875984.1" + /note="fucose 4-O-acetylase-related acetyltransferase; + acyltransferase family protein" + /codon_start=1 + /transl_table=11 + /product="putative acetyltransferase" + /protein_id="QCO91880.1" + /translation="MTKVRINWVDFGKGFAIFLVLVGHVFIGLYESNKFSIANDVLLF + LIAQIYIFHIPVFFALSGYFFRPVSDLKEFWHYAKKKTIILGIPYIFYSIIHFCLQKV + AGASVRVPTTIFNLLNIYKFPLGVSWYLYTLWSILIVYGLLSVVFKNRKSLLLVSVFA + YIFTLFIQTDIFIVQRTLVWGICFLLGSVLSEIHFDKINFKKILVFFVLFDFIYMFAW + FLFYEVGSKKDYVSYSNPGLWGIAFIVCVLVAFAIFPKMEKNFPKTFLYFTKYGKDSL + GIYILHAPICSMIRILMLKVGINSVFLHVVVGIVLGWYLSILATYILKKIPFLNIVLL + PQKYIKLK" + gene 18374..20356 + /gene="aliA" + CDS 18374..20356 + /gene="aliA" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG4166" + /inference="protein motif:CLUSTERS:PRK15104" + /inference="protein motif:Pfam:PF00496.16" + /inference="protein motif:TIGRFAMs:TIGR02294" + /inference="similar to AA sequence:RefSeq:YP_001835080.1" + /inference="similar to AA sequence:UniProtKB:P31306" + /note="76 kDa cell surface lipoprotein; oligopeptide ABC + transporter substrate-binding protein OppA; ABC-type + oligopeptide transport system, periplasmic component; + nickel ABC transporter, nickel/metallophore periplasmic + binding protein; Bacterial extracellular solute-binding + proteins, family 5 Middle" + /codon_start=1 + /transl_table=11 + 
/product="oligopeptide ABC transporter + oligopeptide-binding protein AliA" + /protein_id="QCO91881.1" + /translation="MKSSKLFALAGVTLLAATTLAACSGSGSSTKGEKTFSYIYETDP + DNLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKDA + KWYTSEGEEYAAVKAQDFVTGLKYAADKKSDALYLVQESIKGLDAYVKGEIKDFSQVG + IKALDEQTVQYTLNKPESFWNSKTTMGVLAPVNEEFLNSKGDDFAKATDPSSLLYNGP + YLLKSIVTKSSVEFAKNPNYWDKDNVHVDKVKLSFWDGQDTSKPAENFKDGSLTAARL + YPTSASFAELEKSMKDNIVYTQQDSITYLVGTNIDRQSYKYTSKTSDEQKASTKKALL + NKDFRQAIAFGFDRTAYASQLNGQTGASKILRNLFVPPTFVQADGKNFGDMVKEKLVT + YGDEWKDVNLADSQDGLYNPEKAKAEFAKAKSALQAEGVQFPIHLDMPVDQTATTKVQ + RVQSMKQSLEATLGADNVIIDIQQLQKDEVNNITYFAENAAGEDWDLSDNVGWGPDFA + DPSTYLDIIKPSVGESTKTYLGFDSGEDNVAAKKVGLYDYEKLVTEAGDETTDVAKRY + DKYAAAQAWLTDSALIIPTTSRTGRPILSKMVPFTIPFALSGNKGTSEPVLYKYLELQ + DKAVTVDEYQKAQEKWMKEKEESNKKAQEDLAKHVK" +ORIGIN + 1 atgcaagaaa aatggtggca taatgccgta gtctatcaag tctatccaaa gagttttatg + 61 gatagtaatg aagatggaat tggcgatttg ccaggaatta ccagtaagtt ggactatcta + 121 gccaagctag gaatcacagc aatttggctt tctcccgttt atgacagccc tatggatgat + 181 aatggctatg atattgctga ttatcaagcg attgcggcta tttttggaac catggaggat + 241 atggatcaac tgattgcaga agctgagaag cgtgatatcc gtatcatcat ggacttggtg + 301 gtcaatcata cctcggatga gcatgcctgg tttgtagagg cctgtgaaaa tcctaatagc + 361 cctgagcgag attactatat ctggcgggat gagcctaacg atttagattc tatttttagt + 421 ggatctgctt gggaatacga tgaaaaatct ggtcaatact atctccactt tttcagcaag + 481 aaacagccgg atctcaactg ggaaaatgaa aaacttcgcc agaaaattta tgagatgatg + 541 aacttctgga ttgataaggg tattggtggt ttccgtatgg atgttattga catgattggc + 601 aaaattcctg acgagaaggt agtcaataat ggtcctatgc tccatcccta tctcaaggaa + 661 atgaatcagg cgacctttgg agctaaggat ctcttgacag taggggagac ttggggagca + 721 acgccagaga ttgccaagct ctactctgat ccaaaggggc aagaattgtc tatggtcttc + 781 cagtttgaac atatcggtct tcagtatcag gaaggtcaac ctaaatggca ctatcaaaaa + 841 gagctgaata tcgctaagtt aaaagaaatc ttcaacaaat ggcagacaga gttaggagtt + 901 gaggacggct ggaattccct cttctggaac aaccatgacc tccctcgtat tgtctcaatc + 961 tggggaaatg accaagaata 
ccgcgaaaaa tctgccaaag cctttgcaat cttacttcat + 1021 ctcatgagag gaactcctta tatctaccaa ggtgaggaga ttgggatgac caactatccg + 1081 tttgaaacac tggatcaagt agaagatatt gaatctctca actatgcgcg tgaggctctt + 1141 gaaaaaggtg ttccgattga agaaatcatg gacagtatcc gtgttattgg acgtgacaat + 1201 gcccgtaccc ctatgcaatg ggacgagagc aaaaacgctg gtttctcaac aggtcaacct + 1261 tggttggcag ttaatccaaa ttacgagatg atcaacgtcc aagaagcgct ggcaaatcca + 1321 gattctattt tctataccta tcagaaactg gtccaaattc gcaaggagaa tagctggcta + 1381 attcgagctg actttgaatt gcttgatacg gctgataagg tctttgctta tatacgtaag + 1441 gatggcgacc gtcgcttcct agttgtggct aacttgtcca atgaagagca agacttgaca + 1501 gtagaaggaa aagtcaaatc tgtcttgatt gaaaacactg cggctaaaga agtacttgaa + 1561 aaacaggtct tggctccatg ggatgctttc tgtgtggaaa tgactgacta gaatgagcaa + 1621 acctcaagtt tttgaagctt gaggtttttt actatagtgg attgaaacta gaatagtgca + 1681 cctctacttc taaaatattg ttagaaatcg atttgattgt cctgatcgat ttgtcctatt + 1741 cttatttcat tttactatac ttgtagttga ggagaattaa gctcctcact agtaaactct + 1801 tcataatcct ttttattttt atgaagatat tgtttgaaag atgtgagttt ccacggatgg + 1861 gtttgtggag ggatatactt gtgtctttct ttttttgttc tggttcttgt tcaaagtttt + 1921 tcgaatagag ttcataatct agtagctcct ttgtgcgata gattttgtca gcgatattga + 1981 ggtagatgtc tccgtcaaat gcttttataa ctaatgcttt cgtctttctg atgaaataga + 2041 cttcttttcc ttgttcggta gggatatagt aacgattttg gaatcggata tggtgtccac + 2101 tatcgacgac tctctccgcc agtctagcca gaatgagatt tcgttcagag ggcttaggag + 2161 cctcctcaaa aacagagagt tttgtcttgt ttccaaactg ttcattaaag gtttggatgt + 2221 aggaaagcag gaaggtattg gcttcttcca aggtatgaat cttgtttcgt tccagttcga + 2281 taggcaggcg agattgtagt gtctgattaa gtctttcgac tctcccttta gcttgaggga + 2341 tagaggttgt ctccagaaga atccctagtt ggtgacaggc gtatccaaat tgtgtatggg + 2401 tgtcgtcctc cattttctta gagttggagg cttgataggt aaagaccgtt ctcttatctg + 2461 ttttaatttg aaggggaacg ccgtgattgc ctaaaatttg ttcgaggaca tgatagtaag + 2521 tattcaaggt ctcttgttta tcaaaataag cgcctaggat attgccagaa gcatcatcaa + 2581 tggctaagtg taagttagat gtttgtgctc caaaccaggc 
atgagggctg gcatccattt + 2641 gaatgagttc accagcaaat ttctttctgg gtctactagg atgtactttt ttagggtctt + 2701 caaggaagtt ttcagccgtc ggtaagattg gattatctag gggttgcttg gggttcagtt + 2761 tagcttgttt tcttactctc ttctttgtct ttctatgagc cttaggcgac aggatgtttt + 2821 ccttatagag tatttttcta acagttgtat cagagagctg aattccttct tcagctagca + 2881 attcacagaa atgaaggaca tttggtttat atgtttcata ggagaggtat ttttttagga + 2941 gatgttcttt gatttcatca aggattgcat gttttggttt tcgatttctg tttccgtgtc + 3001 tgaaggcttc ttttcctttt cagttgatag gctagtagca gacgattgat ttgcctttca + 3061 gaaagattga gttcggcaca ggctcgtttc tttgttttct ttccttgggc tatagctttt + 3121 atcacaagat attttttcac ttcattcata tttagttgga tccttttcat atgattattc + 3181 taccaaatgg gacattttca cgttcgattt actaaagaca tcatcacctt cgaatcacaa + 3241 agatgcagat agtgaaaata aaggtgtaga cattaccgta aaaaagtgat ataatcgtat + 3301 gatgttcaag gtataggtgt taatcatgag tagacgtttt aaaaaatcac gttcacagaa + 3361 agtgaagcga agtgttaata tcgttttgct gactatttat ttattgttag tttgtttttt + 3421 attgttctta atctttaagt acaatatcct tgcttttaga tatcttaacc tagtggtaac + 3481 tgcgttagtc ctactagttg ccttggtagg gctactcttg attatctata aaaaagctga + 3541 aaaatttact atttttctgt tgctgttctc tatccttgtc agctctgtgt cgctctttgc + 3601 agtacagcag tttgttggac tgaccaatcg tttaaatgcg acttctaatt actcagaata + 3661 ttcaatcagt gtcgctgttt tagcagatag tgatatcgaa aatgttacgc aactgacgag + 3721 tgtgacagca ccgactggga ctgataatga aaatattcaa aaattactag ctgatattaa + 3781 gtcaagtcag aataccgatt tgacggtcga ccagagttcg tcttacttgg cagcttacaa + 3841 gagtttgatt gcaggggaga ctaaggccat tgtcttaaat agtgtctttg aaaatatcat + 3901 cgagtcagag tatccagact acgcatcgaa gataaaaaag atttatacca agggattcac + 3961 taaaaaagta gaagctccta agacgtctaa gaatcagtct ttcaatatct atgttagtgg + 4021 aattgacaca tatggtccta ttagttcggt gtcgcgatca gatgtcaata tcctgatgac + 4081 tgtcaatcga gataccaaga aaatcctctt gaccacaacg ccacgtgatg cctatgtacc + 4141 aatagcagat ggtggaaata atcaaaaaga taaattaacc catgcgggca tttatggagt + 4201 tgattcgtcc attcacacct tagaaaatct ctatggagtg gatatcaatt actatgtgcg + 4261 
attgaacttc acttctttct tgaaaatgat tgacttattg ggaggggtag atgttcataa + 4321 tgatcaagag ttttcagctc tacatgggaa gttccatttc ccagtaggga atgtccatct + 4381 agactctgag caggctctag gttttgtacg tgaacgctac tcactagccg atggagaccg + 4441 tgaccgtggt cgcaaccaac aaaaggtgat tgtggctatc cttcaaaaat taacgtcaac + 4501 cgaagcactg aaaaattata gtacgatcat taatagcttg caagattcta tccaaacaaa + 4561 tatgccactt gagactatga taaatttggt taatgctcag ttagaaagtg gagggaatta + 4621 taaagtaaat tctcaagatt taaaagggac aggtcggacg gatcttcctt cttatgcaat + 4681 gccagacagt aacctctatg tgatggaaat agatgatagt agtttagctg tagttaaagc + 4741 agctatacag gatgtgatgg agggtagatg aaatgataga catccattcg cacatcgtct + 4801 ttgatgtaga tgatggtccc aagtcaagag aggaaagcaa ggctctcttg gcagaagcct + 4861 acagacaggg gatgcgaacc attgtctcta cctctcaccg tcgcaagggc atgtttgaaa + 4921 ctccggaaga gaagatagca gaaaactttc ttcaggttcg ggaaatagct aaggaagtgg + 4981 cgagtgactt ggtcattgct tacggggctg aaatttacta cacaccagat gttctggata + 5041 agctggaaaa aaagcggatt ccgaccctca atgatagtcg ttatgccttg atagagttta + 5101 gtatgaacac tccttatcgc gatattcata gcgccttgag caagatcttg atgttgggaa + 5161 ttactccagt cattgcccac attgagcgct atgatgctct tgaaaataat gaaaaacgcg + 5221 ttcgagaact gatcgatatg ggctgttaca cgcaagtaaa tagttcacat gtcctcaaac + 5281 ccaaactttt tggcgaacgt tataaattca tgaaaaaaag agctcagtat tttttagagc + 5341 aggatttggt tcatgtcatt gcaagtgata tgcacaatct agacggtaga cctcctcata + 5401 tggcagaagc atatgacctt gttacccaaa aatacggaga agcgaaggct caggaacttt + 5461 ttatagacaa tcctcaaaaa attgtaatgg atcaactaat ttaggagaaa tgatgaaaga + 5521 acaaaacacg atagaaatcg atgtatttca attatttaaa accttgtgga aacgcaagct + 5581 aatgatttta atagtggcac ttgtgacagg tgcgggggct tttgcatata gcgcttttat + 5641 tgttaagcca gaatatacga gtactacgcg aatttacgta gtgaatcgcg atcaaggaga + 5701 caagccgggg ctgacaaatc aggatttgca ggcaggatct tatctggtaa aagactaccg + 5761 tgagattatc ctttcgcagg atgtattgga aaaagtagcg acaaatttga agttggatat + 5821 gccagcaaaa acgttagcca gcaaagttca agtgactgta ccagctgaca ctcgtatcgt + 5881 ctcaatctct gtcaaagata 
aacagccaga agaagccagt cgtatcgcta attctctacg + 5941 agaagttgct gcagaaaaga tcgtcgctgt aacgcgagta tctgatgtaa cgacacttga + 6001 agaagcgcga ccagctacga ctccctcttc tccaaatgtt cgacgcaatt ccttgtttgg + 6061 ttttcttgga ggagcagtcg taacagtaag tgctgttctt ttgattgagt tgctcgacac + 6121 ccgtgtgaaa cgtcctgaag atgtcgaaga tgtactgcaa attccacttt taggggtcgt + 6181 tccaaatttg gacaaaatga aataggagga agttatgcca acattagaaa tctcacaggc + 6241 aaaattggat tttgtaaaaa aggcagagga atattataac gctttgtgca cgaacctaca + 6301 gttaagtgga gatgatttga aagtattttc tatcacttct gtgaaactag gagaaggaaa + 6361 atcaacgatt tccaccaata tcgcttgggc ttttgcgcat gcaggttaca aaacgctgct + 6421 gattgatgga gatattcgca attctgttat gttaggtgtc tttaaagcaa gggataagat + 6481 tacaggcctg acagaatttt tatcaggaac tacagatcta tcacaagggc tttgtgatac + 6541 caatatcgaa aatctctttg taattcaggc tggctctgtg tcaccgaatc cgacagctct + 6601 tcttcaaagt aagaatttca gtacaatgct tgaaaccttg cgtaaatatt ttgactacat + 6661 cattgtagat actgctcctg tcggtgtcgt gattgatgcg gctattatta cgcgaaaatg + 6721 cgatgcttct attttagtga cggaggcagg tgaaataaat cgacgggata ttcaaaaagc + 6781 aaaagaacag ttggaacaca cagggaagcc gtttttggga gttgtgttga ataaattcga + 6841 tacttcagta gacaaatacg gttcttatgg agattacggg aaaaataaaa aataggtcgg + 6901 aggacagaga tgaatggaaa aatagtaaag tcttcattgg ctataatcca gagttttctt + 6961 gttattttat tgacttatct ccttagtgct gtgagagaag cggagattgt ttcaacaaca + 7021 gctattgcac tttatatcct ccattatttt gtcttttata ttagtgatta tggacagaat + 7081 ttctttaaaa ggggatattt gattgaactt gtccagacat tgaaatatat cctattcttt + 7141 gcactagcga ttagtatttc taattttttc ttagaggatc gatttagtat ttccagacga + 7201 ggcatgattt acttcctcac agtacatgct ctcttagtct atgtgctaaa cctatttatc + 7261 aagtggtatt ggaagcgggc ttatcccaac tttaaaggaa gtaagaagat tctcctactt + 7321 acagcaactt ctcgtgtcga aaaggtactg gatagattaa tagaatcaaa tgaggttgtt + 7381 ggggagttgg tagctgtcag tgtcttagat aaaccagatt ttcagcatga ttgtttaaag + 7441 gtagtagcag agggggagat agtaaacttt gcgactcatg aggtggtcga tgaagtcttt + 7501 atcaatcttc caagtaaaaa atacaatatt ggagagcttg 
tctctcagtt tgaaacgatg + 7561 ggaattgatg taacagttaa tctaaatgct tttgatcgta gtttggcacg taacaagcaa + 7621 attcgtgaga tggcaggatt aaacgttgtg actttttcta caacatttta taagactagt + 7681 catgtaattg ctaagcggat tattgatatc gtgggtgcat tggtagggct gatactatgt + 7741 ggtttagtca gtattgtatt gcttcctttg attcgaaagg atgggggctc tgctattttt + 7801 gctcagacgc gtataggaaa aaatggtcgt cagttcactt tttataagtt tcgctctatg + 7861 tgtgtagatg ccgaggcgaa aaaaagagaa ctcatggaac aaaataccat gcagggtgga + 7921 atgtttaagg tggacgatga tcctcgtatc acgaaaattg gtcgttttat acggaagact + 7981 agcttggacg agctaccaca gttttataat gttctaaagg gagatatgag tttggttggc + 8041 acacggccac cgacagtgga cgagtatgaa cactataccc cagaacaaaa acgtcggcta + 8101 agttttaaac ctggtataac aggcttatgg cagatcagtg gacgaagtga gattaagaat + 8161 tttgatgaag ttgtcaaatt agatgtagcc tatatagacg attggacaat ttggaaagac + 8221 attgaaattt tattgaagac agttaaagtt gtatttatga gagacggagc gaagtaggaa + 8281 atgaaaatat gtttagttgg atctagtgga ggtcatctga ctcatttata tcttttaaaa + 8341 cctttctgga aagataaaga aagattttgg gttacttttg ataaggcgga cgctcggagt + 8401 gtactctctg aggaagttgt atatccctgt tattatccaa ccaatcgtaa tataaaaaat + 8461 ttaataaaaa atacttttct cgcctataaa attttaaaaa aagagagacc agatttgatt + 8521 atttcttctg gtgccgctat cgctgttcct ttcttttata ttgggaagtt atttggatca + 8581 aagacagtgt atatagaagt gtttgataga attgatgctc caacaataac gggaaaactt + 8641 gtttatccag taacggatag gtttattgtt caatgggaag aaatgaaaaa aatttatccg + 8701 aaagcaatta atctaggagg aatattctga tgatttttgt tactgtaggg acacatgaac + 8761 aacaatttga tcgtttgata aaagaatttg atcgtttgaa agaagagaat ctaattcaag + 8821 aggaagtatt tattcaaaca ggatattcta attatgtccc aaaatattgt aaatgggaaa + 8881 aaataatatc ttatgaaaaa atgaatcagt ttattgagga agctgataca attgttaccc + 8941 atggtggtcc agcaactttt atggcaatta ttgctaaagg aaaaactcca atagttgttc + 9001 cgaggcaaaa gaaatttggg gagcatgtga atgatcatca gatgaatttt tgttctaaaa + 9061 tatcctctga agggtatgaa ttatctctga ttaacgatat aagcgaattg cagtatagtt + 9121 taaagcaaga aaagaaaact aaattttact ctaataatgc aaattttctt aagcagttat + 9181 
caaaaataat tgaagattta atagtataaa atgagattgt ttcttcttat tgcagatgaa + 9241 ttagaaataa atcaggttgt gagtaaagca acagtgccaa agtgtatttg taattaagaa + 9301 taaaataaac accatttcaa tatctgaaaa taattctcaa ggcatagttt gaattatgga + 9361 tatagattat tttgctaagt cttctaatcg atttataagt taaggcagta acattattaa + 9421 aatcatagat agaagtaagg agggaactaa atgaaaatac tacatattcc aacgggtggt + 9481 ttattttctg atggtatagg aacttttatt tattcatatt tggagtatat ggacttaaac + 9541 aagtatgatg tgacaatttt agccactaat cctcttttga aaagtgataa ggaaaaattt + 9601 gaatatttag gggttaaagt tattgaaatt gaaaggaaaa aatcaaacct ttctaaatat + 9661 atatacaaat tgaaaaaatt aatgaaaaaa gaaaaatttg atattataca tgttcacgga + 9721 agtagcgctt taatgtcaat tgaattactg actgctaaaa ttgctggtat cccagttcga + 9781 attgcccata gccataacac tacttgtgag catcataaac tagataaact actacgaccg + 9841 atattttatc gagtttatac tcaggcatgt gcttgcagtg ttagtgctgg tcagtggctt + 9901 tttgaggaaa aaaattatga gattatccat aacgctagag atgtaaataa gtatcagtat + 9961 gatgccataa aacgaaaaaa acttagagaa gaattgttac tgtctgatga gactattgct + 10021 ctaggtcatg ttggacgttt taatactcaa aaaaatcaac gttttctagt gtctctgatg + 10081 gaaagattag tgatcaaaaa tatagattta aaattatttt tagtagggac gggtgatact + 10141 ttagaagaaa tcaagaaatt agtcattcag aaaaaactag aagataatat tgttttttta + 10201 ggtcaatttg atgatatgaa atcttttgtg tcatcaatgg atataatgtt acttccaagt + 10261 ttatatgaag ggttaccact agtatctgtt gaatggcaaa taaacggagt aaaaagtatc + 10321 ctatctgacc gtgttacaca agagtgtatc tatacagaaa ctgttcaaca attatctatc + 10381 gatagtatgg aattatggga aaaagaaatt ttaaatttat ctacttcaga tagagaaaga + 10441 gtgtcattgc aaaatattca gttaataaga aatgcaggct atgatatttc tttagaagtt + 10501 aaagaaatag aagaattata taattcactt tatgatattg cgaattgaat gaaaggaaag + 10561 agttttcttt tgaagatgtt acaaaattta aaactaataa aacggagatt aaaaccaata + 10621 aaacggaaat taaaaccaat taagagaact tataagaaaa tagtttattc tatcactaag + 10681 tcaaatatga ggaagaggct caaaaataca gatttttcaa ttatcagtga taattgctgg + 10741 ggaggacggg tatatgaaga attgggtctg ccgtatagaa caccatttat aggtctgtat + 10801 attttttctg 
aggattatgt gaagctgttg aaaaacttca aaaagtatat ggaatatgag + 10861 ctaacgttta ccaataattc aaaatggaac acagaatatg acggggagta tcctataggt + 10921 attctcaatg atatagaaat tcatttttta cattattcta gcatggaaga agcatataaa + 10981 aaatggaata aaagaaaaaa aagaattaat tataaaaata ttttttttaa gatgaatgat + 11041 gataataaat gttctttgaa attgcttaag gaatttgata ctttggattt gaaaaataaa + 11101 attatttttg ctgcattcaa ttataaagaa ctagataatc ttattcattt taccaatcct + 11161 ataggtaatg gaaatgtagg tgcagaccta ttttattata ataaatactt tgatgttgtt + 11221 aattggttga atggagagta ctaagtatga tacctaaaaa aattcattat tgttggtttg + 11281 gtggcaaacc attaccaaat gatgtgaaac gatgtatagc tagttggaga aagttttgtc + 11341 ccgactatga aattattgaa tggactgaaa aaaatttttg tattcaaaat caaaatcaat + 11401 ttgtaaaaga tgcgtataaa aataaggcat gggcttttgt tagcgactat gctagactca + 11461 aaattgttta tgaaaatgga ggtatctatt tagatactga tgttgagatt attaaaaagc + 11521 tagatttgtt actggataac acagcattct ttggtgttca tcaagttaat catctagtta + 11581 atacaggatt aggttttggg gctgaaaagg ggtcattcat tttaaaagaa ttattagatt + 11641 cttatgatga agtgaaattt gatattaaca agaaagacga gctattatgt ccagaattaa + 11701 acacgcaaat atttaaacaa ctaggttatg tttattctaa ttcagttata aaaagtcaat + 11761 atttcacaat ctatcccgaa gaatacttcg atcccatttc attgggagat gaagttgcta + 11821 atattttatc agataaaaca ttttctattc atcattataa tgcatcttgg acttccttga + 11881 tgaatcgggt gaagagaaaa ataattcgta aactaggtag aagtaatgtc tcggagttaa + 11941 aaagaatatt aaaggggaaa actagatgag aatatcacca tcgaagctga tatttgcatt + 12001 ttttagcagt ttttatattc ttgtaatcct tttcccgaga ggaattttcc tagggcattc + 12061 tactttagct tctcgtttat ggattattta caaagaaagt ttatatctat caatactact + 12121 tggttcaata tatgttattt taaaaatatt atctcgaaat atcgccattc atcagcatgc + 12181 tttttttatc ttacaatatt attttattgt aatgatttta acttttatgt taagtgggtc + 12241 aatcggtgat ggggtacaat cgattttcta tccaatattc atctatttgt tttttaatga + 12301 agttcgagat aagaaatcaa tagtgttaat ttttgatata tttctttata tacttaccgc + 12361 tttattcgtt atcaatacga ttgatatttt tctgaatttc acaaatattt ttcatgttac + 12421 ttttttagga 
catgttcagg tgatttccca atatagtatt ctcggatttc tcgtatcagc + 12481 ttattatcta ttagaagaaa agaggaatat attagtcgca cagttgctgt tgattttaac + 12541 gattatcaat tgtttttttt cagatgtctc tctctctaaa gctattgctt tgtttatgat + 12601 tatttatatt atttcataca agttaaaaaa actattttgg aaaagaggaa ggaagatatc + 12661 tgttataact tttattgcat ctgttgtgat gttagcatta gtgatttttg gatatttttt + 12721 accatatctt agatattttg attttacttt taatggtcga taccaaattt ggcgcattgt + 12781 gtatgccacc attcttcaag tgaaatggtt tggatatggt gtgtttggct ttcaatttaa + 12841 acttccgtgg caggaattgg gagaaattgg aataaattat actcataatc aaattttaca + 12901 gttagcactt gatagtggca ttgttgggat tatctcattc tttactatga ttttttatat + 12961 gatcttttca actaaaaata ttcaaaatcc cgcaataggc tccctattta tttttgccta + 13021 tttttgtcta tttattataa tgtttataga gagtgttact tattatccat actattttat + 13081 tataatagtt cttcaaactt tgtacttaaa attggaaaga gaaagaaatg ttaaatagat + 13141 tgataagaaa ttttaataaa gtatattata gttatcgtat aaaaagaaag gccgcacaat + 13201 gcagtgggag agtgtatacg ggaggcaaaa cgtttgttac tgcaaatacg taccttgatg + 13261 aaaatgtttc atttaatggt atgtcaatgt atggtgaagg gaaaataagc attggtaaaa + 13321 attttcattc aggattaaat tgccaaatta tcacttcctt tcataattat gacttgggtg + 13381 ataaaattcc ttatgatgag agttacatac ataaagacgt cttaattgaa gataacgttt + 13441 gggtagggaa taatgtgata attttaggtg gtgcgattat tgaggaaggt gcaatcattc + 13501 aagcaggaag tacagttgct ggaagaattc cagcaggtgc gattgcaggt ggacatccgg + 13561 caaaaccatt cagatttaga aatatggaac attataatcg gcttaaacgg caaaaaaaat + 13621 ttcattagag gttaagaatg aatattgtaa gttatctaaa aaaaaacggt attacacata + 13681 ctttaaaaat tattaatgaa tataaaatgc aagagctgtt tgatagtctt gttagtattt + 13741 ttacaaagca gaaggaactt cgtgacagta ttgtcattga atgtcatact gattttgaga + 13801 ataatggtgg tgcgttctat gactatctaa tcaataatga gtataacaaa aaatataaaa + 13861 ttgtcttact attgaaggat aaattatcta aagaattacc agaaaatgta gattattttt + 13921 atttaagaaa gcccagttta cgaaaatcct acgtaatgtc attaagtaaa ttctttactt + 13981 ttgataatga tatgcttcgt aaatatagaa aagatcaaaa acacttttat ttaacacatg + 14041 gatgctttcc 
tttaaaaaat acaataggta aaataacagt tccgaattat gttgattttg + 14101 ttctatctcc atcgggcaat gtagataata ttatagttaa gcagtttgga ttaacatcta + 14161 aagagcaatg tcttcacact ggatttccgt gtcatgatat cttttattca aaaacagaac + 14221 ctctagtatt tttatctgat tatgataaaa aaattatctg ggcaccaact tttagaaagg + 14281 gtggtggcta taatagaaat gatagtacag ctagctatcc tttaggtatt ccattacttg + 14341 gaacactaga tgaacttgca cacctaaaca catatctaag ccaacgggat attgtcctga + 14401 ttgtaaagtt acatccaatg caagatattt cagatttgga gttgaaacaa tttagtcata + 14461 ttaagtttct gacaaatcaa aatctgaaac gtaaaaatat aaatatgtat caattgctga + 14521 tgaattcaga tgctttactt agtgactatt ctgcaatctc gtatgattat ttacatcttg + 14581 ataaaccaat agggtatgtt ttttcagatc taaatgatta taagttgggg ttttcagttg + 14641 ataatgtaga tgattacata gcaggtgata agataatgtc ttttaacgac ttgctgcact + 14701 ttattgataa catttatcta gaaattgata aaaataaaga aaaacgcaag gaattattta + 14761 ataaaatatt tgaaaaacag gatggagaat cgtgtgaaag attggcccaa attatggaat + 14821 tataggagac gttacgaaga aatgtctgtt gggatgaaag cggcactctg gtatactgtt + 14881 gcaaatttta ttcaaaaggg ttttgtattt ctttcaactc cgattttaac cagaatactt + 14941 aatgttaatg attacggtac attgatactt taccaatcat ggtttgtact atttgctatt + 15001 tttgctacct tgaatctttc tcaaacagct tataataagg gattagtaga atttgagaat + 15061 gataaagata attttacatt ttctttgttg tttttgtcta agattattac gataattgtt + 15121 gcttttttgt attttacttt taatatactg gttaaagata gtactggatt aactcccggt + 15181 ttcatgatat ttttattcag tgatatttta tttaatatta gtatagaatt ttatttggca + 15241 cgtcagagat ttgaattcaa atatagaaaa gcagttctaa tttcaatttc ttcaagtttt + 15301 ttaattgtag ctattagtac aactatctta ttagtgatta agaatgattt attcattaaa + 15361 attgtattag atgctattat ccgaattatc tttggtttat attgttttta tctcttgttt + 15421 ttttcaggga gaaggcaact taagatagaa aaaaaatata ttaaatatgg tttgagttat + 15481 tcattacctt tgatgccgca tttcttatcg cactatattt tgaatcagtc tgatcgtttg + 15541 atgattaaca tgtttgatgg taaggagaaa ttagctatat atagtctagc ttattctgta + 15601 tcaatgatta tgtttttgtt tactaatgca attaatcaat caataatgcc gtatacattt + 15661 caagctttga 
aaaaaaagga ttatcgtggg atacatggga gcaccaaatg gctttttata + 15721 acagttgggg gagtcacagt tctctcaatt ctatttgcac cagaactaat tgttatttta + 15781 ggcggcaata aatataagga atcaatttgg ctagtacctc caattgctat ctcggtttat + 15841 ttcctttttg tgtattctat gtttagtaat atcagttttt attataagat gaataaactg + 15901 atttcgttag tttccacagg tgcagctctt tcaaatatta ttttaaatta tatttttatt + 15961 aatatatttg ggtatcaagc tgcatcttac actacattat tatgctatat attgttagca + 16021 ttttctcatt ttttcttata tagattttta ttaaaaaaag aggaaattca tgaggaactt + 16081 tataatatga agatgattct aataatatct ttaatattat taacaatact atttttgata + 16141 cttgttattt ataacttagc ctttataagg tatgcaatta ttgtaattat tgtatttctt + 16201 ttgtttacaa agagaaataa aataattaca tccctaaaaa gttgatattg aaaatttaga + 16261 ttcaaattaa gaatatagtg gatatcaaac cagtaataat aatgaataat tgtttttatg + 16321 taatttggga ttaataaaaa attgaaagga aatatcaatg aaaagagtga ttacttatgg + 16381 aacctttgat ttgcttcatt atggacatat caatttgcta aagagagcga agcaattagg + 16441 agattatctc attgttgtag tttcaagtga tgagttcaat ttgaaagaaa aaaataaagt + 16501 ttgttacttt aattttgaac atagaaaaaa tttggttgaa gcgataagat atgttgattt + 16561 ggtgattcct gaaacaagct gggaacagaa aaaaacagat attaaagaat atcacattga + 16621 tacatttgtt atgggggatg attggaaagg aaaatttgat tatttaaaag aagaaggagt + 16681 ggaagtagtt tatttaccaa gaactaaaga aatatctaca actaaaatta aagaagattt + 16741 agcagattag attttttaca aaaatatttt gagatcagat aataaatttg tttccataat + 16801 tattaatgtt ttgactattt aaatctcatt ttttaaaaaa ttcggattga ttaataataa + 16861 aaaaatctag tttaagatat gaaagaaaat tatatccata actattatat tgtttgtaat + 16921 atgtatcgtg ataatgtata agaaattagt agatataaat gtgatatata gctaaaacta + 16981 atattattca ttgctattta aaatgtagtt agaagtaaag catctaataa acttgaaggt + 17041 acataaaaat ttagcattaa attataaaac aaggtatttt tctgtgaaaa ttgggtagat + 17101 atacaataat atttgtattg ttagagaaag aattcttaat attatattgt aatggaggca + 17161 ttttgaattg actaaagtaa gaattaattg ggtagatttt gggaaaggat ttgcaatatt + 17221 cttagttcta gtagggcatg tatttattgg tttatatgaa tccaataagt tttcaattgc + 17281 aaatgatgtg 
ttattattcc tgatagctca aatctatata tttcatatac cagtgttttt + 17341 tgcgttatca ggatactttt tcagacctgt atcagatttg aaggagtttt ggcattatgc + 17401 taaaaagaaa accattattt taggcatacc atatattttt tattcaatta ttcacttttg + 17461 tcttcaaaag gttgcgggtg cttctgtccg agtacccact acgatattta acctattgaa + 17521 tatctataaa tttcctctgg gagtttcatg gtatctatat acgttatggt cgatattgat + 17581 agtttatggt ttactatctg ttgttttcaa aaatcgtaag tcccttttgt tagttagtgt + 17641 ttttgcctat attttcacac tatttattca aactgatatt tttattgtgc aacggacgtt + 17701 ggtttggggg atttgtttcc ttcttggcag tgtattgagt gaaattcact ttgataaaat + 17761 taattttaaa aaaattcttg ttttctttgt gttatttgat tttatttata tgttcgcttg + 17821 gttcttgttt tatgaagtag gatctaagaa ggattatgta agctatagta acccaggttt + 17881 gtgggggatt gcttttattg tctgtgtatt agttgctttt gcgatttttc ctaaaatgga + 17941 gaaaaatttt cctaaaactt tcctatattt cactaaatac gggaaagata gtttagggat + 18001 ctatattctt catgcaccaa tttgtagcat gattcggatt ctaatgttga aagtgggaat + 18061 aaactcagtt tttcttcacg ttgttgttgg gattgtgcta ggctggtatt tatccatact + 18121 ggcaacttat atattgaaaa aaattccatt tttgaatatt gttttattac cacaaaagta + 18181 tattaaatta aaataaatta ttttagattt ataatgtggc tctttgtcaa ctaacatctg + 18241 gagaggacaa tcactgtctt ctcttttttt gtcttttcag aatataccaa attaacacaa + 18301 aaattctgaa aattctgttg acatctttct gaaaagagtc tataatggag agaaagcttt + 18361 aaaggagaaa atgatgaaaa gttcaaaact atttgccctt gcgggcgtga cattattggc + 18421 ggcgactact ttagctgcat gctctggatc aggttcaagc actaaaggtg agaagacatt + 18481 ctcatacatt tatgagacag accctgataa cctcaactat ttgacaactg ctaaggctgc + 18541 gacagcaaat attacaagta acgtggttga tggtttgcta gaaaatgatc gctacgggaa + 18601 ctttgtgccg tctatggctg aggattggtc tgtatccaag gatggattga cttacactta + 18661 tactatccgt aaggatgcaa aatggtatac ttctgaaggt gaagaatacg cggcagtcaa + 18721 agctcaagac tttgtaacag gactaaaata tgctgctgat aaaaaatcag atgctcttta + 18781 ccttgttcaa gaatcaatca aagggttgga tgcctatgta aaaggggaaa tcaaagattt + 18841 ctcacaagta ggaattaagg ctctggatga acagacagtt cagtacactt tgaacaaacc + 18901 agaaagcttc 
tggaattcta agacaaccat gggtgtgctt gcgccagtta atgaagagtt + 18961 tttgaattca aaaggagatg attttgccaa agctacggat ccaagtagtc tcttgtataa + 19021 cggtccttat ttgttgaaat ccattgtgac caaatcctct gttgaatttg cgaaaaatcc + 19081 gaactactgg gataaggaca atgtgcatgt tgacaaagtt aaattgtcat tctgggatgg + 19141 tcaagatacc agcaaacctg cagaaaactt taaagatggt agccttacag cagctcgtct + 19201 ctatccaaca agtgcaagtt tcgcagagct tgagaagagt atgaaggaca atattgtcta + 19261 tactcaacaa gactctatta cgtatctagt tggtacaaat attgaccgtc agtcctataa + 19321 atacacatct aagaccagcg acgaacaaaa ggcatcgact aaaaaggctc tcttaaacaa + 19381 ggatttccgt caggctattg cctttggatt tgaccgtaca gcctatgcct ctcagttgaa + 19441 tggacaaact ggagcaagta aaatcttgcg taatctcttt gtgccaccaa catttgttca + 19501 agcagatggt aaaaactttg gcgatatggt caaagagaaa ttggtcactt atggggatga + 19561 atggaaggat gttaatcttg cagattctca ggatggtctt tacaatccag aaaaagccaa + 19621 ggctgaattt gctaaagcta aatcagcctt acaagcagaa ggagtccaat tcccaattca + 19681 tttggatatg ccagttgacc agacagcaac tacaaaagtt cagcgcgtcc aatctatgaa + 19741 acaatccttg gaagcaactt taggagctga taatgtcatt attgatattc aacaactaca + 19801 aaaagacgaa gtaaacaata ttacatattt tgctgaaaat gctgctggcg aagactggga + 19861 tttatcagat aatgtcggtt ggggtccaga ctttgccgat ccatcaacct accttgatat + 19921 tatcaaacct tctgtaggag aaagtactaa aacatattta gggtttgact caggggaaga + 19981 taatgtagct gctaaaaaag taggtctata tgactacgaa aaattggtta ctgaggctgg + 20041 tgatgagact acagatgttg ctaaacgcta tgataaatac gctgcagccc aagcttggtt + 20101 gacagatagt gctttgatta ttccaactac atctcgtaca gggcgtccaa tcttgtctaa + 20161 gatggtacca tttacaatac catttgcatt gtcaggaaat aaaggtacaa gtgaaccagt + 20221 cttgtataaa tacttggaac ttcaagacaa ggcagtcact gtagatgaat accaaaaagc + 20281 tcaggaaaaa tggatgaaag aaaaagaaga gtctaataaa aaggctcaag aagatctcgc + 20341 aaaacatgtg aaataa +// + diff --git a/public/res/serotype_genbank/serotype_12A.gb b/public/res/serotype_genbank/serotype_12A.gb new file mode 100644 index 0000000..83bbae3 --- /dev/null +++ b/public/res/serotype_genbank/serotype_12A.gb 
@@ -0,0 +1,1198 @@ +LOCUS CR931658 27104 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 559/66 (serotype 12a). +ACCESSION CR931658 +VERSION CR931658.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 27104) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 27104) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..27104 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="559/66" + /db_xref="taxon:1313" + gene <1..163 + /gene="dexB" + /locus_tag="SPC12A_0001" + CDS <1..163 + /gene="dexB" + /locus_tag="SPC12A_0001" + /codon_start=2 + /transl_table=11 + /protein_id="CAI33214.1" + /db_xref="GOA:Q4K2R1" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K2R1" + /translation="DRRFLVVANLSNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVP + WDAFCVELL" + gene 322..490 + /gene="aliB" + /locus_tag="SPC12A_0002" + /pseudo + CDS 322..490 + /gene="aliB" + /locus_tag="SPC12A_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(order(491..1024,1026..1232,2935..3060)) + /gene="tnp" + /locus_tag="SPC12A_0003" + /pseudo + CDS complement(join(491..1024,1026..1232,2935..3060)) + /gene="tnp" + /locus_tag="SPC12A_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(order(962..1024,1026..1232,2935..3042)) + /gene="tnp" + /locus_tag="SPC12A_0003" + /note="HMMPfam hit to PF01710, Transposase, score 3e-20" + /pseudo + gene complement(1423..2769) + /gene="tnp" + /locus_tag="SPC12A_0004" + CDS complement(1423..2769) + /gene="tnp" + /locus_tag="SPC12A_0004" + /note="member of homology group 225" + /codon_start=1 + /transl_table=11 + /product="putative IS1380-Spn1 transposase" + /protein_id="CAI33217.1" + /db_xref="GOA:Q97CV5" + /db_xref="InterPro:IPR002559" + /db_xref="InterPro:IPR012337" + /db_xref="UniProtKB/TrEMBL:Q97CV5" + /translation="MNSLPNHHFQNKSFYQLSFDGGHLTQYGGLIFFQELFSQLKLKE + RISKYLVTNDQRRYCRYSDSDILVQFLFQLLTGYGTDYACKELSADAYFPKLLEGGQL + ASQPTLSRFLSRTDEETVHSLRCLNLELVEFFLQFHQLNQLIVDIDSTHFTTYGKQEG + VAYNAHYRAHGYHPLYAFEGKTGYCFNAQLRPGNRYCSEEADSFITPVLERFNQLLFR + MDSGFATPKLYDLIEKTGQYYLIKLKKNTVLSRLGDLSLPCPQDEDLTILPHSAYSET + 
LYQAGSWSHKRRVCQFSERKEGNLFYDVISLVTNMTSGTSQDQFQLYRGRGQAENFIK + EMKEGFFGDKTDSSTLIKNEVRMMMSCIAYNLYLFLKHLAGGDFQTLTIKRFRHLFLH + VVGKCVRTGRKQLLKLSSLYAYSELFSALYSRIRKVNLNLPVPYEPPRRKASLMMH" + misc_feature complement(1672..2340) + /gene="tnp" + /locus_tag="SPC12A_0004" + /note="HMMPfam hit to PF01609, Transposase DDE domain, + score 6.9e-24" + gene 3265..4719 + /gene="wzg" + /locus_tag="SPC12A_0005" + CDS 3265..4719 + /gene="wzg" + /locus_tag="SPC12A_0005" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33218.1" + /db_xref="GOA:Q4JYN0" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4JYN0" + /translation="MLIMSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNI + FAFRYLNLVVTVLVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGL + TNRLNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNT + DLTVNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKV + EAPKTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPI + ADGGNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVH + NDQEFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKL + TSTEALKNYSTIIDSLQNSIQTNMPLETMINLVNAQLESGGSYKVNSQDLKGTGRMDL + PSYAMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 3265..3402 + /gene="wzg" + /locus_tag="SPC12A_0005" + /note="Signal peptide predicted for SPC0545 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 46 and 47" + misc_feature 3478..3825 + /gene="wzg" + /locus_tag="SPC12A_0005" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 2.3e-64" + misc_feature 4003..4446 + /gene="wzg" + /locus_tag="SPC12A_0005" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 5.7e-70" + gene 4721..5452 + /gene="wzh" + /locus_tag="SPC12A_0006" + CDS 4721..5452 + /gene="wzh" + /locus_tag="SPC12A_0006" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + 
/transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33219.1" + /db_xref="GOA:Q4JYM9" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4JYM9" + /translation="MIDIHSHIVFDVDDGPKSREESKALLVEAYRQGVRTIVSTSHRR + KGMFETPEEKIEENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKSKLFGERYKFMKKRAQYFLEQDLVHAIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 4724..5332 + /gene="wzh" + /locus_tag="SPC12A_0006" + /note="HMMPfam hit to PF02811, PHP domain, score 7.8e-36" + gene 5458..6153 + /gene="wzd" + /locus_tag="SPC12A_0007" + CDS 5458..6153 + /gene="wzd" + /locus_tag="SPC12A_0007" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33220.1" + /db_xref="GOA:Q4JYM8" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4JYM8" + /translation="MMKEQNTIEIDVFQLFKTLWKRKLMILLVALVTGAGAFAYSAFI + VKPEYTSTTRIYVVNRDQGDKSGLTNQDLQAGTYLVKDYREIILSQNVLEKVATNLKL + DIPAKTLARKVQVTVPVDTRIVSISVKDKQPEEASRIANSLREVAAEKIIAVTRVSDV + TTLEEARPATTPSSPNVRLNSLFGFFGGAVVTVIAVLLIELFDIRVKRPEDVEDVLQI + PLLGVVPDLNKMK" + misc_feature 5458..5574 + /gene="wzd" + /locus_tag="SPC12A_0007" + /note="Signal peptide predicted for SPC0547 by SignalP 2.0 + HMM (Signal peptide probability 0.729) with cleavage site + probability 0.460 between residues 39 and 40" + misc_feature 5479..5895 + /gene="wzd" + /locus_tag="SPC12A_0007" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 1.5e-54" + misc_feature 6001..6078 + /gene="wzd" + /locus_tag="SPC12A_0007" + /note="PS00217 Sugar transport proteins signature 2." 
+ gene 6163..6837 + /gene="wze" + /locus_tag="SPC12A_0008" + CDS 6163..6837 + /gene="wze" + /locus_tag="SPC12A_0008" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33221.1" + /db_xref="GOA:Q4K1Y2" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K1Y2" + /translation="MPTLEISQAKLDFVKKAEENYNALCTNLQLSGDDLKVFSITSVK + QGEGKSTTSTNIAWAFARAGYKTLLIDGDIRNSVMLGVFKARDKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVI + DAAIITQKCDASILVTKAGEINRRDIQKAKEQLEHTGKPFLGVVLNKFDTSVDKYGSY + GNYGKK" + gene order(7111..7536,7548..7925) + /gene="tnp" + /locus_tag="SPC12A_0009" + /pseudo + CDS join(7111..7536,7548..7925) + /gene="tnp" + /locus_tag="SPC12A_0009" + /note="member of homology group 148" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1515 transposase" + misc_feature order(7444..7536,7548..7916) + /gene="tnp" + /locus_tag="SPC12A_0009" + /note="HMMPfam hit to PF01609, Transposase DDE domain, + score 1.1e-10" + /pseudo + gene 8057..8656 + /gene="wciI" + /locus_tag="SPC12A_0010" + CDS 8057..8656 + /gene="wciI" + /locus_tag="SPC12A_0010" + /note="member of homology group 29" + /codon_start=1 + /transl_table=11 + /product="putative initial sugar transferase" + /protein_id="CAI33223.1" + /db_xref="GOA:Q4JYM6" + /db_xref="InterPro:IPR003362" + /db_xref="UniProtKB/TrEMBL:Q4JYM6" + /translation="MYREIKRLGDILLSFIGIIVLFPVFIIIAIAIKLDSKGPVIFKQ + KRFGLHKKSFYVLKFRTMKVESPKYVATRDLDKPEQWITKVGACLRKTSLDELPQLWN + ILVGDMSVVGPRPVAINELDLIKEREQYGANDILPGLTGWAQINGRDNLSTEMKAEID + GYYVKHMSLRMDLRCILRTIPYVLKRKGIVEGSGKKELE" + misc_feature 8057..8149 + /gene="wciI" + /locus_tag="SPC12A_0010" + /note="Signal peptide predicted for SPC0551 by SignalP 2.0 + HMM (Signal peptide probability 0.855) with cleavage site + probability 0.449 between residues 31 and 32" + misc_feature 8072..8626 + /gene="wciI" + 
/locus_tag="SPC12A_0010" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 1.4e-36" + gene 8622..9887 + /gene="wciJ" + /locus_tag="SPC12A_0011" + CDS 8622..9887 + /gene="wciJ" + /locus_tag="SPC12A_0011" + /note="member of homology group 35" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33224.1" + /db_xref="GOA:Q4JYM5" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4JYM5" + /translation="MWRVVVRKSWSDAMKILFVCQHYKPEPFRLSDICEDLVQRGHEV + AVLTGIPNYPEGEIYADYRKRKKRRETINGVAIFRSYTIARRQNTLYRILNYFSFALS + STIGVIFGRYKAKDGSDFDCVFVNQLSPVMMAWAGIAYKNKYNKPMFLYCMDVWPDSL + IVGGVKENGLIYKIFEFVSKKVYQASDYIFVTSLSFKDYFVKKFNIPLHKITYLPQYA + EDLFVPNELKTNKNTIDLTFAGNIGKAQNLETILKAASAIEQIPDLAKRVHFHFVGDG + TELLNMQKLACELELENTSFYGRRPLEEMPDFYTKSDAMLVSLIGDSIISRTLPGKVQ + SYMAAGKPIIGAISGDTQRVVKEAKCGFISPEGNVDQLVRNIRKFCLLSVEEREKLGR + QARCCYEEQFSKEWFMTYLENHLKEGFLS" + misc_feature 9279..9812 + /gene="wciJ" + /locus_tag="SPC12A_0011" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 1.7e-14" + gene 9836..11053 + /gene="wcxB" + /locus_tag="SPC12A_0012" + CDS 9836..11053 + /gene="wcxB" + /locus_tag="SPC12A_0012" + /note="member of homology group 55" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33225.1" + /db_xref="GOA:Q4K1Z8" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K1Z8" + /translation="MVYDILRKSFKRGVSIMKVLMINSVCGIRSTGRICTDLATALTE + EGYEVKIAYGREYVPKQFQQYAVKIGTKSDIRFHAIRSRLFDESGFGSRQATVNFIKW + IKEFDPDVIHLHNLHGYYINIELLFDYLRICGKKIIWTLHDCWAFTGHSAHFDCLECE + SKGVCDHPSQKNDYPKSFVNFSKRNYQRKKKCFTHIPNLTIVTPSQWLANLVGQSFLK + EYPVKVIHNGIDTTVFQPRLIAAQKLKKRYHLEGKQVLLGVAAIWTDKKGFSDMLVLA + SHLADNQRIVLIGLKDRQLKKLPKGIIGLTETNSPEELAAWYTLADVFLNPTYQDSYP + TTNLEAISCGTPVISYPTGGSVESAKLYGLVCQDRNVASILSSLEKVSQLSKTEKLDF + SIASFIKQMKYLY" + misc_feature 10556..11038 + /gene="wcxB" + /locus_tag="SPC12A_0012" + /note="HMMPfam hit to PF00534, Glycosyl transferases + 
group, score 3.6e-12" + gene 11091..12302 + /gene="wzy" + /locus_tag="SPC12A_0013" + CDS 11091..12302 + /gene="wzy" + /locus_tag="SPC12A_0013" + /note="member of homology group 71" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33226.1" + /db_xref="InterPro:IPR007016" + /db_xref="UniProtKB/TrEMBL:Q4K1Z7" + /translation="MMKRIYYHLLAILAWTLPNSYAFIDSLKVFFPNISLQIAGSLLA + VISIGIFITRIYYTGYEVFISLLVCIFILIFYSTRFFYSINVELYQSFFNSFLIRPVP + GILVAMLLAKNNHIKGFIKWSEPMMLFYTLTSFLAALSPRNSIIIYQSLSYYAMTAYM + INVFNIIYKEKILEEQLTYFRFSAWNFIRYFLLLIQAFNALSGGGRGAFILLIIFTGI + LLIRIAMNFKFLFSFIGGLSAIALVVFCIKDLDFTWLLNMDGGERLLNFFGRPERIST + DNRLLIYDTVWSAIQEKPFLGWGVGSTFLKFNGYSHNIVLDLLHDMGSFGLLIILSAF + FASSVILYKLRKIDWKVNLFILMFLEVYVHMSFSGSYLADGRLWFLVIFTYCYYRWKV + QEKDEVSNFII" + misc_feature 11907..12074 + /gene="wzy" + /locus_tag="SPC12A_0013" + /note="HMMPfam hit to PF04932, O-Antigen Polymerase, score + 1.1e-08" + gene 12277..13353 + /gene="wcxD" + /locus_tag="SPC12A_0014" + CDS 12277..13353 + /gene="wcxD" + /locus_tag="SPC12A_0014" + /note="member of homology group 72" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33227.1" + /db_xref="GOA:Q4K1Z6" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K1Z6" + /translation="MKLAILLSDISKIGGVQRVTTALVNELCQNIDVTIISIFSENEL + PAFGLSDRVQVSYLLKEHVNLKKNFFKVSGALRKVLKKQQFDVVLSSGTGLVSFLWFA + SLGIPTRLLAWEHQCFYFGRSFGLEWLGRKLACRFAESIVVLTKKDEGFYKENRPKAH + IEQIYNILDMDSQTAKCQLSSKKIISVGSLGRQKGFDLALEVASQIQLSYPDWQWDIY + GDGPDREKLEEKVREYQLEGFINLKGLVQNVRELYPDYSIYALTSRYEGLSMALLEAK + NCQMPAISFDCNCGPSDIISDGRNGFLIDCFDVNIYAKTLSKLMTSLELREQVAKSSV + IPAEELSTTYILDKWNNLLKIERR" + misc_feature 12778..13284 + /gene="wcxD" + /locus_tag="SPC12A_0014" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 1.6e-32" + gene 13355..14533 + /gene="wcxE" + /locus_tag="SPC12A_0015" + CDS 13355..14533 + /gene="wcxE" + /locus_tag="SPC12A_0015" + /note="member of 
homology group 73" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33228.1" + /db_xref="GOA:Q4K1X6" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K1X6" + /translation="MKIVHVEDFFHPDAGYQINVLPKYLAKFGHEQVIITSEMDKIPD + NLTQFFGRENIEERDRSYEEKHHVKIIRLPLHGFVSGRAIFSGKLISAIKGLSPEVLY + IHGNDTLTGIRLLLARKKLNCRIVTDSHMLEMASRNPFNNYFRRFYKTLITPILIKEQ + IPIIRTQDDNYVEKHLGIPLSQAPWISYGSDTAFFHADSQIKEDFRSQYQIASDALIC + VYAGKLDEHKGGMFLAESLSKKLNTEQPIVFIIVGNTNGEYGEAVEKSFSQSENQILR + FPTQKYQKLAQFFQVADFALFPKQCSLSFYDAQACGLPVLLEDNNINLDRTSHYNGWT + FKANSKLSLRDSLKMIASLDKEKRQEYSQNALHYILEHYNYEDKAREYEKILIGERTK + " + misc_feature 13958..14458 + /gene="wcxE" + /locus_tag="SPC12A_0015" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 0.00013" + gene 14566..15762 + /gene="wcxF" + /locus_tag="SPC12A_0016" + CDS 14566..15762 + /gene="wcxF" + /locus_tag="SPC12A_0016" + /note="member of homology group 74" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33229.1" + /db_xref="GOA:Q4K1Z4" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K1Z4" + /translation="MDLMKICIVSVGVGGLPIPAVKGGAVENLIDNYLSYNEKYNHDE + ITVVSCDHKEAREASKKYKYAQFVYIDIHSLKYKINKTIRYAINKYSPFFVGNAYISQ + LPDLSGFDTVLIENRPEYGYYIRKKFKGNLVLHLHNDLLMDNEYSVDYSVYDKIITIS + DYIRDRSEVVTSGVPIQTVYNGIDTELFLQNFSEIDLSDLKNQLEILSDDFVIVFFGR + INKNKGIKELLEAFLLIPKNLNIKLLAVGSSIFGQTELDTFTTELRQLAKQASDKVVF + TGYVNYKDIPKYHHIADCIVVPSIWEEPAGLTVCEALISGKYVITTDAGGIPEIVAGS + EALVVANDECIVEHLKTALLSVYQKGKCSSVITSNRDRGAYFSIEKYGRDLRKELTQN + ERIINI" + misc_feature 14566..14640 + /gene="wcxF" + /locus_tag="SPC12A_0016" + /note="Signal peptide predicted for SPC0557 by SignalP 2.0 + HMM (Signal peptide probability 0.653) with cleavage site + probability 0.406 between residues 25 and 26" + misc_feature 15154..15681 + /gene="wcxF" + /locus_tag="SPC12A_0016" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 2.2e-28" + gene 
15759..17303 + /gene="wzx" + /locus_tag="SPC12A_0017" + CDS 15759..17303 + /gene="wzx" + /locus_tag="SPC12A_0017" + /note="member of homology group 56" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33230.1" + /db_xref="GOA:Q4JYL9" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4JYL9" + /translation="MSRVKNSFFNILAGIVGTIISSVLAFIVRTVFIRVLGETYLGFN + GLYTNILTVLSLTELGIGSSIAYLMYKPLAEKDGDKLAQVVQFYKKIYRVIGIIILIL + GLCLVPFLPVIVNLKNAEDLNYTALYLLYLADTVSTYLFFAYKRGVLAADQKIYVANI + FDIIITTILSIFQIITLMIFKDFYLYIILKIAKNLTLNLVISLKVDKMYPSIHKFKGI + APLPKMERRLVWKNVYATSVRQIFNELMNSTDSIVISIVLGIVMVGKYSNYAYILSIV + YIFFGGIFNPIQASIGNLSLSASIEKKNEIFNRLRFINFFFLSFCSSCLLVLVNPFIT + IWIGENYTLSFTGVIAIVGMLFVRQTGNCTTIFRLGEGYFRDYHFSPLIAGILNLVVS + VILVNYIGIAGVFVGTMLGFGFQFILVDTIVTYKKVLSRPLSEFYLRWLQTILLTVGL + CIASYYLSRLVRVNSIYDLILLFVVVIGFNFFALCFIYWRNDDFQYFIQLVKNFMKNL + EEKNHD" + misc_feature 15759..15833 + /gene="wzx" + /locus_tag="SPC12A_0017" + /note="Signal peptide predicted for SPC0558 by SignalP 2.0 + HMM (Signal peptide probability 0.819) with cleavage site + probability 0.398 between residues 25 and 26" + gene 17296..18519 + /gene="mnaB" + /locus_tag="SPC12A_0018" + CDS 17296..18519 + /gene="mnaB" + /locus_tag="SPC12A_0018" + /note="member of homology group 75" + /codon_start=1 + /transl_table=11 + /product="UDP-N-acetylmannosamine dehydrogenase MnaB" + /protein_id="CAI33231.1" + /db_xref="GOA:Q4K1X3" + /db_xref="InterPro:IPR001732" + /db_xref="InterPro:IPR008927" + /db_xref="InterPro:IPR014026" + /db_xref="InterPro:IPR014027" + /db_xref="InterPro:IPR014028" + /db_xref="InterPro:IPR016040" + /db_xref="InterPro:IPR017476" + /db_xref="UniProtKB/TrEMBL:Q4K1X3" + /translation="MINVIGLGYIGLPTILMLATNGVKVVGTDYNQDLVRTLNEGQTT + FKEDGLDELFHKAVESGVDFTTEYQQTDTYIISVPTPYDSFSKKIDPSYVIEATKTVL + DNCNKGAVIIIESTVSPGTVDKFIRPVVEEKGFVIGSDIHLVHAPERIIPGNMVYELV + NNNRTIGADDLEIGYKVKELYASFCKGDIVVTDIRTAEMTKVVENTFRAVNIAFANEL + 
AQICSYDNMNVYEIIRICNMHPRVNILQPGPGVGGHCISVDPWFLVGDYPELTNVIEH + SMRTNAAMPEFVLNRIYTIMNEHHLTDISRVGLYGLTYKENVDDMRESPTLQLLESMS + RHLATPAIKVYDPFIEKDVVANQSHDLDEFLSNVDIVVLLVGHDEILQNMDKLKDKIV + LDTRYICHLDGTYRL" + misc_feature 17299..17853 + /gene="mnaB" + /locus_tag="SPC12A_0018" + /note="HMMPfam hit to PF03721, UDP-glucose/GDP-mannose + dehydrogenase, score 1.4e-45" + misc_feature 17875..18135 + /gene="mnaB" + /locus_tag="SPC12A_0018" + /note="HMMPfam hit to PF00984, UDP-glucose/GDP-mannose + dehydrogenase, score 4.5e-33" + misc_feature 18217..18480 + /gene="mnaB" + /locus_tag="SPC12A_0018" + /note="HMMPfam hit to PF03720, UDP-glucose/GDP-mannose + dehydrogenase, score 2.5e-15" + gene 18542..19645 + /gene="mnaA" + /locus_tag="SPC12A_0019" + CDS 18542..19645 + /gene="mnaA" + /locus_tag="SPC12A_0019" + /EC_number="5.1.3.14" + /note="member of homology group 23" + /codon_start=1 + /transl_table=11 + /product="UDP-N-acetylglucosamine-2-epimerase MnaA" + /protein_id="CAI33232.1" + /db_xref="GOA:Q4K1V3" + /db_xref="InterPro:IPR003331" + /db_xref="UniProtKB/TrEMBL:Q4K1V3" + /translation="MTMKKIVVIFGTRPEAIKMCPLVKELRTRENLETLVCVTGQHRQ + MLDQVLDTFRITPDFDLSIMKDKQTLFDVTIGILEGMKTVLESVNPDLILVHGDTSTT + FASSLAAFYLQIPIGHVEAGLRTYDIYSPYPEEFNRQAVGALAQYHFTPTQLSKDNLL + REGKNSEAIFITGNTAIDALQTTIQEDYTHPELNWVGDSKLILITAHRRENIGDPMRH + MFRAIRRIIEEHSDIKALYPIHMNPLVRQIAEEELSGCERIKMIDPLEVLDFHNFLSR + SYLILTDSGGIQEEAPSLGKPVLVMRDTTERPEGIKAGTLKLVGTDEDNIYRHFKELL + ENDLVYQAMSQASNPYGDGTACKKIADILEGEV" + misc_feature 18611..19633 + /gene="mnaA" + /locus_tag="SPC12A_0019" + /note="HMMPfam hit to PF02350, UDP-N-acetylglucosamine + 2-epimerase, score 2.5e-174" + gene 19649..20704 + /gene="fnlA" + /locus_tag="SPC12A_0020" + CDS 19649..20704 + /gene="fnlA" + /locus_tag="SPC12A_0020" + /note="member of homology group 36" + /codon_start=1 + /transl_table=11 + /product="FnlA" + /protein_id="CAI33233.1" + /db_xref="GOA:Q4JYL6" + /db_xref="InterPro:IPR003869" + /db_xref="InterPro:IPR013692" + /db_xref="InterPro:IPR016040" + 
/db_xref="UniProtKB/TrEMBL:Q4JYL6" + /translation="MSQFTGKTLLITGGTGSFGNAVLNRFLQTDIGEIRIFSRDEKKQ + DDMRHEFQVKVPEVAGKIRFYLGDVRDLASVKNAMHGVDYVFHAAALKQVPSCEFFPV + EAVKTNILGTENVLTAAIEAGVKQVICLSTDKAAYPVNAMGTSKAMMEKIAVAKSRTV + NPEHTKICVTRYGNVLCSRGSVVPLWIEQIKQGNALTITEPSMTRFVMTLEEAVDLVL + FAFEEGKSGDILVQKAPACTIEVLAKAVSEIFASEQDIKIIGIRHGEKRYETLLTNEE + CANAIDLGDFYRVPSDNRNLNYDKYFKDGSTNRNLLTEFNSNNTDLMDVEQVKRKLLE + LDEIQTAIRDMVADEEM" + misc_feature 19670..20524 + /gene="fnlA" + /locus_tag="SPC12A_0020" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.0018" + misc_feature 19673..20521 + /gene="fnlA" + /locus_tag="SPC12A_0020" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 3.1e-162" + misc_feature 19673..20344 + /gene="fnlA" + /locus_tag="SPC12A_0020" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 8.3e-09" + misc_feature 19676..20311 + /gene="fnlA" + /locus_tag="SPC12A_0020" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 8.4e-09" + misc_feature 20522..20665 + /gene="fnlA" + /locus_tag="SPC12A_0020" + /note="HMMPfam hit to PF08485, Polysaccharide biosynthesis + protein C, score 2e-23" + gene 20804..22033 + /gene="fnlB" + /locus_tag="SPC12A_0021" + CDS 20804..22033 + /gene="fnlB" + /locus_tag="SPC12A_0021" + /note="member of homology group 37" + /codon_start=1 + /transl_table=11 + /product="FnlB" + /protein_id="CAI33234.1" + /db_xref="GOA:Q4K1Y9" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K1Y9" + /translation="MIKNILITGAKGFVGKNLICTLEALKDGRDRTRPNLEIGEIFQY + DRDTDPILLDEYCKKADFVFHLAGVNRPQNPDEFMEGNYGFSSRLLEILEKYENTCPV + LLSSSTQASLEGRFSNSIYGQSKLAGEELFFEYGKKTGAPVLVYRFPNLYGKWCRPNY + NSAVATFCHNIAHDLPIQVNDPSVELELLYIDDLIQECLTALEGNPHRCNLDGLQILP + SPSGNYCYVPTTHRATLGEIVSLLETFKKQPNSLVMPEIPQGSFKKKLYSTYLSYLPV + 
DKFRFPLKMNIDERGSFTELLKTENTGQFSVNISKPGITKGQHWHHSKWEFFMVVSGR + ALIQERRIGLDENGQEYPILNFEVSGDKIEAIHMIPGYAHNIINLSDTENLITVMWAN + ESFDPRHPDTFFEQVEK" + misc_feature 20816..21439 + /gene="fnlB" + /locus_tag="SPC12A_0021" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 3.5e-09" + gene 22034..23218 + /gene="fnlC" + /locus_tag="SPC12A_0022" + CDS 22034..23218 + /gene="fnlC" + /locus_tag="SPC12A_0022" + /note="member of homology group 38" + /codon_start=1 + /transl_table=11 + /product="UDP-L-fucosamine FnlC" + /protein_id="CAI33235.1" + /db_xref="GOA:Q4K1W9" + /db_xref="InterPro:IPR003331" + /db_xref="UniProtKB/TrEMBL:Q4K1W9" + /translation="MKIKTDYSDIHFKDNGKLKLLIIVGTRPEIIRLSSVITKCRKYF + DVILAHTGQNYDYNLNGIFFDNLGLDTPDVYMDAVGDDLGATVGNIINTSYKLMNQIK + PDALLILGDTNSCLSAIAAKRLHIPIFHMEAGNRCKDECLPEETNRRIVDIISDVNLA + YSEHARKYLHECGLPKERTYVTGSPMAEVLHKNLSAIESSDIHERLGLKKGGYILLSA + HREENIDTDKNFISLFTAINQLAEKYNMPILYSCHPRSKKRLQESGFKLDKRVIQHEP + LGFHDYNCLQMNAFVVVSDSGTLPEESSFFTSQGYPFPAVCIRTSTERPESLDKAGFI + LAGIDENSLLQAVETAVSLAEDEDFGLPVPDYVEENVSTKVVKIIQSYTGIVDKIVWR + KS" + misc_feature 22145..23173 + /gene="fnlC" + /locus_tag="SPC12A_0022" + /note="HMMPfam hit to PF02350, UDP-N-acetylglucosamine + 2-epimerase, score 4.8e-105" + gene complement(23413..23502) + /gene="tnp" + /locus_tag="SPC12A_0023" + /pseudo + CDS complement(23413..23502) + /gene="tnp" + /locus_tag="SPC12A_0023" + /note="Lone member of homology group 0226" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1167 transposase (fragment)" + gene complement(23584..24639) + /gene="tnp" + /locus_tag="SPC12A_0024" + /pseudo + CDS complement(join(23584..23901,23903..24253,24253..24639)) + /gene="tnp" + /locus_tag="SPC12A_0024" + /note="member of homology group 12" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1670 transposase" + gene 24720..24908 + /gene="tnp" + /locus_tag="SPC12A_0025" + /pseudo + CDS 24720..24908 + /gene="tnp" + /locus_tag="SPC12A_0025" + 
/note="member of homology group 0047 7" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase (fragment)" + gene complement(25120..25693) + /gene="tnp" + /locus_tag="SPC12A_0026" + /pseudo + CDS complement(join(25120..25443,25424..25693)) + /gene="tnp" + /locus_tag="SPC12A_0026" + /note="member of homology group 31" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1671 transposase" + misc_feature complement(order(25126..25443,25424..25428)) + /gene="tnp" + /locus_tag="SPC12A_0026" + /note="HMMPfam hit to PF05717, IS66 Orf2 like protein, + score 1.7e-52" + /pseudo + gene order(25760..25966,25968..26078,26095..26484) + /gene="tnp" + /locus_tag="SPC12A_0027" + /pseudo + CDS join(25760..25966,25968..26078,26095..26484) + /gene="tnp" + /locus_tag="SPC12A_0027" + /note="member of homology group 19" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1381 transposase (orf2)" + misc_feature order(26007..26078,26095..26472) + /gene="tnp" + /locus_tag="SPC12A_0027" + /note="HMMPfam hit to PF01609, Transposase DDE domain, + score 4.6e-14" + /pseudo + gene 26745..>27104 + /gene="aliA" + /locus_tag="SPC12A_0028" + CDS 26745..>27104 + /gene="aliA" + /locus_tag="SPC12A_0028" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33241.1" + /db_xref="GOA:Q4K2T2" + /db_xref="InterPro:IPR000914" + /db_xref="UniProtKB/TrEMBL:Q4K2T2" + /translation="MMKSSKLFALAGVTLLAATTLAACSGSGSSTKGEKTFSYIYETD + PDNLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKD + AKWYTSEGEEYAAVKAQD" + misc_feature 26745..26831 + /gene="aliA" + /locus_tag="SPC12A_0028" + /note="Signal peptide predicted for SPC0574 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.277 between residues 29 and 30" + misc_feature 26991..27059 + /gene="aliA" + /locus_tag="SPC12A_0028" + /note="PS01040 Bacterial extracellular solute-binding + proteins, family 5 signature." 
+ORIGIN + 1 cgaccgtcgc ttcctagttg tggctaactt gtccaatgaa gagcaagact tgacagtaga + 61 aggaaaagtc aaatctgtct tgattgaaaa caccctagct caagaagtct ttgaaaaaca + 121 aatcttagtt ccatgggatg ctttctgtgt ggaattacta taaatatttt ttgcagaaaa + 181 atttaaaatt gaaatcgtat aaaaacaagg gaggactgta taaaagacag aaatcctttg + 241 ttttttataa ccaaggttta taaactttca ttatcgaaat tcaattaact ttacaaattc + 301 ccactattaa ggagaaagaa aatgaacata aagaagcgtg tccttagtgc aggtctgact + 361 tttgcatctg ctttgctttt agctgcttgc gaccaatcag gttcagatac aaaaacttac + 421 tcatcaacct ttagtggaaa tccaactaca tttaattacc tgttagacta ttacgctgat + 481 aatatagtca attgaaacaa gagcaggaca aaagagcctc gtaaaaggta ttgcaacttg + 541 gtaatacctt ttacgaggct ttttgatatg agcccatgtt ttctcaatag gattgtactc + 601 aggtgagtag ggaggaagaa ggtaaaagtt tatgcccaaa ctcttcgcat aaaagttcta + 661 gcttccccat tctatggaat cttgcattat ccataataat aaccgatggt gtggttaatg + 721 ttggtaagaa aaacttctga aaccaagctt caaaaaagtc gctcgtcatc atctcttcgt + 781 aagtcattgg agtgattaac tcaccatttg ttagacctgc aaccaaagaa atcctctgat + 841 atcttcttcc agatactttg cctcttatta actgaccttt taatgagcga ccatattctc + 901 gataaaaata agtatcgaat cctgtttcgt caatctaaac aggtgctagg tgctttaatc + 961 tattaaaatt cttaagaaac aaggctactt tttctgggtc ttgttcatag taggtgtggt + 1021 tctttttttc gagtgtagcc catagctttg agcgcatagt ggatggtagt tggatgacag + 1081 ccaaattcag aagctatttc agtcaaataa gcgtctggat tgtcagtaag atagttttta + 1141 agtctatctc tatcaacttt tcttggtttt attcctttta cttggtggtt tagctctcct + 1201 gttttctctt ttagctttaa ccagccataa acccaaatca ttcatacctc tctcaactag + 1261 atgtaactta ccaaacccct gacctcatga gccactttct tcctcctcat gaggtcagtt + 1321 ttactttctg ctgttccagt atcgtttttc ctcgctagat ttcctcaaaa gggcagactc + 1381 ctcccttggt gcgtcacacg attttttcat ctcgactgtt ctttaatgca tcattaacga + 1441 cgcttttctt ctaggtggtt cataaggaac aggaagattc aggttgactt ttctaatcct + 1501 agaataaagt gctgaaaaca attcggaata ggcatagaga ctagacaatt tgaggagctg + 1561 cttgcgtcct gttcgaacac attttcctac cacgtgaaga aaaagatggc ggaagcgttt + 1621 gattgttaaa gtttggaagt cacctccagc 
tagatgtttg agaaaaagat agagattgta + 1681 ggcgatacag ctcatcatca tacgaacttc gtttttgatt aaggttgaac tatccgtttt + 1741 atcgccaaaa aatccctcct tcatctcctt gatgaaattc tcggcttgac cacgtccacg + 1801 ataaagctga aactggtctt ggcttgttcc actcgtcata tttgtaacga gagaaataac + 1861 atcgtagaac aagtttcctt cttttcgttc agagaactgg cagacacgac gcttgtgcga + 1921 ccaagatcct gcttgataga gagtttctga gtaggcggag tggggcaaga tggttaagtc + 1981 ctcatcctgt gggcaaggga gggaaaggtc tccaagacgg ctcagaacag tatttttctt + 2041 gagttttatg aggtagtatt gccctgtttt ttcaattaaa tcgtataatt ttggggtcgc + 2101 aaagccacta tccattcgaa agagaagttg attaaaccgt tctaaaacag gtgtgataaa + 2161 gctgtctgcc tcttcagaac aataacgatt accaggacga agctgggcat tgaaacaata + 2221 acctgtcttc ccctcgaaag cataaagagg atgatagcca tgagcacgat agtgggcgtt + 2281 ataagcaaca ccttcttgct tgccataagt tgtgaaatgg gtagaatcga tatctacaat + 2341 gagttggttt agctggtgaa actgtaaaaa gaattcgacc aattcaaggt tgaggcatcg + 2401 caaactatgg actgtttcct cgtcagttct ggaaagaaaa cgggataagg ttggctgtga + 2461 agcaagctgc cctccttcca acaattttgg aaagtaggca tcagctgaca attctttaca + 2521 agcatagtcc gttccataac ctgttaacag ttgaaagagg aactggacaa ggatatctga + 2581 atccgaataa cgacagtagc ggcgttggtc attcgttact aaatacttag aaatccgctc + 2641 ttttagtttc aactgggaaa aaagttcctg aaaaaagata agaccaccat actgggttaa + 2701 atgacctcca tcgaaagata gttggtaaaa agacttgttt tggaagtgat gatttggtaa + 2761 actgttcatg tgagtttcct ttctttttgt gtttttttct acacttatac cataaagggg + 2821 aaactctttt ttgtctagta aaaaacaccc attgggtgaa aaaagaaacc atccaggatc + 2881 taagctaagg caaggattct ggatggtttt tagatttggg gtgaataatt ggggataaat + 2941 ggtattacgt gagatttgga aaacgtgtga tgcttctgtt atactacctg ttcgctcaca + 3001 ataagagaga acttttttac gaaaatctat tgaatatgcc ataaaaagat tataccacat + 3061 tgtgtactat attagattga aactagaata gtacacatct gcttctaaaa cattgttaga + 3121 aatcgatttg actgtcctta tttcatttta ctatattttt ggttcgcggg aagtctacta + 3181 agatacttaa agatgcagat agtaaaaaaa gatgtagaca ttaccgtaaa aaagtgatat + 3241 aattgtatga tgttcaaggt ataggtgtta atcatgagta gacgttttaa 
aaaatcacgt + 3301 tcacagaaag tgaagcgaag tgttaatatc gttttgctga ctatttattt attattagtt + 3361 tgttttttat tgttcttaat ctttaagtat aatatctttg cttttagata tcttaatcta + 3421 gtggtaactg tgttagtcct actagttgcc ttggtagggc tactcttgat tatctataaa + 3481 aaggctgaaa agtttactat ttttctgttg gtgttctcta tccttgtcag ctctgtgtcg + 3541 ctctttgcag tacagcagtt tgttggactg accaatcgtt taaatgcgac ttctaattac + 3601 tcagaatatt caatcagtgt cgctgtttta gcagatagtg agatcgaaaa tgttacgcaa + 3661 ctgacgagtg tgacagcacc gactgggact gataatgaaa atattcaaaa actactagct + 3721 gatatcaagt caagtcagaa taccgatttg acggtcaacc agagttcgtc ttacttggca + 3781 gcttacaaga gtttgattgc aggggagact aaggccattg tcctaaatag tgtctttgaa + 3841 aatatcatcg agtcagagta tccagactac gcatcgaaga taaaaaagat ttataccaag + 3901 ggattcacta aaaaagtaga agctcctaag acgtctaaga atcagtcttt caatatctat + 3961 gttagtggaa ttgacaccta tggtcctatt agttcggtgt cgcgatcaga tgtcaatatc + 4021 ctgatgactg tcaatcgaga taccaagaaa atcctcttga ccacaacgcc gcgtgatgcc + 4081 tatgtaccaa tcgcagatgg tggaaataat caaaaagata aattaaccca tgcgggcatt + 4141 tatggagttg attcgtccat tcacacctta gaaaatctct atggagtgga tatcaattac + 4201 tatgtgcgat tgaacttcac ttctttcttg aaaatgattg acttattggg aggggtagat + 4261 gttcataatg atcaagagtt ttcagctcta catgggaagt tccatttccc agtagggaat + 4321 gtccatctag actctgagca ggctctaggt tttgtacgtg aacgctactc cctagcagat + 4381 ggcgatcgtg accgtggtcg caaccaacaa aaggtgattg tggctatcct tcaaaaatta + 4441 acgtcaaccg aagcactgaa aaattatagt acgatcattg atagcttgca aaattctatc + 4501 caaacaaata tgccacttga gaccatgata aatttggtca atgctcagtt agaaagtgga + 4561 gggagttata aagtaaattc tcaagattta aaagggacag gtcggatgga tcttccttct + 4621 tatgcaatgc cagacagtaa cctctatgtg atggaaatag atgatagtag tttagctgta + 4681 gttaaagcag ctatacagga tgtgatggag ggtagatgag atgatagaca tccattcgca + 4741 tatcgttttt gatgtagatg acggtcccaa gtcaagagag gaaagcaagg ctctcttggt + 4801 agaagcctac agacaggggg tgcgaaccat tgtctctacc tctcaccgtc gcaagggcat + 4861 gtttgaaact ccggaagaga agatagaaga aaactttctt caggttcggg aaatagctaa + 4921 ggaagtggcg 
agtgatttag tcatcgctta cggggctgaa atttactaca caccagatgt + 4981 tctggataag ctagaaaaaa agcggattcc gaccctcaat gatagtcgtt atgccttgat + 5041 agagtttagt atgaacactc cttatcgcga tattcatagc gccttgagca agatcttgat + 5101 gttgggaatt actccagtca ttgcccacat tgagcgctat gatgctcttg aaaataatga + 5161 aaaacgcgtt cgagaattga tcgatatggg ctgttacacg caagtaaata gttcacatgt + 5221 cctcaaatcc aaactttttg gcgaacgtta taaattcatg aaaaaaagag ctcagtattt + 5281 tttagagcag gatttggtcc atgccattgc aagtgatatg cacaatctag acggcagacc + 5341 tcctcatatg gcagaagcat atgaccttgt tacccaaaaa tacggagaag cgaaggctca + 5401 ggaacttttt atagacaatc ctcgaaaaat tgtaatggat caactaattt aggagaaatg + 5461 atgaaagaac aaaacacgat agaaatcgat gtatttcaat tatttaaaac cttgtggaaa + 5521 cgcaagctaa tgattttatt agtggcactt gtgacaggtg cgggggcttt tgcatatagc + 5581 gcttttattg ttaagccaga atatacgagt accacgcgaa tttacgtagt gaatcgcgat + 5641 caaggagaca agtcggggct gacaaatcag gatttgcagg caggaactta tctggtaaaa + 5701 gactaccgtg agattatcct ttcgcagaat gtattggaaa aagtagcgac aaatttgaag + 5761 ttggatatac cagccaaaac gttagctaga aaagttcaag tgactgtacc agttgacact + 5821 cgtatcgtct caatctctgt caaggataaa cagccagagg aagccagtcg tatcgctaat + 5881 tctctacgag aagttgctgc agaaaagatc atcgctgtaa cgcgagtatc tgatgtaacg + 5941 acacttgaag aagcgcgacc agctacgact ccctcttctc caaatgttcg tctcaattcc + 6001 ttgtttggtt tttttggagg agcagtcgta acagtaattg ctgttctttt gattgagttg + 6061 ttcgacatcc gtgtgaaacg tcctgaagat gtcgaagatg tactgcaaat tccactttta + 6121 ggggtcgttc cagatttgaa caaaatgaaa taggaggaag ttatgccaac attagaaatc + 6181 tcacaggcaa aattggattt tgtaaaaaag gcagaggaaa attataacgc tttgtgcacg + 6241 aacctacagt taagtggaga tgatttgaaa gtattttcta tcacttctgt gaaacaagga + 6301 gaaggaaaat caacgacttc caccaatatt gcttgggctt ttgcgcgtgc aggttacaaa + 6361 acgctgctga ttgatggaga tattcgcaat tctgttatgt taggtgtctt taaagcaaga + 6421 gataagatta caggcctgac agaattttta tcaggaacta cagacctatc acaagggctt + 6481 tgtgatacca atatcgaaaa tctctttgta attcaggctg gctctgtgtc accgaatccg + 6541 acagctcttc ttcaaagtaa gaatttcagt 
acaatgcttg aaaccttgcg taaatatttt + 6601 gactatatca ttgtagatac tgctcctgtc ggtgtcgtga ttgatgcggc tattattacg + 6661 caaaaatgcg atgcttctat tttagtgacg aaggcaggtg aaataaatcg acgggatatt + 6721 caaaaagcaa aagaacagtt ggaacacaca gggaagccgt ttttgggagt tgtgttgaat + 6781 aaattcgata cttcagtaga caaatacggt tcttatggaa attacggaaa aaaataagtc + 6841 gttaagtatt tgtgtaagga catttttaga actacaatca aaatctttgg aattgctggc + 6901 ttcaaatcat attgatttga aatgaaactt gcaaaagagt tttttaggtg agtttcttaa + 6961 tttgtgactg aaatcaatct tctacttcca taccttggaa aaatagggta aacgagaaat + 7021 gttttttcca taataaagtt ttgatatggc tagtagagta gtaatataat agacttgttc + 7081 ggtaactgta aaaagtgtta tactattttt atggaaacag tatacgacaa agcacaaaaa + 7141 cttaactcaa aaaacttcaa actattgatt ggtgtcaaaa aggaaacctt tcaactcatg + 7201 ctagaacacc tgaattcagc ctatcagatt cagcaccgaa aaggtggacg tccacgtagt + 7261 ctgcccatgg aagaccagct cattatgacc ctccgttact tgcgatatta tcccactcag + 7321 cgtctgctgg cctttgattt tggcgtcggt gtagctacgg taaatgccat catcacttgg + 7381 gtggaggata cacttcgtgc gtcaggtagc tttgatttgg accatttaga agccccgagt + 7441 gctgctgtgg ctattgacgt gaccgaaagt ccgattcagc gtccaaaaaa aaccaaagca + 7501 aaaattattc tggtaaaaag aaacgacaca ccttaaaaac tcaaattatg ctggatttga + 7561 cgacacataa agtctgtcaa atggcctttt ctgacggaca tacgcatgat tttactctct + 7621 tcaaagaaag tattggacaa agtttgcctg aaacgacgct tgcctttgtt gacctaggtt + 7681 atttaggcat cttgaaattt catgagaata ctttcattcc tgctaaaaat tccaaaaatc + 7741 gccgcctgag tgaggatgat aagcagttaa ataaagagat gtcagcgata cgaattgaaa + 7801 ttgaacattt taacgctaaa ttcaagacct tccaaatcat gtcagtccct tatcgtaacc + 7861 gcagaaaacg tttcgagtta cgggcggaat taatttgtgc catcatcaat tatgaagtga + 7921 actagattcc gaacaagtct aatgaattgt aatcattagt gttcatacca agaaatatca + 7981 agtacctatt tttggaaatt ataaatgtta gatagtgttt aaatttttac ggagagattg + 8041 ttttgagagg taatttatgt atagggaaat aaaacgatta ggtgatattt tactttcttt + 8101 cataggaata atagtactgt ttccagtgtt tattataatt gcaatcgcaa taaagcttga + 8161 ttcaaaaggt ccagtaatat ttaagcaaaa gcgatttgga cttcataaga 
aatcgttcta + 8221 tgtcttgaag tttcgaacta tgaaggttga atcgccaaaa tatgtggcga ctcgagactt + 8281 agataaacca gaacagtgga ttaccaaagt aggagcttgt ttgcggaaaa catctttaga + 8341 tgaactgcct caactgtgga acattcttgt tggtgatatg agtgttgtag gacctaggcc + 8401 tgtagctata aatgaacttg atttgataaa agaaagagaa cagtatggtg ccaatgatat + 8461 cttaccagga ttaactggat gggcacaaat taatggacgt gataatttgt caacagagat + 8521 gaaggcagag atagatggtt attatgtaaa acatatgtcg ttaagaatgg atcttagatg + 8581 tatccttaga acaatcccct acgtattaaa acgtaaggga attgtggagg gtagtggtaa + 8641 gaaagagttg gagtgatgca atgaaaattc tatttgtttg tcaacattat aagccagaac + 8701 cttttagatt gtcagatatt tgtgaggatc tagttcaaag agggcacgag gtggctgttt + 8761 tgacagggat tcctaactat cccgaggggg aaatatatgc tgattatcgt aagagaaaaa + 8821 aaagaagaga gactataaat ggtgttgcta tttttcgttc atacaccatt gctaggaggc + 8881 aaaatacttt ataccgtata ttgaattatt ttagttttgc tctttcttct acgataggtg + 8941 ttatatttgg gcgttataaa gcgaaagatg gctcagattt tgattgtgtc tttgttaatc + 9001 aactatctcc agttatgatg gcttgggctg gtatagctta taagaacaag tacaataaac + 9061 ctatgttttt gtattgcatg gatgtttggc cggatagttt aattgtaggt ggggtgaagg + 9121 aaaatggatt gatttacaag atatttgaat ttgtttcaaa aaaagtatat caagccagcg + 9181 attatatatt tgttactagt ctatctttta aagattattt tgtaaaaaaa tttaatattc + 9241 ctctccacaa aattacttac ttaccacaat atgcagagga tttatttgta ccaaatgaat + 9301 taaaaacgaa caaaaatact attgacttaa cttttgctgg aaatattgga aaagctcaga + 9361 atttagagac tattttgaaa gcagccagtg caatagaaca gattcccgat ttagcaaaga + 9421 gagttcattt tcattttgtt ggagatggta cggaactatt aaacatgcaa aaattagcat + 9481 gtgaactaga attagagaac acttcatttt atggtagacg tccattagaa gagatgccgg + 9541 atttttatac aaaatcagat gcgatgctag tttctttaat aggcgactct ataatttctc + 9601 gcaccttacc aggtaaggta caatcttata tggcggcagg aaaaccaatt ataggagcga + 9661 tttcaggaga tactcagaga gttgtaaaag aagcaaaatg tggtttcata agtccggaag + 9721 ggaatgttga tcagttagtg agaaatattc gtaagttctg tttgctttct gtagaggaaa + 9781 gagagaaact aggaaggcaa gctcgttgtt gttatgaaga acagttttcg aaagagtggt + 9841 ttatgacata 
cttagaaaat catttaaaag aggggtttct atcatgaagg ttttaatgat + 9901 taattccgtt tgtggtatta ggagcactgg gagaatttgt acggatctcg caactgcttt + 9961 gacagaagaa ggatatgagg ttaaaatcgc ctatggtcgt gagtatgttc cgaaacaatt + 10021 tcaacagtat gcagtgaaaa ttggtacaaa gtctgatatt cgttttcatg cgattcgttc + 10081 tcgattattt gacgaatctg gctttggaag tagacaggca actgttaatt ttattaaatg + 10141 gataaaagag tttgaccctg atgttattca tcttcataat cttcatggat attatatcaa + 10201 tattgaactg ttatttgatt atctccgtat atgcggtaaa aagattatat ggactttgca + 10261 tgattgttgg gcatttacag gacactcggc tcactttgat tgtttggaat gtgagtcaaa + 10321 gggggtttgt gaccatccat ctcagaaaaa tgattatcct aagtcgttcg tgaatttttc + 10381 aaagcgaaat tatcaaagga agaaaaaatg ttttacacat attcctaatc tcactattgt + 10441 tactccttcg caatggctag ctaacttggt aggacagtca tttttaaaag aatatccagt + 10501 gaaagtaatt cataatggca ttgatactac tgtctttcaa ccgaggctaa tagccgctca + 10561 aaagttgaaa aaaagatacc atcttgaagg aaagcaggta ttgcttggtg tggctgctat + 10621 ctggactgat aaaaagggat tttctgatat gttagtcctt gcgagtcatc tagctgataa + 10681 tcagagaata gttttgatag ggttaaaaga taggcaactc aaaaaattac ccaaaggtat + 10741 tattgggcta acagagacta atagtccaga agagttggca gcatggtata cactagcgga + 10801 tgtattctta aatcctactt atcaagatag ttacccgaca actaatttag aagctatttc + 10861 ttgtgggaca ccagttatca gctatccgac aggtggtagt gtagaaagtg ctaaacttta + 10921 tggtctcgtt tgtcaggata gaaacgtagc ttctatttta tcttcgttag aaaaagtctc + 10981 tcagctatct aaaacagaaa aattagattt ttcaattgca agttttatta aacaaatgaa + 11041 atatttatac tagaacttga attataggaa aatgaggaat ttgcattaaa atgatgaaaa + 11101 gaatttatta tcaccttttg gctattttgg cttggactct tccaaattct tatgctttta + 11161 ttgattcgtt aaaggtgttt tttccgaata ttagtttaca aattgcaggt tctcttttgg + 11221 ctgttatctc gataggaatt tttatcacta gaatatatta tacaggatac gaagttttta + 11281 tatctctatt ggtttgtatt tttattttaa ttttttattc aactcgcttt ttttattcga + 11341 ttaatgtaga gttgtatcag tctttcttca attcctttct gattcgtcca gttcctggga + 11401 tattagtagc gatgctgtta gctaagaata atcatataaa aggtttcata aaatggtcag + 11461 aacctatgat 
gcttttctat acattgacat catttttagc agccctatct cctagaaata + 11521 gcattattat ttaccaatct ttatcttatt atgccatgac agcttatatg attaatgtgt + 11581 ttaatattat atacaaagag aaaatattgg aggagcaact gacgtatttc agattctcag + 11641 cgtggaattt tattagatat tttttacttt tgattcaagc ttttaatgca ctctcaggag + 11701 gtgggagagg tgcctttatc ttattaatta tttttacagg aatattatta ataagaattg + 11761 ctatgaattt taagttcctt ttctcattca ttggaggctt atctgctata gctctagttg + 11821 ttttttgtat aaaagatttg gatttcacat ggctcttgaa tatggacggt ggagagcgat + 11881 tgttgaactt cttcggcaga cctgaacgta tatctacaga taatagacta ttgatttatg + 11941 atactgtttg gtctgcaata caggaaaaac cctttttagg atggggagtt ggttcaactt + 12001 ttttaaaatt taatggatat tcacataata ttgtattgga tttattgcat gatatgggaa + 12061 gttttggttt attaattatt ctttcggctt tctttgcttc ttcagtaata ttgtacaaat + 12121 tacgtaaaat agattggaaa gtgaatttat ttattctgat gtttctagaa gtatatgttc + 12181 acatgagttt cagtggaagc tatcttgcag atggtagact atggtttttg gtgatcttta + 12241 cttattgtta ctacaggtgg aaagtgcagg aaaaggatga agttagcaat tttattatct + 12301 gatatttcaa aaataggagg agtgcagcgt gtcacgacag ctcttgttaa tgaactttgt + 12361 caaaatatag acgttacaat tatcagcatc ttttcggaaa atgagctacc agcttttgga + 12421 ctttcagata gagttcaggt gagctatctt ttgaaagaac atgttaattt gaagaagaat + 12481 ttttttaaag ttagtggagc tttgcgaaaa gtgttgaaaa aacagcagtt tgatgttgtt + 12541 ctatcgtcag gaactggtct agtatccttt ctttggtttg ctagtttggg aattcctacc + 12601 agacttttgg catgggaaca tcagtgtttt tactttggga gatcgtttgg tctagagtgg + 12661 ttggggcgaa agctagcctg tcgttttgct gagagtattg ttgtcttgac taaaaaagat + 12721 gaaggatttt acaaagagaa tcgtcctaag gctcatattg aacaaatcta taatatccta + 12781 gacatggatt cacaaacagc taagtgtcag ctctcttcta aaaaaattat cagtgttggc + 12841 tctttaggac gacaaaaagg ttttgatctg gctcttgagg tagctagtca aatacaatta + 12901 agttatccag attggcagtg ggacatttat ggtgatggcc ccgatagaga aaaattagag + 12961 gagaaagtca gggaatacca attagaaggc tttataaatt tgaaagggct tgttcagaat + 13021 gttcgggagc tctatcctga ctactctatc tacgccttga catcacgata tgaaggatta + 13081 tcaatggcat 
tattagaagc taaaaactgc cagatgcctg ctatttcatt tgattgtaac + 13141 tgtggaccct ctgatattat ttcagatgga agaaatggtt ttttgattga ttgttttgat + 13201 gtaaatatct atgcaaaaac tttatctaaa ttaatgacta gtttagagtt gcgagaacaa + 13261 gttgcaaaat cgagtgttat tccagcagaa gaattgtcaa caacctatat cctagataag + 13321 tggaacaatc tattaaagat agaaagaaga taatatgaaa atagtccatg tagaagattt + 13381 ttttcatcca gatgcaggtt accagattaa tgttttacca aaatatctag caaagtttgg + 13441 tcatgaacaa gtgattatca cttcagaaat ggataaaatc cccgataatc ttacccaatt + 13501 ttttggacga gaaaatatag aagagagaga tagaagttac gaagagaagc atcatgtgaa + 13561 gattattcgc ttgcctcttc atggatttgt aagcggacgt gcgatttttt ctggaaagct + 13621 tatttcggct attaagggtc tttctccaga ggtattgtat attcatggga atgacacttt + 13681 aacagggatt cgtctccttt tagctcgaaa gaaacttaat tgcagaatcg tcaccgatag + 13741 tcatatgctt gaaatggcat caagaaatcc tttcaacaac tactttagga gattttataa + 13801 aaccttgatt actcccattt tgataaaaga acagatacca attattcgga cgcaagatga + 13861 taattatgtt gaaaaacact tgggaattcc tttatcgcaa gctccatgga tttcttatgg + 13921 gtcggataca gcgttctttc acgcagatag ccagattaag gaagattttc gttctcagta + 13981 tcaaatcgct tcagatgctc ttatttgtgt ttacgcagga aagttagatg agcataaggg + 14041 tgggatgttt ttagcagagt ctctaagtaa aaagttaaat acggagcaac caattgtttt + 14101 cattatagtg ggtaatacaa atggagagta tggagaagct gtcgagaaaa gtttctccca + 14161 atctgaaaac caaattttgc gctttccgac tcaaaaatat caaaaattag cacagttttt + 14221 tcaggtagca gattttgctt tatttcctaa acaatgtagt ttaagttttt atgatgcaca + 14281 ggcctgtggt ttaccagttt tattggaaga taataatatc aacctcgata gaacttctca + 14341 ttataatggt tggacgttca aggctaacag caaattaagt ttgagagatt cattaaaaat + 14401 gattgcgagt ctagataaag agaagagaca agagtactct cagaatgcac tgcactatat + 14461 ccttgaacat tataattatg aagataaagc aagagaatat gaaaagattc ttatagggga + 14521 acgtacgaaa tgagatagtt aatatttcgt tattttatag gaaaggtgga tttaatgaaa + 14581 atttgcattg tttcagtcgg agtgggcgga ctaccgattc cagctgtaaa agggggagca + 14641 gtagaaaatc tcattgataa ttatttaagt tacaatgaga aatataatca tgatgaaatt + 14701 acggtcgtta 
gttgtgacca taaggaggcg cgtgaggctt caaaaaaata caagtatgcc + 14761 caatttgtct atatagatat tcattcactt aaatataaaa taaacaaaac aatacgttat + 14821 gccattaata aatattcacc tttcttcgta gggaacgctt atatcagtca attgccagac + 14881 ttgtctggtt ttgatacagt tttgattgaa aatcgccctg aatacggtta ttatattcgt + 14941 aaaaagttta aaggaaatct tgttttacat cttcacaatg atttattaat ggacaatgag + 15001 tattctgtag attatagcgt ttatgataaa attatcacaa tatctgacta tattagggat + 15061 aggtcagaag tagtaacgtc aggtgttccg atacagactg tctataatgg tattgacaca + 15121 gaactttttt tgcagaattt ctctgaaatt gatttatcag atcttaaaaa tcagttggaa + 15181 attttgtcgg atgattttgt gattgttttt tttggacgta tcaacaaaaa taaaggtatc + 15241 aaagaactgc ttgaagcctt cttgttgata ccaaagaatt tgaatataaa attactagct + 15301 gttggtagtt ctatatttgg tcagacggag ttggatactt tcacaacaga gctacggcaa + 15361 ttggcaaaac aagcatcaga taaagttgtt tttacaggct atgttaatta caaagacatt + 15421 cctaagtatc atcatattgc agattgcatt gttgttccat ctatttggga ggaaccagcg + 15481 ggtttgacgg tctgtgaagc tttgatatca gggaaatatg ttattacaac agatgctgga + 15541 gggataccag agattgtagc tggcagtgaa gcccttgtgg tagcaaatga tgagtgtata + 15601 gttgaacacc tcaaaacagc cctattgagt gtctaccaaa aagggaaatg ctcttcggtt + 15661 attacttcta atagagatag aggagcctat ttttctattg aaaaatatgg aagagactta + 15721 cggaaagagc tcacacaaaa tgaaagaatc attaacatat gagtcgtgta aaaaatagtt + 15781 tttttaatat tttagctgga atagttggta ctatcatatc gagtgtttta gctttcatag + 15841 ttagaacagt gtttatccga gttttgggag agacttatct aggtttcaat ggtctataca + 15901 ccaatatctt aacagtttta tccctaactg aattagggat cggatcatca attgcttatt + 15961 tgatgtacaa acctttagca gaaaaagatg gggacaaatt agctcaagta gttcaattct + 16021 ataaaaaaat atatcgagtg attggtatca ttattcttat tttaggtttg tgtctcgttc + 16081 cttttttacc agtcattgta aatttaaaaa atgcagaaga tttgaactat acagcattgt + 16141 atttgcttta tttagcagat acagtttcta cttatctatt ctttgcatat aaaagagggg + 16201 tattggctgc tgatcaaaag atctatgttg cgaatatctt tgatataatt ataacgacaa + 16261 ttttatctat tttccaaatt atcactttga tgatttttaa agacttttat ctatatatta + 16321 ttttaaaaat 
tgctaaaaat cttactttga acctagtaat tagtttaaaa gtagataaaa + 16381 tgtatccaag tattcataaa tttaaaggga tagctccgct tccaaaaatg gaaagacgac + 16441 tagtttggaa aaatgtatat gctacctctg ttcgacaaat ctttaacgaa ttaatgaatt + 16501 caacagatag tatagttatt tccattgtct taggaatagt tatggttggt aagtattcga + 16561 actatgctta tattttatca atcgtatata ttttctttgg aggaattttt aatccgattc + 16621 aggcttctat tggaaaccta tctctgtcag cttctataga gaaaaaaaat gaaatcttca + 16681 atagattacg ttttataaat tttttctttt tatcattttg ctcaagttgt cttctagtat + 16741 tggtaaatcc ttttatcact atttggattg gagaaaatta cactttatca tttacaggtg + 16801 tgattgcaat agttggtatg ttattcgtta gacaaactgg aaattgtaca accatttttc + 16861 gtttgggaga aggatatttt agagattatc atttttctcc tttaatcgcg ggcattttaa + 16921 atttagttgt ttcagtaatt ttagtgaatt atataggtat tgcaggtgtt tttgttggaa + 16981 caatgttagg atttggtttc caatttatac tggtggatac aattgttact tataaaaaag + 17041 tacttagtcg tccactatca gagttttatt taagatggtt gcagacgatc ttattaactg + 17101 taggtttatg tattgcgagt tactatttat ctcgattggt tagagtgaat agtatatatg + 17161 atttgatact gttgtttgta gtggttattg gatttaattt ttttgcttta tgttttattt + 17221 attggcgaaa tgatgatttt caatatttta ttcaattggt taaaaatttt atgaaaaatt + 17281 tggaggaaaa aaatcatgat taatgtaatc ggattaggtt atattggatt gccaacaatt + 17341 ttaatgttgg caacaaacgg cgtgaaagta gttggaactg actacaatca ggatttggtg + 17401 agaactttaa atgaaggtca aacaaccttt aaagaagatg gattggatga actatttcat + 17461 aaagcagtgg agtcgggtgt ggactttaca accgaatatc aacaaacgga tacctatatt + 17521 atttccgttc caacaccata tgactccttc tctaaaaaaa ttgatccaag ctatgtgatt + 17581 gaagctacga aaacggtact tgataattgc aataaaggag cggttattat tattgaatcg + 17641 accgtatcac caggaacggt tgataaattt attcgacctg ttgtagaaga aaaaggtttt + 17701 gttattggta gtgatattca tcttgtccat gctccagaac gtattattcc agggaatatg + 17761 gtctatgaat tggtgaataa taaccgtaca attggagctg atgacctaga aatcggctat + 17821 aaagtgaaag agctttatgc ttcattttgt aagggcgata ttgttgttac agatattaga + 17881 actgcggaga tgaccaaggt agtagaaaat acatttagag ctgtaaatat tgctttcgct + 17941 aacgaattag 
cacagatctg tagttatgat aatatgaatg tttatgaaat tatccggatc + 18001 tgtaatatgc acccacgggt aaatattcta caacctggac ctggtgttgg tgggcattgt + 18061 atttctgtgg atccttggtt cttagttgga gattatcctg agttgacaaa tgttattgaa + 18121 cattctatgc gaacaaatgc tgccatgcca gaatttgtat taaatcgtat ctataccatt + 18181 atgaacgaac atcatctaac agatattagt cgggttggtc tatatggtct tacctacaaa + 18241 gagaatgtag atgatatgcg tgaatctcca acgcttcagt tattagaatc tatgagccgc + 18301 catctggcaa cacctgctat taaagtatat gatccattta tagaaaaaga tgttgtggcg + 18361 aatcagtcac atgatttaga tgaattttta tctaatgttg atattgttgt actgttggtt + 18421 ggtcatgatg agattttaca aaatatggat aaactaaaag ataagatagt gttagataca + 18481 cgttatatct gtcatcttga tggaacttac agattataat tagtgataaa taaagtaagg + 18541 attgactatg aaaaaaatag ttgtaatttt cggaactcgt cccgaagcta tcaagatgtg + 18601 tcccttggtt aaagagctaa gaacacgtga gaatcttgaa acattggtct gtgttacggg + 18661 tcaacatcgt caaatgctgg atcaagtttt ggatactttt aggattacgc ctgattttga + 18721 tttatctatt atgaaggaca aacaaactct ctttgatgtc acaattggca ttttggaagg + 18781 catgaagact gtcttagagt cagttaatcc tgatttaata ttagttcatg gggatacgag + 18841 tacaacattt gccagttcac tggccgcctt ttatctacag attccaattg gacatgtaga + 18901 ggctggtttg cgtacttatg atatttattc accttatcct gaagaattta atcgtcaagc + 18961 agtaggtgct ttggctcagt atcattttac accaacacaa ctctcaaaag acaatctctt + 19021 gagagaagga aaaaattctg aagctatatt tatcacaggt aacacagcaa ttgatgcttt + 19081 acaaactaca attcaagagg attatactca tcctgagtta aattgggttg gggatagcaa + 19141 actaatatta attactgctc atcgtcgtga aaatattggt gacccgatga ggcacatgtt + 19201 tagagcaatc cgacgtatca ttgaagaaca ttcggatata aaggctcttt accccattca + 19261 tatgaatcct ctagttcgtc agattgctga ggaagaacta agcggatgtg aacgtatcaa + 19321 aatgatcgat ccgttggaag tattagattt tcataacttt ttatcacgga gttatctcat + 19381 tttaacagat agtggtggta tccaagaaga ggcacctagt ttaggaaaac ctgttttagt + 19441 tatgagagat acaactgaac gtccggaggg aattaaagca ggaactttga agcttgtagg + 19501 tactgatgag gacaatattt atagacattt taaagaattg ttagaaaatg atttagttta + 19561 tcaagcgatg 
agccaagctt caaatccgta tggagatgga acagcttgca agaaaattgc + 19621 agacatacta gaaggagaag tataatatat gtcacaattt acaggaaaaa ctctcctaat + 19681 tacaggagga acaggttcat ttggtaatgc tgtccttaat cgttttttac agactgatat + 19741 tggtgaaatt cgtatttttt cccgtgatga aaaaaaacag gatgatatgc gtcatgagtt + 19801 tcaggtaaaa gtaccagaag tagctgggaa aatccgtttt taccttggag atgtgcgtga + 19861 cttagcttcg gtaaaaaatg ctatgcatgg tgtggattat gtttttcatg ctgctgctct + 19921 taaacaagta ccttcgtgtg aatttttccc tgtagaagcg gtaaaaacta acattttggg + 19981 aacggagaat gtcctcactg cggctatcga agctggtgta aagcaagtta tctgtctttc + 20041 tacagataag gcggcttatc ctgtcaatgc tatgggaaca tccaaggcta tgatggaaaa + 20101 gattgctgtt gctaagtcca ggacggtaaa tcctgagcat acaaagatat gtgtgactcg + 20161 ctatgggaat gttctgtgta gccgtggatc tgtcgttcct ctttggattg agcaaattaa + 20221 gcaaggaaat gctcttacaa ttactgaacc tagcatgaca cgttttgtga tgacattaga + 20281 agaagcagta gacttggttt tatttgcatt tgaagaaggg aaatctggag atatactagt + 20341 tcagaaagca ccagcatgta cgattgaagt gttggctaag gctgtatcag aaatttttgc + 20401 ctcagaacaa gatattaaga ttataggtat tagacacgga gaaaaaaggt atgaaacact + 20461 attaactaat gaagagtgcg caaatgcaat tgatttgggt gatttttata gagttcctag + 20521 tgataatcgt aatcttaact atgataagta tttcaaagat ggtagtacga atagaaattt + 20581 gttgacagaa ttcaatagta ataataccga tttgatggat gtagagcaag ttaaaagaaa + 20641 gttgctagaa ttagatgaaa tacagacagc aattcgtgat atggtagcag atgaagagat + 20701 gtaaaatctt ttaagataca ttaaaattat caaggatata taatgtatca tgtattgtcg + 20761 agagagttga ctattaaaac agcatataaa acaaggaggg ggcatgatta aaaatatttt + 20821 aatcacagga gcgaaaggat ttgtaggaaa aaatcttatc tgtactctgg aagctttgaa + 20881 agatggacga gataggactc gtcctaattt agagattgga gagatttttc agtatgatcg + 20941 tgatacagat ccgattttat tagatgaata ttgtaagaag gccgatttcg tattccattt + 21001 agctggtgtc aatcgtccac agaatcctga tgaattcatg gagggaaatt acggtttttc + 21061 aagtagatta ttggagattt tagaaaagta tgaaaacact tgtcctgttc tactctcaag + 21121 ttctactcaa gctagtttag aaggccgatt ttcaaactct atatatggac aatctaagct + 21181 agcaggggaa 
gaactcttct ttgaatatgg aaagaaaacg ggagcacctg tcttagttta + 21241 ccgtttcccg aatctttatg ggaagtggtg ccgtcctaac tacaattctg ctgtagcaac + 21301 tttctgtcat aatatagctc acgatttacc tattcaagta aatgatccaa gtgtagaatt + 21361 ggagttgctg tatattgatg atttgataca agagtgtcta actgcattgg aaggaaatcc + 21421 tcatcgttgt aatctagatg gattacaaat cttacctagc ccatcaggaa actactgcta + 21481 cgtaccaacg actcatcgtg caaccttagg agagattgtc tctctattag aaacatttaa + 21541 aaaacagcct aatagtttag ttatgcctga aattcctcaa ggatcgttta aaaagaaatt + 21601 gtattctacc tacctatctt atttaccagt agataagttt aggtttcctc taaaaatgaa + 21661 tatagatgaa cgaggtagtt ttacggaatt attaaaaaca gaaaatacgg gtcaattttc + 21721 tgttaatatt tctaaacctg gcattaccaa agggcaacat tggcatcatt ctaagtggga + 21781 atttttcatg gttgtttctg gtcgtgcttt aatacaagag cgtaggatag ggctggatga + 21841 aaacggtcaa gagtatccta ttctgaactt tgaagtgtcg ggcgataaga ttgaagcaat + 21901 acatatgata ccgggctatg cacataatat tattaatctt tctgatacag aaaatctaat + 21961 tactgtcatg tgggctaatg agtcatttga tcctagacat ccagatactt tttttgaaca + 22021 agtggagaaa taaatgaaaa ttaagacaga ttatagtgat attcatttta aagataatgg + 22081 caaacttaag ttattgatta ttgtgggaac acgtccagag attatacgtc taagtagtgt + 22141 tatcactaaa tgtcgaaagt attttgatgt tattttggca catactggac aaaactatga + 22201 ttacaattta aatggtattt tctttgataa tttagggtta gacactccgg acgtatacat + 22261 ggatgctgtt ggagatgatc ttggtgctac tgtagggaat attattaata cttcatacaa + 22321 attgatgaat caaattaaac cagatgcttt attgatttta ggggatacaa attcttgttt + 22381 atcagctatt gctgccaagc gtttacatat tccaattttt catatggagg ctggcaatcg + 22441 ctgtaaagat gagtgcctgc cggaagagac taatcgtcgg attgttgata ttatttcaga + 22501 tgttaactta gcatactctg aacatgcacg taagtattta catgagtgtg gtttacctaa + 22561 agagcgcaca tatgtaactg gttctcctat ggcagaagtg ctacataaaa atttatctgc + 22621 cattgagtct tcagatatcc atgaacgttt gggattgaaa aaaggaggtt atatcttact + 22681 ttcagctcac cgtgaggaaa atattgatac agataaaaat tttatttctc tctttacagc + 22741 aattaatcaa ttagctgaaa agtataatat gccaatctta tattcttgcc atcctagatc + 22801 aaagaaaagg 
ctacaagaga gcggttttaa actagataaa cgtgtgattc agcatgagcc + 22861 actaggattc catgactata attgtttaca gatgaatgca tttgttgtag tatctgattc + 22921 gggaacttta ccggaagaaa gtagtttctt tactagtcaa ggttatcctt ttcccgctgt + 22981 atgtattcgt acaagtacag aacgtcctga gtccttagat aaggcaggat ttattttggc + 23041 aggcattgat gaaaattctc ttcttcaagc agttgaaact gctgttagct tggcagaaga + 23101 tgaggatttt ggattaccgg ttccagatta tgttgaggaa aatgtctcta ctaaagttgt + 23161 taagataata cagagctata cagggatagt ggataaaata gtttggagga aaagctgaat + 23221 tgtatatttt taataaatca aaacgagatg attaattctt agtagaacaa gagtaaaatt + 23281 gaacgtattt gatggaaatg tcttacttga tagtcgaggg atagccattc tatcggattt + 23341 ttggcttgtt tttgcgcttc atgtttgata gaataaaggg ctctttgtca actgtagtgg + 23401 gttgaagaaa agctaagctt gagaaaggac aaatttcgtc ctttcttttt tgatgttcag + 23461 agcgataaaa atccgttttt tgaagttttc aaagtttcga aagtaaccgc ccaataacga + 23521 agtatattga aaaatctcca gactagagaa ctcacggata gttcctaatc tggagatttc + 23581 ttatttgcac ttttcttgta caactttagt ccatggtaaa taagcctcta aaacctcttt + 23641 gtttacgaga gtttcctcgt ttggaagaca ttctagaaga taggatagat atttctcgct + 23701 atttataatg gattgaaata agatatgaac aaatcgatta ggaaaggaaa attgatttat + 23761 agaaatgttt tagcagtcga tgcgtactgt tatagattca acgcactata attgatgacg + 23821 tttagctgtt tccaacaagc tcataataat agctcttgct ttagctcctt caaaactttg + 23881 agaaaataac caccctcgct tttttaaact gagctcaggc taaaagagtc cactggactc + 23941 ttttactccg tcccataacc aatgatttaa tggcgcgttc agctagatta ttggaaagga + 24001 ccagatgtcc gtctttcaaa atagtcttaa aggtttcttc atacttgagg ctgtattcaa + 24061 ttgcccttcc tagttttgaa cctgctaaaa ctgactgacg gcggcaccaa gcaaagaagt + 24121 cttccattag gggctggaga tgttcttgac gtttctgtag tcgttcatca gctggcaaag + 24181 cctcccagtc tctttccaag gaaaataact gatcacaata ggctaaacct ttagctccta + 24241 aggatgattt atctgcttgg gggtcgcttc aaaaaacttc cttctcacat gtgcccaaca + 24301 tccaacaagt gcagcttctt ccagttgacg ataagcttct agcggttcgc agtttaccaa + 24361 gcttagcgtc gccttgctcc taaaccttgg actgctatcg cataggcaga actagaggac + 24421 taaagtccta 
agttactgcc gcaacatgtc acaatgaaca tagccagaat aatctcctag + 24481 gaattcttgt actactaaac cactccgacg ctgatcatgg tggtacagcg tgattgcttg + 24541 attctcagct ttcccagaca aaaaggtcca atagtaagtc agctgactat cactctctag + 24601 caccctataa gaagtttcat ctgcatgaag taagggcttg agtcaatagt ctcgttataa + 24661 aggggcttta ggaataggag ctttcacaag cttatccaga tgattatctt ttactcgtta + 24721 tggacaatgc tatatggcat aaatcaagta ccttaaagat tccgactaat attggtttta + 24781 cctttattcc tccatacaca ccagagatga accccattga acaagtgtgg aaagagattc + 24841 gtaaacgtgg atttaagaat aaagcctttc gaactttgga agatgtcata caaggactgg + 24901 agaaggaggt gataaagtcc atcgttaatc ggagatggac tagaatgctt tttgaaagca + 24961 gatgagtata aaaagaaagt cctcatttca atagaaatca cgactttctg atggatttat + 25021 agtaaaatga aataagaaca ggacaaatcg atcaggacag tcaaatcgat ttctaacaat + 25081 gttttagaag cagatgtgta ctattctagt ttcaatctac tatatttttg gagtgataga + 25141 aaagcccttc atcagccaat ctacttgttc aggtgcgaga gctttgacat ccttttctgt + 25201 actgggccaa gtcagtctgc cgttctcaaa gcgtttatat agtagccaaa atccttgacc + 25261 atcccagtaa agggctttaa agcggtcttt acgtccacca caaaagagaa aaacttgacc + 25321 tgagaaagga tctaattcaa agtgggtttt aaccagataa gccagtgaat caatgccttg + 25381 cctcatatcc gttttcccac atacgagata gacctgccct aggctagata gatgaattgt + 25441 catagagcaa caccttatcc aaaagctgtt ctatcatttc gagattgaga gattgaaaaa + 25501 aacttacttc aagcttgcca atacgaattt taagcagaat atcatttctc tttttagaat + 25561 caaaaggacg agattgtgga atctctacag gaacaatagg ttgtggcatt aaaatatcct + 25621 ccaatagttt tactttacta atagtataca ggaggagctc catgaatgat agataccttg + 25681 ttatgacgcg cttactaaac aactaactga tgcacgattt aagcgccttg ttggtgttca + 25741 gcgcacgact tttgaagaga tattagctgt attaaaaaca gcttatcaac ttaaacacgc + 25801 aaaaggtgga cgaaaaccta aattaagcct agaagacctt cttatggcca ctcttcaata + 25861 tatgcgagaa tatcgcactt atgaacaaat tgcggctgat tttggtatcc acgaaagcaa + 25921 cttactccgt cggagccaat gggttgaagt aactcttgtt caaaggtggt gttacgattt + 25981 caagaactcc tctcagttct gaggacacgg taatgattga tgcgacggaa gtacaaatca + 26041 atcgccctaa 
aaaaacaatt agcgaatcat tctggtaaaa agaaatttca cgctatgaag + 26101 gctcaagcga ttgtcacaag tcaagggaga attgtttctt tggatatcgc tgtgaactat + 26161 agtcatgata tgaagttgtt caaaatgagt tgcagaaata tcggacaagc tggtaaaatc + 26221 ttggccgaca gtggttatca agggctcatg aagatatatc ctcaagcaca aactccacgt + 26281 aaatccagca aactcaagcc gctaacagct gaagataaag cctgtaacca tgcgctatct + 26341 aaggagagaa gcaaggttga gaacatcttt gccaaagtaa aaacgtttaa aatgttttca + 26401 acaacctatc gaaatcatcg taaacgcttc ggattacgaa tgaatttgat tgctggtatt + 26461 atcaatcatg aactaggatt ctagttttgc aggaagtcta ttgaaggatc ttttgcttta + 26521 gttccttggt caaggttgat tattttcacg gagcgcttcc gattgttttc ataaaccatt + 26581 tgcgcatagt cagcagaata aatctttttg aaacgtccct ttcctagaca ttatagaact + 26641 ttcagattca tctgaattta ccaaatcaac acaaaaattc tgaaaattct gttgacatct + 26701 ttctgaaaag agtctataat ggagagaaag ttttaaagga gaaaatgatg aaaagttcga + 26761 aactatttgc ccttgcgggc gtgacattat tggcggcgac tactttagct gcatgctctg + 26821 gatcaggttc aagcactaaa ggtgagaaga cattctcata catttatgag acagaccctg + 26881 ataacctcaa ctatttgaca actgctaagg ctgcgacagc aaatattacc agtaacgtgg + 26941 ttgatggttt gctagaaaat gatcgctacg ggaactttgt gccgtctatg gctgaggatt + 27001 ggtctgtatc caaggatgga ttgacttaca cttatactat ccgtaaggat gcaaaatggt + 27061 atacttctga aggtgaagaa tacgcggcag tcaaagctca agac +// + diff --git a/public/res/serotype_genbank/serotype_12B.gb b/public/res/serotype_genbank/serotype_12B.gb new file mode 100644 index 0000000..e63dc11 --- /dev/null +++ b/public/res/serotype_genbank/serotype_12B.gb @@ -0,0 +1,1072 @@ +LOCUS CR931659 23673 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain Gambia 1/81 (serotype 12b). +ACCESSION CR931659 +VERSION CR931659.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. 
+REFERENCE 1 (bases 1 to 23673) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 23673) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..23673 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="Gambia 1/81" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC12B_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC12B_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI33242.1" + /db_xref="UniProtKB/TrEMBL:Q4JZI8" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVELL" + gene 293..458 + /gene="aliB" + /locus_tag="SPC12B_0002" + /pseudo + CDS 293..458 + /gene="aliB" + /locus_tag="SPC12B_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(459..980) + /gene="tnp" + /locus_tag="SPC12B_0003" + /pseudo + CDS complement(459..980) + /gene="tnp" + /locus_tag="SPC12B_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase (fragment)" + gene 1203..2648 + /gene="wzg" + /locus_tag="SPC12B_0004" + 
CDS 1203..2648 + /gene="wzg" + /locus_tag="SPC12B_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33245.1" + /db_xref="GOA:Q4K1Y5" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K1Y5" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLICFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLLFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VDQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYESKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIINSLQDSIQTNVPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1203..1319 + /gene="wzg" + /locus_tag="SPC12B_0004" + /note="Signal peptide predicted for SPC0578 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 39 and 40" + misc_feature 1407..1754 + /gene="wzg" + /locus_tag="SPC12B_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 3.7e-63" + misc_feature 1932..2375 + /gene="wzg" + /locus_tag="SPC12B_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 8.4e-70" + gene 2650..3381 + /gene="wzh" + /locus_tag="SPC12B_0005" + CDS 2650..3381 + /gene="wzh" + /locus_tag="SPC12B_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33246.1" + /db_xref="GOA:Q4K1Y4" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K1Y4" + /translation="MIDIHSHIVFDVDDGPKSREESKALLVEAYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT 
+ QVNSSHVLKSKLFGERYKFMKKRAQYFLEQDLVHVIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 2653..3261 + /gene="wzh" + /locus_tag="SPC12B_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 9e-37" + gene 3387..4082 + /gene="wzd" + /locus_tag="SPC12B_0006" + CDS 3387..4082 + /gene="wzd" + /locus_tag="SPC12B_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33247.1" + /db_xref="GOA:Q4K1W4" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K1W4" + /translation="MMKEQNTIEIDVFQLFKTLWKRKLMILLVALVTGAGAFAYSAFI + VKPEYTSTTRIYVVNRDQGDKSGLTNQDLQAGSYLVKDYREIILSQNVLEKVATNLKL + DIPAKTLARKVQVTVPVDTRIVSISVKDKQPEEASRIANSLREVAAEKIIAVTRVSDV + TTLEEARPATTPSSPNVGRNSLFGFFGGAVVTVIAVLLIELFDIRVKRPEDVEDVLQI + PLLGVVPDLDKMK" + misc_feature 3387..3503 + /gene="wzd" + /locus_tag="SPC12B_0006" + /note="Signal peptide predicted for SPC0580 by SignalP 2.0 + HMM (Signal peptide probability 0.729) with cleavage site + probability 0.460 between residues 39 and 40" + misc_feature 3408..3824 + /gene="wzd" + /locus_tag="SPC12B_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 1.4e-54" + misc_feature 3930..4007 + /gene="wzd" + /locus_tag="SPC12B_0006" + /note="PS00217 Sugar transport proteins signature 2." 
+ gene 4092..4766 + /gene="wze" + /locus_tag="SPC12B_0007" + CDS 4092..4766 + /gene="wze" + /locus_tag="SPC12B_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33248.1" + /db_xref="GOA:Q4K1Y2" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K1Y2" + /translation="MPTLEISQAKLDFVKKAEENYNALCTNLQLSGDDLKVFSITSVK + QGEGKSTTSTNIAWAFARAGYKTLLIDGDIRNSVMLGVFKARDKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVI + DAAIITQKCDASILVTKAGEINRRDIQKAKEQLEHTGKPFLGVVLNKFDTSVDKYGSY + GNYGKK" + gene 5113..5712 + /gene="wciI" + /locus_tag="SPC12B_0008" + CDS 5113..5712 + /gene="wciI" + /locus_tag="SPC12B_0008" + /note="member of homology group 29" + /codon_start=1 + /transl_table=11 + /product="putative initial sugar transferase" + /protein_id="CAI33249.1" + /db_xref="GOA:Q4K1Y1" + /db_xref="InterPro:IPR003362" + /db_xref="UniProtKB/TrEMBL:Q4K1Y1" + /translation="MYREIKRLGDILLSFIGIIVLFPVFIIIAIAIKLDSKGPVIFKQ + KRFGLHKKSFYVLKFRTMKVESPKYVATRDLDKPEQWITKVGACLRKTSLDELPQLWN + ILVGDMSVVGPRPVAINELDLIKEREQYGANDILPGLTGWAQINGRDNLSTEMKAEID + GYYVKHMSLRMDLRCILRTIPYVLKRKGIVEGSGKKELD" + misc_feature 5113..5205 + /gene="wciI" + /locus_tag="SPC12B_0008" + /note="Signal peptide predicted for SPC0582 by SignalP 2.0 + HMM (Signal peptide probability 0.855) with cleavage site + probability 0.449 between residues 31 and 32" + misc_feature 5128..5682 + /gene="wciI" + /locus_tag="SPC12B_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 1.4e-36" + gene 5717..6943 + /gene="wciJ" + /locus_tag="SPC12B_0009" + CDS 5717..6943 + /gene="wciJ" + /locus_tag="SPC12B_0009" + /note="member of homology group 35" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33250.1" + /db_xref="GOA:Q4K1Y0" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K1Y0" + 
/translation="MKILFVCQHYKPEPFRLSDICEDLVQRGHEVAVLTGIPNYPEGE + IYADYRKRKKRRETINGVAIFRSYTIARRQNTLYRILNYFSFALSSTIGVIFGRYKAK + DGSDFDCVFVNQLSPVMMAWAGIAYKNKYNKPMFLYCMDVWPDSLIVGGVKENGLIYK + IFEFVSKKVYQASDYIFVTSLSFKDYFVKKFNIPLHKITYLPQYAEDLFVPNELKTNK + NTIDLTFAGNIGKAQNLETILKAASAIEQIPDLAKRVHFHFVGDGTELLNMQKLACEL + ELENTSFYGRRPLEEMPDFYTKSDAMLVSLIGDSIISRTLPGKVQSYMAAGKPIIGAI + SGDTQRVVKEAKCGFISPEGNVDQLVRNIRKFCLLSVEEREKLGRQARCYYEEQFSKE + WFMTYLENHLKEGFLS" + misc_feature 6335..6868 + /gene="wciJ" + /locus_tag="SPC12B_0009" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 3.8e-16" + gene 6940..8109 + /gene="wcxB" + /locus_tag="SPC12B_0010" + CDS 6940..8109 + /gene="wcxB" + /locus_tag="SPC12B_0010" + /note="member of homology group 55" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33251.1" + /db_xref="GOA:Q4K1X9" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K1X9" + /translation="MKVLMINSVCGIRSTGRICTDLATALTEEGYEVKIAYGREYVPK + QFQQYAVKIGTKSDIRFHAIRSRLFDESGFGSRQATVNFIKWMKEFDPDIIHLHNLHG + YYINVELLFDYLRICGKKIIWTLHDCWAFTGHSAYFDCLECESKGVCDHPSQKNDYPK + SFVNFSKRNYQRKKKCFTHIPNLTIVTPSQWLANLVRQSFLKEYPVKVIHNGIDTTVF + QPRLIAAQKLRKRHHLEGKQVLLGVAAIWDNRKGFSDMLALANDLTDNQRIVLIGLKD + RQLKELPKGIIGLTETNSPEELVAWYTLADVFLNPTYQDNYPTTNLEAISCGTPVISY + PTGGSVESAKLYGLVCQDRNVASILSSLEKVSQLSKTEKLDFSIASFIKQMKYLY" + misc_feature 7612..8094 + /gene="wcxB" + /locus_tag="SPC12B_0010" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 4.2e-12" + gene 8147..9358 + /gene="wzy" + /locus_tag="SPC12B_0011" + CDS 8147..9358 + /gene="wzy" + /locus_tag="SPC12B_0011" + /note="member of homology group 71" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33252.1" + /db_xref="InterPro:IPR007016" + /db_xref="UniProtKB/TrEMBL:Q4K1V9" + /translation="MMKRIYYHLLAIWAWTLPNSYAFIDSLKVFFPNISLQIAGSLLA + VVSIGIFITRIYYTRYEVFISLLVCISILIFYSTRFFYSTNVELYQSFFNSFLIRPVP + 
AILVAMLLAKNNHIKGFIKWSEPMMLFYTLTSFLAALSPRNSIITYQSLSYYAMTAYM + INVFNIIYKEKILEEQLTYFRFSAWNFIRYFLLLIQAFNALSGGGRGAFILLIIFTGI + LLIRTAMKFKFLFSFIGGLSAIALVVFFTKGLDLTWLLNMDGGERLLNFFGRPEHIST + DNRLLIYDTVWSAIQEKPFLGWGVGSTFLKFNGYSHNIVLDLLHDMGSFGLLIILSAF + FASSVILYKLRKIDWKVNLFILMFLEVYVHMSFSGSYLADGRLWFLVIFTYCYYRWKV + QEKDEVSNFII" + misc_feature 8963..9130 + /gene="wzy" + /locus_tag="SPC12B_0011" + /note="HMMPfam hit to PF04932, O-Antigen Polymerase, score + 9.9e-08" + gene 9333..10409 + /gene="wcxD" + /locus_tag="SPC12B_0012" + CDS 9333..10409 + /gene="wcxD" + /locus_tag="SPC12B_0012" + /note="member of homology group 72" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33253.1" + /db_xref="GOA:Q4K1V8" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K1V8" + /translation="MKLAILLSDISKIGGVQRVTTALVNELCQNIDVTIISIFSENEL + PAFGLSDRVQVSYLLKEHVNLKKNFFKVSGALRKVLKKQQFDVVLSSGTGLVSFLWFA + SLGIPTRLLAWEHQCFYFGRSFGLEWLGRKLACRFAESIVVLTKKDEGFYKENRPKAH + IEQIYNILDMDSQTAKCQLSSKKIISVGSLVRQKGFDLALEVASQIQLSYPDWQWDIY + GDGPDREKLEEKVREYQLEGFINLKGLVQNVRELYPDYSIYALTSRYEGLSMVLLEAK + NCQMPAISFDCNCGPSDIISDGRNGFLIDCFDVNIYAKTLSKLMTSLELREQVAKSSV + IPAEELSTTYILDKWNNLLKIERR" + misc_feature 9834..10340 + /gene="wcxD" + /locus_tag="SPC12B_0012" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 1.2e-33" + gene 10411..11589 + /gene="wcxE" + /locus_tag="SPC12B_0013" + CDS 10411..11589 + /gene="wcxE" + /locus_tag="SPC12B_0013" + /note="member of homology group 73" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33254.1" + /db_xref="GOA:Q4K1X6" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K1X6" + /translation="MKIVHVEDFFHPDAGYQINVLPKYLAKFGHEQVIITSEMDKIPD + NLTQFFGRENIEERDRSYEEKHHVKIIRLPLHGFVSGRAIFSGKLISAIKGLSPEVLY + IHGNDTLTGIRLLLARKKLNCRIVTDSHMLEMASRNPFNNYFRRFYKTLITPILIKEQ + IPIIRTQDDNYVEKHLGIPLSQAPWISYGSDTAFFHADSQIKEDFRSQYQIASDALIC + 
VYAGKLDEHKGGMFLAESLSKKLNTEQPIVFIIVGNTNGEYGEAVEKSFSQSENQILR + FPTQKYQKLAQFFQVADFALFPKQCSLSFYDAQACGLPVLLEDNNINLDRTSHYNGWT + FKANSKLSLRDSLKMIASLDKEKRQEYSQNALHYILEHYNYEDKAREYEKILIGERTK + " + misc_feature 11014..11514 + /gene="wcxE" + /locus_tag="SPC12B_0013" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 0.00013" + gene 11622..12818 + /gene="wcxF" + /locus_tag="SPC12B_0014" + CDS 11622..12818 + /gene="wcxF" + /locus_tag="SPC12B_0014" + /note="member of homology group 74" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33255.1" + /db_xref="GOA:Q4K1X5" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K1X5" + /translation="MDLMKICIVSVGVGGLPIPAVKGGAVENLIDNYLSYNEKYNHDE + ITVVSCDHKEAREASKKYKYAQFVYIDIHSLKYKINKTIRYAINKYSPFFVGNAYISQ + LPDLSGFDTVLIENRPEYGYYIRKKFKGNLVLHLHNDLLMDNEYSVDYSVYDKIITIS + DYIRDRSEVVTSGVPIQTVYNGIDTELFLQNFSEIDLSDLKNQLEILSDDFVIVFFGR + INKNKGIKELLEAFLLLPKNLNIKLLAVGSSIFGQTELDTFTTELRQLAKQASDKVVF + TGYVNYKDIPKYHHIADCIVVPSIWEEPAGLTVCEALISGKYVITTDAGGIPEIVAGS + EALVVANDECIVEHLKTALLSVYQKGKCSSVITSNRDRGAYFSIEKYGRDLRKELTQN + ERIINI" + misc_feature 11622..11696 + /gene="wcxF" + /locus_tag="SPC12B_0014" + /note="Signal peptide predicted for SPC0588 by SignalP 2.0 + HMM (Signal peptide probability 0.653) with cleavage site + probability 0.406 between residues 25 and 26" + misc_feature 12210..12737 + /gene="wcxF" + /locus_tag="SPC12B_0014" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 1.3e-28" + gene 12815..14359 + /gene="wzx" + /locus_tag="SPC12B_0015" + CDS 12815..14359 + /gene="wzx" + /locus_tag="SPC12B_0015" + /note="member of homology group 56" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33256.1" + /db_xref="GOA:Q4K1X4" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K1X4" + /translation="MSRVKNSFFNILAGIVGTIISSVLAFIVRTVFIRVLGETYLGFN + GLYTNILTVLSLAELGIGSSIAYLMYKPLAEKDGDKLAQVVQFYKKIYRVIGIIILIL + 
GLCLVPFLPVIVNLKNAEDLNYTALYLLYLADTVSTYLFFAYKRGVLVADQKVYVANI + FDIIITTILSIFQIITLMIWKDFYLYIILKIAKNLTLNLVISLKVDKMYPSIHKFKEI + APLPKMERRLVWKNVYATSVRQIFNELMNSTDSIVISIVLGIVMVGKYSNYAYILSIV + YIFFGGIFNPIQASIGNLSLLASIEKKNEIFNRLRFINFFFLSFCSSCLLVLVNPFIT + IWIGENYTLSFTGVIAIVGMLFVRQTGNCTTIFRLGEGYFRDYHFSPLIAGILNLVVS + VILVNYIGIAGVFVGTMLGFGFQFILVDTIVTYKKVLSRPLSEFYLRWLQTILLTVGL + CIASYYLSRLVRVNSIYDLILLFVVVIGFNFFALCFIYWRNDDFQYFIQLVKNFMKNL + EEKNHD" + misc_feature 12815..12889 + /gene="wzx" + /locus_tag="SPC12B_0015" + /note="Signal peptide predicted for SPC0589 by SignalP 2.0 + HMM (Signal peptide probability 0.820) with cleavage site + probability 0.397 between residues 25 and 26" + gene 14352..15575 + /gene="mnaB" + /locus_tag="SPC12B_0016" + CDS 14352..15575 + /gene="mnaB" + /locus_tag="SPC12B_0016" + /note="member of homology group 75" + /codon_start=1 + /transl_table=11 + /product="UDP-N-acetylmannosamine dehydrogenase MnaB" + /protein_id="CAI33257.1" + /db_xref="GOA:Q4K1X3" + /db_xref="InterPro:IPR001732" + /db_xref="InterPro:IPR008927" + /db_xref="InterPro:IPR014026" + /db_xref="InterPro:IPR014027" + /db_xref="InterPro:IPR014028" + /db_xref="InterPro:IPR016040" + /db_xref="InterPro:IPR017476" + /db_xref="UniProtKB/TrEMBL:Q4K1X3" + /translation="MINVIGLGYIGLPTILMLATNGVKVVGTDYNQDLVRTLNEGQTT + FKEDGLDELFHKAVESGVDFTTEYQQTDTYIISVPTPYDSFSKKIDPSYVIEATKTVL + DNCNKGAVIIIESTVSPGTVDKFIRPVVEEKGFVIGSDIHLVHAPERIIPGNMVYELV + NNNRTIGADDLEIGYKVKELYASFCKGDIVVTDIRTAEMTKVVENTFRAVNIAFANEL + AQICSYDNMNVYEIIRICNMHPRVNILQPGPGVGGHCISVDPWFLVGDYPELTNVIEH + SMRTNAAMPEFVLNRIYTIMNEHHLTDISRVGLYGLTYKENVDDMRESPTLQLLESMS + RHLATPAIKVYDPFIEKDVVANQSHDLDEFLSNVDIVVLLVGHDEILQNMDKLKDKIV + LDTRYICHLDGTYRL" + misc_feature 14355..14909 + /gene="mnaB" + /locus_tag="SPC12B_0016" + /note="HMMPfam hit to PF03721, UDP-glucose/GDP-mannose + dehydrogenase, score 1.4e-45" + misc_feature 14931..15191 + /gene="mnaB" + /locus_tag="SPC12B_0016" + /note="HMMPfam hit to PF00984, UDP-glucose/GDP-mannose + dehydrogenase, score 
4.5e-33" + misc_feature 15273..15536 + /gene="mnaB" + /locus_tag="SPC12B_0016" + /note="HMMPfam hit to PF03720, UDP-glucose/GDP-mannose + dehydrogenase, score 2.5e-15" + gene 15604..16701 + /gene="mnaA" + /locus_tag="SPC12B_0017" + CDS 15604..16701 + /gene="mnaA" + /locus_tag="SPC12B_0017" + /EC_number="5.1.3.14" + /note="member of homology group 23" + /codon_start=1 + /transl_table=11 + /product="UDP-N-acetylglucosamine-2-epimerase MnaA" + /protein_id="CAI33258.1" + /db_xref="GOA:Q4K1X2" + /db_xref="InterPro:IPR003331" + /db_xref="UniProtKB/TrEMBL:Q4K1X2" + /translation="MKKIVVIFGTRPEAIKMCPLVKELRTRENLETLVCVTGQHRQML + DQVLDTFRITPDFDLSIMKDKQTLFDVTIGILEGMKTVLESVNPDLILVHGDTSTTFA + SSLAAFYLQIPIGHVEAGLRTYDIYSPYPEEFNRQAVGALAQYHFTPTQLSKDNLLRE + GKNSEAIFITGNTAIDALQTTIQEDYTHPELNWVGDSKLILITAHRRENIGDPMRHMF + RAIRRIIEEHSDIKALYPIHMNPLVRQIAEEELSGCERIKMIDPLEVLDFHNFLSRSY + LILTDSGGIQEEAPSLGKPVLVMRDTTERPEGIKAGTLKLVGTDEDNIYRHFKELLEN + DLVYQAMSQASNPYGDGTACKKIADILEGEV" + misc_feature 15667..16689 + /gene="mnaA" + /locus_tag="SPC12B_0017" + /note="HMMPfam hit to PF02350, UDP-N-acetylglucosamine + 2-epimerase, score 2.5e-174" + gene 16705..17760 + /gene="fnlA" + /locus_tag="SPC12B_0018" + CDS 16705..17760 + /gene="fnlA" + /locus_tag="SPC12B_0018" + /note="member of homology group 36" + /codon_start=1 + /transl_table=11 + /product="FnlA" + /protein_id="CAI33259.1" + /db_xref="GOA:Q4K1X1" + /db_xref="InterPro:IPR003869" + /db_xref="InterPro:IPR013692" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K1X1" + /translation="MSQFTGKTLLITGGTGSFGNAVLNRFLQTDIGEIRIFSRDEKKQ + DDMRHEFQVKVPEVAGKIRFYLGDVRDLASVKNAMHGVDYVFHAAALKQVPSCEFFPV + EAVKTNILGTENVLTAAIEAGVKQVICLSTDKAAYPVNAMGTSKAMMEKIAVAKSRTV + NPEHTKICVTRYGNVLCSRGSVVPLWIEQIKQGNALTITEPSMTRFVMTLEEAVDLVL + FAFEEGKSGDILVQKAPACTIEVLAKAVSEIFASEQDIKIIGIRHGEKKYETLLTNEE + CANAIDLGDFYRVPSDNRNLNYDKYFKDGSTNRNLLTEFNSNNTDLMDVEQVKRKLLE + LDEIQTAIRDMVADEEM" + misc_feature 16726..17580 + /gene="fnlA" + /locus_tag="SPC12B_0018" + /note="HMMPfam hit 
to PF04321, RmlD substrate binding + domain, score 0.0018" + misc_feature 16729..17577 + /gene="fnlA" + /locus_tag="SPC12B_0018" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 1.1e-162" + misc_feature 16729..17400 + /gene="fnlA" + /locus_tag="SPC12B_0018" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 8.3e-09" + misc_feature 16732..17367 + /gene="fnlA" + /locus_tag="SPC12B_0018" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 8.4e-09" + misc_feature 17578..17721 + /gene="fnlA" + /locus_tag="SPC12B_0018" + /note="HMMPfam hit to PF08485, Polysaccharide biosynthesis + protein C, score 2e-23" + gene 17860..19089 + /gene="fnlB" + /locus_tag="SPC12B_0019" + CDS 17860..19089 + /gene="fnlB" + /locus_tag="SPC12B_0019" + /note="member of homology group 37" + /codon_start=1 + /transl_table=11 + /product="FnlB" + /protein_id="CAI33260.1" + /db_xref="GOA:Q4K1V1" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K1V1" + /translation="MIKNILITGAKGFVGKNLICTLEALKDGRDRTRPNLEIGEIFQY + DRDTDPILLDEYCKKADFVFHLAGVNRPQNPDEFMEGNYGFSSRLLEILEKYENTCPV + LLSSSTQASLEGRFSNSIYGQSKLAGEELFFEYGKKTGAPVLVYRFPNLYGKWCRPNY + NSAVATFCHNLAHDLPIQVNDPSVELELLYIDDLIQECLTALEGNPHRCNLDGLQILP + SPSGNYCYVPTTHRATLGEIVSLLETFKKQPNSLVMPEIPQGSFKKKLYSTYLSYLPV + DKFRFPLKMNIDERGSFTELLKTENTGQFSVNISKPGITKGQHWHHSKWEFFMVVSGR + ALIQERRIGLDENGQEYPILNFEVSGDKIEAIHMIPGYAHNIINLSDTENLITVMWAN + ESFDPRHPDTFFEQVEK" + misc_feature 17872..18495 + /gene="fnlB" + /locus_tag="SPC12B_0019" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 6.9e-09" + gene 19090..20274 + /gene="fnlC" + /locus_tag="SPC12B_0020" + CDS 19090..20274 + /gene="fnlC" + /locus_tag="SPC12B_0020" + /note="member of homology group 38" + /codon_start=1 + /transl_table=11 + /product="UDP-L-fucosamine FnlC" + /protein_id="CAI33261.1" + 
/db_xref="GOA:Q4K1W9" + /db_xref="InterPro:IPR003331" + /db_xref="UniProtKB/TrEMBL:Q4K1W9" + /translation="MKIKTDYSDIHFKDNGKLKLLIIVGTRPEIIRLSSVITKCRKYF + DVILAHTGQNYDYNLNGIFFDNLGLDTPDVYMDAVGDDLGATVGNIINTSYKLMNQIK + PDALLILGDTNSCLSAIAAKRLHIPIFHMEAGNRCKDECLPEETNRRIVDIISDVNLA + YSEHARKYLHECGLPKERTYVTGSPMAEVLHKNLSAIESSDIHERLGLKKGGYILLSA + HREENIDTDKNFISLFTAINQLAEKYNMPILYSCHPRSKKRLQESGFKLDKRVIQHEP + LGFHDYNCLQMNAFVVVSDSGTLPEESSFFTSQGYPFPAVCIRTSTERPESLDKAGFI + LAGIDENSLLQAVETAVSLAEDEDFGLPVPDYVEENVSTKVVKIIQSYTGIVDKIVWR + KS" + misc_feature 19201..20229 + /gene="fnlC" + /locus_tag="SPC12B_0020" + /note="HMMPfam hit to PF02350, UDP-N-acetylglucosamine + 2-epimerase, score 4.8e-105" + gene complement(20469..20570) + /gene="tnp" + /locus_tag="SPC12B_0021" + /pseudo + CDS complement(20469..20570) + /gene="tnp" + /locus_tag="SPC12B_0021" + /note="Lone member of homology group 0227" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1167 transposase (fragment)" + /db_xref="PSEUDO:CAI33262.1" + gene complement(20637..21582) + /gene="tnp" + /locus_tag="SPC12B_0022" + /pseudo + CDS complement(join(20637..20858,20869..21582)) + /gene="tnp" + /locus_tag="SPC12B_0022" + /note="member of homology group 12" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1670 transposase" + gene 21679..21864 + /gene="tnp" + /locus_tag="SPC12B_0023" + /pseudo + CDS 21679..21864 + /gene="tnp" + /locus_tag="SPC12B_0023" + /note="Lone member of homology group 0228" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase (fragment)" + gene complement(21974..22574) + /gene="tnp" + /locus_tag="SPC12B_0024" + /pseudo + CDS complement(join(21974..22324,22305..22574)) + /gene="tnp" + /locus_tag="SPC12B_0024" + /note="member of homology group 31" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1671 transposase" + misc_feature complement(order(21983..22324,22305..22309)) + /gene="tnp" + /locus_tag="SPC12B_0024" + 
/note="HMMPfam hit to PF05717, IS66 Orf2 like protein, + score 4.2e-56" + /pseudo + gene order(22641..22835,22837..22959,22976..23365) + /gene="tnp" + /locus_tag="SPC12B_0025" + /pseudo + CDS join(22641..22835,22837..22959,22976..23365) + /gene="tnp" + /locus_tag="SPC12B_0025" + /note="member of homology group 19" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1381 transposase" + misc_feature order(22888..22959,22976..23353) + /gene="tnp" + /locus_tag="SPC12B_0025" + /note="HMMPfam hit to PF01609, Transposase DDE domain, + score 4.7e-11" + /pseudo + gene 23626..>23673 + /gene="aliA" + /locus_tag="SPC12B_0026" + CDS 23626..>23673 + /gene="aliA" + /locus_tag="SPC12B_0026" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33267.1" + /db_xref="UniProtKB/TrEMBL:Q4K2C2" + /translation="MMKSSRLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcata taaaaacaag + 181 ggaggactgt ataaaaagca gaaatccttt gttttttata accaaggttt ataaactttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga agatgaacat + 301 aaagaagcgt gtccttagtg caggcctgac ttttgcatct gctttgcttt tagctacttg + 361 cggccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaactat ctattagact attacgctga taatatagtc aattgaaaca agaacaagac + 481 aaaagagcct cgtaaaaggt attgcaactt ggtaatacct ttttgaggtt ctttttgata + 541 tgagcccatg ttttctcaat aggattgtac tcaggtgaat agggaggaag aggtaaaagt + 601 ttatgaccaa actcttcgca taaaagttct agcttaccca ttctatggaa tcttgcatta + 661 tccataataa taaccgatgg tgtggttaat gttggtaaga gaaatttctg aaaccatact + 721 tcaaaaaagt cgttcgtcat cgtctcttcg taagtcattg gagcgattaa ttcaccattt + 781 gttagacctg caaccaaaga aatcctctga tatcttcttc cagatacttt gcctcttctt + 841 aactgacctt ttaatgagcg accatattct cgataaaaat aagtatcgaa tcctgtttca + 901 tcaatctaaa caggtgctag gtgctttaaa ctattaaaat tcttaagaaa taaggctact + 961 
ttttctgggt cttgttcata attagattga aactagagta gtacaccttt gcttctaaaa + 1021 cattgttaga aatcgattta actgtcctga ttgatttatc ctattcttgt ttcaatctac + 1081 tatatttttg tttcgcggga agtctactta agatacttaa agatgcagat agtaaaaaag + 1141 atgtagacat taccgtaaaa aagtgatata atcgtatgat gttcaaggta taggtgttaa + 1201 tcatgagtag acgttttaaa aaatcacgtt cacagaaagt gaagcgaagt gttaatatcg + 1261 ttttgctgac tatttattta ttgttaattt gttttttatt gttcttaatc tttaagtaca + 1321 atatccttgc ttttagatat cttaatctag tggtaactgc gttagtccta ctagttgcct + 1381 tggtagggct actcttgatt atctataaaa aagctgaaaa gtttactatt tttctgttgc + 1441 tgttctctat ccttgtcagc tctgtgtcgc tctttgcagt acagcagttt gttggactga + 1501 ccaatcgttt aaatgcgact tctaattact cagaatattc aatcagtgtc gctgttttag + 1561 cagatagtga tatcgaaaat gttacgcaac tgacgagtgt gacagcaccg actgggactg + 1621 ataatgaaaa tattcaaaaa ctactagctg atattaagtc aagtcagaat accgatttga + 1681 cggtcgacca gagttcgtct tacttggcag cttacaagag tttgattgca ggggagacta + 1741 aggccattgt cttaaatagt gtctttgaaa atatcatcga gtcagagtat ccagactacg + 1801 aatcgaagat aaagaagatt tataccaagg gattcactaa aaaagtagaa gctcctaaga + 1861 cgtctaagaa tcagtctttc aatatctatg ttagtggaat tgacacctat ggtcctatta + 1921 gttcggtgtc gcgatcagat gtcaatatcc tgatgactgt caatcgagat accaagaaaa + 1981 tcctcttgac cacaacgccg cgtgatgcct atgtaccaat cgcagatggt ggaaataatc + 2041 aaaaggataa attgactcat gctggtatat atggggttga ttcatccatt cataccctag + 2101 agaaccttta tggtgtagat attaattatt atgttcgttt gaattttacc tcatttttga + 2161 aattgattga cttattggga ggggtagatg ttcataatga tcaagagttt tcagctctac + 2221 atgggaagtt ccatttccca gtagggaatg tccatctaga ctctgagcag gctctaggtt + 2281 ttgtacgtga acgctactca ctagccgatg gagaccgtga ccgtggtcgc aaccaacaaa + 2341 aggtgattgt ggctatcctt caaaaattaa cgtcaaccga agcactgaaa aattatagta + 2401 cgatcattaa tagcttgcaa gattccatcc aaacaaatgt gccacttgag actatgataa + 2461 atttggtcaa tgctcagtta gaaagtggag ggaattataa agtaaattct caagatttaa + 2521 aaggtacagg tcggacggat cttccttctt atgcaatgcc agacagtaac ctctatgtga + 2581 tggaaataga tgatagtagt 
ttagctgtag ttaaagcagc tatacaggat gtgatggagg + 2641 gtagatgaga tgatagacat ccattcgcat atcgtttttg atgtagatga cggtcccaag + 2701 tcaagagagg aaagcaaggc tctcttggta gaagcctaca gacagggggt gcgaaccatt + 2761 gtctctacct ctcaccgtcg caagggtatg tttgaaactc cggaagagaa gatagcagaa + 2821 aactttcttc aggttcggga aatagctaag gaagtggcga gtgatttagt catcgcttac + 2881 ggggctgaaa tttactacac accagatgtt ctggataagc tagaaaaaaa gcggattccg + 2941 accctcaatg atagtcgtta tgccttgata gagtttagta tgaacactcc ttatcgcgat + 3001 attcatagcg ccttgagcaa gatcttgatg ttgggaatta ctccagtcat tgcccacatt + 3061 gagcgctatg atgctcttga aaataatgaa aaacgcgttc gagaattgat cgatatgggc + 3121 tgttacacgc aagtaaatag ttcacatgtc ctcaaatcca aactttttgg cgaacgttat + 3181 aaattcatga aaaaaagagc tcagtatttt ttagagcagg atttggtcca tgtcattgca + 3241 agtgatatgc acaatctaga cggcagacct cctcatatgg cagaagcata tgaccttgtt + 3301 acccaaaaat acggagaagc gaaggctcag gaacttttta tagacaatcc tcgaaaaatt + 3361 gtaatggatc aactaattta ggagaaatga tgaaagaaca aaacacgata gaaatcgatg + 3421 tatttcaatt atttaaaacc ttgtggaaac gcaagctaat gattttatta gtggcacttg + 3481 tgacaggtgc gggggctttt gcatatagcg cttttattgt taagccagaa tatacgagta + 3541 ccacgcgaat ttacgtagtg aatcgcgatc aaggagacaa gtcggggctg acaaatcagg + 3601 atttgcaggc aggatcttat ctggtaaaag actaccgtga gattatcctt tcgcagaatg + 3661 tattggaaaa agtagcgaca aatttgaagt tggatatacc agccaaaacg ttagctagaa + 3721 aagttcaagt gactgtacca gttgacactc gtatcgtctc aatctctgtc aaggataaac + 3781 agccagagga agccagtcgt atcgctaatt ctctacgaga agttgctgca gaaaagatca + 3841 tcgctgtaac gcgagtatct gatgtaacga cacttgaaga agcgcgacca gctacgactc + 3901 cctcttctcc aaatgttgga cgcaattcct tgtttggttt ttttggagga gcagtcgtaa + 3961 cagtaattgc tgttcttttg attgagttgt tcgacatccg tgtgaaacgt cctgaagatg + 4021 tcgaagatgt actgcaaatt ccacttttag gggtcgttcc agatttggac aaaatgaaat + 4081 aggaggaagt tatgccaaca ttagaaatct cacaggcaaa attggatttt gtaaaaaagg + 4141 cagaggaaaa ttataacgct ttgtgcacga acctacagtt aagtggagat gatttgaaag + 4201 tattttctat cacttctgtg aaacaaggag aaggaaaatc 
aacgacttcc accaatattg + 4261 cttgggcttt tgcgcgtgca ggttacaaaa cgctgctgat tgatggagat attcgcaatt + 4321 ctgttatgtt aggtgtcttt aaagcaagag ataagattac aggcctgaca gaatttttat + 4381 caggaactac agacctatca caagggcttt gtgataccaa tatcgaaaat ctctttgtaa + 4441 ttcaggctgg ctctgtgtca ccgaatccga cagctcttct tcaaagtaag aatttcagta + 4501 caatgcttga aaccttgcgt aaatattttg actatatcat tgtagatact gctcctgtcg + 4561 gtgtcgtgat tgatgcggct attattacgc aaaaatgcga tgcttctatt ttagtgacga + 4621 aggcaggtga aataaatcga cgggatattc aaaaagcaaa agaacagttg gaacacacag + 4681 ggaagccgtt tttgggagtt gtgttgaata aattcgatac ttcagtagac aaatacggtt + 4741 cttatggaaa ttacggaaaa aaataagtcg ttaagtattt gtgtaaggac atttttagaa + 4801 ctacaatcaa aatctttgga attgctggct tcaaatcata ttgatttgaa atgaaacttg + 4861 caaaagagtt tttaaggtga gtttcttaat ttgtgactga aatcaatctt ctacttccat + 4921 accttggaaa aatagggtaa acgagaaatg ttttttccat aataaagttt tgatatggct + 4981 agtagagtag taatataatg aattgtaatc attagtgttc ataccaagaa atatcaagta + 5041 cctatttttg gaaattataa atgttagata gtgtttaaat ttttacggag agattgtttt + 5101 gagaggtaat ttatgtatag ggaaataaaa cgattaggtg atattttact ttctttcata + 5161 ggaataatag tactgtttcc agtgtttatt ataattgcaa tcgcaataaa gcttgattca + 5221 aaaggtccag taatatttaa gcaaaagcga tttggacttc ataagaaatc gttctatgtc + 5281 ttgaagtttc gaactatgaa ggttgaatcg ccaaaatatg tggcgactcg agacttagat + 5341 aaaccagaac agtggattac caaagtagga gcttgtttgc ggaaaacatc tttagatgaa + 5401 ctgcctcaac tgtggaacat tcttgttggt gatatgagtg ttgtaggacc taggcctgta + 5461 gctataaatg aacttgattt gataaaagaa agagaacagt atggtgccaa tgatatctta + 5521 ccaggattaa ctggatgggc acaaattaat ggacgtgata atttgtcaac agagatgaag + 5581 gcagagatag atggttatta tgtaaaacat atgtcgttaa gaatggatct tagatgtatc + 5641 cttagaacaa tcccctacgt attaaaacgt aagggaattg tggagggtag tggtaagaaa + 5701 gagttggatt gatgcaatga aaattctatt tgtttgtcaa cattataagc cagaaccttt + 5761 tagattgtca gatatttgtg aggatctagt tcaaagaggg cacgaggtgg ctgttttgac + 5821 agggattcct aactatcccg agggggaaat atatgctgat tatcgtaaga gaaaaaaaag + 5881 
aagagagact ataaatggtg ttgctatttt tcgttcatac accattgcta ggaggcaaaa + 5941 tactttatac cgtatattga attattttag ttttgctctt tcttctacga taggtgttat + 6001 atttgggcgt tataaagcga aagatggctc agattttgat tgtgtctttg ttaatcaact + 6061 atctccagtt atgatggctt gggctggtat agcttataag aacaagtaca ataaacctat + 6121 gtttttgtat tgcatggatg tttggccgga tagtttaatt gtaggtgggg tgaaggaaaa + 6181 tggattgatt tacaagatat ttgaatttgt ttcaaaaaaa gtatatcaag ccagcgatta + 6241 tatatttgtt actagtctat cttttaaaga ttattttgta aaaaaattta atattcctct + 6301 ccacaaaatt acttacttac cacaatatgc agaggattta tttgtaccaa atgaattaaa + 6361 aacgaacaaa aatactattg acttaacttt tgctggaaat attggaaaag ctcagaattt + 6421 agagactatt ttgaaagcag ccagtgcaat agaacagatt cccgatttag caaagagagt + 6481 tcattttcat tttgttggag atggtacgga actattaaac atgcaaaaat tagcatgtga + 6541 actagaatta gagaacactt cattttatgg tagacgtcca ttagaagaga tgccggattt + 6601 ttatacaaaa tcagatgcga tgctagtttc tttaataggc gactctataa tttctcgcac + 6661 cttaccaggt aaggtacaat cttatatggc ggcaggaaaa ccaattatag gagcgatttc + 6721 aggagatact cagagagttg taaaagaagc aaaatgtggc ttcataagtc cggaagggaa + 6781 tgttgatcag ttagtgagaa atattcgtaa gttctgtttg ctttctgtag aggaaagaga + 6841 gaaactagga aggcaagctc gttgttatta tgaagaacag ttttcgaaag agtggtttat + 6901 gacatactta gaaaatcatt taaaagaggg gtttctatca tgaaggtttt aatgattaat + 6961 tccgtttgtg gtattaggag cactgggaga atttgtacgg atctcgcaac tgctttgaca + 7021 gaagaaggat atgaggttaa aatcgcctat ggtcgtgagt atgttccgaa acaatttcaa + 7081 cagtatgcag tgaaaattgg tacaaagtct gatattcgtt ttcatgcgat tcgttctcga + 7141 ttatttgacg aatctggctt tggaagtaga caggcaactg ttaattttat taaatggatg + 7201 aaagagtttg atcctgatat tattcatctc cataaccttc atgggtatta tatcaatgtt + 7261 gaactgttat ttgattatct ccgaatatgc ggtaaaaaga ttatatggac tttgcatgat + 7321 tgttgggcat ttacaggaca ctcggcttat tttgattgtt tggaatgtga gtcaaaggga + 7381 gtttgtgacc atccatctca gaaaaatgat tatcccaagt cgttcgtgaa tttttcaaag + 7441 cgaaattatc aaagaaagaa aaaatgtttt actcatattc ctaatctcac tattgttact + 7501 ccgtctcaat ggctagctaa 
tttagtaaga cagtcatttt taaaagaata tccagtgaaa + 7561 gtaattcata atggtattga tactactgtc tttcaaccga ggctaatagc cgctcaaaaa + 7621 ttgagaaaaa gacaccatct tgaaggaaag caggtactgc ttggtgtggc tgctatctgg + 7681 gataatagaa agggattttc tgatatgtta gcgctcgcga atgatctaac tgataatcag + 7741 agaatagttt tgatagggtt aaaagatagg caactcaaag aactacccaa agggatcatt + 7801 gggttaacag aaactaatag cccagaagag ttggtagcat ggtatacact agcggatgta + 7861 tttctaaatc ctacttatca agataattac ccgacaacta atttagaagc tatttcttgt + 7921 gggacaccag ttatcagcta tccgacaggt ggtagtgtag aaagtgctaa actttatggt + 7981 ctcgtttgtc aggatagaaa cgtagcttct attttatctt cgttagaaaa agtctctcag + 8041 ctatctaaaa cagaaaaatt ggatttttca attgcaagtt ttattaaaca aatgaaatat + 8101 ttatattaga acttgaatta taggaaaatg aggaatttgc attaaaatga tgaaaagaat + 8161 ttattatcac cttttggcta tttgggcttg gactcttcca aattcttatg cttttattga + 8221 ttcgttaaag gtgttttttc cgaatattag cttacaaatt gcaggttctc ttttggctgt + 8281 tgtctcaata ggaattttta tcactagaat atattataca agatatgaag tttttatatc + 8341 tctattggtt tgtatttcta ttttaatttt ttattcaact cgcttttttt attcgactaa + 8401 cgtagagttg tatcagtctt tcttcaattc ctttctgatt cgtccagttc ctgcgatatt + 8461 agtagcgatg ctgttagcta agaataatca tataaaaggt ttcataaaat ggtcagaacc + 8521 tatgatgctt ttctatacat tgacatcatt tttagcagcc ctatctccta gaaacagcat + 8581 tattacttac caatctttat cttattatgc catgacagct tatatgatta atgtgtttaa + 8641 tattatatac aaagagaaaa tattggagga gcaactgacg tatttcagat tctcagcgtg + 8701 gaattttatt agatattttt tacttttgat tcaagctttt aatgcactct caggaggtgg + 8761 gagaggtgcc tttattttat taattatttt tacaggaata ttattaataa gaactgctat + 8821 gaaatttaag ttccttttct catttattgg aggcctgtct gctatagctc tagttgtttt + 8881 ttttacaaaa ggtttggatt tgacatggct cttgaatatg gacggtggag agcgattgtt + 8941 gaacttcttc ggcagacctg aacatatatc tacagataat agactattga tttatgatac + 9001 tgtttggtct gcaatacagg aaaaaccctt tttaggatgg ggagttggtt caactttttt + 9061 aaaatttaat ggatattcac ataatattgt attggattta ttgcatgata tgggaagttt + 9121 tggtttatta attattcttt cggctttctt tgcttcttca 
gtaatattgt acaaattacg + 9181 taaaatagat tggaaagtga atttatttat tctgatgttt ctagaagtat atgttcacat + 9241 gagtttcagt ggaagctatc ttgcagatgg tagactatgg tttttggtga tctttactta + 9301 ttgttactac aggtggaaag tgcaggaaaa ggatgaagtt agcaatttta ttatctgata + 9361 tttcaaaaat aggaggagtg cagcgtgtca cgacagctct tgttaatgaa ctttgtcaaa + 9421 atatagacgt tacaattatc agcatctttt cggaaaatga gctaccagct tttggacttt + 9481 cagatagagt tcaggtgagc tatcttttga aagaacatgt taatttgaag aagaattttt + 9541 ttaaagttag tggagctttg cgaaaagtgt tgaaaaaaca gcagtttgat gttgttctat + 9601 cgtcaggaac tggtctagta tcctttcttt ggtttgctag tttgggaatt cctaccagac + 9661 ttttggcatg ggaacatcag tgtttttact ttgggagatc gtttggtcta gagtggttgg + 9721 ggcgaaagct agcctgtcgt tttgctgaga gtattgttgt cttgactaaa aaagatgaag + 9781 gattttacaa agagaatcgt cctaaggctc atattgaaca aatctataat atcctagaca + 9841 tggattcaca aacagctaag tgtcagctct cttctaaaaa aattatcagt gttggatctt + 9901 tagtacgaca aaaaggtttt gatctggctc ttgaggtagc tagtcaaata caattaagtt + 9961 atccagattg gcagtgggac atttatggtg atggccccga tagagaaaaa ttagaggaga + 10021 aagtcaggga ataccaatta gaaggcttta taaatttgaa agggcttgtt cagaatgttc + 10081 gggagctcta tcctgactac tctatctacg ccttgacatc acgatatgaa ggattatcaa + 10141 tggtattatt agaagctaaa aactgccaga tgcctgctat ttcatttgat tgtaactgtg + 10201 gaccctctga tattatttca gatggaagaa atggtttttt gattgattgt tttgatgtaa + 10261 atatctatgc aaaaacttta tctaaattaa tgactagttt agagttgcga gaacaagttg + 10321 caaaatcgag tgttattcca gcagaagaat tgtcaacaac ttatatccta gataagtgga + 10381 acaatctatt aaagatagaa agaagataat atgaaaatag tccatgtaga agattttttt + 10441 catccagatg caggttacca gattaatgtt ttaccaaaat atctagcaaa gtttggtcat + 10501 gaacaagtga ttatcacttc agaaatggat aaaatccccg ataatcttac ccaatttttt + 10561 ggacgagaaa atatagaaga gagagataga agttacgaag agaagcatca tgtgaagatt + 10621 attcgcttgc ctcttcatgg atttgtaagc ggacgtgcga ttttttctgg aaagcttatt + 10681 tcggctatta agggtctttc tccagaggta ttgtatattc atgggaatga cactttaaca + 10741 gggattcgtc tccttttagc tcgaaagaaa cttaattgca gaatcgtcac 
cgatagtcat + 10801 atgcttgaaa tggcatcaag aaatcctttc aacaactact ttaggagatt ttataaaacc + 10861 ttgattactc ccattttgat aaaagaacag ataccaatta ttcggacgca agatgataat + 10921 tatgttgaaa aacacttggg aattccttta tcgcaagctc catggatttc ttatgggtcg + 10981 gatacagcgt tctttcacgc agatagccag attaaggaag attttcgttc tcagtatcaa + 11041 atcgcttcag atgctcttat ttgtgtttac gcaggaaagt tagatgagca taagggtggg + 11101 atgtttttag cagagtctct aagtaaaaag ttaaatacgg agcaaccaat tgttttcatt + 11161 atagtgggta atacaaatgg agagtatgga gaagctgtcg agaaaagttt ctcccaatct + 11221 gaaaaccaaa ttttgcgctt tccgactcaa aaatatcaaa aattagcaca gttttttcag + 11281 gtagcagatt ttgctttatt tcctaaacaa tgtagtttaa gtttttatga tgcacaggcc + 11341 tgtggtttac cagttttatt ggaagataat aatatcaacc tcgatagaac ttctcattat + 11401 aatggttgga cgttcaaggc taacagcaaa ttaagtttga gagattcatt aaaaatgatt + 11461 gcgagtctag ataaagagaa gagacaagag tactctcaga atgcactgca ctatatcctt + 11521 gaacattata attatgaaga taaagcaaga gaatatgaaa agattcttat aggggaacgt + 11581 acgaaatgag atagttaata tttcgttatt ttataggaaa ggtggattta atgaaaattt + 11641 gcattgtttc agtcggagtg ggcggactac cgattccagc tgtaaaaggg ggagcagtag + 11701 aaaatctcat tgataattat ttaagttaca atgagaaata taatcatgat gaaattacgg + 11761 tcgttagttg tgaccataag gaggcgcgtg aggcttcaaa aaaatacaag tatgcccaat + 11821 ttgtctatat agatattcat tcacttaaat ataaaataaa caaaacaata cgttatgcca + 11881 ttaataaata ttcacctttc ttcgtaggga acgcttatat cagtcaattg ccagacttgt + 11941 ctggttttga tacagttttg attgaaaatc gccctgaata cggttattat attcgtaaaa + 12001 agtttaaagg aaatcttgtt ttacatcttc acaatgattt attaatggac aatgagtatt + 12061 ctgtagatta tagcgtttat gataaaatta tcacaatatc tgactatatt agggataggt + 12121 cagaagtagt aacgtcaggt gttccgatac agactgtcta taatggtatt gacacagaac + 12181 tttttttgca gaatttctct gaaattgatt tatcagatct taaaaatcag ttggaaattt + 12241 tgtcggatga ttttgtgatt gttttttttg gacgtatcaa caaaaataaa ggtatcaaag + 12301 aactgcttga agccttcttg ttgctaccaa agaatttgaa tataaaatta ctagctgttg + 12361 gtagttctat atttggtcag acggagttgg atactttcac aacagagcta 
cggcaattgg + 12421 caaaacaagc atcagataaa gttgttttta caggctatgt taattacaaa gacattccta + 12481 agtatcatca tattgcagat tgcattgttg ttccatctat ttgggaggaa ccagcgggtt + 12541 tgacggtctg tgaagctttg atatcaggga aatatgttat tacaacagat gctggaggga + 12601 taccagagat tgtagctggc agtgaagccc ttgtggtagc aaatgatgag tgtatagttg + 12661 aacacctcaa aacagcccta ttgagtgtct accaaaaagg gaaatgctct tcggttatta + 12721 cttctaatag agatagagga gcctattttt ctattgaaaa atatggaaga gacttacgga + 12781 aagagctcac acaaaatgaa agaatcatta acatatgagt cgtgtaaaaa atagtttttt + 12841 taatatttta gctggaatag ttggtactat catatcgagt gttttagctt tcatagttag + 12901 aacagtgttt atccgagttt tgggagagac ttatctaggt ttcaatggtc tatacaccaa + 12961 tatcttaaca gttttatccc tagctgaatt agggatcgga tcatcaattg cttatttgat + 13021 gtacaaacct ttagcagaaa aagatgggga caaattagct caagtagttc aattctataa + 13081 aaaaatatat cgagtaattg gtatcattat tcttatttta ggtttgtgtc tcgttccttt + 13141 tttaccagtc attgtaaatt taaaaaatgc agaagatttg aactatacag cattgtattt + 13201 gctttattta gcagatacag tttctactta tctattcttt gcatataaaa gaggggtatt + 13261 ggttgctgat caaaaggtct atgttgcgaa tatctttgat ataattataa cgacaatttt + 13321 atctattttc caaattatca ctttgatgat ttggaaagat ttttatctat atattatttt + 13381 aaaaattgct aaaaatctta ctttgaacct agtaattagt ttaaaagtag ataaaatgta + 13441 tccaagtatt cataaattta aagagatagc tccacttcca aaaatggaaa gacgactagt + 13501 ttggaaaaat gtatatgcta cctctgttcg acaaatcttt aacgaattaa tgaattcaac + 13561 agatagtata gttatttcca ttgttttagg aatagttatg gttggtaagt attcgaacta + 13621 tgcttatatt ttatcaatcg tatatatttt ctttggagga atttttaatc cgattcaggc + 13681 ttctattgga aacctatctc tgttagcttc tatagagaaa aaaaatgaaa tcttcaatag + 13741 attacgtttt ataaattttt tctttttatc attttgctca agttgtcttc tagtattggt + 13801 aaatcctttt atcactattt ggattggaga aaattacact ttatcattta caggtgtgat + 13861 tgcaatagtt ggtatgttat tcgttagaca aactggaaat tgtacaacca tttttcgttt + 13921 gggagaagga tattttagag attatcattt ttctccttta atcgcgggca ttttaaattt + 13981 agttgtttca gtaattttag tgaattatat aggtattgca ggtgtttttg 
ttggaacaat + 14041 gttaggattt ggtttccaat ttatactggt ggatacaatt gttacttata aaaaagtact + 14101 tagtcgtcca ctatcagagt tttatttaag atggttgcag acgatcttat taactgtagg + 14161 tttatgtatt gcgagttact atttatctcg attggttaga gtgaatagta tatatgattt + 14221 gatactgttg tttgtagtgg ttattggatt taattttttt gctttatgtt ttatttattg + 14281 gcgaaatgat gattttcaat attttattca attggttaaa aattttatga aaaatttgga + 14341 ggaaaaaaat catgattaat gtaatcggat taggttatat tggattgcca acaattttaa + 14401 tgttggcaac aaacggcgtg aaagtagttg gaactgacta caatcaggat ttggtgagaa + 14461 ctttaaatga aggtcaaaca acctttaaag aagatggatt ggatgaacta ttccataaag + 14521 cagtggagtc gggtgtggac tttacaaccg aatatcaaca aacggatacc tatattattt + 14581 ccgttccaac accatatgac tccttctcta aaaaaattga tccaagctat gtgattgaag + 14641 ctacgaaaac ggtacttgat aattgcaata aaggagcggt tattattatt gaatcgaccg + 14701 tatcaccagg aacggttgat aaatttattc gacctgttgt agaagaaaaa ggttttgtta + 14761 ttggtagtga tattcatctt gtccatgctc cagaacgtat tattccaggg aatatggtct + 14821 atgaattggt gaataataac cgtacaattg gagctgatga cctagaaatc ggctataaag + 14881 tgaaagagct ttatgcttca ttttgtaagg gcgatattgt tgttacagat attagaactg + 14941 cggagatgac caaggtagta gaaaatacat ttagagctgt aaatattgct ttcgctaacg + 15001 aattagcaca gatctgtagt tatgataata tgaatgttta tgaaattatc cggatctgta + 15061 atatgcaccc acgggtaaat attctacaac ctggacctgg tgttggtggg cattgtattt + 15121 ctgtggatcc ttggttctta gttggagatt atcctgagtt gacaaatgtt attgaacatt + 15181 ctatgcgaac aaatgctgcc atgccagaat ttgtattaaa tcgtatctat accattatga + 15241 acgaacatca tctaacagat attagtcggg ttggtctata tggtcttacc tacaaagaga + 15301 atgtagatga tatgcgtgaa tctccaacgc ttcagttatt agaatctatg agccgccatc + 15361 tggcaacacc tgctattaaa gtatatgatc catttataga aaaagatgtt gtggcgaatc + 15421 agtcacatga tttagatgaa tttttatcta atgttgatat tgttgtactg ttggttggtc + 15481 atgatgagat tttacaaaat atggataaac taaaagataa gatagtgtta gatacacgtt + 15541 atatctgtca tcttgatgga acttacagat tataattagt gataaataaa gtaaggattg + 15601 actatgaaaa aaatagttgt aattttcgga actcgtcccg aagctatcaa 
gatgtgtccc + 15661 ttggttaaag agctaagaac acgtgagaat cttgaaacat tggtctgtgt tacgggtcaa + 15721 catcgtcaaa tgctggatca agttttggat acttttagga ttacgcctga ttttgattta + 15781 tctattatga aggacaaaca aactctcttt gatgtcacaa ttggcatttt ggaaggcatg + 15841 aagactgtct tagagtcagt taatcctgat ttaatattag ttcatgggga tacgagtaca + 15901 acatttgcca gttcactggc cgccttttat ctacagattc caattggaca tgtagaggct + 15961 ggtttgcgta cttatgatat ttattcacct tatcctgaag aatttaatcg tcaagcagta + 16021 ggtgctttgg ctcagtatca ttttacacca acacaactct caaaagacaa tctcttgaga + 16081 gaaggaaaaa attctgaagc tatatttatc acaggtaaca cagcaattga tgctttacaa + 16141 actacaattc aagaggatta tactcatcct gagttaaatt gggttgggga tagcaaacta + 16201 atattaatta ctgctcatcg tcgtgaaaat attggtgacc cgatgaggca catgtttaga + 16261 gcaatccgac gtatcattga agaacattcg gatataaagg ctctttaccc cattcatatg + 16321 aatcctctag ttcgtcagat tgctgaggaa gaactaagcg gatgtgaacg tatcaaaatg + 16381 atcgatccgt tggaagtatt agattttcat aactttttat cacggagtta tctcatttta + 16441 acagatagtg gtggtatcca agaagaggca cctagtttag gaaaacctgt tttagttatg + 16501 agagatacaa ctgaacgtcc ggagggaatt aaagcaggaa ctttgaagct tgtaggtact + 16561 gatgaggaca atatttatag acattttaaa gaattgttag aaaatgattt agtttatcaa + 16621 gcgatgagcc aagcttcaaa tccgtatgga gatggaacag cttgcaagaa aattgcagac + 16681 atactagaag gagaagtata atatatgtca caatttacag gaaaaactct cctaattaca + 16741 ggaggaacag gttcatttgg taatgctgtc cttaatcgtt ttttacagac tgatattggt + 16801 gaaattcgta ttttttcccg tgatgaaaaa aaacaggatg atatgcgtca tgagtttcag + 16861 gtaaaagtac cagaagtagc tgggaaaatc cgtttttacc ttggagatgt gcgtgactta + 16921 gcttcggtaa aaaatgctat gcatggtgtg gattatgttt ttcatgctgc tgctcttaaa + 16981 caagtacctt cgtgtgaatt tttccctgta gaagcggtaa aaactaacat tttgggaacg + 17041 gagaatgtcc tcactgcggc tatcgaagct ggtgtaaagc aagttatctg tctttctaca + 17101 gataaggcgg cttatcctgt caatgctatg ggaacatcca aggctatgat ggaaaagatt + 17161 gctgttgcta agtccaggac ggtaaatcct gagcatacaa agatatgtgt gactcgctat + 17221 gggaatgttc tgtgtagccg tggatctgtc gttcctcttt ggattgagca 
aattaagcaa + 17281 ggaaatgctc ttacaattac tgaacctagc atgacacgtt ttgtgatgac attagaagaa + 17341 gcagtagact tggttttatt tgcatttgaa gaagggaaat ctggagatat actagttcag + 17401 aaagcaccag catgtacgat tgaagtgttg gctaaggctg tatcagaaat ttttgcctca + 17461 gaacaagata ttaagattat aggtattaga cacggagaaa aaaagtatga aacactatta + 17521 actaatgaag agtgcgcaaa tgcaattgat ttgggtgatt tttatagagt tcctagtgat + 17581 aatcgtaatc ttaactatga taagtatttc aaagatggta gtacgaatag aaatttgttg + 17641 acagaattca atagtaataa taccgatttg atggatgtag agcaagttaa aagaaagttg + 17701 ctagaattag atgaaataca gacagcaatt cgtgatatgg tagcagatga agagatgtaa + 17761 aatcttttaa gatacattaa aattatcaag gatatataat gtatcatgta ttgtcgagag + 17821 agttgactat taaaacagca tataaaacaa ggagggggca tgattaaaaa tattttaatc + 17881 acaggagcga aaggatttgt aggaaaaaat cttatctgta ctctggaagc tttgaaagat + 17941 ggacgagata ggactcgtcc taatttagag attggagaga tttttcagta tgatcgtgat + 18001 acagatccga ttttattaga tgaatattgt aagaaggccg atttcgtatt ccatttagct + 18061 ggtgtcaatc gtccacagaa tcctgatgaa ttcatggagg gaaattacgg tttttcaagt + 18121 agattattgg agattttaga aaagtatgaa aacacttgtc ctgttctact ctcaagttct + 18181 actcaagcta gtttagaagg ccgattttca aactctatat atggacaatc taagctagca + 18241 ggggaagaac tcttctttga atatggaaag aaaacgggag cacctgtctt agtttaccgt + 18301 ttcccgaatc tttatgggaa gtggtgccgt cctaactaca attctgctgt agcaactttc + 18361 tgtcataatc tagctcacga tttacctatt caagtaaatg atccaagtgt agaattggag + 18421 ttgctgtata ttgatgattt gatacaagag tgtctaactg cattggaagg aaatcctcat + 18481 cgttgtaatc tagatggatt acaaatctta cctagcccat caggaaacta ctgctacgta + 18541 ccaacgactc atcgtgcaac cttaggagag attgtctctc tattagaaac atttaaaaaa + 18601 cagcctaata gtttagttat gcctgaaatt cctcaaggat cgtttaaaaa gaaattgtat + 18661 tctacctacc tatcttattt accagtagat aagtttaggt ttcctctaaa aatgaatata + 18721 gatgaacgag gtagttttac ggaattatta aaaacagaaa atacgggtca attttctgtt + 18781 aatatttcta aacctggcat taccaaaggg caacattggc atcattctaa gtgggaattt + 18841 ttcatggttg tttctggtcg tgctttaata caagagcgta ggatagggct 
ggatgaaaac + 18901 ggtcaagagt atcctattct gaactttgaa gtgtcgggcg ataagattga agcaatacat + 18961 atgataccgg gctatgcaca taatattatt aatctttctg atacagaaaa tctaattact + 19021 gtcatgtggg ctaatgagtc atttgatcct agacatccag atactttttt tgaacaagtg + 19081 gagaaataaa tgaaaattaa gacagattat agtgatattc attttaaaga taatggcaaa + 19141 cttaagttat tgattattgt gggaacacgt ccagagatta tacgtctaag tagtgttatc + 19201 actaaatgtc gaaagtattt tgatgttatt ttggcacata ctggacaaaa ctatgattac + 19261 aatttaaatg gtattttctt tgataattta gggttagaca ctccggacgt atacatggat + 19321 gctgttggag atgatcttgg tgctactgta gggaatatta ttaatacttc atacaaattg + 19381 atgaatcaaa ttaaaccaga tgctttattg attttagggg atacaaattc ttgtttatca + 19441 gctattgctg ccaagcgttt acatattcca atttttcata tggaggctgg caatcgctgt + 19501 aaagatgagt gcctgccgga agagactaat cgtcggattg ttgatattat ttcagatgtt + 19561 aacttagcat actctgaaca tgcacgtaag tatttacatg agtgtggttt acctaaagag + 19621 cgcacatatg taactggttc tcctatggca gaagtgttac ataaaaattt atctgccatt + 19681 gagtcttcag atatccatga acgtttggga ttgaaaaaag gaggttatat cttactttca + 19741 gctcaccgtg aggaaaatat tgatacagat aaaaatttta tttctctctt tacagcaatt + 19801 aatcaattag ctgaaaagta taatatgcca atcttatatt cttgccatcc tagatcaaag + 19861 aaaaggctac aagagagcgg ttttaaacta gataaacgtg tgattcagca tgagccacta + 19921 ggattccatg actataattg tttacagatg aatgcatttg ttgtagtatc tgattcggga + 19981 actttaccgg aagaaagtag tttctttact agtcaaggtt atccttttcc cgctgtatgt + 20041 attcgtacaa gtacagaacg tcctgagtcc ttagataagg caggatttat tttggcaggc + 20101 attgatgaaa attctcttct tcaagcagtt gaaactgctg ttagcttggc agaagatgag + 20161 gattttggat taccggttcc agattatgtt gaggaaaatg tctctactaa agttgttaag + 20221 ataatacaga gctatacagg gatagtggat aaaatagttt ggaggaaaag ctgaattgta + 20281 tatttttaat aaatcaaaac gagatgatta attcttagta gaacaagagt aaaattgaac + 20341 gtatttgatg gaaatgtctt acttgatagt cgagggatag ccattctatc ggatttttgg + 20401 cttgtttttg cgcttcatgt ttgatagaat aaagggctct ttgtcaactg tagtgggttg + 20461 aagaaaagct aagcttgaga aaggacaaat ttcgtccttt cttttttgat 
gttcagagcg + 20521 ataaaaatcc gttttttgaa gttttcaaag tttcgaaagt aaccgcccaa taacgaagta + 20581 tattgaaaaa tctccagact agagaactca cggatagttc ctaatctgga gatttcttat + 20641 ttgcactttt cttgtacaac tttagtccat ggtaaataag cctctaaaac ctctttgttt + 20701 acgagagttt cctcgtttgg aagacattct agaagatagg atagatattt ctcactattt + 20761 agttgatgac gtttagctgt ttccaacaag ctcataataa tagctcttgc tttagctcct + 20821 tcaaaacttt gagaaaataa ccaccctcgc ttttttaaac tgagctcagg ctaaaagagt + 20881 ccactggact cttttactcc gtcccataac caatgattta atggcgcgtt cagctagatt + 20941 attggaaagg accagatgtc cgtctttcaa aatagtctta aaggtttctt catacttgag + 21001 gctgtattca attgcccttc ctagttttga acctgctaaa actgactgac gccggcacca + 21061 agcaaagaag tcttccatta ggggctggag atgttcttga cgtttctgta gtcgttcatc + 21121 agctggcaaa gcctcccagt ctctttccaa ggaaaataac tgatcacaat aagctaaacc + 21181 tttagctcct aaggatgatt tatctgcttg cttgggggtc gcttcaaaaa atttccttct + 21241 cacatgcgcc caacatccaa caagttcagc ttcttccagt tgacgataag cttctagcgg + 21301 ttcgcagttt accaagctta gcgtcgcctt gctcctaaac cttggactgc tatcgcatag + 21361 gcagaactag aggactaaag tcctaagtta ctgccgcaac atatcacaat gaacatagcc + 21421 agaataatct cctaggaatt cttgtactac cgaaccactc cgactctgat catgatggta + 21481 cagcgtgatt gcttgattct caactttccc agacaaaaag gtccaatagt aggtcagatg + 21541 gctatgactc tctagaaccc gataagaagt ttcatccgca tgaagtaagg gctgagtcaa + 21601 tagtctctct cgcaagaggt tataaagggg ctttaggaat aggagctttc acaagcttat + 21661 ccagatgatt atcttttatt cgttatggac aatgctatat ggcataaatc aagtacctta + 21721 aagattccga ctaatattgg ctttgcattt attcctccat acacaccaga gatgaacccc + 21781 attgaacaag tgtggaaaga gattcgtaaa cgtggattta aaaataaagc ctttcaaact + 21841 ttggaagatg tcatgaatca actttaagat atcatacaag gactggagaa ggaggtgata + 21901 aagcccatcg ttaatcggag atggactaga atgctttttg aaagcagatg agtataaaaa + 21961 gaaagtcctc atttcaatag aaatcacgac tttctgatgg atttattttt ggagtgatag + 22021 aaaagccctt cataagccag tctacttgtt caggtgtgag agctttgaca tccttttctg + 22081 tactgggcca agtcagtctg ccgttctcaa agcgtttata tagtagccaa 
aatccttgac + 22141 catcccagta aagggcttta aagcggtctt tacgtccacc acaaaagaga aagacttgac + 22201 cggagaaagg atccaattca aagtgggttt taaccagata agtcagtgaa tcaatgcctt + 22261 gcctcatatc cgttttccca catacgagat agacctgccc taggctagat agatgaattg + 22321 tcatagagca acaccttatc caaaagctgt tctatcattt cgagattgag agattgaaaa + 22381 aaacttactt caagcttgcc aatacgaatt ttaagcagaa tatcatttct ctttttagaa + 22441 tcaaaaggac gagattgtgg aatctctaca ggaacaatag gttgtggcat taaaatatcc + 22501 tccaatagtt ttactttact aatagtatac aggaggagct ccatgaatga tagatacctt + 22561 gttatgacgc gcttactaaa caactaactg atgcacgatt taagcgcctt gttggtgttc + 22621 agcgcacgac ttttgaagag atgttagctg tattaaaaac agcttatcaa cttaaacacg + 22681 caaaaggtgg acgaaaacct aaattaagcc tagaagacct tcttatggcc actcttcaat + 22741 atgtgcgaga atatcgaact tatgaagaaa ttgcggctga ttttggtatc cacgaaagca + 22801 acttaatccg tcggagccaa tgggttgaag taactcttgt tcaaaggtgg tgttacgatt + 22861 tcaagaactc ctctcagttc tgaggacacg gtaatgattg atgcgacgga agtaaaaatc + 22921 aatcgcccta aaaaaacaat tagcgaatta ttctggtaaa aagaaatgcc acgctatgaa + 22981 ggctcaagcg attgtcacaa gtcaagggag aattgtttct ttggatatca ctgtgaacta + 23041 ttgtcgtaat atgaagttgt tcaaaatgag ttgcagaaat atcggacaag ctggaaaaat + 23101 cttggctgac agtggttatc aagggctcat gaagatatat cctcaagcac aaactccacg + 23161 taaatccagc aaactcaatc cgctaacagc taaagataaa gcctataacc atgcgctatc + 23221 taaggataga agcaaggttg agaacatctt tgccaaagta aaaacgttta aaatgttttc + 23281 aacaacctat cgaaatcatc gtaaacgctt cggattacga atgaatttga ttgctggtat + 23341 tatcaatcat gaactaggat tctagttttg caggaagtct attgaaggat cttttgcttt + 23401 agttccttgg tcaaggttga ttattttcac ggagcgcttc cgattgtttt cataaaccat + 23461 ttgcgcatag tcagcagaat aaatcttttt gaaacgtccc tttcctagac attatagaac + 23521 tttcagattc atctgaattt accaaattaa caaaaaaatt ctgaaaattc tgttgacaac + 23581 tttctgaaaa gagtctataa tggagagaaa gttttaaagg agaaaatgat gaaaagttca + 23641 agactacttg cccttgcggg cgtgacatta ttg +// + diff --git a/public/res/serotype_genbank/serotype_12F.gb 
b/public/res/serotype_genbank/serotype_12F.gb new file mode 100644 index 0000000..dd317b3 --- /dev/null +++ b/public/res/serotype_genbank/serotype_12F.gb @@ -0,0 +1,1075 @@ +LOCUS CR931660 23778 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 6312 (serotype 12f). +ACCESSION CR931660 +VERSION CR931660.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 23778) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 23778) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..23778 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="6312" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC12F_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC12F_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI33268.1" + /db_xref="UniProtKB/TrEMBL:Q4JZI8" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVELL" + gene 293..466 + /gene="aliB" + /locus_tag="SPC12F_0002" + /pseudo + CDS 293..466 + /gene="aliB" + /locus_tag="SPC12F_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + /db_xref="PSEUDO:CAI33269.1" + gene complement(479..983) + /gene="tnp" + /locus_tag="SPC12F_0003" + /pseudo + CDS complement(join(479..778,780..983)) + /gene="tnp" + /locus_tag="SPC12F_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase (fragment)" + gene 1195..2649 + /gene="wzg" + /locus_tag="SPC12F_0004" + CDS 1195..2649 + /gene="wzg" + /locus_tag="SPC12F_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33271.1" + /db_xref="GOA:Q4K1W6" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K1W6" + /translation="MLIMSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNI + LAFRYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGL + TNRLNATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNT + DLTVDQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKV + EAPKTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPI + ADGGNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVH + NDQEFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKL + TSTEALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDL + PSYAMPDSNLYVLEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1195..1320 + /gene="wzg" + /locus_tag="SPC12F_0004" + 
/note="Signal peptide predicted for SPC0608 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 42 and 43" + misc_feature 1408..1755 + /gene="wzg" + /locus_tag="SPC12F_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 6.7e-65" + misc_feature 1933..2376 + /gene="wzg" + /locus_tag="SPC12F_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 5.7e-70" + gene 2651..3382 + /gene="wzh" + /locus_tag="SPC12F_0005" + CDS 2651..3382 + /gene="wzh" + /locus_tag="SPC12F_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33272.1" + /db_xref="GOA:Q4JYS1" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4JYS1" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRIIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKSKLFGERYKFMKKRAQYFLEQDLVHVIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 2654..3262 + /gene="wzh" + /locus_tag="SPC12F_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 1.3e-36" + gene 3388..4083 + /gene="wzd" + /locus_tag="SPC12F_0006" + CDS 3388..4083 + /gene="wzd" + /locus_tag="SPC12F_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33273.1" + /db_xref="GOA:Q4K1W4" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K1W4" + /translation="MMKEQNTIEIDVFQLFKTLWKRKLMILLVALVTGAGAFAYSAFI + VKPEYTSTTRIYVVNRDQGDKSGLTNQDLQAGSYLVKDYREIILSQNVLEKVATNLKL + DIPAKTLARKVQVTVPVDTRIVSISVKDKQPEEASRIANSLREVAAEKIIAVTRVSDV + TTLEEARPATTPSSPNVGRNSLFGFFGGAVVTVIAVLLIELFDIRVKRPEDVEDVLQI + PLLGVVPDLDKMK" + misc_feature 3388..3504 + /gene="wzd" + 
/locus_tag="SPC12F_0006" + /note="Signal peptide predicted for SPC0610 by SignalP 2.0 + HMM (Signal peptide probability 0.729) with cleavage site + probability 0.460 between residues 39 and 40" + misc_feature 3409..3825 + /gene="wzd" + /locus_tag="SPC12F_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 1.4e-54" + misc_feature 3931..4008 + /gene="wzd" + /locus_tag="SPC12F_0006" + /note="PS00217 Sugar transport proteins signature 2." + gene 4093..4767 + /gene="wze" + /locus_tag="SPC12F_0007" + CDS 4093..4767 + /gene="wze" + /locus_tag="SPC12F_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33274.1" + /db_xref="GOA:Q4K1Y2" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K1Y2" + /translation="MPTLEISQAKLDFVKKAEENYNALCTNLQLSGDDLKVFSITSVK + QGEGKSTTSTNIAWAFARAGYKTLLIDGDIRNSVMLGVFKARDKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVI + DAAIITQKCDASILVTKAGEINRRDIQKAKEQLEHTGKPFLGVVLNKFDTSVDKYGSY + GNYGKK" + gene 5114..5713 + /gene="wciI" + /locus_tag="SPC12F_0008" + CDS 5114..5713 + /gene="wciI" + /locus_tag="SPC12F_0008" + /note="member of homology group 29" + /codon_start=1 + /transl_table=11 + /product="putative initial sugar transferase" + /protein_id="CAI33275.1" + /db_xref="GOA:Q4K1W2" + /db_xref="InterPro:IPR003362" + /db_xref="UniProtKB/TrEMBL:Q4K1W2" + /translation="MYRVTKRLGDILLSLIGIIVLFPVFIVIAIAINTDSEGPIIFKQ + KRFGIYKEPFYILKFRSMKIGAPKNVAPRNLDNPEQWITKVGAFLRKTSLDELPQLWN + ILIGNMSIVGPRPAGINELDLLTEREKFGANDVLPGLTGWAQINGRDTLSIEMKAEAD + GYYVKHMSLSMDLRCIIRTIPYVLKRKGIVEGSGKKELD" + misc_feature 5114..5206 + /gene="wciI" + /locus_tag="SPC12F_0008" + /note="Signal peptide predicted for SPC0612 by SignalP 2.0 + HMM (Signal peptide probability 0.994) with cleavage site + probability 0.844 between residues 31 and 32" + misc_feature 5129..5683 + /gene="wciI" + 
/locus_tag="SPC12F_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 2.2e-32" + gene 5679..6944 + /gene="wciJ" + /locus_tag="SPC12F_0009" + CDS 5679..6944 + /gene="wciJ" + /locus_tag="SPC12F_0009" + /note="member of homology group 35" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33276.1" + /db_xref="GOA:Q4JYR7" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4JYR7" + /translation="MWRAVVRKSWIDAMKILFVCQHYKPEPFRLSDICEDLVQRGHEV + AVLTGIPNYPEGEIYADYRKRKKRRETINGVAIFRSYTIARRQNTLYRILNYFSFALS + STIGVIFGRYKAKDGSDFDCVFVNQLSPVMMAWAGIAYKNKYNKPMFLYCMDVWPDSL + IVGGVKENGLIYKIFEFVSKKVYQASDYIFVTSLSFKDYFVKKFNIPLHKITYLPQYA + EDLFVPNELKTNKNTIDLTFAGNIGKAQNLETILKAASAIEQIPDLAKRVHFHFVGDG + TELLNMQKLACELELENTSFYGRRPLEEMPDFYTKSDAMLVSLIGDSIISRTLPGKVQ + SYMAAGKPIIGAISGDTQRVVKEAKCGFISPEGNVDQLVRNIRKFCLLSVEEREKLGR + QARCYYEEQFSKEWFMTYLENHLKEGFLS" + misc_feature 6336..6869 + /gene="wciJ" + /locus_tag="SPC12F_0009" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 3.8e-16" + gene 6893..8110 + /gene="wcxB" + /locus_tag="SPC12F_0010" + CDS 6893..8110 + /gene="wcxB" + /locus_tag="SPC12F_0010" + /note="member of homology group 55" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33277.1" + /db_xref="GOA:Q4JYR6" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4JYR6" + /translation="MVYDILRKSFKRGVSIMKVLMINSVCGIRSTGRICADLATALTE + EGYEVKIAYGREYVPKQFQQYAVKIGTKSDIRFHAIRSRLFDESGFGSRQATVNFIKW + MKEFDPDIIHLHNLHGYYINVELLFDYLRICGKKIIWTLHDCWAFTGHSAYFDCLECE + SKGVCDHPSQKNDYPKSFVNFSKRNYQRKKKCFTHIPNLTIVTPSQWLANLVRQSFLK + EYPVKVIHNGIDTTVFQPRLIAAQKLRKRHHLEGKQVLLGVAAIWDNRKGFSDMLALA + NDLTDNQRIVLIGLKDRQLKELPKGIIGLTETNSPEELVAWYTLADVFLNPTYQDNYP + TTNLEAISCGTPVISYPTGGSVESAKLYGLVCQDRNVASILSSLEKVSQLSKTEKLDF + SIASFIKQMKYLY" + misc_feature 7613..8095 + /gene="wcxB" + /locus_tag="SPC12F_0010" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, 
score 4.2e-12" + gene 8148..9359 + /gene="wzy" + /locus_tag="SPC12F_0011" + CDS 8148..9359 + /gene="wzy" + /locus_tag="SPC12F_0011" + /note="member of homology group 71" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33278.1" + /db_xref="InterPro:IPR007016" + /db_xref="UniProtKB/TrEMBL:Q4K1V9" + /translation="MMKRIYYHLLAIWAWTLPNSYAFIDSLKVFFPNISLQIAGSLLA + VVSIGIFITRIYYTRYEVFISLLVCISILIFYSTRFFYSTNVELYQSFFNSFLIRPVP + AILVAMLLAKNNHIKGFIKWSEPMMLFYTLTSFLAALSPRNSIITYQSLSYYAMTAYM + INVFNIIYKEKILEEQLTYFRFSAWNFIRYFLLLIQAFNALSGGGRGAFILLIIFTGI + LLIRTAMKFKFLFSFIGGLSAIALVVFFTKGLDLTWLLNMDGGERLLNFFGRPEHIST + DNRLLIYDTVWSAIQEKPFLGWGVGSTFLKFNGYSHNIVLDLLHDMGSFGLLIILSAF + FASSVILYKLRKIDWKVNLFILMFLEVYVHMSFSGSYLADGRLWFLVIFTYCYYRWKV + QEKDEVSNFII" + misc_feature 8964..9131 + /gene="wzy" + /locus_tag="SPC12F_0011" + /note="HMMPfam hit to PF04932, O-Antigen Polymerase, score + 9.9e-08" + gene 9334..10410 + /gene="wcxD" + /locus_tag="SPC12F_0012" + CDS 9334..10410 + /gene="wcxD" + /locus_tag="SPC12F_0012" + /note="member of homology group 72" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33279.1" + /db_xref="GOA:Q4K1V8" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K1V8" + /translation="MKLAILLSDISKIGGVQRVTTALVNELCQNIDVTIISIFSENEL + PAFGLSDRVQVSYLLKEHVNLKKNFFKVSGALRKVLKKQQFDVVLSSGTGLVSFLWFA + SLGIPTRLLAWEHQCFYFGRSFGLEWLGRKLACRFAESIVVLTKKDEGFYKENRPKAH + IEQIYNILDMDSQTAKCQLSSKKIISVGSLVRQKGFDLALEVASQIQLSYPDWQWDIY + GDGPDREKLEEKVREYQLEGFINLKGLVQNVRELYPDYSIYALTSRYEGLSMVLLEAK + NCQMPAISFDCNCGPSDIISDGRNGFLIDCFDVNIYAKTLSKLMTSLELREQVAKSSV + IPAEELSTTYILDKWNNLLKIERR" + misc_feature 9835..10341 + /gene="wcxD" + /locus_tag="SPC12F_0012" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 1.2e-33" + gene 10412..11590 + /gene="wcxE" + /locus_tag="SPC12F_0013" + CDS 10412..11590 + /gene="wcxE" + /locus_tag="SPC12F_0013" + /note="member of homology group 73" 
+ /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33280.1" + /db_xref="GOA:Q4K1V7" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K1V7" + /translation="MKIVHVEDFFHPDAGYQINVLPKYLAKFGHEQVIITSEMDKIPD + NLTQFFGRENIEERDRSYEEKHHVKIIRLPLHGFVSGRAIFSGKLISAIKGLSPEVLY + IHGNDTLTGIRLLLARKKLNCRIVTDSHMLEKASRNPFNNYFRRFYKTLITPILIKEQ + IPIIRTQDDNYVEKHLGIPLSQAPWISYGSDTAFFHADSQIKEDFRSQYQIASDALIC + VYAGKLDEHKGGMFLAESLSKKLNTEQPIVFIIVGNTNGEYGEAVEKSFSQSENQILR + FPTQKYQKLAQFFQVADFALFPKQCSLSFYDAQACGLPVLLEDNNINLDRTSHYNGWT + FKANSKLSLRDSLKMIASLDKEKRQEYSQNALHYILEHYNYEDKAREYEKILIGERTK + " + misc_feature 11015..11515 + /gene="wcxE" + /locus_tag="SPC12F_0013" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 0.00013" + gene 11623..12819 + /gene="wcxF" + /locus_tag="SPC12F_0014" + CDS 11623..12819 + /gene="wcxF" + /locus_tag="SPC12F_0014" + /note="member of homology group 74" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33281.1" + /db_xref="GOA:Q4K1V6" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K1V6" + /translation="MDLMKICIVSVGVGGLPIPAVKGGAVENLIDNYLSYNEKYNHDE + ITVVSCDHKEAREASKKYKYAQFVYIDIHSLKYKINKTIRYAINKYSPFFVGNAYISQ + LPDLSGFDTVLIENRPEYGYYIRKKFKGNLVLHLHNDLLMDNEYSVDYSVYDKIITIS + DYIRDRSEVVMSGVPIQTVYNGIDTELFLQNFSEIDLSDLKNQLEILSDDFVIVFFGR + INKNKGIKELLEAFLLLPKNLNIKLLAVGSSIFGQTELDTFTTELRQLAKQASDKVVF + TGYVNYKDIPKYHHIADCIVVPSIWEEPAGLTVCEALISGKYVITTDAGGIPEIVAGS + EALVVANDECIVEHLKTALLSVYQKGKCSSVITSNRDRGAYFSIEKYGRDLRKELTQN + ERIINI" + misc_feature 11623..11697 + /gene="wcxF" + /locus_tag="SPC12F_0014" + /note="Signal peptide predicted for SPC0618 by SignalP 2.0 + HMM (Signal peptide probability 0.653) with cleavage site + probability 0.406 between residues 25 and 26" + misc_feature 12211..12738 + /gene="wcxF" + /locus_tag="SPC12F_0014" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 1.3e-28" + gene 12816..14360 + /gene="wzx" + 
/locus_tag="SPC12F_0015" + CDS 12816..14360 + /gene="wzx" + /locus_tag="SPC12F_0015" + /note="member of homology group 56" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33282.1" + /db_xref="GOA:Q4K1V5" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K1V5" + /translation="MSRVKNSFFNILAGIVGTIISSVLAFIVRTVFIRVLGETYLGFN + GLYTNILTVLSLAELGIGSSIAYLMYKPLAEKDGDKLAQVVQFYKKIYRVIGIIILIL + GLCLVPFLPVIVNLKNAEDLNYTALYLLYLADTVSTYLFFAYKRGVLVADQKVYVANI + FDIIITTILSIFQIITLMIFKDFYLYIILKIAKNLTLNLVISLKVDKMYPSIHKFKEI + APLPKMERRLVWKNVYATSVRQIFNELMNSTDSIVISIVLGIVMVGKYSNYAYILSIV + YIFFGGIFNPIQASIGNLSLLASIEKKNEIFNRLRFINFFFLSFCSSCLLVLVNPFIT + IWIGENYTLSFTGVIAIVGMLFVRQTGNCTTIFRLGEGYFRDYHFSPLIAGILNLVVS + VILVNYIGIAGVFVGTMLGFGFQFILVDTIVTYKKVLSRPLSEFYLRWLQTILLTVGL + CIASYYLSRLVRVNSIYDLILLFVVVIGFNFFALCFIYWRNDDFQYFIQLVKNFMKNL + EEKNHD" + misc_feature 12816..12890 + /gene="wzx" + /locus_tag="SPC12F_0015" + /note="Signal peptide predicted for SPC0619 by SignalP 2.0 + HMM (Signal peptide probability 0.820) with cleavage site + probability 0.397 between residues 25 and 26" + gene 14353..15576 + /gene="mnaB" + /locus_tag="SPC12F_0016" + CDS 14353..15576 + /gene="mnaB" + /locus_tag="SPC12F_0016" + /note="member of homology group 75" + /codon_start=1 + /transl_table=11 + /product="UDP-N-acetylmannosamine dehydrogenase MnaB" + /protein_id="CAI33283.1" + /db_xref="GOA:Q4K1X3" + /db_xref="InterPro:IPR001732" + /db_xref="InterPro:IPR008927" + /db_xref="InterPro:IPR014026" + /db_xref="InterPro:IPR014027" + /db_xref="InterPro:IPR014028" + /db_xref="InterPro:IPR016040" + /db_xref="InterPro:IPR017476" + /db_xref="UniProtKB/TrEMBL:Q4K1X3" + /translation="MINVIGLGYIGLPTILMLATNGVKVVGTDYNQDLVRTLNEGQTT + FKEDGLDELFHKAVESGVDFTTEYQQTDTYIISVPTPYDSFSKKIDPSYVIEATKTVL + DNCNKGAVIIIESTVSPGTVDKFIRPVVEEKGFVIGSDIHLVHAPERIIPGNMVYELV + NNNRTIGADDLEIGYKVKELYASFCKGDIVVTDIRTAEMTKVVENTFRAVNIAFANEL + AQICSYDNMNVYEIIRICNMHPRVNILQPGPGVGGHCISVDPWFLVGDYPELTNVIEH + 
SMRTNAAMPEFVLNRIYTIMNEHHLTDISRVGLYGLTYKENVDDMRESPTLQLLESMS + RHLATPAIKVYDPFIEKDVVANQSHDLDEFLSNVDIVVLLVGHDEILQNMDKLKDKIV + LDTRYICHLDGTYRL" + misc_feature 14356..14910 + /gene="mnaB" + /locus_tag="SPC12F_0016" + /note="HMMPfam hit to PF03721, UDP-glucose/GDP-mannose + dehydrogenase, score 1.4e-45" + misc_feature 14932..15192 + /gene="mnaB" + /locus_tag="SPC12F_0016" + /note="HMMPfam hit to PF00984, UDP-glucose/GDP-mannose + dehydrogenase, score 4.5e-33" + misc_feature 15274..15537 + /gene="mnaB" + /locus_tag="SPC12F_0016" + /note="HMMPfam hit to PF03720, UDP-glucose/GDP-mannose + dehydrogenase, score 2.5e-15" + gene 15599..16702 + /gene="mnaA" + /locus_tag="SPC12F_0017" + CDS 15599..16702 + /gene="mnaA" + /locus_tag="SPC12F_0017" + /EC_number="5.1.3.14" + /note="member of homology group 23" + /codon_start=1 + /transl_table=11 + /product="UDP-N-acetylglucosamine-2-epimerase MnaA" + /protein_id="CAI33284.1" + /db_xref="GOA:Q4K1V3" + /db_xref="InterPro:IPR003331" + /db_xref="UniProtKB/TrEMBL:Q4K1V3" + /translation="MTMKKIVVIFGTRPEAIKMCPLVKELRTRENLETLVCVTGQHRQ + MLDQVLDTFRITPDFDLSIMKDKQTLFDVTIGILEGMKTVLESVNPDLILVHGDTSTT + FASSLAAFYLQIPIGHVEAGLRTYDIYSPYPEEFNRQAVGALAQYHFTPTQLSKDNLL + REGKNSEAIFITGNTAIDALQTTIQEDYTHPELNWVGDSKLILITAHRRENIGDPMRH + MFRAIRRIIEEHSDIKALYPIHMNPLVRQIAEEELSGCERIKMIDPLEVLDFHNFLSR + SYLILTDSGGIQEEAPSLGKPVLVMRDTTERPEGIKAGTLKLVGTDEDNIYRHFKELL + ENDLVYQAMSQASNPYGDGTACKKIADILEGEV" + misc_feature 15668..16690 + /gene="mnaA" + /locus_tag="SPC12F_0017" + /note="HMMPfam hit to PF02350, UDP-N-acetylglucosamine + 2-epimerase, score 2.5e-174" + gene 16706..17761 + /gene="fnlA" + /locus_tag="SPC12F_0018" + CDS 16706..17761 + /gene="fnlA" + /locus_tag="SPC12F_0018" + /note="member of homology group 36" + /codon_start=1 + /transl_table=11 + /product="FnlA" + /protein_id="CAI33285.1" + /db_xref="GOA:Q4K1V2" + /db_xref="InterPro:IPR003869" + /db_xref="InterPro:IPR013692" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K1V2" + 
/translation="MSQFTGKTLLITGGTGSFGNAVLNRFLQTDIGEIRIFSRDEKKQ + DDMRHEFQVKVPEVTGKIRFYLGDVRDLASVKNAMHGVDYVFHAAALKQVPSCEFFPV + EAVKTNILGTENVLTAAIEAGVKQVICLSTDKAAYPVNAMGTSKAMMEKIAVAKSRTV + NPEHTKICVTRYGNVLCSRGSVVPLWIEQIKQGNALTITEPSMTRFVMTLEEAVDLVL + FAFEEGKSGDILVQKAPACTIEVLAKAVSEIFASEQDIKIIGIRHGEKRYETLLTNEE + CANAIDLGDFYRVPSDNRNLNYDKYFKDGSTNRNLLTEFNSNNTDLMDVEQVKRKLLE + LDEIQTAIRDMVADEEM" + misc_feature 16727..17581 + /gene="fnlA" + /locus_tag="SPC12F_0018" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.0017" + misc_feature 16730..17578 + /gene="fnlA" + /locus_tag="SPC12F_0018" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 4.6e-162" + misc_feature 16730..17401 + /gene="fnlA" + /locus_tag="SPC12F_0018" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 9.6e-09" + misc_feature 16733..17368 + /gene="fnlA" + /locus_tag="SPC12F_0018" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 8e-09" + misc_feature 17579..17722 + /gene="fnlA" + /locus_tag="SPC12F_0018" + /note="HMMPfam hit to PF08485, Polysaccharide biosynthesis + protein C, score 2e-23" + gene 17861..19090 + /gene="fnlB" + /locus_tag="SPC12F_0019" + CDS 17861..19090 + /gene="fnlB" + /locus_tag="SPC12F_0019" + /note="member of homology group 37" + /codon_start=1 + /transl_table=11 + /product="FnlB" + /protein_id="CAI33286.1" + /db_xref="GOA:Q4K1V1" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K1V1" + /translation="MIKNILITGAKGFVGKNLICTLEALKDGRDRTRPNLEIGEIFQY + DRDTDPILLDEYCKKADFVFHLAGVNRPQNPDEFMEGNYGFSSRLLEILEKYENTCPV + LLSSSTQASLEGRFSNSIYGQSKLAGEELFFEYGKKTGAPVLVYRFPNLYGKWCRPNY + NSAVATFCHNLAHDLPIQVNDPSVELELLYIDDLIQECLTALEGNPHRCNLDGLQILP + SPSGNYCYVPTTHRATLGEIVSLLETFKKQPNSLVMPEIPQGSFKKKLYSTYLSYLPV + DKFRFPLKMNIDERGSFTELLKTENTGQFSVNISKPGITKGQHWHHSKWEFFMVVSGR + 
ALIQERRIGLDENGQEYPILNFEVSGDKIEAIHMIPGYAHNIINLSDTENLITVMWAN + ESFDPRHPDTFFEQVEK" + misc_feature 17873..18496 + /gene="fnlB" + /locus_tag="SPC12F_0019" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 6.9e-09" + gene 19091..20275 + /gene="fnlC" + /locus_tag="SPC12F_0020" + CDS 19091..20275 + /gene="fnlC" + /locus_tag="SPC12F_0020" + /note="member of homology group 38" + /codon_start=1 + /transl_table=11 + /product="UDP-L-fucosamine FnlC" + /protein_id="CAI33287.1" + /db_xref="GOA:Q4K1W9" + /db_xref="InterPro:IPR003331" + /db_xref="UniProtKB/TrEMBL:Q4K1W9" + /translation="MKIKTDYSDIHFKDNGKLKLLIIVGTRPEIIRLSSVITKCRKYF + DVILAHTGQNYDYNLNGIFFDNLGLDTPDVYMDAVGDDLGATVGNIINTSYKLMNQIK + PDALLILGDTNSCLSAIAAKRLHIPIFHMEAGNRCKDECLPEETNRRIVDIISDVNLA + YSEHARKYLHECGLPKERTYVTGSPMAEVLHKNLSAIESSDIHERLGLKKGGYILLSA + HREENIDTDKNFISLFTAINQLAEKYNMPILYSCHPRSKKRLQESGFKLDKRVIQHEP + LGFHDYNCLQMNAFVVVSDSGTLPEESSFFTSQGYPFPAVCIRTSTERPESLDKAGFI + LAGIDENSLLQAVETAVSLAEDEDFGLPVPDYVEENVSTKVVKIIQSYTGIVDKIVWR + KS" + misc_feature 19202..20230 + /gene="fnlC" + /locus_tag="SPC12F_0020" + /note="HMMPfam hit to PF02350, UDP-N-acetylglucosamine + 2-epimerase, score 4.8e-105" + gene complement(20473..20559) + /gene="tnp" + /locus_tag="SPC12F_0021" + /pseudo + CDS complement(20473..20559) + /gene="tnp" + /locus_tag="SPC12F_0021" + /note="Lone member of homology group 0229" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1167 transposase (fragment)" + gene complement(20638..21583) + /gene="tnp" + /locus_tag="SPC12F_0022" + /pseudo + CDS complement(join(20638..20859,20870..21583)) + /gene="tnp" + /locus_tag="SPC12F_0022" + /note="member of homology group 12" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1670 transposase" + gene 21686..21871 + /gene="tnp" + /locus_tag="SPC12F_0023" + /pseudo + CDS 21686..21871 + /gene="tnp" + /locus_tag="SPC12F_0023" + /note="member of homology group 0047 7" + /pseudo + /codon_start=1 + /transl_table=11 
+ /product="putative IS630-Spn1 transposase (fragment)" + gene complement(22107..22680) + /gene="tnp" + /locus_tag="SPC12F_0024" + /pseudo + CDS complement(join(22107..22430,22411..22680)) + /gene="tnp" + /locus_tag="SPC12F_0024" + /note="member of homology group 31" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1671 transposase" + misc_feature complement(order(22113..22430,22411..22415)) + /gene="tnp" + /locus_tag="SPC12F_0024" + /note="HMMPfam hit to PF05717, IS66 Orf2 like protein, + score 4.9e-50" + /pseudo + gene order(22747..23055,23081..23470) + /gene="tnp" + /locus_tag="SPC12F_0025" + /pseudo + CDS join(22747..23055,23081..23470) + /gene="tnp" + /locus_tag="SPC12F_0025" + /note="member of homology group 19" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1381 transposase" + misc_feature order(22993..23055,23081..23458) + /gene="tnp" + /locus_tag="SPC12F_0025" + /note="HMMPfam hit to PF01609, Transposase DDE domain, + score 1.8e-14" + /pseudo + gene 23731..>23778 + /gene="aliA" + /locus_tag="SPC12F_0026" + CDS 23731..>23778 + /gene="aliA" + /locus_tag="SPC12F_0026" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33293.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ89" + /translation="MMKSSKLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcata taaaaacaag + 181 ggaggactgt ataaaaagca gaaatccttt gttttttata accaaggttt ataaactttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga agatgaacat + 301 aaagaagcgt gtccttagtg caggcctgac ttttgcatct gctttgcttt tagctacttg + 361 cggccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaactat ctattagact attacgctga taatatagtc aattgaaaca agaacaagac + 481 aaaagcagct caaaaaggta ttgcaacttg gtaatacctt tttgagctgc tttttgatat + 541 gagcccatgt tttctcaata ggattgtact caggcgagta gggaggaaga ggtaaaagtt + 601 
tatgcccaaa ctcttcacac aagagttcta gcttccccat tctatggaat cttgcattat + 661 ccataataat aaccgatggt gtggttaatg ttggtaagag aaacttctga aaccaagctt + 721 caaaaaagtc gctcgtcatc atctcttcgt aagtcattgg agcgattaac tcaccattca + 781 tttgttagac ctgcaaccaa agaaatcctc tgatatcttc ttccagatac tttacctctt + 841 attaactgac cttttaatga gcgaccatat tctcgatgaa aataagtatc gaatcctgtt + 901 tcatcaatct aaacaggtgc taggtgcttt aaactattaa aattcttaag aaataaggct + 961 actttttctg ggtcttgttc ataattagat tgaaactaga gtagtacacc tctgcttcta + 1021 aaaaattttt agaaatcgat ttaactgtcc tgatcgattt gtcatgttct tatttcattt + 1081 tactatattt ttgtttcgcg ggaagtctac taagatactt aaagatgcag atagtaaaaa + 1141 aatgtagaca ttaccgtaaa aaagtgatat aatcgtatga tgttcaaggt ataggtgtta + 1201 atcatgagta gacgttttaa aaaatcacgt tcacagaaag tgaagcgaag tgttaatatc + 1261 gttttgctga ctatttattt attgttagtt tgttttttat tgttcttaat ctttaagtac + 1321 aatatccttg cttttagata tcttaaccta gtggtaactg cgttagtcct actagttgcc + 1381 ttggtagggc tactcttgat tatctataaa aaagctgaaa agtttactat ttttctgttg + 1441 gtgttctcta tccttgtcag ctctgtgtcg ctctttgcag tacagcagtt tgttggactg + 1501 accaatcgtt taaatgcgac ttctaattac tcagaatatt caatcagtgt cgctgtttta + 1561 gcagatagtg atatcgaaaa tgttacgcaa ctgacgagtg tgacagcacc gactgggact + 1621 gataatgaaa atattcaaaa actactagct gatattaagt caagtcagaa taccgatttg + 1681 acggtcgacc agagttcgtc ttacttggca gcttacaaga gtttgattgc aggggagact + 1741 aaggccattg tcttaaatag tgtctttgaa aatatcatcg agtcagagta tccagactac + 1801 gcatcgaaga taaaaaagat ttataccaag ggattcacta aaaaagtaga agctcctaag + 1861 acgtctaaga atcagtcttt caatatctat gttagtggaa ttgacaccta tggccctatt + 1921 agttcggtgt cgcgatcaga tgtcaatatc ctgatgactg tcaatcgaga taccaagaaa + 1981 atcctcttga ccacaacgcc acgtgatgcc tatgtaccaa tcgcagatgg tggaaataat + 2041 caaaaagata aattaaccca tgcgggcatt tatggagttg attcgtccat tcacacctta + 2101 gaaaatctct atggagtgga tatcaattac tatgtgcgat tgaacttcac ttctttcttg + 2161 aaaatgattg acttattggg aggggtagat gttcataatg atcaagagtt ttcagctcta + 2221 catgggaagt tccatttccc agtagggaat 
gtccatctag actctgagca ggctctaggt + 2281 tttgtacgtg aacgctactc actagccgat ggagaccgtg accgtggtcg caaccaacaa + 2341 aaggtgattg tggctatcct tcaaaaatta acgtcaaccg aagcactgaa aaattatagt + 2401 acgatcatta atagcttgca agattctatc caaacaaata tgccacttga gactatgata + 2461 aatttggtca atgctcagtt agaaagtgga gggaattata aagtaaattc tcaagattta + 2521 aaagggacag gtcggacgga tcttccttct tatgcaatgc cagacagtaa cctctatgtg + 2581 ttggaaatag atgatagtag tttagctgta gttaaagcag ctatacagga tgtgatggag + 2641 ggtagatgaa atgatagaca tccattcgca tatcgttttt gatgtagatg acggtcccaa + 2701 gtcaagagag gaaagcaagg ctctcttggc agaatcctac aggcaagggg tacgaatcat + 2761 tgtctctacc tctcaccgtc gcaagggcat gtttgaaact ccggaagaga agatagcaga + 2821 aaactttctt caggttcggg aaatagctaa ggaagtggcg agtgacttag tcatcgctta + 2881 cggggctgaa atttactaca caccagatgt tctggataag ctagaaaaaa agcggattcc + 2941 gaccctcaat gatagtcgtt atgccttgat agagtttagt atgaacactc cttatcgcga + 3001 tattcatagc gccttgagca agatcttgat gttgggaatt actccagtca ttgcccacat + 3061 tgagcgctat gatgctcttg aaaataatga aaaacgcgtt cgagaattga tcgatatggg + 3121 ctgttacacg caagtaaata gttcacatgt cctcaaatcc aaactttttg gcgaacgtta + 3181 taaattcatg aaaaaaagag ctcagtattt tttagagcag gatttggtcc atgtcattgc + 3241 aagtgatatg cacaatctag acggcagacc tcctcatatg gcagaagcat atgaccttgt + 3301 tacccaaaaa tacggagaag cgaaggctca ggaacttttt atagacaatc ctcgaaaaat + 3361 tgtaatggat caactaattt aggagaaatg atgaaagaac aaaacacgat agaaatcgat + 3421 gtatttcaat tatttaaaac cttgtggaaa cgcaagctaa tgattttatt agtggcactt + 3481 gtgacaggtg cgggggcttt tgcatatagc gcttttattg ttaagccaga atatacgagt + 3541 accacgcgaa tttacgtagt gaatcgcgat caaggagaca agtcggggct gacaaatcag + 3601 gatttgcagg caggatctta tctggtaaaa gactaccgtg agattatcct ttcgcagaat + 3661 gtattggaaa aagtagcgac aaatttgaag ttggatatac cagccaaaac gttagctaga + 3721 aaagttcaag tgactgtacc agttgacact cgtatcgtct caatctctgt caaggataaa + 3781 cagccagagg aagccagtcg tatcgctaat tctctacgag aagttgctgc agaaaagatc + 3841 atcgctgtaa cgcgagtatc tgatgtgacg acacttgaag aagcgcgacc 
agctacgact + 3901 ccctcttctc caaatgttgg acgcaattcc ttgtttggtt tttttggagg agcagtcgta + 3961 acagtaattg ctgttctttt gattgagttg ttcgacatcc gtgtgaaacg tcctgaagat + 4021 gtcgaagatg tactgcaaat tccactttta ggggtcgttc cagatttgga caaaatgaaa + 4081 taggaggaag ttatgccaac attagaaatc tcacaggcaa aattggattt tgtaaaaaag + 4141 gcagaggaaa attataacgc tttgtgcacg aacctacagt taagtggaga tgatttgaaa + 4201 gtattttcta tcacttctgt gaaacaagga gaaggaaaat caacgacttc caccaatatc + 4261 gcttgggctt ttgcgcgtgc aggttacaaa acgctgctga ttgatggaga tattcgcaat + 4321 tctgttatgt taggtgtctt taaagcaaga gataagatta caggcctgac agaattttta + 4381 tcaggaacta cagacctatc acaagggctt tgtgatacca atatcgaaaa tctctttgta + 4441 attcaggctg gctctgtgtc accgaatccg acagctcttc ttcaaagtaa gaatttcagt + 4501 acaatgcttg aaaccttgcg taaatatttt gactacatca ttgtagatac tgctcctgtc + 4561 ggtgtcgtga ttgatgcggc tattattacg caaaaatgcg atgcttctat tttagtgacg + 4621 aaggcaggtg aaataaatcg acgggatatt caaaaagcaa aagaacagtt ggaacacaca + 4681 gggaagccgt ttttgggagt tgtgttgaat aaattcgata cttcagtaga caaatacggt + 4741 tcttatggaa attacggaaa aaaataagtc gttaagtatt tgtgtaagga catttttaga + 4801 actacaatca aaatctttgg aattgctggc ttcaaatcat attgatttga aatgaaactt + 4861 gcaaaagagt ttttaaggtg agtttcttaa tttgtgactg aaatcaatct tctacttcca + 4921 taccttggaa aaacagggta aacgagagat gttttttcca taataaagtt ttgatatggc + 4981 tagtagagta gtaatataat gaattgtaat cattagtgtt cataccaaga aatatcaagt + 5041 atctattttt gaaaatcata aatatgagat agtttttaaa tctctaagga gagctagttt + 5101 tgagaggtaa tttatgtata gagtaacaaa acgattaggg gatattttac tttctttaat + 5161 aggaataata gtactgtttc cagtgtttat tgtaattgca attgcgataa acactgattc + 5221 ggagggtccg attatattta aacaaaaacg atttgggata tacaaggaac ctttttatat + 5281 cctgaaattt aggtccatga aaataggagc accgaaaaat gtagctccac ggaacttgga + 5341 taatccagaa cagtggatta ccaaagtggg agctttctta agaaaaacat ctttggacga + 5401 actgccacaa ttatggaata ttcttattgg taatatgagc attgtaggac ctaggccagc + 5461 aggtataaat gagcttgatt tgctcaccga aagagaaaag tttggtgcga atgatgtctt + 5521 acctggatta 
actggatggg cacaaattaa tgggcgagat actttgtcaa tagagatgaa + 5581 ggcagaagca gatggttatt atgtgaaaca tatgtcgtta agcatggatc ttagatgtat + 5641 cattaggaca atcccctacg tattaaaacg taagggaatt gtggagggca gtggtaagaa + 5701 agagttggat tgatgcaatg aaaattctat ttgtttgtca acattataag ccagaacctt + 5761 ttaggttgtc agatatttgt gaggatctag ttcaaagagg gcatgaggtg gctgttttga + 5821 cagggattcc taactatcct gagggggaaa tatatgctga ttatcgtaag agaaaaaaaa + 5881 gaagagagac tataaatggt gttgctattt ttcgttcata caccattgct aggaggcaaa + 5941 atactttata ccgtatattg aattatttta gttttgctct ttcttctacg ataggtgtta + 6001 tatttgggcg ttataaagcg aaagatggct cagattttga ttgtgtcttt gtcaatcaac + 6061 tatctccagt tatgatggct tgggctggta tagcttataa gaacaagtac aataaaccta + 6121 tgtttttgta ttgcatggat gtttggccgg atagtttaat tgtaggtggg gtgaaggaaa + 6181 atggattgat ttacaagata tttgaatttg tttcaaaaaa agtatatcaa gccagcgatt + 6241 atatatttgt tactagtcta tcttttaaag attattttgt aaaaaaattt aatattcctc + 6301 tccacaaaat tacttactta ccacaatatg cagaggattt atttgtacca aatgaattaa + 6361 aaacgaacaa aaatactatt gacttaactt ttgctggaaa tattggaaaa gctcagaatt + 6421 tagagactat tttgaaagca gccagtgcaa tagaacagat tcccgattta gcaaagagag + 6481 ttcattttca ttttgttgga gatggtacgg aactattaaa tatgcaaaaa ttagcatgtg + 6541 aactagaatt agagaacact tcattttatg gtagacgtcc attagaagag atgccggatt + 6601 tttatacaaa atcagatgcg atgctagttt ctttaatagg cgactctata atttctcgca + 6661 ccttaccagg caaggtacaa tcttatatgg cggcaggaaa accaattata ggagcgattt + 6721 caggagatac tcagagagtt gtaaaagaag caaaatgtgg tttcataagt ccggaaggga + 6781 atgttgatca gttagtgaga aatattcgta agttctgttt gctttctgta gaggaaagag + 6841 agaaactagg aaggcaagct cgttgttatt atgaagaaca gttttcgaaa gagtggttta + 6901 tgacatactt agaaaatcat ttaaaagagg ggtttctatc atgaaggttt taatgattaa + 6961 ttccgtttgt ggtattagga gcactgggag aatttgtgca gatctcgcaa ctgctttgac + 7021 agaagaagga tatgaggtta aaatcgccta tggtcgtgag tatgttccga aacaatttca + 7081 acagtatgca gtgaaaattg gtacaaagtc tgatattcgt tttcatgcga ttcgttctcg + 7141 attatttgac gaatctggct ttggaagtag 
acaggcaact gttaatttta ttaaatggat + 7201 gaaagagttt gatcctgata ttattcatct ccataacctt catgggtatt atatcaatgt + 7261 tgaactgtta tttgattatc tccgaatatg cggtaaaaag attatatgga ctttgcatga + 7321 ttgttgggca tttacaggac actcggctta ttttgattgt ttggaatgtg agtcaaaggg + 7381 agtttgtgac catccatctc agaaaaatga ttatcccaag tcgttcgtga atttttcaaa + 7441 gcgaaattat caaagaaaga aaaaatgttt tactcatatt cctaatctca ctattgttac + 7501 tccgtctcaa tggctagcta atttagtaag acagtcattt ttaaaagaat atccagtgaa + 7561 agtaattcat aatggtattg atactactgt ctttcaaccg aggctaatag ccgctcaaaa + 7621 attgagaaaa agacaccatc ttgaaggaaa gcaggtactg cttggtgtgg ctgctatctg + 7681 ggataataga aagggatttt ctgatatgtt agcgctcgcg aatgatctaa ctgataatca + 7741 gagaatagtt ttgatagggt taaaagatag gcaactcaaa gaactaccca aagggatcat + 7801 tgggttaaca gaaactaata gcccagaaga gttggtagca tggtatacac tagcggatgt + 7861 atttctaaat cctacttatc aagataatta cccgacaact aatttagaag ctatttcttg + 7921 tgggacacca gttatcagct atccgacagg tggtagtgta gaaagtgcta aactttatgg + 7981 tctcgtttgt caggatagaa acgtagcttc tattttatct tcgttagaaa aagtctctca + 8041 gctatctaaa acagaaaaat tggatttttc aattgcaagt tttattaaac aaatgaaata + 8101 tttatattag aacttgaatt ataggaaaat gaggaatttg cattaaaatg atgaaaagaa + 8161 tttattatca ccttttggct atttgggctt ggactcttcc aaattcttat gcttttattg + 8221 attcgttaaa ggtgtttttt ccgaatatta gcttacaaat tgcaggttct cttttggctg + 8281 ttgtctcaat aggaattttt atcactagaa tatattatac aagatatgaa gtttttatat + 8341 ctctattggt ttgtatttct attttaattt tttattcaac tcgctttttt tattcgacta + 8401 acgtagagtt gtatcagtct ttcttcaatt cctttctgat tcgtccagtt cctgcgatat + 8461 tagtagcgat gctgttagct aagaataatc atataaaagg tttcataaaa tggtcagaac + 8521 ctatgatgct tttctataca ttgacatcat ttttagcagc cctatctcct agaaacagca + 8581 ttattactta ccaatcttta tcttattatg ccatgacagc ttatatgatt aatgtgttta + 8641 atattatata caaagagaaa atattggagg agcaactgac gtatttcaga ttctcagcgt + 8701 ggaattttat tagatatttt ttacttttga ttcaagcttt taatgcactc tcaggaggtg + 8761 ggagaggtgc ctttatttta ttaattattt ttacaggaat attattaata 
agaactgcta + 8821 tgaaatttaa gttccttttc tcatttattg gaggcctgtc tgctatagct ctagttgttt + 8881 tttttacaaa aggtttggat ttgacatggc tcttgaatat ggacggtgga gagcgattgt + 8941 tgaacttctt cggcagacct gaacatatat ctacagataa tagactattg atttatgata + 9001 ctgtttggtc tgcaatacag gaaaaaccct ttttaggatg gggagttggt tcaacttttt + 9061 taaaatttaa tggatattca cataatattg tattggattt attgcatgat atgggaagtt + 9121 ttggtttatt aattattctt tcggctttct ttgcttcttc agtaatattg tacaaattac + 9181 gtaaaataga ttggaaagtg aatttattta ttctgatgtt tctagaagta tatgttcaca + 9241 tgagtttcag tggaagctat cttgcagatg gtagactatg gtttttggtg atctttactt + 9301 attgttacta caggtggaaa gtgcaggaaa aggatgaagt tagcaatttt attatctgat + 9361 atttcaaaaa taggaggagt gcagcgtgtc acgacagctc ttgttaatga actttgtcaa + 9421 aatatagacg ttacaattat cagcatcttt tcggaaaatg agctaccagc ttttggactt + 9481 tcagatagag ttcaggtgag ctatcttttg aaagaacatg ttaatttgaa gaagaatttt + 9541 tttaaagtta gtggagcttt gcgaaaagtg ttgaaaaaac agcagtttga tgttgtttta + 9601 tcgtcaggaa ctggtctagt atcctttctt tggtttgcta gtttgggaat tcctaccaga + 9661 cttttggcat gggaacatca gtgtttttac tttgggagat cgtttggttt agagtggttg + 9721 gggcgaaagc tagcctgtcg ttttgctgag agtattgttg tcttgactaa aaaagatgaa + 9781 ggattttaca aagagaatcg tcctaaggct catattgaac aaatctataa tatcctagac + 9841 atggattcac aaacagctaa gtgtcagctc tcttctaaaa aaattatcag tgttggatct + 9901 ttagtacgac aaaaaggttt tgatctggct cttgaggtag ctagtcaaat acaattaagt + 9961 tatccagatt ggcagtggga catttatggt gatggccccg atagagaaaa attagaggag + 10021 aaagtcaggg aataccaatt agaaggcttt ataaatttga aagggcttgt tcagaatgtt + 10081 cgggagctct atcctgacta ctctatctac gccttgacat cacgatatga aggattatca + 10141 atggtattat tagaagctaa aaactgccag atgcctgcta tttcatttga ttgtaactgt + 10201 ggaccctctg atattatttc agatggaaga aatggttttt tgattgattg ttttgatgta + 10261 aatatctatg caaaaacttt atctaaatta atgactagtt tagagttgcg agaacaagtt + 10321 gcaaaatcga gtgttattcc agcagaagaa ttgtcaacaa cttatatcct agataagtgg + 10381 aacaatctat taaagataga aagaagataa tatgaaaata gtccatgtag aagatttttt + 10441 
tcatccagat gcaggttacc agattaatgt tttaccaaaa tatctagcaa agtttggtca + 10501 tgaacaagtg attatcactt cagaaatgga taaaatcccc gataatctta cccaattttt + 10561 tggacgagaa aatatagaag agagagatag aagttacgaa gagaagcatc atgtgaagat + 10621 tattcgcttg cctcttcatg gatttgtaag cggacgtgcg attttttctg gaaagcttat + 10681 ttcggctatt aagggtcttt ctccagaggt attgtatatt catgggaatg acactttaac + 10741 agggattcgt ctccttttag ctcgaaagaa acttaattgc agaatcgtca ccgatagtca + 10801 tatgcttgaa aaggcatcaa gaaatccttt caacaactac tttaggagat tttataaaac + 10861 cttgattact cccattttga taaaagaaca gataccaatt attcggacgc aagatgataa + 10921 ttatgttgaa aaacacttgg gaattccttt atcgcaagct ccatggattt cttatgggtc + 10981 ggatacagcg ttctttcacg cagatagcca gattaaggaa gattttcgtt ctcagtatca + 11041 aatcgcttca gatgctctta tttgtgttta cgcaggaaag ttagatgagc ataagggtgg + 11101 gatgttttta gcagagtctc taagtaaaaa gttaaatacg gagcaaccaa ttgttttcat + 11161 tatagtgggt aatacaaatg gagagtatgg agaagctgtc gagaaaagtt tctcccaatc + 11221 tgaaaaccaa attttgcgct ttccgactca aaaatatcaa aaattagcac agttttttca + 11281 ggtagcagat tttgctttat ttcctaaaca atgtagttta agtttttatg atgcacaggc + 11341 ctgtggttta ccagttttat tggaagataa taatatcaac ctcgatagaa cttctcatta + 11401 taatggttgg acgttcaagg ctaacagcaa attaagtttg agagattcat taaaaatgat + 11461 tgcgagtcta gataaagaga agagacaaga gtactctcag aatgcactgc actatatcct + 11521 tgaacattat aattatgaag ataaagcaag agaatatgaa aagattctta taggggaacg + 11581 tacgaaatga gatagttaat atttcgttat tttataggaa aggtggattt aatgaaaatt + 11641 tgcattgttt cagtcggagt gggcggacta ccgattccag ctgtaaaagg gggagcagta + 11701 gaaaatctca ttgataatta tttaagttac aatgagaaat ataatcatga tgaaattacg + 11761 gtcgttagtt gtgaccataa ggaggcgcgt gaggcttcaa aaaaatacaa gtatgcccaa + 11821 tttgtctata tagatattca ttcacttaaa tataaaataa acaaaacaat acgttatgcc + 11881 attaataaat attcaccttt cttcgtaggg aacgcttata tcagtcaatt gccagacttg + 11941 tctggttttg atacagtttt gattgaaaat cgccctgaat acggttatta tattcgtaaa + 12001 aagtttaaag gaaatcttgt tttacatctt cacaatgatt tattaatgga caatgagtat + 12061 
tctgtagatt atagcgttta tgataaaatt atcacaatat ctgactatat tagggatagg + 12121 tcagaagtag taatgtcagg tgttccgata cagactgtct ataatggtat tgacacagaa + 12181 ctttttttgc agaatttctc tgaaattgat ttatcagatc ttaaaaatca gttggaaatt + 12241 ttgtcggatg attttgtgat tgtttttttt ggacgtatca acaaaaataa aggtatcaaa + 12301 gaactgcttg aagccttctt gttgctacca aagaatttga atataaaatt actagctgtt + 12361 ggtagttcta tatttggtca gacggagttg gatactttca caacagagct acggcaattg + 12421 gcaaaacaag catcagataa agttgttttt acaggctatg ttaattacaa agacattcct + 12481 aagtatcatc atattgcaga ttgcattgtt gttccatcta tttgggagga accagcgggt + 12541 ttgacggtct gtgaagcttt gatatcaggg aaatatgtta ttacaacaga tgctggaggg + 12601 ataccagaga ttgtagctgg cagtgaagcc cttgtggtag caaatgatga gtgtatagtt + 12661 gaacacctca aaacagccct attgagtgtc taccaaaaag ggaaatgctc ttcggttatt + 12721 acttctaata gagatagagg agcctatttt tctattgaaa aatatggaag agacttacgg + 12781 aaagagctca cacaaaatga aagaatcatt aacatatgag tcgtgtaaaa aatagttttt + 12841 ttaatatttt agctggaata gttggtacta tcatatcgag tgttttagct ttcatagtta + 12901 gaacagtgtt tatccgagtt ttgggagaga cttatctagg tttcaatggt ctatacacca + 12961 atatcttaac agttttatcc ctagctgaat tagggatcgg atcatcaatt gcttatttga + 13021 tgtacaaacc tttagcagaa aaagatgggg acaaattagc tcaagtagtt caattctata + 13081 aaaaaatata tcgagtaatt ggtataatta ttcttatttt aggtttgtgt ctcgttcctt + 13141 ttttaccagt cattgtaaat ttaaaaaatg cagaagattt gaactataca gcattgtatt + 13201 tgctttattt agcagataca gtttctactt atctattctt tgcatataaa agaggggtat + 13261 tggttgctga tcaaaaggtc tatgttgcga atatctttga tataattata acgacaattt + 13321 tatctatttt ccaaattatc actttgatga tttttaaaga tttttatcta tatattattt + 13381 taaaaattgc taaaaatctt actttgaacc tagtaattag tttaaaagta gataaaatgt + 13441 atccaagtat tcataaattt aaagagatag ctccacttcc aaaaatggaa agacgactag + 13501 tttggaaaaa tgtatatgct acctctgttc gacaaatctt taacgaatta atgaattcaa + 13561 cagatagtat agttatttcc attgtcttag gaatagttat ggttggtaag tattcgaact + 13621 atgcttatat tttatcaatc gtatatattt tctttggagg aatttttaat ccgattcagg + 13681 
cttctattgg aaacctatct ctgttagctt ctatagagaa aaaaaatgaa atcttcaata + 13741 gattacgttt tataaatttt ttctttttat cattttgctc aagttgtctt ctagtattgg + 13801 taaatccttt tatcactatt tggattggag aaaattacac tttatcattt acaggtgtga + 13861 ttgcaatagt tggtatgtta ttcgttagac aaactggaaa ttgtacaacc atttttcgtt + 13921 tgggagaagg atattttaga gattatcatt tttctccttt aatcgcgggc attttaaatt + 13981 tagttgtttc agtaatttta gtgaattata taggtattgc aggtgttttt gttggaacaa + 14041 tgttaggatt tggtttccaa tttatactgg tggatacaat tgttacttat aaaaaagtac + 14101 ttagtcgtcc actatcagag ttttatttaa gatggttgca gacgatctta ttaactgtag + 14161 gtttatgtat tgcgagttac tatttatctc gattggttag agtgaatagt atatatgatt + 14221 tgatactgtt gtttgtagtg gttattggat ttaatttttt tgctttatgt tttatttatt + 14281 ggcgaaatga tgattttcaa tattttattc aattggttaa aaattttatg aaaaatttgg + 14341 aggaaaaaaa tcatgattaa tgtaatcgga ttaggttata ttggattgcc aacaatttta + 14401 atgttggcaa caaacggcgt gaaagtagtt ggaactgact acaatcagga tttggtgaga + 14461 actttaaatg aaggtcaaac aacctttaaa gaagatggat tggatgaact attccataaa + 14521 gcagtggagt cgggtgtgga ctttacaacc gaatatcaac aaacggatac ctatattatt + 14581 tccgttccaa caccatatga ctccttctct aaaaaaattg atccaagcta tgtgattgaa + 14641 gctacgaaaa cggtacttga taattgcaat aaaggagcgg ttattattat tgaatcgacc + 14701 gtatcaccag gaacggttga taaatttatt cgacctgttg tagaagaaaa aggttttgtt + 14761 attggtagtg atattcatct tgtccatgct ccagaacgta ttattccagg gaatatggtc + 14821 tatgaattgg tgaataataa ccgtacaatt ggagctgatg acctagaaat cggctataaa + 14881 gtgaaagagc tttatgcttc attttgtaag ggcgatattg ttgttacaga tattagaact + 14941 gcggagatga ccaaggtagt agaaaataca tttagagctg taaatattgc tttcgctaac + 15001 gaattagcac agatctgtag ttatgataat atgaatgttt atgaaattat ccggatctgt + 15061 aatatgcacc cacgggtaaa tattctacaa cctggacctg gtgttggtgg gcattgtatt + 15121 tctgtggatc cttggttctt agttggagat tatcctgagt tgacaaatgt tattgaacat + 15181 tctatgcgaa caaatgctgc catgccagaa tttgtattaa atcgtatcta taccattatg + 15241 aacgaacatc atctaacaga tattagtcgg gttggtctat atggtcttac ctacaaagag + 15301 
aatgtagatg atatgcgtga atctccaacg cttcagttat tagaatctat gagccgccat + 15361 ctggcaacac ctgctattaa agtatatgat ccatttatag aaaaagatgt tgtggcgaat + 15421 cagtcacatg atttagatga atttttatct aatgttgata ttgttgtact gttggttggt + 15481 catgatgaga ttttacaaaa tatggataaa ctaaaagata agatagtgtt agatacacgt + 15541 tatatctgtc atcttgatgg aacttacaga ttataattag tgataaataa agtaaggatt + 15601 gactatgaaa aaaatagttg taattttcgg aactcgtccc gaagctatca agatgtgtcc + 15661 cttggttaaa gagctaagaa cacgtgagaa tcttgaaaca ttggtctgtg ttacgggtca + 15721 acatcgtcaa atgctggatc aagttttgga tacttttagg attacgcctg attttgattt + 15781 atctattatg aaggacaaac aaactctctt tgatgtcaca attggcattt tggaaggcat + 15841 gaagactgtc ttagagtcag ttaatcctga tttaatatta gttcatgggg atacgagtac + 15901 aacatttgcc agttcactgg ccgcctttta tctacagatt ccaattggac atgtagaggc + 15961 tggtttgcgt acttatgata tttattcacc ttatcctgaa gaatttaatc gtcaagcagt + 16021 aggtgctttg gctcagtatc attttacacc aacacaactc tcaaaagaca atctcttgag + 16081 agaaggaaaa aattctgaag ctatatttat cacaggtaac acagcaattg atgctttaca + 16141 aactacaatt caagaggatt atactcatcc tgagttaaat tgggttgggg atagcaaact + 16201 aatattaatt actgctcatc gtcgtgaaaa tattggtgac ccgatgaggc acatgtttag + 16261 agcaatccga cgtatcattg aagaacattc ggatataaag gctctttacc ccattcatat + 16321 gaatcctcta gttcgtcaga ttgctgagga agaactaagc ggatgtgaac gtatcaaaat + 16381 gatcgatccg ttggaagtat tagattttca taacttttta tcacggagtt atctcatttt + 16441 aacagatagt ggtggtatcc aagaagaggc acctagttta ggaaaacctg ttttagttat + 16501 gagagataca actgaacgtc cggagggaat taaagcagga actttgaagc ttgtaggtac + 16561 tgatgaggac aatatttata gacattttaa agaattgtta gaaaatgatt tagtttatca + 16621 agcgatgagc caagcttcaa atccgtatgg agatggaaca gcttgcaaga aaattgcaga + 16681 catactagaa ggagaagtat aatatatgtc acaatttaca ggaaaaactc tcctaattac + 16741 aggaggaaca ggttcatttg gtaatgctgt ccttaatcgt tttttacaga ctgatattgg + 16801 tgaaattcgt attttttccc gtgatgaaaa aaaacaggat gatatgcgtc atgagtttca + 16861 ggtaaaagta ccagaagtaa ctgggaaaat ccgtttttac cttggagatg tgcgtgactt + 16921 
agcttcggta aaaaatgcta tgcatggtgt ggattatgtt tttcatgctg ctgctcttaa + 16981 acaagtacct tcgtgtgaat ttttccctgt agaagcggta aaaactaaca ttttgggaac + 17041 ggagaatgtc ctcactgcgg ctatcgaagc tggtgtaaag caagttatct gtctttctac + 17101 agataaggcg gcttatcctg tcaatgctat gggaacatcc aaggctatga tggaaaagat + 17161 tgctgttgct aagtccagga cggtaaatcc tgagcataca aagatatgtg tgactcgcta + 17221 tgggaatgtt ctgtgtagcc gtggatctgt cgttcctctt tggattgagc aaattaagca + 17281 aggaaatgct cttacaatta ctgaacctag catgacacgt tttgtgatga cattagaaga + 17341 agcagtagac ttggttttat ttgcatttga agaagggaaa tctggagata tactagttca + 17401 gaaagcacca gcatgtacga ttgaagtgtt ggctaaggct gtatcagaaa tttttgcctc + 17461 agaacaagat attaagatta taggtattag acacggagaa aaaaggtatg aaacactatt + 17521 aactaatgaa gagtgcgcaa atgcaattga tttgggtgat ttttatagag ttcctagtga + 17581 taatcgtaat cttaactatg ataagtattt caaagatggt agtacgaata gaaatttgtt + 17641 gacagaattc aatagtaata ataccgattt gatggatgta gagcaagtta aaagaaagtt + 17701 gctagaatta gatgaaatac agacagcaat tcgtgatatg gtagcagatg aagagatgta + 17761 aaatctttta agatacatta aaattatcaa ggatatataa tgtatcatgt attgtcgaga + 17821 gagttgacta ttaaaacagc atataaaaca aggagggggc atgattaaaa atattttaat + 17881 cacaggagcg aaaggatttg taggaaaaaa tcttatctgt actctggaag ctttgaaaga + 17941 tggacgagat aggactcgtc ctaatttaga gattggagag atttttcagt atgatcgtga + 18001 tacagatccg attttattag atgaatattg taagaaggcc gatttcgtat tccatttagc + 18061 tggtgtcaat cgtccacaga atcctgatga attcatggag ggaaattacg gtttttcaag + 18121 tagattattg gagattttag aaaagtatga aaacacttgt cctgttctac tctcaagttc + 18181 tactcaagct agtttagaag gccgattttc aaactctata tatggacaat ctaagctagc + 18241 aggggaagaa ctcttctttg aatatggaaa gaaaacggga gcacctgtct tagtttaccg + 18301 tttcccgaat ctttatggga agtggtgccg tcctaactac aattctgctg tagcaacttt + 18361 ctgtcataat ctagctcacg atttacctat tcaagtaaat gatccaagtg tagaattgga + 18421 gttgctgtat attgatgatt tgatacaaga gtgtctaact gcattggaag gaaatcctca + 18481 tcgttgtaat ctagatggat tacaaatctt acctagccca tcaggaaact actgctacgt + 18541 
accaacgact catcgtgcaa ccttaggaga gattgtctct ctattagaaa catttaaaaa + 18601 acagcctaat agtttagtta tgcctgaaat tcctcaagga tcgtttaaaa agaaattgta + 18661 ttctacctac ctatcttatt taccagtaga taagtttagg tttcctctaa aaatgaatat + 18721 agatgaacga ggtagtttta cggaattatt aaaaacagaa aatacgggtc aattttctgt + 18781 taatatttct aaacctggca ttaccaaagg gcaacattgg catcattcta agtgggaatt + 18841 tttcatggtt gtttctggtc gtgctttaat acaagagcgt aggatagggc tggatgaaaa + 18901 cggtcaagag tatcctattc tgaactttga agtgtcgggc gataagattg aagcaataca + 18961 tatgataccg ggctatgcac ataatattat taatctttct gatacagaaa atctaattac + 19021 tgtcatgtgg gctaatgagt catttgatcc tagacatcca gatacttttt ttgaacaagt + 19081 ggagaaataa atgaaaatta agacagatta tagtgatatt cattttaaag ataatggcaa + 19141 acttaagtta ttgattattg tgggaacacg tccagagatt atacgtctaa gtagtgttat + 19201 cactaaatgt cgaaagtatt ttgatgttat tttggcacat actggacaaa actatgatta + 19261 caatttaaat ggtattttct ttgataattt agggttagac actccggacg tatacatgga + 19321 tgctgttgga gatgatcttg gtgctactgt agggaatatt attaatactt catacaaatt + 19381 gatgaatcaa attaaaccag atgctttatt gattttaggg gatacaaatt cttgtttatc + 19441 agctattgct gccaagcgtt tacatattcc aatttttcat atggaggctg gcaatcgctg + 19501 taaagatgag tgcctgccgg aagagactaa tcgtcggatt gttgatatta tttcagatgt + 19561 taacttagca tactctgaac atgcacgtaa gtatttacat gagtgtggtt tacctaaaga + 19621 gcgcacatat gtaactggtt ctcctatggc agaagtgtta cataaaaatt tatctgccat + 19681 tgagtcttca gatatccatg aacgtttggg attgaaaaaa ggaggttata tcttactttc + 19741 agctcaccgt gaggaaaata ttgatacaga taaaaatttt atttctctct ttacagcaat + 19801 taatcaatta gctgaaaagt ataatatgcc aatcttatat tcttgccatc ctagatcaaa + 19861 gaaaaggcta caagagagcg gttttaaact agataaacgt gtgattcagc atgagccact + 19921 aggattccat gactataatt gtttacagat gaatgcattt gttgtagtat ctgattcggg + 19981 aactttaccg gaagaaagta gtttctttac tagtcaaggt tatccttttc ccgctgtatg + 20041 tattcgtaca agtacagaac gtcctgagtc cttagataag gcaggattta ttttggcagg + 20101 cattgatgaa aattctcttc ttcaagcagt tgaaactgct gttagcttgg cagaagatga + 20161 
ggattttgga ttaccggttc cagattatgt tgaggaaaat gtctctacta aagttgttaa + 20221 gataatacag agctatacag ggatagtgga taaaatagtt tggaggaaaa gctgaattgt + 20281 atatttttaa taaatcaaaa cgagatgatt aattcttagt agaacaagag taaaattgaa + 20341 cgtatttgat ggaaatgtct tacttgatag tcgagggata gccattctat cggatttttg + 20401 gcttgttttt gcgcttcatg tttgatagaa taaagggctc tttgtcaact gtagtgggtt + 20461 gaagaaaagc taagcttgag aaaggacaaa tttcgtcctt tcttttttga tgttcagagc + 20521 gataaaaatc cgttttttga agttttcaaa gtttcgaaag taaccgccca ataacgaagt + 20581 atattgaaaa atctccagac tagagaactc acggatagtt cctaatctgg agatttctta + 20641 tttgcacttt tcttgtacaa ctttagtcca tggtaaataa gcctctaaaa cctctttgtt + 20701 tacgagagtt tcctcgtttg gaagacattc tagaagatag gatagatatt tctcactatt + 20761 tagttgatga cgtttagctg tttccaacaa gctcataata atagctcttg ctttagctcc + 20821 ttcaaaactt tgagaaaata accaccctcg cttttttaaa ctgagctcag gctaaaagag + 20881 tccactggac tcttttactc cgtcccataa ccaatgattt aatggcgcgt tcagctagat + 20941 tattggaaag gaccagatgt ccgtctttca aaatagtctt aaaggtttct tcatacttga + 21001 ggctgtattc aattgccctt cctagttttg aacctgctaa aactgactga cggcggcacc + 21061 aagcaaagaa gtcttccatt aggggctgga gatgttcttg acgtttctgt agtcgttcat + 21121 cagctggcaa agcctcccag tctctttcca aggaaaataa ctgatcacaa taagctaaac + 21181 ctttagctcc taaggatgat ttatctgctt gcttgggggt cgcttcaaaa aatttccttc + 21241 tcacatgcgc ccaacatcca acaagttcag cttcttccag ttgacgataa gcttctagcg + 21301 gttcgtagtt taccaagctt agcgtcgcct tgctcctaaa ccttggactg ctatcgcata + 21361 ggcagaacta gaggactaaa gtcctaagtt actgccgcaa catatcacaa tgaacatagc + 21421 cagaataatc tcctaggaat tcttgtacta ccgaaccact ccgactctga tcatgatggt + 21481 acagcgtgat tgcttgattc tcaactttcc cagacaaaaa ggtccaatag taggtcagat + 21541 ggctatgact ctctagaacc cgataagaag tttcatccgc atgaagtaag ggctgagtca + 21601 atagtctctc tcgcaagagg ttataaaggg gctttaggaa taggagcttt cacaagctta + 21661 tccagatgat tatcttttac tcgttatgga caatgctata tggcataaat caagtacctt + 21721 aaagattccg actaatattg gttttgcatt tattcctcca tacacaccag agatgaaccc + 21781 
cattgaacaa gtgtggaaag agattcgtaa acgtggattt aagaataaag cctttcgaac + 21841 tttggaagat gtcatgaatc aactccaaga tgttatacaa ggactggaga aggaggtgat + 21901 aaagtccatc gttaatcgga gatggactag aatgcttttt gaaagcagat gagtataaaa + 21961 agaaagtcct catttcaata gaaatcacga ctttctgatg gatttatagt aaaatgaaat + 22021 aagaacagga caaatcgatc aggacagtca aatcgatttc taacaatgtt ttagaagcag + 22081 aggtgtacta ttctagtttc aatctactat atttttggag tgatagaaaa gcccttcatc + 22141 agccaatcta cttgttcagg tgcgagagct ttgacatcct tttctgtact gggccaagtc + 22201 agtctgccgt tctcaaagcg tttatatagt agccaaaatc cttgaccatc ccagtaaagg + 22261 gctttaaagc ggtctttacg tccaccacaa aagagaaaaa cttgacctga gaaagaatcc + 22321 aattcaaagt gggttttaac cagataagcc agtgaatcga ttccttgtct catatccgtt + 22381 ttcccacata cgagatagac ctgccctagg ctagatagat gaattgtcat agagcaacac + 22441 cttatccaaa agctgttcta tcatttcgag attgagagat tgaaaaaaac ttacttcaag + 22501 cttgccaata cgaattttaa gcagaatatc atttctcttt ttagaatcaa aaggacgaga + 22561 ttgtggaatc tctacaggaa caataggttg tagcattaaa atatcctcca atagttttac + 22621 tttactaata gtatacagga ggagctccat gaatgataga taccttgtta tgacgcgctt + 22681 actaaacaac taactgatgc acgatttaag cgccttgttg gtgttcagcg cacgactttt + 22741 gaagagatgt tagctgtatt aaaaacagct tatcaactta aacacgcaaa aggtggacga + 22801 aaacctaaat taagcctaga agaccttctt atggccactc ttcaatatgt gcgagaatat + 22861 cgaacttatg aagaaattgc ggctgatttt ggtatccacg aaagcaactt aatccgtcgg + 22921 agccaatggg ttgaagtaac tcttgttcaa agtggtgtta cgatttcaag aactcctctc + 22981 agctctgagg acacggtaat gattgatgcg acggaagtac aaatcaatcg ccctaaaaaa + 23041 agaattagcg aatgattctg gtaaaaagaa atgccacgct atgaaggctc aagcgattgt + 23101 cacaagtcaa aggagaattg tttctttgga tatcactgtg aactattgtc atgatatgaa + 23161 gttgttcaaa atgagtcgca gaaatatcgg acaagctggt aaaatcttgg ctgacagtgg + 23221 ttatcaaggg ctcatgaaga tatatcctca agcacaaact ccacgtaaat ccagcaaact + 23281 caagccgcta acagctgaag ataaagcctg taatcatgcg ctatccaagg agagaagcaa + 23341 ggttgagaac atctttgcca aagtaaaaac gtttaaaatg ttttcaacaa cctatcgaaa + 23401 
tcatcgtaaa cgcttcggat tacgaatgaa tttgattgct ggtattatca atcatgaact + 23461 aggattctag ttttgcagga agtctattga aggatctttt gctttagttc cttggtcaag + 23521 gttgattatt ttcacggagc gcttccgatt gttttcataa accatttgcg catagtcagc + 23581 agaataaatc tttttgaaac gtccctttcc tagacattat agaactttca gattcatctg + 23641 aatttaccaa attaacacaa aaattctgaa aattctgttg acatctttct gaaaagagtt + 23701 tataatggag agaaagtttt aaaggagaaa atgatgaaaa gttcaaaact acttgccctt + 23761 gcgggcgtga cattattg +// + diff --git a/public/res/serotype_genbank/serotype_13.gb b/public/res/serotype_genbank/serotype_13.gb new file mode 100644 index 0000000..4f7cc74 --- /dev/null +++ b/public/res/serotype_genbank/serotype_13.gb @@ -0,0 +1,793 @@ +LOCUS CR931661 17717 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 34357 (serotype 13). +ACCESSION CR931661 +VERSION CR931661.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 17717) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 17717) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..17717 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="34357" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC13_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC13_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI33294.1" + /db_xref="UniProtKB/TrEMBL:Q4JZI8" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVELL" + gene 293..466 + /gene="aliB" + /locus_tag="SPC13_0002" + /pseudo + CDS 293..466 + /gene="aliB" + /locus_tag="SPC13_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + /db_xref="PSEUDO:CAI33295.1" + gene complement(order(459..995,997..1323)) + /gene="tnp" + /locus_tag="SPC13_0003" + /pseudo + CDS complement(join(459..995,997..1323)) + /gene="tnp" + /locus_tag="SPC13_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(join(933..995,997..1305)) + /gene="tnp" + /locus_tag="SPC13_0003" + /note="HMMPfam hit to PF01710, Transposase, score 4.2e-23" + /pseudo + gene 1536..2981 + /gene="wzg" + /locus_tag="SPC13_0004" + CDS 1536..2981 + /gene="wzg" + /locus_tag="SPC13_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33297.1" + /db_xref="GOA:Q4K1U7" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K1U7" + /translation="MSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLLFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVVVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIELEYPNYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSALHGKFYFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + 
EALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1536..1652 + /gene="wzg" + /locus_tag="SPC13_0004" + /note="Signal peptide predicted for SPC0636 by SignalP 2.0 + HMM (Signal peptide probability 0.993) with cleavage site + probability 0.538 between residues 39 and 40" + misc_feature 1740..2087 + /gene="wzg" + /locus_tag="SPC13_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 1.8e-63" + misc_feature 2265..2708 + /gene="wzg" + /locus_tag="SPC13_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 1.5e-69" + gene 2983..3714 + /gene="wzh" + /locus_tag="SPC13_0005" + CDS 2983..3714 + /gene="wzh" + /locus_tag="SPC13_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33298.1" + /db_xref="GOA:Q4K0T7" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K0T7" + /translation="MIDIHSHIVFDVDDGPKSIEESKALLREAYNQGVRMIVSTSHRR + KGMFETPEEKIATNFIKVREIAKEVADDLVIAYGAEIYYTLDALEKLEKKEIPTLNDS + RYALIEFSMHTSYREIHAGLSNILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QINSYHVLKPKFFGEKYKFMKKRARYFLERDLVHVVASDMHNLDSRPPYMQQAYDIIA + KKYGAKKAKEFFVDNPRKIIMDQLI" + misc_feature 2986..3594 + /gene="wzh" + /locus_tag="SPC13_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 4.1e-38" + gene 3723..4415 + /gene="wzd" + /locus_tag="SPC13_0006" + CDS 3723..4415 + /gene="wzd" + /locus_tag="SPC13_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33299.1" + /db_xref="GOA:Q4K0T6" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K0T6" + /translation="MKEQNTLEIDVLQLFRTLWKRKLVILLVAIITSSVAFAYSTFVI + KPEFTSTTRIYVVNRNQEEKSGLTNQDLQAGSYLVKDYREIILSQDVLEEVISDLKLD + 
LTPKGLANKIKVTVPVDTRIVSVSVNDRVPEEASRIANSLREVAAQKIISITRVSDVT + TLEEARPAISPSSPNIKRNTLIGFLAGGIGTSVIVFLLELLDTHVKRPEDIEDTLQMT + LLGVVPNLSKLK" + misc_feature 3741..4157 + /gene="wzd" + /locus_tag="SPC13_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 7.4e-54" + misc_feature 4263..4340 + /gene="wzd" + /locus_tag="SPC13_0006" + /note="PS00217 Sugar transport proteins signature 2." + gene 4425..5108 + /gene="wze" + /locus_tag="SPC13_0007" + CDS 4425..5108 + /gene="wze" + /locus_tag="SPC13_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33300.1" + /db_xref="GOA:Q4K1U4" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K1U4" + /translation="MPTLEIAQKKLEFIKKAEEYYNALCTNIQLSGDKLKVISVTSVN + PGEGKTTTSVNIARSFARAGYKTLLIDGDTRNSVISGVFKSREKITGLTEFLSGTADL + SHGLCDTNIENLFVIQSGSVSPNPTALLQGKNFNDMIETLRKYFDYIIVDTAPIGIVI + DAAIITQKCDASILVTATGEVNKRDVQKAKQQLEQTGKLFLGVILNKFDVQHKKYGSY + GDYGNYGKK" + gene 5124..6491 + /gene="wchA" + /locus_tag="SPC13_0008" + CDS 5124..6491 + /gene="wchA" + /locus_tag="SPC13_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI33301.1" + /db_xref="GOA:Q4K1U3" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K1U3" + /translation="MDEKGLKIFLAILQSIIVILLVYFLSFVRETELERSSIVILYLL + HFFVFYFSSYGNNFFKRGHLVEFNSTIRYIFFFAIAISVLNFFIAERFSISRRGMVYF + LTLEGISLYLLNFLVKKYWKHVFFNLKNSKKILLLTVTKNMEKVLDKLLESDELSWKL + VAVSVLDKSDFQHDKIPVIEKEKIIEFATHEVVDEVFVNLPGESYDIGEIISRFETMG + IDVTVNLKAFDKNLGRNKQIHEMVGLNVVTFSTNFYKTSHMISKRILDICGATIGLVL + FAIASLVLVPLIRKDGGPAIFAQTRIGKNGRHFTFYKFRSMRIDAEAIKEQLMDQNTM + QGGMFKMDNDPRVTKIGRFIRKTSLDELPQFWNVFIGDMSLVGTRPPTVDEYDQYTPE + QKRRLSFKPGITGLWQVSGRSKITDFDDVVKLDVAYIDNWTIWKDIEILLKTVKVVFI + 
RDGAK" + misc_feature 5907..6488 + /gene="wchA" + /locus_tag="SPC13_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 5.1e-145" + gene 6495..6944 + /gene="wchJ" + /locus_tag="SPC13_0009" + CDS 6495..6944 + /gene="wchJ" + /locus_tag="SPC13_0009" + /note="member of homology group 26" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase enhancer" + /protein_id="CAI33302.1" + /db_xref="GOA:Q4K1U2" + /db_xref="InterPro:IPR013969" + /db_xref="UniProtKB/TrEMBL:Q4K1U2" + /translation="MKVCLVGSSGGHLTHLYLLKPFWKDKERFWVTFDKEDARSILGN + EIFYSCHYPTNRNLKNLIKNTILAFNILRKEHPDIIVSSGAAVAVPFFYLGKIFGAKT + VYIEVFDRIDAPTMTGKLVYPVTDRFIVQWEEMKKVYPKAINLGGIF" + gene 6944..7417 + /gene="wchK" + /locus_tag="SPC13_0010" + CDS 6944..7417 + /gene="wchK" + /locus_tag="SPC13_0010" + /note="member of homology group 27" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33303.1" + /db_xref="GOA:Q4K1U1" + /db_xref="InterPro:IPR007235" + /db_xref="UniProtKB/TrEMBL:Q4K1U1" + /translation="MIFVTVGTHEQQFDRLIKEVDRLKKENLIQDEVFIQTGYSKYIP + KYCEWEKIISYEKMNQLIEKSDIVITHGGPATFMGVIAKGKIPIVVPRQKKFEEHVND + HQLEFCNKVKQTYPIIVINDIKNLVINLRNNKSKETINSNNKEFCRKLEERIGSL" + misc_feature 6944..7414 + /gene="wchK" + /locus_tag="SPC13_0010" + /note="HMMPfam hit to PF04101, Glycosyltransferase family, + score 1.3e-44" + gene 7417..8555 + /gene="whaG" + /locus_tag="SPC13_0011" + /pseudo + CDS join(7417..7500,7500..8555) + /gene="whaG" + /locus_tag="SPC13_0011" + /note="member of homology group 189" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative glycerol phosphotransferase" + /db_xref="PSEUDO:CAI33304.1" + misc_feature 7950..8549 + /gene="whaG" + /locus_tag="SPC13_0011" + /note="HMMPfam hit to PF04464, + CDP-Glycerol:Poly(glycerophosphate) gl, score 3.2e-16" + /pseudo + gene 8567..9289 + /gene="abp1" + /locus_tag="SPC13_0012" + CDS 8567..9289 + /gene="abp1" + /locus_tag="SPC13_0012" + /note="member of homology group 
57" + /codon_start=1 + /transl_table=11 + /product="putative IspD-family transferase (arabinitol) + Abp1" + /protein_id="CAI33305.1" + /db_xref="GOA:Q4K1U0" + /db_xref="InterPro:IPR001228" + /db_xref="UniProtKB/TrEMBL:Q4K1U0" + /translation="MKIALLTASGIGSRIKQDIPKQFIHVDNKPLIIHTLEKFQNHPN + IDEICVVVLKGWEEMLKTYARQFNITKLKYIVNGGETGQLSIYNGLNEIKKNNIDRQV + TVLIHDGNRPMVSNEIIDDAFSTYSRYGNAVAAIPCVEVTFVLDNETENHSISSLKRE + LLRRTQTPHVYNLDDILELHNRALENGITEVAASCELMKMFGKETYFSMGSEKNLKIT + TLDDLEIFKALLKSKKEDWIKD" + misc_feature 8573..9262 + /gene="abp1" + /locus_tag="SPC13_0012" + /note="HMMPfam hit to PF01128, Uncharacterized protein + family UPF0007, score 5e-14" + gene 9293..10381 + /gene="abp2" + /locus_tag="SPC13_0013" + CDS 9293..10381 + /gene="abp2" + /locus_tag="SPC13_0013" + /note="member of homology group 58" + /codon_start=1 + /transl_table=11 + /product="putative dehydratase/epimerase (arabinitol) + Abp2" + /protein_id="CAI33306.1" + /db_xref="GOA:Q4K1T9" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K1T9" + /translation="MNLFDISLYKDYVDKSIKNIVGVETLKDKSILITGSTGLICSTV + IDQLIILNKNHQFGVKIYACARSEEGLKRRFGNYVDDENIIYVPYDANKDIDFNFTVD + YIIHGASNASPDLYISNPVDTMLSNFLGMKNLLDYALKKSVSSIVYVSSSEVYGKTEN + HTPYQEDEYGYVNILDVRASYSSSKRATETLCKSYSEQYDVSIKIVRPGHIYGPSLKI + TDKRISSAFMYDAIRGQNLVMKSKGEQLRSYCHSLDCASAILTVLLKGQSGDAYNISN + KKSIISIREMASIIAEVAGVELLFELPNEVEEKQKNPMDNSSLDSTKLEELGWVGMFE + AKEGLESTYKVLDISKIQKISKNIYNID" + misc_feature 9383..10117 + /gene="abp2" + /locus_tag="SPC13_0013" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 2.4e-37" + misc_feature 9386..10204 + /gene="abp2" + /locus_tag="SPC13_0013" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/iso, score 0.0015" + gene 10421..11380 + /gene="wciF" + /locus_tag="SPC13_0014" + CDS 10421..11380 + /gene="wciF" + /locus_tag="SPC13_0014" + /note="member of homology group 25" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl 
transferase" + /protein_id="CAI33307.1" + /db_xref="GOA:Q4K1T8" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K1T8" + /translation="MEKVSVIVPIYNVEKYLKYSIGGILKQSYKNLEIILVNDGSQDN + SLAICEEYSKIDNRIKIISVENGGQGKARNIGLQHSTSDWILFLDADDYYDNNAVEYL + VELAERYGSDLVVTPLRVVRDHIQGGNASSIKNEKILNLNKDRLIEEMYYGRLLGATP + CGKLYKREILEKWPFPDQLFEDLAIAYKHLMSAKKVAVSNQYYYNYYQRVGSTTKSRY + TSKLEDFYRAIEKNYKYLEEDFPNNKELSIALKTRMFTGGFQVVNSMIESGMTKEVKD + KSLEYRKDLLMIIFNSRITKNHKIKHILFSINPKLYTFVLKSI" + misc_feature 10433..10942 + /gene="wciF" + /locus_tag="SPC13_0014" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 2.2e-45" + gene 11418..12407 + /gene="wcrD" + /locus_tag="SPC13_0015" + CDS 11418..12407 + /gene="wcrD" + /locus_tag="SPC13_0015" + /note="member of homology group 32" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33308.1" + /db_xref="GOA:Q4K1T7" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K1T7" + /translation="MILSIVVPTYNIEKYIERNIESFLNVEDELKSLFEILIINDGST + DKTLQVVTELISKIDCLNIRVINKSNGGHGSAVNRGIEEAKGKYFKIVDGDDWVKKSD + FEEYLKRLEKTNVDMVVTNFSKQYTYENRVELEKVINVEDYYKSNKIPKIFPMHSVTY + KTCILKENNIKLTEKIFYVDIQYIVFPLKYISDWEYWNLDVYQYFLGRPDQSMTIENR + MKNIEHSRKVTESILEFYSTLGDVYFKDIVNSLLKGLLNTRYLLAFLSDDRERLLKET + TDYIRKYKIKYTYDSRMKTSYLLYLNEIHNRRYSFIVYPIVGFKLNRLSKYGI" + misc_feature 11427..11948 + /gene="wcrD" + /locus_tag="SPC13_0015" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 3.2e-34" + gene 12410..13570 + /gene="wzy" + /locus_tag="SPC13_0016" + CDS 12410..13570 + /gene="wzy" + /locus_tag="SPC13_0016" + /note="member of homology group 230" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33309.1" + /db_xref="UniProtKB/TrEMBL:Q4K1T6" + /translation="MSNMSSIKVSIYQLLFYVSFIIIVGSKYLRETVFVNAYPLLSEL + IKVLIIIACIFLLLKYILEPHTKKFIIFSIVILTIGVVVSYNSDSFFILMPVVALILN + MSNIDITKVIKVWLIEIIALMIFLAICYRLNIVGEVINSAIRSDGKIRYALGYKYSTF + 
SSNYFFHVTIFYLYLRKHMIKYVEIITLFLINLYLYALTDTRAVFYYSTAAIVICLLL + KMFKIKTYSIILNKYSMLFSAIIAGVLSWSYRYRLPFFDQLDLILTGRLRLGSAAFNN + FHITFFGQKIRWIYEQNMFSELIYNYVDSSYLNILFGFGIIILLLILVGYYIIGEKKL + SRDTYYTMMIVFLSLHSTFDPQLIDIVYNPAILFLGYVIYNEDEIKNLNKIY" + gene 13820..15235 + /gene="wzx" + /locus_tag="SPC13_0017" + CDS 13820..15235 + /gene="wzx" + /locus_tag="SPC13_0017" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33310.1" + /db_xref="GOA:Q4K1T5" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K1T5" + /translation="MKILKNYAYNLSYQLLVIILPIITTPYVTRVFSSYALGTYGYFN + SIVTYFILLATLGVANYGTKVISGNRKEIEKNFWGIYSLQLCAAVLSLSLYVVLCLTL + SLMQNPVAYILGLSVVSKGLDISWLFQGLEDFRKITVRNITVKLIGVISIFLFVKSES + DLYLYIFLLTIFELLGQLSMWLPAREFIGRDHFDIAYVRHHLKPVILLFLPQVAISMY + ITLDRTMLGALASTKDVGIYDQALKLVNILMTLVTSLGSVMLPRVAHLLSKGEQKAVN + KMHEISFLIYNLVIFPVIVVILIVNDDFVQFFLGQDFQDARYAIAIMIFRMFFIGWTN + IMGIQMLIPHNQNKEFMISTTAPAIISVGLNLLFLPKFGYIGAAIVSVLTEAFVWAIQ + LFYTRRYLKGVPIIGSMAKIILASTIMYGLLLSSKTVIHFSPTLNVLAFAALGGIIYL + FAILSLKVVDVKELKQIIRKN" + misc_feature 13826..14620 + /gene="wzx" + /locus_tag="SPC13_0017" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 1.1e-62" + gene 15237..16235 + /gene="wciG" + /locus_tag="SPC13_0018" + CDS 15237..16235 + /gene="wciG" + /locus_tag="SPC13_0018" + /note="member of homology group 21" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI33311.1" + /db_xref="GOA:Q4K1T4" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q4K1T4" + /translation="MKKIRNINLDLLKVLACVGVVLLHTTMAGFKETDSWNLLAYLYY + LSTYSIPLFFMVNGYLLLGKREITYHYILQKVKWILITVSSWTFIVWIFKRDFTTNPI + KKIVGSLIQRDYFPQFWFFGALILIYLCLPILRKFLNSKRSYLYSLSLLLIIGLIFEL + SNILLQMPIQTYVVQTFRLWTGFFYYILGGFIAQFTIEEIESRFKNWMKIVSILLLLI + SPIILFFIAKTIYHNLFAEYFYDTLFVKVSTLGIFLTILTLTLNENRRESIVSLSNQT + MGVFIIHTYIIKVWEKLFGFNFVGAYLLFALFTLSVSFIITGMLMKIPYFNRIVKL" + gene 16249..17352 + /gene="glf" + 
/locus_tag="SPC13_0019" + CDS 16249..17352 + /gene="glf" + /locus_tag="SPC13_0019" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI33312.1" + /db_xref="GOA:Q4K1T3" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K1T3" + /translation="MYDYLIVGAGLFGAVFAHESALKGKKVKVIEKRNHIAGNIYTRE + EEGIQVHQYGAHIFHTSDKEIWDYVNQFAEFNRYTNSPVANYKGEIYNLPFNMNTFNK + LWGVVTPAEAQAKIDEQRAILNGKTPENLEEQAISLVGTDIYEKLIKDYTEKQWGKPT + TELPAFIIRRLPVRLTYDNNYFNDTYQGIPIGGYTQIVEKMLDHENIDVETNVDFFVN + KEQYLKDFPKIVFTGMIDEFFDYKLGELEYRSLRFENETLDMENYQGNAVVNYTDAET + PYTRIIEHKHFEFGSQAKTIITKEHSKTWEKGDEPYYPVNNDRNNHLYKSYKKFADEQ + GNVIFGGRLGHYRYYDMHQVIGAALQCVRNELD" + misc_feature 16684..17292 + /gene="glf" + /locus_tag="SPC13_0019" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 1e-112" + gene 17670..>17717 + /gene="aliA" + /locus_tag="SPC13_0020" + CDS 17670..>17717 + /gene="aliA" + /locus_tag="SPC13_0020" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33313.1" + /db_xref="UniProtKB/TrEMBL:Q4K1C2" + /translation="MMKSSKLFALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcgta taaaaacaag + 181 ggaggactgt ataaaagaca gaaatccttt gttttttata accaaggttt ataaactttc + 241 attatcgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga aaatgaacat + 301 aaagaagcgt gtccttagtg caggtctgac ttttgcatct gctttgcttt tagctgcttg + 361 cgaccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaattac ctgttagact attacgctga taatatagtc aattgaaaca agagcaggac + 481 aaaagagcct cgtaaaaggt attgcaactt ggtaatacct tttacgaggc tttttgatat + 541 gagcccatgt tttctcaata ggattgtact caggtgagta gggaggaaga aggtaaaagt + 601 ttatgcccaa actcttcgca taaaagttct agcttcccca ttctatggaa 
tcttgcatta + 661 tccataataa taaccgatgg tgtggttaat gttggtaaga aaaacttctg aaaccaagct + 721 tcaaaaaagt cgctcgtcat catctcttcg taagtcattg gagtgattaa ctcaccattt + 781 gttagacctg caaccaaaga aatcctctga tatcttcttc cagatacttt gcctcttatt + 841 aactgacctt ttaatgagcg accatattct cgataaaaat aagtatcgaa tcctgtttcg + 901 tcaatctaaa caggtgctag gtgctttaat ctattaaaat tcttaagaaa taaggctact + 961 ttttctgggt cttgttcata gtaggtgtgg ttcttttttt cgagtgtagc ccatagcttt + 1021 gagcgcatag tggatggtag ttggatgaca gccaaattca gaagctattt cagtcaaata + 1081 agcgtctgga ttgtcagtaa gatagttttt aagtctatct ctatcaactt ttcttggttt + 1141 tattcctttt acttggtggt ttagctctcc tgttttctct tttagcttta accagccata + 1201 aatggtatta cgtgagattt ggaaaacgtg tgatgcttct gttatactat ctgttcgctc + 1261 acaataagag agaacttttt tacgaaaatc tattgaatat gccataaaaa gattatacca + 1321 cattgtgtac tatattagat tgaaactaga atagtacaca tctgcttcta aaacattgtt + 1381 agaaatcgat ttgactgtcc ttatttcatt ttattatatt tttggttcgc gggaagtcta + 1441 ctaagatact taaagatgca gatagtaaaa aaaatgtaga cattaccgta aaaaagtgat + 1501 ataattgtat gatgttcaag gtataggtgt taatcatgag tagacgtttt aaaaaatcag + 1561 gttcacagaa agtgaagcga agtgttaata tcgttttgct gactatttat ttattgttag + 1621 tttgtttttt attgttctta atctttaagt acaatatcct tgcttttaga tatcttaacc + 1681 tagtggtaac tgcgttagtc ctactagttg ccttggtagg gctactcttg attatctata + 1741 aaaaagctga aaagtttact atttttctgt tgctgttctc tatccttgtc agctctgtgt + 1801 cgctctttgc agtacagcag tttgttggac tgaccaatcg tttaaatgcg acttctaatt + 1861 actcagaata ttcaatcagt gtcgttgttt tagcagatag tgatatcgaa aatgttacgc + 1921 aactgacgag tgtgacagca ccgactggga ctgataatga aaatattcaa aaactactag + 1981 ctgatatcaa gtcaagtcag aataccgatt tgacggtcaa ccagagttcg tcttacttgg + 2041 cagcttacaa gagtttgatt gcaggggaga ctaaggccat tgtcctaaat agtgtctttg + 2101 aaaacatcat cgagttagag tatccaaact acgcatcgaa gataaaaaag atttatacca + 2161 agggattcac taaaaaagta gaagctccta agacgtctaa gaatcagtct ttcaatatct + 2221 atgttagtgg aattgacacc tatggtccta ttagttcggt gtcgcgatca gatgtcaata + 2281 tcctgatgac 
tgtcaatcga gataccaaga aaatcctctt gaccacaacg ccacgtgatg + 2341 cctatgtacc aatcgcagat ggtggaaata atcaaaaaga taaattaacc catgcaggca + 2401 tttatggagt tgattcgtcc attcacacct tagaaaatct ctatggagtg gatatcaatt + 2461 actatgtgcg attgaacttc acttctttct tgaaaatgat tgacttattg ggaggggtag + 2521 atgttcataa tgatcaagag ttttcagctc tacatgggaa gttctatttc ccagtaggga + 2581 atgtccatct agactctgag caggctctag gttttgtacg tgaacgctac tcactagccg + 2641 atggagaccg tgaccgtggt cgcaaccaac aaaaggtgat tgtggctatc cttcaaaaat + 2701 taacgtcaac cgaagcactg aaaaattata gtacgatcat taatagcttg caagattcta + 2761 tccaaacaaa tatgccactt gagactatga taaatttggt caatgctcag ttagaaagtg + 2821 gagggaatta taaagtaaat tctcaagatt taaaaggtac aggtcggacg gatcttcctt + 2881 cttatgcaat gccagacagt aacctctatg tgatggaaat agatgatagt agtttagctg + 2941 tagttaaagc agctatacag gatgtgatgg agggtagatg aaatgataga catccattcg + 3001 catatcgttt ttgatgtaga tgacggtccc aagtcaatag aggaaagcaa ggcactttta + 3061 agagaagctt ataatcaagg agttcgaatg attgtgtcta cttcgcatcg tcgaaaaggg + 3121 atgtttgaaa ctccagaaga aaaaattgca acaaatttta ttaaggttcg tgaaattgca + 3181 aaagaagtag cagatgattt agtcatagct tatggcgcag agatatacta tactctggat + 3241 gctctagaaa agctagaaaa aaaagaaatt cctaccctta atgatagtcg ttatgctttg + 3301 attgagttta gcatgcatac ttcctatcgt gagattcatg cgggattgag caatattttg + 3361 atgttgggaa tcacgccagt aattgctcat attgaacgtt atgatgcctt agagaataac + 3421 gaaaaacgtg ttcgtgaact gattgatatg gggtgctata ctcagataaa tagttatcat + 3481 gttttaaaac ctaagttctt tggtgaaaaa tataaattca tgaaaaagag agctcggtat + 3541 tttttggaac gtgatttagt tcatgtagtt gcaagtgaca tgcacaattt agacagtaga + 3601 cctccatata tgcaacaggc atatgatatc attgctaaga aatatggagc gaaaaaagcg + 3661 aaagaatttt ttgtagataa tcccagaaaa attataatgg atcaattaat ttaggagaaa + 3721 atatgaagga acaaaacact ttggaaatcg atgtattgca actattcaga actttatgga + 3781 aaagaaagtt ggtcatttta ttagtggcaa ttataacttc ttcagttgct tttgcctaca + 3841 gtacttttgt tatcaaacct gagtttacta gtacgactcg gatttatgta gttaaccgta + 3901 atcaggaaga gaagtctggt ttaaccaatc 
aagacttgca ggcaggatca tacttggtca + 3961 aagactatcg tgaaattatc ctatcgcagg atgttttgga ggaagttatt tctgatttga + 4021 aactagattt gacgccaaaa ggtttggcta ataaaattaa agtaacagta ccagttgata + 4081 cccgtattgt ctctgtttca gttaatgatc gagttcctga agaggcaagc cgtatcgcta + 4141 actctttgag agaagtagct gctcaaaaaa ttatcagtat tactcgtgtt tctgatgtga + 4201 caacactgga ggaagcaaga ccggcgatat caccatcttc gccaaatatt aaacgcaata + 4261 cactaattgg ttttttggca ggggggattg gaactagtgt tatagttttt cttcttgaac + 4321 ttttggacac tcatgtgaaa cgtccggaag atatcgaaga tacactgcag atgacacttt + 4381 tgggagttgt accaaacttg agtaagttga aataggagag aggaatgccg acattagaaa + 4441 tagcacaaaa aaaactggag ttcattaaga aggcagaaga atattacaat gccttgtgta + 4501 caaatataca gttgagcgga gataaactaa aagtaatttc cgttacttct gttaaccctg + 4561 gggaaggaaa aacaactact tccgtaaata tagcaaggtc gtttgcgcgt gcaggctata + 4621 aaactctttt gatcgatggc gatactcgaa attcagttat atcaggagtt tttaaatcgc + 4681 gtgaaaaaat tacagggcta acagaatttt tatctgggac agctgattta tctcacggtt + 4741 tatgtgatac aaatattgaa aatttatttg taattcaatc gggatctgta tcaccaaacc + 4801 ctacagcctt gttacaaggt aaaaatttta atgatatgat tgaaacattg cgtaaatatt + 4861 ttgattatat cattgttgat acagcaccta ttggaattgt tattgatgcg gcaattatca + 4921 ctcaaaagtg tgatgcgtcc atcttggtaa cagcaacagg tgaggtgaat aaacgtgatg + 4981 tccaaaaagc gaaacaacaa ttagaacaaa cagggaaact gtttttaggt gtcattctca + 5041 ataaatttga tgttcaacat aaaaaatatg gttcttacgg tgactatggt aattatggta + 5101 aaaaataact taggaaagat tttatggatg aaaaaggatt gaaaattttt ctggcaatat + 5161 tacagagtat tattgtcatt ttattggttt attttcttag ctttgttaga gagacagaac + 5221 ttgaacgttc ttcgatagtt atactatacc ttctccactt ttttgtattc tattttagtt + 5281 cctatggtaa taattttttt aaaagagggc acttagttga gtttaatagt actataagat + 5341 atattttttt ctttgcaata gctataagtg tattaaactt ttttatagcg gaacggttta + 5401 gtatctctag aagaggaatg gtatacttct taactttaga aggaatatcc ttatacttgt + 5461 taaatttctt agtaaagaaa tattggaagc atgtgttttt taatctaaaa aatagcaaga + 5521 aaattttact gttaacagta acgaaaaata tggaaaaagt tcttgataaa 
ttgctagaat + 5581 ctgatgaact ttcatggaaa ttggtagcag taagtgtttt ggataaatct gattttcaac + 5641 atgataaaat acctgtaatt gaaaaggaaa aaattattga atttgcaacg catgaagttg + 5701 tggatgaggt gtttgtcaat cttccagggg agagctacga tattggagaa attatctcta + 5761 ggtttgagac aatggggata gatgtaactg taaatcttaa agcatttgat aagaatttgg + 5821 gtcgcaataa acaaattcat gagatggtag gattgaatgt agtcactttc tctacaaatt + 5881 tttataaaac tagtcatatg atttcaaaga gaattctcga tatttgtggt gccactattg + 5941 gccttgttct ttttgctata gctagtctag ttttagttcc attgattcgt aaagatggcg + 6001 gaccagctat ttttgctcaa actcgtatag ggaaaaatgg tcgacatttt accttttata + 6061 aattccgttc gatgcggatc gatgctgaag ctatcaaaga acaattgatg gatcaaaata + 6121 cgatgcaagg tggtatgttt aagatggaca atgatcctcg tgttacaaaa attggtcgct + 6181 ttattcgtaa aaccagtttg gatgaattgc cgcagttttg gaatgtcttt ataggagata + 6241 tgagtttggt gggaacacgt ccacctacag tagacgagta tgatcagtat actccagaac + 6301 agaaacgtcg actcagcttt aaacctggta ttacaggttt atggcaggtt agcggccgta + 6361 gtaaaataac cgattttgac gatgttgtaa aattagatgt ggcttatatt gataattgga + 6421 caatctggaa agatattgaa attttgctta aaactgttaa agttgtattt ataagagatg + 6481 gagcgaagta aggaatgaaa gtatgtctag ttggatctag tggaggccat ttaactcatt + 6541 tgtatttatt aaaacctttc tggaaagata aagaaagatt ttgggttact tttgataaag + 6601 aagatgcaag aagtattttg ggaaatgaaa tattttactc atgtcattat cctactaatc + 6661 gtaatctaaa aaatcttatt aaaaatacga ttcttgcttt caatattttg agaaaggaac + 6721 accctgatat tatcgtatca tcaggggcag ctgtagcagt tcctttcttt tatctaggga + 6781 aaatatttgg tgctaagaca gtctatatag aagtatttga tagaattgat gctccgacaa + 6841 tgacggggaa acttgtttat ccagtaactg acaggtttat tgtccaatgg gaagaaatga + 6901 aaaaagtata cccaaaagca attaacctag gagggatatt ctaatgattt ttgtgactgt + 6961 aggtacacat gaacaacaat ttgatcgatt gattaaagaa gttgatcgtt taaaaaaaga + 7021 aaatcttatt caagatgaag tatttattca aacaggatat tccaaatata ttccgaaata + 7081 ttgtgagtgg gaaaagataa tttcttatga aaaaatgaat caattgattg agaaatcaga + 7141 tattgtcatt actcatggtg gaccagcgac gtttatgggg gttattgcta aaggaaaaat + 7201 tccgatagtt 
gttcctagac aaaaaaaatt tgaagagcat gtgaatgacc atcagttaga + 7261 attctgtaat aaagtaaagc agacttaccc aattattgta attaatgata taaaaaatct + 7321 agttataaat ttaagaaata ataaatcaaa ggaaactata aatagtaata ataaggagtt + 7381 ttgtagaaaa ttggaagaaa gaataggtag tttgtaatga atttaaagaa atcatttcgt + 7441 ttatttgctc aacaaacaat atttaaagtg ttttctctca ttaataaata cataaaaaaa + 7501 aaaaacaaat acttatatat tcccctaaag aactttctga taattcatta tctctatttg + 7561 aatacttaat agacaatgaa tattatataa agtataagat atactgttct tgcactgatt + 7621 atcataattt gaattcgaaa tataataatc taaaaaatgt atattttata aacggcatta + 7681 atggggtatt aaaatacttt acaagtagct ttgtatttta ctcttttggg aaaattccta + 7741 ttatcccttc taatcaacgc gtagtacaat tgtggcatgg tatgttcttt aaagatattg + 7801 ataaatatca gaaaaagatt gtcaaaaaag aaaaatacta cactgatgta attgttacaa + 7861 gcgagatgtt taaagaacta gctactaaag ttcattcttg tgatatcgga gttgttaaaa + 7921 tctgtggtca aagtagaaca gatgtttttt ttaatgaaga caaaaaagtt acttccaaat + 7981 acattgtctg gttgccaaca tttaggcaat ctgagaaatt aggatatagt gataccaatt + 8041 cggaagaaat tttgatagga gattattcgt ttgaagaatt aaaaaaagta aatagtctct + 8101 taaaagaaga caatctaaat atgatagtga agcttcatcc gcttcaaaca cttcctgcta + 8161 atatgcctaa ctatagtaat attcagatac tgtcagaaga aaagagtagg aaaaagaata + 8221 taaagttata tgaattgtta agagacagta tagcattaat aacagattat tcttcagttt + 8281 tttacgatta ttatttatta gataaaccaa tagctttttg tataagagat tttgaggatt + 8341 acaataaaaa tagaggattt atagtagaga atccgatgga ctacctaaag ggaaataaaa + 8401 tcaaatcatt agatgatatg tgtaatttta taaatgaaat tacacataat gtggataaat + 8461 ttaaagaaga acgaagggga tttaatgaaa aagtaaataa atatagagat gggaataata + 8521 gtaaaagatt gctagaaaaa attggaatta actaaggagg gctgttatga aaattgcact + 8581 actgacagcg tcaggaatag gaagccgaat aaaacaagat ataccgaaac aatttataca + 8641 tgttgacaat aagccactca tcattcatac gctagaaaaa tttcaaaatc atccaaacat + 8701 tgatgaaatt tgtgtagtag tattaaaagg ctgggaagaa atgttgaaaa catatgctag + 8761 acagtttaat attacgaaac taaaatatat agtaaatggc ggagaaactg gtcagttatc + 8821 tatctataat ggtcttaatg aaataaagaa 
aaataatata gatcggcaag tgactgtttt + 8881 aattcatgat ggtaatcgac cgatggtaag caacgaaatc attgatgatg cgttttcaac + 8941 gtatagtaga tatggaaatg cagtggctgc aattccttgt gttgaggtta cttttgtatt + 9001 agataatgag actgaaaatc attctattag ttctttaaaa agagagttat tgaggagaac + 9061 gcagacacca catgtttata atttagatga tatactagaa cttcataaca gagctttaga + 9121 aaatggaata actgaggttg cagcttcctg tgaattaatg aagatgttcg gaaaagaaac + 9181 gtatttttct atggggtctg aaaaaaattt aaaaataacg accttagatg atttagaaat + 9241 ttttaaagct cttctcaaat ctaaaaaaga agattggatt aaggattaaa ctgtgaactt + 9301 atttgacata agtctatata aggattatgt agacaaatct ataaaaaata tagttggcgt + 9361 tgagacttta aaggataaat caattcttat tacgggatcg acaggtctta tttgttcgac + 9421 tgttattgat caattgatta tactgaataa gaatcatcaa ttcggagtta aaatttatgc + 9481 ttgtgcaagg agtgaagaag gactaaaaag acgatttgga aattatgtag atgatgaaaa + 9541 tattatttat gttccatatg atgctaataa agatattgat tttaatttca ctgtagatta + 9601 tataattcac ggagctagta atgccagtcc agatttatac attagtaatc ctgtagatac + 9661 aatgcttagt aattttttag gtatgaaaaa tttactagat tatgctttga aaaaatcagt + 9721 aagttctata gtttatgttt cgtccagtga agtatatgga aaaacagaaa atcatactcc + 9781 gtatcaagaa gatgagtatg ggtatgtaaa cattttagat gttagagctt cctattcaag + 9841 ttcaaagcga gcaacagaga cattgtgtaa aagttattct gaacaatatg acgtatctat + 9901 aaaaattgtt cgtccaggtc atatttatgg tcctagctta aaaataacag ataaaaggat + 9961 ttcatctgct tttatgtatg atgcaatcag gggacaaaat ttagtaatga aaagtaaagg + 10021 agaacaacta cgatcatatt gtcatagttt ggactgtgca agtgcaattt tgacagttct + 10081 tttgaaaggt cagtctggcg atgcatacaa tatttcaaat aaaaaatcta ttatttcaat + 10141 aagagagatg gcctctataa tagctgaagt agctggagta gaattactgt ttgaattacc + 10201 taatgaagta gaagaaaaac aaaaaaatcc tatggataat tctagcttag atagtacaaa + 10261 attggaagag ttaggatggg taggtatgtt tgaagctaag gaaggattag aaagtacata + 10321 taaagtttta gatataagta aaattcaaaa gatatctaag aatatataca atatagattg + 10381 atttccagtc tctttagcag aaatatcagt aggaggagta atggaaaaag tttcagtaat + 10441 agttccaata tataatgttg aaaaatattt aaaatatagc 
ataggaggta ttctaaaaca + 10501 aagttataaa aatttagaaa ttattttagt aaatgatggt tcccaggata attctcttgc + 10561 tatatgtgaa gaatattcta agatagataa tagaattaaa ataatttcag ttgagaatgg + 10621 aggacaagga aaagctagaa atattggatt gcaacattca acttctgact ggattttatt + 10681 tttagatgca gatgattatt atgataataa tgcggtagaa tatcttgtag aactggctga + 10741 acgatatgga tcggatttag tagtaacccc attgagagta gtaagagatc atattcaagg + 10801 tggaaatgca tcctcaatca agaatgaaaa aatacttaac ttgaataaag atagattgat + 10861 agaagaaatg tattacggaa gactcttagg ggctacacca tgtggtaaat tatataaaag + 10921 ggaaatatta gaaaaatggc ctttcccaga tcaacttttt gaagatttgg ctatagctta + 10981 taaacattta atgagtgcta agaaggtagc tgtatcaaat caatattatt ataattatta + 11041 tcaacgtgtt ggaagtacaa cgaagagtag atatacatca aaattagaag atttttatag + 11101 agctatagaa aaaaactata aatatttaga agaagatttt ccaaataata aagaattatc + 11161 tattgctttg aaaaccagaa tgtttacagg aggttttcaa gtagtgaact ctatgattga + 11221 atctggaatg actaaagaag taaaagataa gtctttagag tataggaaag atctactcat + 11281 gataattttc aatagtagaa tcactaaaaa ccataaaata aagcatatac tattcagcat + 11341 caatcctaaa ttatatactt ttgttctaaa aagtatataa ctaacaaata aataactaaa + 11401 taataaggag ggaagtaatg attttaagta ttgttgttcc aacatataat atagaaaaat + 11461 atatagagag gaatatagag tcttttctca atgtagagga tgagttgaag agtttgtttg + 11521 aaattttgat tattaatgat ggaagcacag ataagactct tcaagtagta acagaattaa + 11581 tatcaaaaat agattgttta aatataagag taataaacaa gagtaatggt ggacatggtt + 11641 cagcagtaaa tagagggata gaggaagcta aaggaaagta ttttaagata gtagatggag + 11701 atgattgggt aaaaaaatca gattttgaag agtacttaaa aagattagaa aaaaccaatg + 11761 tagatatggt tgtgacgaat tttagtaagc agtatactta tgaaaataga gtggaattag + 11821 aaaaggtaat caatgttgaa gattattata aaagtaataa aattcccaaa atttttccaa + 11881 tgcatagtgt tacatacaaa acatgtatcc taaaagaaaa taatatcaaa ttgacagaaa + 11941 aaatctttta tgtagatatt cagtatatag tatttcctct gaaatatatt agcgattggg + 12001 aatactggaa tttagatgtg tatcagtatt tcttgggtag acctgatcaa agtatgacta + 12061 tagaaaatag aatgaaaaat attgagcata gtagaaaagt 
tacagaaagt atattggaat + 12121 tttatagcac gttgggagat gtatatttta aagatatagt gaattctctt ttgaaaggtt + 12181 tacttaacac gagatattta ttggcattct tatcagatga tagagaacga ttattaaagg + 12241 aaactacaga ttatattaga aaatataaaa taaaatatac ctacgactct cgtatgaaga + 12301 caagctattt attatatcta aatgagatac ataatagaag atattcattt atagtgtatc + 12361 ctatagttgg ttttaaatta aataggttaa gcaaatacgg tatataggag tgtccaatat + 12421 gagtagtata aaagtaagta tatatcagtt acttttttac gtatctttta ttattatagt + 12481 tggttcaaaa tatttaaggg aaacggtttt tgtaaatgca tatcctctgt taagtgaatt + 12541 gataaaagtt ttaataatta tagcatgtat ctttttatta ttaaaatata tattagaacc + 12601 acatactaaa aagttcatta ttttttcgat agttatttta acgataggag tagtagtatc + 12661 ttataattca gatagttttt ttattttaat gccagtagta gcactaatat taaatatgag + 12721 taatatagat ataaccaagg ttataaaagt ttggcttata gagattatag cattaatgat + 12781 ttttctagca atatgttata gactaaatat agtaggggaa gttataaact cagcaattag + 12841 atcagatggg aaaatacgat atgctctagg gtataaatat tcaacattta gctcaaatta + 12901 ctttttccat gttacgattt tctatttata tttaagaaaa catatgatta agtatgtaga + 12961 gataataact ttatttctta taaatttgta tctatatgct ttaactgata cgagggcagt + 13021 attctactac tctacagcag ctattgttat ttgtttgttg ttaaagatgt ttaagataaa + 13081 aacatatagc attattttga ataaatacag tatgttattt tcagcaataa tagctggagt + 13141 tttgtcatgg agttatcggt atagactacc attttttgat cagttagatt taatattaac + 13201 aggtagatta cgacttggaa gtgctgcttt taataatttt cacataacat tttttggaca + 13261 aaaaataaga tggatttatg aacaaaatat gttttctgaa ttgatatata attatgtgga + 13321 ctcttcatac ctaaatattt tatttggatt tggaataata attttactat taatattagt + 13381 tggatattat attattggag aaaaaaaact aagtagagat acatattata caatgatgat + 13441 tgtgttctta tcactacatt ctacatttga tcctcaatta atagacatag tgtataatcc + 13501 agcgattttg tttttgggat atgttatata taatgaagat gagataaaaa atctaaataa + 13561 aatttactaa gaaatctcta aaaatagtcg ttttatatgt attatattta aaaaactttg + 13621 taaatcaaca gtttaaaaaa ataaatatgt ttgtttctgt atttactaat aaggaatcaa + 13681 agtatctata gtaaatcgaa tatagaatag gaaaaacaac 
atctaaagta ttgttagaaa + 13741 ttaatttaaa tactctaatt tatttgttca tattttattt caacacacta taaaaaccaa + 13801 gtaggagttt ctctttaaaa tgaaaatctt aaaaaactac gcctacaatc tttcttatca + 13861 attgttggtg attatactcc caatcattac aactccctat gtgacacgag tcttttcttc + 13921 gtatgcttta gggacttatg gttattttaa ttccatcgtt acttatttta tcctcttagc + 13981 tactctagga gttgctaact atggtactaa ggtaatctct ggaaatcgaa aggaaattga + 14041 aaaaaacttt tggggaatct actccctgca attgtgtgcg gcagttctgt ctctgtcctt + 14101 atacgttgtt ctttgtctaa ctctttcttt gatgcaaaat ccagtcgcct atattctagg + 14161 attgagtgtg gtttctaaag gcttagatat ttcttggctc tttcaagggt tagaggattt + 14221 tagaaagata actgttcgaa atatcacggt taaactgata ggtgtaatct ctatcttcct + 14281 ttttgtcaaa tctgaaagtg acctttatct ctatatcttt ttactaacca tatttgaact + 14341 cttaggacaa ctaagtatgt ggttgcctgc tcgagaattt attggtagag atcattttga + 14401 tatagcatat gttagacatc atttgaaacc tgtcatatta ttattccttc ctcaagtagc + 14461 tatttctatg tatattacgt tagatcgtac catgcttggg gcattagctt ctacaaaaga + 14521 tgtagggatt tatgaccagg ctctaaagtt ggtcaatatc cttatgaccc tggtaacttc + 14581 tttgggaagc gttatgttac ctcgtgttgc gcatctgcta tccaaagggg aacaaaaagc + 14641 ggttaataaa atgcatgaga tatccttcct catttataat ttagtgattt ttccagtgat + 14701 agtagtgatt ttgattgtga atgatgattt tgttcaattt ttccttgggc aagattttca + 14761 ggatgcgcgt tatgcaattg ccatcatgat ttttcggatg ttctttatcg gttggactaa + 14821 catcatggga attcagatgc tgatacctca taatcaaaat aaagaattca tgatttcaac + 14881 aactgctcct gcaattatca gtgtaggttt aaacttgcta ttcctgccaa agtttggtta + 14941 tatcggggca gccattgtct cggttttaac agaggcattt gtatgggcaa tccaattgtt + 15001 ctatactcgc agatatttaa aaggagttcc tataatcgga tcaatggcaa aaattatact + 15061 agcatctacc attatgtatg gacttttact aagttcaaaa acagttatac atttttcacc + 15121 gactttaaat gttctagcat ttgcagcgct tggtggaata atttatcttt ttgcaattct + 15181 atctctgaaa gtggtagatg tgaaagaatt aaaacaaatt attaggaaaa attagaatga + 15241 aaaaaattcg aaatattaac ttagatttac taaaagtgct tgcatgtgtt ggagttgttt + 15301 tacttcatac aacaatggcc ggatttaaag agaccgactc 
atggaatctt ttggcatatt + 15361 tatattattt aagtacctac tctattcccc tgttttttat ggtcaatggt tatttattgt + 15421 taggcaagag ggaaataact tatcattaca tactccagaa agtaaaatgg attttaataa + 15481 cagtgtcatc atggacattt atcgtatgga tttttaagcg tgattttaca actaatccta + 15541 ttaaaaaaat tgtaggttct ttgatacaaa gagattattt ccctcagttt tggtttttcg + 15601 gtgcactaat acttatctat ttatgtttac caattttgag aaaatttcta aattcaaaaa + 15661 gaagctattt atacagtctg tctttattgc tgattattgg tttgattttt gagttatcaa + 15721 atatcttact tcagatgcca atacaaacat atgttgtaca aactttcaga ttatggactg + 15781 ggtttttcta ttatatttta ggtggtttta tagcgcaatt cactatagaa gaaatcgaat + 15841 caaggtttaa aaattggatg aaaatagtta gcatactttt gttattgatt tcaccaataa + 15901 tattattttt catagcgaag actatatacc ataatctatt tgctgaatac ttttatgata + 15961 ctttatttgt aaaagtcagt actctaggaa tttttctaac tatcctcacg cttactttga + 16021 atgaaaaccg aagagaatcg attgtttccc tttctaatca aacaatggga gtttttataa + 16081 tacatactta tattattaaa gtgtgggaaa aactatttgg ttttaatttt gtaggagcat + 16141 atttgctttt tgctctattt actttaagtg ttagttttat tattactgga atgttaatga + 16201 agattcctta cttcaatcga attgtcaaat tataaaaagg agcataagat gtacgattat + 16261 cttatcgttg gtgccggtct ttttggtgca gtatttgccc atgaatcagc cttaaaagga + 16321 aaaaaagtaa aagttattga aaaacgaaat catattgcgg gtaatatcta tactcgtgaa + 16381 gaggaaggaa ttcaagttca tcagtatggt gctcatatct ttcatacttc tgataaggag + 16441 atctgggatt atgtgaacca gtttgcagag tttaaccgtt atacaaattc tcctgttgca + 16501 aactataagg gagagattta taacttacct tttaatatga ataccttcaa taaactctgg + 16561 ggagttgtga cgccagcaga agcacaagct aagattgatg aacaacgtgc tattttaaat + 16621 ggtaaaactc ctgaaaattt ggaagaacag gcgatttctc ttgtaggtac agacatctac + 16681 gaaaaattaa tcaaagacta tacagagaaa cagtggggca aaccgactac tgaacttcca + 16741 gcctttatta ttcgtcgttt gccggtacgc ctgacctatg ataacaacta ttttaacgat + 16801 acctatcaag ggattccaat tggtggatac actcaaatag ttgaaaaaat gttggatcat + 16861 gaaaatattg atgtagaaac aaatgttgat ttctttgtga ataaagagca atatctgaaa + 16921 gattttccta agattgtctt tactggtatg attgatgaat 
tctttgacta taagttgggc + 16981 gaactagagt accgtagtct tcgttttgaa aatgagacct tggatatgga aaattaccaa + 17041 ggaaatgcag ttgtgaacta tacggatgca gaaaccccat atactcgcat tattgaacac + 17101 aaacattttg agtttgggag tcaagcaaag accatcatta ctaaagaaca ttctaaaaca + 17161 tgggaaaaag gtgatgagcc ttattatcca gttaataatg atcgtaataa tcatttgtat + 17221 aaatcgtata aaaaatttgc tgatgagcaa gggaatgtta tctttggtgg ccgcttagga + 17281 cactatcgtt attacgatat gcaccaagta attggagccg ctttgcagtg cgtgagaaat + 17341 gagttagatt aatactcaat gaaaatcaaa gagcaaacta ggaagctagc cacaggttgc + 17401 tcaaaatact gttttgaggt tgcagatgga agctgacgcg gtttgaagag attttcgaag + 17461 agtataaaca agtaaaactg actaccagtt attatttaga aatagtatta aaaattcctt + 17521 gactatgtga tatagttgag ggatttttaa atgatattca tattttttgc aaagatgttg + 17581 tttgaaaaat aattttcaaa aattctgaaa attctgttga catctttctg aaaagagtct + 17641 ataatggaga gaaagtttta aaggagaaaa tgatgaaaag ttcaaaacta tttgcccttg + 17701 cgggcgtgac attattg +// + diff --git a/public/res/serotype_genbank/serotype_14.gb b/public/res/serotype_genbank/serotype_14.gb new file mode 100644 index 0000000..1cd3ffd --- /dev/null +++ b/public/res/serotype_genbank/serotype_14.gb @@ -0,0 +1,834 @@ +LOCUS CR931662 19918 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 34359 (serotype 14). +ACCESSION CR931662 +VERSION CR931662.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 19918) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 19918) + AUTHORS Bentley,S.D. 
+ TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..19918 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="34359" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC14_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC14_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI33314.1" + /db_xref="GOA:Q4K1T1" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K1T1" + /translation="SNEEQDLTVEGKVKSVLIENTAAKEVLEKQVLAPWDAFCVELL" + gene 293..435 + /gene="aliB" + /locus_tag="SPC14_0002" + /pseudo + CDS join(293..352,349..435) + /gene="aliB" + /locus_tag="SPC14_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(433..978) + /gene="tnp" + /locus_tag="SPC14_0003" + /pseudo + CDS complement(433..978) + /gene="tnp" + /locus_tag="SPC14_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase (fragment)" + gene 1200..2645 + /gene="wzg" + /locus_tag="SPC14_0004" + CDS 1200..2645 + /gene="wzg" + /locus_tag="SPC14_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33317.1" + /db_xref="GOA:Q9R928" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q9R928" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + 
RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VDQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIIDSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1200..1316 + /gene="wzg" + /locus_tag="SPC14_0004" + /note="Signal peptide predicted for SPC0656 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 39 and 40" + misc_feature 1404..1751 + /gene="wzg" + /locus_tag="SPC14_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 6.7e-65" + misc_feature 1929..2372 + /gene="wzg" + /locus_tag="SPC14_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 5.7e-70" + gene 2647..3378 + /gene="wzh" + /locus_tag="SPC14_0005" + CDS 2647..3378 + /gene="wzh" + /locus_tag="SPC14_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33318.1" + /db_xref="GOA:Q4K1S9" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K1S9" + /translation="MIDIHSHIVFDVDDGPKSREESKALLIESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTLDALEKLEKKEIPTLNDS + RYALIEFSMHTSYRQIHTGLSNILMLGITPVIAHIERYDALENNEKHVRELIDMGCYT + QINSYHVSKPKFFGEKYKFMKKRARYFLERDLVHVVASDMHNLDSRPPYMQQAYDIIA + KKYGAKKAKELFVDNPRKIIMDQLI" + misc_feature 2650..3258 + /gene="wzh" + /locus_tag="SPC14_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 1.3e-35" + gene 3387..4079 + /gene="wzd" + /locus_tag="SPC14_0006" + CDS 3387..4079 + /gene="wzd" + /locus_tag="SPC14_0006" + /note="member of homology group 2" + /codon_start=1 + 
/transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33319.1" + /db_xref="GOA:Q4K1S8" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K1S8" + /translation="MKEQNTLEIDVLQLSRALWKRKLVILLVAIITSSVAFAYSTFVI + KPEFTSTTRIYVVNRDQGEKSGLTNQDLQAGSYLVKDYREIILSQDVLEEVVSDLKLD + LTPKGLANKIKVTVPVDTRIVSVSVNDRVPEEASRIANSLREVAAQKIISITRVSDVT + TLEEARPAISPSSPNIKRNTLIGFLAGVSGTSVIVFLLEFLNTRVKRPEDIENTLQMT + LLGVVPNLSKLK" + misc_feature 3405..3821 + /gene="wzd" + /locus_tag="SPC14_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 5.4e-51" + misc_feature 3927..4004 + /gene="wzd" + /locus_tag="SPC14_0006" + /note="PS00217 Sugar transport proteins signature 2." + gene 4089..4772 + /gene="wze" + /locus_tag="SPC14_0007" + CDS 4089..4772 + /gene="wze" + /locus_tag="SPC14_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33320.1" + /db_xref="GOA:Q4K1S7" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K1S7" + /translation="MPTLEIAQKKLEFIKKAEEYYNALCTNIQLSGDKLKVISVTSVN + PGEGKTTTSVNIARSFARAGYKTLLIDGDTRNSVISGVFKSREKITGLTEFLSGTADL + SYGLCDTNIENLFVVQSGSVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTPPVGIVI + DAVIITQKCDASILVTATGEANKRDVQKAKQQLEQTGKLFLGVVLNKLDISVDKYGVY + ASYGNYGKK" + gene 4788..6155 + /gene="wchA" + /locus_tag="SPC14_0008" + CDS 4788..6155 + /gene="wchA" + /locus_tag="SPC14_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI33321.1" + /db_xref="GOA:P72513" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:P72513" + /translation="MDKKGLEIFLAVLQSIIVILLVYFLSFVRETELERSSMVILYLL + HFFVFYFSSYGNKFFKRGYLVEFNSTIRYIFFFAIAISVLNFFIAERFSISRRGMVYF + 
LTLEGISLYLLNFLVKKYWKHVFFNPKNSKKILLLTVTENIEKVLDKLLESDELSWKL + VAVSVLDKSDFQHDKIPVIEKEKIIEFATHEVVDEVFVDLPGESYDIGEIISKFETMG + IDVTVNLNAFNKNLGRNKQIHEIVGLNVVTFSTNFYKTSHVISKRILDICGATIGLIL + FAIASLVLVPLIRKDGGPAIFAQTRIGKNGRHFTFYKFRSMRIDAEVIKEQLMDQNTM + RGGMFKMDNDPRVTKIGRFIRKTSLDELPQFWNVFIGDMSLVGTRPPTVDEYDQYTPE + QKRRLSFKPGITGLWQVSGRSKITDFDDVVKLDVAYIDNWTIWKDIEILLKTVKVVFM + RNGAK" + misc_feature 5571..6152 + /gene="wchA" + /locus_tag="SPC14_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 4.5e-144" + gene 6159..6608 + /gene="wchJ" + /locus_tag="SPC14_0009" + CDS 6159..6608 + /gene="wchJ" + /locus_tag="SPC14_0009" + /note="member of homology group 26" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase enhancer" + /protein_id="CAI33322.1" + /db_xref="GOA:P72514" + /db_xref="InterPro:IPR013969" + /db_xref="UniProtKB/TrEMBL:P72514" + /translation="MKVCLVGSSGGHLTHLYLLKPFWKDRERFWVTFDKEDARSILEN + EIFYPCYYPTNRNLKNLIKNTILAFKILRKERPDIIVSSGAAVAVPFFYLGKIFGAKT + VYIEVFDRIDAPTMTGKLVYPVTDRFIVQWEEMKKVYPKAINLGGIF" + gene 6608..7111 + /gene="wchK" + /locus_tag="SPC14_0010" + CDS 6608..7111 + /gene="wchK" + /locus_tag="SPC14_0010" + /note="member of homology group 27" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33323.1" + /db_xref="GOA:Q4K1S4" + /db_xref="InterPro:IPR007235" + /db_xref="UniProtKB/TrEMBL:Q4K1S4" + /translation="MIFVTVGTHEQQFNRLIKEVDRLKGEGFIQDDVFIQTGYSNYVP + KFCKWEKLISYEKMNQLIKESDIIITHGGPATFMAVIAKGKNPIIVPRLKKFGEHVND + HQMQFVKITKEIYNLIVIDDISDLHLILHNFKDKHFETYLNNERFNVRFNVEISNLFK + GNKINEN" + misc_feature 6608..7081 + /gene="wchK" + /locus_tag="SPC14_0010" + /note="HMMPfam hit to PF04101, Glycosyltransferase family, + score 4e-56" + gene 7101..8273 + /gene="wzy" + /locus_tag="SPC14_0011" + CDS 7101..8273 + /gene="wzy" + /locus_tag="SPC14_0011" + /note="member of homology group 103" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + 
/protein_id="CAI33324.1" + /db_xref="UniProtKB/TrEMBL:P72516" + /translation="MKIRIEPQYFLYKYLWFIILLPKQFMQLILFFLIALTLLPTYIK + EKQVFKIDTPSFCMVLWTIIYSISIIFNSLIDGLAVQVLFSDLSKAFNWLIAVFFYNY + YLKMPINIDRIKRYMYYNFTILVVFVGLFYIQRGSNVILFGRSLLDWDGFTLATSYGV + RYTGFLEYATLNGQLILFLLPLIRLFRFRFFTQTIIFAFLLEVLVLSKSRIAIVAMLI + YIAFAVVNEINSNNKWLIGIFCPIIPFMLFYNFEKIKQIFFQMFSSRSGSNATRFRVY + EESLKAINGMEMLLGAGVRIPSTVDILLGSHSMYISFIYRTGVLGSIIITVMFYYLFS + KFLKCDSSERLRSIGYILALSVFWLFEELDPHYWCLILFFSTISIFINNRKEEIVG" + gene 8270..9289 + /gene="wchL" + /locus_tag="SPC14_0012" + CDS 8270..9289 + /gene="wchL" + /locus_tag="SPC14_0012" + /note="member of homology group 76" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33325.1" + /db_xref="GOA:Q4K1S2" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K1S2" + /translation="MIEVSIIIPIYNAEKTIKNCVDSALKQNLESLEVILVNDGSNDS + TSKILEQYGDNPQVMIFHQVNMGVSAARNVGLSYASGEYVFFLDSDDILDEGMLSKMY + QFAKSNKIDLLSCWHKEPSTTQYGGNDNSSASFIARTKEEIGNHFVDIFPRSACAKLF + LRRRIEENNIAFSTEMSLGEDMSFVCQYLMVSRSIAVIDGLYYTIQNVNPQSLSKRYV + SNIENSLLMQNQLWDQLLEVYPKIEENYYKQHMDFRFYLASLYVNNLFKFDSPYSSKE + KWDNIAQQLKKYRPFLDEKVSKEKKPKNMNEMVIFYLLKSKIPALIYSFYSFKEWWKK + KRLKN" + misc_feature 8282..8749 + /gene="wchL" + /locus_tag="SPC14_0012" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 9.5e-43" + gene 9304..10260 + /gene="wchM" + /locus_tag="SPC14_0013" + CDS 9304..10260 + /gene="wchM" + /locus_tag="SPC14_0013" + /note="member of homology group 77" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33326.1" + /db_xref="GOA:O07340" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:O07340" + /translation="MEDLVSIVVPVYNVEKYLKKSIESILNQTYDNLEVLLVDDGSTD + SSGEICDSFIKVDSRIRVFHKENGGLSDARNFGIEHMKGQYVSFIDGDDYISKDYVWK + LYHSLKNNNSEVSICSFSLVDETGEKIKDELLDSGEVSLSGQQILEKALTADGYRYVV + AWNKLYRSTLFEKLKFKKGMLYEDEFLNYPLFWDCKRVSIVEEPLYLYVQRKGSIIQS + 
NMTLEKIKMKDKMHTSRIEFYAEKKNSFLHQRSCQQYCNWIVTITVSHYNVLNVAFLK + YLQHQFRRIVKYTQNDDKKLIIQNILGYINIRLAAYVKSKVM" + misc_feature 9319..9828 + /gene="wchM" + /locus_tag="SPC14_0013" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 8e-49" + gene 10348..11196 + /gene="wchN" + /locus_tag="SPC14_0014" + CDS 10348..11196 + /gene="wchN" + /locus_tag="SPC14_0014" + /note="member of homology group 34" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33327.1" + /db_xref="GOA:O07341" + /db_xref="InterPro:IPR008441" + /db_xref="UniProtKB/TrEMBL:O07341" + /translation="MFPIYIISNQNIAFQQEIDIAYRKMKRQFSHISLTESEQKNDMN + ISNKVWICWFQGEERPPELIRTCIQSMRTHFLGREIIVLTEENISDYIDIPDYITDKY + KKGSISRAHYSDILRVELLCRYGGLWVDVTVLNTGGDFSNLELPLFVYKYLDLSRKDS + QAIVASSWLISSYSNHPILLYARKLLWEYWRRKNSLCNYFLFHIFFTTATELYPIEWS + AVLTFNNHSPHMLNFELNNQFSEKRWEQLKQISVFHKLNHHIDYSIGVNNFYKFIVSS + KVEKNE" + misc_feature 10348..11181 + /gene="wchN" + /locus_tag="SPC14_0014" + /note="HMMPfam hit to PF05704, Capsular polysaccharide + synthesis protein, score 5.5e-152" + gene 11189..12652 + /gene="wzx" + /locus_tag="SPC14_0015" + CDS 11189..12652 + /gene="wzx" + /locus_tag="SPC14_0015" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33328.1" + /db_xref="GOA:O07342" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:O07342" + /translation="MSNKISKNLAYNIGYQLIGIAFPLITSPYLSRILGAENLGIHSF + TISVALYFMMFMLLGIANYGNRTIATVKREGKEILSKTFWNIYYVQLLMSVLVTIAYL + IYLYFWVSSYKFIAILQLFLLLSNAVDITWLFYGLEDFKQIVFRNALVKLLGLFLIFS + FVHESSDLWKYTLINGGVTLVGQLLLWGQLKGRLSWVKIQKKDLLSHIKPILVLFIPV + LAISIFSNMDKYMLGLMVGVKQVGFYDNANRIIDIPKALIAALEAVMLPRTSYLLAEG + QEEKSNYYIEVTILYAMMISSVLIFGIISVSDIFSLVFWGEEFLESGRLIAAMAPVFV + FSVPGNIIRTQYLIPRAKDKDYVLSLIIGALVNILLNCFLIKPFGAMGATISTVLAEF + VLYGVQFWTVRRDLDFKKYLKNGFIFYLFGMIMYLAIIAAKAHLQYNIINLVLLIVLG + GIVYTGFCCFYILISRNVHFEILREKIKRKIGYENIL" + misc_feature 11201..12007 + /gene="wzx" + 
/locus_tag="SPC14_0015" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 1.2e-83" + gene 12636..13715 + /gene="wciY" + /locus_tag="SPC14_0016" + CDS 12636..13715 + /gene="wciY" + /locus_tag="SPC14_0016" + /note="member of homology group 78" + /codon_start=1 + /transl_table=11 + /product="putative glycerol phosphotransferase" + /protein_id="CAI33329.1" + /db_xref="GOA:O07343" + /db_xref="InterPro:IPR007554" + /db_xref="UniProtKB/TrEMBL:O07343" + /translation="MKIYYKLLLKRLIFPPFYLVVTNKYWLPLNKRKVVFDNFGGRGY + GDNPKYIADELLKQDENLDLVWVVENMSTFVPKGVRKVWYGSWGAFFEWSTAKVWIDN + IRNSDRPWKRKNQVYLQTWHGSDGVKIIEKDAESTLSKSYIRMAKYDGSISDAIISSC + QLQTQTEQFKKSFWLADNVEILEYGLPRNDDFFQKKKVDHINHTVRSKYNISLDELVI + LYMPTFRDDASTKAYNLDYDKVINSFQDFYNRKVKVLIRFHPNVDNTFFNNTDKRLIN + VTDYPNPQDLMFVADIMISDYSSAPIDFLLLNRVVFLYLPDFKEYQSDKNPFFEVFKV + SKTKGIALDPFDEIIGRFQFGVRIV" + misc_feature 13248..13700 + /gene="wciY" + /locus_tag="SPC14_0016" + /note="HMMPfam hit to PF04464, + CDP-Glycerol:Poly(glycerophosphate) gl, score 7e-19" + gene 14075..18154 + /gene="lrp" + /locus_tag="SPC14_0017" + CDS 14075..18154 + /gene="lrp" + /locus_tag="SPC14_0017" + /note="member of homology group 190" + /codon_start=1 + /transl_table=11 + /product="putative surface anchored protein" + /protein_id="CAI33330.1" + /db_xref="GOA:Q4K1R7" + /db_xref="InterPro:IPR001899" + /db_xref="InterPro:IPR019931" + /db_xref="InterPro:IPR019948" + /db_xref="UniProtKB/TrEMBL:Q4K1R7" + /translation="MTVITSDTHENSDNFAFCLANGKRFPSFTDEKPKGIYTLVKDIN + KEQYTKLLKENHKWSSIPNLNQAWDTFSRLSYMYLKDPTDIVKRAWGTDLNTARTYFH + QVIQYEIWRYTDGMRVSSDTNVYIYEKFSPQQKKALEMIRTDLYNFTVPYENLEYRFY + KPDWVFGLGFQALATVRWKIEPATITVTKKWENVKEGAEKPEVWIQLLKDDKPEGDRK + RIEPDKGRTTFEIPNKDEINKYSVKEVDKEGRDWKHKDFTAGQPVNKGNGHFEITNTK + KEKPKIKVTFKKIAGDTNKDLAGAHLVLKKIFDDGNGLLIKQWDTIGQPVDIDLDAGS + YTLTEEKAPDGYMLAAPVSFYVEEDGQIILPKGEDLEAQNDKTITMVDEKIKEKPTKP + SGKLATTVEVDGTKADAQKELELSVATDKVTKTVKDTVVYENLLAGETYKLTGQLMKI + 
TADKEEEVATKETTFVADASGNGTTSLEFEDVSLEAGVKYVVYETAESEKEIDFKEGK + EKHKVEHKDKDDKAQTVVVTKEKPTKPSGKLATTVEVDGTKADAQKELELSVATDKVT + KTVKDTVVYENLLAGETYKLTGQLMKITADKEEEVATKETTFVADASGNGTTSLEFED + VSLEAGVKYVVYETAESEKEIDFKEGKEKHKVEHKDKDDKAQTVVVTKEKPTKPSGKL + ATTVEVDGTKADAQKELELSVATDKVTKTVKDTVVYENLLAGETYKLTGQLMKITADK + EEEVATKETTFVADASGNGTTSLEFEDVSLEAGVKYVVYETAESEKEIDFKEGKEKHK + VEHKDKDDKAQTVVVTKEKPTKPSGKLATTVEVDGTKADAQKELELSVATDKVTKTVK + DTVVYENLLAGETYKLTGQLMKITADKEEEVATKETTFVADASGNGTTSLEFEDVSLE + AGVKYVVYETAESEKEIDFKEGKEKHKVEHKDKDDKAQTVVVTKEKPTKPSGKLATTV + EVDGTKADAQKELELSVATDKVTKTVKDTVVYENLLAGETYKLTGQLMKITADKEEEV + ATKETTFVADASGNGTTSLEFEDVSLEAGVKYVVYETAESEKEIDFKEGKEKHKVEHK + DKDDKAQTVVVSKIKPEPGAQEVHFSKVNVGGEEIAGAEIHIKQGDTVVASWVSEAGK + THTLKLKPGHYIFHEAVAPGGYLAVTDIHFSVDETGQVTVTDVNGNTAVAEGNKLTVT + DQTKPVTPPSPEEPGAQEVHFSKVNVGGEEIAGAEIHIKQGDTVVASWVSEAGKTHTL + KLKPGHYIFHEAVAPGGYLAVTDIHFSVDETGQVTVTDVNGNTAVAEGNKLTVTDQSA + DKDKQDKLPNTGETTGTYLSILGMITAVFASLLYRSKKK" + misc_feature 14963..15169 + /gene="lrp" + /locus_tag="SPC14_0017" + /note="HMMPfam hit to PF05738, Cna protein B-type domain, + score 0.00012" + misc_feature 17441..17641 + /gene="lrp" + /locus_tag="SPC14_0017" + /note="HMMPfam hit to PF05738, Cna protein B-type domain, + score 0.00041" + misc_feature 17777..17977 + /gene="lrp" + /locus_tag="SPC14_0017" + /note="HMMPfam hit to PF05738, Cna protein B-type domain, + score 0.00041" + misc_feature 18032..18151 + /gene="lrp" + /locus_tag="SPC14_0017" + /note="HMMPfam hit to PF00746, Gram positive anchor, score + 6.3e-10" + misc_feature 18056..18073 + /gene="lrp" + /locus_tag="SPC14_0017" + /note="PS00343 Gram-positive cocci surface proteins + 'anchoring' hexapeptide." 
+ gene complement(order(18312..18893,18947..19635)) + /gene="tnp" + /locus_tag="SPC14_0018" + /pseudo + CDS complement(join(18312..18893,18947..19120,19120..19635)) + /gene="tnp" + /locus_tag="SPC14_0018" + /note="member of homology group 13" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1167 transposase" + misc_feature complement(join(18813..18893,18947..19120,19120..19143)) + /gene="tnp" + /locus_tag="SPC14_0018" + /note="HMMPfam hit to PF01610, Transposase, score 1.6e-33" + /pseudo + gene 19871..>19918 + /gene="aliA" + /locus_tag="SPC14_0019" + CDS 19871..>19918 + /gene="aliA" + /locus_tag="SPC14_0019" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33332.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ89" + /translation="MMKSSKLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acactgcggc taaagaagta cttgaaaaac aggtcttggc tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcatg taaaaacaag + 181 ggaggactgt ataaaagaca gaaatccttt gttttttata accaaggttt ataaactttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga agatgaacat + 301 aaagaagcgt gtccttagtg caggtctgac ttttgcatct gctttgcttt agctgcttgc + 361 ggccaatcag gttcagatac aaaaacttac tcatcaacct ttagtggaaa tccaactaca + 421 tttaactatc tattagacta ttacgctgat aatacagtca attgaaataa gagcaggata + 481 aaaaagcctc gtaaaaggta ttgcaacttg gtaatacctt ttacgaggct ttttgatatg + 541 agcccatgtt ttctcaatag gattgtactc aggtgagtag ggaggaagag gtaaaagttt + 601 atgcccaaac tcttcgcata aaagttctag cttccccatt ctatggaatc ttgcattatc + 661 cataataata accgatggtg tggttaatgt tggtaagaaa aacttctgaa accatacttc + 721 aaaaaagtcg ctcgtcatcg tttcttcgta agtcattgga gcgattaact caccatttgt + 781 tagacctgca accaaagaaa tcctctgata tcttcttcca gatactttgc ctcttcttaa + 841 ctgacctttt aatgagcgac catattctcg ataaaaataa gtatcgaatc ctgtttcatc + 901 aatctaaaca ggtgataggt gctttaaact attaaaattc ttaagaaata aggctacttt + 961 ttctgggtct tgttcataat tagattgaaa ctagaatagt acacttctgc ttctaaaaca 
+ 1021 ttgttagaaa tcgatttgac tgtcctgatc gatttgtcat gttcttattt cattttacta + 1081 tatttttgtt tcgcgggaag tctactaaga tacttaaaga tgcagatagt aaaaaaaatg + 1141 tagacattac cgtaaaaaag tgatataatt gtacgatgtt caaggtatag gtgttaatca + 1201 tgagtagacg ttttaaaaaa tcacgttcac agaaagtgaa gcgaagtgtt aatatcgttt + 1261 tgctgactat ttatttattg ttagtttgtt ttttattgtt cttaatcttt aagtacaata + 1321 tccttgcttt tagatatctt aacctagtgg taactgcgtt agtcctacta gttgccttgg + 1381 tagggctact cttgattatc tataaaaaag ctgaaaagtt tactattttt ctgttggtgt + 1441 tctctatcct tgtcagctct gtgtcgctct ttgcagtaca gcagtttgtt ggactgacca + 1501 atcgtttaaa tgcgacttct aattactcag aatattcaat cagtgtcgct gttttagcag + 1561 atagtgatat cgaaaatgtt acgcaactga cgagtgtgac agcaccgact gggactgata + 1621 atgaaaatat tcaaaaacta ctagctgata ttaagtcaag tcagaatacc gatttgacgg + 1681 tcgaccagag ttcgtcttac ttggcagctt acaagagttt gattgcaggg gagactaagg + 1741 ccattgtctt aaatagtgtc tttgaaaata tcatcgagtc agagtatcca gactacgcat + 1801 cgaagataaa aaagatttat accaagggat tcactaaaaa agtagaagct cctaagacgt + 1861 ctaagaatca gtctttcaat atctatgtta gtggaattga cacctatggt cctattagtt + 1921 cggtgtcgcg atcagatgtc aatatcctga tgactgtcaa tcgagatacc aagaaaatcc + 1981 tcttgaccac aacgccacgt gatgcctatg taccaatagc agatggtgga aataatcaaa + 2041 aagataaatt aacccatgcg ggcatttatg gagttgattc gtccattcac accttagaaa + 2101 atctctatgg agtggatatc aattactatg tgcgattgaa cttcacttct ttcttgaaaa + 2161 tgattgactt attgggaggg gtagatgttc ataatgatca agagttttca gctctacatg + 2221 ggaagttcca tttcccagta gggaatgtcc atctagactc tgagcaggct ctaggttttg + 2281 tacgtgaacg ctactcacta gccgatggag accgtgaccg tggtcgcaac caacaaaagg + 2341 tgattgtggc tatccttcaa aaattaacgt caaccgaagc actgaaaaat tatagtacga + 2401 tcattgatag cttgcaagat tctatccaaa caaatatgcc acttgagact atgataaatt + 2461 tggtcaatgc tcagttagaa agtggaggga attataaagt aaattctcaa gatttaaaag + 2521 gtacaggtcg gacggatctt ccttcttatg caatgccaga cagtaacctc tatgtgatgg + 2581 aaatagatga tagtagttta gctgtagtta aagcagctat acaggatgtg atggagggta + 2641 gatgaaatga tagacatcca 
ttcgcatatc gtttttgatg tagatgacgg tcccaagtca + 2701 agagaggaaa gcaaggctct cttgatagaa tcctacaggc agggggtgcg aaccattgtc + 2761 tctacctctc accgtcgcaa gggcatgttt gaaactccgg aagagaagat agcagaaaac + 2821 tttcttcagg ttcgggaaat tgcaaaagaa gtagcagatg atttagtcat tgcttatggc + 2881 gcagagatat actatactct ggatgctcta gaaaagctag aaaaaaaaga aattcctacc + 2941 cttaatgata gtcgttatgc cttgattgag tttagcatgc atacttccta tcgtcagatt + 3001 catacgggat tgagcaatat tttgatgttg ggaatcacgc cagtaattgc tcatattgaa + 3061 cgttatgatg ctttagagaa taacgaaaaa catgttcgtg aactgattga tatggggtgc + 3121 tatactcaga taaatagtta tcatgtttca aaacctaagt tctttggtga aaaatataaa + 3181 ttcatgaaaa agagagctcg gtattttttg gaacgtgatt tagttcatgt agttgcaagt + 3241 gacatgcaca atttagacag tagacctcca tatatgcaac aggcatatga tatcattgct + 3301 aagaaatatg gagcgaaaaa agcgaaagaa ctttttgtag ataatcccag aaaaattata + 3361 atggatcaat taatttagga gaaaatatga aggaacaaaa cactttggaa atcgatgtat + 3421 tgcaactatc cagagcttta tggaaaagaa agttagtcat tttattagtg gcaattataa + 3481 cttcttcagt tgcttttgcc tacagtactt ttgttatcaa acctgagttt actagtacga + 3541 ctcggattta tgtagttaac cgtgatcagg gagagaagtc tggtttaacc aatcaagact + 3601 tgcaggcagg atcatacttg gttaaagact atcgtgaaat tatcctatcg caggatgttt + 3661 tggaggaagt tgtttctgat ttgaaactag atttgacgcc aaaaggtttg gctaataaaa + 3721 ttaaagtaac agtaccagtt gatacccgta ttgtctctgt ttcagttaat gatcgagttc + 3781 ctgaagaggc aagccgtatc gctaactctt tgagagaagt agctgctcaa aaaattatca + 3841 gtattactcg tgtttctgat gtgacaacac tggaggaggc aagaccggcg atatcaccgt + 3901 cttcgccaaa tattaaacgc aatacactaa ttggtttttt ggcaggggtg agtggaacta + 3961 gtgttatagt ttttcttctt gaatttttga acactcgtgt gaaacgtccg gaagatatcg + 4021 aaaatacact gcagatgaca cttttgggag ttgtaccaaa cttgagtaag ttgaaatagg + 4081 agagaggaat gccgacatta gaaatagcac aaaaaaaact ggagttcatt aagaaggcag + 4141 aagaatatta caatgccttg tgtacaaata tacagttgag cggagataaa ctaaaagtaa + 4201 tttccgttac ttctgttaac cctggggaag gaaaaacaac tacttccgta aatatagcaa + 4261 ggtcgtttgc gcgtgcaggc tataaaactc ttttgatcga 
tggcgatact cgaaattcag + 4321 ttatatcagg agtttttaaa tcgcgtgaaa aaattacagg gctaacagaa tttttatctg + 4381 ggacagctga tttatcttac ggtttatgtg atacaaatat tgaaaattta tttgtagttc + 4441 aatcgggatc tgtatcacca aaccctacag ccttgttaca aagtaaaaat tttaatgata + 4501 tgattgaaac attgcgtaaa tattttgatt atatcattgt tgatacacca cctgttggaa + 4561 ttgttattga tgcggtaatt atcactcaaa agtgtgatgc gtccatcttg gtaacagcaa + 4621 caggtgaggc gaataaacgt gatgtccaaa aagcgaaaca acaattagaa caaacaggga + 4681 aactgttcct aggagttgtt ttaaataaat tggatatctc ggttgataag tatggagttt + 4741 acgcttccta tggaaattat ggtaaaaaat aacttaggaa agattttatg gataaaaaag + 4801 gattggaaat ttttctggca gtattacaga gtattattgt cattttattg gtttattttc + 4861 ttagctttgt tagagagaca gaacttgaac gttcttcgat ggttatacta taccttctcc + 4921 acttttttgt attctatttt agttcctatg gtaacaaatt ttttaaaaga gggtacctag + 4981 ttgagtttaa tagtactata agatatattt ttttctttgc aatagctata agtgtattaa + 5041 acttttttat agcggaacgg tttagtatct ctagaagagg aatggtatac ttcttaactt + 5101 tagaaggaat atccttatac ttgttaaatt tcttagtaaa gaaatattgg aagcatgtgt + 5161 tttttaatcc aaaaaatagc aagaaaattt tactgttaac agtaacggaa aatatagaaa + 5221 aagttcttga taaattgcta gaatctgatg aactttcatg gaaactggta gcagtaagtg + 5281 ttttggataa atctgatttt caacatgata aaatacctgt aattgaaaag gaaaaaatta + 5341 ttgaatttgc aacgcatgaa gttgtggatg aggtgtttgt cgatcttcca ggagagagct + 5401 atgatattgg agaaattatc tctaagtttg agacaatggg gatagatgta actgtaaatc + 5461 ttaatgcatt taataagaat ttgggtcgta ataaacaaat tcatgagata gtaggattga + 5521 atgtagtcac tttctctaca aatttttata aaactagtca tgtgatttca aagagaattc + 5581 tcgatatttg tggtgccact attggcctta ttctttttgc tatagctagt ctagttttag + 5641 ttccattgat tcgtaaagat ggcggaccag ctatttttgc tcaaactcgt atagggaaaa + 5701 atggtcgaca ttttaccttt tataaattcc gttcgatgcg gatcgatgct gaagttatca + 5761 aagaacagtt gatggatcaa aatacgatgc gaggtggtat gtttaagatg gacaatgatc + 5821 ctcgtgttac aaaaattggt cgctttattc gtaaaaccag tttagatgag ttaccccagt + 5881 tttggaatgt ctttatagga gatatgagtt tggtgggaac acgtccacct acagtagacg + 5941 
agtatgatca gtatactcca gaacagaaac gtcgactcag ctttaaacct ggtattacag + 6001 gtttatggca ggttagcggc cgtagtaaaa taaccgattt tgacgatgtt gtaaaattag + 6061 atgtggctta tattgataat tggacaatct ggaaagatat tgaaattttg cttaaaactg + 6121 ttaaagttgt atttatgaga aatggagcga agtaagggat gaaagtatgt ctagttggat + 6181 ctagtggagg tcatttaact catttgtatt tattaaaacc tttctggaaa gatagagaaa + 6241 gattttgggt gacttttgat aaagaagatg caagaagtat tttagaaaat gaaatatttt + 6301 atccatgtta ttatcctact aatcgtaatc taaaaaatct tattaaaaat acgattcttg + 6361 ctttcaaaat tttgagaaag gaacgccctg atattatcgt ctcatcaggg gcagctgtag + 6421 cagttccttt cttttatcta gggaaaatat ttggtgctaa gacagtctat atagaagtat + 6481 ttgatagaat tgatgctccg acaatgactg ggaaacttgt ttatccagta actgacaggt + 6541 ttattgtaca atgggaagaa atgaaaaaag tatatccgaa agcaatcaat ctcggaggga + 6601 ttttctaatg atttttgtga cagtaggtac tcatgaacaa cagtttaatc gacttataaa + 6661 agaggttgat agattaaaag gtgagggatt tattcaggat gatgttttta ttcaaacagg + 6721 atactctaat tatgttccaa aattttgtaa atgggaaaaa ttaatatctt atgaaaaaat + 6781 gaatcaattg attaaggaat cagatattat cattacccat ggcggtccag ctacgtttat + 6841 ggcagttatt gctaaaggta aaaatccaat aattgttccg cggctaaaaa aatttggtga + 6901 gcatgtaaat gatcaccaga tgcaatttgt aaaaataacg aaagaaatat acaatttaat + 6961 agttatagat gatatttcag acttacattt aattcttcat aattttaagg acaaacattt + 7021 tgaaacttat ttgaataacg agagatttaa tgtacgtttc aatgtggaaa tcagtaacct + 7081 ttttaaagga aataaaataa atgaaaatta gaatagaacc tcagtatttt ctttataaat + 7141 acctttggtt tattatccta cttccaaaac agtttatgca attaatatta ttctttttaa + 7201 ttgctttaac tcttttacca acctatataa aagaaaaaca agtttttaaa atagatacac + 7261 cgtctttttg tatggtgcta tggactatta tatattctat atctataata tttaattctc + 7321 tgattgatgg attggctgtt caagtgttat tttcagattt gagtaaagca tttaattggc + 7381 taatagcagt atttttttat aattattatt tgaaaatgcc aatcaatatt gacaggataa + 7441 agagatatat gtattataat tttactatct tagttgtttt tgtcggttta ttctatatac + 7501 aaagaggctc caatgtaatt ttgtttggaa gaagtttgtt agactgggac ggatttacat + 7561 tagctactag ttatggtgta 
agatatacag gttttttaga atacgcaact ttaaatggtc + 7621 agttaattct ttttttatta ccgttaatta gattgtttag atttagattt tttacacaaa + 7681 ctatcatttt tgcttttctt ctagaggttt tggtactaag caaatctaga atagcgattg + 7741 ttgcaatgct tatatatata gcatttgcag tagtcaatga gattaattca aacaataaat + 7801 ggcttattgg aattttctgt ccaattattc cttttatgtt attttacaat tttgaaaaaa + 7861 ttaaacagat tttttttcaa atgtttagtt ctagatcggg tagcaatgcg acacgcttta + 7921 gagtgtatga ggaatcccta aaagctatta atggaatgga aatgttactt ggcgcaggtg + 7981 tcagaattcc ctctacagta gatatattat tggggtcaca ttctatgtat ataagtttta + 8041 tttataggac aggagtttta ggaagtataa taataacagt aatgttttat tatctgtttt + 8101 ctaaattttt aaaatgtgat tcatctgaga gactaagaag tattggctat attctagctt + 8161 tgtcagtatt ttggcttttt gaagagttag atccacatta ttggtgttta attttatttt + 8221 tttcaacaat aagtattttc ataaacaata gaaaagagga aatagttgga tgatagaagt + 8281 atcaatcata attccaatat acaatgctga aaaaactatt aaaaattgtg ttgatagtgc + 8341 cttaaagcaa aatttagaat ctcttgaagt gattttggtg aatgatgggt ctaacgattc + 8401 tacatcaaaa attcttgaac agtatggtga taatccccaa gtgatgattt tccatcaagt + 8461 gaacatggga gtatctgctg ccagaaacgt aggattatcg tatgcaagcg gagagtatgt + 8521 gttcttttta gattcagatg atatattaga tgaaggtatg ctatctaaaa tgtatcagtt + 8581 tgcaaaaagt aataaaattg atcttttatc ttgttggcat aaagagccta gtacaacaca + 8641 atacggtggt aatgataata gttcagcttc atttattgca cgaacaaaag aggaaatagg + 8701 aaatcatttt gtggatattt ttccgagaag tgcttgtgct aagttatttc ttcgtagaag + 8761 aattgaggaa aacaatattg ctttttcgac tgaaatgtca ctaggagaag atatgtcatt + 8821 cgtttgccaa tacttgatgg tctcaaggag tattgcagta attgatggac tgtattatac + 8881 tattcagaat gttaatccac agtcattatc taagcgatat gtaagtaata tcgaaaactc + 8941 cctattaatg cagaatcagt tatgggatca attattagaa gtttatccta aaattgagga + 9001 gaactactac aagcaacata tggattttag attttatctt gctagtttat atgtgaataa + 9061 tttatttaaa tttgattctc cgtattcctc aaaagaaaaa tgggataata ttgcacaaca + 9121 attaaaaaaa tatagaccat ttttagatga gaaagtgagc aaagaaaaga agcctaaaaa + 9181 tatgaatgag atggtcattt tttatttact gaagtctaaa 
attcccgcgt taatctattc + 9241 tttttactca tttaaagaat ggtggaagaa aaagcgatta aaaaattgaa ggagaaatca + 9301 gttatggaag atttagtaag cattgtcgtt ccggtctata atgtagaaaa atatttaaaa + 9361 aaatcaatag aaagtatttt gaatcaaacg tatgataacc ttgaggttct attagtcgat + 9421 gatggcagta cagatagtag tggggaaatt tgcgattcat ttattaaagt tgattcaaga + 9481 ataagagtgt ttcataaaga aaacggtggt ttatcggatg ctcgaaattt tggaatagag + 9541 catatgaaag gccaatatgt atcgtttatt gatggcgatg attatatatc taaggattat + 9601 gtgtggaagt tgtatcattc tctaaaaaac aataattcag aggtgtctat atgttctttt + 9661 tcattggttg atgaaacggg tgaaaagata aaagatgagc tactagattc tggggaagta + 9721 tccttgtctg gtcaacaaat attagaaaaa gcgttaacag cagatggtta tcgctatgtt + 9781 gttgcttgga ataagcttta tcggtcaact ttatttgaaa aattaaaatt taaaaaagga + 9841 atgttgtatg aggatgaatt tcttaactat cctctatttt gggactgtaa aagggtatca + 9901 attgtagagg agccgttata tttatacgtt caacgaaaag gaagcattat acaaagtaat + 9961 atgactttag aaaaaataaa gatgaaggat aaaatgcata catcgcgtat tgaattttat + 10021 gcagaaaaaa agaattcctt tttacaccaa cgttcgtgtc aacagtattg taactggatt + 10081 gttacaataa ctgttagtca ttacaatgtt ttgaatgtag cctttttaaa atatttgcaa + 10141 catcaattta gaagaattgt taaatataca caaaacgatg ataagaaact gattatacag + 10201 aatattttag gctatataaa tattcgttta gcagcttatg taaaatcaaa agtaatgtag + 10261 ggtgtaagga gaaataatgc tggaaaaaat tttagcttct attaacaatc gctctttttt + 10321 agtaaattga aaaataaaat tcatagaatg tttccgatat atattatcag caatcaaaat + 10381 atagcttttc aacaagagat tgatattgct tatagaaaaa tgaagcgaca atttagccat + 10441 atttcgttga ctgaaagtga acaaaaaaat gatatgaaca tttcgaataa agtttggatt + 10501 tgttggtttc agggcgaaga acgccctccg gagttaatta gaacatgtat tcaatcaatg + 10561 agaactcatt ttcttggaag agagattatc gtactgacag aagaaaatat aagtgactat + 10621 atagatatac cagattatat cactgataaa tataaaaagg gttcgatttc tcgtgcacat + 10681 tattcagata tccttcgggt agaactctta tgtcgttatg gaggattatg ggtagatgta + 10741 acagtgttga atacaggagg agatttctca aatcttgagt tgccactttt tgtatataaa + 10801 tatttggatt tatcaagaaa agattctcaa gccattgtag catcaagttg 
gttaatttcg + 10861 tcatatagta atcatcctat attgctgtat gcgagaaaac tactctggga gtattggcgt + 10921 agaaaaaata gtttatgcaa ttatttttta tttcatatat tctttacaac agctacagag + 10981 ctgtacccaa tcgaatggtc tgctgtcctt acttttaaca atcattctcc tcatatgctt + 11041 aattttgagt taaataatca attttcagaa aaaaggtggg aacagctaaa acagatatcg + 11101 gtgtttcata aattaaatca tcatatagat tattctatcg gtgttaacaa tttttataag + 11161 tttatagtat cttcgaaagt tgagaaaaat gagtaataaa atcagtaaaa atttagccta + 11221 caatatagga tatcaattaa ttggtattgc ctttcctttg ataacttctc cttatttatc + 11281 acggatatta ggcgctgaaa atttaggtat tcattctttt actatctcag tagcacttta + 11341 ctttatgatg tttatgctac ttggaattgc aaattatgga aataggacaa tagcgaccgt + 11401 taaacgagaa gggaaagaga ttttatcaaa aacgttttgg aatatctact atgtccagtt + 11461 gctaatgtcg gttctagtaa ctatcgcata tctcatttat ttatattttt gggtgtcgag + 11521 ttacaagttc attgcgattt tacaactttt tttgttatta tcgaatgcag ttgatattac + 11581 ttggttattt tatggattag aagattttaa acaaattgtt tttagaaatg cattagttaa + 11641 acttcttggt ttgtttttaa tattttcgtt tgtacatgaa agctcagatt tatggaagta + 11701 caccttaata aacggaggag tgactttagt tgggcaactt ttgttatggg gacaattaaa + 11761 aggcagatta tcttgggtga agattcaaaa aaaggattta ctatctcata tcaaaccaat + 11821 tttagttctt ttcattcctg tgttagcaat cagtatcttt agtaatatgg ataaatatat + 11881 gcttggttta atggttggtg ttaagcaagt tggattttat gataatgcaa atcgtattat + 11941 cgatattcct aaagcattaa ttgcagcatt agaggctgtt atgttaccac gaacatctta + 12001 tttattagca gaaggtcagg aggaaaaaag taattactat atagaggtta caatccttta + 12061 tgcgatgatg atttcgagtg tattgatatt tggtataata tcggtttctg atattttctc + 12121 gcttgtattt tggggagaag aattccttga atcaggaaga ttaattgctg ctatggcacc + 12181 agtttttgtt ttttctgttc caggaaatat aattagaaca cagtatttga ttcctagagc + 12241 aaaggataaa gattatgtgt tgtctctaat aataggtgct ctagttaata tattattgaa + 12301 ctgtttctta ataaaacctt ttggagccat gggtgctacg attagtacag ttttggcaga + 12361 atttgtcttg tatggagtgc aattttggac agtcagaaga gatttagact ttaaaaaata + 12421 tttaaagaat ggttttatat tttacctatt tggtatgatt atgtatttag 
ctattatagc + 12481 agcaaaagct catttgcaat ataatataat aaatcttgtt ctccttatag tgctgggagg + 12541 aatagtatat actggctttt gttgtttcta cattttaata tcaagaaacg tacattttga + 12601 gatattacgg gaaaaaatta aacgaaagat tggttatgaa aatatattat aaattattat + 12661 taaagagatt aatatttccc cccttttatt tagtggtaac caataaatat tggttaccac + 12721 taaataaaag aaaagttgta tttgataact ttggtggtag aggatatgga gacaatccaa + 12781 agtatattgc tgatgaacta ttaaaacaag atgagaatct tgatttagtt tgggtagtgg + 12841 aaaatatgag tacttttgtt ccaaaaggag ttagaaaagt atggtatgga agttggggag + 12901 ctttttttga atggagcacc gcaaaggtat ggattgacaa cattagaaat tcagatcgtc + 12961 cttggaaaag gaaaaatcaa gtttatttgc aaacatggca tggttctgat ggagttaaaa + 13021 taatcgaaaa agatgcagag tcaacacttt caaaatcata tatcaggatg gctaaatacg + 13081 atggtagcat ctctgatgca atcatttcta gttgccaact gcaaacacaa acagaacagt + 13141 ttaaaaaatc attttggttg gctgataatg ttgaaatctt ggagtatggt ttaccaagaa + 13201 atgatgattt ttttcaaaaa aagaaagttg accatataaa ccatacagtc agatctaagt + 13261 ataatatctc cctagatgaa ttggtaattt tgtatatgcc tacttttagg gatgatgctt + 13321 caacgaaggc gtataatctt gattacgata aggtaataaa ttcatttcaa gatttttata + 13381 acagaaaagt taaagtattg attcgttttc atccaaatgt agataataca ttttttaata + 13441 atactgataa aagattaatt aatgtgacag attatcctaa tccgcaggat ttaatgtttg + 13501 tggctgatat tatgatttca gactattcgt cagcacccat agattttttg ttattaaatc + 13561 gagtagtctt tctgtatcta ccagatttta aagaatatca gagcgataaa aatccgtttt + 13621 ttgaagtttt caaagtttcg aaaaccaaag gcattgcgct tgatccgttt gatgagatta + 13681 ttggtcgctt ccagtttggc gttagaatag tgtagttgaa gggcgttgat aatctttttg + 13741 gagtttacag aaagaattaa ctagaacata aggagaaaaa taattgttaa aattgataca + 13801 aaacaagaaa aaggcgggaa ctaaaaagtg aaaaaatcta taatgacaaa ttttgttaaa + 13861 tttagaaaaa acaatttaac tagacgcaaa ggaatattga gctttgttgt agcgtttacg + 13921 ctcttactta cttacttact tacttactgc gtcgcgaccc gtatttgcag ggggatttcc + 13981 gaatgatgca aaaggaatat cagggaacgg taaatattat tctttaggac aaattgaaaa + 14041 attatattct aatcaattcg caacgtataa taatttgacg gtgattacat 
ctgatacaca + 14101 cgagaactct gataattttg ccttttgttt agcgaatgga aaaaggtttc catcatttac + 14161 tgatgagaaa cctaaaggaa tctacacctt ggttaaagat attaataagg agcagtatac + 14221 taagttacta aaagagaacc ataaatggtc atcaattcca aatcttaatc aagcatggga + 14281 tactttctca agattatctt atatgtattt gaaagatccc actgatattg ttaaaagagc + 14341 ctggggaacc gatttaaata cagctcgaac ttattttcat caggttatac agtacgaaat + 14401 atggagatat acggatggta tgagagtatc tagtgataca aacgtctata tatacgaaaa + 14461 attttctccg caacaaaaaa aggccttgga aatgattcgt actgacttat ataattttac + 14521 agtcccatat gaaaatcttg aatatagatt ttataagcca gattgggtat ttggtttagg + 14581 atttcaagct ttagcaacag ttagatggaa aattgaacca gctaccatta ctgttactaa + 14641 aaaatgggaa aatgtaaaag aaggagctga aaagcctgag gtctggattc aattgctcaa + 14701 agatgacaaa cctgaagggg atcgaaaacg tatagagcca gataagggtc ggactacatt + 14761 tgaaattcca aataaggatg agattaacaa atattctgta aaagaagttg ataaagaagg + 14821 tcgcgattgg aaacataaag actttacagc aggtcaacct gtaaacaaag gaaatggtca + 14881 ctttgaaatt accaatacta aaaaagagaa acctaaaata aaagttacat ttaaaaagat + 14941 tgcaggcgac acaaataaag atttggcagg cgcacatctt gtcttaaaga aaatctttga + 15001 tgatggtaat ggtttgctga taaaacaatg ggatacaatt ggacagcctg ttgatatcga + 15061 cctggatgca ggctcctata cattaacaga agaaaaagca ccagatggct acatgctagc + 15121 tgcacccgta tctttctatg tggaagaaga tggacaaatt atcctaccaa aaggtgagga + 15181 tttagaagct cagaatgata agaccatcac gatggtggat gaaaagatta aagaaaaacc + 15241 aacaaaacca tcaggtaagc ttgcgacaac tgtagaagtt gacggaacaa aagctgatgc + 15301 acagaaagag cttgagttgt cagttgcaac agataaagtt acgaagacag taaaagatac + 15361 tgttgtgtac gaaaatctgt tagctggcga aacctacaaa ctaacaggtc agttgatgaa + 15421 gattacagct gacaaagaag aggaagtagc aacgaaagaa acaactttcg tcgcagatgc + 15481 ctcaggcaac ggtacaacca gcctagagtt tgaagatgtg agccttgaag caggcgttaa + 15541 gtatgtagta tatgaaactg cagagagcga aaaagaaatt gacttcaaag aaggcaaaga + 15601 aaagcacaag gtagaacaca aagacaaaga tgacaaagct cagactgtag ttgttacgaa + 15661 agaaaaacca acaaaaccat caggtaagct tgcgacaact gtagaagttg 
acggaacaaa + 15721 agctgatgca cagaaagagc ttgagttgtc agttgcaaca gataaagtta cgaagacagt + 15781 aaaagatact gttgtgtacg aaaatctgtt agctggcgaa acctacaaac taacaggtca + 15841 gttgatgaag attacagctg acaaagaaga ggaagtagca acgaaagaaa caactttcgt + 15901 cgcagatgcc tcaggcaacg gtacaaccag cctagagttt gaagatgtga gccttgaagc + 15961 aggcgttaag tatgtagtat atgaaactgc agagagcgaa aaagaaattg acttcaaaga + 16021 aggcaaagaa aagcacaagg tagaacacaa agacaaagat gacaaagctc agactgtagt + 16081 tgttacgaaa gaaaaaccaa caaaaccatc aggtaagctt gcgacaactg tagaagttga + 16141 cggaacaaaa gctgatgcac agaaagagct tgagttgtca gttgcaacag ataaagttac + 16201 gaagacagta aaagatactg ttgtgtacga aaatctgtta gctggcgaaa cctacaaact + 16261 aacaggtcag ttgatgaaga ttacagctga caaagaagag gaagtagcaa cgaaagaaac + 16321 aactttcgtc gcagatgcct caggcaacgg tacaaccagc ctagagtttg aagatgtgag + 16381 ccttgaagca ggcgttaagt atgtagtata tgaaactgca gagagcgaaa aagaaattga + 16441 cttcaaagaa ggcaaagaaa agcacaaggt agaacacaaa gacaaagatg acaaagctca + 16501 gactgtagtt gttacgaaag aaaaaccaac aaaaccatca ggtaagcttg cgacaactgt + 16561 agaagttgac ggaacaaaag ctgatgcaca gaaagagctt gagttgtcag ttgcaacaga + 16621 taaagttacg aagacagtaa aagatactgt tgtgtacgaa aatctgttag ctggcgaaac + 16681 ctacaaacta acaggtcagt tgatgaagat tacagctgac aaagaagagg aagtagcaac + 16741 gaaagaaaca actttcgtcg cagatgcctc aggcaacggt acaaccagcc tagagtttga + 16801 agatgtgagc cttgaagcag gcgttaagta tgtagtatat gaaactgcag agagcgaaaa + 16861 agaaattgac ttcaaagaag gcaaagaaaa gcacaaggta gaacacaaag acaaagatga + 16921 caaagctcag actgtagttg ttacgaaaga aaaaccaaca aaaccatcag gtaagcttgc + 16981 gacaactgta gaagttgacg gaacaaaagc tgatgcacag aaagagcttg agttgtcagt + 17041 tgcaacagat aaagttacga agacagtaaa agatactgtt gtgtacgaaa atctgttagc + 17101 tggcgaaacc tacaaactaa caggtcagtt gatgaagatt acagctgaca aagaagagga + 17161 agtagcaacg aaagaaacaa ctttcgtcgc agatgcctca ggcaacggta caaccagcct + 17221 agagtttgaa gatgtgagcc ttgaagcagg cgttaagtat gtagtatatg aaactgcaga + 17281 gagcgaaaaa gaaattgact tcaaagaagg caaagaaaag cacaaggtag 
aacacaaaga + 17341 caaagatgac aaagctcaga ctgtagttgt atctaaaatt aagccagagc caggagcaca + 17401 agaagttcac tttagtaaag tcaatgtagg cggagaagaa attgcaggtg cggaaattca + 17461 catcaagcaa ggcgacactg tcgtggcaag ctgggtatca gaagccggta agacacatac + 17521 attgaaacta aaaccaggtc actatatctt ccatgaagca gtagctccag gtggctatct + 17581 agcagtaaca gatattcact ttagtgtaga tgaaactggt caagtgacag taactgatgt + 17641 aaatggaaat acagctgtag cggaaggcaa caagcttacg gttacagacc aaaccaaacc + 17701 agtaacccca ccaagcccag aagagccagg agcacaagaa gttcacttta gtaaagtcaa + 17761 tgtaggcgga gaagaaattg caggtgcgga aattcacatc aagcaaggcg acactgtcgt + 17821 ggcaagctgg gtatcagaag ccggtaagac acatacattg aaactaaaac caggtcacta + 17881 tatcttccat gaagcagtag ctccaggtgg ctatctagca gtaacagata ttcactttag + 17941 tgtagatgaa actggtcaag tgacagtaac tgatgtaaat ggaaatacag ctgtagcgga + 18001 aggcaacaag cttacggtta cagaccaaag tgctgataaa gataagcaag ataagttgcc + 18061 aaatacagga gaaacaacag gaacttattt gtcaatactt ggtatgatta ctgcagtttt + 18121 tgcaagccta ttgtaccgta gtaagaaaaa atagtttttg ctattctctc caatttgtga + 18181 gctacattaa agtttttgag gacgattttt gtatttttgt taacgacaaa gagggacaaa + 18241 agtctaacct taaatataaa aagcgaataa aatcggctct ttgtcaactg tagtgggttg + 18301 aaaaaaagct aagctcgaga aaggacaaat tttgtccttt cttttttgat gttcaaagcg + 18361 ataaaaatcc gttttttgaa gttttcaaag tttcgaaaac caaaggcatt gcgcttgata + 18421 agtttgatga gattattggt cgcttccagt ttggcattag aatagtgtag ttgaagggcg + 18481 ttgacgattt tctctttgtc ctttagaaag gttttaaaga cagtctgaaa aataggatga + 18541 acctgcttaa gattgtcctc gataagtccg aaaaatttct ctggttcctt attctggaag + 18601 tgaaaaagca agagctgata gagctgatag tgatgtttca agtcttgtga atagctcaaa + 18661 agcttgtcta aaatctcttt attggttaaa tgcatacgaa aagtaggacg ataaaatcgc + 18721 ttatcactca gtttacggct atcctgttga atgagtttcc agtagcgctt gatagccttg + 18781 tattcatggg atttttgatg aaactgattc atgatttgaa cacgcacacg actcatagca + 18841 cggctaagat gttgtacaat gtgaaagcga tcaagaacga ttttagcatt cgggagtgaa + 18901 acagtctggg agactgtttc agcctgagcc tagaaatttg aaagcgaagc 
tgtttagcca + 18961 agtcatagta aggactaaac atatccatag taataatttt gacgcgacat cggacggctc + 19021 tatcatattt aagaaagtga tctcggatga cagcttgtgt tctaccttca agaacagtga + 19081 tgatattgag attgttaaaa tcttgcgcaa tgaagctcat ctccatctcc cgattgaaac + 19141 agtcactccc cggactgttt caacgtccca agacataatc ttaggcagat ttctaaaatt + 19201 acactcaaag tggaagtcat tgagctttcg aatgacagtt gaagttgaaa tggccagctg + 19261 atgagcaata tcggtcatag aaatcttctc aatcaacttt tgcgcaattt tttggttgat + 19321 aatacgagga atttggtgat ttttcttgac gatagaagtt tcagcgacca tcattttaga + 19381 acaatgatag cacttgaaac gacgctttct aaggagaatt ctagtaggca taccagtcgt + 19441 ttcaagataa ggaattttag aaggtttttg aaagtcatat ttcttcattt gacttccgca + 19501 ctcaggacaa gatggagctt catagtccag tttggcgatg atttccttgt gtgtatcctt + 19561 attgacaatg tctaaaatct ggatattagg gtctttaatg tctagtaatt ttgtgataaa + 19621 atgtaattgt tccatatgaa tctttctaat gagttgtttt gtcgcttttc attatagatc + 19681 ttatgggact ttttttctac acaaaaatag gctccataat atctatagtg gatttaccca + 19741 ctacaaatat tatagagccc atattttttg caaagatgtt gtttgaaaaa taattttcaa + 19801 aaattctgaa aattctgttg acatctttct gaaaagagtc tataatggag agaaagtttt + 19861 aaaggagaaa atgatgaaaa gttcaaaact acttgccctt gcgggcgtga cattattg +// + diff --git a/public/res/serotype_genbank/serotype_15A.gb b/public/res/serotype_genbank/serotype_15A.gb new file mode 100644 index 0000000..70ac714 --- /dev/null +++ b/public/res/serotype_genbank/serotype_15A.gb @@ -0,0 +1,858 @@ +LOCUS CR931663 18517 bp DNA linear UNK 10-JUN-2024 +DEFINITION CR931663, whole genome shotgun sequence. +ACCESSION CR931663 +VERSION CR931663 +KEYWORDS . +SOURCE None + ORGANISM . + . 
+COMMENT Annotated with Bakta + Software: v1.9.3 + Database: v5.1, full + DOI: 10.1099/mgen.0.000685 + URL: github.com/oschwengers/bakta + + ##Genome Annotation Summary:## + Annotation Date :: 06/10/2024, 18:12:51 + CDSs :: 21 + tRNAs :: 0 + tmRNAs :: 0 + rRNAs :: 0 + ncRNAs :: 0 + regulatory ncRNAs :: 0 + CRISPR Arrays :: 0 + oriCs/oriVs :: 0 + oriTs :: 0 + gaps :: 0 + pseudogenes :: 0 +FEATURES Location/Qualifiers + source 1..18517 + /mol_type="genomic DNA" + gene 294..467 + /locus_tag="JANJDB_00005" + CDS 294..467 + /db_xref="RefSeq:WP_001022224.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI00016DB8BC" + /db_xref="UniRef:UniRef100_A0A0B7M524" + /db_xref="UniRef:UniRef50_A0A0H2ZQL8" + /db_xref="UniRef:UniRef90_A0A0H2ZQL8" + /product="Lipoprotein" + /locus_tag="JANJDB_00005" + /protein_id="gnl|Bakta|JANJDB_00005" + /translation="MNIKKRVLSAGLTFASALLLAACGQSGSDTKTYSSTFGGNPTTFN + YLLDYYADNIVN" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_001022224.1" + gene complement(435..797) + /locus_tag="JANJDB_00010" + CDS complement(435..797) + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0002D877B2" + /db_xref="UniRef:UniRef100_A0A9Q9U2D4" + /db_xref="UniRef:UniRef50_A0A0H2UQ11" + /db_xref="UniRef:UniRef90_A0A4J1UQC1" + /product="IS630-Spn1, transposase Orf2" + /locus_tag="JANJDB_00010" + /protein_id="gnl|Bakta|JANJDB_00010" + /translation="MVAGLTNGELIAPMTYEETMTSDFFEAWFQKFLLPTLTTPSVIIM + DNARFHRMGKLELLCEEFGYKLLPLPPYSPEYNPIEKTWAHIKKPRKRYYQVAIPFMRL + FCLVLVSIDYVISVIV" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA + sequence:UniRef:UniRef100_A0A9Q9U2D4" + gene 1202..2647 + /locus_tag="JANJDB_00015" + /gene="wzg" + CDS 1202..2647 + /db_xref="BlastRules:WP_000091082" + /db_xref="COG:COG1316" + /db_xref="COG:M" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF26" + /db_xref="UniRef:UniRef100_Q4K1R4" + 
/db_xref="UniRef:UniRef50_G3G7D5" + /db_xref="UniRef:UniRef90_O54604" + /db_xref="UniprotKB:Q4K1R4" + /db_xref="UserProtein:wzg" + /product="""integral membrane regulatory protein Wzg""" + /locus_tag="JANJDB_00015" + /protein_id="gnl|Bakta|JANJDB_00015" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYDILAFR + YLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNRLN + ATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLTVDQ + SSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAPKTSK + NQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADGGNNQK + DKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQEFSALH + GKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAIIQKLTSTEVLKNYS + SILQGLQDSLQTNMPIETMIDLVNTQLESGGNYKVNSQDLKGTGRMDLPSYAIPDSNLY + VMEIDDSSLAVVKAAIEDVMEGR" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef100_Q4K1R4" + /gene="wzg" + gene 2649..3380 + /locus_tag="JANJDB_00020" + /gene="wzh" + CDS 2649..3380 + /db_xref="BlastRules:WP_000565352" + /db_xref="RefSeq:WP_000567604.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF27" + /db_xref="UniRef:UniRef100_Q4K1R3" + /db_xref="UniRef:UniRef90_Q9AHD4" + /db_xref="UniprotKB:Q4K1R3" + /db_xref="UserProtein:wzh" + /product="""protein-tyrosine phosphatase Wzh""" + /locus_tag="JANJDB_00020" + /protein_id="gnl|Bakta|JANJDB_00020" + /translation="MIDVHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRRK + GMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDSRY + ALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYTQVN + SSHVLKSKLFGERYKFMKKRAQYFLEQDLVHVIASDMHNLDGRPPHMAEAYDLVTQKYG + EAKAQELFVDNPRKIIMDQLI" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000567604.1" + /gene="wzh" + gene 3389..4081 + /locus_tag="JANJDB_00025" + /gene="wzd" + CDS 3389..4081 + /db_xref="RefSeq:WP_000392514.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF28" + 
/db_xref="UniRef:UniRef100_Q4K1K7" + /db_xref="UniRef:UniRef50_Q54519" + /db_xref="UniRef:UniRef90_Q4K1K7" + /db_xref="UniprotKB:Q4K1K7" + /db_xref="UserProtein:wzd" + /product="""capsular polysaccharide biosynthesis protein + Wzd""" + /locus_tag="JANJDB_00025" + /protein_id="gnl|Bakta|JANJDB_00025" + /translation="MEEQNTLEIDVLQLFRSLWKRKLVILLVAIITSSVAFAYSTFVIK + PEFTSTTRIYVVNRDQGEKSGLTNQDLQAGTYLVKDYREIILSQDVLEEVVSDLKLDLT + PKGLANKIKVTVPVDTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDVTTLE + EARPATTPSSPNVRRNTLFGFLGGAVVTVIAVLLIELLDTRVKRPEDVEDVLQIPLLGL + VPDLDKMK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000392514.1" + /gene="wzd" + gene 4091..4780 + /locus_tag="JANJDB_00030" + /gene="wze" + CDS 4091..4780 + /db_xref="RefSeq:WP_001142531.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF29" + /db_xref="UniRef:UniRef100_Q4K1K6" + /db_xref="UniRef:UniRef50_Q54520" + /db_xref="UniRef:UniRef90_O84996" + /db_xref="UniprotKB:Q4K1K6" + /db_xref="UserProtein:wze" + /product="""tyrosine-protein kinase Wze""" + /locus_tag="JANJDB_00030" + /protein_id="gnl|Bakta|JANJDB_00030" + /translation="MPTLEISQAKLDFVKKAEEYYNALCTNLQLSGDGLKVFSITSVKL + GEGKSTTSTNIAWAFARAGYKTLLIDGDIRNSVMLGVFKARDKITGLTEFLSGTTDLSQ + GLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVIDAA + IITRKCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGVVLNKFDTSVDKYGSYGNYG + DYGKNKK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_001142531.1" + /gene="wze" + gene 4795..6162 + /locus_tag="JANJDB_00035" + /gene="wchA" + CDS 4795..6162 + /db_xref="RefSeq:WP_001013462.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF2A" + /db_xref="UniRef:UniRef100_Q4K1R0" + /db_xref="UniRef:UniRef50_Q8VU30" + /db_xref="UniRef:UniRef90_Q8VU30" + /db_xref="UniprotKB:Q4K1R0" + /db_xref="UserProtein:wchA" + /product="""undecaprenylphosphate glucosephosphotransferase + WchA 
(initial sugar transferase)""" + /locus_tag="JANJDB_00035" + /protein_id="gnl|Bakta|JANJDB_00035" + /translation="MNGKIVKSSLAIIQSFLVILLTYLLSAVREAEIVSTTAIALYILH + YFVFYISDYGQDFFKRGYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYFLT + LHALLVYVLNLFIKWYWKRAYPNFKGSKKILLLTATSRVEKVLDRLIESNEVVGKLVAV + SVLDKPDFQHDCLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMGIDVT + VNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHVIAKRIIDIVGALVGLILCGLAS + IVLVPLIRKDGGSTIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTMQGGMFK + VDDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPEQKRRLSF + KPGITGLWQVSGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVFMRDGAK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_001013462.1" + /gene="wchA" + gene 6166..6615 + /locus_tag="JANJDB_00040" + /gene="wchJ" + CDS 6166..6615 + /db_xref="GO:0016740" + /db_xref="RefSeq:WP_000686638.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF2B" + /db_xref="UniRef:UniRef100_Q4K1K4" + /db_xref="UniRef:UniRef50_J9W567" + /db_xref="UniRef:UniRef90_Q4K1M2" + /db_xref="UniprotKB:Q4K1K4" + /db_xref="UserProtein:wchJ" + /product="""putative glycosyl transferase enhancer""" + /locus_tag="JANJDB_00040" + /protein_id="gnl|Bakta|JANJDB_00040" + /translation="MKICLVGSSGGHLTHLYLLKPFWKDKERFWVTFDKADARSVLSEE + VVYPCYYPTNRNIKNLIKNTFLAYKILKKERPDLIISSGAAIAVPFFYIGKLFGSKTVY + IEVFDRIDASTLTGKLVYPVTDRFIVQWEEMKKVYPKAINLGGIF" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000686638.1" + /gene="wchJ" + gene 6615..7121 + /locus_tag="JANJDB_00045" + /gene="wchK" + CDS 6615..7121 + /db_xref="KEGG:K25904" + /db_xref="RefSeq:WP_000578432.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF2C" + /db_xref="UniRef:UniRef100_Q4K1K3" + /db_xref="UniRef:UniRef50_Q9AQJ2" + /db_xref="UniRef:UniRef90_Q4K1K3" + /db_xref="UniprotKB:Q4K1K3" + /db_xref="UserProtein:wchK" + /product="""putative glycosyl transferase""" + 
/locus_tag="JANJDB_00045" + /protein_id="gnl|Bakta|JANJDB_00045" + /translation="MIFVTVGTHEQQFNRLIKEVDRLKGEGFIQDDVFIQTGYSNYVPK + FCKWEKLISYEKMNQFIEEADTIITHGGPATFMAVIAKGKSPIIVPRLKKFGEHVNDHQ + LEFVEKVLNVYNLTVITNISDLNSYISNFDERKKSDLKSKNNLFMEKFIDMINQLMETG + DIKYD" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000578432.1" + /gene="wchK" + gene 7114..8313 + /locus_tag="JANJDB_00050" + /gene="wzy" + CDS 7114..8313 + /db_xref="RefSeq:WP_000170479.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF2D" + /db_xref="UniRef:UniRef100_Q4K1Q7" + /db_xref="UniRef:UniRef50_E0Q2S4" + /db_xref="UniRef:UniRef90_Q4K1K2" + /db_xref="UniprotKB:Q4K1Q7" + /db_xref="UserProtein:wzy" + /product="""oligosaccharide repeat unit polymerase Wzy""" + /locus_tag="JANJDB_00050" + /protein_id="gnl|Bakta|JANJDB_00050" + /translation="MTKYINSCIKLLFIYSLFSELLYSYYSVSLLFTIPDLLLLAAAVI + VFVDSYSAGKIRVKNPHISLMLFFILLIFLLISFTWGTLNIYGFVMRGRYILGAFLVYF + MTNSYLDDRTFSSLINIAYFMQILNLLLVLHQNIVLHLHPDFTNGIFGFTNYANGIQGF + YCLALSVLSTVYYLYGKWGTMKSLILIAISCIICALAEIKIFFVIFIFSIILIFIFQKS + ETVKKIRIISTAAGISLLFLIAYKLIEIVLPDNLYTFFNVTKALSYENRTEFAGRTNTI + SFLWDNLFYHDYISAIFGKGLGSYSVNYIYELGKMLADGGFISVILLYSFLLSLFIRGT + ITRGKNKQSERLIVSIIAFVVMISIIVWNSTFTRSTYLVFFFLAIGNAAYKSTKLIRRD + " + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000170479.1" + /gene="wzy" + gene 8315..9343 + /locus_tag="JANJDB_00055" + /gene="wchL" + CDS 8315..9343 + /db_xref="RefSeq:WP_000405438.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF2E" + /db_xref="UniRef:UniRef100_Q4K1K1" + /db_xref="UniRef:UniRef50_Q4K1K1" + /db_xref="UniRef:UniRef90_Q4K1K1" + /db_xref="UniprotKB:Q4K1K1" + /db_xref="UserProtein:wchL" + /product="""putative glycosyl transferase""" + /locus_tag="JANJDB_00055" + /protein_id="gnl|Bakta|JANJDB_00055" + /translation="MEIQISVVIPVYNAENTINNCIESALKQDLESFEVILVNDGSNDS 
+ TSRILEQYSDNPQVKIFHQVNMGVSAARNLGLSHASGEYVFFLDSDDILDDGMLSKMYQ + FVKNNKVDLLSCWHKEPATTQYGGNENKSTSFIARTREEIGAHFVDIFPRSACAKLFFR + KIIEENNITFSTEMSLGEDMSFVYQYLMVSKSIGVIDGVYYNIQNVNPQSLSKRYVQNI + ENSLMIQNQLWNQLLEVYPKIEENYYKQHMDFRFYLANLYVNNLFKFDSPYSSKEKLDQ + IAQQLKKYRLFLDEKVSKEKMPKNINEMIVFYLLKLKIPVLIYSFYSFKEWWKRRKIKN + EG" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000405438.1" + /gene="wchL" + gene 9351..10307 + /locus_tag="JANJDB_00060" + /gene="wchM" + CDS 9351..10307 + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF2F" + /db_xref="UniRef:UniRef100_Q4K1Q5" + /db_xref="UniRef:UniRef50_E0Q2S2" + /db_xref="UniRef:UniRef90_A0A4J2AN51" + /db_xref="UniprotKB:Q4K1Q5" + /db_xref="UserProtein:wchM" + /product="""putative glycosyl transferase""" + /locus_tag="JANJDB_00060" + /protein_id="gnl|Bakta|JANJDB_00060" + /translation="MEDLISIVVPVYNVEKYLKKSIESVLNQTYQNIEILLVDDGSTDS + SGKICESFSKVDPRIRVFHKENGGLSDARNFGIEQMKGQYVAFIDSDDYISKDYVWKLY + SSIKNNDSEVSICSFLLVDEKGEKIKDELLDSGKICLTGQQILEKVLTADGYRYVVAWN + KLYRSTLFEKLKFKKGMLYEDEFLNYLLFWDCKRVSIVEEPLYLYVQRKGSIVQSNMTL + EKIKMKDEMHTSRIEFYSEKGHSFLHEKACQQYCNWIVTATTNHSKILNPNFSKYLQRQ + FRKFAKYTRNNDIRLIVQNILGFIDIRLAAYVKSKVM" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef100_Q4K1Q5" + /gene="wchM" + gene 10323..11231 + /locus_tag="JANJDB_00065" + /gene="wchN" + CDS 10323..11231 + /db_xref="RefSeq:WP_000570495.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF30" + /db_xref="UniRef:UniRef100_Q4K1J9" + /db_xref="UniRef:UniRef50_B2ILQ2" + /db_xref="UniRef:UniRef90_Q6X853" + /db_xref="UniprotKB:Q4K1J9" + /db_xref="UserProtein:wchN" + /product="""putative glycosyl transferase""" + /locus_tag="JANJDB_00065" + /protein_id="gnl|Bakta|JANJDB_00065" + /translation="MIEKILDSIKNHSFYSKLKDKIHRIIPLYIIKNQNIAFQQDTDIA + YRKLKKKFRHISLTGDELKYKMEFSNKVWICWFQGEEHAPELIKTCIQSMRNQLQGREI + 
IVLTEKNISDYTEIPGYIIEKYKKGWISRAHYSDILRIDLLCRHGGLWVDATVLNTGGD + FSNLEVPLFVYKSLNLSRKDSQAIVASSWLISSYSNHPILLYTRKLLWAYWRRKNSLCN + YFLFHICFTIATERYPIEWSAVPTFNNHSPHILHFELNEQFSEKRWEQLKHISAFHKLN + HHIDYSSGVNTFYKFIVSSKV" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000570495.1" + /gene="wchN" + gene 11236..12699 + /locus_tag="JANJDB_00070" + /gene="wzx" + CDS 11236..12699 + /db_xref="RefSeq:WP_000066241.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF31" + /db_xref="UniRef:UniRef100_Q4K1J8" + /db_xref="UniRef:UniRef50_O07342" + /db_xref="UniRef:UniRef90_Q6X852" + /db_xref="UniprotKB:Q4K1J8" + /db_xref="UserProtein:wzx" + /product="""flippase Wzx""" + /locus_tag="JANJDB_00070" + /protein_id="gnl|Bakta|JANJDB_00070" + /translation="MSNKISKNLAYNMGYQLIGIAAPLITSPYLSRILGAENLGIHSFT + MSVALYFMMFMLLGIANYGNRTIATVKREGKDILSKTFWSIYSIQLIMSILVTIAYLAY + LYLGAVHYKVIAILQLFLLLSNAVDITWFFYGLENFKQIVFRNTLVKLLGLFLIFLCVR + QGTDLWKYTFINGSVTLVGQLLLWGQLKGILTWKKIQLKELLPHIKPILILFIPVLAIS + IFTNMDKYMLGLMVDVKQVGFYDNAGRIIEIPKALIAALGAVMLPRTSYLLAEGQKEKS + KYYIEVTILYVMIISSVLMFGLISVSDIFSIIFWGEEFLESGRLISAMSPAFVFSVLGN + IIRTQYLIPRAKDKDYVVSLIAGAVVNLVLNYFFIKPFGAMGATVSTVLAEFVLSGMQF + WSVRRDLDLKRYLKNGLIFYLFGLIMYLVIITLKTQLPYNIMSLILLIVLGGIVYVIFC + CCYILMSRNLHFKLLKEKIIRKVVHKNTL" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000066241.1" + /gene="wzx" + gene 13057..13302 + /locus_tag="JANJDB_00075" + CDS 13057..13302 + /db_xref="RefSeq:WP_224332055.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI001CCE6D4A" + /db_xref="UniRef:UniRef100_UPI001CCE6D4A" + /db_xref="UniRef:UniRef50_UPI0005E8C243" + /db_xref="UniRef:UniRef90_UPI0005E8C243" + /product="acyltransferase family protein" + /locus_tag="JANJDB_00075" + /protein_id="gnl|Bakta|JANJDB_00075" + /translation="MVTKDKGLTYNSTLHAIKVLACFSVVAIHIWLPGKIGAFYQIIAR + 
FAVPMFFLISGFYSYNISKNRIKKIFRLILRSTFFM" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_224332055.1" + gene 13391..13891 + /locus_tag="JANJDB_00080" + /gene="wciZ" + CDS 13391..13891 + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0005E21D46" + /db_xref="UniRef:UniRef100_A0A9P1RFF5" + /db_xref="UniRef:UniRef50_A0A1Z3GXH7" + /db_xref="UniRef:UniRef90_A0A1Z3GXH7" + /product="WciZ" + /locus_tag="JANJDB_00080" + /protein_id="gnl|Bakta|JANJDB_00080" + /translation="MLLLFSFIMEATISDSIFYRNFLFMGIPFFGIGILIAQNQKKIIN + CKIINKILILGTIIYPILIFLEYYILGNSFEVYISSVLATIILMIFAIKSPKAINIKIL + NGIGDKYATFVYIIHQFIIVIFKFLVSNVYILKFGTIFVFLICCFLGVLFQFIKNRLLK + RFS" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA + sequence:UniRef:UniRef100_A0A9P1RFF5" + /gene="wciZ" + gene 13893..15041 + /locus_tag="JANJDB_00085" + /gene="wchX" + CDS 13893..15041 + /db_xref="RefSeq:WP_000261151.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF32" + /db_xref="UniRef:UniRef100_Q4K1Q2" + /db_xref="UniRef:UniRef50_Q9R922" + /db_xref="UniRef:UniRef90_A0A4J2AK78" + /db_xref="UniprotKB:Q4K1Q2" + /db_xref="UserProtein:wchX" + /product="""putative glycerol phosphotransferase""" + /locus_tag="JANJDB_00085" + /protein_id="gnl|Bakta|JANJDB_00085" + /translation="MVVLQNVKFLVRVVFMVIISIVLWPVRIKKNKILFINFNGKGYGD + NPKSICEYLRVTYPELDLVWLAKDNEDFPDGVRVVRYKSLQSFYEQASSKVWVYNVRNF + ERLLKKRGQFYIQTWHGASSFKLIEKQADLPLKYILEAKYDARVTDIMISDSRKQTEEF + QKYFWYSGEIFEVGMPRNDALFHYKEDYDKLNNIRKELSIDSDDYVILYAPTFRDDGDA + SYLDINFERLLQSIEQEIKKKCKILIRLHPNDSHFSNNISFNHDIIDVTLFSDMQELIL + LADVLLTDYSSAIFDFMLLNKPYVRYVNDLEKYAELRGLSDTYYELPDPIIKTAEELYD + LLPKKIENFDYDSIKKYRNEILCPIFNGTASENVGRRIIQEL" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000261151.1" + /gene="wchX" + gene 15077..16105 + /locus_tag="JANJDB_00090" + 
/gene="gtp1" + CDS 15077..16105 + /db_xref="RefSeq:WP_000794264.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF33" + /db_xref="UniRef:UniRef100_Q4K1Q1" + /db_xref="UniRef:UniRef50_Q9R921" + /db_xref="UniRef:UniRef90_Q9R921" + /db_xref="UniprotKB:Q4K1Q1" + /db_xref="UserProtein:gtp1" + /product="""putative glycerol-2-phosphate dehydrogenase""" + /locus_tag="JANJDB_00090" + /protein_id="gnl|Bakta|JANJDB_00090" + /translation="MKNNDLKIGSGAIHQISATLSQNNISGKILYCADPVVDDLYGSIV + RSQIEEIGRVKEESCNYNTIAYAMNIAERAIATDIDCIVGMGGGRVLDVCKYASFISKR + PYLSIPTTAANDGIASPVAVLKRQDDRPKSLGAAIPSMTLIDIDVIASGPIQNIKAGIG + DTISNYTALKDWELAVERGKDEMHGFAYLMSQNSLDALMKTKYNSITPDFIEVLVNSLV + LSGIAMDFAGSSRPVSGSEHLFSHALDYYGSTRNLHGIQVALGTVAVLKLIENSVDAVV + DYLQRFEVHINPKLLGIDEELFIYCMQHATKMRSNRYTYLHEVDLSTDRLKQIYKELIS + EL" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000794264.1" + /gene="gtp1" + gene 16121..16825 + /locus_tag="JANJDB_00095" + /gene="gtp2" + CDS 16121..16825 + /db_xref="RefSeq:WP_000645464.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF34" + /db_xref="UniRef:UniRef100_Q4K1J4" + /db_xref="UniRef:UniRef50_O85005" + /db_xref="UniRef:UniRef90_O85005" + /db_xref="UniprotKB:Q4K1J4" + /db_xref="UserProtein:gtp2" + /product="""putative nucleotidyl transferase""" + /locus_tag="JANJDB_00095" + /protein_id="gnl|Bakta|JANJDB_00095" + /translation="MKALILAAGLGTRLAPITNEVPKSLVPVNGKPILMKQIENLYQNN + ITDITIIAGYKSSVLTDAVTEKYPEINIIDNVDFKTTNNMYSAYLGKAAMGDSDFLMMN + ADVFYDASVIKSLLLHKAPNAIVTDLGTYIEESMKVVEKNGRLVEISKQISPEEALGAS + IDVYKFSYEAGARFFEKCKEFIEDKRELQMWSEVALNAILPEVEFIACPLDGRWLEIDN + HEDLAVAEKLFA" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000645464.1" + /gene="gtp2" + gene 16846..17673 + /locus_tag="JANJDB_00100" + /gene="gtp3" + CDS 16846..17673 + /db_xref="SO:0001217" + /db_xref="UniRef:UniRef50_Q4K1N0" + 
/db_xref="UniRef:UniRef90_Q4K1N0" + /db_xref="UniprotKB:Q4K1N0" + /db_xref="UserProtein:gtp3" + /product="""putative phosphotransferase""" + /locus_tag="JANJDB_00100" + /protein_id="gnl|Bakta|JANJDB_00100" + /translation="MTNRVDYFGADISELQNKKLFLFDMDGTIYEEDRLFEGTLELLDY + IHNIGGEYIFITNNSSKSVVDYVEKVNRLGIKAERDNFFTSAQATIVYIKENYPKSKVY + CQGTKSLIKELSDAGIDVTEQVSADIDVVLVGFDTELTSDKIRNTCEILSTKDVPFIAT + NPDIRCPVSFGFIPDCGSICDMISKSVDRKPVYIGKPEPTMVDIVRKKLNYSLFETVVI + GDRLYTDIMTGINAGVTSVCVLTGEATVNDIQQGSIKPTYTFKNVKEMWKGIV" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef90_Q4K1N0" + /gene="gtp3" + gene complement(17762..18151) + /locus_tag="JANJDB_00105" + /gene="tnp" + CDS complement(17762..18151) + /db_xref="SO:0001217" + /db_xref="UniRef:UniRef50_A0A4N9BSH4" + /db_xref="UniRef:UniRef90_A0A4M3K117" + /product="IS5 family transposase ORF B" + /locus_tag="JANJDB_00105" + /protein_id="gnl|Bakta|JANJDB_00105" + /translation="MKAQTIVTSQGRIISLDITVNYSHDMKLFKMSRRNIGQAGKILAD + SGYQGLMKIYPQAQTPRKSSELKPLTAEDKACNHALSTERSKVENIFAKVKTFKMFSTT + YRNHRKRFGLRMNLIAGIINHELGF" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA + sequence:UniRef:UniRef90_A0A4M3K117" + /gene="tnp" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acactgcggc taaagaagta cttgaaaaac aggtcttggc tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcata taaaaacaag + 181 ggaggactgt ataaaagaca gaaatccttt gttttttata accaaggttt ataaactttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactattt aaggagaaag aagatgaaca + 301 taaagaagcg agtccttagt gcaggcctga cttttgcatc tgctttgctt ttagctgctt + 361 gcggccaatc aggttcagat acaaaaactt actcatcaac ctttggtgga aatccaacta + 421 catttaacta tctattagac tattacgctg ataacatagt caattgaaac aagaacaaga + 481 caaaagagcc tcataaaagg tatggcaact tggtaatacc ttttacgagg ctttttgata + 541 tgagcccatg ttttctcaat 
aggattgtac tcaggtgagt agggaggaag aggtaaaagt + 601 ttatacccaa actcttcaca caagagttct aacttaccca ttctatggaa tcttgcatta + 661 tccataataa taaccgatgg tgtggttaat gttggtaaga gaaacttctg aaaccaagct + 721 tcaaaaaagt cgctcgtcat cgtctcttcg taagtcattg gagcgattaa ctcaccattt + 781 gttagacctg caaccaaaga aatcctctga tatcttcttc cagatacttt acctcttatt + 841 aactgacctt ttaatgagcg accatattct cgataaaaat aagtatcgaa tcctgtttcg + 901 tcaatctaaa caggtgctag gtgctttaaa ctattaaaat tcttaagaaa taaggctact + 961 ttttctgggt cttgttcata attagattga aactagaata gtacacctct gcttctaaaa + 1021 cattgttaga aatcgatttg actgtcctga tcgatttgtc atgttcttat ttcattttac + 1081 tatatttttg tttcgcggga agtctactaa gatacttaaa gatgcagata gtaaaaaaaa + 1141 tgtagacatt accgtaaaaa agtgatataa tcgtatgatg ttcaaggtat aggtgttaat + 1201 catgagtaga cgttttaaaa aatcacgttc acagaaagtg aagcgaagtg ttaatatcgt + 1261 tttgctgact atttatttat tgttagtttg ttttttattg ttcttaatct ttaagtacga + 1321 tatccttgct tttagatatc ttaacctagt ggtaactgcg ttagtcctac tagttgcctt + 1381 ggtagggcta ctcttgatta tctataaaaa agctgaaaag tttactattt ttctgttggt + 1441 gttctctatc cttgtcagct ctgtgtcgct ctttgcagta cagcagtttg ttggactgac + 1501 caatcgttta aatgcgactt ctaattactc agaatattca atcagtgtcg ctgttttagc + 1561 agatagtgat atcgaaaatg ttacgcaact gacgagtgtg acagcaccga ctgggactga + 1621 taatgaaaat attcaaaaac tactagctga tattaagtca agtcagaata ccgatttgac + 1681 ggtcgaccag agttcgtctt acttggcagc ttacaagagt ttgattgcag gggagactaa + 1741 ggccattgtc ttaaatagtg tctttgaaaa tatcatcgag tcagagtatc cagactacgc + 1801 atcgaagata aaaaagattt ataccaaggg attcactaaa aaagtagaag ctcctaagac + 1861 gtctaagaat cagtctttca atatctatgt tagtggaatt gacacctatg gtcctattag + 1921 ttcggtgtcg cgatcagatg tcaatatcct gatgactgtc aatcgagata ccaagaaaat + 1981 cctcttgacc acaacgccac gtgatgccta tgtaccaatc gcagatggtg gaaataatca + 2041 aaaagataaa ttaacccatg cgggcattta tggagttgat tcgtccattc acaccttaga + 2101 aaatctctat ggagtggata tcaattacta tgtgcgattg aacttcactt ctttcttgaa + 2161 aatgattgac ttattgggag gggtagatgt tcataatgat caagagtttt 
cagctctaca + 2221 tgggaagttc catttcccag tagggaatgt ccatctagac tctgagcagg ctctaggttt + 2281 tgtacgtgaa cgctactcac tagccgatgg agaccgtgac cgtggtcgca accaacaaaa + 2341 ggtcattgta gcaattattc agaagttaac ttctacagag gttttgaaaa actatagtag + 2401 tattcttcaa ggattgcagg attctcttca aacaaatatg ccgattgaga ctatgataga + 2461 tttagtgaat actcagttgg aaagtggggg gaattataaa gtaaattctc aagatttaaa + 2521 agggacaggt cggatggatc ttccttctta tgcaatacca gacagtaacc tctatgtgat + 2581 ggaaatagat gatagtagtt tagctgtagt taaagcagct atagaggatg tgatggaggg + 2641 tagatgaaat gatagacgtc cattcgcata tcgtttttga tgtagatgac ggtcccaagt + 2701 caagagagga aagcaaggct ctcttggcag aatcctacag gcagggggtg cgaaccattg + 2761 tctctacctc tcaccgtcgc aagggcatgt ttgaaactcc ggaagagaag atagcagaaa + 2821 actttcttca ggttcgggaa atagctaagg aagtggcgag tgacttggtc attgcttacg + 2881 gggctgaaat ttactacaca ccagatgttc tggataagct agaaaaaaag cggattccga + 2941 ccctcaatga tagtcgttat gccttgatag agtttagtat gaacactcct tatcgcgata + 3001 ttcatagcgc cttgagcaag atcttgatgt tgggaattac tccagtcatt gcccacattg + 3061 agcgctatga tgctcttgaa aataatgaaa aacgcgttcg agaattgatc gatatgggct + 3121 gttacacgca agtaaatagt tcacatgtcc tcaaatccaa actttttggc gaacgttata + 3181 aattcatgaa aaaaagagct cagtattttt tagagcagga tttggtccat gtcattgcaa + 3241 gtgatatgca caatctagac ggcagacctc ctcatatggc agaagcatat gaccttgtta + 3301 cccaaaaata cggagaagcg aaggctcagg aactttttgt agataatccc agaaaaatta + 3361 taatggatca attaatttag gagaaaatat ggaggaacaa aacactttgg aaatcgatgt + 3421 attgcaacta ttcagatctt tgtggaaaag aaagttggtc attttattag tggcaattat + 3481 aacttcttca gttgcttttg cctacagtac ttttgttatc aaacctgagt ttactagtac + 3541 gactcggatt tatgtagtta accgtgatca gggagagaag tctggtttaa ccaatcaaga + 3601 cttgcaggca ggaacatact tggttaaaga ctatcgtgaa attatcctat cgcaggatgt + 3661 tttggaggaa gttgtttctg atttgaaact agatttgacg ccaaaaggtt tggctaataa + 3721 aattaaagtg acagtaccag ttgatacccg tattgtctca atctctgtca aggataaaca + 3781 gccagaggaa gccagtcgta tcgctaattc tctacgagaa gttgctgcag aaaagatcgt + 3841 cgctgtaacg 
cgagtatctg atgtaacgac acttgaagaa gcgcgaccag ctacgactcc + 3901 ctcttctcca aatgttcgac gcaacacctt gtttggtttt cttggaggag ccgtcgtaac + 3961 agtaattgct gttcttttga ttgagttgct cgacacccgt gtgaaacgtc ctgaagatgt + 4021 tgaagatgta ctgcaaattc cacttttagg gctcgttcca gatttggaca aaatgaaata + 4081 ggaggaagtt atgccaacgt tagaaatctc acaggcaaaa ttggattttg taaaaaaggc + 4141 agaggaatat tataacgctt tgtgcacgaa cctacagtta agtggagatg gtttgaaagt + 4201 attttctatc acttctgtga aactaggaga aggaaaatca acgacttcca ccaatatcgc + 4261 ttgggctttt gcgcgtgcag gttacaaaac gctgctgatt gatggagata ttcgcaattc + 4321 tgttatgtta ggtgtcttta aagcaaggga taagattaca ggcctgacag aatttttatc + 4381 aggaactaca gacctatcac aagggctttg tgataccaat atcgaaaatc tctttgtaat + 4441 tcaggctggc tctgtgtcac cgaatccgac agctcttctt caaagtaaga atttcagtac + 4501 aatgcttgaa acattgcgta aatattttga ctacatcatt gtagatactg ctcctgtcgg + 4561 tgtcgtgatt gatgcggcta ttattacgcg aaaatgcgat gcttctattt tagtgacgga + 4621 ggcaggtgaa ataaatcgac gggatattca aaaagcaaaa gaacagttgg aacacacagg + 4681 gaagccgttt ttgggagttg tgttgaataa attcgatact tcagtagaca aatacggttc + 4741 ttatggaaat tatggagatt acgggaaaaa taaaaaatag gtcgggggat agagatgaat + 4801 ggaaaaatag taaagtcttc attggccata atccagagtt ttcttgttat tttattgact + 4861 tatctactta gtgctgtgag agaagcggag attgtttcaa caacagctat tgcactttat + 4921 atcctccatt attttgtctt ttatatcagt gattatggac aggatttctt taaaagggga + 4981 tatttgattg aacttgtcca gacattgaaa tatatcctat tctttgcact agcgattagt + 5041 atttctaatt ttttcttaga ggatcgattt agtatttcca gacgaggcat gatttacttc + 5101 ctcacattac atgctctctt agtctatgtg ctaaacctat ttatcaagtg gtattggaag + 5161 cgggcttatc ccaactttaa aggaagtaag aagattctcc tacttacagc aacttctcgt + 5221 gtcgaaaagg tactggatag attaatagaa tcaaatgagg ttgttgggaa gttggtagcc + 5281 gtcagtgtct tagataaacc agattttcag catgattgtt taaaggtagt agcagagggg + 5341 gagatagtaa actttgcgac tcatgaggtg gtcgatgaag tctttatcaa tcttccaagt + 5401 gaaaaataca atattggaga gcttgtctct cagtttgaaa cgatgggaat tgatgtaaca + 5461 gtcaatctaa atgcttttga tcgtagtttg 
gcacgtaaca agcaaatccg tgagatggca + 5521 ggattaaacg ttgtgacttt ttctacaaca ttttataaga ctagtcatgt aattgctaag + 5581 cggattattg atatcgtggg tgcattggta gggctgatac tatgtggtct agccagtatt + 5641 gtactggttc ctttgattcg aaaggatggg ggctctacta tttttgctca gacgcgtata + 5701 ggaaaaaatg gtcgtcagtt cactttttat aagtttcgct ctatgtgtgt agatgccgag + 5761 gcgaaaaaaa gagaactcat ggaacaaaat accatgcagg gtggaatgtt taaggtggac + 5821 gatgatcctc gtatcacgaa aattggtcgt tttatacgga agactagctt ggacgagcta + 5881 ccacagtttt ataatgttct aaagggagat atgagtttgg ttggcacacg gccaccaaca + 5941 gtggacgagt atgaacacta taccccagaa caaaaacgtc ggctaagttt taaacctggt + 6001 ataacaggct tatggcaggt cagtggacga agtgagatta agaattttga tgaagttgtc + 6061 aaattagatg tagcctatat agacgattgg acaatttgga aagacattga aattttattg + 6121 aagacagtta aagttgtatt tatgagagac ggagcgaagt aggaaatgaa aatatgttta + 6181 gttggatcta gtggaggtca tctgactcat ttatatcttt taaaaccttt ctggaaagat + 6241 aaagaaagat tttgggttac ttttgataag gcggacgctc ggagtgtact ctctgaggaa + 6301 gttgtatatc cctgttatta tccaaccaat cgtaatataa aaaatttaat aaaaaatact + 6361 tttctcgcct ataaaatttt aaaaaaagag agaccagatt tgattatttc ttctggtgcc + 6421 gctatcgctg ttcctttctt ttatattggg aagttatttg gatcaaagac agtgtatata + 6481 gaagtttttg atagaattga tgcttcaaca ctgacaggaa aacttgttta tccagtaacg + 6541 gataggttta ttgttcaatg ggaagaaatg aaaaaagtat acccaaaggc aattaatctc + 6601 ggagggattt tctaatgatt tttgtgacag taggtactca tgaacaacag tttaatcgac + 6661 ttattaaaga ggttgataga ttaaaaggtg agggatttat tcaggatgat gtttttattc + 6721 aaacaggata ctctaattat gttccaaaat tttgtaaatg ggaaaaatta atatcttatg + 6781 aaaaaatgaa tcaatttatt gaggaagctg atacaatcat tacccatggc ggtccagcta + 6841 cgtttatggc agttattgct aaagggaaaa gtccgataat tgttccgaga ttaaaaaaat + 6901 ttggtgagca tgtgaacgac catcaacttg aatttgttga gaaagtgtta aatgtctata + 6961 atttgacagt catcactaac ataagtgatc ttaattccta tatttctaat tttgatgagc + 7021 gaaaaaaatc agatttgaag agcaaaaata atctatttat ggagaaattt atagatatga + 7081 ttaatcagtt gatggagaca ggtgacatca agtatgacta agtacataaa 
tagctgtatc + 7141 aagttgttat tcatatattc gttatttagt gaattgctat actcatatta ttctgtatct + 7201 ctattattta cgatacctga cttattattg ttggcagcag cagtaattgt ttttgtagat + 7261 tcttattctg cagggaaaat aagagttaaa aatcctcaca ttagtttaat gctctttttt + 7321 atattgctga tatttctatt aattagtttt acttggggta ctcttaatat atatggattt + 7381 gttatgagag gaagatatat actgggagca tttctagttt attttatgac aaatagctat + 7441 ctagatgata gaaccttttc atcattgata aacattgctt attttatgca gatattgaac + 7501 ctattattag ttttacatca aaatatagta ttacatttgc accctgactt cactaatggg + 7561 atttttggtt ttactaatta tgcaaatgga atccaaggat tttattgctt agccttaagt + 7621 gttttatcta ctgtatatta tctgtatggt aaatggggaa caatgaagtc attaatattg + 7681 attgctattt cgtgtataat ttgtgcatta gcagaaataa agattttttt tgtcattttt + 7741 atattttcta ttattctaat ttttatattt caaaagtcag aaacagtaaa aaaaatacga + 7801 ataattagta cagctgctgg aatatctctt ctttttttaa ttgcctataa actcattgag + 7861 atagttttac ctgataattt gtatactttt tttaatgtta caaaggcatt atcatatgag + 7921 aataggacag agtttgcggg acgaacaaat actatttcct tcctatggga caacttattt + 7981 tatcatgatt atattagtgc tatatttggg aaaggactag gttcatactc tgttaattat + 8041 atttatgaac ttggtaaaat gcttgcagat ggtggtttta tttcagtgat tttgctttat + 8101 tcatttttgt tgtcattatt catacgggga actattacta gaggaaaaaa taagcaaagt + 8161 gaaagactaa ttgtatccat catagctttt gtggtgatga ttagcattat tgtttggaat + 8221 agtacgttca ctagatcaac ttatcttgta tttttctttc tagcaatagg taatgcagcg + 8281 tataagtcta ctaaattaat aagaagggat tgagatggaa attcaaatat cagtggtgat + 8341 tccagtatac aatgctgaaa acacgattaa taattgtatt gaaagtgctt taaaacaaga + 8401 tttagaatct tttgaagtaa ttttagtaaa cgatggatcg aacgattcta catcaagaat + 8461 tcttgaacag tatagtgata atccccaagt gaagatattt catcaagtga acatgggagt + 8521 atctgctgcc agaaatttag gtttatctca tgcaagcgga gaatacgtat tctttttaga + 8581 ttcagatgat attttagatg atggtatgct ttctaaaatg taccaatttg taaaaaataa + 8641 taaagttgat ctcttatctt gttggcataa agaacctgct acaactcaat acggtggaaa + 8701 tgagaataag tcaacttcat ttattgcacg tacaagagaa gaaataggtg ctcattttgt + 8761 tgatatcttt 
ccgagaagtg cttgtgccaa attgtttttt cgcaaaataa ttgaagaaaa + 8821 taatattact ttttcgactg agatgtcact aggtgaagat atgtcatttg tgtatcaata + 8881 cttaatggtt tctaaaagta ttggagttat tgacggggtg tattataata ttcaaaatgt + 8941 aaatccacag tcgttatcta agcgctatgt gcagaatatt gaaaattccc taatgattca + 9001 gaaccagtta tggaatcaac tgttggaagt ttatcctaaa attgaggaga actactataa + 9061 gcaacatatg gattttagat tttaccttgc taacttgtat gtaaataatt tatttaaatt + 9121 tgattctccg tattcatcaa aagaaaaact agaccaaatt gctcaacaat taaaaaagta + 9181 tagattattt ttagatgaaa aagtcagcaa agaaaagatg cctaaaaata taaatgagat + 9241 gattgttttt tatttactaa aattgaaaat tccagtgttg atttattctt tttattcgtt + 9301 taaagagtgg tggaagagaa gaaaaattaa aaatgaagga taaataagtt atggaagatt + 9361 tgataagcat tgttgttcca gtctataacg tggaaaaata tttaaaaaaa tcaatagaaa + 9421 gtgttttgaa tcagacttat caaaatatcg agattttatt ggttgatgac ggaagcacag + 9481 atagtagtgg gaaaatttgt gaatcattta gcaaagttga tcctaggata agagtatttc + 9541 ataaagaaaa tggtggttta tcagatgctc ggaattttgg aattgagcaa atgaaaggtc + 9601 aatatgtagc gtttattgat agcgatgact acatatctaa ggattatgtc tggaagttgt + 9661 attcttctat aaaaaataat gattccgagg tgtcgatttg ttctttttta ttagtcgatg + 9721 aaaaagggga aaaaataaaa gatgagctat tagattcggg aaaaatatgc ttgactggtc + 9781 aacaaatatt agaaaaagta ttaacagccg acggctatcg ctatgttgtt gcttggaata + 9841 agctttatcg gtcaacttta tttgaaaaat taaaatttaa aaaaggaatg ttgtatgagg + 9901 atgaatttct taactatctt ctattttggg actgtaaaag ggtatcaatt gtagaggagc + 9961 cgttatattt atacgttcaa cgaaaaggaa gcattgtaca aagtaatatg actttagaaa + 10021 aaataaagat gaaggatgag atgcatactt cacgcattga gttttattca gaaaaggggc + 10081 attctttttt gcacgaaaaa gcgtgtcaac agtactgcaa ttggattgtt acagcgacta + 10141 ccaatcatag taagatttta aatcctaatt tttcgaagta tttacaacga cagtttagaa + 10201 agttcgctaa atatacacga aacaatgata ttagactaat tgtgcagaac attctaggat + 10261 ttatagatat tcgtttagca gcttatgtaa aatcaaaagt aatgtagagt ataggaaaca + 10321 taatgataga aaaaatttta gattctatta aaaatcattc tttttatagt aaattgaagg + 10381 ataaaattca tagaattatt ccattatata 
ttataaaaaa tcaaaatata gcttttcaac + 10441 aagataccga tatagcatat agaaaactaa agaagaagtt taggcatatt tcgttgactg + 10501 gagatgagct taaatataaa atggagtttt caaataaagt ttggatttgt tggtttcagg + 10561 gagaagagca tgccccagag ttaattaaaa catgtattca atcaatgagg aatcaacttc + 10621 aaggaagaga aatcattgtg ttgacagaaa aaaatataag tgattataca gagattccag + 10681 gctatattat tgaaaaatac aaaaaaggat ggatttctcg tgcgcattac tctgatatcc + 10741 ttaggataga tcttctatgt cgccatggag gattatgggt agatgcaaca gtgttgaata + 10801 caggaggaga tttctcaaat cttgaggtac cactttttgt atataaatct ttgaatttat + 10861 caagaaaaga ttcacaagct attgtagcat caagttggtt aatttcgtca tatagtaatc + 10921 atcctatatt actctatacg agaaaactcc tatgggccta ctggcgaaga aaaaatagtt + 10981 tatgtaatta ttttttgttc catatatgtt ttacaatagc tacagagcgg tacccaatcg + 11041 aatggtctgc tgtccctact tttaataatc attctcctca tatacttcat tttgagttga + 11101 atgaacaatt ttcggaaaaa cggtgggaac aactgaagca tatttcggcg tttcataaat + 11161 taaatcatca tatagattat tctagcggtg ttaacacttt ttataagttc atagtatctt + 11221 cgaaagttta gaaaaatgag taataaaatt agtaaaaatt tagcctacaa tatggggtat + 11281 cagttaattg ggattgcagc tcccttgata acttctcctt atttatcacg gatattaggt + 11341 gctgaaaatt taggtattca ttcttttact atgtcggttg cactttactt tatgatgttt + 11401 atgcttcttg gaattgcaaa ttacggaaat agaacaattg cgactgttaa acgagaagga + 11461 aaggatattc tatcaaaaac gttttggagt atctactcta tccagttgat aatgtctatt + 11521 ctggtaacta tagcttatct tgcttatcta tatttggggg cagtacatta caaagttatt + 11581 gcaatattac aactcttttt attgttatca aatgctgttg atattacttg gtttttctat + 11641 ggattagaaa attttaagca aatcgttttt aggaatacat tagtcaaact tttaggatta + 11701 tttttaattt ttttatgtgt gcgtcaaggc acagatttat ggaaatacac atttataaac + 11761 ggatcagtaa ctttagttgg ccaactttta ctatggggac aattaaaagg aatattaact + 11821 tggaaaaaaa ttcaattaaa ggaattacta cctcatatca agccaatttt aattcttttt + 11881 attcctgtac tagccattag tatttttact aatatggata aatatatgct tggtttaatg + 11941 gttgatgtaa agcaggttgg attttatgac aatgcaggta gaattattga aattcctaaa + 12001 gctttgattg cagctttagg ggccgttatg 
ttaccaagaa cttcctattt attagcggaa + 12061 ggacagaaag aaaagagtaa atactacata gaggtaacaa ttttatacgt gatgattatt + 12121 tctagtgtat tgatgtttgg gctaatatcg gtatctgata ttttttccat tatattttgg + 12181 ggagaagaat ttcttgaatc aggtagattg atttctgcta tgtctccggc ttttgtcttc + 12241 tctgtattag gaaatatcat taggactcag tatttgattc ctagagctaa ggataaagat + 12301 tatgtagtgt ctctaattgc gggggctgtt gttaatctag tgctaaacta tttttttata + 12361 aaaccttttg gtgctatggg agcaacagtt agtacagttt tggcagaatt tgtattgtct + 12421 ggaatgcagt tttggtcagt aagaagagac ttagatttaa aaagatattt gaaaaacggt + 12481 ttgatattct acctatttgg tctgattatg taccttgtta ttataacact caaaactcag + 12541 ttaccataca atataatgag tcttatttta ctaatagttt tgggtggaat agtatatgtt + 12601 attttttgtt gttgctatat tttaatgtca agaaatttac attttaagtt attgaaggaa + 12661 aagattatac gaaaggttgt acataaaaat acattataaa atattagttt tattttattt + 12721 agttggatac tattaaataa acgaaagtat ttgaaacttt ggtaattgag attatagaga + 12781 taaactaagc tatattatag cttcattatt aaagtaagaa tatcggtgca gtgtagttaa + 12841 cgaataatgt gagtactcat ttcttagatg gagctagggg tcattataag ggattgatat + 12901 gacattttga gtaagttaca gctagagttt aggtttgatt atatcagata tttagatgat + 12961 ttggaaaata ataaaataag ttaggaacta tttttttatt gttttgagtg acaggtttga + 13021 ttttgggaaa tgtattttgt taaataggta ggaaagatgg ttactaaaga taaaggatta + 13081 acatataata gtactttgca tgcaataaaa gtattagcat gttttagtgt tgttgctatt + 13141 catatatggc taccaggaaa aattggagcg ttttatcaaa taatagcacg atttgcagtt + 13201 ccaatgttct ttttgatttc tggcttttat tcatataata tttcaaagaa tagaattaaa + 13261 aaaatattta gattgatatt aagaagtaca ttttttatgt aataatattt gtatggatgt + 13321 tttggagaga aggtaatatg cagtttattt ttccaataaa agactactat tgacaaaacg + 13381 atggatttct atgcttttac tattttcttt cattatggaa gctacaatta gcgattcaat + 13441 tttttataga aattttttat ttatgggaat accatttttt ggaataggaa ttcttattgc + 13501 acagaatcaa aagaagatta ttaattgtaa aataataaac aaaatattaa tcttgggaac + 13561 aattatctat ccaatactaa tatttttaga atattatatc ttgggtaatt cttttgaggt + 13621 ctatataagt tctgtgctag caaccataat 
attgatgatt ttcgcgatta aatcacctaa + 13681 agcgattaat atcaaaatac tgaatggaat tggagataaa tatgcgactt ttgtttacat + 13741 tatacaccag tttatcattg tgatatttaa atttttagta tctaatgttt atattctcaa + 13801 atttgggacg atatttgtct ttttgatatg ttgttttcta ggggttctat ttcaatttat + 13861 caaaaacaga ctattaaaaa ggtttagtta agatggttgt tttacaaaat gttaaatttt + 13921 tagtaagagt tgtttttatg gttattatca gtatagtgtt atggcctgtt cggataaaga + 13981 agaataagat actatttatt aattttaatg gtaagggata tggtgataat ccgaaaagta + 14041 tttgtgagta tcttcgagtt acatatccag agttagattt agtttggctt gcaaaagata + 14101 atgaagattt tccagatgga gtgagagttg taagatataa atctctacaa tctttttatg + 14161 agcaagctag ttcgaaggtt tgggtttata atgtaagaaa ttttgaaaga ctactaaaaa + 14221 aacgcggaca gttttatatt caaacttggc acggtgcttc tagttttaaa ctgatagaaa + 14281 agcaggctga tttaccatta aaatatattt tagaagcaaa gtatgatgca agagtcacag + 14341 atataatgat ttcagatagc agaaaacaaa ctgaagaatt tcaaaagtat ttttggtatt + 14401 caggagaaat ttttgaggtg gggatgccga gaaatgatgc cttgtttcac tataaggaag + 14461 actacgacaa gttaaataat atcagaaaag aactaagcat tgattcagat gattatgtta + 14521 ttttatatgc ccctactttc agagatgatg gggatgcatc ttatttagat ataaattttg + 14581 aacggctttt gcaaagtatt gaacaagaaa ttaagaagaa atgtaaaatt ttaattagat + 14641 tacatcctaa tgactctcat tttagtaata atatttcttt taatcatgac ataattgatg + 14701 ttacgctatt ctcagatatg caggaactta tattattggc agatgtttta ctgacagatt + 14761 attcttccgc gatatttgat tttatgcttt taaacaagcc ttatgtcaga tatgtgaatg + 14821 atttagaaaa atatgctgag cttaggggac tatcagatac atattacgaa ttgccggacc + 14881 ctatcattaa aactgctgaa gaattgtatg acttactgcc taaaaaaata gaaaattttg + 14941 attatgattc tataaaaaaa tatagaaatg aaatactgtg tccaatcttt aatggaaccg + 15001 ctagtgaaaa tgtaggaagg agaataattc aagagttgtg aagtaaaaca ttgggttatt + 15061 tttaaggtaa cgagatttga aaaataatga tttaaagata ggaagtggag ctattcatca + 15121 aatctccgct acactttctc aaaataatat ttcgggaaag attttatatt gtgctgatcc + 15181 agttgtcgat gacttgtacg gttcgatagt acgttcacaa atagaggaaa ttggtcgggt + 15241 aaaggaagaa agttgcaatt ataatactat 
tgcttatgcg atgaatatag cagaaagggc + 15301 tattgccaca gatattgact gtattgtggg aatgggagga ggtcgtgttt tagatgtctg + 15361 caagtatgca tcttttattt cgaaacgtcc ttacctatcg attccgacaa cagcagcaaa + 15421 tgatggcatt gcttccccag ttgctgtttt gaaaaggcag gatgatagac caaaaagctt + 15481 aggggcggct atcccctcaa tgacactaat tgatattgat gttattgcat caggacctat + 15541 acaaaacata aaagctggta tcggtgatac aatatccaat tacactgcat tgaaagattg + 15601 ggagttggca gttgagcgag ggaaagatga gatgcatggt tttgcatatc taatgtcgca + 15661 aaattcttta gatgctttaa tgaaaacgaa gtataattct attacccctg attttattga + 15721 agttttggta aactctttag ttttatcagg cattgcaatg gattttgcgg gaagtagtag + 15781 acctgtcagt gggtcagagc acttatttag tcatgcatta gattactatg gttctacaag + 15841 gaatcttcat ggaattcagg ttgcattagg tacagtcgca gttttgaaat taattgaaaa + 15901 ttctgttgat gctgtggtgg attacttgca aagatttgag gttcatatta acccgaaact + 15961 tttggggata gatgaagagt tgtttattta ttgtatgcaa catgctacaa aaatgagaag + 16021 taatcgctat acttatctgc atgaggttga tcttagtaca gatagattga aacaaatata + 16081 taaggaactc ataagcgagt tgtagaaaag agagaaaaaa atgaaagcac ttattttagc + 16141 agcagggtta ggaacacgtc tagccccaat taccaatgag gtaccaaaat ctttggtacc + 16201 agtcaatggt aagccaattt tgatgaaaca aattgaaaat ttatatcaaa ataatattac + 16261 agatattacg attattgctg gatataagtc atctgtatta acagatgcag ttactgaaaa + 16321 gtatccagaa attaatatta ttgataatgt tgattttaaa acgactaata atatgtattc + 16381 agcctatcta ggaaaagctg caatgggtga tagtgacttc ttaatgatga atgcagatgt + 16441 attttatgat gcttctgtta ttaaaagtct gttgcttcat aaagctccaa atgcaattgt + 16501 aactgattta ggtacttata ttgaagagtc tatgaaagtc gtagaaaaaa atgggcgttt + 16561 agtggaaatt tctaaacaga tttcacctga ggaggcttta ggggcttcta ttgatgttta + 16621 taaattctct tatgaagcag gtgctcgatt ctttgaaaag tgtaaggaat ttattgaaga + 16681 taaacgagaa cttcaaatgt ggagtgaggt tgctcttaat gcaatccttc cagaagttga + 16741 gtttatagca tgtccattgg atggccgttg gttagaaatt gataatcatg aagacctagc + 16801 tgttgcagaa aaactatttg cttaaaccga atatggagaa tgaaattgac aaatagagtt + 16861 gattattttg gtgctgatat tagtgaactt 
cagaataaaa aattattctt atttgatatg + 16921 gatggtacca tttatgaaga agatagattg tttgagggta ctctcgaatt attagactat + 16981 attcataata ttggcggtga gtatattttt attacaaaca attcatctaa gtctgttgtt + 17041 gactatgttg aaaaagttaa cagattaggt attaaagctg aacgagataa tttttttacc + 17101 tctgctcaag ccacaattgt ttatattaaa gaaaattatc ctaaatctaa agtttattgc + 17161 caaggaacaa aatctttgat aaaagaacta tctgacgcag gaattgatgt aactgagcaa + 17221 gttagtgctg atatagatgt tgttcttgtt ggttttgata cagaattaac cagtgataaa + 17281 attcgcaata cctgcgagat tctatcaaca aaggacgtac ctttcatagc tactaaccct + 17341 gatattcgct gcccagtatc gtttggattc atcccagatt gtggttctat ttgtgatatg + 17401 attagtaaat cagtcgatag gaaacctgtt tacataggta aacctgaacc tacgatggtt + 17461 gatattgttc gaaaaaaatt aaattattct ctatttgaaa cagttgtgat tggagatcgc + 17521 ttgtatacgg atatcatgac tggtataaat gcaggagtaa cttcagtttg tgtgctgaca + 17581 ggagaagcaa cggtgaatga tattcaacaa ggtagtataa aaccgactta tacatttaaa + 17641 aacgtgaaag aaatgtggaa aggaattgtc tgattttttc attctgaata gtgaattcat + 17701 gaatactgtc aaaatactcg tatgtattta aattgatttt attattagac ttcctgcaaa + 17761 actagaatcc tagttcatga ttgataatac cagcaatcaa attcattcgt aatccgaagc + 17821 gtttacgatg atttcgataa gttgttgaaa acattttaaa cgtttttact ttggcaaaga + 17881 tgttctcaac cttgcttctc tccgtagata gtgcatggtt acaggcttta tcttcagctg + 17941 ttagcggctt gagttcgctg gatttacgtg gagtttgtgc ttgaggatat atcttcataa + 18001 gcccttgata accactgtca gccaagattt taccagcttg tccgatattt ctgcgactca + 18061 ttttgaacaa cttcatatca tgactatagt tcacagtgat atccaaagaa ataattctcc + 18121 cttgacttgt gacaatcgtc tgagccttca tagcgagaaa tatctattct atcttctaga + 18181 atgtcttcca aacgaggaaa ctctcgtaaa caaagaggtt ttagaggctt atttaccatg + 18241 gactaaagtt gtacaagaaa agtgcaaata agaaatctcc agattaggaa ctatatatga + 18301 gttctctagt ctggagattt ttcaatagac ttcgttattg ggcggttaca atgatattca + 18361 tattttttgc aaagatgttg tttgaaaaat aattttcaaa aattctgaaa attctgttga + 18421 catctttctg aaaagagtct ataatggaga gaaagtttta aaggagaaaa tgatgaaaag + 18481 ttcaaaacta cttgcccttg cgggcgtgac 
attattg +// diff --git a/public/res/serotype_genbank/serotype_15B.gb b/public/res/serotype_genbank/serotype_15B.gb new file mode 100644 index 0000000..59d98d8 --- /dev/null +++ b/public/res/serotype_genbank/serotype_15B.gb @@ -0,0 +1,861 @@ +LOCUS CR931664 18624 bp DNA linear UNK 10-JUN-2024 +DEFINITION CR931664, whole genome shotgun sequence. +ACCESSION CR931664 +VERSION CR931664 +KEYWORDS . +SOURCE None + ORGANISM . + . +COMMENT Annotated with Bakta + Software: v1.9.3 + Database: v5.1, full + DOI: 10.1099/mgen.0.000685 + URL: github.com/oschwengers/bakta + + ##Genome Annotation Summary:## + Annotation Date :: 06/10/2024, 18:20:43 + CDSs :: 20 + tRNAs :: 0 + tmRNAs :: 0 + rRNAs :: 0 + ncRNAs :: 0 + regulatory ncRNAs :: 0 + CRISPR Arrays :: 0 + oriCs/oriVs :: 0 + oriTs :: 0 + gaps :: 0 + pseudogenes :: 0 +FEATURES Location/Qualifiers + source 1..18624 + /mol_type="genomic DNA" + gene 293..445 + /locus_tag="EMIKCJ_00005" + CDS 293..445 + /db_xref="RefSeq:WP_001022222.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000152F245" + /db_xref="UniRef:UniRef100_A0A0T7KK87" + /db_xref="UniRef:UniRef50_A0A0H2ZQL8" + /db_xref="UniRef:UniRef90_A0A0H2ZQL8" + /product="Lipoprotein" + /locus_tag="EMIKCJ_00005" + /protein_id="gnl|Bakta|EMIKCJ_00005" + /translation="MNIKKRVLSAGLTFASALLLAACDQSGSDTKTYSSTFSGNPTTFN + YLLDY" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_001022222.1" + gene complement(442..798) + /locus_tag="EMIKCJ_00010" + CDS complement(442..798) + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000152F246" + /db_xref="UniRef:UniRef100_A5LJR5" + /db_xref="UniRef:UniRef50_A0A0H2UQ11" + /db_xref="UniRef:UniRef90_A5LJR5" + /product="IS630-Spn1, transposase Orf2" + /locus_tag="EMIKCJ_00010" + /protein_id="gnl|Bakta|EMIKCJ_00010" + /translation="MVAGLTNGELIAPMTYEETMTSDFFEVWFQKFFLPTLTTPSVIIM + DNVRFHRMGKLELLCEEFGNKLLPLPPYSPEYNPIEKTWTHIKKHLIKGITKLQYLLQG + SFVLFLFRLTILSV" + /codon_start=1 + 
/transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef100_A5LJR5" + gene 1204..2649 + /locus_tag="EMIKCJ_00015" + /gene="wzg" + CDS 1204..2649 + /db_xref="BlastRules:WP_000091082" + /db_xref="RefSeq:WP_054378039.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF36" + /db_xref="UniRef:UniRef100_Q4K1M7" + /db_xref="UniRef:UniRef50_G3G7D5" + /db_xref="UniRef:UniRef90_Q9R928" + /db_xref="UniprotKB:Q4K1M7" + /db_xref="UserProtein:wzg" + /product="""integral membrane regulatory protein Wzg""" + /locus_tag="EMIKCJ_00015" + /protein_id="gnl|Bakta|EMIKCJ_00015" + /translation="MSRRFKKSSSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAFR + YLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNRLN + ATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLTVDQ + SSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAPKTSK + NQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADGGNNQK + DKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQEFSALH + GKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTSTEALKNYS + TIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDLPSYAMPDSNLY + VLEIDDSSLAVVKAAIQDVMEGR" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_054378039.1" + /gene="wzg" + gene 2651..3382 + /locus_tag="EMIKCJ_00020" + /gene="wzh" + CDS 2651..3382 + /db_xref="EC:3.1.3.48" + /db_xref="GO:0004725" + /db_xref="GO:0030145" + /db_xref="GO:0045227" + /db_xref="RefSeq:WP_054378040.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF37" + /db_xref="UniRef:UniRef100_Q4K1P5" + /db_xref="UniRef:UniRef50_Q54518" + /db_xref="UniRef:UniRef90_Q54518" + /db_xref="UniprotKB:Q4K1P5" + /db_xref="UserProtein:wzh" + /product="""protein-tyrosine phosphatase Wzh""" + /locus_tag="EMIKCJ_00020" + /protein_id="gnl|Bakta|EMIKCJ_00020" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRIIVSTSHRRK + GMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDSRY + 
ALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYTQVN + SSHVLKPKLFGERYKFMKKRAQYFLERDLVHVVASDMHNLDSRPPYMQQAYDIIAKKYG + AKKAKEFFVDNPRKIIMDQLI" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_054378040.1" + /gene="wzh" + gene 3391..4083 + /locus_tag="EMIKCJ_00025" + /gene="wzd" + CDS 3391..4083 + /db_xref="BlastRules:WP_000664160" + /db_xref="GO:0005351" + /db_xref="GO:0005886" + /db_xref="GO:0009103" + /db_xref="GO:0015774" + /db_xref="GO:0045227" + /db_xref="RefSeq:WP_000658143.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF38" + /db_xref="UniRef:UniRef100_Q4K1M5" + /db_xref="UniRef:UniRef50_Q54519" + /db_xref="UniRef:UniRef90_Q54519" + /db_xref="UniprotKB:Q4K1M5" + /db_xref="UserProtein:wzd" + /product="""capsular polysaccharide biosynthesis protein + Wzd""" + /locus_tag="EMIKCJ_00025" + /protein_id="gnl|Bakta|EMIKCJ_00025" + /translation="MKEHNTLEIDILQLFRALWKRKLVILLVAIITSSVAFAYSTFVIK + PEFTSTTRIYVVNRNQEEKSGLTNQDLQAGTYLVKDYREIILSQDVLEEVISDLKLDLT + PKGLANKIKVTVPVDTRIVSVSVNDRVPEEASRIANSLREVAAQKIISITRVSDVTTLE + EARPAISPSSPNIKRNILIGFLAGGVGTGVIVLLLELLDTHVKRPEDIEDTLQMTLLGV + VPNLSKLK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000658143.1" + /gene="wzd" + gene 4093..4776 + /locus_tag="EMIKCJ_00030" + /gene="wze" + CDS 4093..4776 + /db_xref="BlastRules:WP_001142521" + /db_xref="COG:COG0489" + /db_xref="COG:D" + /db_xref="EC:2.7.10.2" + /db_xref="GO:0004715" + /db_xref="GO:0005524" + /db_xref="GO:0016310" + /db_xref="GO:0045227" + /db_xref="RefSeq:WP_001142510.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF39" + /db_xref="UniRef:UniRef100_Q4K1M4" + /db_xref="UniRef:UniRef50_Q54520" + /db_xref="UniRef:UniRef90_Q54520" + /db_xref="UniprotKB:Q4K1M4" + /db_xref="UserProtein:wze" + /product="""tyrosine-protein kinase Wze""" + /locus_tag="EMIKCJ_00030" + 
/protein_id="gnl|Bakta|EMIKCJ_00030" + /translation="MPTLEIAQKKLEFIKKAEEYYNALCTNIQLSGDKLKVISVTSVNP + GEGKTTTSVNIARSFARAGYKTLLIDGDTRNSVMSGFFKSREKITGLTEFLSGTADLSH + GLCDTNIENLFVVQSGSVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTAPIGIVIDAA + IITQKCDASILVTATGEVNKRDVQKAKQQLEQTGKLFLGVILNKFDVQHKKYGSYGDYG + NYGKK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_001142510.1" + /gene="wze" + gene 4792..6159 + /locus_tag="EMIKCJ_00035" + /gene="wchA" + CDS 4792..6159 + /db_xref="RefSeq:WP_000343580.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF3A" + /db_xref="UniRef:UniRef100_Q4K1M3" + /db_xref="UniRef:UniRef50_Q8VU30" + /db_xref="UniRef:UniRef90_P72513" + /db_xref="UniprotKB:Q4K1M3" + /db_xref="UserProtein:wchA" + /product="""undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)""" + /locus_tag="EMIKCJ_00035" + /protein_id="gnl|Bakta|EMIKCJ_00035" + /translation="MDEKGLKIFLAVLQSIIVILLVYFLSFVRETELERSSMVILYLLH + FFVFYFSSYGNNFFKRGHLVEFNSTIRYIFFFAIAISVLNFFIAERFSISRRGMVYFLT + LEGISLYLLNFLVKKYWKHVFFNLKNSKKILLLTVTKNMEKVLDKLLESDELSWKLVAV + SVLDKSDFQHDKIPVIEKEKIIEFATHEVVDEVFVNLPGESYDIGEIISRFETMGIDVT + VNLKAFDKNLGRNKQIHEMVGLNVVTFSTNFYKTSHVISKRILDICGATIGLVLFAIAS + LVLVPLIRKDGGPAIFAQTRIGKNGRHFTFYKFRSMRIDAEAIKEQLMDQNTMQGGMFK + MDNDPRVTKIGRFIRKTSLDELPQFWNVFIGDMSLVGTRPPTVDEYDQYTPEQKRRLSF + KPGITGLWQVSGRSKITDFDDVVKLDVAYIDNWTIWKDIEILLKTVKVVFIRDGAK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000343580.1" + /gene="wchA" + gene 6163..6612 + /locus_tag="EMIKCJ_00040" + /gene="wchJ" + CDS 6163..6612 + /db_xref="GO:0016740" + /db_xref="RefSeq:WP_000861663.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF3B" + /db_xref="UniRef:UniRef100_Q4K1M2" + /db_xref="UniRef:UniRef50_J9W567" + /db_xref="UniRef:UniRef90_Q4K1M2" + /db_xref="UniprotKB:Q4K1M2" + /db_xref="UserProtein:wchJ" + 
/product="""putative glycosyl transferase enhancer""" + /locus_tag="EMIKCJ_00040" + /protein_id="gnl|Bakta|EMIKCJ_00040" + /translation="MKVCLVGSSGGHLTHLYLLKPFWNDKERFWVTFDKADARSVLSEE + VVYPCYYPTNRNIKNLIKNTFLAYKILKKERPDLIISSGAAIAVPFFYIGKLFGSKTVY + IEVFDRIDASTLTGKLVYPVTDRFIVQWEEMKKVYPKAINLGGIF" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000861663.1" + /gene="wchJ" + gene 6612..7115 + /locus_tag="EMIKCJ_00045" + /gene="wchK" + CDS 6612..7115 + /db_xref="RefSeq:WP_000578430.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF3C" + /db_xref="UniRef:UniRef100_Q4K1M1" + /db_xref="UniRef:UniRef50_Q4K216" + /db_xref="UniRef:UniRef90_Q4K1M1" + /db_xref="UniprotKB:Q4K1M1" + /db_xref="UserProtein:wchK" + /product="""putative glycosyl transferase""" + /locus_tag="EMIKCJ_00045" + /protein_id="gnl|Bakta|EMIKCJ_00045" + /translation="MIFVTVGTHEQQFDRLIKEVDYLKKENLIQDEVFIQIGYSSYIPK + YCEWEKIISYEKMNQLIKESDIIITHGGPATFMGVIAKGKVPIVVPRQKKFGEHVNDHQ + LQFVKLTKEIYNFIVIDDISDLYLSIRDFKDKYFGICLNNERFNLHFNAEINKLFEGNK + VDEN" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000578430.1" + /gene="wchK" + gene 7105..8277 + /locus_tag="EMIKCJ_00050" + /gene="wzy" + CDS 7105..8277 + /db_xref="RefSeq:WP_054378041.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF3D" + /db_xref="UniRef:UniRef100_Q4K1M0" + /db_xref="UniRef:UniRef50_P72516" + /db_xref="UniRef:UniRef90_A0A6G2DLE4" + /db_xref="UniprotKB:Q4K1M0" + /db_xref="UserProtein:wzy" + /product="""oligosaccharide repeat unit polymerase Wzy""" + /locus_tag="EMIKCJ_00050" + /protein_id="gnl|Bakta|EMIKCJ_00050" + /translation="MKIRIEPQYFLYKYLWLIILLPKQFMQLILFSLIVLILLPVYIKD + RQISKIDAPSFYIVLWVMMYSISIIWNFLISGLPIQVLFSDLSKAFNWILAVFFYNYYL + KNPINVDKIKKYMFYNFAILVIIVALFYVQRGANVVLFGRSLLGWDGFVSATSYGVRYA + GFLEYSTLNGQLILFLLPLIRLFKLSFFTQVTILAFLLQVLVLSKSRIAIIALIIYIVF + 
VVMVQITSINKRMIVAFYPTIPLILLYNWEKIKHIFFQMFNSRTGSNVTRFIVYEESLK + AINGLGILLGAGIRTQSTVGILLGSHSMYISFIYRTGILGSIIIVILFYYLFSKFLKSA + PSGKLISIGYILALLVFWLFEELDPHYWCLILFFSTISIFINNRKEEIVG" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_054378041.1" + /gene="wzy" + gene 8274..9299 + /locus_tag="EMIKCJ_00055" + /gene="wchL" + CDS 8274..9299 + /db_xref="RefSeq:WP_000573792.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF3E" + /db_xref="UniRef:UniRef100_Q4K1L9" + /db_xref="UniRef:UniRef50_Q4K1K1" + /db_xref="UniRef:UniRef90_Q4K1K1" + /db_xref="UniprotKB:Q4K1L9" + /db_xref="UserProtein:wchL" + /product="""putative glycosyl transferase""" + /locus_tag="EMIKCJ_00055" + /protein_id="gnl|Bakta|EMIKCJ_00055" + /translation="MIEVSIIIPIYNAEKTIKNCVDSALKQNLESLEVILVNDGSNDST + AEILNQYDRNSRVKIFHQLNKGVSTARNKGLSHASGEYVFFLDSDDILDDGMLSKMYQF + VKNNKVDLLSCWHKEPATTQYGGNENKSTSFIARTREEIGAHFVDIFPRSACAKLFFRK + IIEENNITFSTEMSLGEDMSFVYQYLMVSKSIGVIDGVYYNIQNVNPQSLSKRYVQNIE + NSLIIQNQLWNQLLEVYPKIEENYYKQHMDFRFYLANLYVNNLFKFDSPYSSKEKLDQI + AQQLKKYRLFLDEKVSKEKMPKNINEMIVFYLLKLKIPVLIYSFYSFKEWWKRRKIKNE + G" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000573792.1" + /gene="wchL" + gene 9307..10263 + /locus_tag="EMIKCJ_00060" + /gene="wchM" + CDS 9307..10263 + /db_xref="RefSeq:WP_000389753.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF3F" + /db_xref="UniRef:UniRef100_Q4K1L8" + /db_xref="UniRef:UniRef50_E0Q2S2" + /db_xref="UniRef:UniRef90_A0A4J2AN51" + /db_xref="UniprotKB:Q4K1L8" + /db_xref="UserProtein:wchM" + /product="""putative glycosyl transferase""" + /locus_tag="EMIKCJ_00060" + /protein_id="gnl|Bakta|EMIKCJ_00060" + /translation="MEDLISIVVPVYNVEKYLKKSIESILNQTYQNIEILLVDDGSTDS + SGKICESFSKVDPRIRVFHKENGGLSDARNFGIEQMKGQYVAFIDSDDYISKDYVWKLY + SSIKNNDSEVSICSFLLVDEKGEKIKDELLDSGKICLTGQQILEKVLTADGYRYVVAWN + 
KLYRSTLFEKLKFKKGMLYEDEFLNYPLFWDCKRVSIVEEPLYLYVQRKGSIVQSNMTL + EKIKMKDEMHTSRIEFYSEKGHSFLHEKACQQYCNWIVTATTNHSKILNPNFSKYLQRQ + FRKFAKYTRNNDIRLIVQNILGFIDIRLAAYVKSKVM" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000389753.1" + /gene="wchM" + gene 10279..11187 + /locus_tag="EMIKCJ_00065" + /gene="wchN" + CDS 10279..11187 + /db_xref="RefSeq:WP_050103050.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI00001D8FD1" + /db_xref="UniRef:UniRef100_Q6X853" + /db_xref="UniRef:UniRef50_B2ILQ2" + /db_xref="UniRef:UniRef90_Q6X853" + /db_xref="UniprotKB:Q6X853" + /db_xref="UserProtein:wchN" + /product="""putative glycosyl transferase""" + /locus_tag="EMIKCJ_00065" + /protein_id="gnl|Bakta|EMIKCJ_00065" + /translation="MIEKILDSIKNHSFYSKLKDKIHRIIPLYIIKNQNIAFQQDTDIA + YRKLKKKFRHISLTGDELKYKMEFSNKVWICWFQGEEHAPELIKTCIQSMRNQLQGREI + IVLTEKNISDYTEIPDYIIEKYKKGWISRAHYSDILRIDLLCRHGGLWVDATVLNTGGD + FSNLEVPLFVYKSLNLSRKDSQAIVASSWLISSYSNHPILLYTRKLLWAYWRRKNSLCN + YFLFHICFTIATERYPIEWSAVPTFNNHSPHILHFELNEQFSEKRWEQLKHISAFHKLN + HHIDYSSGVNTFYKFIVSSKV" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050103050.1" + /gene="wchN" + gene 11192..12655 + /locus_tag="EMIKCJ_00070" + /gene="wzx" + CDS 11192..12655 + /db_xref="RefSeq:WP_054378042.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI00001D8FD2" + /db_xref="UniRef:UniRef100_Q6X852" + /db_xref="UniRef:UniRef50_O07342" + /db_xref="UniRef:UniRef90_Q6X852" + /db_xref="UniprotKB:Q6X852" + /db_xref="UserProtein:wzx" + /product="""flippase Wzx""" + /locus_tag="EMIKCJ_00070" + /protein_id="gnl|Bakta|EMIKCJ_00070" + /translation="MSNKISKNLAYNMGYQLIGIAAPLITSPYLSRILGAENLGIHSFT + MSVALYFMMFMLLGIANYGNRTIATVKREGKDILSKTFWSIYSIQLIMSILVTIAYLAY + LYLGAVHYKVIAILQLFLLLSNAVDITWFFYGLENFKQIVFRNTLVKLLGLFLIFLCVR + QGTDLWKYTFINGSVTLVGQLLLWGQLKGILTWKKIQLKELLPHIKPILILFIPVLAIS + 
IFTNMDKYMLGLMVDVKQVGFYDNAGRIIEIPKALIAALGAVMLPRTSYLLAEGQKEKS + KYYIEVTILYVMIISSVLMFGLISVSDIFSIIFWGEEFLESGRLISAMSPAFVFSVLGN + IIRTQYLIPRAKDKDYVVSLIAGAVVNLVLNYFFIKPFGAMGATISTVLAEFVLSGMQF + WSVRRDLDLKRYLKNGLIFYLFGLIMHLIIIALKTQLPYNIMSLILLIVLGGIVYVIFC + CCYILMSRNLHFKLLKEKIIRKVVHKNTL" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_054378042.1" + /gene="wzx" + gene 13021..13998 + /locus_tag="EMIKCJ_00075" + /gene="wciZ" + CDS 13021..13998 + /db_xref="RefSeq:WP_000256585.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI00001D8FD3" + /db_xref="UniRef:UniRef100_Q6X851" + /db_xref="UniRef:UniRef50_E0Q2R6" + /db_xref="UniRef:UniRef90_Q6X851" + /db_xref="UniprotKB:Q6X851" + /db_xref="UserProtein:wciZ" + /product="""putative acetyl transferase""" + /locus_tag="EMIKCJ_00075" + /protein_id="gnl|Bakta|EMIKCJ_00075" + /translation="MVTKDKGLTYNSTLHAIKVLACFSVVAIHIWLPGKIGAFYQIIAR + FAVPMFFLISGFYSYNISKNKIQNRIKKIFRLILRSTFFYVIIFVWMFWREGNMQFIFQ + NFNLTNIIRFVIFNRISDLIGYLATPLWYLFAILYIYIYLYFSNKRLLLTKRWISILLL + FSFIMEATISDSIFYRNFLFMGIPFFGIGILIAQKQKKIINCKIINKILILGTIIYPIL + IFLEYYILGNSFEIYISSVLATIILMIFAIKSPKAINIKILNEIGDKYATFVYIIHQFI + IVIFKFLVSNVYILKFGTIFVFLICCFLGVLFQFIKNRLLKRFS" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000256585.1" + /gene="wciZ" + gene 14000..15148 + /locus_tag="EMIKCJ_00080" + /gene="wchX" + CDS 14000..15148 + /db_xref="RefSeq:WP_054378043.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI00001D8FD4" + /db_xref="UniRef:UniRef100_A0A9X8NAZ6" + /db_xref="UniRef:UniRef50_Q9R922" + /db_xref="UniRef:UniRef90_A0A4J2AK78" + /db_xref="UniprotKB:Q6X850" + /db_xref="UserProtein:wchX" + /product="""putative glycerol phosphotransferase""" + /locus_tag="EMIKCJ_00080" + /protein_id="gnl|Bakta|EMIKCJ_00080" + /translation="MVVLQNVKFLVRVVFMVIISIVLWPVRIKKNKILFINFNGKGYGD + 
NPKSICEYLRVTYPELDLVWLTKDNEDFPDGVRVVRYKSLQSFYEQASSKVWVYNVRNF + ERLLKKRGQFYIQTWHGASSFKLIEQQADLPLKYILEAKYDARVTDIMISDSRKQTEEF + QKYFWYSGEIFEVGMPRNDALFHYKEDYDKLNNIRKKLSIDSDDYVILYAPTFRDDGDA + SYLDINFERLLQSIEQEIKKKCKILIRLHPNDSHFSNNISFNHDIIDVTLFSDMQELIL + LADVLLTDYSSAIFDFMLLNKPYVRYVNDLEKYAELRGVSDTYYELPDSIIKTAEELYD + LLPKKIENFDYDSIKKYRNEILCPIFNGTASENVGRRIIQEL" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_054378043.1" + /gene="wchX" + gene 15184..16212 + /locus_tag="EMIKCJ_00085" + /gene="gtp1" + CDS 15184..16212 + /db_xref="RefSeq:WP_000794265.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI00001D8FD5" + /db_xref="UniRef:UniRef100_Q6X849" + /db_xref="UniRef:UniRef50_Q9R921" + /db_xref="UniRef:UniRef90_Q9R921" + /db_xref="UniprotKB:Q6X849" + /db_xref="UserProtein:gtp1" + /product="""putative glycerol-2-phosphate dehydrogenase""" + /locus_tag="EMIKCJ_00085" + /protein_id="gnl|Bakta|EMIKCJ_00085" + /translation="MKNNDLKIGSGAIHQISATLSQNNISGKILYCADPVVDDLYGSIV + RSQIEEIGRVKEESCNYNTIAYAMNIAERAIATDIDCIVGMGGGRVLDVCKYASFISKR + PYLSIPTTAANDGIASPVAVLKRQDDRPKSLGAAIPSMTLIDIDVIASGPIQNIKAGIG + DTISNYTALKDWELAVERGKDEMHGFAYLMSQNSLDALMKTKYNSITPDFIEVLVNSLV + LSGIAMDFAGSSRPVSGSEHLFSHALDYYGSTRNLHGIQVALGTVAVLKLIENSVDTVV + DYLQRFEVHINPKLLGIDEELFIYCMQHATKMRSNRYTYLHEVDLSTDRLKQIYKELIS + EL" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000794265.1" + /gene="gtp1" + gene 16228..16932 + /locus_tag="EMIKCJ_00090" + /gene="gtp2" + CDS 16228..16932 + /db_xref="RefSeq:WP_054378044.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI00001D8FD6" + /db_xref="UniRef:UniRef100_Q6X848" + /db_xref="UniRef:UniRef50_O85005" + /db_xref="UniRef:UniRef90_O85005" + /db_xref="UniprotKB:Q6X848" + /db_xref="UserProtein:gtp2" + /product="""putative nucleotidyl transferase""" + /locus_tag="EMIKCJ_00090" + /protein_id="gnl|Bakta|EMIKCJ_00090" + 
/translation="MKALILAAGLGTRLAPITNEVPKSLVPVNGKPILMKQIENLYQNN + ITDITIIAGYKSSVLTDAVTEKYPEINIIDNVDFKTTNNMYSAYLGKAAMGDSDFLMMN + ADVFYDASVIKSLLLHKAPNAIVTDLGIYIEESMKVVEKNGRLVEISKQISPEETLGVS + IDVYKFSYEAGARFFEKCKEFIEDKRELQMWSEVALNAILSEVEFVACPLEGRWLEIDN + HEDLVAAEKLFA" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_054378044.1" + /gene="gtp2" + gene 16953..17780 + /locus_tag="EMIKCJ_00095" + /gene="gtp3" + CDS 16953..17780 + /db_xref="SO:0001217" + /db_xref="UniRef:UniRef50_Q4K1N0" + /db_xref="UniRef:UniRef90_Q4K1N0" + /db_xref="UniprotKB:Q4K1N0" + /db_xref="UserProtein:gtp3" + /product="""putative phosphotransferase""" + /locus_tag="EMIKCJ_00095" + /protein_id="gnl|Bakta|EMIKCJ_00095" + /translation="MTNRVDYFGADISELQNKKLFLFDMDGTIYEEDRLFEGTLELLDY + IHNIGGEYIFITNNSSKSVVDYVEKVNRLGIKAERDNFFTSAQATIVYIKENYPKSKVY + CQGTKSLIKELSDAGIDVTEQVSADIDVVLVGFDTELTSDKIRNTCEILSTKDVPFIAT + NPDIRCPVSFGFIPDCGSICDMISKSVDRKPVYIGKPEPTMVDIVRKKLNYSLFETVVI + GDRLYTDIMTGINAGVTSVCVLTGEATVNDIQQGSIKPTYTFKNVKEMWKGIV" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef90_Q4K1N0" + /gene="gtp3" + gene complement(17869..18258) + /locus_tag="EMIKCJ_00100" + /gene="tnp" + CDS complement(17869..18258) + /db_xref="SO:0001217" + /db_xref="UniRef:UniRef50_C1CER1" + /db_xref="UniRef:UniRef90_A0A0T8BYQ3" + /product="IS5 family transposase ORF B" + /locus_tag="EMIKCJ_00100" + /protein_id="gnl|Bakta|EMIKCJ_00100" + /translation="MKAQAIVTSQGRIVSLDITVNYCHDMKLFKMSRRNIGQAGKILAD + SGYQGLMKIYPQAQTPRKSSKLKPLTVEDKAYNHALSKERSKVENIFAKVKTFKMFSTT + YRNHRKRFGLRMNLIAAIINHELGF" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA + sequence:UniRef:UniRef90_A0A0T8BYQ3" + /gene="tnp" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt 
tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcgta taaaaacaag + 181 ggaggactgt ataaaagaca gaaatccttt gttttttata accaaggttt ataaactttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga agatgaacat + 301 aaagaagcgt gtccttagtg caggtctgac ttttgcatct gctttgcttt tagctgcttg + 361 cgaccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaattac ctattagact attaaactga taatatagtc aatcgaaaca agaacaagac + 481 aaaagagcct tgtaaaaggt attgcaactt ggtaatacct tttatgaggt gctttttgat + 541 atgagtccat gttttctcaa taggattgta ctcaggtgag tagggaggaa gaggtaaaag + 601 tttattccca aactcttcac acaagagttc tagcttcccc attctatgga atcttacatt + 661 atccataata ataaccgatg gtgtggttaa tgttggtaag aaaaacttct gaaaccatac + 721 ttcaaaaaag tcgctcgtca tcgtctcttc gtaagtcatt ggagcgatta actcaccatt + 781 tgttagacct gcaaccaaag aaatcctctg atatcttctt ccagatactt tacctcttat + 841 taactgacct tttaatgagc gaccatattc tcgataaaaa taagtatcga atcctgtttc + 901 gtcaatctaa acaggtgcta ggtgctttaa tctattaaaa ttcttaagaa ataaggctac + 961 tttttctggg tcttgttcat aattagattg aaactagaat agtacacctc tgcttctaaa + 1021 acattgttag aaatcgattt gactgtcctg atcgatttat catgttctta tttcatttta + 1081 ctatattttt gtttcgcggg aagtctacta agatacttaa agatgcagat agtgaaaaaa + 1141 ggtgtagaca ttaccgtaaa aaagtgatat aatcgtatga tgttcaatgt ataggtgtta + 1201 atcatgagta gacgttttaa aaaatcaagt tcacagaaag tgaagcgaag tgttaatata + 1261 gttttgttga ctatttattt attgttagtt tgttttttat tgttcttaat ctttaagtac + 1321 aatatccttg cttttagata tcttaattta gtggtaactg cgttagtcct actagttgcc + 1381 ttggtagggc tactcctgat tatctataaa aaagctgaaa aatttactat ttttctgttg + 1441 gtgttctcta tccttgtcag ctctgtgtcg ctctttgcag tacagcagtt tgttggactg + 1501 accaatcgtt taaatgcgac ttctaattac tcagaatatt caatcagtgt cgctgtttta + 1561 gcagatagtg atatcgaaaa tgttacgcaa ctgacgagtg tgacagcacc gactgggact + 1621 gataatgaaa atattcaaaa actactagct gatattaagt caagtcagaa taccgatttg + 1681 acggtcgacc agagttcgtc ttacttggca gcttacaaga gtttgattgc aggggagact + 1741 aaggccattg 
tcttaaatag tgtctttgaa aatatcattg agtcagagta tccagactac + 1801 gcatcgaaga taaaaaagat ttataccaag ggattcacta aaaaagtaga agctcctaag + 1861 acgtctaaga atcagtcttt caatatctat gttagtggaa ttgacaccta tggtcctatt + 1921 agttcggtgt cgcgatcaga tgtcaatatc ctgatgactg tcaatcgaga taccaagaaa + 1981 atcctcttga ccacaacacc acgtgatgcc tatgtaccaa tagcagatgg tggaaataat + 2041 caaaaagata aattaaccca tgcgggcatt tatggagttg attcgtccat tcacacctta + 2101 gaaaatctct atggagtgga tatcaattac tatgtgcgat tgaacttcac ttctttcttg + 2161 aaaatgattg acttattggg aggggtagat gttcataatg atcaagagtt ttcagctcta + 2221 catgggaagt tccatttccc agtagggaat gtccatctag actctgagca ggctctaggt + 2281 tttgtacgtg aacgctactc actagccgat ggagaccgtg accgtggtcg caaccaacaa + 2341 aaggtgattg tggctatcct tcaaaaatta acgtcaaccg aagcactgaa aaattatagt + 2401 acgatcatta atagcttgca agattctatc caaacaaata tgccacttga gactatgata + 2461 aatttggtca atgctcagtt agaaagtgga gggaattata aagtaaattc tcaagattta + 2521 aaagggacag gtcggacgga tcttccttct tatgcaatgc cagacagtaa cctctatgtg + 2581 ttggaaatag atgatagtag tttagctgta gttaaagcag ctatacagga tgtgatggag + 2641 ggtagatgaa atgatagaca tccattcgca tatcgttttt gatgtagatg acggtcccaa + 2701 gtcaagagag gaaagcaagg ctctcttggc agaatcctac aggcaagggg tacgaatcat + 2761 tgtctctacc tctcaccgtc gcaagggcat gtttgaaact ccggaagaga agatagcaga + 2821 aaactttctt caggttcggg aaatagctaa ggaagtggcg agtgacttgg tcattgctta + 2881 cggagctgaa atttactaca caccagatgt tctggataag ctggaaaaaa agcggattcc + 2941 gaccctcaat gatagtcgtt atgccttgat agagtttagt atgaacactc cttatcgcga + 3001 tattcatagc gccttgagca agatcttgat gttgggaatt actccagtca ttgcccacat + 3061 tgagcgctat gatgctcttg aaaataatga aaaacgcgtt cgagaactga tcgatatggg + 3121 ctgttacacg caagtaaata gttcacatgt cctcaaaccc aaactttttg gcgaacgtta + 3181 taaattcatg aaaaaaagag ctcagtattt tttggaacgt gatttagttc atgtagttgc + 3241 aagtgacatg cacaatttag acagtagacc tccatatatg caacaggcat atgatatcat + 3301 tgctaagaaa tatggagcga aaaaagcgaa agaatttttt gtagataatc ccagaaaaat + 3361 tataatggat caattaattt aggagaaaat 
atgaaggaac acaacacttt ggaaatcgat + 3421 atattgcaac tattcagagc tttatggaaa agaaagttgg tcattttatt agtggcaatt + 3481 ataacttctt cagttgcttt tgcctacagt acttttgtta tcaaacctga gtttactagt + 3541 acgactcgga tttatgtagt taaccgtaat caggaagaga agtctggttt aaccaatcaa + 3601 gacttgcagg caggaactta tctggtaaaa gactaccgtg agattatcct ttcgcaggat + 3661 gttttggagg aagttatttc tgatttgaaa ctagatttga cgccaaaagg tttggctaat + 3721 aaaattaaag taacagtacc agttgatacc cgtattgtct ctgtttcagt taatgatcga + 3781 gttcctgaag aggcaagccg tatcgctaac tctttgagag aagtagctgc tcaaaaaatt + 3841 atcagtatta ctcgtgtttc tgatgtgaca acactggagg aggcaagacc ggcgatatca + 3901 ccgtcttcgc caaatattaa acgcaatata ctaattggtt ttttggcagg gggggttgga + 3961 actggtgtta tagttcttct tcttgaactt ttggacactc atgtgaaacg tccggaagat + 4021 atcgaagata cactgcagat gacacttttg ggagttgtac caaacttgag taagttgaaa + 4081 taggagagag gaatgccgac attagaaata gcacaaaaaa aactggagtt cattaagaag + 4141 gcagaagaat attacaatgc cttgtgtaca aatatacagt tgagcggaga taaactaaaa + 4201 gtaatttccg ttacttctgt taaccctggg gaaggaaaaa caactacttc cgtaaatata + 4261 gcaaggtcgt ttgcgcgtgc aggctataaa actcttttga tcgatggcga tactcgaaat + 4321 tcagttatgt caggattttt taaatctcgt gaaaaaatta cagggctaac agaattttta + 4381 tctgggacag ctgatttatc tcacggttta tgtgatacaa atattgaaaa tttatttgta + 4441 gttcaatcgg ggtctgtatc accaaaccct acagccttgt tacaaagtaa aaattttaat + 4501 gatatgattg aaacattgcg taaatatttt gattatatca ttgttgatac agcacctatt + 4561 ggaattgtta ttgatgcggc aattatcact caaaagtgtg atgcgtccat cttggtaaca + 4621 gcaacaggtg aggtgaataa acgtgatgtc caaaaagcga aacaacaatt agaacaaaca + 4681 gggaaactgt ttttaggtgt cattctcaat aaatttgatg ttcaacataa aaaatatggt + 4741 tcttacggtg actatggtaa ttatggtaaa aaataactta ggaaagattt tatggatgaa + 4801 aaaggattga aaatttttct ggcagtatta cagagtatta ttgtcatttt attggtttat + 4861 tttcttagct ttgttagaga gacagaactt gaacgttctt cgatggttat actatacctt + 4921 ctccactttt ttgtattcta ttttagttcc tatggtaata atttttttaa aagagggcac + 4981 ttagttgagt ttaatagtac tataagatat atttttttct ttgcaatagc 
tataagtgta + 5041 ttaaactttt ttatagcgga acggtttagt atctctagaa gaggaatggt atacttctta + 5101 actttagaag gaatatcctt atacttgtta aatttcttag taaagaaata ttggaagcat + 5161 gtgtttttta atctaaaaaa tagcaagaaa attttactgt taacagtaac gaaaaatatg + 5221 gaaaaagttc ttgataaatt gctagaatct gatgaacttt catggaaatt ggtagcagta + 5281 agtgttttgg ataaatctga ttttcaacat gataaaatac ctgtaattga aaaggaaaaa + 5341 attattgaat ttgcaacgca tgaagttgtg gatgaggtgt ttgtcaatct tccaggagag + 5401 agctacgata ttggagaaat tatctctagg tttgagacaa tggggataga tgtaactgta + 5461 aatcttaaag catttgataa gaatttgggt cgcaataaac aaattcatga gatggtagga + 5521 ttgaatgtag tcactttctc tacaaatttt tataaaacta gtcatgtgat ttcaaagaga + 5581 attctcgata tttgtggtgc cactattggc cttgttcttt ttgctatagc tagtctagtt + 5641 ttagttccat tgattcgtaa agatggcgga ccagctattt ttgctcaaac tcgtataggg + 5701 aaaaatggtc gacattttac cttttataaa ttccgttcga tgaggatcga tgctgaagct + 5761 atcaaagaac agttgatgga tcaaaatacg atgcaaggtg gtatgtttaa gatggacaat + 5821 gatcctcgtg ttacaaaaat tggtcgcttt attcgtaaaa ccagtttgga tgaattgccg + 5881 cagttttgga atgtctttat aggagatatg agtttggtgg gaacacgtcc acctacagta + 5941 gacgagtatg atcagtatac tccagaacag aaacgtcgac tcagctttaa acctggtatt + 6001 acaggtttat ggcaggttag cggccgtagt aaaataaccg attttgacga tgttgtaaaa + 6061 ttagatgtgg cttatattga taattggaca atctggaaag atattgaaat tttgcttaaa + 6121 actgttaaag ttgtatttat aagagatgga gcgaagtaag gaatgaaagt atgtctagtt + 6181 ggatctagtg gaggccattt aactcatttg tatttattaa aacctttctg gaatgataaa + 6241 gaaagatttt gggttacttt tgataaggcg gacgctcgga gtgtactctc tgaggaagtt + 6301 gtatatccct gttattatcc aaccaatcgt aatataaaaa atttaataaa aaatactttt + 6361 ctcgcctata aaattttaaa aaaagagaga ccagatttga ttatttcttc tggtgccgct + 6421 atcgctgttc ctttctttta tattgggaag ttatttggat caaagacagt gtatatagaa + 6481 gtgtttgata gaattgatgc ttcaacactg acaggaaaac ttgtttatcc agtaacggat + 6541 aggtttattg tacaatggga agaaatgaaa aaagtatacc caaaagcaat taacctagga + 6601 gggatattct aatgattttt gtgactgtag gtacacacga acaacaattt gatcgattga + 6661 ttaaagaagt 
tgattatcta aaaaaagaaa atcttattca agatgaagta tttattcaaa + 6721 taggatattc cagttatatt ccgaaatatt gtgagtggga aaagataatt tcttatgaaa + 6781 aaatgaatca attgattaag gaatcagata ttatcattac tcatggtgga ccagcgacgt + 6841 ttatgggggt tattgctaaa ggaaaagttc cgatagttgt tccgaggcaa aaaaaatttg + 6901 gagagcatgt gaatgaccat cagcttcaat tcgtaaaact gacgaaagaa atatacaatt + 6961 ttatagtcat agatgatatt tccgacttat atttaagtat acgtgatttt aaggataaat + 7021 attttggaat ttgtttgaac aatgaaagat ttaatctaca ttttaatgcg gaaattaata + 7081 aactatttga aggaaataaa gtagatgaaa attagaatag agcctcaata ttttctttat + 7141 aagtaccttt ggcttatcat actgctccca aaacagttta tgcaattaat attattttct + 7201 ttaattgtct taattctatt accggtctat ataaaagata gacaaatttc caaaatagat + 7261 gcaccgtctt tttatatagt tctatgggtc atgatgtatt ctatatcaat aatttggaat + 7321 tttttaatta gtggcttacc tattcaagtg ttgttttcag atttgagtaa ggcattcaat + 7381 tggatattag cagtattttt ttataattat tatttgaaaa atcccattaa cgttgacaag + 7441 ataaagaaat atatgtttta taatttcgct atattagtta ttattgttgc tttattctat + 7501 gttcaaagag gcgctaatgt agtattgttt ggaagaagct tattaggttg ggacggattc + 7561 gtatcagcta ccagttacgg agtaagatat gcaggatttt tagaatattc aacattaaat + 7621 gggcagttga ttcttttttt gttaccgtta attaggttat ttaaacttag tttttttaca + 7681 caagtaacta ttcttgcttt tttgctacag gttttagtat tgagtaaatc tagaatagct + 7741 attattgctc tgattatata catagtattt gtagtaatgg ttcagattac ttcaattaat + 7801 aagcggatga ttgtagcgtt ttatccaact atacctctta tattgcttta taattgggaa + 7861 aaaattaaac atatcttttt tcaaatgttt aattcaagaa caggtagtaa tgtgacacgt + 7921 tttatagtgt acgaagaatc tcttaaagct attaatgggc tgggaatttt acttggagca + 7981 ggaatcagaa cacaatctac agtaggtata ttattaggat cacattcaat gtatattagt + 8041 tttatttata ggacagggat tttaggaagt ataataatag taatactgtt ctattatttg + 8101 ttttctaaat ttttaaaaag tgccccatct ggaaagttaa tcagtatagg ctatatttta + 8161 gctttattgg tgttttggct ttttgaagaa ttagatccac attattggtg tttaatttta + 8221 tttttttcaa caataagtat tttcataaac aatagaaaag aggaaatagt tggatgatag + 8281 aagtatcaat cataattcca atatacaatg 
ctgaaaaaac tattaaaaat tgtgttgata + 8341 gtgccttaaa gcaaaattta gaatctcttg aagtgatttt ggtgaatgat gggtctaacg + 8401 attctacagc agaaattttg aaccagtacg acaggaattc aagggttaag atttttcatc + 8461 agcttaataa aggggtgtct actgctagaa ataaggggtt atctcatgct agtggagagt + 8521 atgtattttt tctagattca gatgatattt tagatgatgg tatgctttct aaaatgtacc + 8581 aatttgtaaa aaataataaa gttgatctct tatcttgttg gcataaagaa cctgctacaa + 8641 ctcaatacgg tggaaatgag aataagtcaa cttcatttat tgcacgtaca agagaagaaa + 8701 taggtgctca ttttgttgat atctttccga gaagtgcttg tgccaaattg ttttttcgca + 8761 aaataattga agaaaataat attacttttt cgactgagat gtcactaggt gaagatatgt + 8821 catttgtgta tcaatactta atggtttcta aaagtattgg agttattgac ggggtgtatt + 8881 ataatattca aaatgtaaat ccacagtcgt tatctaagcg ctatgtgcag aatattgaaa + 8941 attccctaat aattcagaac cagttatgga atcaactgtt ggaagtttat cctaaaattg + 9001 aggagaacta ctataagcaa catatggatt ttagatttta ccttgctaac ttgtatgtaa + 9061 ataatttatt taaatttgat tctccgtatt catcaaaaga aaaactagac caaattgctc + 9121 aacaattaaa aaagtataga ttatttttag atgaaaaagt cagcaaagaa aagatgccta + 9181 aaaatataaa tgagatgatt gttttttatt tactaaaatt gaaaattcca gtgttgattt + 9241 attcttttta ttcgtttaaa gagtggtgga agagaagaaa aattaaaaat gaaggataaa + 9301 taagttatgg aagatttgat aagcattgtt gttccagtct ataacgtgga aaaatattta + 9361 aaaaaatcaa tagaaagtat tttgaatcag acttatcaaa atatcgagat tttattggtt + 9421 gatgacggaa gcacagatag tagtgggaaa atttgtgaat catttagtaa agttgatcct + 9481 aggataagag tatttcataa agaaaatggt ggtttatcag atgctcggaa ttttggaatt + 9541 gagcaaatga aaggtcaata tgtagcgttt attgatagcg atgactacat atctaaggat + 9601 tatgtctgga agttgtattc ttctataaaa aataatgatt ccgaggtgtc gatttgttct + 9661 tttttattag tcgatgaaaa aggggaaaaa ataaaagatg agctattaga ttcgggaaaa + 9721 atatgcttga ctggtcaaca aatattagaa aaagtattaa cagccgacgg ctatcgctat + 9781 gttgttgctt ggaataagct ttatcggtca actttatttg aaaaattaaa atttaaaaaa + 9841 ggaatgttgt atgaggatga atttcttaac tatcctctat tttgggactg taaaagggta + 9901 tcaattgtag aggagccgtt atatttatac gttcaacgaa aaggaagcat 
tgtacaaagt + 9961 aatatgactt tagaaaaaat aaagatgaag gatgagatgc atacttcacg cattgagttt + 10021 tattcagaaa aggggcattc ttttttgcac gaaaaagcgt gtcaacagta ctgcaattgg + 10081 attgttacag cgactaccaa tcatagtaag attttaaatc ctaatttttc aaagtattta + 10141 caacgacagt ttagaaagtt cgctaaatat acacgaaaca atgatattag actaattgta + 10201 cagaacattc taggatttat agatattcgt ttagcagctt atgtaaaatc aaaagtaatg + 10261 tagagtatag gaaacataat gatagaaaaa attttagatt ctattaaaaa tcattctttt + 10321 tatagtaaat tgaaggataa aattcataga attattccat tatatattat aaaaaatcaa + 10381 aatatagctt ttcaacaaga taccgatata gcatatagaa aactaaagaa gaagtttaga + 10441 catatttcgt tgactggaga tgagcttaaa tataaaatgg agttttcaaa taaagtttgg + 10501 atttgttggt ttcagggaga agagcatgcc ccagagttaa ttaaaacatg tattcaatca + 10561 atgaggaatc aacttcaagg aagagaaatc attgtgttga cagaaaaaaa tataagtgat + 10621 tatacagaga ttccagacta tattattgaa aaatacaaaa aaggatggat ttctcgtgcg + 10681 cattactctg atatccttag gatagatctt ctatgtcgcc atggaggatt atgggtagat + 10741 gcaacagtgt tgaatacagg aggagatttc tcaaatcttg aggtaccact ttttgtatat + 10801 aaatctttga atttatcaag aaaagattca caagctattg tagcatcaag ttggttaatt + 10861 tcgtcatata gtaatcatcc tatattactc tatacgagaa aactcctatg ggcctactgg + 10921 cgaagaaaaa atagtttatg taattatttt ttgttccata tatgttttac aatagctaca + 10981 gagcggtacc caatcgaatg gtctgctgtc cctactttta ataatcattc tcctcatata + 11041 cttcattttg agttgaatga acaattttcg gaaaaacggt gggaacaact gaagcatatt + 11101 tcggcgtttc ataaattaaa tcatcatata gattattcta gcggtgttaa cactttttat + 11161 aagttcatag tatcttcgaa agtttagaaa aatgagtaat aaaattagta aaaatttagc + 11221 ctacaatatg gggtatcagt taattggtat tgcagctccc ttgataactt ctccttattt + 11281 atcacggata ttaggtgctg aaaatttagg tattcattct tttactatgt cggttgcact + 11341 ttactttatg atgtttatgc ttcttggaat tgcaaattac ggaaatagaa caattgcgac + 11401 tgttaaacga gaaggaaagg atattctatc aaaaacgttt tggagtatct actctatcca + 11461 gttgataatg tctattctgg taactatagc ttatcttgct tatctatatt tgggggcagt + 11521 acattacaaa gttattgcaa tattacaact ctttttattg ttatcaaatg 
ctgttgatat + 11581 tacttggttt ttctatggat tagaaaattt taagcaaatc gtttttagga atacattagt + 11641 caaactttta ggattatttt taattttttt atgtgtgcgt caaggcacag atttatggaa + 11701 atacacattt ataaacggat cagtaacttt agttggccaa cttttactat ggggacaatt + 11761 aaaaggaata ttaacttgga aaaaaattca attaaaggaa ttactacctc atatcaagcc + 11821 aattttaatt ctttttattc ctgtactagc cattagtatt tttactaata tggataaata + 11881 tatgcttggt ttaatggttg atgtaaagca ggttggattt tatgacaatg caggtagaat + 11941 tattgaaatt cctaaagctt tgattgcagc tttaggggcc gttatgttac caagaacttc + 12001 ctatttatta gcggaaggac agaaagaaaa gagtaaatac tacatagagg taacaatttt + 12061 atacgtgatg attatttcta gtgtattgat gtttgggcta atatcggtat ctgatatttt + 12121 ttccattata ttttggggag aagaatttct tgaatcaggt agattgattt ctgctatgtc + 12181 tccggctttt gtcttctctg tattaggaaa tatcattagg actcagtatt tgattcctag + 12241 agctaaggat aaagattatg tagtgtctct aattgcgggg gctgttgtta atctagtgct + 12301 aaactatttt tttataaaac cttttggtgc tatgggagca acaattagta cagttttggc + 12361 agaatttgta ttgtctggaa tgcagttttg gtcagtaaga agagacttag atttaaaaag + 12421 atatttgaaa aacggtttga tattctacct atttggtctg attatgcacc tcattattat + 12481 agcactcaaa actcagttac catacaatat aatgagtctt attttactaa tagttttggg + 12541 tggaatagta tatgttattt tttgttgttg ctatatttta atgtcaagaa atttacattt + 12601 taagttattg aaggaaaaga ttatacgaaa ggttgtacat aaaaatacat tataaaatat + 12661 tagtttatct tatttagttg gatactatta aataaacgaa agtatttgaa actttggtaa + 12721 ttgagattat agagattata gagataaact aagctatatt atagcttcat tattaaagta + 12781 agaatatcgg tgcagtgtag ttaacgaata atgtgagtac tcatttctta gatggagcta + 12841 ggggtcatta taagggattg atatgacatt ttgagtaagt tacagctaga gtttaggttt + 12901 gattatatca gatatttaga tgatttggaa aataataaaa taagttggga actatttttt + 12961 tattgttttg agtgacaggt ttgattttgg gaaatgtatt ttgttaaata ggtaggaaag + 13021 atggttacta aagataaagg attaacatat aatagtactt tgcatgcaat aaaagtatta + 13081 gcatgtttta gtgttgttgc tattcatata tggctaccag gaaaaattgg agcgttttat + 13141 caaataatag cacgatttgc agttccaatg ttctttttga tttctggctt 
ttattcatat + 13201 aatatttcaa agaataaaat acagaataga attaaaaaaa tatttagatt gatattaaga + 13261 agtacatttt tttatgtaat aatatttgta tggatgtttt ggagagaagg taatatgcag + 13321 tttatttttc aaaactttaa tttaacaaat attataagat ttgtgatttt taataggatt + 13381 tcagatttaa taggctatct agcaacaccg ttgtggtatt tatttgctat attatatata + 13441 tatatatatc tttatttttc caataaaaga ctactattga caaaacgatg gatttctata + 13501 cttttactat tttctttcat tatggaagct acaattagcg attcaatttt ttatagaaat + 13561 tttttattta tgggaatacc attttttgga ataggaattc ttattgcaca gaagcaaaag + 13621 aagattatta attgtaaaat aataaacaaa atattaatct tgggaacaat tatctatcca + 13681 atactaatat ttttagaata ttatatcttg ggtaattctt ttgagatcta tataagttct + 13741 gtgctagcaa ccataatatt gatgattttc gcgattaaat cacctaaagc gattaatata + 13801 aaaatactga atgaaattgg agataaatat gcgacttttg tttacattat acaccagttt + 13861 atcattgtga tatttaaatt tttagtatct aatgtttata ttctcaaatt tgggacgata + 13921 tttgtctttt tgatatgttg ttttctaggg gttctatttc aatttatcaa aaacagacta + 13981 ttaaaaaggt ttagttaaga tggttgtttt acaaaatgtt aaatttttag taagagttgt + 14041 ttttatggtt attatcagta tagtgttatg gcctgttcgg ataaagaaga ataagatact + 14101 atttattaat tttaatggta agggatatgg tgataatccg aaaagtattt gtgagtatct + 14161 tcgagttaca tatccagagt tagatttagt ttggcttaca aaagataatg aagattttcc + 14221 agatggagtg agagttgtaa gatataaatc tctacaatct ttttatgagc aagctagttc + 14281 gaaggtttgg gtttataatg taagaaattt tgaaagacta ctaaaaaaac gcggacagtt + 14341 ttatattcaa acttggcacg gtgcttctag ttttaaactg atagaacagc aggctgattt + 14401 accattaaaa tatattttag aagcaaagta tgatgcaaga gtcacagata taatgatttc + 14461 agatagcaga aaacaaactg aagaatttca aaagtatttt tggtattcag gagaaatttt + 14521 tgaggtgggg atgccgagaa atgatgcctt gtttcactat aaggaagact acgacaagtt + 14581 aaataatatc agaaaaaaac taagcattga ttcagatgat tatgttattt tatatgcccc + 14641 tactttcaga gatgatgggg atgcatctta tttagatata aattttgaac ggcttttgca + 14701 aagtattgaa caagaaatta agaagaaatg taaaatttta attagattac atcctaatga + 14761 ctctcatttt agtaataata tttcttttaa tcatgacata attgatgtta 
cgctattctc + 14821 agatatgcag gaacttatat tattggcaga tgttttactg acagattatt cttccgcgat + 14881 atttgatttt atgcttttaa acaagcctta tgtcagatat gtgaatgatt tagaaaaata + 14941 tgctgagctt aggggggtat cagatacata ttatgaattg ccggattcta ttattaaaac + 15001 tgctgaagaa ttgtatgact tactgcctaa aaaaatagaa aattttgatt atgattctat + 15061 aaaaaaatat agaaatgaaa tactgtgtcc aatctttaat ggaaccgcta gtgaaaatgt + 15121 aggaaggaga ataattcaag agttgtgaag taaaacattg ggttattttt aaggtaacga + 15181 gatttgaaaa ataatgattt aaagatagga agtggagcta ttcatcaaat ctccgctaca + 15241 ctttctcaaa ataatatttc gggaaagatt ttatattgtg ctgatccagt tgtcgatgac + 15301 ttgtacggtt cgatagtacg ttcacaaata gaggaaattg gtcgggtaaa ggaagaaagt + 15361 tgcaattata atactattgc ttatgcgatg aatatagcag aaagggctat tgccacagat + 15421 attgactgta ttgtgggaat gggaggaggt cgtgttttag atgtctgcaa gtatgcatct + 15481 tttatttcga aacgtcctta cctatcgatt ccgacaacag cagcaaatga tggcattgct + 15541 tccccagttg ctgttttgaa aaggcaggat gatagaccaa aaagcttagg ggcggctatc + 15601 ccctcaatga cactaattga tattgatgtt attgcatcag gacctataca aaatataaaa + 15661 gctggtatcg gtgatacaat atccaattac actgcattga aagattggga gttggcagtt + 15721 gagcgaggga aagatgagat gcatggtttt gcatatctaa tgtcgcaaaa ttctttagat + 15781 gctttaatga aaacgaagta taattctatt acccctgatt ttattgaagt tttggtaaac + 15841 tctttagttt tatcaggcat tgcaatggat tttgcgggaa gtagtagacc tgtcagtggg + 15901 tcagagcact tatttagtca tgcattagat tactatggtt ctacaaggaa tcttcatgga + 15961 attcaggttg cattaggtac agtcgcagtt ttgaaattaa ttgaaaattc tgttgatact + 16021 gtagtggatt acttgcaaag atttgaggtt catattaacc cgaaactttt ggggatagat + 16081 gaagagttgt ttatttattg tatgcaacat gctacaaaaa tgagaagtaa tcgctatacc + 16141 tatctgcatg aagttgatct tagcacagat agattgaaac aaatatataa ggaactcata + 16201 agcgagttgt agaaaagaga ggaaaaaatg aaagcactta ttttagcagc agggttagga + 16261 acacgtctag ctccaattac caatgaggta ccaaaatctt tggtaccagt caatggtaag + 16321 ccaattttga tgaaacaaat tgaaaattta tatcaaaata atattacaga tattacgatt + 16381 attgctggat ataagtcatc tgtattaaca gatgcagtta ctgaaaagta 
tccagaaatt + 16441 aatattattg ataatgttga ttttaaaacg actaataata tgtattcagc ctatctagga + 16501 aaagctgcaa tgggtgatag tgacttctta atgatgaatg cagatgtatt ttatgatgct + 16561 tctgttatta aaagtctgtt gcttcataaa gctccaaatg caattgtaac tgatttaggt + 16621 atttatattg aagagtctat gaaagtcgta gaaaaaaatg gtcgtttagt agaaatttct + 16681 aaacagattt cacctgagga aactttagga gtttctattg atgtttataa attctcttat + 16741 gaagcaggtg ctcgattctt tgaaaagtgt aaggaattta ttgaagataa acgagaactt + 16801 caaatgtgga gtgaggttgc tcttaatgca attctttctg aagttgaatt tgtagcatgt + 16861 ccattagagg gtcgttggtt agaaattgat aatcatgaag acttagttgc tgcagaaaaa + 16921 ctatttgctt gaaccgaata cggagaatga aattgacaaa tagagttgat tattttggtg + 16981 ctgatattag tgaacttcag aataaaaaat tattcttatt tgatatggat ggtaccattt + 17041 atgaagaaga taggttgttt gagggtactc tcgaattatt agactatatt cataatattg + 17101 gcggtgagta tatttttatt acaaacaatt catctaagtc tgttgttgac tatgtagaaa + 17161 aagttaacag attaggtatt aaagctgaac gagataattt ttttacctct gctcaagcca + 17221 caattgttta tattaaagaa aattatccta aatctaaagt ttattgccaa ggaacaaaat + 17281 ctttgataaa agaactatct gacgcaggaa ttgatgtaac tgagcaagtt agtgctgata + 17341 tagatgttgt tcttgttggt tttgatacag aattaaccag tgataaaatt cgcaatacct + 17401 gcgagattct atcaacaaag gacgtacctt tcatagctac taaccctgat attcgctgcc + 17461 cagtatcgtt tggattcatc ccagattgtg gttctatttg tgatatgatt agtaaatcag + 17521 tcgataggaa acctgtttac ataggtaaac ctgaacctac gatggttgat attgttcgaa + 17581 aaaaattaaa ttattctcta tttgaaacag ttgtgattgg agatcgcttg tatacggata + 17641 tcatgactgg tataaatgca ggagtaactt cagtttgtgt gctgacagga gaagcaacgg + 17701 tgaatgatat tcaacaaggt agtataaaac cgacttatac atttaaaaac gtgaaagaaa + 17761 tgtggaaagg aattgtctga ttttttcatt ctgaatagtg aattcatgaa tactgtcaaa + 17821 atactcgtat gtatttaaat tgattttatt attagacttc ctgcaaaact agaatcctag + 17881 ttcatgattg ataatagcag caatcaaatt cattcgtaat ccgaagcgtt tacgatgatt + 17941 tcgataggtt gttgaaaaca ttttaaacgt ttttactttg gcaaagatgt tctcgacctt + 18001 gcttctctcc ttggatagcg catggttata ggctttatct tcaactgtta 
gcggcttgag + 18061 tttgctggat ttacgtggag tttgtgcttg aggatatatc ttcatgagcc cttgataacc + 18121 actgtcagcc aagattttac cagcttgtcc gatatttctg cgactcattt tgaacaactt + 18181 catatcatga caatagttca cagtgatatc caaagaaaca attctccctt gacttgtgac + 18241 aatcgcctga gccttcatag cgagaaatat ctattctatc ttctagaatg tcttccaaac + 18301 gaggaaactc tcgtaaacaa agaggtttta gaggcttatt taccatggac taaagttgta + 18361 caagaaaagt gcaaataaga aatctccaga ttaggaacta tccgtgagtt ctctagtctg + 18421 gagatttttc aatatacttc gttattgggc gcttacaatg atattcatat tttttgcaaa + 18481 gatgttgttt gaaaaataat tttcaaaaat tctgaaaatt ctgttgacaa ctttctgaaa + 18541 agagtctata atggagagaa agttttaaag gagaaaatga tgaaaagttc aaaactactt + 18601 gcccttgcgg gcgtgacatt attg +// diff --git a/public/res/serotype_genbank/serotype_15C.gb b/public/res/serotype_genbank/serotype_15C.gb new file mode 100644 index 0000000..58fc0e3 --- /dev/null +++ b/public/res/serotype_genbank/serotype_15C.gb @@ -0,0 +1,877 @@ +LOCUS CR931665 18626 bp DNA linear UNK 10-JUN-2024 +DEFINITION CR931665, whole genome shotgun sequence. +ACCESSION CR931665 +VERSION CR931665 +KEYWORDS . +SOURCE None + ORGANISM . + . 
+COMMENT Annotated with Bakta + Software: v1.9.3 + Database: v5.1, full + DOI: 10.1099/mgen.0.000685 + URL: github.com/oschwengers/bakta + + ##Genome Annotation Summary:## + Annotation Date :: 06/10/2024, 18:34:40 + CDSs :: 21 + tRNAs :: 0 + tmRNAs :: 0 + rRNAs :: 0 + ncRNAs :: 0 + regulatory ncRNAs :: 0 + CRISPR Arrays :: 0 + oriCs/oriVs :: 0 + oriTs :: 0 + gaps :: 0 + pseudogenes :: 0 +FEATURES Location/Qualifiers + source 1..18626 + /mol_type="genomic DNA" + gene 293..445 + /locus_tag="FCDNMA_00005" + CDS 293..445 + /db_xref="RefSeq:WP_001022222.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000152F245" + /db_xref="UniRef:UniRef100_A0A0T7KK87" + /db_xref="UniRef:UniRef50_A0A0H2ZQL8" + /db_xref="UniRef:UniRef90_A0A0H2ZQL8" + /product="Lipoprotein" + /locus_tag="FCDNMA_00005" + /protein_id="gnl|Bakta|FCDNMA_00005" + /translation="MNIKKRVLSAGLTFASALLLAACDQSGSDTKTYSSTFSGNPTTFN + YLLDY" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_001022222.1" + gene complement(442..798) + /locus_tag="FCDNMA_00010" + CDS complement(442..798) + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000152F246" + /db_xref="UniRef:UniRef100_A5LJR5" + /db_xref="UniRef:UniRef50_A0A0H2UQ11" + /db_xref="UniRef:UniRef90_A5LJR5" + /product="IS630-Spn1, transposase Orf2" + /locus_tag="FCDNMA_00010" + /protein_id="gnl|Bakta|FCDNMA_00010" + /translation="MVAGLTNGELIAPMTYEETMTSDFFEVWFQKFFLPTLTTPSVIIM + DNVRFHRMGKLELLCEEFGNKLLPLPPYSPEYNPIEKTWTHIKKHLIKGITKLQYLLQG + SFVLFLFRLTILSV" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef100_A5LJR5" + gene 1204..2649 + /locus_tag="FCDNMA_00015" + /gene="wzg" + CDS 1204..2649 + /db_xref="BlastRules:WP_000091082" + /db_xref="RefSeq:WP_054378039.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF36" + /db_xref="UniRef:UniRef100_Q4K1M7" + /db_xref="UniRef:UniRef50_G3G7D5" + 
/db_xref="UniRef:UniRef90_Q9R928" + /db_xref="UniprotKB:Q4K1M7" + /db_xref="UserProtein:wzg" + /product="""integral membrane regulatory protein Wzg""" + /locus_tag="FCDNMA_00015" + /protein_id="gnl|Bakta|FCDNMA_00015" + /translation="MSRRFKKSSSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAFR + YLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNRLN + ATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLTVDQ + SSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAPKTSK + NQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADGGNNQK + DKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQEFSALH + GKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTSTEALKNYS + TIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDLPSYAMPDSNLY + VLEIDDSSLAVVKAAIQDVMEGR" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_054378039.1" + /gene="wzg" + gene 2651..3382 + /locus_tag="FCDNMA_00020" + /gene="wzh" + CDS 2651..3382 + /db_xref="EC:3.1.3.48" + /db_xref="GO:0004725" + /db_xref="GO:0030145" + /db_xref="GO:0045227" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF40" + /db_xref="UniRef:UniRef100_Q4K1M6" + /db_xref="UniRef:UniRef50_Q54518" + /db_xref="UniRef:UniRef90_Q54518" + /db_xref="UniprotKB:Q4K1M6" + /db_xref="UserProtein:wzh" + /product="""protein-tyrosine phosphatase Wzh""" + /locus_tag="FCDNMA_00020" + /protein_id="gnl|Bakta|FCDNMA_00020" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRIIVSTSHRRK + GMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKRRIPTLNDSRY + ALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYTQVN + SSHVLKPKLFGERYKFMKKRAQYFLERDLVHVVASDMHNLDSRPPYMQQAYDIIAKKYG + AKKAKEFFVDNPRKIIMDQLI" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef100_Q4K1M6" + /gene="wzh" + gene 3391..4083 + /locus_tag="FCDNMA_00025" + /gene="wzd" + CDS 3391..4083 + /db_xref="BlastRules:WP_000664160" + /db_xref="GO:0005351" + 
/db_xref="GO:0005886" + /db_xref="GO:0009103" + /db_xref="GO:0015774" + /db_xref="GO:0045227" + /db_xref="RefSeq:WP_000658143.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF38" + /db_xref="UniRef:UniRef100_Q4K1M5" + /db_xref="UniRef:UniRef50_Q54519" + /db_xref="UniRef:UniRef90_Q54519" + /db_xref="UniprotKB:Q4K1M5" + /db_xref="UserProtein:wzd" + /product="""capsular polysaccharide biosynthesis protein + Wzd""" + /locus_tag="FCDNMA_00025" + /protein_id="gnl|Bakta|FCDNMA_00025" + /translation="MKEHNTLEIDILQLFRALWKRKLVILLVAIITSSVAFAYSTFVIK + PEFTSTTRIYVVNRNQEEKSGLTNQDLQAGTYLVKDYREIILSQDVLEEVISDLKLDLT + PKGLANKIKVTVPVDTRIVSVSVNDRVPEEASRIANSLREVAAQKIISITRVSDVTTLE + EARPAISPSSPNIKRNILIGFLAGGVGTGVIVLLLELLDTHVKRPEDIEDTLQMTLLGV + VPNLSKLK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000658143.1" + /gene="wzd" + gene 4093..4776 + /locus_tag="FCDNMA_00030" + /gene="wze" + CDS 4093..4776 + /db_xref="BlastRules:WP_001142521" + /db_xref="COG:COG0489" + /db_xref="COG:D" + /db_xref="EC:2.7.10.2" + /db_xref="GO:0004715" + /db_xref="GO:0005524" + /db_xref="GO:0016310" + /db_xref="GO:0045227" + /db_xref="RefSeq:WP_001142510.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF39" + /db_xref="UniRef:UniRef100_Q4K1M4" + /db_xref="UniRef:UniRef50_Q54520" + /db_xref="UniRef:UniRef90_Q54520" + /db_xref="UniprotKB:Q4K1M4" + /db_xref="UserProtein:wze" + /product="""tyrosine-protein kinase Wze""" + /locus_tag="FCDNMA_00030" + /protein_id="gnl|Bakta|FCDNMA_00030" + /translation="MPTLEIAQKKLEFIKKAEEYYNALCTNIQLSGDKLKVISVTSVNP + GEGKTTTSVNIARSFARAGYKTLLIDGDTRNSVMSGFFKSREKITGLTEFLSGTADLSH + GLCDTNIENLFVVQSGSVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTAPIGIVIDAA + IITQKCDASILVTATGEVNKRDVQKAKQQLEQTGKLFLGVILNKFDVQHKKYGSYGDYG + NYGKK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_001142510.1" + /gene="wze" + gene 4792..6159 + 
/locus_tag="FCDNMA_00035" + /gene="wchA" + CDS 4792..6159 + /db_xref="RefSeq:WP_000343580.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF3A" + /db_xref="UniRef:UniRef100_Q4K1M3" + /db_xref="UniRef:UniRef50_Q8VU30" + /db_xref="UniRef:UniRef90_P72513" + /db_xref="UniprotKB:Q4K1M3" + /db_xref="UserProtein:wchA" + /product="""undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)""" + /locus_tag="FCDNMA_00035" + /protein_id="gnl|Bakta|FCDNMA_00035" + /translation="MDEKGLKIFLAVLQSIIVILLVYFLSFVRETELERSSMVILYLLH + FFVFYFSSYGNNFFKRGHLVEFNSTIRYIFFFAIAISVLNFFIAERFSISRRGMVYFLT + LEGISLYLLNFLVKKYWKHVFFNLKNSKKILLLTVTKNMEKVLDKLLESDELSWKLVAV + SVLDKSDFQHDKIPVIEKEKIIEFATHEVVDEVFVNLPGESYDIGEIISRFETMGIDVT + VNLKAFDKNLGRNKQIHEMVGLNVVTFSTNFYKTSHVISKRILDICGATIGLVLFAIAS + LVLVPLIRKDGGPAIFAQTRIGKNGRHFTFYKFRSMRIDAEAIKEQLMDQNTMQGGMFK + MDNDPRVTKIGRFIRKTSLDELPQFWNVFIGDMSLVGTRPPTVDEYDQYTPEQKRRLSF + KPGITGLWQVSGRSKITDFDDVVKLDVAYIDNWTIWKDIEILLKTVKVVFIRDGAK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000343580.1" + /gene="wchA" + gene 6163..6612 + /locus_tag="FCDNMA_00040" + /gene="wchJ" + CDS 6163..6612 + /db_xref="GO:0016740" + /db_xref="RefSeq:WP_000861663.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF3B" + /db_xref="UniRef:UniRef100_Q4K1M2" + /db_xref="UniRef:UniRef50_J9W567" + /db_xref="UniRef:UniRef90_Q4K1M2" + /db_xref="UniprotKB:Q4K1M2" + /db_xref="UserProtein:wchJ" + /product="""putative glycosyl transferase enhancer""" + /locus_tag="FCDNMA_00040" + /protein_id="gnl|Bakta|FCDNMA_00040" + /translation="MKVCLVGSSGGHLTHLYLLKPFWNDKERFWVTFDKADARSVLSEE + VVYPCYYPTNRNIKNLIKNTFLAYKILKKERPDLIISSGAAIAVPFFYIGKLFGSKTVY + IEVFDRIDASTLTGKLVYPVTDRFIVQWEEMKKVYPKAINLGGIF" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000861663.1" + /gene="wchJ" + gene 6612..7115 + 
/locus_tag="FCDNMA_00045" + /gene="wchK" + CDS 6612..7115 + /db_xref="RefSeq:WP_000578430.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF3C" + /db_xref="UniRef:UniRef100_Q4K1M1" + /db_xref="UniRef:UniRef50_Q4K216" + /db_xref="UniRef:UniRef90_Q4K1M1" + /db_xref="UniprotKB:Q4K1M1" + /db_xref="UserProtein:wchK" + /product="""putative glycosyl transferase""" + /locus_tag="FCDNMA_00045" + /protein_id="gnl|Bakta|FCDNMA_00045" + /translation="MIFVTVGTHEQQFDRLIKEVDYLKKENLIQDEVFIQIGYSSYIPK + YCEWEKIISYEKMNQLIKESDIIITHGGPATFMGVIAKGKVPIVVPRQKKFGEHVNDHQ + LQFVKLTKEIYNFIVIDDISDLYLSIRDFKDKYFGICLNNERFNLHFNAEINKLFEGNK + VDEN" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000578430.1" + /gene="wchK" + gene 7105..8277 + /locus_tag="FCDNMA_00050" + /gene="wzy" + CDS 7105..8277 + /db_xref="RefSeq:WP_054378041.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF3D" + /db_xref="UniRef:UniRef100_Q4K1M0" + /db_xref="UniRef:UniRef50_P72516" + /db_xref="UniRef:UniRef90_A0A6G2DLE4" + /db_xref="UniprotKB:Q4K1M0" + /db_xref="UserProtein:wzy" + /product="""oligosaccharide repeat unit polymerase Wzy""" + /locus_tag="FCDNMA_00050" + /protein_id="gnl|Bakta|FCDNMA_00050" + /translation="MKIRIEPQYFLYKYLWLIILLPKQFMQLILFSLIVLILLPVYIKD + RQISKIDAPSFYIVLWVMMYSISIIWNFLISGLPIQVLFSDLSKAFNWILAVFFYNYYL + KNPINVDKIKKYMFYNFAILVIIVALFYVQRGANVVLFGRSLLGWDGFVSATSYGVRYA + GFLEYSTLNGQLILFLLPLIRLFKLSFFTQVTILAFLLQVLVLSKSRIAIIALIIYIVF + VVMVQITSINKRMIVAFYPTIPLILLYNWEKIKHIFFQMFNSRTGSNVTRFIVYEESLK + AINGLGILLGAGIRTQSTVGILLGSHSMYISFIYRTGILGSIIIVILFYYLFSKFLKSA + PSGKLISIGYILALLVFWLFEELDPHYWCLILFFSTISIFINNRKEEIVG" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_054378041.1" + /gene="wzy" + gene 8274..9299 + /locus_tag="FCDNMA_00055" + /gene="wchL" + CDS 8274..9299 + /db_xref="RefSeq:WP_000573792.1" + /db_xref="SO:0001217" + 
/db_xref="UniParc:UPI000053FF3E" + /db_xref="UniRef:UniRef100_Q4K1L9" + /db_xref="UniRef:UniRef50_Q4K1K1" + /db_xref="UniRef:UniRef90_Q4K1K1" + /db_xref="UniprotKB:Q4K1L9" + /db_xref="UserProtein:wchL" + /product="""putative glycosyl transferase""" + /locus_tag="FCDNMA_00055" + /protein_id="gnl|Bakta|FCDNMA_00055" + /translation="MIEVSIIIPIYNAEKTIKNCVDSALKQNLESLEVILVNDGSNDST + AEILNQYDRNSRVKIFHQLNKGVSTARNKGLSHASGEYVFFLDSDDILDDGMLSKMYQF + VKNNKVDLLSCWHKEPATTQYGGNENKSTSFIARTREEIGAHFVDIFPRSACAKLFFRK + IIEENNITFSTEMSLGEDMSFVYQYLMVSKSIGVIDGVYYNIQNVNPQSLSKRYVQNIE + NSLIIQNQLWNQLLEVYPKIEENYYKQHMDFRFYLANLYVNNLFKFDSPYSSKEKLDQI + AQQLKKYRLFLDEKVSKEKMPKNINEMIVFYLLKLKIPVLIYSFYSFKEWWKRRKIKNE + G" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000573792.1" + /gene="wchL" + gene 9307..10263 + /locus_tag="FCDNMA_00060" + /gene="wchM" + CDS 9307..10263 + /db_xref="RefSeq:WP_000389753.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF3F" + /db_xref="UniRef:UniRef100_Q4K1L8" + /db_xref="UniRef:UniRef50_E0Q2S2" + /db_xref="UniRef:UniRef90_A0A4J2AN51" + /db_xref="UniprotKB:Q4K1L8" + /db_xref="UserProtein:wchM" + /product="""putative glycosyl transferase""" + /locus_tag="FCDNMA_00060" + /protein_id="gnl|Bakta|FCDNMA_00060" + /translation="MEDLISIVVPVYNVEKYLKKSIESILNQTYQNIEILLVDDGSTDS + SGKICESFSKVDPRIRVFHKENGGLSDARNFGIEQMKGQYVAFIDSDDYISKDYVWKLY + SSIKNNDSEVSICSFLLVDEKGEKIKDELLDSGKICLTGQQILEKVLTADGYRYVVAWN + KLYRSTLFEKLKFKKGMLYEDEFLNYPLFWDCKRVSIVEEPLYLYVQRKGSIVQSNMTL + EKIKMKDEMHTSRIEFYSEKGHSFLHEKACQQYCNWIVTATTNHSKILNPNFSKYLQRQ + FRKFAKYTRNNDIRLIVQNILGFIDIRLAAYVKSKVM" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000389753.1" + /gene="wchM" + gene 10279..11187 + /locus_tag="FCDNMA_00065" + /gene="wchN" + CDS 10279..11187 + /db_xref="RefSeq:WP_050103050.1" + /db_xref="SO:0001217" + 
/db_xref="UniParc:UPI00001D8FD1" + /db_xref="UniRef:UniRef100_Q6X853" + /db_xref="UniRef:UniRef50_B2ILQ2" + /db_xref="UniRef:UniRef90_Q6X853" + /db_xref="UniprotKB:Q6X853" + /db_xref="UserProtein:wchN" + /product="""putative glycosyl transferase""" + /locus_tag="FCDNMA_00065" + /protein_id="gnl|Bakta|FCDNMA_00065" + /translation="MIEKILDSIKNHSFYSKLKDKIHRIIPLYIIKNQNIAFQQDTDIA + YRKLKKKFRHISLTGDELKYKMEFSNKVWICWFQGEEHAPELIKTCIQSMRNQLQGREI + IVLTEKNISDYTEIPDYIIEKYKKGWISRAHYSDILRIDLLCRHGGLWVDATVLNTGGD + FSNLEVPLFVYKSLNLSRKDSQAIVASSWLISSYSNHPILLYTRKLLWAYWRRKNSLCN + YFLFHICFTIATERYPIEWSAVPTFNNHSPHILHFELNEQFSEKRWEQLKHISAFHKLN + HHIDYSSGVNTFYKFIVSSKV" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050103050.1" + /gene="wchN" + gene 11192..12655 + /locus_tag="FCDNMA_00070" + /gene="wzx" + CDS 11192..12655 + /db_xref="RefSeq:WP_054378042.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI00001D8FD2" + /db_xref="UniRef:UniRef100_Q6X852" + /db_xref="UniRef:UniRef50_O07342" + /db_xref="UniRef:UniRef90_Q6X852" + /db_xref="UniprotKB:Q6X852" + /db_xref="UserProtein:wzx" + /product="""flippase Wzx""" + /locus_tag="FCDNMA_00070" + /protein_id="gnl|Bakta|FCDNMA_00070" + /translation="MSNKISKNLAYNMGYQLIGIAAPLITSPYLSRILGAENLGIHSFT + MSVALYFMMFMLLGIANYGNRTIATVKREGKDILSKTFWSIYSIQLIMSILVTIAYLAY + LYLGAVHYKVIAILQLFLLLSNAVDITWFFYGLENFKQIVFRNTLVKLLGLFLIFLCVR + QGTDLWKYTFINGSVTLVGQLLLWGQLKGILTWKKIQLKELLPHIKPILILFIPVLAIS + IFTNMDKYMLGLMVDVKQVGFYDNAGRIIEIPKALIAALGAVMLPRTSYLLAEGQKEKS + KYYIEVTILYVMIISSVLMFGLISVSDIFSIIFWGEEFLESGRLISAMSPAFVFSVLGN + IIRTQYLIPRAKDKDYVVSLIAGAVVNLVLNYFFIKPFGAMGATISTVLAEFVLSGMQF + WSVRRDLDLKRYLKNGLIFYLFGLIMHLIIIALKTQLPYNIMSLILLIVLGGIVYVIFC + CCYILMSRNLHFKLLKEKIIRKVVHKNTL" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_054378042.1" + /gene="wzx" + gene 13021..13482 + /locus_tag="FCDNMA_00075" + 
/gene="wciZ" + CDS 13021..13482 + /db_xref="RefSeq:WP_224757692.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0005DC34F8" + /db_xref="UniRef:UniRef100_A0A1Z3GXH2" + /db_xref="UniRef:UniRef50_A0A1Z3GXH2" + /db_xref="UniRef:UniRef90_A0A1Z3GXH2" + /product="WciZ" + /locus_tag="FCDNMA_00075" + /protein_id="gnl|Bakta|FCDNMA_00075" + /translation="MVTKDKGLTYNSTLHAIKVLACFSVVAIHIWLPGKIGAFYQIIAR + FAVPMFFLISGFYSYNISKNKIQNRIKKIFRLILRSTFFYVIIFVWMFWREGNMQFIFQ + NFNLTNIIRFVIFNRISDLIGYLATPLWYLFAILYIYIYIFIFPIKDYY" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_224757692.1" + /gene="wciZ" + gene 13479..14000 + /locus_tag="FCDNMA_00080" + /gene="wciZ" + CDS 13479..14000 + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000A4FFFE9" + /db_xref="UniRef:UniRef100_A0A1Z3GXJ9" + /db_xref="UniRef:UniRef50_A0A1Z3GXH7" + /db_xref="UniRef:UniRef90_A0A1Z3GXH7" + /product="WciZ" + /locus_tag="FCDNMA_00080" + /protein_id="gnl|Bakta|FCDNMA_00080" + /translation="MTKRWISILLLFSFIMEATISDSIFYRNFLFMGIPFFGIGILIAQ + KQKKIINCKIINKILILGTIIYPILIFLEYYILGNSFEIYISSVLATIILMIFAIKSPK + AINIKILNEIGDKYATFVYIIHQFIIVIFKFLVSNVYILKFGTIFVFLICCFLGVLFQF + IKNRLLKRFS" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA + sequence:UniRef:UniRef100_A0A1Z3GXJ9" + /gene="wciZ" + gene 14002..15150 + /locus_tag="FCDNMA_00085" + /gene="wchX" + CDS 14002..15150 + /db_xref="RefSeq:WP_054378043.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI00001D8FD4" + /db_xref="UniRef:UniRef100_A0A9X8NAZ6" + /db_xref="UniRef:UniRef50_Q9R922" + /db_xref="UniRef:UniRef90_A0A4J2AK78" + /db_xref="UniprotKB:Q6X850" + /db_xref="UserProtein:wchX" + /product="""putative glycerol phosphotransferase""" + /locus_tag="FCDNMA_00085" + /protein_id="gnl|Bakta|FCDNMA_00085" + /translation="MVVLQNVKFLVRVVFMVIISIVLWPVRIKKNKILFINFNGKGYGD + NPKSICEYLRVTYPELDLVWLTKDNEDFPDGVRVVRYKSLQSFYEQASSKVWVYNVRNF + 
ERLLKKRGQFYIQTWHGASSFKLIEQQADLPLKYILEAKYDARVTDIMISDSRKQTEEF + QKYFWYSGEIFEVGMPRNDALFHYKEDYDKLNNIRKKLSIDSDDYVILYAPTFRDDGDA + SYLDINFERLLQSIEQEIKKKCKILIRLHPNDSHFSNNISFNHDIIDVTLFSDMQELIL + LADVLLTDYSSAIFDFMLLNKPYVRYVNDLEKYAELRGVSDTYYELPDSIIKTAEELYD + LLPKKIENFDYDSIKKYRNEILCPIFNGTASENVGRRIIQEL" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_054378043.1" + /gene="wchX" + gene 15186..16214 + /locus_tag="FCDNMA_00090" + /gene="gtp1" + CDS 15186..16214 + /db_xref="RefSeq:WP_000794265.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI00001D8FD5" + /db_xref="UniRef:UniRef100_Q6X849" + /db_xref="UniRef:UniRef50_Q9R921" + /db_xref="UniRef:UniRef90_Q9R921" + /db_xref="UniprotKB:Q6X849" + /db_xref="UserProtein:gtp1" + /product="""putative glycerol-2-phosphate dehydrogenase""" + /locus_tag="FCDNMA_00090" + /protein_id="gnl|Bakta|FCDNMA_00090" + /translation="MKNNDLKIGSGAIHQISATLSQNNISGKILYCADPVVDDLYGSIV + RSQIEEIGRVKEESCNYNTIAYAMNIAERAIATDIDCIVGMGGGRVLDVCKYASFISKR + PYLSIPTTAANDGIASPVAVLKRQDDRPKSLGAAIPSMTLIDIDVIASGPIQNIKAGIG + DTISNYTALKDWELAVERGKDEMHGFAYLMSQNSLDALMKTKYNSITPDFIEVLVNSLV + LSGIAMDFAGSSRPVSGSEHLFSHALDYYGSTRNLHGIQVALGTVAVLKLIENSVDTVV + DYLQRFEVHINPKLLGIDEELFIYCMQHATKMRSNRYTYLHEVDLSTDRLKQIYKELIS + EL" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000794265.1" + /gene="gtp1" + gene 16230..16934 + /locus_tag="FCDNMA_00095" + /gene="gtp2" + CDS 16230..16934 + /db_xref="RefSeq:WP_054378044.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI00001D8FD6" + /db_xref="UniRef:UniRef100_Q6X848" + /db_xref="UniRef:UniRef50_O85005" + /db_xref="UniRef:UniRef90_O85005" + /db_xref="UniprotKB:Q6X848" + /db_xref="UserProtein:gtp2" + /product="""putative nucleotidyl transferase""" + /locus_tag="FCDNMA_00095" + /protein_id="gnl|Bakta|FCDNMA_00095" + /translation="MKALILAAGLGTRLAPITNEVPKSLVPVNGKPILMKQIENLYQNN + 
ITDITIIAGYKSSVLTDAVTEKYPEINIIDNVDFKTTNNMYSAYLGKAAMGDSDFLMMN + ADVFYDASVIKSLLLHKAPNAIVTDLGIYIEESMKVVEKNGRLVEISKQISPEETLGVS + IDVYKFSYEAGARFFEKCKEFIEDKRELQMWSEVALNAILSEVEFVACPLEGRWLEIDN + HEDLVAAEKLFA" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_054378044.1" + /gene="gtp2" + gene 16955..17782 + /locus_tag="FCDNMA_00100" + /gene="gtp3" + CDS 16955..17782 + /db_xref="SO:0001217" + /db_xref="UniRef:UniRef50_Q4K1N0" + /db_xref="UniRef:UniRef90_Q4K1N0" + /db_xref="UniprotKB:Q4K1L2" + /db_xref="UserProtein:gtp3" + /product="""putative phosphotransferase""" + /locus_tag="FCDNMA_00100" + /protein_id="gnl|Bakta|FCDNMA_00100" + /translation="MTNRVDYFGADISELQNKKLFLFDMDGTIYEEDRLFEGTLELLDY + IHNIGGEYIFITNNSSKSVVDYVEKVNRLGIKAERDNFFTSAQATIVYIKENYPKSKVY + CQGTKSLIKELSDAGIDVTEQVSADIDVVLVGFDTELTSDKIRNTCEILSTKDIPFIAT + NPDIRCPVSFGFIPDCGSICDMISKSVDRKPVYIGKPEPTMVDIVRKKLNYSLFETVVI + GDRLYTDIMTGINAGVTSVCVLTGEATVNDIQQGSIKPTYTFKNVKEMWKGIV" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef90_Q4K1N0" + /gene="gtp3" + gene complement(17871..18260) + /locus_tag="FCDNMA_00105" + /gene="tnp" + CDS complement(17871..18260) + /db_xref="SO:0001217" + /db_xref="UniRef:UniRef50_C1CER1" + /db_xref="UniRef:UniRef90_A0A0T8BYQ3" + /product="IS5 family transposase ORF B" + /locus_tag="FCDNMA_00105" + /protein_id="gnl|Bakta|FCDNMA_00105" + /translation="MKAQAIVTSQGRIVSLDITVNYCHDMKLFKMSRRNIGQAGKILAD + SGYQGLMKIYPQAQTPRKSSKLKPLTVEDKAYNHALSKERSKVENIFAKVKTFKMFSTT + YRNHRKRFGLRMNLIAAIINHELGF" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA + sequence:UniRef:UniRef90_A0A0T8BYQ3" + /gene="tnp" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa 
aatttaaaat tgaaatcgta taaaaacaag + 181 ggaggactgt ataaaagaca gaaatccttt gttttttata accaaggttt ataaactttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga agatgaacat + 301 aaagaagcgt gtccttagtg caggtctgac ttttgcatct gctttgcttt tagctgcttg + 361 cgaccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaattac ctattagact attaaactga taatatagtc aatcgaaaca agaacaagac + 481 aaaagagcct tgtaaaaggt attgcaactt ggtaatacct tttatgaggt gctttttgat + 541 atgagtccat gttttctcaa taggattgta ctcaggtgag tagggaggaa gaggtaaaag + 601 tttattccca aactcttcac acaagagttc tagcttcccc attctatgga atcttacatt + 661 atccataata ataaccgatg gtgtggttaa tgttggtaag aaaaacttct gaaaccatac + 721 ttcaaaaaag tcgctcgtca tcgtctcttc gtaagtcatt ggagcgatta actcaccatt + 781 tgttagacct gcaaccaaag aaatcctctg atatcttctt ccagatactt tacctcttat + 841 taactgacct tttaatgagc gaccatattc tcgataaaaa taagtatcga atcctgtttc + 901 gtcaatctaa acaggtgcta ggtgctttaa tctattaaaa ttcttaagaa ataaggctac + 961 tttttctggg tcttgttcat aattagattg aaactagaat agtacacctc tgcttctaaa + 1021 acattgttag aaatcgattt gactgtcctg atcgatttat catgttctta tttcatttta + 1081 ctatattttt gtttcgcggg aagtctacta agatacttaa agatgcagat agtgaaaaaa + 1141 ggtgtagaca ttaccgtaaa aaagtgatat aatcgtatga tgttcaatgt ataggtgtta + 1201 atcatgagta gacgttttaa aaaatcaagt tcacagaaag tgaagcgaag tgttaatata + 1261 gttttgttga ctatttattt attgttagtt tgttttttat tgttcttaat ctttaagtac + 1321 aatatccttg cttttagata tcttaattta gtggtaactg cgttagtcct actagttgcc + 1381 ttggtagggc tactcctgat tatctataaa aaagctgaaa aatttactat ttttctgttg + 1441 gtgttctcta tccttgtcag ctctgtgtcg ctctttgcag tacagcagtt tgttggactg + 1501 accaatcgtt taaatgcgac ttctaattac tcagaatatt caatcagtgt cgctgtttta + 1561 gcagatagtg atatcgaaaa tgttacgcaa ctgacgagtg tgacagcacc gactgggact + 1621 gataatgaaa atattcaaaa actactagct gatattaagt caagtcagaa taccgatttg + 1681 acggtcgacc agagttcgtc ttacttggca gcttacaaga gtttgattgc aggggagact + 1741 aaggccattg tcttaaatag tgtctttgaa aatatcattg agtcagagta tccagactac + 1801 
gcatcgaaga taaaaaagat ttataccaag ggattcacta aaaaagtaga agctcctaag + 1861 acgtctaaga atcagtcttt caatatctat gttagtggaa ttgacaccta tggtcctatt + 1921 agttcggtgt cgcgatcaga tgtcaatatc ctgatgactg tcaatcgaga taccaagaaa + 1981 atcctcttga ccacaacacc acgtgatgcc tatgtaccaa tagcagatgg tggaaataat + 2041 caaaaagata aattaaccca tgcgggcatt tatggagttg attcgtccat tcacacctta + 2101 gaaaatctct atggagtgga tatcaattac tatgtgcgat tgaacttcac ttctttcttg + 2161 aaaatgattg acttattggg aggggtagat gttcataatg atcaagagtt ttcagctcta + 2221 catgggaagt tccatttccc agtagggaat gtccatctag actctgagca ggctctaggt + 2281 tttgtacgtg aacgctactc actagccgat ggagaccgtg accgtggtcg caaccaacaa + 2341 aaggtgattg tggctatcct tcaaaaatta acgtcaaccg aagcactgaa aaattatagt + 2401 acgatcatta atagcttgca agattctatc caaacaaata tgccacttga gactatgata + 2461 aatttggtca atgctcagtt agaaagtgga gggaattata aagtaaattc tcaagattta + 2521 aaagggacag gtcggacgga tcttccttct tatgcaatgc cagacagtaa cctctatgtg + 2581 ttggaaatag atgatagtag tttagctgta gttaaagcag ctatacagga tgtgatggag + 2641 ggtagatgaa atgatagaca tccattcgca tatcgttttt gatgtagatg acggtcccaa + 2701 gtcaagagag gaaagcaagg ctctcttggc agaatcctac aggcaagggg tacgaatcat + 2761 tgtctctacc tctcaccgtc gcaagggcat gtttgaaact ccggaagaga agatagcaga + 2821 aaactttctt caggttcggg aaatagctaa ggaagtggcg agtgacttgg tcattgctta + 2881 cggagctgaa atttactaca caccagatgt tctggataag ctggaaaaaa ggcggattcc + 2941 gaccctcaat gatagtcgtt atgccttgat agagtttagt atgaacactc cttatcgcga + 3001 tattcatagc gccttgagca agatcttgat gttgggaatt actccagtca ttgcccacat + 3061 tgagcgctat gatgctcttg aaaataatga aaaacgcgtt cgagaactga tcgatatggg + 3121 ctgttacacg caagtaaata gttcacatgt cctcaaaccc aaactttttg gcgaacgtta + 3181 taaattcatg aaaaaaagag ctcagtattt tttggaacgt gatttagttc atgtagttgc + 3241 aagtgacatg cacaatttag acagtagacc tccatatatg caacaggcat atgatatcat + 3301 tgctaagaaa tatggagcga aaaaagcgaa agaatttttt gtagataatc ccagaaaaat + 3361 tataatggat caattaattt aggagaaaat atgaaggaac acaacacttt ggaaatcgat + 3421 atattgcaac tattcagagc 
tttatggaaa agaaagttgg tcattttatt agtggcaatt + 3481 ataacttctt cagttgcttt tgcctacagt acttttgtta tcaaacctga gtttactagt + 3541 acgactcgga tttatgtagt taaccgtaat caggaagaga agtctggttt aaccaatcaa + 3601 gacttgcagg caggaactta tctggtaaaa gactaccgtg agattatcct ttcgcaggat + 3661 gttttggagg aagttatttc tgatttgaaa ctagatttga cgccaaaagg tttggctaat + 3721 aaaattaaag taacagtacc agttgatacc cgtattgtct ctgtttcagt taatgatcga + 3781 gttcctgaag aggcaagccg tatcgctaac tctttgagag aagtagctgc tcaaaaaatt + 3841 atcagtatta ctcgtgtttc tgatgtgaca acactggagg aggcaagacc ggcgatatca + 3901 ccgtcttcgc caaatattaa acgcaatata ctaattggtt ttttggcagg gggggttgga + 3961 actggtgtta tagttcttct tcttgaactt ttggacactc atgtgaaacg tccggaagat + 4021 atcgaagata cactgcagat gacacttttg ggagttgtac caaacttgag taagttgaaa + 4081 taggagagag gaatgccgac attagaaata gcacaaaaaa aactggagtt cattaagaag + 4141 gcagaagaat attacaatgc cttgtgtaca aatatacagt tgagcggaga taaactaaaa + 4201 gtaatttccg ttacttctgt taaccctggg gaaggaaaaa caactacttc cgtaaatata + 4261 gcaaggtcgt ttgcgcgtgc aggctataaa actcttttga tcgatggcga tactcgaaat + 4321 tcagttatgt caggattttt taaatctcgt gaaaaaatta cagggctaac agaattttta + 4381 tctgggacag ctgatttatc tcacggttta tgtgatacaa atattgaaaa tttatttgta + 4441 gttcaatcgg ggtctgtatc accaaaccct acagccttgt tacaaagtaa aaattttaat + 4501 gatatgattg aaacattgcg taaatatttt gattatatca ttgttgatac agcacctatt + 4561 ggaattgtta ttgatgcggc aattatcact caaaagtgtg atgcgtccat cttggtaaca + 4621 gcaacaggtg aggtgaataa acgtgatgtc caaaaagcga aacaacaatt agaacaaaca + 4681 gggaaactgt ttttaggtgt cattctcaat aaatttgatg ttcaacataa aaaatatggt + 4741 tcttacggtg actatggtaa ttatggtaaa aaataactta ggaaagattt tatggatgaa + 4801 aaaggattga aaatttttct ggcagtatta cagagtatta ttgtcatttt attggtttat + 4861 tttcttagct ttgttagaga gacagaactt gaacgttctt cgatggttat actatacctt + 4921 ctccactttt ttgtattcta ttttagttcc tatggtaata atttttttaa aagagggcac + 4981 ttagttgagt ttaatagtac tataagatat atttttttct ttgcaatagc tataagtgta + 5041 ttaaactttt ttatagcgga acggtttagt atctctagaa 
gaggaatggt atacttctta + 5101 actttagaag gaatatcctt atacttgtta aatttcttag taaagaaata ttggaagcat + 5161 gtgtttttta atctaaaaaa tagcaagaaa attttactgt taacagtaac gaaaaatatg + 5221 gaaaaagttc ttgataaatt gctagaatct gatgaacttt catggaaatt ggtagcagta + 5281 agtgttttgg ataaatctga ttttcaacat gataaaatac ctgtaattga aaaggaaaaa + 5341 attattgaat ttgcaacgca tgaagttgtg gatgaggtgt ttgtcaatct tccaggagag + 5401 agctacgata ttggagaaat tatctctagg tttgagacaa tggggataga tgtaactgta + 5461 aatcttaaag catttgataa gaatttgggt cgcaataaac aaattcatga gatggtagga + 5521 ttgaatgtag tcactttctc tacaaatttt tataaaacta gtcatgtgat ttcaaagaga + 5581 attctcgata tttgtggtgc cactattggc cttgttcttt ttgctatagc tagtctagtt + 5641 ttagttccat tgattcgtaa agatggcgga ccagctattt ttgctcaaac tcgtataggg + 5701 aaaaatggtc gacattttac cttttataaa ttccgttcga tgaggatcga tgctgaagct + 5761 atcaaagaac agttgatgga tcaaaatacg atgcaaggtg gtatgtttaa gatggacaat + 5821 gatcctcgtg ttacaaaaat tggtcgcttt attcgtaaaa ccagtttgga tgaattgccg + 5881 cagttttgga atgtctttat aggagatatg agtttggtgg gaacacgtcc acctacagta + 5941 gacgagtatg atcagtatac tccagaacag aaacgtcgac tcagctttaa acctggtatt + 6001 acaggtttat ggcaggttag cggccgtagt aaaataaccg attttgacga tgttgtaaaa + 6061 ttagatgtgg cttatattga taattggaca atctggaaag atattgaaat tttgcttaaa + 6121 actgttaaag ttgtatttat aagagatgga gcgaagtaag gaatgaaagt atgtctagtt + 6181 ggatctagtg gaggccattt aactcatttg tatttattaa aacctttctg gaatgataaa + 6241 gaaagatttt gggttacttt tgataaggcg gacgctcgga gtgtactctc tgaggaagtt + 6301 gtatatccct gttattatcc aaccaatcgt aatataaaaa atttaataaa aaatactttt + 6361 ctcgcctata aaattttaaa aaaagagaga ccagatttga ttatttcttc tggtgccgct + 6421 atcgctgttc ctttctttta tattgggaag ttatttggat caaagacagt gtatatagaa + 6481 gtgtttgata gaattgatgc ttcaacactg acaggaaaac ttgtttatcc agtaacggat + 6541 aggtttattg tacaatggga agaaatgaaa aaagtatacc caaaagcaat taacctagga + 6601 gggatattct aatgattttt gtgactgtag gtacacacga acaacaattt gatcgattga + 6661 ttaaagaagt tgattatcta aaaaaagaaa atcttattca agatgaagta tttattcaaa + 6721 
taggatattc cagttatatt ccgaaatatt gtgagtggga aaagataatt tcttatgaaa + 6781 aaatgaatca attgattaag gaatcagata ttatcattac tcatggtgga ccagcgacgt + 6841 ttatgggggt tattgctaaa ggaaaagttc cgatagttgt tccgaggcaa aaaaaatttg + 6901 gagagcatgt gaatgaccat cagcttcaat tcgtaaaact gacgaaagaa atatacaatt + 6961 ttatagtcat agatgatatt tccgacttat atttaagtat acgtgatttt aaggataaat + 7021 attttggaat ttgtttgaac aatgaaagat ttaatctaca ttttaatgcg gaaattaata + 7081 aactatttga aggaaataaa gtagatgaaa attagaatag agcctcaata ttttctttat + 7141 aagtaccttt ggcttatcat actgctccca aaacagttta tgcaattaat attattttct + 7201 ttaattgtct taattctatt accggtctat ataaaagata gacaaatttc caaaatagat + 7261 gcaccgtctt tttatatagt tctatgggtc atgatgtatt ctatatcaat aatttggaat + 7321 tttttaatta gtggcttacc tattcaagtg ttgttttcag atttgagtaa ggcattcaat + 7381 tggatattag cagtattttt ttataattat tatttgaaaa atcccattaa cgttgacaag + 7441 ataaagaaat atatgtttta taatttcgct atattagtta ttattgttgc tttattctat + 7501 gttcaaagag gcgctaatgt agtattgttt ggaagaagct tattaggttg ggacggattc + 7561 gtatcagcta ccagttacgg agtaagatat gcaggatttt tagaatattc aacattaaat + 7621 gggcagttga ttcttttttt gttaccgtta attaggttat ttaaacttag tttttttaca + 7681 caagtaacta ttcttgcttt tttgctacag gttttagtat tgagtaaatc tagaatagct + 7741 attattgctc tgattatata catagtattt gtagtaatgg ttcagattac ttcaattaat + 7801 aagcggatga ttgtagcgtt ttatccaact atacctctta tattgcttta taattgggaa + 7861 aaaattaaac atatcttttt tcaaatgttt aattcaagaa caggtagtaa tgtgacacgt + 7921 tttatagtgt acgaagaatc tcttaaagct attaatgggc tgggaatttt acttggagca + 7981 ggaatcagaa cacaatctac agtaggtata ttattaggat cacattcaat gtatattagt + 8041 tttatttata ggacagggat tttaggaagt ataataatag taatactgtt ctattatttg + 8101 ttttctaaat ttttaaaaag tgccccatct ggaaagttaa tcagtatagg ctatatttta + 8161 gctttattgg tgttttggct ttttgaagaa ttagatccac attattggtg tttaatttta + 8221 tttttttcaa caataagtat tttcataaac aatagaaaag aggaaatagt tggatgatag + 8281 aagtatcaat cataattcca atatacaatg ctgaaaaaac tattaaaaat tgtgttgata + 8341 gtgccttaaa gcaaaattta 
gaatctcttg aagtgatttt ggtgaatgat gggtctaacg + 8401 attctacagc agaaattttg aaccagtacg acaggaattc aagggttaag atttttcatc + 8461 agcttaataa aggggtgtct actgctagaa ataaggggtt atctcatgct agtggagagt + 8521 atgtattttt tctagattca gatgatattt tagatgatgg tatgctttct aaaatgtacc + 8581 aatttgtaaa aaataataaa gttgatctct tatcttgttg gcataaagaa cctgctacaa + 8641 ctcaatacgg tggaaatgag aataagtcaa cttcatttat tgcacgtaca agagaagaaa + 8701 taggtgctca ttttgttgat atctttccga gaagtgcttg tgccaaattg ttttttcgca + 8761 aaataattga agaaaataat attacttttt cgactgagat gtcactaggt gaagatatgt + 8821 catttgtgta tcaatactta atggtttcta aaagtattgg agttattgac ggggtgtatt + 8881 ataatattca aaatgtaaat ccacagtcgt tatctaagcg ctatgtgcag aatattgaaa + 8941 attccctaat aattcagaac cagttatgga atcaactgtt ggaagtttat cctaaaattg + 9001 aggagaacta ctataagcaa catatggatt ttagatttta ccttgctaac ttgtatgtaa + 9061 ataatttatt taaatttgat tctccgtatt catcaaaaga aaaactagac caaattgctc + 9121 aacaattaaa aaagtataga ttatttttag atgaaaaagt cagcaaagaa aagatgccta + 9181 aaaatataaa tgagatgatt gttttttatt tactaaaatt gaaaattcca gtgttgattt + 9241 attcttttta ttcgtttaaa gagtggtgga agagaagaaa aattaaaaat gaaggataaa + 9301 taagttatgg aagatttgat aagcattgtt gttccagtct ataacgtgga aaaatattta + 9361 aaaaaatcaa tagaaagtat tttgaatcag acttatcaaa atatcgagat tttattggtt + 9421 gatgacggaa gcacagatag tagtgggaaa atttgtgaat catttagtaa agttgatcct + 9481 aggataagag tatttcataa agaaaatggt ggtttatcag atgctcggaa ttttggaatt + 9541 gagcaaatga aaggtcaata tgtagcgttt attgatagcg atgactacat atctaaggat + 9601 tatgtctgga agttgtattc ttctataaaa aataatgatt ccgaggtgtc gatttgttct + 9661 tttttattag tcgatgaaaa aggggaaaaa ataaaagatg agctattaga ttcgggaaaa + 9721 atatgcttga ctggtcaaca aatattagaa aaagtattaa cagccgacgg ctatcgctat + 9781 gttgttgctt ggaataagct ttatcggtca actttatttg aaaaattaaa atttaaaaaa + 9841 ggaatgttgt atgaggatga atttcttaac tatcctctat tttgggactg taaaagggta + 9901 tcaattgtag aggagccgtt atatttatac gttcaacgaa aaggaagcat tgtacaaagt + 9961 aatatgactt tagaaaaaat aaagatgaag gatgagatgc 
atacttcacg cattgagttt + 10021 tattcagaaa aggggcattc ttttttgcac gaaaaagcgt gtcaacagta ctgcaattgg + 10081 attgttacag cgactaccaa tcatagtaag attttaaatc ctaatttttc aaagtattta + 10141 caacgacagt ttagaaagtt cgctaaatat acacgaaaca atgatattag actaattgtg + 10201 cagaacattc taggatttat agatattcgt ttagcagctt atgtaaaatc aaaagtaatg + 10261 tagagtatag gaaacataat gatagaaaaa attttagatt ctattaaaaa tcattctttt + 10321 tatagtaaat tgaaggataa aattcataga attattccat tatatattat aaaaaatcaa + 10381 aatatagctt ttcaacaaga taccgatata gcatatagaa aactaaagaa gaagtttaga + 10441 catatttcgt tgactggaga tgagcttaaa tataaaatgg agttttcaaa taaagtttgg + 10501 atttgttggt ttcagggaga agagcatgcc ccagagttaa ttaaaacatg tattcaatca + 10561 atgaggaatc aacttcaagg aagagaaatc attgtgttga cagaaaaaaa tataagtgat + 10621 tatacagaga ttccagacta tattattgaa aaatacaaaa aaggatggat ttctcgtgcg + 10681 cattactctg atatccttag gatagatctt ctatgtcgcc atggaggatt atgggtagat + 10741 gcaacagtgt tgaatacagg aggagatttc tcaaatcttg aggtaccact ttttgtatat + 10801 aaatctttga atttatcaag aaaagattca caagctattg tagcatcaag ttggttaatt + 10861 tcgtcatata gtaatcatcc tatattactc tatacgagaa aactcctatg ggcctactgg + 10921 cgaagaaaaa atagtttatg taattatttt ttgttccata tatgttttac aatagctaca + 10981 gagcggtacc caatcgaatg gtctgctgtc cctactttta ataatcattc tcctcatata + 11041 cttcattttg agttgaatga acaattttcg gaaaaacggt gggaacaact gaagcatatt + 11101 tcggcgtttc ataaattaaa tcatcatata gattattcta gcggtgttaa cactttttat + 11161 aagttcatag tatcttcgaa agtttagaaa aatgagtaat aaaattagta aaaatttagc + 11221 ctacaatatg gggtatcagt taattggtat tgcagctccc ttgataactt ctccttattt + 11281 atcacggata ttaggtgctg aaaatttagg tattcattct tttactatgt cggttgcact + 11341 ttactttatg atgtttatgc ttcttggaat tgcaaattac ggaaatagaa caattgcgac + 11401 tgttaaacga gaaggaaagg atattctatc aaaaacgttt tggagtatct actctatcca + 11461 gttgataatg tctattctgg taactatagc ttatcttgct tatctatatt tgggggcagt + 11521 acattacaaa gttattgcaa tattacaact ctttttattg ttatcaaatg ctgttgatat + 11581 tacttggttt ttctatggat tagaaaattt taagcaaatc 
gtttttagga atacattagt + 11641 caaactttta ggattatttt taattttttt atgtgtgcgt caaggcacag atttatggaa + 11701 atacacattt ataaacggat cagtaacttt agttggccaa cttttactat ggggacaatt + 11761 aaaaggaata ttaacttgga aaaaaattca attaaaggaa ttactacctc atatcaagcc + 11821 aattttaatt ctttttattc ctgtactagc cattagtatt tttactaata tggataaata + 11881 tatgcttggt ttaatggttg atgtaaagca ggttggattt tatgacaatg caggtagaat + 11941 tattgaaatt cctaaagctt tgattgcagc tttaggggcc gttatgttac caagaacttc + 12001 ctatttatta gcggaaggac agaaagaaaa gagtaaatac tacatagagg taacaatttt + 12061 atacgtgatg attatttcta gtgtattgat gtttgggcta atatcggtat ctgatatttt + 12121 ttccattata ttttggggag aagaatttct tgaatcaggt agattgattt ctgctatgtc + 12181 tccggctttt gtcttctctg tattaggaaa tatcattagg actcagtatt tgattcctag + 12241 agctaaggat aaagattatg tagtgtctct aattgcgggg gctgttgtta atctagtgct + 12301 aaactatttt tttataaaac cttttggtgc tatgggagca acaattagta cagttttggc + 12361 agaatttgta ttgtctggaa tgcagttttg gtcagtaaga agagacttag atttaaaaag + 12421 atatttgaaa aacggtttga tattctacct atttggtctg attatgcacc tcattattat + 12481 agcactcaaa actcagttac catacaatat aatgagtctt attttactaa tagttttggg + 12541 tggaatagta tatgttattt tttgttgttg ctatatttta atgtcaagaa atttacattt + 12601 taagttattg aaggaaaaga ttatacgaaa ggttgtacat aaaaatacat tataaaatat + 12661 tagtttatct tatttagttg gatactatta aataaacgaa agtatttgaa actttggtaa + 12721 ttgagattat agagattata gagataaact aagctatatt atagcttcat tattaaagta + 12781 agaatatcgg tgcagtgtag ttaacgaata atgtgagtac tcatttctta gatggagcta + 12841 ggggtcatta taagggattg atatgacatt ttgagtaagt tacagctaga gtttaggttt + 12901 gattatatca gatatttaga tgatttggaa aataataaaa taagttagga actatttttt + 12961 tattgttttg agtgacaggt ttgattttgg gaaatgtatt ttgttaaata ggtaggaaag + 13021 atggttacta aagataaagg attaacatat aatagtactt tgcatgcaat aaaagtatta + 13081 gcatgtttta gtgttgttgc tattcatata tggctaccag gaaaaattgg agcgttttat + 13141 caaataatag cacgatttgc agttccaatg ttctttttga tttctggctt ttattcatat + 13201 aatatttcaa agaataaaat acagaataga attaaaaaaa 
tatttagatt gatattaaga + 13261 agtacatttt tttatgtaat aatatttgta tggatgtttt ggagagaagg taatatgcag + 13321 tttatttttc aaaactttaa tttaacaaat attataagat ttgtgatttt taataggatt + 13381 tcagatttaa taggctatct agcaacaccg ttgtggtatt tatttgctat attatatata + 13441 tatatatata tctttatttt tccaataaaa gactactatt gacaaaacga tggatttcta + 13501 tacttttact attttctttc attatggaag ctacaattag cgattcaatt ttttatagaa + 13561 attttttatt tatgggaata ccattttttg gaataggaat tcttattgca cagaagcaaa + 13621 agaagattat taattgtaaa ataataaaca aaatattaat cttgggaaca attatctatc + 13681 caatactaat atttttagaa tattatatct tgggtaattc ttttgagatc tatataagtt + 13741 ctgtgctagc aaccataata ttgatgattt tcgcgattaa atcacctaaa gcgattaata + 13801 taaaaatact gaatgaaatt ggagataaat atgcgacttt tgtttacatt atacaccagt + 13861 ttatcattgt gatatttaaa tttttagtat ctaatgttta tattctcaaa tttgggacga + 13921 tatttgtctt tttgatatgt tgttttctag gggttctatt tcaatttatc aaaaacagac + 13981 tattaaaaag gtttagttaa gatggttgtt ttacaaaatg ttaaattttt agtaagagtt + 14041 gtttttatgg ttattatcag tatagtgtta tggcctgttc ggataaagaa gaataagata + 14101 ctatttatta attttaatgg taagggatat ggtgataatc cgaaaagtat ttgtgagtat + 14161 cttcgagtta catatccaga gttagattta gtttggctta caaaagataa tgaagatttt + 14221 ccagatggag tgagagttgt aagatataaa tctctacaat ctttttatga gcaagctagt + 14281 tcgaaggttt gggtttataa tgtaagaaat tttgaaagac tactaaaaaa acgcggacag + 14341 ttttatattc aaacttggca cggtgcttct agttttaaac tgatagaaca gcaggctgat + 14401 ttaccattaa aatatatttt agaagcaaag tatgatgcaa gagtcacaga tataatgatt + 14461 tcagatagca gaaaacaaac tgaagaattt caaaagtatt tttggtattc aggagaaatt + 14521 tttgaggtgg ggatgccgag aaatgatgcc ttgtttcact ataaggaaga ctacgacaag + 14581 ttaaataata tcagaaaaaa actaagcatt gattcagatg attatgttat tttatatgcc + 14641 cctactttca gagatgatgg ggatgcatct tatttagata taaattttga acggcttttg + 14701 caaagtattg aacaagaaat taagaagaaa tgtaaaattt taattagatt acatcctaat + 14761 gactctcatt ttagtaataa tatttctttt aatcatgaca taattgatgt tacgctattc + 14821 tcagatatgc aggaacttat attattggca gatgttttac 
tgacagatta ttcttccgcg + 14881 atatttgatt ttatgctttt aaacaagcct tatgtcagat atgtgaatga tttagaaaaa + 14941 tatgctgagc ttaggggggt atcagataca tattatgaat tgccggattc tattattaaa + 15001 actgctgaag aattgtatga cttactgcct aaaaaaatag aaaattttga ttatgattct + 15061 ataaaaaaat atagaaatga aatactgtgt ccaatcttta atggaaccgc tagtgaaaat + 15121 gtaggaagga gaataattca agagttgtga agtaaaacat tgggttattt ttaaggtaac + 15181 gagatttgaa aaataatgat ttaaagatag gaagtggagc tattcatcaa atctccgcta + 15241 cactttctca aaataatatt tcgggaaaga ttttatattg tgctgatcca gttgtcgatg + 15301 acttgtacgg ttcgatagta cgttcacaaa tagaggaaat tggtcgggta aaggaagaaa + 15361 gttgcaatta taatactatt gcttatgcga tgaatatagc agaaagggct attgccacag + 15421 atattgactg tattgtggga atgggaggag gtcgtgtttt agatgtctgc aagtatgcat + 15481 cttttatttc gaaacgtcct tacctatcga ttccgacaac agcagcaaat gatggcattg + 15541 cttccccagt tgctgttttg aaaaggcagg atgatagacc aaaaagctta ggggcggcta + 15601 tcccctcaat gacactaatt gatattgatg ttattgcatc aggacctata caaaatataa + 15661 aagctggtat cggtgataca atatccaatt acactgcatt gaaagattgg gagttggcag + 15721 ttgagcgagg gaaagatgag atgcatggtt ttgcatatct aatgtcgcaa aattctttag + 15781 atgctttaat gaaaacgaag tataattcta ttacccctga ttttattgaa gttttggtaa + 15841 actctttagt tttatcaggc attgcaatgg attttgcggg aagtagtaga cctgtcagtg + 15901 ggtcagagca cttatttagt catgcattag attactatgg ttctacaagg aatcttcatg + 15961 gaattcaggt tgcattaggt acagtcgcag ttttgaaatt aattgaaaat tctgttgata + 16021 ctgtagtgga ttacttgcaa agatttgagg ttcatattaa cccgaaactt ttggggatag + 16081 atgaagagtt gtttatttat tgtatgcaac atgctacaaa aatgagaagt aatcgctata + 16141 cctatctgca tgaagttgat cttagcacag atagattgaa acaaatatat aaggaactca + 16201 taagcgagtt gtagaaaaga gaggaaaaaa tgaaagcact tattttagca gcagggttag + 16261 gaacacgtct agctccaatt accaatgagg taccaaaatc tttggtacca gtcaatggta + 16321 agccaatttt gatgaaacaa attgaaaatt tatatcaaaa taatattaca gatattacga + 16381 ttattgctgg atataagtca tctgtattaa cagatgcagt tactgaaaag tatccagaaa + 16441 ttaatattat tgataatgtt gattttaaaa cgactaataa 
tatgtattca gcctatctag + 16501 gaaaagctgc aatgggtgat agtgacttct taatgatgaa tgcagatgta ttttatgatg + 16561 cttctgttat taaaagtctg ttgcttcata aagctccaaa tgcaattgta actgatttag + 16621 gtatttatat tgaagagtct atgaaagtcg tagaaaaaaa tggtcgttta gtagaaattt + 16681 ctaaacagat ttcacctgag gaaactttag gagtttctat tgatgtttat aaattctctt + 16741 atgaagcagg tgctcgattc tttgaaaagt gtaaggaatt tattgaagat aaacgagaac + 16801 ttcaaatgtg gagtgaggtt gctcttaatg caattctttc tgaagttgaa tttgtagcat + 16861 gtccattaga gggtcgttgg ttagaaattg ataatcatga agacttagtt gctgcagaaa + 16921 aactatttgc ttgaaccgaa tacggagaat gaaattgaca aatagagttg attattttgg + 16981 tgctgatatt agtgaacttc agaataaaaa attattctta tttgatatgg atggtaccat + 17041 ttatgaagaa gataggttgt ttgagggtac tctcgaatta ttagactata ttcataatat + 17101 tggcggtgag tatattttta ttacaaacaa ttcatctaag tctgttgttg actatgtaga + 17161 aaaagttaac agattaggta ttaaagctga acgagataat ttttttacct ctgctcaagc + 17221 cacaattgtt tatattaaag aaaattatcc taaatctaaa gtttattgcc aaggaacaaa + 17281 atctttgata aaagaactat ctgacgcagg aattgatgta actgagcaag ttagtgctga + 17341 tatagatgtt gttcttgttg gttttgatac agaattaacc agtgataaaa ttcgcaatac + 17401 ctgcgagatt ctatcaacaa aggacatacc tttcatagct actaaccctg atattcgctg + 17461 cccagtatcg tttggattca tcccagattg tggttctatt tgtgatatga ttagtaaatc + 17521 agtcgatagg aaacctgttt acataggtaa acctgaacct acgatggttg atattgttcg + 17581 aaaaaaatta aattattctc tatttgaaac agttgtgatt ggagatcgct tgtatacgga + 17641 tatcatgact ggtataaatg caggagtaac ttcagtttgt gtgctgacag gagaagcaac + 17701 ggtgaatgat attcaacaag gtagtataaa accgacttat acatttaaaa acgtgaaaga + 17761 aatgtggaaa ggaattgtct gattttttca ttctgaatag tgaattcatg aatactgtca + 17821 aaatactcgt atgtatttaa attgatttta ttattagact tcctgcaaaa ctagaatcct + 17881 agttcatgat tgataatagc agcaatcaaa ttcattcgta atccgaagcg tttacgatga + 17941 tttcgatagg ttgttgaaaa cattttaaac gtttttactt tggcaaagat gttctcgacc + 18001 ttgcttctct ccttggatag cgcatggtta taggctttat cttcaactgt tagcggcttg + 18061 agtttgctgg atttacgtgg agtttgtgct tgaggatata 
tcttcatgag cccttgataa + 18121 ccactgtcag ccaagatttt accagcttgt ccgatatttc tgcgactcat tttgaacaac + 18181 ttcatatcat gacaatagtt cacagtgata tccaaagaaa caattctccc ttgacttgtg + 18241 acaatcgcct gagccttcat agcgagaaat atctattcta tcttctagaa tgtcttccaa + 18301 acgaggaaac tctcgtaaac aaagaggttt tagaggctta tttaccatgg actaaagttg + 18361 tacaagaaaa gtgcaaataa gaaatctcca gattaggaac tatccgtgag ttctctagtc + 18421 tggagatttt tcaatatact tcgttattgg gcgcttacaa tgatattcat attttttgca + 18481 aagatgttgt ttgaaaaata attttcaaaa attctgaaaa ttctgttgac aactttctga + 18541 aaagagtcta taatggagag aaagttttaa aggagaaaat gatgaaaagt tcaaaactac + 18601 ttgcccttgc gggcgtgaca ttattg +// diff --git a/public/res/serotype_genbank/serotype_15D.gb b/public/res/serotype_genbank/serotype_15D.gb new file mode 100644 index 0000000..76bc24b --- /dev/null +++ b/public/res/serotype_genbank/serotype_15D.gb @@ -0,0 +1,897 @@ +LOCUS SRR11130100 20128 bp DNA linear UNK 10-JUN-2024 +DEFINITION SRR11130100, whole genome shotgun sequence. +ACCESSION SRR11130100 +VERSION SRR11130100 +KEYWORDS . +SOURCE None + ORGANISM . + . 
+COMMENT Annotated with Bakta + Software: v1.9.3 + Database: v5.1, full + DOI: 10.1099/mgen.0.000685 + URL: github.com/oschwengers/bakta + + ##Genome Annotation Summary:## + Annotation Date :: 06/10/2024, 18:43:26 + CDSs :: 21 + tRNAs :: 0 + tmRNAs :: 0 + rRNAs :: 0 + ncRNAs :: 0 + regulatory ncRNAs :: 0 + CRISPR Arrays :: 0 + oriCs/oriVs :: 0 + oriTs :: 0 + gaps :: 0 + pseudogenes :: 0 +FEATURES Location/Qualifiers + source 1..20128 + /mol_type="genomic DNA" + gene 1..1608 + /locus_tag="ILOCDJ_00005" + /gene="dexB" + CDS 1..1608 + /db_xref="COG:COG0366" + /db_xref="COG:G" + /db_xref="EC:3.2.1.70" + /db_xref="GO:0005737" + /db_xref="GO:0005975" + /db_xref="GO:0043896" + /db_xref="KEGG:K01215" + /db_xref="RefSeq:WP_001156799.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0001DDD446" + /db_xref="UniRef:UniRef100_A0A4J1NL93" + /db_xref="UniRef:UniRef50_Q99040" + /db_xref="UniRef:UniRef90_Q54796" + /product="Glucan 1,6-alpha-glucosidase" + /locus_tag="ILOCDJ_00005" + /protein_id="gnl|Bakta|ILOCDJ_00005" + /translation="MQEKWWHNAVVYQVYPKSFMDSNGDGIGDLPGITSKLDYLAKLGI + TAIWLSPVYDSPMDDNGYDIADYQAIAAIFGTMEDMDQLIAEAKKRDIRIIMDLVVNHT + SDEHAWFVEACENPNSPERDYYIWRDEPNDLDSIFSGSAWEYDEKSGQYYLHFFSKKQP + DLNWENEKLRQKIYEMMNFWIDKGIGGFRMDVIDMIGKIPDEKVVNNGPMLHPYLKEMN + QATFGDKDLLTVGETWGATPEIAKLYSDPKGQELSMVFQFEHIGLQYQEGQPKWHYQKE + LNIAKLKEIFNKWQTELGVEDGWNSLFWNNHDLPRIVSIWGNDQEYREKSAKAFAILLH + LMRGTPYIYQGEEIGMTNYPFETLDQVEDIESLNYAREALEKGVPIEEIMDSIRVIGRD + NARTPMQWDESKNAGFSTGQPWLAVNPNYEMINVQEALANPDSIFYTYQKLVQIRKENS + WLVRADFELLDTADKVFAYIRKDGDRRFLVVANLSNEEQDLTVEGKVKSVLIENTLAQE + VFEKQILVPWDAFCVELL" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_001156799.1" + /gene="dexB" + gene 1767..1940 + /locus_tag="ILOCDJ_00010" + CDS 1767..1940 + /db_xref="RefSeq:WP_061753596.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000765355D" + /db_xref="UniRef:UniRef100_UPI000765355D" + /db_xref="UniRef:UniRef50_A0A0H2ZQL8" 
+ /db_xref="UniRef:UniRef90_A0A0H2ZQL8" + /product="Lipoprotein" + /locus_tag="ILOCDJ_00010" + /protein_id="gnl|Bakta|ILOCDJ_00010" + /translation="MNIKKRVLSAGLTFASALLLAACDQSGSDTKTYSSTFSGNPTTFN + YLLDYYVDNIVN" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_061753596.1" + gene complement(2450..2779) + /locus_tag="ILOCDJ_00015" + /gene="tnp" + CDS complement(2450..2779) + /gene="tnp" + /db_xref="SO:0001217" + /db_xref="UniRef:UniRef50_A0A7G1IQ53" + /db_xref="UniRef:UniRef90_A5LML9" + /product="IS630-Spn1 transposase" + /locus_tag="ILOCDJ_00015" + /protein_id="gnl|Bakta|ILOCDJ_00015" + /translation="MAYSIDFRKKVLSYCERTGSITEASHVFQISRNTIYGWLKLKEKT + GELNHQVKGTKPRKVDRDRLKNYLTDNPDAYLTEIASEFSCHPTTIHYALKAMGYTRKK + EPHLL" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef90_A5LML9" + gene 3028..4473 + /locus_tag="ILOCDJ_00020" + /gene="wzg" + CDS 3028..4473 + /db_xref="BlastRules:WP_000091082" + /db_xref="SO:0001217" + /db_xref="UniRef:UniRef50_G3G7D5" + /db_xref="UniRef:UniRef90_Q9R928" + /db_xref="UniprotKB:Q4K1R4" + /db_xref="UserProtein:wzg" + /product="""integral membrane regulatory protein Wzg""" + /locus_tag="ILOCDJ_00020" + /protein_id="gnl|Bakta|ILOCDJ_00020" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAFR + YLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNRLN + ATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLTVDQ + SSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAPKTSK + NQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADGGNNQK + DKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQEFSALH + GKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAIIQKLTSTEVLKNYS + SILQGLQDSLQTNMPIETMIDLVNTQLESGGNYKVNSQDLKGTGRMDLPSYAMPDSNLY + VMEIDDSSLAVVKAAIQDVMEGR" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA 
sequence:UniRef:UniRef90_Q9R928" + /gene="wzg" + gene 4475..5206 + /locus_tag="ILOCDJ_00025" + /gene="wzh" + CDS 4475..5206 + /db_xref="BlastRules:WP_000565352" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF43" + /db_xref="UniRef:UniRef100_Q4K1K8" + /db_xref="UniRef:UniRef90_Q9AHD4" + /db_xref="UniprotKB:Q4K1R3" + /db_xref="UserProtein:wzh" + /product="""protein-tyrosine phosphatase Wzh""" + /locus_tag="ILOCDJ_00025" + /protein_id="gnl|Bakta|ILOCDJ_00025" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAEAYRQGVRTIVSTSHRRK + GMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLGKKRIPTLNDSRY + ALIEFSMNTPYRDIHSALNKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYTQVN + SSHVLKSKLFGERYKFMKKRAQYFLEQDLVHVIASDMHNLDGRPPHMAEAYDLVTQKYG + EAKAQELFVDNPRKIIMDQLI" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef100_Q4K1K8" + /gene="wzh" + gene 5215..5907 + /locus_tag="ILOCDJ_00030" + /gene="wzd" + CDS 5215..5907 + /db_xref="RefSeq:WP_000392514.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF28" + /db_xref="UniRef:UniRef100_Q4K1K7" + /db_xref="UniRef:UniRef50_Q54519" + /db_xref="UniRef:UniRef90_Q4K1K7" + /db_xref="UniprotKB:Q4K1K7" + /db_xref="UserProtein:wzd" + /product="""capsular polysaccharide biosynthesis protein + Wzd""" + /locus_tag="ILOCDJ_00030" + /protein_id="gnl|Bakta|ILOCDJ_00030" + /translation="MEEQNTLEIDVLQLFRSLWKRKLVILLVAIITSSVAFAYSTFVIK + PEFTSTTRIYVVNRDQGEKSGLTNQDLQAGTYLVKDYREIILSQDVLEEVVSDLKLDLT + PKGLANKIKVTVPVDTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDVTTLE + EARPATTPSSPNVRRNTLFGFLGGAVVTVIAVLLIELLDTRVKRPEDVEDVLQIPLLGL + VPDLDKMK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000392514.1" + /gene="wzd" + gene 5917..6606 + /locus_tag="ILOCDJ_00035" + /gene="wze" + CDS 5917..6606 + /db_xref="RefSeq:WP_001142531.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF29" + 
/db_xref="UniRef:UniRef100_Q4K1K6" + /db_xref="UniRef:UniRef50_Q54520" + /db_xref="UniRef:UniRef90_O84996" + /db_xref="UniprotKB:Q4K1K6" + /db_xref="UserProtein:wze" + /product="""tyrosine-protein kinase Wze""" + /locus_tag="ILOCDJ_00035" + /protein_id="gnl|Bakta|ILOCDJ_00035" + /translation="MPTLEISQAKLDFVKKAEEYYNALCTNLQLSGDGLKVFSITSVKL + GEGKSTTSTNIAWAFARAGYKTLLIDGDIRNSVMLGVFKARDKITGLTEFLSGTTDLSQ + GLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVIDAA + IITRKCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGVVLNKFDTSVDKYGSYGNYG + DYGKNKK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_001142531.1" + /gene="wze" + gene 6621..7988 + /locus_tag="ILOCDJ_00040" + /gene="wchA" + CDS 6621..7988 + /db_xref="RefSeq:WP_203520214.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0010E58AE0" + /db_xref="UniRef:UniRef100_UPI0010E58AE0" + /db_xref="UniRef:UniRef50_Q8VU30" + /db_xref="UniRef:UniRef90_Q8VU30" + /db_xref="UniprotKB:Q4K1R0" + /db_xref="UserProtein:wchA" + /product="""undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)""" + /locus_tag="ILOCDJ_00040" + /protein_id="gnl|Bakta|ILOCDJ_00040" + /translation="MNGKIVKSSLAIIQSFLVILLTYLLSAVREAEIVSTTAIALYILH + YFVFYISDYGQDFFKRGYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYFLT + LHALLVYVLNLFIKWYWKRTYPNFKGSKKILLLTATSRVEKVLDRLIESNEVVGKLVAV + SVLDKPDFQHDCLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMGIDVT + VNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHVIAKRIIDIVGALVGLILCGLAS + IVLVPLIRKDGGSTIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTMQGGMFK + VDDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPEQKRRLSF + KPGITGLWQVSGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVFMRDGAK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_203520214.1" + /gene="wchA" + gene 7992..8441 + /locus_tag="ILOCDJ_00045" + /gene="wchJ" + CDS 7992..8441 + /db_xref="GO:0016740" + 
/db_xref="RefSeq:WP_000686638.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF2B" + /db_xref="UniRef:UniRef100_Q4K1K4" + /db_xref="UniRef:UniRef50_J9W567" + /db_xref="UniRef:UniRef90_Q4K1M2" + /db_xref="UniprotKB:Q4K1K4" + /db_xref="UserProtein:wchJ" + /product="""putative glycosyl transferase enhancer""" + /locus_tag="ILOCDJ_00045" + /protein_id="gnl|Bakta|ILOCDJ_00045" + /translation="MKICLVGSSGGHLTHLYLLKPFWKDKERFWVTFDKADARSVLSEE + VVYPCYYPTNRNIKNLIKNTFLAYKILKKERPDLIISSGAAIAVPFFYIGKLFGSKTVY + IEVFDRIDASTLTGKLVYPVTDRFIVQWEEMKKVYPKAINLGGIF" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000686638.1" + /gene="wchJ" + gene 8441..8947 + /locus_tag="ILOCDJ_00050" + /gene="wchK" + CDS 8441..8947 + /db_xref="KEGG:K25904" + /db_xref="RefSeq:WP_000578432.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF2C" + /db_xref="UniRef:UniRef100_Q4K1K3" + /db_xref="UniRef:UniRef50_Q9AQJ2" + /db_xref="UniRef:UniRef90_Q4K1K3" + /db_xref="UniprotKB:Q4K1K3" + /db_xref="UserProtein:wchK" + /product="""putative glycosyl transferase""" + /locus_tag="ILOCDJ_00050" + /protein_id="gnl|Bakta|ILOCDJ_00050" + /translation="MIFVTVGTHEQQFNRLIKEVDRLKGEGFIQDDVFIQTGYSNYVPK + FCKWEKLISYEKMNQFIEEADTIITHGGPATFMAVIAKGKSPIIVPRLKKFGEHVNDHQ + LEFVEKVLNVYNLTVITNISDLNSYISNFDERKKSDLKSKNNLFMEKFIDMINQLMETG + DIKYD" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000578432.1" + /gene="wchK" + gene 8940..10139 + /locus_tag="ILOCDJ_00055" + /gene="wzy" + CDS 8940..10139 + /db_xref="RefSeq:WP_050102558.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0005E97811" + /db_xref="UniRef:UniRef100_UPI0005E97811" + /db_xref="UniRef:UniRef50_E0Q2S4" + /db_xref="UniRef:UniRef90_Q4K1K2" + /db_xref="UniprotKB:Q4K1Q7" + /db_xref="UserProtein:wzy" + /product="""oligosaccharide repeat unit polymerase Wzy""" + /locus_tag="ILOCDJ_00055" + 
/protein_id="gnl|Bakta|ILOCDJ_00055" + /translation="MTKYINSCIKLLFIYSLFSELLYSYYSVSLLFTIPDLLLLAAAVI + AFVDSYSAGKIRVKNPHISLMLFFILLIFLLISFTWGTLNIYGFVMRGRYILGAFLVYF + MTNSYLDDRTFSSLINIAYFMQILNLLLVLHQNIVLHLHPDFTNGIFGFTNYANGIQGF + YCLALSVLSTVYYLYGKWGTMKSLILIAISCIICALAEIKIFFVIFIFSIILIFIFQKS + ETVKKIRIISTAAGISLLFLIAYKLIEIVLPDNLYTFFNVTKALSYENRTEFAGRTNTI + SFLWDNLFYHDYISAIFGKGLGSYSVNYIYELGKMLADGGFISVILLYSFLLSLFIRGT + ITRGKNKQSERLIVSIIAFVVMISIIVWNSTFTRSTYLVFFFLAIGNAAYKSTKLIRRD + " + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050102558.1" + /gene="wzy" + gene 10141..11169 + /locus_tag="ILOCDJ_00060" + /gene="wchL" + CDS 10141..11169 + /db_xref="RefSeq:WP_000405438.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF2E" + /db_xref="UniRef:UniRef100_Q4K1K1" + /db_xref="UniRef:UniRef50_Q4K1K1" + /db_xref="UniRef:UniRef90_Q4K1K1" + /db_xref="UniprotKB:Q4K1K1" + /db_xref="UserProtein:wchL" + /product="""putative glycosyl transferase""" + /locus_tag="ILOCDJ_00060" + /protein_id="gnl|Bakta|ILOCDJ_00060" + /translation="MEIQISVVIPVYNAENTINNCIESALKQDLESFEVILVNDGSNDS + TSRILEQYSDNPQVKIFHQVNMGVSAARNLGLSHASGEYVFFLDSDDILDDGMLSKMYQ + FVKNNKVDLLSCWHKEPATTQYGGNENKSTSFIARTREEIGAHFVDIFPRSACAKLFFR + KIIEENNITFSTEMSLGEDMSFVYQYLMVSKSIGVIDGVYYNIQNVNPQSLSKRYVQNI + ENSLMIQNQLWNQLLEVYPKIEENYYKQHMDFRFYLANLYVNNLFKFDSPYSSKEKLDQ + IAQQLKKYRLFLDEKVSKEKMPKNINEMIVFYLLKLKIPVLIYSFYSFKEWWKRRKIKN + EG" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000405438.1" + /gene="wchL" + gene 11177..12133 + /locus_tag="ILOCDJ_00065" + /gene="wchM" + CDS 11177..12133 + /db_xref="RefSeq:WP_000389755.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000254D331" + /db_xref="UniRef:UniRef100_A0A9Q9R705" + /db_xref="UniRef:UniRef50_E0Q2S2" + /db_xref="UniRef:UniRef90_A0A4J2AN51" + /db_xref="UniprotKB:Q4K1Q5" + /db_xref="UserProtein:wchM" + 
/product="""putative glycosyl transferase""" + /locus_tag="ILOCDJ_00065" + /protein_id="gnl|Bakta|ILOCDJ_00065" + /translation="MEDLISIVVPVYNVEKYLKKSIESVLNQTYQNIEILLVDDGSTDS + SGKICESFSKVDPRIRVFHKENGGLSDARNFGIEQMKGQYVAFIDSDDYISKDYVWKLY + SSIKNNDSEVSICSFLLVDEKGEKIKDELLDSGKICLTGQQILEKVLTADGYRYVVAWN + KLYRSTLFEKLKFKKGMLYEDEFLNYPLFWDCKRVSIVEEPLYLYVQRKGSIVQSNMTL + EKIKMKDEMHTSRIEFYSEKGHSFLHEKACQQYCNWIVTATTNHSKILNPNFSKYLQRQ + FRKFAKYTRNNDIRLIVQNILGFIDIRLAAYVKSKVM" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000389755.1" + /gene="wchM" + gene 12149..13057 + /locus_tag="ILOCDJ_00070" + /gene="wchN" + CDS 12149..13057 + /db_xref="RefSeq:WP_000570495.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF30" + /db_xref="UniRef:UniRef100_Q4K1J9" + /db_xref="UniRef:UniRef50_B2ILQ2" + /db_xref="UniRef:UniRef90_Q6X853" + /db_xref="UniprotKB:Q4K1J9" + /db_xref="UserProtein:wchN" + /product="""putative glycosyl transferase""" + /locus_tag="ILOCDJ_00070" + /protein_id="gnl|Bakta|ILOCDJ_00070" + /translation="MIEKILDSIKNHSFYSKLKDKIHRIIPLYIIKNQNIAFQQDTDIA + YRKLKKKFRHISLTGDELKYKMEFSNKVWICWFQGEEHAPELIKTCIQSMRNQLQGREI + IVLTEKNISDYTEIPGYIIEKYKKGWISRAHYSDILRIDLLCRHGGLWVDATVLNTGGD + FSNLEVPLFVYKSLNLSRKDSQAIVASSWLISSYSNHPILLYTRKLLWAYWRRKNSLCN + YFLFHICFTIATERYPIEWSAVPTFNNHSPHILHFELNEQFSEKRWEQLKHISAFHKLN + HHIDYSSGVNTFYKFIVSSKV" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000570495.1" + /gene="wchN" + gene 13062..14525 + /locus_tag="ILOCDJ_00075" + /gene="wzx" + CDS 13062..14525 + /db_xref="RefSeq:WP_000066240.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000230F834" + /db_xref="UniRef:UniRef100_A0A0I6TSP5" + /db_xref="UniRef:UniRef50_O07342" + /db_xref="UniRef:UniRef90_Q6X852" + /db_xref="UniprotKB:Q4K1J8" + /db_xref="UserProtein:wzx" + /product="""flippase Wzx""" + /locus_tag="ILOCDJ_00075" + 
/protein_id="gnl|Bakta|ILOCDJ_00075" + /translation="MSNKISKNLAYNMGYQLIGIAAPLITSPYLSRILGAENLGIHSFT + MSVALYFMMFMLLGIANYGNRTIATVKREGKDILSKTFWSIYSIQLIMSILVTIAYLAY + LYLGAVHYKVIAILQLFLLLSNAVDITWFFYGLENFKQIVFRNTLVKLLGLFLIFLCVR + QGTDLWKYTFINGSVTLVGQLLLWGQLKGILTWKKIQLKELLPHIKPILILFIPVLAIS + IFTNMDKYMLGLMVDVKQVGFYDNAGRIIEIPKALIAALGAVMLPRTSYLLAEGQKEKS + KYYIEVTILYVMIISSVLMFGLISVSDIFSIIFWGEEFLESGRLISAMSPAFVFSVLGN + IIRTQYLIPRAKDKDYVVSLIAGAVVNLVLNYFFIKPFGAMGATVSTVLAEFVLSGMQF + WSVRRDLDLKRYLKNGLIFYLFGLIMHLIIIALKTQLPYNIMSLILLIVLGGIVYVIFC + CCYILMSRNLHFKLLKEKIIRKVVHKNTL" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000066240.1" + /gene="wzx" + gene 14891..15868 + /locus_tag="ILOCDJ_00080" + CDS 14891..15868 + /db_xref="RefSeq:WP_000256585.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI00001D8FD3" + /db_xref="UniRef:UniRef100_Q6X851" + /db_xref="UniRef:UniRef50_E0Q2R6" + /db_xref="UniRef:UniRef90_Q6X851" + /product="Putative O-acetyltransferase" + /locus_tag="ILOCDJ_00080" + /protein_id="gnl|Bakta|ILOCDJ_00080" + /translation="MVTKDKGLTYNSTLHAIKVLACFSVVAIHIWLPGKIGAFYQIIAR + FAVPMFFLISGFYSYNISKNKIQNRIKKIFRLILRSTFFYVIIFVWMFWREGNMQFIFQ + NFNLTNIIRFVIFNRISDLIGYLATPLWYLFAILYIYIYLYFSNKRLLLTKRWISILLL + FSFIMEATISDSIFYRNFLFMGIPFFGIGILIAQKQKKIINCKIINKILILGTIIYPIL + IFLEYYILGNSFEIYISSVLATIILMIFAIKSPKAINIKILNEIGDKYATFVYIIHQFI + IVIFKFLVSNVYILKFGTIFVFLICCFLGVLFQFIKNRLLKRFS" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000256585.1" + gene 15870..17018 + /locus_tag="ILOCDJ_00085" + /gene="wchX" + CDS 15870..17018 + /db_xref="RefSeq:WP_000261152.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000230F835" + /db_xref="UniRef:UniRef100_A0A0I6WHZ7" + /db_xref="UniRef:UniRef50_Q9R922" + /db_xref="UniRef:UniRef90_A0A4J2AK78" + /db_xref="UniprotKB:Q4K1Q2" + /db_xref="UserProtein:wchX" + /product="""putative glycerol 
phosphotransferase""" + /locus_tag="ILOCDJ_00085" + /protein_id="gnl|Bakta|ILOCDJ_00085" + /translation="MVVLQNVKFLVRVVFMVIISIVLWPVRIKKNKILFINFNGKGYGD + NPKSICEYLRVTYPELDLVWLTKDNEDFPDGVRVVRYKSLQSFYEQASSKVWVYNVRNF + ERLLKKRGQFYIQTWHGASSFKLIEKQADLPLKYILEAKYDARVTDIMISDSRKQTEEF + QKYFWYSGEIFEVGMPRNDALFHYKEDYDKLNNIRKKLSIDSDDYVILYAPTFRDDGDA + SYLDINFERLLQSIEQEIKKKCKILIRLHPNDSHFSNNISFNHDIIDVTLFSDMQELIL + LADVLLTDYSSAIFDFMLLNKPYVRYVNDLEKYAELRGVSDTYYELPDSIIKTAEELYD + LLPKKIENFDYDSIKKYRNEILCPIFNGTASENVGRRIIQEL" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000261152.1" + /gene="wchX" + gene 17054..18082 + /locus_tag="ILOCDJ_00090" + /gene="gtp1" + CDS 17054..18082 + /db_xref="RefSeq:WP_000794265.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI00001D8FD5" + /db_xref="UniRef:UniRef100_Q6X849" + /db_xref="UniRef:UniRef50_Q9R921" + /db_xref="UniRef:UniRef90_Q9R921" + /db_xref="UniprotKB:Q4K1Q1" + /db_xref="UserProtein:gtp1" + /product="""putative glycerol-2-phosphate dehydrogenase""" + /locus_tag="ILOCDJ_00090" + /protein_id="gnl|Bakta|ILOCDJ_00090" + /translation="MKNNDLKIGSGAIHQISATLSQNNISGKILYCADPVVDDLYGSIV + RSQIEEIGRVKEESCNYNTIAYAMNIAERAIATDIDCIVGMGGGRVLDVCKYASFISKR + PYLSIPTTAANDGIASPVAVLKRQDDRPKSLGAAIPSMTLIDIDVIASGPIQNIKAGIG + DTISNYTALKDWELAVERGKDEMHGFAYLMSQNSLDALMKTKYNSITPDFIEVLVNSLV + LSGIAMDFAGSSRPVSGSEHLFSHALDYYGSTRNLHGIQVALGTVAVLKLIENSVDTVV + DYLQRFEVHINPKLLGIDEELFIYCMQHATKMRSNRYTYLHEVDLSTDRLKQIYKELIS + EL" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000794265.1" + /gene="gtp1" + gene 18098..18802 + /locus_tag="ILOCDJ_00095" + /gene="gtp2" + CDS 18098..18802 + /db_xref="RefSeq:WP_000645462.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI00000B4F25" + /db_xref="UniRef:UniRef100_O85005" + /db_xref="UniRef:UniRef50_O85005" + /db_xref="UniRef:UniRef90_O85005" + /db_xref="UniprotKB:Q4K1J4" + 
/db_xref="UserProtein:gtp2" + /product="""putative nucleotidyl transferase""" + /locus_tag="ILOCDJ_00095" + /protein_id="gnl|Bakta|ILOCDJ_00095" + /translation="MKALILAAGLGTRLAPITNEVPKSLVPVNGKPILMKQIENLYQNN + ITDITIIAGYKSSVLTDAVTEKYPEINIIDNVDFKTTNNMYSAYLGKAAMGDSDFLMMN + ADVFYDASVIKSLLLHKAPNAIVTDLGIYIEESMKVVEKNGRLVEISKQISPEETLGAS + IDVYKFSYEAGARFFEKCKEFIEDKRELQMWSEVALNAILSEVEFVACPLEGRWLEIDN + HEDLVAAEKLFA" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000645462.1" + /gene="gtp2" + gene 18823..19650 + /locus_tag="ILOCDJ_00100" + /gene="gtp3" + CDS 18823..19650 + /db_xref="SO:0001217" + /db_xref="UniRef:UniRef50_Q4K1N0" + /db_xref="UniRef:UniRef90_Q4K1N0" + /db_xref="UniprotKB:Q4K1N0" + /db_xref="UserProtein:gtp3" + /product="""putative phosphotransferase""" + /locus_tag="ILOCDJ_00100" + /protein_id="gnl|Bakta|ILOCDJ_00100" + /translation="MTNRVDYFGADISELQNKKLFLFDMDGTIYEEDRLFEGTLELLDY + IHNIGGEYIFITNNSSKSVVDYVEKVNRLGIKAERDNFFTSAQATIVYIKENYPKSKVY + CQGTKSLIKELSDAGIDVTEQVSADIDVVLVGFDTELTSDKIRNTCEILSTKDVPFIAT + NPDIRCPVSFGFIPDCGSICDMISKSVDRKPVYIGKPEPTMVDIVRKKLNYSLFETVVI + GDRLYTDIMTGINAGVTSVCVLTGEATVNDIQQGSIKPTYTFKNVKEMWKGIV" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef90_Q4K1N0" + /gene="gtp3" + gene complement(19739..20128) + /locus_tag="ILOCDJ_00105" + /gene="tnp" + CDS complement(19739..20128) + /db_xref="SO:0001217" + /db_xref="UniRef:UniRef50_A0A4N9BSH4" + /db_xref="UniRef:UniRef90_A0A4M3K117" + /product="IS5 family transposase ORF B" + /locus_tag="ILOCDJ_00105" + /protein_id="gnl|Bakta|ILOCDJ_00105" + /translation="MKAQAIVTSQGRIVSLDIAVNYCHDIKLFKMSRRNIGQAGKILAD + SGYQGLMKIYPQAQTPRKSSKLKPLTVEDKACNHALSKERSKVENIFAKVKTFKMFSTT + YRNHRKRFGLRMNLIAAIINHELGF" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA + 
sequence:UniRef:UniRef90_A0A4M3K117" + /gene="tnp" +ORIGIN + 1 atgcaagaaa aatggtggca taatgccgta gtctatcaag tctatccaaa gagttttatg + 61 gatagtaatg gagatggaat tggcgatttg ccaggaatta ccagtaagtt ggactatcta + 121 gccaagctag gaatcacagc aatttggctt tctcccgttt atgacagccc tatggatgat + 181 aatggctacg atattgctga ttatcaagcg attgcggcta tttttggaac catggaggac + 241 atggatcagc tgattgcaga agctaagaag cgtgatatcc gtatcatcat ggacttggtg + 301 gtcaatcata cctcggatga gcatgcctgg tttgtagagg cctgtgaaaa tcctaatagc + 361 cctgagcgag actactatat ctggcgggat gagcctaacg atttagattc tatctttagt + 421 gggtctgctt gggaatacga tgaaaagtca ggtcaatact atctccactt tttcagcaag + 481 aaacagccgg atctcaactg ggaaaatgaa aaacttcgcc agaaaattta tgagatgatg + 541 aacttctgga ttgataaggg tattggtggt ttccgtatgg atgttattga catgattggc + 601 aaaattcctg acgagaaggt agtcaataat ggtcctatgc tccatcccta tctcaaggaa + 661 atgaatcagg cgacctttgg agataaggat ctcttgacag taggggagac ttggggagca + 721 acgccagaga ttgccaagct ctactctgat ccaaaggggc aagaattgtc tatggtcttc + 781 cagtttgaac atatcggtct tcagtatcag gaaggtcagc ctaaatggca ctatcaaaaa + 841 gagctgaata tcgctaagtt aaaagaaatc ttcaacaaat ggcagacaga gttaggagtt + 901 gaggacggct ggaattccct cttctggaac aaccatgacc tccctcgtat tgtctcaatc + 961 tggggaaatg accaagaata ccgcgaaaaa tctgccaaag cctttgcaat cttgcttcat + 1021 cttatgagag gaactcctta tatctaccaa ggtgaggaga ttgggatgac caactatccg + 1081 tttgaaacac tggatcaagt agaagatatt gaatctctca actatgcgcg tgaggctctt + 1141 gaaaaaggtg ttccgattga agaaatcatg gacagtatcc gtgttattgg acgtgacaat + 1201 gcccgtaccc ctatgcaatg ggacgagagc aaaaacgctg gtttctcaac aggtcaacct + 1261 tggttggcgg ttaatccaaa ttacgagatg atcaatgtcc aagaagcgct ggcaaatcca + 1321 gattctattt tctataccta tcagaaactg gtccaaattc gcaaggagaa tagctggcta + 1381 gttcgagctg actttgaatt gcttgatacg gctgataagg tctttgctta tatacgtaag + 1441 gatggcgacc gtcgcttcct agttgtggct aacttgtcca atgaagagca agacttgaca + 1501 gtagaaggaa aagtcaaatc tgtcttgatt gaaaacaccc tagctcaaga agtctttgaa + 1561 aaacaaatct tagttccatg ggatgctttc tgtgtggaat tactataaat 
attttttgca + 1621 gaaaaattta aaattgaaat cgtataaaaa caagggagga ctgtataaaa gacagaaatc + 1681 ctttgttttt tataaccaag gtttataaac tttcattctc gaaattcaat taactttaca + 1741 aattcccact attaaggaga aagaaaatga acataaagaa gcgtgtcctt agtgcaggtc + 1801 tgacttttgc atctgctttg cttttagctg cttgcgacca atcaggttca gatacaaaaa + 1861 cttactcatc aacctttagt ggaaatccaa ctacatttaa ttacctgtta gactattacg + 1921 ttgataatat agtcaattga aacaagagca ggacaaaaaa gcctcgtaaa aggtattgca + 1981 acttggtaat acctttttga ggtgcttttt gatatgagcc catgttttct caataggatt + 2041 gtactcaggt gagtagggag gaagaggtaa aagtttatgt ccaaactctt cacacaagag + 2101 ttctaactta cccattctat ggaatcttgc attatccata ataataaccg atggtgtggt + 2161 taatgttggt aagagaaatt tctgaaacta agcttcaaaa aagtcgctcg tcaccatctc + 2221 ttcgtaagtc attggagcga ttaactcacc atttgttaga cctgcaacca aagaaatcct + 2281 ctgatatctt cttccagata ctttgcctct tcttaactga ccttttaatg agcgaccata + 2341 ttctcgataa aaataagtat cgaatcctgt ttcgtcaatc taaacaggtg ctaggtgctt + 2401 taaactatta aaattcttaa gaaataaggc tactttttct gcctcttgtt catagtaggt + 2461 gtggttcttt ttttcgagtg tagcccatag ctttgagcgc atagtggatg gtagttggat + 2521 gacagctaaa ttcagaagct atttcagtca aataagcgtc tggattgtca gtaagatagt + 2581 ttttaagtct atctctatca acctttcttg gttttgttcc ttttacttgg tggtttagct + 2641 ctcctgtttt ctcttttagc tttaaccagc cataaatggt attacgtgag atttggaaaa + 2701 cgtgtgatgc ttctgttata ctacctgttc gctcacaata agagagaact tttttacgaa + 2761 aatctattga atatgccata aaaagattat gccacattgt gtactatagt agattgaaac + 2821 tagaatagta cacctctgct tctaaaaaat ttttagaaat cgatttaact gccctgatcg + 2881 atttgtcatg ttcttatttc attttactat atttttgttt cgcgggaagt ctactaagat + 2941 acttaaagat gcagatagta aaaaaatgta gacattaccg taaaaaagtg atataatcgt + 3001 atgatgttca aggtataggt gttaatcatg agtagacgtt ttaaaaaatc acgttcacag + 3061 aaagtgaagc gaagtgttaa tatcgttttg ctgactattt atttattgtt agtttgtttt + 3121 ttattgttct taatctttaa gtacaatatc cttgctttta gatatcttaa cctagtggta + 3181 actgcgttag tcctactagt tgccttggta gggctactct tgattatcta taaaaaagct + 3241 gaaaagttta 
ctatttttct gttggtgttc tctatccttg tcagctctgt gtcgctcttt + 3301 gcagtacagc agtttgttgg actgaccaat cgtttaaatg cgacttctaa ttactcagaa + 3361 tattcaatca gtgtcgctgt tttagcagat agtgatatcg aaaatgttac gcaactgacg + 3421 agtgtgacag caccgactgg gactgataat gaaaatattc aaaaactact agctgatatt + 3481 aagtcaagtc agaataccga tttgacggtc gaccagagtt cgtcttactt ggcagcttac + 3541 aagagtttga ttgcagggga gactaaggcc attgtcttaa atagtgtctt tgaaaatatc + 3601 atcgagtcag agtatccaga ctacgcatcg aagataaaaa agatttatac caagggattc + 3661 actaaaaaag tagaagctcc taagacgtct aagaatcagt ctttcaatat ctatgttagt + 3721 ggaattgaca cctatggtcc tattagttcg gtgtcgcgat cagatgtcaa tatcctgatg + 3781 actgtcaatc gagataccaa gaaaatcctc ttgaccacaa cgccacgtga tgcctatgta + 3841 ccaatcgcag atggtggaaa taatcaaaaa gataaattaa cccatgcggg catttatgga + 3901 gttgattcgt ccattcacac cttagaaaat ctctatggag tggatatcaa ttactatgtg + 3961 cgattgaact tcacttcttt cttgaaaatg attgacttat tgggaggggt agatgttcat + 4021 aatgatcaag agttttcagc tctacatggg aagttccatt tcccagtagg gaatgtccat + 4081 ctagactctg agcaggctct aggttttgta cgtgaacgct actcactagc cgatggagac + 4141 cgtgaccgtg gtcgcaacca acaaaaggtc attgtagcaa ttattcagaa gttaacttct + 4201 acagaggttt tgaaaaacta tagtagtatt cttcaaggat tgcaggattc tcttcaaaca + 4261 aatatgccga ttgagactat gatagattta gtgaatactc agttggagag tggagggaat + 4321 tataaagtaa attcgcaaga cttgaaaggt acaggtcgga tggatcttcc ttcttatgca + 4381 atgccagaca gtaacctcta tgtgatggaa atagatgata gtagtttagc tgtagttaaa + 4441 gcagctatac aggatgtgat ggagggtaga tgaaatgata gacatccatt cgcatatcgt + 4501 ttttgatgta gatgacggtc ccaagtcaag agaggaaagc aaggctctct tggcagaagc + 4561 ctacagacag ggggtgcgaa ccattgtctc tacctctcac cgtcgcaagg gcatgtttga + 4621 aactccggaa gagaagatag cagaaaactt tcttcaggtt cgggaaatag ctaaggaagt + 4681 ggcgagtgac ttagtcattg cttacggggc tgaaatttac tacacaccag atgttctgga + 4741 taagctggga aaaaagcgga ttccgaccct caatgatagt cgttatgcct tgatagagtt + 4801 tagtatgaac actccttatc gcgatattca tagcgccttg aacaagatct tgatgttggg + 4861 aattactcca gtcattgccc acattgagcg 
ctatgatgct cttgaaaata atgaaaaacg + 4921 cgttcgagaa ttgatcgata tgggctgtta cacgcaagta aatagttcac atgtcctcaa + 4981 atccaaactt tttggcgaac gttataaatt catgaaaaaa agagctcagt attttttaga + 5041 gcaggatttg gtccatgtca ttgcaagtga tatgcacaat ctagacggca gacctcctca + 5101 tatggcagaa gcatatgacc ttgttaccca aaaatacgga gaagcgaagg ctcaggaact + 5161 ttttgtagat aatcccagaa aaattataat ggatcaatta atttaggaga aaatatggag + 5221 gaacaaaaca ctttggaaat cgatgtattg caactattca gatctttgtg gaaaagaaag + 5281 ttggtcattt tattagtggc aattataact tcttcagttg cttttgccta cagtactttt + 5341 gttatcaaac ctgagtttac tagtacgact cggatttatg tagttaaccg tgatcaggga + 5401 gagaagtctg gtttaaccaa tcaagacttg caggcaggaa catacttggt taaagactat + 5461 cgtgaaatta tcctatcgca ggatgttttg gaggaagttg tttctgattt gaaactagat + 5521 ttgacgccaa aaggtttggc taataaaatt aaagtgacag taccagttga tacccgtatt + 5581 gtctcaatct ctgtcaagga taaacagcca gaggaagcca gtcgtatcgc taattctcta + 5641 cgagaagttg ctgcagaaaa gatcgtcgct gtaacgcgag tatctgatgt aacgacactt + 5701 gaagaagcgc gaccagctac gactccctct tctccaaatg ttcgacgcaa caccttgttt + 5761 ggttttcttg gaggagccgt cgtaacagta attgctgttc ttttgattga gttgctcgac + 5821 acccgtgtga aacgtcctga agatgttgaa gatgtactgc aaattccact tttagggctc + 5881 gttccagatt tggacaaaat gaaataggag gaagttatgc caacgttaga aatctcacag + 5941 gcaaaattgg attttgtaaa aaaggcagag gaatattata acgctttgtg cacgaaccta + 6001 cagttaagtg gagatggttt gaaagtattt tctatcactt ctgtgaaact aggagaagga + 6061 aaatcaacga cttccaccaa tatcgcttgg gcttttgcgc gtgcaggtta caaaacgctg + 6121 ctgattgatg gagatattcg caattctgtt atgttaggtg tctttaaagc aagggataag + 6181 attacaggcc tgacagaatt tttatcagga actacagacc tatcacaagg gctttgtgat + 6241 accaatatcg aaaatctctt tgtaattcag gctggctctg tgtcaccgaa tccgacagct + 6301 cttcttcaaa gtaagaattt cagtacaatg cttgaaacct tgcgtaaata ttttgactac + 6361 atcattgtag atactgctcc tgtcggtgtc gtgattgatg cggctattat tacgcgaaaa + 6421 tgcgatgctt ctattttagt gacggaggca ggtgaaataa atcgacggga tattcaaaaa + 6481 gcaaaagaac agttggaaca cacagggaag ccgtttttgg gagttgtgtt 
gaataaattc + 6541 gatacttcag tagacaaata cggttcttat ggaaattatg gagattacgg gaaaaataaa + 6601 aaataggtcg ggggatagag atgaatggaa aaatagtaaa gtcttcattg gccataatcc + 6661 agagttttct tgttatttta ttgacttatc tacttagtgc tgtgagagaa gcggagattg + 6721 tttcaacaac agctattgca ctttatatcc tccattattt tgtcttttat atcagtgatt + 6781 atggacagga tttctttaaa aggggatatt tgattgaact tgtccagaca ttgaaatata + 6841 tcctattctt tgcactagcg attagtattt ctaatttttt cttagaggat cgatttagta + 6901 tttccagacg aggcatgatt tacttcctca cattacatgc tctcttagtc tatgtgctaa + 6961 acctatttat caagtggtat tggaagcgga cttatcccaa ctttaaagga agtaagaaga + 7021 ttctcctact tacagcaact tctcgtgtcg aaaaggtact ggatagatta atagaatcaa + 7081 atgaggttgt tgggaagttg gtagccgtca gtgtcttaga taaaccagat tttcagcatg + 7141 attgtttaaa ggtagtagca gagggggaga tagtaaactt tgcgactcat gaggtggtcg + 7201 atgaagtctt tatcaatctt ccaagtgaaa aatacaatat tggagagctt gtctctcagt + 7261 ttgaaacgat gggaattgat gtaacagtca atctaaatgc ttttgatcgt agtttggcac + 7321 gtaacaagca aatccgtgag atggcaggat taaacgttgt gactttttct acaacatttt + 7381 ataagactag tcatgtaatt gctaagcgga ttattgatat cgtgggtgca ttggtagggc + 7441 tgatactatg tggtctagcc agtattgtac tggttccttt gattcgaaag gatgggggct + 7501 ctactatttt tgctcagacg cgtataggaa aaaatggtcg tcagttcact ttttataagt + 7561 ttcgctctat gtgtgtagat gccgaggcga aaaaaagaga actcatggaa caaaatacca + 7621 tgcagggtgg aatgtttaag gtggacgatg atcctcgtat cacgaaaatt ggtcgtttta + 7681 tacggaagac tagcttggac gagctaccac agttttataa tgttctaaag ggagatatga + 7741 gtttggttgg cacacggcca ccaacagtgg acgagtatga acactatacc ccagaacaaa + 7801 aacgtcggct aagttttaaa cctggtataa caggcttatg gcaggtcagt ggacgaagtg + 7861 agattaagaa ttttgatgaa gttgtcaaat tagatgtagc ctatatagac gattggacaa + 7921 tttggaaaga cattgaaatt ttattgaaga cagttaaagt tgtatttatg agagacggag + 7981 cgaagtagga aatgaaaata tgtttagttg gatctagtgg aggtcatctg actcatttat + 8041 atcttttaaa acctttctgg aaagataaag aaagattttg ggttactttt gataaggcgg + 8101 acgctcggag tgtactctct gaggaagttg tatatccctg ttattatcca accaatcgta + 8161 atataaaaaa 
tttaataaaa aatacttttc tcgcctataa aattttaaaa aaagagagac + 8221 cagatttgat tatttcttct ggtgccgcta tcgctgttcc tttcttttat attgggaagt + 8281 tatttggatc aaagacagtg tatatagaag tttttgatag aattgatgct tcaacactga + 8341 caggaaaact tgtttatcca gtaacggata ggtttattgt tcaatgggaa gaaatgaaaa + 8401 aagtataccc aaaggcaatt aatctcggag ggattttcta atgatttttg tgacagtagg + 8461 tactcatgaa caacagttta atcgacttat taaagaggtt gatagattaa aaggtgaggg + 8521 atttattcag gatgatgttt ttattcaaac aggatactct aattatgttc caaaattttg + 8581 taaatgggaa aaattaatat cttatgaaaa aatgaatcaa tttattgagg aagctgatac + 8641 aatcattacc catggcggtc cagctacgtt tatggcagtt attgctaaag ggaaaagtcc + 8701 gataattgtt ccgagattaa aaaaatttgg tgagcatgtg aacgaccatc aacttgaatt + 8761 tgttgagaaa gtgttaaatg tctataattt gacagtcatc actaacataa gtgatcttaa + 8821 ttcctatatt tctaattttg atgagcgaaa aaaatcagat ttgaagagca aaaataatct + 8881 atttatggag aaatttatag atatgattaa tcagttgatg gagacaggtg acatcaagta + 8941 tgactaagta cataaatagc tgtatcaagt tgttattcat atattcgtta tttagtgaat + 9001 tgctatactc atattattct gtatctctat tatttacgat acctgactta ttattgttgg + 9061 cagcagcagt aattgctttt gtagattctt attctgcagg gaaaataaga gttaaaaatc + 9121 ctcacattag tttaatgctc ttttttatat tgctgatatt tctattaatt agttttactt + 9181 ggggtactct taatatatat ggatttgtta tgagaggaag atatatactg ggagcatttc + 9241 tagtttattt tatgacaaat agctatctag atgatagaac cttttcatca ttgataaaca + 9301 ttgcttattt tatgcagata ttgaacctat tattagtttt acatcaaaat atagtattac + 9361 atttgcaccc tgacttcact aatgggattt ttggttttac taattatgca aatggaatcc + 9421 aaggatttta ttgcttagcc ttaagtgttt tatctactgt atattatctg tatggtaaat + 9481 ggggaacaat gaagtcatta atattgattg ctatttcgtg tataatttgt gcattagcag + 9541 aaataaagat tttttttgtc atttttatat tttctattat tctaattttt atatttcaaa + 9601 agtcagaaac agtaaaaaaa atacgaataa ttagtacagc tgctggaata tctcttcttt + 9661 ttttaattgc ctataaactc attgagatag ttttacctga taatttgtat acttttttta + 9721 atgttacaaa ggcattatca tatgagaata ggacagagtt tgcgggacga acaaatacta + 9781 tttccttcct atgggacaac ttattttatc 
atgattatat tagtgctata tttgggaaag + 9841 gactaggttc atactctgtt aattatattt atgaacttgg taaaatgctt gcagatggtg + 9901 gttttatttc agtgattttg ctttattcat ttttgttgtc attattcata cggggaacta + 9961 ttactagagg aaaaaataag caaagtgaaa gactaattgt atccatcata gcttttgtgg + 10021 tgatgattag cattattgtt tggaatagta cgttcactag atcaacttat cttgtatttt + 10081 tctttctagc aataggtaat gcagcgtata agtctactaa attaataaga agggattgag + 10141 atggaaattc aaatatcagt ggtgattcca gtatacaatg ctgaaaacac gattaataat + 10201 tgtattgaaa gtgctttaaa acaagattta gaatcttttg aagtaatttt agtaaacgat + 10261 ggatcgaacg attctacatc aagaattctt gaacagtata gtgataatcc ccaagtgaag + 10321 atatttcatc aagtgaacat gggagtatct gctgccagaa atttaggttt atctcatgca + 10381 agcggagaat acgtattctt tttagattca gatgatattt tagatgatgg tatgctttct + 10441 aaaatgtacc aatttgtaaa aaataataaa gttgatctct tatcttgttg gcataaagaa + 10501 cctgctacaa ctcaatacgg tggaaatgag aataagtcaa cttcatttat tgcacgtaca + 10561 agagaagaaa taggtgctca ttttgttgat atctttccga gaagtgcttg tgccaaattg + 10621 ttttttcgca aaataattga agaaaataat attacttttt cgactgagat gtcactaggt + 10681 gaagatatgt catttgtgta tcaatactta atggtttcta aaagtattgg agttattgac + 10741 ggggtgtatt ataatattca aaatgtaaat ccacagtcgt tatctaagcg ctatgtgcag + 10801 aatattgaaa attccctaat gattcagaac cagttatgga atcaactgtt ggaagtttat + 10861 cctaaaattg aggagaacta ctataagcaa catatggatt ttagatttta ccttgctaac + 10921 ttgtatgtaa ataatttatt taaatttgat tctccgtatt catcaaaaga aaaactagac + 10981 caaattgctc aacaattaaa aaagtataga ttatttttag atgaaaaagt cagcaaagaa + 11041 aagatgccta aaaatataaa tgagatgatt gttttttatt tactaaaatt gaaaattcca + 11101 gtgttgattt attcttttta ttcgtttaaa gagtggtgga agagaagaaa aattaaaaat + 11161 gaaggataaa taagttatgg aagatttgat aagcattgtt gttccagtct ataacgtgga + 11221 aaaatattta aaaaaatcaa tagaaagtgt tttgaatcag acttatcaaa atatcgagat + 11281 tttattggtt gatgacggaa gcacagatag tagtgggaaa atttgtgaat catttagtaa + 11341 agttgatcct aggataagag tatttcataa agaaaatggt ggtttatcag atgctcggaa + 11401 ttttggaatt gagcaaatga aaggtcaata 
tgtagcgttt attgatagcg atgactacat + 11461 atctaaggat tatgtctgga agttgtattc ttctataaaa aataatgatt ccgaggtgtc + 11521 gatttgttct tttttattag tcgatgaaaa aggggaaaaa ataaaagatg agctattaga + 11581 ttcgggaaaa atatgcttga ctggtcaaca aatattagaa aaagtattaa cagccgacgg + 11641 ctatcgctat gttgttgctt ggaataagct ttatcggtca actttatttg aaaaattaaa + 11701 atttaaaaaa ggaatgttgt atgaggatga atttcttaac tatcctctat tttgggactg + 11761 taaaagggta tcaattgtag aggagccgtt atatttatac gttcaacgaa aaggaagcat + 11821 tgtacaaagt aatatgactt tagaaaaaat aaagatgaag gatgagatgc atacttcacg + 11881 cattgagttt tattcagaaa aggggcattc ttttttgcac gaaaaagcgt gtcaacagta + 11941 ctgcaattgg attgttacag cgactaccaa tcatagtaag attttaaatc ctaatttttc + 12001 gaagtattta caacgacagt ttagaaagtt cgctaaatat acacgaaaca atgatattag + 12061 actaattgtg cagaacattc taggatttat agatattcgt ttagcagctt atgtaaaatc + 12121 aaaagtaatg tagagtatag gaaacataat gatagaaaaa attttagatt ctattaaaaa + 12181 tcattctttt tatagtaaat tgaaggataa aattcataga attattccat tatatattat + 12241 aaaaaatcaa aatatagctt ttcaacaaga taccgatata gcatatagaa aactaaagaa + 12301 gaagtttagg catatttcgt tgactggaga tgagcttaaa tataaaatgg agttttcaaa + 12361 taaagtttgg atttgttggt ttcagggaga agagcatgcc ccagagttaa ttaaaacatg + 12421 tattcaatca atgaggaatc aacttcaagg aagagaaatc attgtgttga cagaaaaaaa + 12481 tataagtgat tatacagaga ttccaggcta tattattgaa aaatacaaaa aaggatggat + 12541 ttctcgtgcg cattactctg atatccttag gatagatctt ctatgtcgcc atggaggatt + 12601 atgggtagat gcaacagtgt tgaatacagg aggagatttc tcaaatcttg aggtaccact + 12661 ttttgtatat aaatctttga atttatcaag aaaagattca caagctattg tagcatcaag + 12721 ttggttaatt tcgtcatata gtaatcatcc tatattactc tatacgagaa aactcctatg + 12781 ggcctattgg cgaagaaaaa atagtttatg taattatttt ttgttccata tatgttttac + 12841 aatagctaca gagcggtacc caatcgaatg gtctgctgtc cctactttta ataatcattc + 12901 tcctcatata cttcattttg agttgaatga acaattttcg gaaaaacggt gggaacaact + 12961 gaagcatatt tcggcgtttc ataaattaaa tcatcatata gattattcta gcggtgttaa + 13021 cactttttat aagttcatag tatcttcgaa 
agtttagaaa aatgagtaat aaaattagta + 13081 aaaatttagc ctacaatatg gggtatcagt taattgggat tgcagctccc ttgataactt + 13141 ctccttattt atcacggata ttaggtgctg aaaatttagg tattcattct tttactatgt + 13201 cggttgcact ttactttatg atgtttatgc ttcttggaat tgcaaattac ggaaatagaa + 13261 caattgcgac tgttaaacga gaaggaaagg atattctatc aaaaacgttt tggagtatct + 13321 actctatcca gttgataatg tctattctgg taactatagc ttatcttgct tatctatatt + 13381 tgggggcagt acattacaaa gttattgcaa tattacaact ctttttattg ttatcaaatg + 13441 ctgttgatat tacttggttt ttctatggat tagaaaattt taagcaaatc gtttttagga + 13501 atacattagt caaactttta ggattatttt taattttttt atgtgtgcgt caaggcacag + 13561 atttatggaa atacacattt ataaacggat cagtaacttt agttggccaa cttttactat + 13621 ggggacaatt aaaaggaata ttaacttgga aaaaaattca attaaaggaa ttactgcctc + 13681 atatcaagcc aattttaatt ctttttattc ctgtactagc cattagtatt tttactaata + 13741 tggataaata tatgcttggt ttaatggttg atgtaaagca ggttggattt tatgacaatg + 13801 caggtagaat tattgaaatt cctaaagctt tgattgcagc tttaggggcc gttatgttac + 13861 caagaacttc ctatttatta gcggaaggac agaaagaaaa gagtaaatac tacatagagg + 13921 taacaatttt atacgtgatg attatttcta gtgtattgat gtttgggcta atatcggtat + 13981 ctgatatttt ttccattata ttttggggag aagaatttct tgaatcaggt agattgattt + 14041 ctgctatgtc tccggctttt gtcttctctg tattaggaaa tatcattagg actcagtatt + 14101 tgattcctag agctaaggat aaagattatg tagtgtctct aattgcgggg gctgttgtta + 14161 atctagtgct aaactatttt tttataaaac cttttggtgc tatgggagca acagttagta + 14221 cagttttggc agaatttgta ttgtctggaa tgcagttttg gtcagtaaga agagacttag + 14281 atttaaaaag atatttgaaa aacggtttga tattctacct atttggtctg attatgcacc + 14341 tcattattat agcactcaaa actcagttac catacaatat aatgagtctt attttactaa + 14401 tagttttggg tggaatagta tatgttattt tttgttgttg ctatatttta atgtcaagaa + 14461 atttacattt taagttattg aaggaaaaga ttatacgaaa ggttgtacat aaaaatacat + 14521 tataaaatat tagtttatct tatttagttg gatactatta aataaacgaa agtatttgaa + 14581 actttggtaa ttgagattat agagattata gagataaact aagctatatt atagcttcat + 14641 tattaaagta agaatatcgg tgcagtgtag 
ttaacgaata atgtgagtac tcatttctta + 14701 gatggagcta ggggtcatta taagggattg atatgacatt ttgagtaagt tacagctaga + 14761 gtttaggttt gattatatca gatatttaga tgatttggaa aataataaaa taagttagga + 14821 actatttttt tattgttttg agtgacaggt ttgattttgg gaaatgtatt ttgttaaata + 14881 ggtaggaaag atggttacta aagataaagg attaacatat aatagtactt tgcatgcaat + 14941 aaaagtatta gcatgtttta gtgttgttgc tattcatata tggctaccag gaaaaattgg + 15001 agcgttttat caaataatag cacgatttgc agttccaatg ttctttttga tttctggctt + 15061 ttattcatat aatatttcaa agaataaaat acagaataga attaaaaaaa tatttagatt + 15121 gatattaaga agtacatttt tttatgtaat aatatttgta tggatgtttt ggagagaagg + 15181 taatatgcag tttatttttc aaaactttaa tttaacaaat attataagat ttgtgatttt + 15241 taataggatt tcagatttaa taggctatct agcaacaccg ttgtggtatt tatttgctat + 15301 attatatata tatatatatc tttatttttc caataaaaga ctactattga caaaacgatg + 15361 gatttctata cttttactat tttctttcat tatggaagct acaattagcg attcaatttt + 15421 ttatagaaat tttttattta tgggaatacc attttttgga ataggaattc ttattgcaca + 15481 gaagcaaaag aagattatta attgtaaaat aataaacaaa atattaatct tgggaacaat + 15541 tatctatcca atactaatat ttttagaata ttatatcttg ggtaattctt ttgagatcta + 15601 tataagttct gtgctagcaa ccataatatt gatgattttc gcgattaaat cacctaaagc + 15661 gattaatata aaaatactga atgaaattgg agataaatat gcgacttttg tttacattat + 15721 acaccagttt atcattgtga tatttaaatt tttagtatct aatgtttata ttctcaaatt + 15781 tgggacgata tttgtctttt tgatatgttg ttttctaggg gttctatttc aatttatcaa + 15841 aaacagacta ttaaaaaggt ttagttaaga tggttgtttt acaaaatgtt aaatttttag + 15901 taagagttgt ttttatggtt attatcagta tagtgttatg gcctgttcgg ataaagaaga + 15961 ataagatact atttattaat tttaatggta agggatatgg tgataatccg aaaagtattt + 16021 gtgagtatct tcgagttaca tatccagagt tagatttagt ttggcttaca aaagataatg + 16081 aagattttcc agatggagtg agagttgtaa gatataaatc tctacaatct ttttatgagc + 16141 aagctagttc gaaggtttgg gtttataatg taagaaattt tgaaagacta ctaaaaaaac + 16201 gcggacagtt ttatattcaa acttggcacg gtgcttctag ttttaaactg atagaaaagc + 16261 aggctgattt accattaaaa tatattttag 
aagcaaagta tgatgcaaga gtcacagata + 16321 taatgatttc agatagcaga aaacaaactg aagaatttca aaagtatttt tggtattcag + 16381 gagaaatttt tgaggtgggg atgccgagaa atgatgcctt gtttcactat aaggaagact + 16441 acgacaagtt aaataatatc agaaaaaaac taagcattga ttcagatgat tatgttattt + 16501 tatatgcccc tactttcaga gatgatgggg atgcatctta tttagatata aattttgaac + 16561 ggcttttgca aagtattgaa caagaaatta agaagaaatg taaaatttta attagattac + 16621 atcctaatga ctctcatttt agtaataata tttcttttaa tcatgacata attgatgtta + 16681 cgctattctc agatatgcag gaacttatat tattggcaga tgttttactg acagattatt + 16741 cttccgcgat atttgatttt atgcttttaa acaagcctta tgtcagatat gtgaatgatt + 16801 tagaaaaata tgctgagctt aggggggtat cagatacata ttatgaattg ccggattcta + 16861 ttattaaaac tgctgaagaa ttgtatgact tactgcctaa aaaaatagaa aattttgatt + 16921 atgattctat aaaaaaatat agaaatgaaa tactgtgtcc aatctttaat ggaaccgcta + 16981 gtgaaaatgt aggaaggaga ataattcaag agttgtgaag taaaacattg ggttattttt + 17041 aaggtaacga gatttgaaaa ataatgattt aaagatagga agtggagcta ttcatcaaat + 17101 ctccgctaca ctttctcaaa ataatatttc gggaaagatt ttatattgtg ctgatccagt + 17161 tgtcgatgac ttgtacggtt cgatagtacg ttcacaaata gaggaaattg gtcgggtaaa + 17221 ggaagaaagt tgcaattata atactattgc ttatgcgatg aatatagcag aaagggctat + 17281 tgccacagat attgactgta ttgtgggaat gggaggaggt cgtgttttag atgtctgcaa + 17341 gtatgcatct tttatttcga aacgtcctta cctatcgatt ccgacaacag cagcaaatga + 17401 tggcattgct tccccagttg ctgttttgaa aaggcaggat gatagaccaa aaagcttagg + 17461 ggcggctatc ccttcaatga cactaattga tattgatgtt attgcatcag gacctataca + 17521 aaatataaaa gctggtatcg gtgatacaat atccaattac actgcattga aagattggga + 17581 gttggcagtt gagcgaggga aagatgagat gcatggtttt gcatatctaa tgtcgcaaaa + 17641 ttctttagat gctttaatga aaacgaagta taattctatt acccctgatt ttattgaagt + 17701 tttggtaaac tctttagttt tatcaggcat tgcaatggat tttgcgggaa gtagtagacc + 17761 tgtcagtggg tcagagcact tatttagtca tgcattagat tactatggtt ctacaaggaa + 17821 tcttcatgga attcaggttg cattaggtac agtcgcagtt ttgaaattaa ttgaaaattc + 17881 tgttgatact gtagtggatt acttgcaaag 
atttgaggtt catattaacc cgaaactttt + 17941 ggggatagat gaagagttgt ttatttattg tatgcaacat gctacaaaaa tgagaagtaa + 18001 tcgctatacc tatctgcatg aagttgatct tagcacagat agattgaaac aaatatataa + 18061 ggaactcata agcgagttgt agaaaagaga ggaaaaaatg aaagcactta ttttagcagc + 18121 agggttagga acacgtctag ctccaattac caatgaggta ccaaaatctt tggtaccagt + 18181 caatggtaag ccaattttga tgaaacaaat tgaaaattta tatcaaaata atattacaga + 18241 tattacgatt attgctggat ataagtcatc tgtattaaca gatgcagtta ctgaaaagta + 18301 tccagaaatt aatattattg ataatgttga ttttaaaacg actaataata tgtattcagc + 18361 ctatctagga aaagctgcaa tgggtgatag tgacttctta atgatgaatg cagatgtatt + 18421 ttatgatgct tctgttatta aaagtctgtt gcttcataaa gctccaaatg caattgtaac + 18481 tgatttaggt atttatattg aagagtctat gaaagtcgta gaaaaaaatg gtcgtttagt + 18541 agaaatttct aaacagattt cacctgagga aactttagga gcttctattg atgtttataa + 18601 attctcttat gaagcaggtg ctcgattctt tgaaaagtgt aaggaattta ttgaagataa + 18661 acgagaactt caaatgtgga gtgaggttgc tcttaatgca attctttctg aagttgaatt + 18721 tgtagcatgt ccattagagg gtcgttggtt agaaattgat aatcatgaag acttagttgc + 18781 tgcagaaaaa ctatttgctt gaaccgaata cggagaatga aattgacaaa tagagttgat + 18841 tattttggtg ctgatattag tgaacttcag aataaaaaat tattcttatt tgatatggat + 18901 ggtaccattt atgaagaaga taggttgttt gagggtactc tcgaattatt agactatatt + 18961 cataatattg gcggtgagta tatttttatt acaaacaatt catctaagtc tgttgttgac + 19021 tatgttgaaa aagttaacag attaggtatt aaagctgaac gagataattt ttttacctct + 19081 gctcaagcca caattgttta tattaaagaa aattatccta aatctaaagt ttattgccaa + 19141 ggaacaaaat ctttgataaa agaactatct gacgcaggaa ttgatgtaac tgagcaagtt + 19201 agtgctgata tagatgttgt tcttgttggt tttgatacag aattaaccag tgataaaatt + 19261 cgcaatacct gcgagattct atcaacaaag gacgtacctt tcatagctac taaccctgat + 19321 attcgctgcc cagtatcgtt tggattcatc ccagattgtg gttctatttg tgatatgatt + 19381 agtaaatcag tcgataggaa acctgtttac ataggtaaac ctgaacctac gatggttgat + 19441 attgttcgaa aaaaattaaa ttattctcta tttgaaacag ttgtgattgg agatcgcttg + 19501 tatacggata tcatgactgg tataaatgca 
ggagtaactt cagtttgtgt gctgacagga + 19561 gaagcaacgg tgaatgatat tcaacaaggt agtataaaac cgacttatac atttaaaaac + 19621 gtgaaagaaa tgtggaaagg aattgtctga ttttttcatt ctgaatagtg aattcatgaa + 19681 tactgtcaaa atactcgtat gtatttaaat tgattttatt attagacttc ctgcaaaact + 19741 agaatcctag ttcatgattg ataatagcag caatcaaatt cattcgtaat ccgaagcgtt + 19801 tacgatgatt tcgataggtt gttgaaaaca ttttaaacgt ttttactttg gcaaagatgt + 19861 tctcaacctt gcttctctcc ttggatagcg catggttaca ggctttatct tcaactgtta + 19921 gcggtttgag tttgctggat ttacgtggag tttgtgcttg aggatatatc ttcatgagcc + 19981 cttgataacc actgtcagcc aagattttac cagcttgtcc gatatttctg cgactcattt + 20041 tgaacaactt tatatcatga caatagttca cagcgatatc caaagaaaca attctccctt + 20101 gacttgtgac aatcgcttga gccttcat +// diff --git a/public/res/serotype_genbank/serotype_15F.gb b/public/res/serotype_genbank/serotype_15F.gb new file mode 100644 index 0000000..55d1d79 --- /dev/null +++ b/public/res/serotype_genbank/serotype_15F.gb @@ -0,0 +1,1004 @@ +LOCUS CR931666 22405 bp DNA linear UNK 10-JUN-2024 +DEFINITION CR931666, whole genome shotgun sequence. +ACCESSION CR931666 +VERSION CR931666 +KEYWORDS . +SOURCE None + ORGANISM . + . 
+COMMENT Annotated with Bakta + Software: v1.9.3 + Database: v5.1, full + DOI: 10.1099/mgen.0.000685 + URL: github.com/oschwengers/bakta + + ##Genome Annotation Summary:## + Annotation Date :: 06/10/2024, 18:50:26 + CDSs :: 24 + tRNAs :: 0 + tmRNAs :: 0 + rRNAs :: 0 + ncRNAs :: 0 + regulatory ncRNAs :: 0 + CRISPR Arrays :: 0 + oriCs/oriVs :: 0 + oriTs :: 0 + gaps :: 0 + pseudogenes :: 0 +FEATURES Location/Qualifiers + source 1..22405 + /mol_type="genomic DNA" + gene 293..466 + /locus_tag="FPBPHK_00005" + CDS 293..466 + /db_xref="RefSeq:WP_001022228.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI00000E4685" + /db_xref="UniRef:UniRef100_A0A0H2ZQL8" + /db_xref="UniRef:UniRef50_A0A0H2ZQL8" + /db_xref="UniRef:UniRef90_A0A0H2ZQL8" + /product="Lipoprotein" + /locus_tag="FPBPHK_00005" + /protein_id="gnl|Bakta|FPBPHK_00005" + /translation="MNIKKRVLSAGLTFASALLLAACGQSGSDTKTYSSTFSGNPTTFN + YLLDYYADNIVN" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_001022228.1" + gene complement(434..796) + /locus_tag="FPBPHK_00010" + CDS complement(434..796) + /db_xref="SO:0001217" + /db_xref="UniRef:UniRef50_A0A0H2UQ11" + /product="IS630-Spn1, transposase Orf2" + /locus_tag="FPBPHK_00010" + /protein_id="gnl|Bakta|FPBPHK_00010" + /translation="MVAGLINGELIVPMTYEETMTSDFFEVWFQKFLLPTLTTPSVIIM + DNARFHRMGKLELLCEKFGINFYLFLPTHLSTILLRKHGLISKSTSKRYYQVAIPFMRL + FCLVLVSIDYIISVIV" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA + sequence:UniRef:UniRef50_A0A0H2UQ11" + gene complement(975..1322) + /locus_tag="FPBPHK_00015" + CDS complement(975..1322) + /db_xref="SO:0001217" + /db_xref="UniRef:UniRef50_A0A7G1IQ53" + /db_xref="UniRef:UniRef90_A0A0H2ZRF4" + /product="IS630-Spn1, transposase Orf1" + /locus_tag="FPBPHK_00015" + /protein_id="gnl|Bakta|FPBPHK_00015" + /translation="MWYNLFMAYSIDFRKKALSYCERTGSITEASHVFQISRNTIYGWL + 
KLKEKTGELNHQVKGIKPRKVDRDRLKNYLTDNPDAYLTEIASEFGCHPTTIHYALKAM + GYTRKKEPHLL" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA + sequence:UniRef:UniRef90_A0A0H2ZRF4" + gene 1553..2998 + /locus_tag="FPBPHK_00020" + /gene="wzg" + CDS 1553..2998 + /db_xref="BlastRules:WP_000091082" + /db_xref="SO:0001217" + /db_xref="UniRef:UniRef50_G3G7D5" + /db_xref="UniprotKB:Q4K1K9" + /db_xref="UserProtein:wzg" + /product="""integral membrane regulatory protein Wzg""" + /locus_tag="FPBPHK_00020" + /protein_id="gnl|Bakta|FPBPHK_00020" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAFR + YLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNRLN + ATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLTVDQ + SSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAPKTSK + NQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADGGNNQK + DKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQEFSTLH + GKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAIIKKLTSTEVLKNYS + SILQGLQDSLQTNMPIETMIDLVNTQLESGGNYKVNSQDLKGTGRMDLPSYAMPDSNLY + VMEIDDSSLAVVKAAIQDVMEGR" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef50_G3G7D5" + /gene="wzg" + gene 3000..3731 + /locus_tag="FPBPHK_00025" + /gene="wzh" + CDS 3000..3731 + /db_xref="BlastRules:WP_000565352" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF43" + /db_xref="UniRef:UniRef100_Q4K1K8" + /db_xref="UniRef:UniRef90_Q9AHD4" + /db_xref="UniprotKB:Q4K1K8" + /db_xref="UserProtein:wzh" + /product="""protein-tyrosine phosphatase Wzh""" + /locus_tag="FPBPHK_00025" + /protein_id="gnl|Bakta|FPBPHK_00025" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAEAYRQGVRTIVSTSHRRK + GMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLGKKRIPTLNDSRY + ALIEFSMNTPYRDIHSALNKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYTQVN + SSHVLKSKLFGERYKFMKKRAQYFLEQDLVHVIASDMHNLDGRPPHMAEAYDLVTQKYG + EAKAQELFVDNPRKIIMDQLI" + /codon_start=1 + /transl_table=11 
+ /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef100_Q4K1K8" + /gene="wzh" + gene 3740..4432 + /locus_tag="FPBPHK_00030" + /gene="wzd" + CDS 3740..4432 + /db_xref="RefSeq:WP_000392514.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF28" + /db_xref="UniRef:UniRef100_Q4K1K7" + /db_xref="UniRef:UniRef50_Q54519" + /db_xref="UniRef:UniRef90_Q4K1K7" + /db_xref="UniprotKB:Q4K1K7" + /db_xref="UserProtein:wzd" + /product="""capsular polysaccharide biosynthesis protein + Wzd""" + /locus_tag="FPBPHK_00030" + /protein_id="gnl|Bakta|FPBPHK_00030" + /translation="MEEQNTLEIDVLQLFRSLWKRKLVILLVAIITSSVAFAYSTFVIK + PEFTSTTRIYVVNRDQGEKSGLTNQDLQAGTYLVKDYREIILSQDVLEEVVSDLKLDLT + PKGLANKIKVTVPVDTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDVTTLE + EARPATTPSSPNVRRNTLFGFLGGAVVTVIAVLLIELLDTRVKRPEDVEDVLQIPLLGL + VPDLDKMK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000392514.1" + /gene="wzd" + gene 4442..5131 + /locus_tag="FPBPHK_00035" + /gene="wze" + CDS 4442..5131 + /db_xref="RefSeq:WP_001142531.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF29" + /db_xref="UniRef:UniRef100_Q4K1K6" + /db_xref="UniRef:UniRef50_Q54520" + /db_xref="UniRef:UniRef90_O84996" + /db_xref="UniprotKB:Q4K1K6" + /db_xref="UserProtein:wze" + /product="""tyrosine-protein kinase Wze""" + /locus_tag="FPBPHK_00035" + /protein_id="gnl|Bakta|FPBPHK_00035" + /translation="MPTLEISQAKLDFVKKAEEYYNALCTNLQLSGDGLKVFSITSVKL + GEGKSTTSTNIAWAFARAGYKTLLIDGDIRNSVMLGVFKARDKITGLTEFLSGTTDLSQ + GLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVIDAA + IITRKCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGVVLNKFDTSVDKYGSYGNYG + DYGKNKK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_001142531.1" + /gene="wze" + gene 5146..6513 + /locus_tag="FPBPHK_00040" + /gene="wchA" + CDS 5146..6513 + /db_xref="SO:0001217" + 
/db_xref="UniParc:UPI000053FF44" + /db_xref="UniRef:UniRef100_Q4K1K5" + /db_xref="UniRef:UniRef50_Q8VU30" + /db_xref="UniRef:UniRef90_Q8VU30" + /db_xref="UniprotKB:Q4K1K5" + /db_xref="UserProtein:wchA" + /product="""undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)""" + /locus_tag="FPBPHK_00040" + /protein_id="gnl|Bakta|FPBPHK_00040" + /translation="MNGKIVKSSLAIIQSFLVILLTYLLSAVREAEIVSTTAIALYILH + YFVFYISDYGQDFFKRGYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYFLT + LHALLVYVLNLFIKWYWKRAYPNFKGSKKILLLTATSRVEKVLDRLIESNEVVGELVAV + SVLDKPDFQHDYLKVVAEEEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMGIDVT + VNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHVIAKRIIDIVGALVGLILCGLAS + IVLVPLIRKDGGSTIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTMQGGMFK + VDDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPEQKRRLSF + KPGITGLWQVSGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVFMRDGAK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef100_Q4K1K5" + /gene="wchA" + gene 6517..6966 + /locus_tag="FPBPHK_00045" + /gene="wchJ" + CDS 6517..6966 + /db_xref="GO:0016740" + /db_xref="RefSeq:WP_000686638.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF2B" + /db_xref="UniRef:UniRef100_Q4K1K4" + /db_xref="UniRef:UniRef50_J9W567" + /db_xref="UniRef:UniRef90_Q4K1M2" + /db_xref="UniprotKB:Q4K1K4" + /db_xref="UserProtein:wchJ" + /product="""putative glycosyl transferase enhancer""" + /locus_tag="FPBPHK_00045" + /protein_id="gnl|Bakta|FPBPHK_00045" + /translation="MKICLVGSSGGHLTHLYLLKPFWKDKERFWVTFDKADARSVLSEE + VVYPCYYPTNRNIKNLIKNTFLAYKILKKERPDLIISSGAAIAVPFFYIGKLFGSKTVY + IEVFDRIDASTLTGKLVYPVTDRFIVQWEEMKKVYPKAINLGGIF" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000686638.1" + /gene="wchJ" + gene 6966..7472 + /locus_tag="FPBPHK_00050" + /gene="wchK" + CDS 6966..7472 + /db_xref="KEGG:K25904" + /db_xref="RefSeq:WP_000578432.1" + 
/db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF2C" + /db_xref="UniRef:UniRef100_Q4K1K3" + /db_xref="UniRef:UniRef50_Q9AQJ2" + /db_xref="UniRef:UniRef90_Q4K1K3" + /db_xref="UniprotKB:Q4K1K3" + /db_xref="UserProtein:wchK" + /product="""putative glycosyl transferase""" + /locus_tag="FPBPHK_00050" + /protein_id="gnl|Bakta|FPBPHK_00050" + /translation="MIFVTVGTHEQQFNRLIKEVDRLKGEGFIQDDVFIQTGYSNYVPK + FCKWEKLISYEKMNQFIEEADTIITHGGPATFMAVIAKGKSPIIVPRLKKFGEHVNDHQ + LEFVEKVLNVYNLTVITNISDLNSYISNFDERKKSDLKSKNNLFMEKFIDMINQLMETG + DIKYD" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000578432.1" + /gene="wchK" + gene 7465..8664 + /locus_tag="FPBPHK_00055" + /gene="wzy" + CDS 7465..8664 + /db_xref="SO:0001217" + /db_xref="UniRef:UniRef50_E0Q2S4" + /db_xref="UniRef:UniRef90_Q4K1K2" + /db_xref="UniprotKB:Q4K1K2" + /db_xref="UserProtein:wzy" + /product="""oligosaccharide repeat unit polymerase Wzy""" + /locus_tag="FPBPHK_00055" + /protein_id="gnl|Bakta|FPBPHK_00055" + /translation="MTKYINSCIKLLFIYSLFSELLYSYYSVSLLFTIPDLLLLAAAVI + AFVDSYSAGKIRVKNPHISLMLFFILLIFLLISFTWGTLNIYGFVMRGRYILGAFLVYF + MTNSYLDDRTFSSLINIAYFMQILNLLLVLHQNIVLHLHPDFTNGIFGFTDYANGIQGF + YCLALSVLSTVYYLYGKWGTMKSLILIAISCIICALAEIKIFFVIFIFSIILIFIFQKS + ETVKKIRIISTAAGISLIFLIAYKLIEIVLPDNLYTFFNVTKALSYENRTEFAGRTNTI + SFLWDNLFYYDYISAIFGKGLGSYSVNYIYELGKMLADGGFISVILLYSFLLSLFIRGT + ITRGKNKQSERLIVSIIAFVVMISIIVWNSTFSRPTYLVFFFLAIGNAAYKSTKLIRRD + " + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef90_Q4K1K2" + /gene="wzy" + gene 8666..9694 + /locus_tag="FPBPHK_00060" + /gene="wchL" + CDS 8666..9694 + /db_xref="RefSeq:WP_000405438.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF2E" + /db_xref="UniRef:UniRef100_Q4K1K1" + /db_xref="UniRef:UniRef50_Q4K1K1" + /db_xref="UniRef:UniRef90_Q4K1K1" + /db_xref="UniprotKB:Q4K1K1" + /db_xref="UserProtein:wchL" + 
/product="""putative glycosyl transferase""" + /locus_tag="FPBPHK_00060" + /protein_id="gnl|Bakta|FPBPHK_00060" + /translation="MEIQISVVIPVYNAENTINNCIESALKQDLESFEVILVNDGSNDS + TSRILEQYSDNPQVKIFHQVNMGVSAARNLGLSHASGEYVFFLDSDDILDDGMLSKMYQ + FVKNNKVDLLSCWHKEPATTQYGGNENKSTSFIARTREEIGAHFVDIFPRSACAKLFFR + KIIEENNITFSTEMSLGEDMSFVYQYLMVSKSIGVIDGVYYNIQNVNPQSLSKRYVQNI + ENSLMIQNQLWNQLLEVYPKIEENYYKQHMDFRFYLANLYVNNLFKFDSPYSSKEKLDQ + IAQQLKKYRLFLDEKVSKEKMPKNINEMIVFYLLKLKIPVLIYSFYSFKEWWKRRKIKN + EG" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000405438.1" + /gene="wchL" + gene 9702..10658 + /locus_tag="FPBPHK_00065" + /gene="wchM" + CDS 9702..10658 + /db_xref="RefSeq:WP_000389753.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF3F" + /db_xref="UniRef:UniRef100_Q4K1L8" + /db_xref="UniRef:UniRef50_E0Q2S2" + /db_xref="UniRef:UniRef90_A0A4J2AN51" + /db_xref="UniprotKB:Q4K1L8" + /db_xref="UserProtein:wchM" + /product="""putative glycosyl transferase""" + /locus_tag="FPBPHK_00065" + /protein_id="gnl|Bakta|FPBPHK_00065" + /translation="MEDLISIVVPVYNVEKYLKKSIESILNQTYQNIEILLVDDGSTDS + SGKICESFSKVDPRIRVFHKENGGLSDARNFGIEQMKGQYVAFIDSDDYISKDYVWKLY + SSIKNNDSEVSICSFLLVDEKGEKIKDELLDSGKICLTGQQILEKVLTADGYRYVVAWN + KLYRSTLFEKLKFKKGMLYEDEFLNYPLFWDCKRVSIVEEPLYLYVQRKGSIVQSNMTL + EKIKMKDEMHTSRIEFYSEKGHSFLHEKACQQYCNWIVTATTNHSKILNPNFSKYLQRQ + FRKFAKYTRNNDIRLIVQNILGFIDIRLAAYVKSKVM" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000389753.1" + /gene="wchM" + gene 10674..11582 + /locus_tag="FPBPHK_00070" + /gene="wchN" + CDS 10674..11582 + /db_xref="RefSeq:WP_000570495.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF30" + /db_xref="UniRef:UniRef100_Q4K1J9" + /db_xref="UniRef:UniRef50_B2ILQ2" + /db_xref="UniRef:UniRef90_Q6X853" + /db_xref="UniprotKB:Q4K1J9" + /db_xref="UserProtein:wchN" + /product="""putative glycosyl 
transferase""" + /locus_tag="FPBPHK_00070" + /protein_id="gnl|Bakta|FPBPHK_00070" + /translation="MIEKILDSIKNHSFYSKLKDKIHRIIPLYIIKNQNIAFQQDTDIA + YRKLKKKFRHISLTGDELKYKMEFSNKVWICWFQGEEHAPELIKTCIQSMRNQLQGREI + IVLTEKNISDYTEIPGYIIEKYKKGWISRAHYSDILRIDLLCRHGGLWVDATVLNTGGD + FSNLEVPLFVYKSLNLSRKDSQAIVASSWLISSYSNHPILLYTRKLLWAYWRRKNSLCN + YFLFHICFTIATERYPIEWSAVPTFNNHSPHILHFELNEQFSEKRWEQLKHISAFHKLN + HHIDYSSGVNTFYKFIVSSKV" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000570495.1" + /gene="wchN" + gene 11587..13050 + /locus_tag="FPBPHK_00075" + /gene="wzx" + CDS 11587..13050 + /db_xref="RefSeq:WP_000066241.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF31" + /db_xref="UniRef:UniRef100_Q4K1J8" + /db_xref="UniRef:UniRef50_O07342" + /db_xref="UniRef:UniRef90_Q6X852" + /db_xref="UniprotKB:Q4K1J8" + /db_xref="UserProtein:wzx" + /product="""flippase Wzx""" + /locus_tag="FPBPHK_00075" + /protein_id="gnl|Bakta|FPBPHK_00075" + /translation="MSNKISKNLAYNMGYQLIGIAAPLITSPYLSRILGAENLGIHSFT + MSVALYFMMFMLLGIANYGNRTIATVKREGKDILSKTFWSIYSIQLIMSILVTIAYLAY + LYLGAVHYKVIAILQLFLLLSNAVDITWFFYGLENFKQIVFRNTLVKLLGLFLIFLCVR + QGTDLWKYTFINGSVTLVGQLLLWGQLKGILTWKKIQLKELLPHIKPILILFIPVLAIS + IFTNMDKYMLGLMVDVKQVGFYDNAGRIIEIPKALIAALGAVMLPRTSYLLAEGQKEKS + KYYIEVTILYVMIISSVLMFGLISVSDIFSIIFWGEEFLESGRLISAMSPAFVFSVLGN + IIRTQYLIPRAKDKDYVVSLIAGAVVNLVLNYFFIKPFGAMGATVSTVLAEFVLSGMQF + WSVRRDLDLKRYLKNGLIFYLFGLIMYLVIITLKTQLPYNIMSLILLIVLGGIVYVIFC + CCYILMSRNLHFKLLKEKIIRKVVHKNTL" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000066241.1" + /gene="wzx" + gene 13406..14383 + /locus_tag="FPBPHK_00080" + /gene="wciZ" + CDS 13406..14383 + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF46" + /db_xref="UniRef:UniRef100_Q4K1J7" + /db_xref="UniRef:UniRef50_E0Q2R6" + /db_xref="UniRef:UniRef90_Q6X851" + /db_xref="UniprotKB:Q4K1J7" + 
/db_xref="UserProtein:wciZ" + /product="""putative acetyl transferase""" + /locus_tag="FPBPHK_00080" + /protein_id="gnl|Bakta|FPBPHK_00080" + /translation="MVTKDKGLTYNSTLHAIKVLACFSVVAIHIWLPGKIGAFYQIIAR + FAVPMFFLISGFYSYNISKNKIRNRIKKIFRLILRSTFFYVIIFVWMFWREGNMQFIFQ + NFNLTNIIRFVIFNRISDLIGYLATPLWYLFAILYIYIYLYFSNKRLLLTKRWISILLL + FSFIMEATISDSIFYRNFLFMGIPFFGIGILIAQKQKEIINCKIINKILILGTIIYPIL + IFLEYYILGNSFEVYISSVLATIILMIFAIKSPKAINIKILNEIGDKYATFVYIIHQFI + IVIFKFLVSNVYILKFGTIFVFLICCFLGVLFQFIKNRLLKRFS" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef100_Q4K1J7" + /gene="wciZ" + gene 14385..15533 + /locus_tag="FPBPHK_00085" + /gene="wchX" + CDS 14385..15533 + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF47" + /db_xref="UniRef:UniRef100_Q4K1J6" + /db_xref="UniRef:UniRef50_Q9R922" + /db_xref="UniRef:UniRef90_A0A4J2AK78" + /db_xref="UniprotKB:Q4K1J6" + /db_xref="UserProtein:wchX" + /product="""putative glycerol phosphotransferase""" + /locus_tag="FPBPHK_00085" + /protein_id="gnl|Bakta|FPBPHK_00085" + /translation="MVVLQNVKFLVRVVFMVIISIVLWPVRIKKNKILFINFNGKGYGD + NPKSICEYLRVTYPELDLVWLAKDNEDFPDGVRVVRYKSLQSFYEQASSKVWVYNVRNF + ERLLKKRGQFYIQTWHGASSFKLIEKQADLPLKYILEAKYDARVTDIMISDSRKQTEEF + QKYFWYSGEIFEVGMPRNDALFHYKEDYDKLNNIRKELSIDSDNYVILYAPTFRDDGDA + SYLDINFERLLQSIEQEIKKKCKILIRLHPNDSHFSNNISFNHDIIDVTLFSDMQELIL + LADVLLTDYSSAIFDFMLLNKPYVRYVNDLEKYAELRGVSDTYYELPDSIIKTAEELYD + LLPKKIENFDYDSIKKYRNEILCPIFNGTASENVGRRIIQEL" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef100_Q4K1J6" + /gene="wchX" + gene 15569..16597 + /locus_tag="FPBPHK_00090" + /gene="gtp1" + CDS 15569..16597 + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF48" + /db_xref="UniRef:UniRef100_Q4K1J5" + /db_xref="UniRef:UniRef50_Q9R921" + /db_xref="UniRef:UniRef90_Q9R921" + /db_xref="UniprotKB:Q4K1J5" + /db_xref="UserProtein:gtp1" + 
/product="""putative glycerol-2-phosphate dehydrogenase""" + /locus_tag="FPBPHK_00090" + /protein_id="gnl|Bakta|FPBPHK_00090" + /translation="MKNNDLKIGSGAIHQISATLSQNNISGKILYCADPVVDDLYGSIV + RSQIEEIGRVKEESCNYNTIAYAMNIAERTIATDIDCIVGMGGGRVLDVCKYASFISKR + PYLSIPTTAANDGIASPVAVLKRQDDRPKSLGAAIPSMTLIDIDVIASGPIQNIKAGIG + DTISNYTALKDWELAVERGKDEMHGFAYLMSQNSLDALMKTKYNSITPDFIEVLVNSLV + LSGIAMDFAGSSRPVSGSEHLFSHALDYYGSTRNLHGIQVALGTVAVLKLIENSVDAVV + DYLQRFEVHINPKLLGIDEELFIYCMQHATKMRSNRYTYLHEVDLSTDRLKQIYKELIS + EL" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef100_Q4K1J5" + /gene="gtp1" + gene 16613..17317 + /locus_tag="FPBPHK_00095" + /gene="gtp2" + CDS 16613..17317 + /db_xref="RefSeq:WP_000645464.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF34" + /db_xref="UniRef:UniRef100_Q4K1J4" + /db_xref="UniRef:UniRef50_O85005" + /db_xref="UniRef:UniRef90_O85005" + /db_xref="UniprotKB:Q4K1J4" + /db_xref="UserProtein:gtp2" + /product="""putative nucleotidyl transferase""" + /locus_tag="FPBPHK_00095" + /protein_id="gnl|Bakta|FPBPHK_00095" + /translation="MKALILAAGLGTRLAPITNEVPKSLVPVNGKPILMKQIENLYQNN + ITDITIIAGYKSSVLTDAVTEKYPEINIIDNVDFKTTNNMYSAYLGKAAMGDSDFLMMN + ADVFYDASVIKSLLLHKAPNAIVTDLGTYIEESMKVVEKNGRLVEISKQISPEEALGAS + IDVYKFSYEAGARFFEKCKEFIEDKRELQMWSEVALNAILPEVEFIACPLDGRWLEIDN + HEDLAVAEKLFA" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000645464.1" + /gene="gtp2" + gene 17338..18165 + /locus_tag="FPBPHK_00100" + /gene="gtp3" + CDS 17338..18165 + /db_xref="SO:0001217" + /db_xref="UniRef:UniRef50_Q4K1N0" + /db_xref="UniRef:UniRef90_Q4K1N0" + /db_xref="UniprotKB:Q4K1N0" + /db_xref="UserProtein:gtp3" + /product="""putative phosphotransferase""" + /locus_tag="FPBPHK_00100" + /protein_id="gnl|Bakta|FPBPHK_00100" + /translation="MTNRVDYFGADISELQNKKLFLFDMDGTIYEEDRLFEGTLELLDY + 
IHNIGGEYIFITNNSSKSVVDYVEKVNRLGIKAERDNFFTSAQATIVYIKENYPKSKVY + CQGTKSLIKELSDAGIDVTEQVSADIDVVLVGFDTELTSDKIRNTCEILSTKDVPFIAT + NPDIRCPVSFGFIPDCGSICDMISKSVDRKPVYIGKPEPTMVDIVRKKLNYSLFETVVI + GDRLYTDIMTGINAGVTSVCVLTGEATVNDIQQGSIKPTYTFKNVKEMWKGIV" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef90_Q4K1N0" + /gene="gtp3" + gene 18441..19079 + /locus_tag="FPBPHK_00105" + /gene="rmlB" + CDS 18441..19079 + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF49" + /db_xref="UniRef:UniRef100_Q4K1J2" + /db_xref="UniRef:UniRef50_Q4K1J2" + /db_xref="UniRef:UniRef90_Q4K1J2" + /db_xref="UniprotKB:Q4K1J2" + /db_xref="UserProtein:rmlB" + /product="""dTDP-D-glucose 4,6-dehydratase RmlB""" + /locus_tag="FPBPHK_00105" + /protein_id="gnl|Bakta|FPBPHK_00105" + /translation="MPGHGEGPGEKFTAETKYNPSSPYSSTKAASDLIVKAWVRSFGVK + ATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLYGEGKNVRDWIHTNDHSSGVWTIL + TKGQIGETYLIGADGEKNNKEVLELILKEMGQATDAYDHVTDRAGHDLRYAIDASKLRD + ELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKEAVEANYAKTQEIITV" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef100_Q4K1J2" + /gene="rmlB" + gene 19145..19996 + /locus_tag="FPBPHK_00110" + /gene="rmlD" + CDS 19145..19996 + /db_xref="COG:COG1091" + /db_xref="COG:M" + /db_xref="EC:1.1.1.133" + /db_xref="GO:0008831" + /db_xref="GO:0009243" + /db_xref="GO:0019305" + /db_xref="KEGG:K00067" + /db_xref="RefSeq:WP_000600910.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF4A" + /db_xref="UniRef:UniRef100_Q4K1G6" + /db_xref="UniRef:UniRef50_Q9AH81" + /db_xref="UniRef:UniRef90_Q9AH81" + /db_xref="UniprotKB:Q4K1G6" + /db_xref="UserProtein:rmlD" + /product="""dTDP-4-keto-L-rhamnose reductase RmlD""" + /locus_tag="FPBPHK_00110" + /protein_id="gnl|Bakta|FPBPHK_00110" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITNEEMVEKV + FEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTDYV + 
FDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKNFVF + TMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDTTWYD + FAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQEFYKQE + VR" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000600910.1" + /gene="rmlD" + gene 20059..21168 + /locus_tag="FPBPHK_00115" + /gene="glf" + CDS 20059..21168 + /db_xref="COG:COG0562" + /db_xref="COG:M" + /db_xref="EC:5.4.99.9" + /db_xref="GO:0008767" + /db_xref="GO:0009273" + /db_xref="RefSeq:WP_050208706.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF4B" + /db_xref="UniRef:UniRef100_Q4JZV2" + /db_xref="UniRef:UniRef50_A0A4S2G265" + /db_xref="UniRef:UniRef90_F8WRM7" + /db_xref="UniprotKB:Q4JZV2" + /db_xref="UserProtein:glf" + /product="""UDP-galactopyranose mutase Glf""" + /locus_tag="FPBPHK_00115" + /protein_id="gnl|Bakta|FPBPHK_00115" + /translation="MYDYIIVGAGLSGAIFAYEATKRGKKVKVIDKRNHIGGNIYCENV + EGVNVHKYGAHIFHTSNKKVWDYVNQFAEFNNYVNSPVANYKGSLYNLPFNMNTFYAMW + GTKTPQEVKDKITEQTADMKDVEPKNLEEQAIKLIGPDVYEKLIKGYTEKQWGRSATEL + PPFIIKRLPVRLTFDNNYFNDRYQGIPIGGYNVIIENMLKDVEVELGVDFFAHREELEA + SAEKVVFTGMIDQYFDYKHGELEYRSLRFEHEILDEENYQGNAVVNYTEREIPYTRIIE + HKHFEYGTQAKTVITREYPADWKRGDEPYYPINDEKNNAMFAKYQEEASKNDKVIFCGR + LADYKYYDMHVVIERALEVVEKEFGYDKK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050208706.1" + /gene="glf" + gene 21155..22183 + /locus_tag="FPBPHK_00120" + /gene="wcjE" + CDS 21155..22183 + /db_xref="SO:0001217" + /db_xref="UniRef:UniRef50_Q8KWN9" + /db_xref="UniRef:UniRef90_Q4K0S3" + /db_xref="UniprotKB:Q4K1I9" + /db_xref="UserProtein:wcjE" + /product="""putative acetyl transferase""" + /locus_tag="FPBPHK_00120" + /protein_id="gnl|Bakta|FPBPHK_00120" + /translation="MTKSRINWIDFGKGFSIFLVLAGHVLLGLYQSEKFPTANNILSLL + IAQVYIFHIPVFFALSGYFFKPVSDLKEFWQYAKKKTIVFGLPYIFYSIIHFGLQKVAG + 
ASVRVPTTISDLLNIYKFPLGVSWYLYTLWSILIVYGLLSVVFKNRKSLLLVSVFAYIF + TLFIQTDIFIVQRTLVWGICFFLGSVLSEIHFDKINLKKFLFFFVLFDFIYMFAWFLFY + EVGSKKDYVSYINPGLWGIAFIVCVLVAFAIFPKMEKNFPKTFLYFTKYGKDSLGIYIL + HAPICSMIRILMLKVGINSVFLHVVVGIVLGWYLSILATYILKKIPFLNIVLLPQKYIK + LK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef90_Q4K0S3" + /gene="wcjE" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acactgcggc taaagaagta cttgaaaaac aggtcttggc tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcgta taaaaacaag + 181 ggaggactgt ataaaagaca gaaatccttt gttttttata accaaagttt ataaactttc + 241 attcttgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga agatgaacat + 301 aaagaagcgt gtccttagtg caggcctgac ttttgcatct gctttgcttt tagctgcttg + 361 cggccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaactat ctattagact attacgctga taatatagtc aattgaaaca agaacaagac + 481 aaaagagcct cataaaaggt attgcaactt ggtaatacct ttttgaggtg ctttttgata + 541 tgagcccatg ttttctcaat aggattgtac tcaggtgagt agggaggaag aggtaaaagt + 601 ttatgccaaa cttttcgcat aaaagttcta gcttccccat tctatggaat cttgcattat + 661 ccataataat aaccgatggt gtggttaatg ttggtaagag aaacttctga aaccatactt + 721 caaaaaagtc gctcgtcatc gtctcttcgt aagtcattgg aacgattaat tcaccattta + 781 ttagacctgc aaccaaagaa atcctctgat atcttcttcc agatactttg cctcttatta + 841 actgaccttt taatgagcga ccatattctc gataaaaata agtatcgaat cctgtttcgt + 901 caatctaaac aggtgctagg tgctttaaac tattaaaatt cttaagaaat aaggctactt + 961 tttctgggtc ttgttcatag taggtgtggt tctttttttc gagtgtagcc catagctttg + 1021 agcgcatagt ggatggtagt tggatgacag ccaaattcag aagctatttc agtcaaataa + 1081 gcgtctggat tgtcagtaag atagttttta agtctatctc tatcaacttt tcttggtttt + 1141 attcctttta cttggtggtt tagctctcct gttttctctt ttagctttaa ccagccataa + 1201 atggtattac gtgagatttg gaaaacgtgt gatgcttctg ttatactacc tgttcgctca + 1261 caataagaga gagctttttt acgaaaatct attgaatatg ccataaaaag 
attataccac + 1321 attgtgtact atattagatt gaaactagaa tagtacaccg ctgcttctaa aacattgtta + 1381 gaaatcgatt tgactgtcct gatcgatttg tcatgttctt atttcatttt actatatttt + 1441 tggttcgcgg gaagtctact aagatactta aagatgcaga tagtaaaaaa atgtagacat + 1501 taccgtaaaa aagtgatata atcgtatgat gttcaaggta taggtgttaa tcatgagtag + 1561 acgttttaaa aaatcacgtt cacagaaagt gaagcgaagt gttaatatcg ttttgctgac + 1621 tatttattta ttgttagttt gttttttatt gttcttaatc tttaagtaca atatccttgc + 1681 ttttagatat cttaacctag tggtaactgc gttagtccta ctagttgcct tggtagggct + 1741 actcttgatt atctataaaa aagctgaaaa gtttactatt tttctgttgg tgttctctat + 1801 ccttgtcagc tctgtgtcgc tctttgcagt acagcagttt gttggactga ccaatcgttt + 1861 aaatgcgact tctaattact cagaatattc aatcagtgtc gctgttttag cagatagtga + 1921 tatcgaaaat gttacgcaac tgacgagtgt gacagcaccg actgggactg ataatgaaaa + 1981 tattcaaaaa ctactagctg atattaagtc aagtcagaat accgatttga cggtcgacca + 2041 gagttcgtct tacttggcag cttacaagag tttgattgca ggggagacta aggccattgt + 2101 cttaaatagt gtctttgaaa atatcatcga gtcagagtat ccagactacg catcgaagat + 2161 aaaaaagatt tataccaagg gattcactaa aaaagtagaa gctcctaaga cgtctaagaa + 2221 tcagtctttc aatatctatg ttagtggaat tgacacctat ggtccaatta gttcggtgtc + 2281 gcgatcagat gtcaatatcc tgatgactgt caatcgagat accaagaaaa tcctcttgac + 2341 cacaacacca cgtgatgcct atgtaccaat cgcagatggt ggaaataatc aaaaagataa + 2401 attaacccat gcgggcattt atggagttga ttcgtccatt cacaccttag aaaatctcta + 2461 tggagtggat atcaattact atgtgcgatt gaacttcact tctttcttga aaatgattga + 2521 cttattggga ggggtagatg ttcataatga tcaagaattt tcaactctac atgggaagtt + 2581 ccatttccca gtagggaatg tccatctaga ctctgagcag gctctcggtt ttgtacgtga + 2641 acgctactca ctagccgatg gagaccgtga ccgtggtcgc aaccaacaaa aggtcattgt + 2701 agcaattatt aagaagttaa cttctacaga ggttttgaaa aactatagta gtattcttca + 2761 aggattgcag gattctcttc aaacaaatat gccgattgag actatgatag atttagtgaa + 2821 tactcagttg gagagtggag ggaattataa agtaaattcg caagacttga aaggtacagg + 2881 tcggatggat cttccttctt atgcaatgcc agacagtaac ctctatgtga tggaaataga + 2941 tgatagtagt 
ttagctgtag ttaaagcagc tatacaggat gtgatggagg gtagatgaaa + 3001 tgatagacat ccattcgcat atcgtttttg atgtagatga cggtcccaag tcaagagagg + 3061 aaagcaaggc tctcttggca gaagcctaca gacagggggt gcgaaccatt gtctctacct + 3121 ctcaccgtcg caagggcatg tttgaaactc cggaagagaa gatagcagaa aactttcttc + 3181 aggttcggga aatagctaag gaagtggcga gtgacttagt cattgcttac ggggctgaaa + 3241 tttactacac accagatgtt ctggataagc tgggaaaaaa gcggattccg accctcaatg + 3301 atagtcgtta tgccttgata gagtttagta tgaacactcc ttatcgcgat attcatagcg + 3361 ccttgaacaa gatcttgatg ttgggaatta ctccagtcat tgcccacatt gagcgctatg + 3421 atgctcttga aaataatgaa aaacgcgttc gagaattgat cgatatgggc tgttacacgc + 3481 aagtaaatag ttcacatgtc ctcaaatcca aactttttgg cgaacgttat aaattcatga + 3541 aaaaaagagc tcagtatttt ttagagcagg atttggtcca tgtcattgca agtgatatgc + 3601 acaatctaga cggcagacct cctcatatgg cagaagcata tgaccttgtt acccaaaaat + 3661 acggagaagc gaaggctcag gaactttttg tagataatcc cagaaaaatt ataatggatc + 3721 aattaattta ggagaaaata tggaggaaca aaacactttg gaaatcgatg tattgcaact + 3781 attcagatct ttgtggaaaa gaaagttggt cattttatta gtggcaatta taacttcttc + 3841 agttgctttt gcctacagta cttttgttat caaacctgag tttactagta cgactcggat + 3901 ttatgtagtt aaccgtgatc agggagagaa gtctggttta accaatcaag acttgcaggc + 3961 aggaacatac ttggttaaag actatcgtga aattatccta tcgcaggatg ttttggagga + 4021 agttgtttct gatttgaaac tagatttgac gccaaaaggt ttggctaata aaattaaagt + 4081 gacagtacca gttgataccc gtattgtctc aatctctgtc aaggataaac agccagagga + 4141 agccagtcgc atcgctaatt ctctacgaga agttgctgca gaaaagatcg tcgctgtaac + 4201 gcgagtatct gatgtaacga cacttgaaga agcgcgacca gctacgactc cctcttctcc + 4261 aaatgttcga cgcaacacct tgtttggttt tcttggagga gccgtcgtaa cagtaattgc + 4321 tgttcttttg attgagttgc tcgacacccg tgtgaaacgt cctgaagatg ttgaagatgt + 4381 actgcaaatt ccacttttag ggctcgttcc agatttggac aaaatgaaat aggaggaagt + 4441 tatgccaacg ttagaaatct cacaggcaaa attggatttt gtaaaaaagg cagaggaata + 4501 ttataacgct ttgtgcacga acctacagtt aagtggagat ggtttgaaag tattttctat + 4561 cacttctgtg aaactaggag aaggaaaatc 
aacgacttcc accaatatcg cttgggcttt + 4621 tgcgcgtgca ggttacaaaa cgctgctgat tgatggagat attcgcaatt ctgttatgtt + 4681 aggtgtcttt aaagcaaggg ataagattac aggcctgaca gaatttttat caggaactac + 4741 agacctatca caagggcttt gtgataccaa tatcgaaaat ctctttgtaa ttcaggctgg + 4801 ctctgtgtca ccgaatccga cagctcttct tcaaagtaag aatttcagta caatgcttga + 4861 aaccttgcgt aaatattttg actatatcat tgtagatact gctcctgtcg gtgtcgtgat + 4921 tgatgcggct attattacgc gaaaatgcga tgcttctatt ttagtgacgg aggcaggtga + 4981 aataaatcga cgggatattc aaaaagcaaa agaacagttg gaacacacag ggaagccgtt + 5041 tttgggagtt gtgttgaata aattcgatac ttcagtagac aaatacggtt cttatggaaa + 5101 ttatggagat tacgggaaaa ataaaaaata ggtcggggga tagagatgaa tggaaaaata + 5161 gtaaagtctt cattggccat aatccagagt tttcttgtta ttttattgac ttatctactt + 5221 agtgctgtga gagaagcgga gattgtttca acaacagcta ttgcacttta tatcctccat + 5281 tattttgtct tttatatcag tgattatgga caggatttct ttaaaagagg atatttgatt + 5341 gaacttgtcc agacattgaa atatatccta ttctttgcac tagcgattag tatttctaat + 5401 tttttcttag aggatcgatt tagtatttcc agacgaggca tgatttactt cctcacatta + 5461 catgctctct tagtctatgt gctaaaccta tttatcaagt ggtattggaa gcgggcttat + 5521 cccaacttta aaggaagtaa gaagattctc ctacttacag caacttctcg tgtcgaaaag + 5581 gtactggata gattaataga atcaaatgag gttgttgggg agttggtagc cgtcagtgtc + 5641 ttagataaac cagattttca gcatgattat ttaaaggtag tagcagagga ggagatagta + 5701 aactttgcga ctcatgaggt ggtcgatgaa gtctttatca atcttccaag tgaaaaatac + 5761 aatattggag agcttgtctc tcagtttgaa acgatgggaa ttgatgtaac agtcaatcta + 5821 aatgcttttg atcgtagttt ggcacgtaac aagcaaatcc gtgagatggc aggattaaac + 5881 gttgtgactt tttctacaac attttataag actagtcatg taattgctaa gcggattatt + 5941 gatatcgtgg gtgcattggt agggctgata ctatgtggtc tagccagtat tgtactggtt + 6001 cctttgattc gaaaggatgg gggctctact atttttgctc agacgcgtat aggaaaaaat + 6061 ggtcgtcagt tcacttttta taagtttcgc tctatgtgtg tagatgccga ggcgaaaaaa + 6121 agagaactca tggaacaaaa taccatgcag ggtggaatgt ttaaggtgga cgatgatcct + 6181 cgtatcacga aaattggtcg ttttatacgg aagactagct tggacgagct 
accacagttt + 6241 tataatgttc taaagggaga tatgagtttg gttggcacac ggccaccaac agtggacgag + 6301 tatgaacact ataccccaga acaaaaacgt cggctaagtt ttaaacctgg tataacaggc + 6361 ttatggcagg tcagtggacg aagtgagatt aagaattttg atgaagttgt caaattagat + 6421 gtagcctata tagacgattg gacaatttgg aaagacattg aaattttatt gaagacagtt + 6481 aaagttgtat ttatgagaga cggagcgaag taggaaatga aaatatgttt agttggatct + 6541 agtggaggtc atctgactca tttatatctt ttaaaacctt tctggaaaga taaagaaaga + 6601 ttttgggtta cttttgataa ggcggacgct cggagtgtac tctctgagga agttgtatat + 6661 ccctgttatt atccaaccaa tcgtaatata aaaaatttaa taaaaaatac ttttctcgcc + 6721 tataaaattt taaaaaaaga gagaccagat ttgattattt cttctggtgc cgctatcgct + 6781 gttcctttct tttatattgg gaagttattt ggatcaaaga cagtgtatat agaagttttt + 6841 gatagaattg atgcttcaac actgacagga aaacttgttt atccagtaac ggataggttt + 6901 attgttcaat gggaagaaat gaaaaaagta tatccaaagg caattaatct cggagggatt + 6961 ttctaatgat ttttgtgaca gtaggtactc atgaacaaca gtttaatcga cttattaaag + 7021 aggttgatag attaaaaggt gagggattta ttcaggatga tgtttttatt caaacaggat + 7081 actctaatta tgttccaaaa ttttgtaaat gggaaaaatt aatatcttat gaaaaaatga + 7141 atcaatttat tgaggaagct gatacaatca ttacccatgg cggtccagct acgtttatgg + 7201 cagttattgc taaagggaaa agtccgataa ttgttccgag attaaaaaaa tttggtgagc + 7261 atgtgaacga ccatcaactt gaatttgttg agaaagtgtt aaatgtctat aatttgacag + 7321 tcatcactaa cataagtgat cttaattcct atatttctaa ttttgatgag cgaaaaaaat + 7381 cagatttgaa gagcaaaaat aatctattta tggagaaatt tatagatatg attaatcagt + 7441 tgatggagac aggtgacatc aagtatgact aagtacataa atagctgtat caagttgtta + 7501 ttcatatatt cgttatttag tgaattgcta tactcatatt attctgtatc tctattattt + 7561 acgatacctg acttattatt gttggcagca gcagtaattg cttttgtaga ttcttattct + 7621 gcagggaaaa taagagttaa aaatcctcac attagtttaa tgctcttttt tatattgctg + 7681 atatttctat taattagttt tacttggggt actcttaata tatatggatt tgttatgaga + 7741 ggaagatata tactgggagc atttctagtt tattttatga caaatagcta tctagatgat + 7801 agaacctttt catcattgat aaacattgct tattttatgc agatattgaa cctattatta + 7861 gttttacatc 
aaaatatagt attacatttg caccctgact tcactaatgg gatttttggt + 7921 tttactgatt atgcaaatgg aatccaagga ttttattgct tagccttaag tgttttatct + 7981 actgtatatt atctgtatgg taaatgggga acaatgaagt cattaatatt gattgctatt + 8041 tcgtgtataa tttgtgcatt agcagaaata aagatttttt ttgtcatttt tatattttct + 8101 attattctaa tttttatatt tcaaaagtca gaaacagtaa aaaaaatacg aataattagt + 8161 acagctgctg gaatatctct tattttttta attgcctata aactcattga gatagtttta + 8221 cctgataatt tgtatacttt ttttaatgtt acaaaggcat tatcatatga gaataggaca + 8281 gagtttgcgg gacgaacaaa tactatttcc ttcctatggg acaacttatt ttattatgat + 8341 tatattagtg ctatatttgg gaaaggacta ggttcatact ctgttaatta tatttatgaa + 8401 cttggtaaaa tgcttgcaga tggtggtttt atttcagtga ttttgcttta ttcatttttg + 8461 ttgtcattat tcatacgggg aactattact agaggaaaaa ataagcaaag tgaaagacta + 8521 attgtatcca tcatagcttt tgtggtgatg attagcatta ttgtttggaa tagtacgttc + 8581 tctagaccaa cttatcttgt atttttcttt ctagcaatag gtaatgcagc gtataagtct + 8641 actaaattaa taagaaggga ttgagatgga aattcaaata tcagtggtga ttccagtata + 8701 caatgctgaa aacacgatta ataattgtat tgaaagtgct ttaaaacaag atttagaatc + 8761 ttttgaagta attttagtaa acgatggatc gaacgattct acatcaagaa ttcttgaaca + 8821 gtatagtgat aatccccaag tgaagatatt tcatcaagtg aacatgggag tatctgctgc + 8881 cagaaattta ggtttatctc atgcaagcgg agaatacgta ttctttttag attcagatga + 8941 tattttagat gatggtatgc tttctaaaat gtaccaattt gtaaaaaata ataaagttga + 9001 tctcttatct tgttggcata aagaacctgc tacaactcaa tacggtggaa atgagaataa + 9061 gtcaacttca tttattgcac gtacaagaga agaaataggt gctcattttg ttgatatctt + 9121 tccgagaagt gcttgtgcca aattgttttt tcgcaaaata attgaagaaa ataatattac + 9181 tttttcgact gagatgtcac taggtgaaga tatgtcattt gtgtatcaat acttaatggt + 9241 ttctaaaagt attggagtta ttgacggggt gtattataat attcaaaatg taaatccaca + 9301 gtcgttatct aagcgctatg tgcagaatat tgaaaattcc ctaatgattc agaaccagtt + 9361 atggaatcaa ctgttggaag tttatcctaa aattgaggag aactactata agcaacatat + 9421 ggattttaga ttttaccttg ctaacttgta tgtaaataat ttatttaaat ttgattctcc + 9481 gtattcatca aaagaaaaac tagaccaaat 
tgctcaacaa ttaaaaaagt atagattatt + 9541 tttagatgaa aaagtcagca aagaaaagat gcctaaaaat ataaatgaga tgattgtttt + 9601 ttatttacta aaattgaaaa ttccagtgtt gatttattct ttttattcgt ttaaagagtg + 9661 gtggaagaga agaaaaatta aaaatgaagg ataaataagt tatggaagat ttgataagca + 9721 ttgttgttcc agtctataac gtggaaaaat atttaaaaaa atcaatagaa agtattttga + 9781 atcagactta tcaaaatatc gagattttat tggttgatga cggaagcaca gatagtagtg + 9841 ggaaaatttg tgaatcattt agtaaagttg atcctaggat aagagtattt cataaagaaa + 9901 atggtggttt atcagatgct cggaattttg gaattgagca aatgaaaggt caatatgtag + 9961 cgtttattga tagcgatgac tacatatcta aggattatgt ctggaagttg tattcttcta + 10021 taaaaaataa tgattccgag gtgtcgattt gttctttttt attagtcgat gaaaaagggg + 10081 aaaaaataaa agatgagcta ttagattcgg gaaaaatatg cttgactggt caacaaatat + 10141 tagaaaaagt attaacagcc gacggctatc gctatgttgt tgcttggaat aagctttatc + 10201 ggtcaacttt atttgaaaaa ttaaaattta aaaaaggaat gttgtatgag gatgaatttc + 10261 ttaactatcc tctattttgg gactgtaaaa gggtatcaat tgtagaggag ccgttatatt + 10321 tatacgttca acgaaaagga agcattgtac aaagtaatat gactttagaa aaaataaaga + 10381 tgaaggatga gatgcatact tcacgcattg agttttattc agaaaagggg cattcttttt + 10441 tgcacgaaaa agcgtgtcaa cagtactgca attggattgt tacagcgact accaatcata + 10501 gtaagatttt aaatcctaat ttttcgaagt atttacaacg acagtttaga aagttcgcta + 10561 aatatacacg aaacaatgat attagactaa ttgtgcagaa cattctagga tttatagata + 10621 ttcgtttagc agcttatgta aaatcaaaag taatgtagag tataggaaac ataatgatag + 10681 aaaaaatttt agattctatt aaaaatcatt ctttttatag taaattgaag gataaaattc + 10741 atagaattat tccattatat attataaaaa atcaaaatat agcttttcaa caagataccg + 10801 atatagcata tagaaaacta aagaagaagt ttaggcatat ttcgttgact ggagatgagc + 10861 ttaaatataa aatggagttt tcaaataaag tttggatttg ttggtttcag ggagaagagc + 10921 atgccccaga gttaattaaa acatgtattc aatcaatgag gaatcaactt caaggaagag + 10981 aaatcattgt gttgacagaa aaaaatataa gtgattatac agagattcca ggctatatta + 11041 ttgaaaaata caaaaaagga tggatttctc gtgcgcatta ctctgatatc cttaggatag + 11101 atcttctatg tcgccatgga ggattatggg 
tagatgcaac agtgttgaat acaggaggag + 11161 atttctcaaa tcttgaggta ccactttttg tatataaatc tttgaattta tcaagaaaag + 11221 attcacaagc tattgtagca tcaagttggt taatttcgtc atatagtaat catcctatat + 11281 tactctatac gagaaaactc ctatgggcct actggcgaag aaaaaatagt ttatgtaatt + 11341 attttttgtt ccatatatgt tttacaatag ctacagagcg gtacccaatc gaatggtctg + 11401 ctgtccctac ttttaataat cattctcctc atatacttca ttttgagttg aatgaacaat + 11461 tttcggaaaa acggtgggaa caactgaagc atatttcggc gtttcataaa ttaaatcatc + 11521 atatagatta ttctagcggt gttaacactt tttataagtt catagtatct tcgaaagttt + 11581 agaaaaatga gtaataaaat tagtaaaaat ttagcctaca atatggggta tcagttaatt + 11641 gggattgcag ctcccttgat aacttctcct tatttatcac ggatattagg tgctgaaaat + 11701 ttaggtattc attcttttac tatgtcggtt gcactttact ttatgatgtt tatgcttctt + 11761 ggaattgcaa attacggaaa tagaacaatt gcgactgtta aacgagaagg aaaggatatt + 11821 ctatcaaaaa cgttttggag tatctactct atccagttga taatgtctat tctggtaact + 11881 atagcttatc ttgcttatct atatttgggg gcagtacatt acaaagttat tgcaatatta + 11941 caactctttt tattgttatc aaatgctgtt gatattactt ggtttttcta tggattagaa + 12001 aattttaagc aaatcgtttt taggaataca ttagtcaaac ttttaggatt atttttaatt + 12061 tttttatgtg tgcgtcaagg cacagattta tggaaataca catttataaa cggatcagta + 12121 actttagttg gccaactttt actatgggga caattaaaag gaatattaac ttggaaaaaa + 12181 attcaattaa aggaattact acctcatatc aagccaattt taattctttt tattcctgta + 12241 ctagccatta gtatttttac taatatggat aaatatatgc ttggtttaat ggttgatgta + 12301 aagcaggttg gattttatga caatgcaggt agaattattg aaattcctaa agctttgatt + 12361 gcagctttag gggccgttat gttgccaaga acttcctatt tattagcgga aggacagaaa + 12421 gaaaagagta aatactacat agaggtaaca attttatacg tgatgattat ttctagtgta + 12481 ttgatgtttg ggctaatatc ggtatctgat attttttcca ttatattttg gggagaagaa + 12541 tttcttgaat caggtagatt gatttctgct atgtctccgg cttttgtctt ctctgtatta + 12601 ggaaatatca ttaggactca gtatttgatt cctagagcta aggataaaga ttatgtagtg + 12661 tctctaattg cgggggctgt tgttaatcta gtgctaaact atttttttat aaaacctttt + 12721 ggtgctatgg gagcaacagt tagtacagtt 
ttggcagaat ttgtattgtc tggaatgcag + 12781 ttttggtcag taagaagaga cttagattta aaaagatatt tgaaaaacgg tttgatattc + 12841 tacctatttg gtctgattat gtaccttgtt attataacac tcaaaactca gttaccatac + 12901 aatataatga gtcttatttt actaatagtt ttgggtggaa tagtatatgt tattttttgt + 12961 tgttgctata ttttaatgtc aagaaattta cattttaagt tattgaagga aaagattata + 13021 cgaaaggttg tacataaaaa tacattataa aatattagtt ttatcttatt tagttggata + 13081 ctattaaata aacgaaaata tttgaaactt tggtaattga gattatagag ataaactaag + 13141 ttatattata gctttattat taaagtaaga atatcggtgc agtgtaggta acgaataatg + 13201 tgagtactca tttcttagat ggagctaggg gtcatcataa gggattgata tgacattttg + 13261 agtaagttac agctagagtt taggtttgat tatatcagat atttagatga tttggaaaat + 13321 aataaaataa gttaggaact atttttattg ttttgagtga caggtttgat tttgggaaat + 13381 gtattttgtt aaataggtag gaaagatggt tactaaagat aaaggattaa catataatag + 13441 tactttgcat gcaataaaag tattagcatg ttttagtgtt gttgctattc atatatggct + 13501 accaggaaaa attggagcgt tttatcaaat aatagcacga tttgcagttc caatgttctt + 13561 tttgatttct ggcttttatt catataatat ttcaaagaat aaaatacgga atagaattaa + 13621 aaaaatattt agattgatat taagaagtac atttttttat gtaataatat ttgtatggat + 13681 gttttggaga gaaggtaata tgcagtttat ttttcaaaac tttaatttaa caaatattat + 13741 aagatttgtg atttttaata gaatttcaga tttaataggc tatctagcaa caccgttatg + 13801 gtatttattt gccatactat atatatatat ttacctttat ttttccaata aaagactact + 13861 attgacaaaa cgatggatct ctatactttt actattttct ttcattatgg aagctacaat + 13921 tagcgattca attttttata gaaatttttt atttatggga ataccatttt ttggaatagg + 13981 aattcttatt gcacagaagc aaaaggagat tattaattgt aaaataataa acaaaatatt + 14041 aatcttggga acaattatct atccaatact aatattttta gaatattata tcttgggtaa + 14101 ttcttttgag gtctatataa gttctgtgct agcaaccata atattgatga ttttcgcgat + 14161 taaatcacct aaagcgatta atatcaaaat actgaatgaa attggagata aatatgcgac + 14221 ttttgtttac attatacacc agtttatcat tgtgatattt aaatttttag tatctaatgt + 14281 ttatattctc aaatttggga cgatatttgt ctttttgata tgttgttttc taggggttct + 14341 atttcaattt atcaaaaaca gactattaaa 
aaggtttagt taagatggtt gttttacaaa + 14401 atgttaaatt tttagtaaga gttgttttta tggttattat cagtatagtg ttatggcctg + 14461 ttcggataaa gaagaataag atactattta ttaattttaa tggtaaggga tatggtgata + 14521 atccgaaaag tatttgtgag tatcttcgag ttacatatcc agagttagat ttagtttggc + 14581 ttgcaaaaga taatgaagat tttccagatg gagtgagagt tgtaagatat aaatctctac + 14641 aatcttttta tgagcaagct agttcgaagg tttgggttta taatgtaaga aattttgaaa + 14701 gactactaaa aaaacgcgga cagttttata ttcaaacttg gcacggtgct tctagtttta + 14761 aactgataga aaagcaggct gatttaccat taaaatatat tttagaagca aagtatgatg + 14821 caagagtcac agatataatg atttcagata gcagaaaaca aactgaagaa tttcaaaagt + 14881 atttttggta ttcaggagaa atttttgagg tggggatgcc gagaaatgat gccttgtttc + 14941 actataagga agactacgac aagttaaata atatcagaaa agaactaagc attgattcag + 15001 ataattatgt tattttatat gcccctactt tcagagatga tggggatgca tcttatttag + 15061 atataaattt tgaacggctt ttgcaaagta ttgaacaaga aattaagaag aaatgtaaaa + 15121 ttttaattag attacatcct aatgactctc attttagtaa taatatttct tttaatcatg + 15181 acataattga tgttacgcta ttctcagata tgcaggaact tatattattg gcagatgttt + 15241 tactgacaga ttattcttcc gcgatatttg attttatgct tttaaacaag ccttatgtca + 15301 gatatgtgaa tgatttagaa aaatatgctg agcttagggg ggtatcagat acatattacg + 15361 aattgccgga ttctattatt aaaactgctg aagaattgta tgacttactg cctaaaaaaa + 15421 tagaaaattt tgattatgat tctataaaaa aatatagaaa tgaaatactg tgtccaatct + 15481 ttaatggaac cgctagtgaa aatgtaggaa ggagaataat tcaagagttg tgaagtaaaa + 15541 cattgggtta tttttaaggt aacgagattt gaaaaataat gatttaaaga taggaagtgg + 15601 agctattcat caaatctccg ctacactttc tcaaaataat atttcgggaa agattttata + 15661 ttgtgctgat ccagttgtcg atgacttgta cggttcgata gtacgttcac aaatagagga + 15721 aattggtcgg gtaaaggaag aaagttgcaa ttataatact attgcttatg cgatgaatat + 15781 agcagaaagg actattgcca cagatattga ctgtattgtg ggaatgggag gaggtcgtgt + 15841 tttagatgtc tgcaagtatg catcttttat ttcgaaacgt ccttacctat cgattccgac + 15901 aacagcagca aatgatggca ttgcttcccc agttgctgtt ttgaaaagac aggatgatag + 15961 accaaaaagc ttaggggcgg ctatcccctc 
aatgacacta attgatattg atgttattgc + 16021 atcaggacct atacaaaaca taaaagctgg tatcggtgat acaatatcca attacactgc + 16081 attgaaagat tgggagttgg cagttgagcg agggaaagat gagatgcatg gttttgcata + 16141 tctaatgtcg caaaattctt tagatgcttt aatgaaaacg aagtataatt ctattacccc + 16201 tgattttatt gaagttttgg taaactcttt agttttatca ggcattgcaa tggattttgc + 16261 gggaagtagt agacctgtca gtgggtcaga gcacttattt agtcatgcat tagattacta + 16321 tggttctaca aggaatcttc atggaattca ggttgcatta ggtacagtcg cagttttgaa + 16381 attaattgaa aattctgttg atgctgtggt ggattacttg caaagatttg aggttcatat + 16441 taacccgaaa cttttgggga tagatgaaga gttgtttatt tattgtatgc aacatgctac + 16501 aaaaatgaga agtaatcgct atacttatct gcatgaggtt gatcttagta cagatagatt + 16561 gaaacaaata tataaggaac tcataagcga gttgtagaaa agagagaaaa aaatgaaagc + 16621 acttatttta gcagcagggt taggaacacg tctagcccca attaccaatg aggtaccaaa + 16681 atctttggta ccagtcaatg gtaagccaat tttgatgaaa caaattgaaa atttatatca + 16741 aaataatatt acagatatta cgattattgc tggatataag tcatctgtat taacagatgc + 16801 agttactgaa aagtatccag aaattaatat tattgataat gttgatttta aaacgactaa + 16861 taatatgtat tcagcctatc taggaaaagc tgcaatgggt gatagtgact tcttaatgat + 16921 gaatgcagat gtattttatg atgcttctgt tattaaaagt ctgttgcttc ataaagctcc + 16981 aaatgcaatt gtaactgact taggtactta tattgaagag tctatgaaag tcgtagaaaa + 17041 aaatgggcgt ttagtggaaa tttctaaaca gatttcacct gaggaggctt taggggcttc + 17101 tattgatgtt tataaattct cttatgaagc aggtgcacga ttctttgaaa agtgtaagga + 17161 atttattgaa gataaacgag aacttcaaat gtggagtgag gttgctctta atgcaatcct + 17221 tccagaagtt gagtttatag catgtccatt ggatggccgt tggttagaaa ttgataatca + 17281 tgaagaccta gctgttgcag aaaaactatt tgcttaaacc gaatatggag aatgaaattg + 17341 acaaatagag ttgattattt tggtgctgat attagtgaac ttcagaataa aaaattattc + 17401 ttatttgata tggatggtac catttatgaa gaagatagat tgtttgaggg tactctcgaa + 17461 ttattagact atattcataa tattggcggt gagtatattt ttattacaaa caattcatct + 17521 aagtctgttg ttgactatgt tgaaaaagtt aacagattag gtattaaagc tgaacgagat + 17581 aattttttta cctctgctca agccacaatt 
gtttatatta aagaaaatta tcctaaatct + 17641 aaagtttatt gccaaggaac aaaatctttg ataaaagaac tatctgacgc aggaattgat + 17701 gtaactgagc aagttagtgc tgatatagat gttgttcttg ttggttttga tacagaatta + 17761 accagtgata aaattcgcaa tacctgcgag attctatcaa caaaggacgt acctttcata + 17821 gctactaacc ctgatattcg ctgcccagta tcgtttggat tcatcccaga ttgtggttct + 17881 atttgtgata tgattagtaa atcagtcgat aggaaacctg tttacatagg taaacctgaa + 17941 cctacgatgg ttgatattgt tcgaaaaaaa ttaaattatt ctctatttga aacagttgtg + 18001 attggagatc gcttgtatac ggatatcatg actggtataa atgcaggagt aacttcagtt + 18061 tgtgtgctga caggagaagc aacggtgaat gatattcaac aaggtagtat aaaaccgact + 18121 tatacattta aaaacgtgaa agaaatgtgg aaaggaattg tctgattttt tcattctgaa + 18181 tagtgaattc atgaatactg tcaaaatact cgtatgtatt taaattgatt tcattatttt + 18241 aataatggac aaattaaaat tatttttctc cccaaatcgt tcgtgaacgt aaagtactca + 18301 tcaacaatga tccatcgcca tttattcata ctaacttcat cggaacctat actcttttag + 18361 aagctgctcg taagtatgat attcgcttcc accatgtatc gacagatgaa gtttatgggg + 18421 atctcccttt acgcgaagat ttgccaggtc atggtgaagg accaggtgag aaatttactg + 18481 ctgaaacaaa atacaaccca agctctccgt actcatcaac caaggcagcc tcagatttga + 18541 ttgtcaaagc ctgggtgcgt tcttttggag tcaaggcaac gatttccaac tgttcaaata + 18601 actacggtcc ttatcaacat atcgaaaaat tcatcccacg tcagattact aacatcctaa + 18661 gtggaattaa gccaaaactt tacggtgaag gtaagaatgt tcgtgactgg attcatacca + 18721 atgaccattc ttcaggagtt tggacaatct tgacaaaagg gcaaatcggt gaaacctact + 18781 tgattggggc tgatggtgag aagaacaata aggaagtttt ggaacttatc cttaaggaaa + 18841 tgggacaagc tacggatgcc tatgatcatg tgactgaccg tgcaggacat gaccttcgct + 18901 atgcgattga tgccagcaag ctccgtgatg agttggggtg gaaacctgaa tttaccaact + 18961 ttgaagctgg gctcaaggca acaatcaagt ggtatacaga taaccaagaa tggtggaaag + 19021 cagaaaaaga agctgttgaa gccaattatg ctaagactca ggagattatt acagtgtaaa + 19081 aaccaggaaa tagctgcttt ttattgctat attgggaaga gttacatatt agaaaggtct + 19141 agagatgatt ttaattacag gggcaaatgg ccaattagga acggaacttc gctatttatt + 19201 ggatgaacgt aatgaagaat acgtggcagt 
agatgtggct gagatggaca ttaccaatga + 19261 agaaatggtt gagaaagttt ttgaagaggt gaaaccgact ttagtctacc attgtgcagc + 19321 ctacaccgct gttgatgcag cagaggatga aggaaaagag ttggacttcg ccatcaatgt + 19381 gacggggaca aaaaatgtcg caaaagcatc tgaaaagcat ggtgcaactc tagtttatat + 19441 ttctacggac tatgtctttg acggtaagaa accagttgga caagagtggg aagttgatga + 19501 ccgaccagat ccacagacag aatatggacg cactaagcgt atgggggaag agttagttga + 19561 gaagcatgtg tctaatttct atattatccg tactgcctgg gtatttggaa attatggcaa + 19621 aaacttcgtt tttaccatgc aaaatcttgc gaaaactcat aagactttaa cagttgtaaa + 19681 tgaccagtac ggtcgtccga cttggactcg taccttggct gagttcatga cctacctagc + 19741 tgaaaatcgt aaggaatttg gttattatca tttgtcaaat gatgcgacag aagacacaac + 19801 atggtatgat tttgcagttg aaattttgaa agatacagat gtcgaagtca agccagtaga + 19861 ttccagtcaa tttccagcca aagctaaacg tccgctaaac tcaacgatga gcctggccaa + 19921 agccaaagct actggatttg ttattccaac ttggcaagat gcattgcaag aattttacaa + 19981 acaagaagtg agataagtag tagaatgatt ttctagtcta ataaaagagg cagagaatga + 20041 actccaaagg agcttaagat gtacgattat attattgtcg gtgctggttt gtcaggagca + 20101 atttttgctt atgaggcgac caagcgtgga aaaaaagtaa aagtgattga taaacgtaac + 20161 cacattggtg ggaatatcta ctgtgagaat gtagaaggag ttaatgttca taaatatggt + 20221 gcccatatct ttcatacttc taataagaaa gtttgggatt atgttaatca atttgctgaa + 20281 tttaacaact acgtcaactc gcctgtagct aattacaagg gtagcctcta taatctacct + 20341 ttcaatatga ataccttcta tgctatgtgg gggacaaaaa ctcctcaaga agtcaaagat + 20401 aagattactg agcagacagc tgatatgaag gatgttgagc cgaaaaatct ggaagaacag + 20461 gctatcaagt tgattggtcc agatgtctat gaaaagttaa tcaagggtta tactgaaaag + 20521 cagtggggac gctcagcaac ggaacttcct ccatttatca ttaaacgtct tccagttcgt + 20581 ttaacatttg ataataacta ttttaacgac cgttaccaag gaattcctat tggtggttac + 20641 aatgtcatca tcgaaaatat gcttaaagac gttgaagttg agcttggtgt tgatttcttt + 20701 gctcatcgtg aagagttaga agcatcagct gaaaaagttg tctttacagg gatgatcgac + 20761 cagtattttg actacaagca cggagagtta gaataccgta gccttcgttt tgagcatgag + 20821 attttagacg aggaaaatta tcaaggaaat 
gctgtagtga actatacgga gcgtgagatt + 20881 ccttatactc gtattatcga acacaagcat tttgaatatg gaacgcaggc aaagacagtt + 20941 atcacgcgtg aatatccagc tgactggaag cgtggggacg agccttacta tccgatcaac + 21001 gatgagaaaa ataatgctat gtttgctaag taccaagagg aagcttcaaa gaatgataag + 21061 gttattttct gtggacgttt agcagattat aaatattatg atatgcatgt ggtgattgaa + 21121 cgggcgcttg aggttgtgga gaaagagttt ggatatgaca aaaagtagaa tcaattggat + 21181 agattttgga aaaggctttt ccatattttt agtcttagca gggcatgtgt tgcttggact + 21241 gtatcaatcg gaaaaatttc ccacagcaaa taacatacta tcgttgttga tagcacaagt + 21301 ctacatattt catataccag tattttttgc cttatcagga tactttttca aacctgtgtc + 21361 ggatttgaag gagttctggc aatatgctaa aaagaagaca attgtttttg gtctgccata + 21421 tattttctat tcgatcattc actttggtct tcaaaaagtt gcaggggcat ctgttcgtgt + 21481 tcctacaacc atatctgatt tgctaaatat ctataaattt cctctgggag tttcatggta + 21541 tctatatacg ttatggtcga tattgatagt ttatggttta ctatctgttg ttttcaaaaa + 21601 tcgtaagtcc cttttgttag ttagtgtttt tgcctatatt ttcacactat ttattcaaac + 21661 tgatattttt attgtgcaac ggacgttggt ttgggggatt tgtttctttc ttggcagtgt + 21721 attgagtgaa attcactttg ataaaattaa tttgaaaaaa tttctttttt tctttgtgtt + 21781 atttgatttt atttatatgt tcgcttggtt cttgttttat gaagtagggt ctaagaagga + 21841 ttatgtaagc tatattaacc caggtttgtg ggggattgct tttattgtct gtgtattagt + 21901 tgcttttgcg atttttccta aaatggagaa aaattttcct aaaactttcc tatatttcac + 21961 taaatacggg aaagatagtt tagggatcta tattcttcat gcaccaattt gtagcatgat + 22021 tcggattcta atgttgaaag tgggaataaa ctcagttttt cttcacgttg ttgttgggat + 22081 tgtgctaggc tggtatttat ccatactagc aacttatata ttgaaaaaaa ttccattttt + 22141 gaatattgtt ttattaccac aaaagtatat taaattaaaa taaattattt tagatttata + 22201 atgtggctct ttgtcaacta acatctggag aggacaatca ctgtcttctc tttttttgtc + 22261 ttttcagaat ataccaaatt aacacaaaaa ttctgaaaat tctgttgaca tctttctgaa + 22321 aagagtttat aatggagaga aagttttaaa ggagaaaatg atgaaaagtt caaaactact + 22381 tgcccttgcg ggcgtgacat tattg +// diff --git a/public/res/serotype_genbank/serotype_16A.gb 
b/public/res/serotype_genbank/serotype_16A.gb new file mode 100644 index 0000000..c10288d --- /dev/null +++ b/public/res/serotype_genbank/serotype_16A.gb @@ -0,0 +1,1033 @@ +LOCUS CR931667 21730 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain R105 (serotype 16a). +ACCESSION CR931667 +VERSION CR931667.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 21730) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 21730) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..21730 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="R105" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC16A_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC16A_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI33427.1" + /db_xref="UniProtKB/TrEMBL:Q4JZI8" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVELL" + gene 293..466 + /gene="aliB" + /locus_tag="SPC16A_0002" + /pseudo + CDS 293..466 + /gene="aliB" + /locus_tag="SPC16A_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(459..980) + /gene="tnp" + /locus_tag="SPC16A_0003" + /pseudo + CDS complement(459..980) + /gene="tnp" + /locus_tag="SPC16A_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase (fragment)" + gene 1197..2642 + /gene="wzg" + /locus_tag="SPC16A_0004" + CDS 1197..2642 + /gene="wzg" + /locus_tag="SPC16A_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33430.1" + /db_xref="GOA:Q4K1I6" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K1I6" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VDQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKIIVAIIQKLTST + EVLKNYSSILQGLQDSLQTNMPIETMIDLVNTQLESEGNYKVNSQDLKGTGRMDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1197..1313 + /gene="wzg" + /locus_tag="SPC16A_0004" + /note="Signal peptide predicted for SPC0767 by SignalP 
2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 39 and 40" + misc_feature 1401..1748 + /gene="wzg" + /locus_tag="SPC16A_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 6.7e-65" + misc_feature 1926..2369 + /gene="wzg" + /locus_tag="SPC16A_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 2.2e-69" + gene 2644..3375 + /gene="wzh" + /locus_tag="SPC16A_0005" + CDS 2644..3375 + /gene="wzh" + /locus_tag="SPC16A_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33431.1" + /db_xref="GOA:Q4JZ86" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4JZ86" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTLDALEKLEKKEIPTLNDS + RYALIEFSMHTSYREIHTGLSNILMLGITPVIAHIERYDALENNEKRVCELIDMGCYT + QINSYHVLKPKFFGEKYKFMKKRARYFLERDLVHVVASDMHNLDSRPPHMAEAYDLVT + QKYGEAKAQELFVDNPRKIIMDQLI" + misc_feature 2647..3255 + /gene="wzh" + /locus_tag="SPC16A_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 7.1e-37" + gene 3384..4076 + /gene="wzd" + /locus_tag="SPC16A_0006" + CDS 3384..4076 + /gene="wzd" + /locus_tag="SPC16A_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33432.1" + /db_xref="GOA:Q4K1I4" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K1I4" + /translation="MKEQNTLEIDVLQLFRILWKRKLVILLVAIITSSVAFAYSTFVI + KPEFTSTTRIYVVNRNQEEKSGLTNQDLQAGSYLVKDYREIILSQDVLEEVISDLKLD + LTPKGLANKIKVTVPVDTRIVSVSVNDRVPEEASRIANSLREVAAQKIISITRVSDVT + TLEEARPAISPSSPNIKRNTLIGFLAGGIGTSVIVFLLELLDTHVKRPEDIEDTLQMT + LLGVVPNLSKLK" + misc_feature 3402..3818 + /gene="wzd" + /locus_tag="SPC16A_0006" + /note="HMMPfam hit to 
PF02706, Chain length determinant + protein, score 1.3e-53" + misc_feature 3924..4001 + /gene="wzd" + /locus_tag="SPC16A_0006" + /note="PS00217 Sugar transport proteins signature 2." + gene 4086..4769 + /gene="wze" + /locus_tag="SPC16A_0007" + CDS 4086..4769 + /gene="wze" + /locus_tag="SPC16A_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33433.1" + /db_xref="GOA:Q4JZ84" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4JZ84" + /translation="MPTLEIAQKKLEFIKKAEEYYNALCTNIQLSGDKLKVISVTSVN + PGEGKTTTSVNIARSFARAGYKTLLIDGDTRNSVISGVFKSREKITGLTEFLSGTADL + SHGLCDTNIENLFVIQSGSVSPNPTALLQSKNFNDMIETLRKYFAYIIVDTAPIGIVI + DAAIITQKCDASILVTATGEVNKRDVQKAKQQLEQTGKLFLGVVLNKLDISVDKYGVY + GSYGNYGKK" + gene 4785..6152 + /gene="wchA" + /locus_tag="SPC16A_0008" + CDS 4785..6152 + /gene="wchA" + /locus_tag="SPC16A_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI33434.1" + /db_xref="GOA:Q4K1I2" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K1I2" + /translation="MDEKGLKIFLAVLQSIIVILLVYFLSFVRETELERSSMVILYLL + HFFVFYFSSYGNNFFKRGYLVEFNSTIRYIFFFAIAISVLNFFIAERFSISRRGMVYF + LTLEGISLYLLNFLVKKYWKHVFFNLKNSKKILLLTVTKNMEKVLDKLLESDELSWKL + VAVSVLDKSDFQHDKIPVIEKEKIIEFATHEVVDEVFVNLPGESYDIGEIISRFETMG + IDVTVNLKAFDKNLGRNKQIHEMVGLNVVTFSTNFYKISHVISKRILDICGATIGLVL + FAIASLVLVPLIRKDGGPAIFAQTRIGKNGRHFTFYKFRSMRIDAEAIKEQLMDQNTM + QGGMFKIDNDPRVTKIGRFIRKTSLDELPQFWNVFIGDMSLVGTRPPTVDEYDQYTPE + QKRRLSFKPGITGLWQVSGRSKITDFDDVVKLDVAYIDNWTIWKDIEILLKTVKVVFI + RDGAK" + misc_feature 5568..6149 + /gene="wchA" + /locus_tag="SPC16A_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 5.9e-145" + gene 6156..6557 + /gene="gct" + /locus_tag="SPC16A_0009" + CDS 
6156..6557 + /gene="gct" + /locus_tag="SPC16A_0009" + /note="member of homology group 28" + /codon_start=1 + /transl_table=11 + /product="CDP-glycerol-1-phosphate biosynthetic protein + Gct" + /protein_id="CAI33435.1" + /db_xref="GOA:Q4K1I1" + /db_xref="InterPro:IPR004820" + /db_xref="InterPro:IPR004821" + /db_xref="InterPro:IPR006409" + /db_xref="InterPro:IPR014729" + /db_xref="UniProtKB/TrEMBL:Q4K1I1" + /translation="MKKVITYGTFDLLHYGHINLLKRAKSLGDYLIVVISTDEFNWNE + KQKKCYFTYEQRKTLVEAVRYVDLVIPEESWEQKVTDVHEYHIDTFVMGDDWKGKFDF + LEKEGVEVVYLSRTPEISTTEIKNSLATREY" + misc_feature 6168..6536 + /gene="gct" + /locus_tag="SPC16A_0009" + /note="HMMPfam hit to PF01467, Cytidylyltransferase, score + 5.2e-28" + gene 6580..7401 + /gene="wcxR" + /locus_tag="SPC16A_0010" + CDS 6580..7401 + /gene="wcxR" + /locus_tag="SPC16A_0010" + /note="member of homology group 151" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="CAI33436.1" + /db_xref="GOA:Q4K1I0" + /db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4K1I0" + /translation="MTDELERLHNLELLLASEVLKICGKYNLKIVMLAGTFLGAIRHN + GFIPWDDDMDFGMPREDFERFKELCVSDLDREKYFLQTDQTDLNYPFNFVKLRLNNTH + VSEEFSLDANVHDGIYIDIFPIDNICPKPFRRFIQLKGFWLFRNLLWIKCGYGDNDRK + KRLAYKLAKLATHVFSISFLKKMKEKCILLGQSTNADNVVVSDGSYGIKKETFPKVWL + DEVESYSFDDIKLWGMKNYRAYLKHMYGDYMQLPPENQRNHHKRIKIDFGPYVEK" + misc_feature 6646..7317 + /gene="wcxR" + /locus_tag="SPC16A_0010" + /note="HMMPfam hit to PF04991, LICD Protein Family, score + 5.1e-39" + gene 7416..7880 + /gene="wchJ" + /locus_tag="SPC16A_0011" + CDS 7416..7880 + /gene="wchJ" + /locus_tag="SPC16A_0011" + /note="member of homology group 26" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase enhancer" + /protein_id="CAI33437.1" + /db_xref="GOA:Q4K1H9" + /db_xref="InterPro:IPR013969" + /db_xref="UniProtKB/TrEMBL:Q4K1H9" + /translation="MSKKEIKLCLVGSSGGHLNHLYLLKPFWQDKDRLWITFDKEDAR + SILSNEKCHYCYYPTNRNIKNLIKNTFLALRILYKERPDVIISSGAAVAIPFFYLGKI 
+ FGAKTVYIEVFDRVDAPTMTGKIVYPVTDRFIVQWEEMKKIYPKAINLGGIF" + gene 7880..8359 + /gene="wchK" + /locus_tag="SPC16A_0012" + CDS 7880..8359 + /gene="wchK" + /locus_tag="SPC16A_0012" + /note="member of homology group 27" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33438.1" + /db_xref="GOA:Q4K1H8" + /db_xref="InterPro:IPR007235" + /db_xref="UniProtKB/TrEMBL:Q4K1H8" + /translation="MIFVTVGTHEQQFNRLIKEIDELKAEGVITSDVFIQVGFSDYQP + RFCRWERFLSYDEMNNLMEEADIVITHGGPATFMNVIANGKRPVVVPRRKKFGEHVND + HQLDFCNRIVQEGYDLVVIEDIKKIREYLNPSSSIAVKSNNECFVQHFSNLIAELVE" + misc_feature 7880..8350 + /gene="wchK" + /locus_tag="SPC16A_0012" + /note="HMMPfam hit to PF04101, Glycosyltransferase family, + score 5.6e-45" + gene 8352..9485 + /gene="wcyK" + /locus_tag="SPC16A_0013" + CDS 8352..9485 + /gene="wcyK" + /locus_tag="SPC16A_0013" + /note="member of homology group 116" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33439.1" + /db_xref="GOA:Q4K1H7" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K1H7" + /translation="MSKNDEEHRRRHLMKILHIPTGGLFSDGIGTFIYSYLEYMDLSE + IEVTILATNKPLLEDKLKFQVLGVQIVEIERKKSSILAYMREFLELLKVGKYDVVHVH + GSSALMSIELFIAKIMGVPVRIAHSHNTTCNHILLDRMLRPFFYTLYTQSWACGEKAG + EWLFKDKRFKVIHNARDVEKYSFNPHLRRVFRTTHSLKENTLALGHVGRFNIQKNHTF + LLDLMDEMKCKQKDVKLFLVGEGEKVEDVKRYVKERKLEDSIVFLNRYSDMQSFISAM + DIMLLPSLYEGLPLVAIEWQINGIQSILSTTISDECIFTNSIQQLPIDNVSTWIKKAI + EDFSYINRLEKSRENIDLAQKSNYDIRIEAKKLEHEYKKLIGE" + misc_feature 8913..9401 + /gene="wcyK" + /locus_tag="SPC16A_0013" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 1.6e-08" + gene 9493..10419 + /gene="wcxS" + /locus_tag="SPC16A_0014" + CDS 9493..10419 + /gene="wcxS" + /locus_tag="SPC16A_0014" + /note="member of homology group 104" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33440.1" + /db_xref="GOA:Q4K1H6" + /db_xref="InterPro:IPR001173" + 
/db_xref="UniProtKB/TrEMBL:Q4K1H6" + /translation="MNISIVLSTFNGDEYIVEQLDTLRNQTRLAEEVLISDDASTDDT + VQIIEDYIAKYKLDNWSIKKNKENQGWKNNFAMLLEEAKGDIVFLCDQDDIWHLDKIQ + KMSKIMENNDKILLLASNYTPFYVGDGVKIKLDKSDLDNSEAVYQPNFLDNFFHIRRP + GCVYAVNKKIIPYFLEIRSNEDAHDALLWRLASFLNGLYIYSYSTIDFRRHDSNATGS + RERSFLRRKEQVIYYDDLLQRLDKFSKQHDLSLSNEQISVLNDYILWGKNRRELFMKR + NVFIFFKLFKYHKLYWSFRSYITDFIVLYMKE" + misc_feature 9502..10014 + /gene="wcxS" + /locus_tag="SPC16A_0014" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 1.7e-29" + gene 10435..11640 + /gene="wzy" + /locus_tag="SPC16A_0015" + CDS 10435..11640 + /gene="wzy" + /locus_tag="SPC16A_0015" + /note="member of homology group 152" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33441.1" + /db_xref="UniProtKB/TrEMBL:Q4K1H5" + /translation="MLVKVKGGFKVSLSRVKTDVKLNEFLFGLAFYPWLIAWLFTSTF + YKDFIHPYGIIKTWEYVGLFFLLFKFMLGKSKIKSIIITPIILLIGFIVSYDNGNASF + VAYTLTLIYSSRDINFRNLVRNTMFCQIGVVGTVIVSSLLGIIPNELALTYSEGVIRS + RYGLGFHYTSFTPNYFLSILLEYVYLKGEKYWTIKELFICVLLNIVIYKYTDTRLTFI + MVFILLLISFSRRFVSINMNFKFLKYLLTLIYPIMAYMTYWLTAKFDSRNSLLSLINN + LLSQRLRFGQEGLRRYPLRLFGTHIQWDASANSYLYVDSSYINILISYGTIIFFLTLI + SYSIIMKKVIINQNKTLLIVLIFWSVRACIDPQLFLLWFNPFLFLIARTFLDEREEIG + DDITYMCIE" + gene 11612..12340 + /gene="wcxT" + /locus_tag="SPC16A_0016" + CDS 11612..12340 + /gene="wcxT" + /locus_tag="SPC16A_0016" + /note="member of homology group 153" + /codon_start=1 + /transl_table=11 + /product="hypothetical protein" + /protein_id="CAI33442.1" + /db_xref="UniProtKB/TrEMBL:Q4K1H4" + /translation="MISLICVSNNYDKLNTILKSSLSRQKDVNYELIIVDSNKYGFNS + AAEALNFGGKQAKGDYLFFVHQDISFQDDFELAKLESYCRNSIFGVAGVAGVKNIEGK + VVSFSNIFHGDPKTKAAGKSISAPVEVDAIDECLIIIPKKVFSTNQFSIIGPTWHLYG + TDYALQMKLINSPVLVFPSELWHVSDGKSLNLNYFDAIQWLLKKYSKNYSVIYTFFGV + WPSNPILLKFKCLYRKLRFYIKGV" + gene 12340..13095 + /gene="wciB" + /locus_tag="SPC16A_0017" + CDS 12340..13095 + /gene="wciB" + /locus_tag="SPC16A_0017" + /note="member of homology 
group 16" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33443.1" + /db_xref="GOA:Q4K1H3" + /db_xref="UniProtKB/TrEMBL:Q4K1H3" + /translation="MEVKLYVATHKSYNQVQDQDLYIPILVGADKNIGEKNYLRDNQG + DNNISDRNFTFCELTGLYWIWKNSKDDIVGLCHYRRYFGKNKRFLKQNSILKKNDILK + QLNDYDVILPSKSMNEYNGYTAEEFFNKNHDHKVWEMCRQIISENNKDYLDAFNWFSK + EKTGYCYNMFIMSREMMDEYCSWLFPILFELDKKIDYSRYDSYNTRMIGFVAERLINV + WVHKKQLTVKEFPVFSTEEPGFLQRIQKKLFNK" + gene 13214..14629 + /gene="wzx" + /locus_tag="SPC16A_0018" + CDS 13214..14629 + /gene="wzx" + /locus_tag="SPC16A_0018" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33444.1" + /db_xref="GOA:Q4K1H2" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K1H2" + /translation="MKILKNYVYNLLYQILVVVLPIITTPYITRIFSSQELGDYGYYS + SIVTYFILLATLGVANYGTKVISGHRNEINKNFWGIYSLQLGATILSISLYCIFCVNL + PPMQNPVAYILGLSLVSKGLDISWLFQGLEDFRKITVRNITVKLIGVISIFLFVKSTN + DLYLYVFLLTIFELLGQLSMWLPARGFIGKPHVDLEYARYHLKPIILLFLPQIAISLY + VTLDRTMLGALSSTKDVGIYDQALKLVNILLTLVTSLGSVMLPRVANLLATGDHRAVN + KMHEMAFLIYNLVIFPIISGMLIVNDDFVQFFLGQDFQDARYAIAIMIFRMFFIGWTN + IMGIQILIPHNKNKEFMVSTTAPAIISVGLNLLFLPKLGYIGAAIVSVLTEALVWAIQ + LYFTRKYLKEVSIIGSMTKIILASAIMYGILLGSKTFIQFSPTINVLAFAVFGGLIYL + FAILSLKVVDVKELKQMIRKK" + misc_feature 13220..14014 + /gene="wzx" + /locus_tag="SPC16A_0018" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 4.3e-68" + gene 14631..15629 + /gene="wciG" + /locus_tag="SPC16A_0019" + CDS 14631..15629 + /gene="wciG" + /locus_tag="SPC16A_0019" + /note="member of homology group 21" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI33445.1" + /db_xref="GOA:Q4K1H1" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q4K1H1" + /translation="MHKTRNINLELLKVLACVGVVLLHTTMGGFKEIGSWNLLTYLYY + LGTYSIPLFFMVNGYLLLGKREITYPYILHKVKWILITVLSWTLIVWFLKRDFTVNPV + 
KKLIGSLVQKGYFFQFWFFGSLILIYLCLPILKKILNSKRRYFYILSLLVVIGLIFEL + INYSLKMPVQFYIIQTFRLWTWLFYYLLGGFIAHFDIDIIKNRFKRWMKLVVVLLFLI + SPLILFFIAKTAYHNLFAEYFYDILFVKVVSLGIFLTILTLTLNEKRSECIVSLSNQT + MGVFIIHTYIMKIWEKLFGFSFVGSYLLFAIFTLSVSFIIVGMLMKIPYFNRIVKL" + gene 15644..16744 + /gene="glf" + /locus_tag="SPC16A_0020" + CDS 15644..16744 + /gene="glf" + /locus_tag="SPC16A_0020" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI33446.1" + /db_xref="GOA:Q4K1H0" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR006076" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K1H0" + /translation="MYDYLIIGAGLSGAIFAHEATKRGKKVKVIDKRDHIGGNIYCEN + VEGINVHKYGAHIFHTSNKKVWDYVNQFVEFNNYINSPVANYKGSLYNLPFNMNTFYA + MWGTKTPQEVKDKIAEQTAGMKDVEPKNLEEQAIKLIGPDIYEKLIKGYTEKQWGRSA + TELPPFIIKRLPVRLTFDNNYFNDRYQGIPIGGYNVIIENMLKDVEVELGVDFFAHRE + ELEASANKVVFTGMIDQYFDYKHGELEYRSLRFEHEILDEENYQGNAVVNYTEREIPY + TRIIEHKHFEYGMQPKTVITHEYPADWKRGDEPYYPINDEKNNAMFAKYQEEAAQNDK + VIFCGRLADYKYYDMHVVIERALEVVEKEFSN" + misc_feature 16079..16681 + /gene="glf" + /locus_tag="SPC16A_0020" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 5.3e-139" + gene 16771..17640 + /gene="rmlA" + /locus_tag="SPC16A_0021" + CDS 16771..17640 + /gene="rmlA" + /locus_tag="SPC16A_0021" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI33447.1" + /db_xref="GOA:Q4K1A5" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q4K1A5" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLHRFQELLQDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFISDDSV + ALILGDNIYHGSGLSKMLQKAASKESGATVFGYHVKDPERFGVVEFDQDMKAISIEEK + PEQPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVELMGRG + 
FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLTLAQPLKKN + EYGQYLLRLIGEA" + misc_feature 16774..17490 + /gene="rmlA" + /locus_tag="SPC16A_0021" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 4.9e-120" + gene 17641..18234 + /gene="rmlC" + /locus_tag="SPC16A_0022" + CDS 17641..18234 + /gene="rmlC" + /locus_tag="SPC16A_0022" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI33448.1" + /db_xref="GOA:Q7BTQ6" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:Q7BTQ6" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKHHPLLKDVKPLKKEDL" + misc_feature 17677..18207 + /gene="rmlC" + /locus_tag="SPC16A_0022" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 8.8e-16" + gene 18247..19296 + /gene="rmlB" + /locus_tag="SPC16A_0023" + CDS 18247..19296 + /gene="rmlB" + /locus_tag="SPC16A_0023" + /EC_number="4.2.1.46" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI33449.1" + /db_xref="GOA:Q4K121" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K121" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPGVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQATD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 18262..19218 + /gene="rmlB" + /locus_tag="SPC16A_0023" + /note="HMMPfam 
hit to PF04321, RmlD substrate binding + domain, score 7.1e-05" + misc_feature 18265..19101 + /gene="rmlB" + /locus_tag="SPC16A_0023" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.0039" + misc_feature 18265..19005 + /gene="rmlB" + /locus_tag="SPC16A_0023" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 2.7e-76" + misc_feature 18268..19080 + /gene="rmlB" + /locus_tag="SPC16A_0023" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 1.6e-05" + gene 19362..20213 + /gene="rmlD" + /locus_tag="SPC16A_0024" + CDS 19362..20213 + /gene="rmlD" + /locus_tag="SPC16A_0024" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI33450.1" + /db_xref="GOA:Q4K1G6" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K1G6" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITNEEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 19362..20210 + /gene="rmlD" + /locus_tag="SPC16A_0024" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 4e-147" + misc_feature 19365..20006 + /gene="rmlD" + /locus_tag="SPC16A_0024" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.00013" + misc_feature 19365..19994 + /gene="rmlD" + /locus_tag="SPC16A_0024" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 9.9e-19" + misc_feature 19368..20096 + /gene="rmlD" + /locus_tag="SPC16A_0024" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 2.9e-08" + gene order(20276..20743,20861..21166,21228..21449) + /gene="glf" + /locus_tag="SPC16A_0025" + 
CDS join(20276..20743,20861..21166,21228..21449) + /gene="glf" + /locus_tag="SPC16A_0025" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI33451.1" + /db_xref="GOA:Q4K1G5" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K1G5" + /translation="MYDYLVVGAVFAHEAALEGKKVKVIEKRNHIAGNIYTREEEGIQ + VHQYGAHIFHTSDKEIWDYVNQFAEFNRYTNSPVANYKGEIYNLPFNMNTFNKLWGVV + TPAEVQAKIDEQRAILNGKTPENLEEQAISLVGTDIYEKLIKDYTEKQWGQTNYMLDH + ENIDVETNVDFFVNKEQYLKDFPKIVFTGMIDEFFDYKLGELEYRSLRFENETLDMEN + YQGNAVVNYTDAETPYTRIIEHKHFEFGSQAKTIITNRTFLYKSYKKLADEQGNVIFG + GRLGHYRYYDMHQVIGAALQCVRNELDSYSMKIKEQTRKLAAGCSKHCFEVADGS" + misc_feature join(20696..20743,20861..21166,21228..21305) + /gene="glf" + /locus_tag="SPC16A_0025" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 9.6e-40" + gene 21683..>21730 + /gene="aliA" + /locus_tag="SPC16A_0026" + CDS 21683..>21730 + /gene="aliA" + /locus_tag="SPC16A_0026" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33452.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ89" + /translation="MMKSSKLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcgta taaaaacaag + 181 ggatgactgt ataaaagaca gaaatccttt gttttttata accaaggttt ataaactttc + 241 attcttgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga agacgaacat + 301 aaagaagcgt atccttagtg caggcctgac ttttacatct gctttgcttt tagctgcttg + 361 cgaccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaactat ctattagact attacgctga taatatagtc aattgaaaca agagaaagac + 481 aaaagagcct cgtaaaaggt attgcaactt ggtaatacct ttttgaggtg ctttttgata + 541 tgagcccatg ttttctcaat aggattgtac tcaggcgagt agggaggaag atgtaaaagt + 601 tcatgcccaa actcttcaca caagagttct aacttaccca 
ttctatggaa tcttgcatta + 661 tccataataa caaccgatgg tgtggttaat gttggtaaga gaaatttctg aaaccaagct + 721 tcaaaaaagt cgctcgtcat cgtctcttcg taagtcattg gagcgattaa ctcaccattg + 781 gttagacctg caaccaaaga aatcctctga tatcttcttc cagatacttt gcctcttatt + 841 aactgacctt ttaatgagcg accatattct cgataaaaat aagtatcgaa tcctgtttcg + 901 tcaatctaaa caggtgctag gtgctttaaa ctattaaaat tcttaagaaa taaggctact + 961 ttttctgggt cttgttcata attagattga aactagaata gtacacctct acttctaaaa + 1021 cattgttaga aatcgatttg tcatgttctt atttcatttt actatatttt tgtttcgcgg + 1081 gaagtctact aagatactta aagatgcaga tagaagatgc agatagtaaa aaaaatgtag + 1141 acattaccgt aaaaaagtga tataatcgta tgatgttcaa ggtataggtg ttaatcatga + 1201 gtagacgttt taaaaaatca cgttcacaga aagtgaagcg aagtgttaat atcgttttgc + 1261 tgactattta tttattgtta gtttgttttt tattgttctt aatctttaag tacaatatcc + 1321 ttgcttttag atatcttaac ctagtggtaa ctgcgttagt cctactagtt gccttggtag + 1381 ggctactctt gattatctat aaaaaagctg aaaagtttac tatttttctg ttggtgttct + 1441 ctatccttgt cagctctgtg tcgctctttg cagtacagca gtttgttgga ctgaccaatc + 1501 gtttaaatgc gacttctaat tactcagaat attcaatcag tgtcgctgtt ttagcagata + 1561 gtgatatcga aaatgttacg caactgacga gtgtgacagc accgactggg actgataatg + 1621 aaaatattca aaaactacta gctgatatta agtcaagtca gaataccgat ttgacggtcg + 1681 accagagttc gtcttacttg gcagcttaca agagtttgat tgcaggggag actaaggcca + 1741 ttgtcttaaa tagtgtcttt gaaaatatca tcgagtcaga gtatccagac tacgcatcga + 1801 agataaaaaa gatttatacc aagggattca ctaaaaaagt agaagctcct aagacgtcta + 1861 agaatcagtc tttcaatatc tatgttagtg gaattgacac ctatggtcct attagttcgg + 1921 tgtcgcgatc agatgtcaat atcctgatga ctgtcaatcg agataccaag aaaatcctct + 1981 tgaccacaac gccacgtgat gcctatgtac caatcgcaga tggtggaaat aatcaaaaag + 2041 ataaattaac ccatgcgggc atttatggag ttgattcgtc cattcacacc ttagaaaatc + 2101 tctatggagt ggatatcaat tactatgtgc gattgaactt cacttctttc ttgaaaatga + 2161 ttgacttatt gggaggggta gatgttcata atgatcaaga gttttcagct ctacatggga + 2221 agttccattt cccagtaggg aatgtccatc tggactctga gcaggctcta ggttttgtac + 2281 
gtgaacgcta ctcactagcc gatggagacc gtgaccgtgg tcgcaaccaa caaaagatca + 2341 ttgtagcaat tattcagaag ttaacttcta cagaggtttt gaaaaactat agtagtattc + 2401 ttcaaggatt gcaggattct cttcaaacaa atatgccgat tgagactatg atagatttag + 2461 tgaatactca gttggaaagt gaggggaatt ataaagtaaa ttctcaagat ttaaaaggga + 2521 caggtcggat ggatcttcct tcttatgcaa tgccagacag taacctctat gtgatggaaa + 2581 tagatgatag tagtttagct gtagttaaag cagctataca ggatgtgatg gagggtagat + 2641 gaaatgatag acattcattc gcatatcgtt tttgatgtag atgacggtcc caagtcaaga + 2701 gaggaaagca aggctctctt ggcagaatcc tacaggcagg gggtgcgaac cattgtctct + 2761 acctctcacc gtcgcaaggg catgtttgaa actccggaag agaagatagc agaaaacttt + 2821 cttcaggttc gggaaattgc aaaagaagta gcagatgatt tagtcattgc ttatggcgca + 2881 gagatatact atactctgga tgctctagaa aagctagaaa aaaaagaaat tcctaccctt + 2941 aatgatagtc gttatgcttt gattgagttt agcatgcata cttcctatcg tgagattcat + 3001 acgggattga gcaatatttt gatgttggga atcacgccag taattgctca tattgaacgt + 3061 tatgatgctt tagagaataa tgaaaaacgt gtttgtgaac tgattgatat ggggtgctat + 3121 actcagataa atagttatca tgttttaaaa cctaagttct ttggtgaaaa atataaattc + 3181 atgaaaaaga gagctcggta ttttttggaa cgtgatttag ttcatgtagt tgcaagtgac + 3241 atgcacaatt tagacagtag acctcctcat atggcagaag catatgacct tgttacccaa + 3301 aaatacggag aagcgaaggc tcaggaactt tttgtagata atcccagaaa aattataatg + 3361 gatcaattaa tttaggagaa aatatgaagg aacaaaacac tttggaaatc gatgtattgc + 3421 aactattcag aattttatgg aaaagaaagt tggtcatttt attagtggca attataactt + 3481 cttcagttgc ttttgcctac agtacttttg ttatcaaacc tgagtttact agtacgactc + 3541 ggatttatgt agttaaccgt aatcaggaag agaagtctgg tttaaccaat caagacttgc + 3601 aggcaggatc atacttggtt aaagactatc gtgaaattat cctatcgcag gatgttttgg + 3661 aggaagttat ttctgatttg aaattagatt tgacgccaaa aggtttggct aataaaatta + 3721 aagtaacagt accagttgat acccgtattg tctctgtttc agttaatgat cgagttcctg + 3781 aagaggcaag ccgtatcgct aactctttga gagaagtagc tgctcaaaaa attatcagta + 3841 ttactcgtgt ttctgatgtg acaacactgg aggaggcaag accggcgata tcaccatctt + 3901 cgccaaatat taaacgcaat 
acactaattg gttttttggc aggggggatt ggaactagtg + 3961 ttatagtttt tcttcttgaa cttttggaca ctcatgtgaa acgtccggaa gatatcgaag + 4021 atacactgca gatgacactt ttgggagttg taccaaactt gagtaagttg aaataggaga + 4081 gaggaatgcc gacattagaa atagcacaaa aaaaactgga gttcattaag aaggcagaag + 4141 aatattacaa tgccttgtgt acaaatatac agttgagcgg agataaacta aaagtaattt + 4201 ccgttacttc tgttaaccct ggggaaggaa aaacaactac ttccgtaaat atagcaaggt + 4261 cgtttgcgcg tgcaggctat aaaactcttt tgatcgatgg cgatactcga aattcagtta + 4321 tatcaggagt ttttaaatcg cgtgaaaaaa ttacagggct aacagaattt ttatctggga + 4381 cagctgattt atctcacggt ttatgtgata caaatattga aaatttattt gtaattcaat + 4441 cgggatctgt atcaccaaac cctacagcct tgttacaaag taaaaatttt aatgatatga + 4501 ttgaaacatt gcgtaaatat tttgcttata tcattgttga tacagcacct attggaattg + 4561 ttattgatgc ggcaattatc actcaaaagt gtgatgcgtc catcttggta acagcaacag + 4621 gtgaggtgaa taaacgtgat gtccaaaaag cgaaacaaca attagaacaa acagggaaac + 4681 tgttcctagg agttgtttta aataaattgg atatctcggt tgataagtat ggagtttacg + 4741 gttcctatgg aaattatggt aaaaaataac ttaggaaata ttttatggat gaaaaaggat + 4801 tgaaaatttt tctggcagta ttacagagta taattgtcat tttattggtt tattttctta + 4861 gctttgttag agagacagaa cttgaacgtt cttcgatggt tatactatac cttctccact + 4921 tttttgtatt ctattttagt tcctatggta acaatttttt taaaagaggg tacttagttg + 4981 agtttaatag tactataaga tatatttttt tctttgcaat agctataagt gtattaaact + 5041 tttttatagc ggaacggttt agtatctcta gaagaggaat ggtatacttc ttaactttag + 5101 aaggaatatc cttatacttg ttaaatttct tagtaaagaa atattggaag catgtgtttt + 5161 ttaatctaaa aaatagcaag aaaattttac tgttaacagt aacgaaaaat atggaaaaag + 5221 ttcttgataa attgctagaa tctgatgaac tttcatggaa attggtagca gtaagtgttt + 5281 tggataaatc tgattttcaa catgataaaa tacctgtaat tgaaaaggaa aaaattattg + 5341 aatttgcaac gcatgaagtt gtggatgagg tgtttgtcaa tcttccagga gagagctacg + 5401 atattggaga aattatctct aggtttgaga caatggggat agatgtaact gtaaatctta + 5461 aagcatttga taagaatttg ggtcgcaata aacaaattca tgagatggta ggattgaatg + 5521 tagtcacttt ctctacaaat ttttataaaa ttagtcatgt 
gatttcaaag agaattctcg + 5581 atatttgtgg tgccactatt ggccttgttc tttttgctat agctagtcta gttttagttc + 5641 cattgattcg taaagatggc ggaccagcta tttttgctca aactcgtata gggaaaaatg + 5701 gtcgacattt taccttttat aaattccgtt cgatgcggat cgatgctgaa gctatcaaag + 5761 aacaattgat ggatcaaaat acgatgcaag gtggtatgtt taagattgac aatgatcctc + 5821 gtgttacaaa aattggtcgc tttattcgta aaaccagttt ggatgaattg ccgcagtttt + 5881 ggaatgtctt tataggagat atgagtttgg tgggaacacg tccacctaca gtagacgagt + 5941 atgatcagta tactccagaa cagaaacgtc gactcagctt taaacctggt attacaggtt + 6001 tatggcaggt tagcggccgt agtaaaataa ccgattttga cgatgttgta aaattagatg + 6061 tggcttatat tgataattgg acaatctgga aagatattga aattttgcta aaaactgtta + 6121 aagttgtatt tataagagat ggagcgaagt aaataatgaa aaaagttata acatatggaa + 6181 catttgattt gttgcactat ggtcatatta atcttcttaa aagggctaaa tcgttaggcg + 6241 attatttaat tgttgtgatt tccactgacg aattcaactg gaatgaaaaa caaaaaaaat + 6301 gttattttac atatgaacaa agaaaaacac tcgtagaggc tgttaggtat gttgatttag + 6361 taatacctga agaatcatgg gaacaaaaag tgacagatgt ccatgaatat cacatagata + 6421 cctttgtcat gggagatgat tggaagggga aatttgattt tttagagaag gaaggagttg + 6481 aagtggtcta tttatcacgg actcctgaaa tcagtacaac tgaaattaag aattcattgg + 6541 caaccagaga atattaaaaa cggagtttaa gataaatata tgacagatga attagaacgg + 6601 ttacataact tagaactttt gttagcttca gaagtgttaa aaatatgtgg aaaatataat + 6661 ttaaaaatcg tgatgctagc aggaactttt ctaggggcta tacgccataa tggattcatc + 6721 ccgtgggacg atgatatgga ttttggtatg ccaagagagg attttgaaag atttaaagaa + 6781 ttatgtgttt cggatttgga cagggaaaaa tattttctac agacagatca aacagatttg + 6841 aattatccat ttaattttgt gaaactacgt ctcaataata cacatgtttc tgaggaattt + 6901 tctttagatg caaatgttca tgatggaatt tatattgata tttttccgat tgataatatc + 6961 tgtcccaagc cttttagacg attcattcaa cttaaaggat tttggttatt ccgaaatcta + 7021 ttatggataa aatgtggata tggggacaac gatagaaaaa aacgattagc gtataaacta + 7081 gctaagcttg ccacacatgt gttctcaata tcttttttga aaaagatgaa ggagaagtgt + 7141 atattactag ggcagagtac caatgctgat aatgtagtgg ttagtgatgg tagttatgga + 7201 
ataaagaaag aaacttttcc aaaagtgtgg ttagacgaag ttgaaagtta ttcctttgat + 7261 gatataaaat tatggggaat gaagaattat agagcatact taaaacatat gtatggtgac + 7321 tatatgcagc ttccacctga gaatcaacga aatcatcaca aacgaattaa aattgatttt + 7381 ggcccatacg tggaaaaata ggagaattta taactttgtc taaaaaagag ataaaacttt + 7441 gtctagtagg atctagcggt gggcatttaa atcatctcta tctattgaaa ccattttggc + 7501 aggataaaga tagactatgg attacttttg ataaagaaga tgctcgaagt attttatcaa + 7561 atgaaaaatg tcattattgc tattatccga ctaatcgtaa tataaaaaat ctaataaaaa + 7621 atacatttct tgctttaaga atattatata aagaaaggcc agatgttatc atttcatccg + 7681 gagcagcggt tgcaataccg ttcttttatt taggtaaaat atttggtgct aaaactgttt + 7741 atatagaagt atttgatcgt gtagacgctc caacaatgac tggcaaaata gtataccctg + 7801 ttacagatag attcattgtc caatgggaag aaatgaaaaa aatctatccc aaggcaatca + 7861 atttgggagg aattttctaa tgatttttgt aactgtcggt acgcatgagc aacaatttaa + 7921 tagactaata aaagagattg atgaattgaa agcagaggga gttattacgt cggatgtatt + 7981 tatccaagtt ggtttttcag actatcaacc tcgattttgt agatgggaac gttttctttc + 8041 gtatgatgag atgaataacc taatggaaga agcggatata gttattactc atggtggtcc + 8101 tgctacattt atgaatgtta ttgctaatgg gaaaagacca gtagttgttc cgagaagaaa + 8161 aaaatttgga gaacatgtga atgaccatca gttagatttt tgtaatagga ttgttcagga + 8221 gggatatgat ttagtagtca tagaggatat taaaaaaatc cgagaatacc tgaatccatc + 8281 tagtagtatt gccgttaaat ctaataatga atgctttgta caacattttt caaatttgat + 8341 tgcagaatta gttgagtaaa aatgacgaag agcatagaag gagacacttg atgaaaattt + 8401 tgcatattcc aacaggaggt ttgttttctg atgggattgg aacatttata tattcatacc + 8461 tcgaatacat ggacttgagt gaaattgaag tgacgattct agctaccaat aaaccgttgt + 8521 tagaagataa attaaaattt caagtattag gtgttcagat tgtagaaatt gaaagaaaga + 8581 aatcctcaat actggcatat atgagagaat tccttgaact cttaaaagta ggaaaatacg + 8641 atgttgtaca tgttcacggg agtagtgctc ttatgtcaat tgaattgttt atagcaaaaa + 8701 ttatgggagt tcctgtaaga atagcgcata gtcataatac aacgtgtaat catattctac + 8761 tagacagaat gttacgtcct tttttttaca ctttatatac tcaatcttgg gcgtgtggtg + 8821 aaaaggcagg agaatggctt 
tttaaggata aacgatttaa agttatacat aatgccaggg + 8881 atgtagaaaa atatagtttt aatcctcatc ttcgccgagt atttcggaca acacattcat + 8941 taaaagaaaa tacacttgca ttaggacatg taggcagatt caatattcaa aaaaatcata + 9001 catttcttct ggatttaatg gatgaaatga aatgtaagca gaaggatgta aaattgtttt + 9061 tggtcggtga aggagaaaaa gtagaagatg ttaagagata tgtaaaagaa cgaaaattag + 9121 aagattcaat tgtttttttg aatcggtatt cggatatgca atcgtttatt tctgctatgg + 9181 atataatgtt attaccgagt ttatacgagg ggttaccttt agttgctatt gagtggcaaa + 9241 ttaatggaat tcaatctatt ctttcaacga caatttctga tgagtgcatc ttcacaaaca + 9301 gtatccaaca attaccaatt gacaacgtaa gtacttggat aaaaaaagct attgaagatt + 9361 tttcatatat aaacagattg gaaaaatcta gagaaaatat tgacctagct caaaaatcaa + 9421 actatgatat caggattgag gctaaaaaat tagagcatga gtataaaaag ttgattgggg + 9481 agtaagaata caatgaatat atcaattgta ttatcaacat ttaatggtga tgaatatatt + 9541 gttgaacagt tagatactct aagaaatcaa acgcgccttg ctgaggaagt cttgattagt + 9601 gatgatgcat ctacagatga tactgttcaa ataattgaag attatattgc taaatataag + 9661 ttggataatt ggtctataaa aaaaaataaa gagaatcaag gatggaagaa taattttgcc + 9721 atgttattag aggaggcgaa aggagatatc gtttttcttt gtgatcaaga tgatatttgg + 9781 catttagata aaattcaaaa aatgtctaag attatggaaa ataatgataa aattttgttg + 9841 ttagcctcta attacacacc tttttatgtt ggtgatggtg tcaagattaa attggataaa + 9901 agtgatttgg ataatagtga ggcagtgtat caaccaaatt ttttagataa cttctttcat + 9961 attagaaggc cagggtgtgt ttatgcggtg aacaaaaaga ttattccata ttttttagaa + 10021 atccgaagta acgaagatgc acatgatgcc ttgttatgga ggctagcttc gtttcttaat + 10081 gggttataca tttactccta ctctactata gattttagaa gacacgatag caacgcgact + 10141 ggtagcagag aaagaagttt cctaaggaga aaagagcaag ttatttatta tgatgatttg + 10201 cttcagagat tagataaatt tagtaaacaa catgatttat cactttcaaa tgaacaaatt + 10261 agtgttttga acgactacat tctatgggga aaaaatcgaa gagaattgtt tatgaaaagg + 10321 aatgtattta tattttttaa attatttaaa tatcataagt tgtattggtc gttcaggtca + 10381 tatattactg attttatagt gttatatatg aaggagtaat tctagtaatg aagagtgtta + 10441 gtgaaagtaa aggggggatt caaagtgagt 
ctatcaagag ttaaaactga tgtaaaattg + 10501 aatgagtttc tttttggatt agctttttat ccttggctaa tagcatggct gtttacttcg + 10561 accttttata aggattttat acatccttat ggaataataa aaacttggga gtatgtggga + 10621 ttattttttc tattatttaa atttatgtta ggtaaatcta agataaaatc gataatcatt + 10681 actccaatta tacttcttat aggttttatt gtaagttatg ataatggtaa cgcctccttt + 10741 gtagcatata ctttgactct tatatattct tcaagggata ttaattttcg taatttggta + 10801 aggaatacaa tgttctgcca gattggagtt gtaggaactg ttatagtaag ctctttactt + 10861 ggtattattc ctaacgagct agccttaaca tattcagaag gtgtgatccg ctcacggtat + 10921 ggactaggtt ttcactacac atcatttact ccgaattatt tcctgagtat attgctggaa + 10981 tatgtgtatt taaaaggtga aaaatattgg acaataaaag agctttttat ttgtgtacta + 11041 ttaaatatag ttatttataa atacacagat acccgtctta cttttattat ggtatttatc + 11101 cttcttttga tatcgttttc gagaagattt gtatcaatca atatgaattt taaatttcta + 11161 aaatatttac ttactcttat ttatccaatt atggcgtata tgacttattg gctgacagca + 11221 aaatttgata gtagaaatag tttattatct ttaataaata acttattgag tcaaaggttg + 11281 agattcggtc aagaaggttt aaggagatac cctctaagat tatttggaac tcatattcaa + 11341 tgggatgctt cggcgaattc ttatctttat gtagattcgt cgtacattaa tatacttata + 11401 agctatggaa caataatttt tttccttacg ttaataagct attcaattat aatgaaaaaa + 11461 gttataatta atcaaaataa aactttattg attgtgttaa ttttttggtc agtaagagct + 11521 tgtattgacc cacaattatt tttattgtgg ttcaatccat ttttgttttt aattgcgaga + 11581 acgtttttag atgaaagaga ggaaattgga gatgatatca cttatatgtg tatcgaataa + 11641 ttacgataag ttaaatacaa ttcttaaatc atctttatct agacaaaagg atgttaatta + 11701 tgaacttatt atagtggatt ctaataaata tggatttaat tctgctgctg aggctttgaa + 11761 ttttggaggc aaacaagcaa aaggtgatta tctatttttt gttcatcaag atattagttt + 11821 tcaagatgac tttgagttag caaaactaga atcttattgt agaaattcca tatttggagt + 11881 agcaggagta gcaggggtaa agaatattga gggaaaggtc gtcagttttt caaatatttt + 11941 tcatggggac ccgaaaacaa aggcggctgg taaatctata agtgcccctg ttgaagttga + 12001 cgcaattgat gagtgtttga ttattattcc gaaaaaagtt tttagtacaa atcaatttag + 12061 tataatcggt cctacctggc atttatatgg 
aacagactat gcattacaga tgaagttaat + 12121 caattcgcca gtattagttt ttccaagtga gttatggcat gtgtcagatg ggaaatcttt + 12181 aaaccttaat tattttgatg cgatacaatg gttattgaaa aaatactcta aaaattattc + 12241 agtaatatac actttttttg gagtttggcc aagtaatcct attctattaa aatttaaatg + 12301 tctttatagg aaattaaggt tttatattaa gggagtgtaa tggaagtgaa gctatacgtc + 12361 gcaacacata aatcttataa tcaagttcaa gaccaggacc tatatatccc tatattggtg + 12421 ggcgcggata agaatattgg agaaaagaat tatttaagag ataatcaggg agataataat + 12481 atttctgata gaaactttac attttgtgaa ttaacaggat tgtattggat ttggaaaaat + 12541 tctaaagatg atattgttgg tttatgccat tatagacgtt attttgggaa aaacaagcgt + 12601 tttttaaaac agaattctat tttaaaaaag aatgatattc taaaacaatt aaatgattat + 12661 gatgtaatat taccatcaaa gagtatgaac gagtataacg ggtatactgc tgaagagttt + 12721 tttaacaaga atcacgatca taaagtttgg gaaatgtgta gacagattat ttcagaaaac + 12781 aataaagatt accttgatgc ttttaattgg ttttctaaag aaaaaacagg atactgttat + 12841 aatatgttta taatgtctag agaaatgatg gatgaatatt gcagttggtt atttccgatt + 12901 ctttttgaac tagataagaa gattgattat tcaagatatg atagttacaa tactcgtatg + 12961 attggttttg ttgccgaacg tttaattaac gtatgggtac ataagaaaca actaactgta + 13021 aaagagtttc cggttttttc aacagaagaa ccaggattct tacaaagaat tcagaagaaa + 13081 ttatttaata agtagtagtt tatttataaa agtagattgt taataaatct ttcaaggtgc + 13141 tattcccctt ttccaattaa gttttattgc acggtcctca taaatactcc tagaaagact + 13201 aagttaatta aagatgaaga ttttaaagaa ttatgtttat aatttgttat accagatact + 13261 agtagttgtt ctcccaataa taactactcc ctatattact agaatcttta gttctcaaga + 13321 gttaggtgat tatggatatt atagttctat agtaacttac tttatattgc tcgctacttt + 13381 aggtgtcgcc aactatggga ctaaggtaat ttctggacat cgtaatgaga ttaataaaaa + 13441 tttttggggt atctactctt tacaattagg tgctacaatc ctttcaatct ccttatattg + 13501 tattttttgc gttaaccttc ctccaatgca aaacccagta gcctatattt tgggattgag + 13561 tttagtttct aaaggtttag atatttcctg gctttttcaa ggattagagg atttccgtaa + 13621 aattactgtt cgaaatatta cggtaaaact aattggggta atctctattt tcctgtttgt + 13681 caaatctact aacgaccttt acctttatgt 
gttcttatta acaatatttg agctattggg + 13741 acaattaagt atgtggttgc cggcccgagg gtttattggt aagccccatg ttgatttaga + 13801 atacgctagg taccatttga aaccaattat tttattattt cttcctcaga tagcaatctc + 13861 tttatacgtt actttagatc gtacgatgct tggtgcttta tcctctacaa aagatgtagg + 13921 aatttatgat caggctctta aattggtaaa tattttatta acattggtaa catcgcttgg + 13981 aagtgttatg ttgcctcgag tagctaactt attagcaaca ggagatcata gagcagtcaa + 14041 taagatgcat gagatggctt tcttgattta taatttagtt atttttccta ttatatccgg + 14101 aatgttaatt gtcaatgatg attttgttca atttttcctt ggtcaagatt ttcaggatgc + 14161 acgttatgca atcgccatta tgattttccg tatgttcttt ataggttgga ccaatattat + 14221 gggaattcaa attttgattc cacacaataa aaataaggaa tttatggttt caacaacagc + 14281 tcccgcaatt atcagtgtag gtttgaacct gctattcctt cctaaacttg gttatatcgg + 14341 agcagctatt gtctctgttt taacagaagc gctagtatgg gcaattcaat tgtactttac + 14401 ccgcaaatac ctaaaggaag tttcaattat tggatctatg acaaaaatta ttctagcatc + 14461 agctatcatg tatggtattt tgcttggttc aaaaacattt atacagtttt caccaaccat + 14521 aaatgttcta gcatttgctg tgtttggtgg actcatttat ctttttgcaa ttctatctct + 14581 gaaagtggta gatgtaaaag aattaaaaca aatgattagg aaaaaataga atgcataaaa + 14641 ctcggaatat taatttagaa ctattaaaag tacttgcatg tgttggagtt gttctacttc + 14701 atacaacgat gggtgggttt aaagagatag gttcatggaa tcttttgaca tatttatatt + 14761 acttaggaac ctattctatc cctctatttt ttatggttaa tggttattta ttgttaggaa + 14821 agagagagat aacatatccc tatatactgc ataaagtaaa atggattcta ataacagtgt + 14881 tgtcatggac ccttatcgtt tggtttttaa aacgggattt tacagttaat ccagttaaaa + 14941 aacttatagg ctcgttggtg caaaaaggtt atttctttca gttttggttt tttggttcgc + 15001 ttatacttat ttatttatgt ctacccattt tgaaaaaaat tcttaattca aaaagaagat + 15061 atttttatat tctatcttta ttggtagtta ttggtttgat ttttgaactg ataaattact + 15121 cacttaaaat gccagtgcag ttttatatta tacaaacatt tagattatgg acttggcttt + 15181 tctattatct tttaggtggt tttatagctc actttgatat agatattatc aaaaataggt + 15241 ttaagagatg gatgaaatta gttgtagtac ttttattctt gatttcgcct ttaatattat + 15301 ttttcatagc gaagactgca taccataatc 
tttttgctga atatttttat gatattttat + 15361 ttgtaaaagt tgtaagcttg ggaatttttc taactatcct cacgcttact ttgaatgaaa + 15421 aacggagcga atgtattgtt tccctttcta atcaaaccat gggagttttt ataatacaca + 15481 catatattat gaagatatgg gaaaagctat ttggttttag tttcgtagga tcatatttac + 15541 tttttgctat atttacttta agtgttagtt ttattattgt tggaatgtta atgaaaattc + 15601 cttatttcaa tcgaatcgtt aaattataaa taggagattt aatatgtacg actatttaat + 15661 catcggagct ggtttgtctg gagcaatctt cgcacacgaa gctacaaaac gtggtaaaaa + 15721 agtaaaagtg attgataaac gcgatcacat tggagggaac atctactgtg agaatgtaga + 15781 aggtatcaat gttcataaat atggtgccca tatcttccat acgtcaaata aaaaagtctg + 15841 ggactatgtc aatcaatttg tagagtttaa caactatatc aactcacctg tcgcaaacta + 15901 taagggaagt ctttataacc ttcctttcaa tatgaatacc ttctatgcta tgtggggcac + 15961 aaaaactcca caagaagtga aggataagat tgctgagcag acagctggta tgaaggatgt + 16021 tgagccgaaa aatctggaag aacaagctat caagttgatt ggtccggata tctatgaaaa + 16081 gttgatcaag ggttatacag aaaagcaatg gggacgctca gcgacagaac ttcctccatt + 16141 tatcataaaa cgccttccag ttcgtttaac ctttgataat aactatttta atgaccgtta + 16201 ccaagggatt cctattggtg gttacaatgt catcatcgaa aatatgctga aagatgtaga + 16261 agttgaactt ggagtagact tttttgctca tcgtgaagag ttggaagcat ctgctaacaa + 16321 agttgtcttc acaggaatga tcgaccaata ttttgactac aagcacggag agttagaata + 16381 ccgtagcctt cgttttgagc atgagatttt agacgaggaa aattatcaag ggaatgctgt + 16441 agtgaactat acagagcgtg agatccctta tactcgtatc atcgaacaca aacattttga + 16501 atatggaatg cagccaaaga cagttatcac gcatgaatat ccagctgact ggaagcgtgg + 16561 ggacgagccc tactatccta ttaacgatga gaaaaataat gctatgtttg ctaaatacca + 16621 agaagaagca gcgcagaatg ataaagttat cttttgtggg cgtttagcag attataaata + 16681 ttacgatatg catgtggtga ttgaacgggc gcttgaggtt gtggagaaag aatttagtaa + 16741 ttgaaaaaca acgaagaaag gttgcttatt atgaaaggta ttattctagc aggtggttcg + 16801 gggacacgtt tatatccttt gactcgcgct gcatcaaaac aacttatgcc ggtttatgat + 16861 aaaccgatga tttactaccc actttcaaca ttgatgttgg ctgggattag ggatattttg + 16921 attatttcca ctccacagga tttacatcga 
tttcaagagc ttcttcaaga cggatctgag + 16981 tttgggatca aactttctta tgcagagcaa ccaagtccag atggtttggc acaagccttt + 17041 atcatcgggg aagagtttat ttctgatgat agcgttgcgc taatcttagg tgataatatc + 17101 taccatggtt ctgggctttc caagatgcta caaaaggcag cgagtaagga gtcgggagca + 17161 actgtttttg gctaccatgt caaggatcca gagcgctttg gtgtggttga gtttgatcag + 17221 gatatgaagg ctatttctat tgaagaaaag ccagagcaac ctcgttcaaa ctatgcagtt + 17281 acaggtctct atttctatga taatgatgta gtagagattg ccaagagtat taaaccaagt + 17341 cctcgtggtg aactggaaat tacagatgta aacaaagctt acctagatcg tggtgatttg + 17401 tctgttgagc tcatgggacg tggctttgct tggctggata ctggaactca tgaaagttta + 17461 ctagaggctt cacagtacat cgaaacagtg caacggatgc aaaatgttca ggtagcaaac + 17521 ttagaagaaa ttgcctatcg catgggttat atcagtcgtg aagatgtatt gaccttagcc + 17581 caaccactta agaaaaatga atacggacag tatctgctcc gtttgattgg agaagcatag + 17641 atgacagata attttttcgg taagacgctt gcggcacgca aggttgaagc tattccaggc + 17701 atgttggagt ttgatatccc cgttcatgga gataatcgtg gctggtttaa agaaaatttc + 17761 caaaaggaaa aaatgcttcc acttggattt ccagagtctt tctttgcaga aggaaaattg + 17821 caaaacaatg tatccttctc acgtaaaaat gtccttcgag gactccacgc agagccttgg + 17881 gataagtaca tctctgtagc agatggaggg aaagttctgg gttcttgggt tgatctacgc + 17941 gagggtgaaa cctttgggaa tacctatcag acagtaattg atgcaagcaa gggaatcttt + 18001 gttcctcgag gcgtagctaa tggcttccaa gttctatcag atacagtgtc atatagctat + 18061 ctggtcaatg attactgggc tctcgagctc aaacccaagt atgcctttgt gaactacgct + 18121 gatccaagcc ttggtattga atgggaaaat attgcagaag cagaggtttc agaagcagat + 18181 aaacatcatc ccctacttaa ggatgtaaaa cctttgaaaa aagaagattt gtaaaaagga + 18241 aagaatatga ctgaatacaa aaatattatc gtgacaggtg gagctggctt tatcggttct + 18301 aactttgtcc attatgttta cgagaacttt ccaggtgttc acgtgacagt cctagataag + 18361 ttgacttatg ctggaaatcg cgcgaatatt gaggaaattt taggtaatcg tgttgagtta + 18421 gttgttggtg acattgctga tgcggagttg gtagacaagt tggctgctca agcagatgct + 18481 atcgttcatt atgcagcgga aagccacaat gataattcgc tcaatgatcc atcgccattt + 18541 attcatacta acttcatcgg aacctatact 
cttttagaag ctgctcgtaa gtatgatatt + 18601 cgcttccacc atgtatcgac agatgaagtt tatggggatc tccctttacg cgaagatttg + 18661 ccaggtcatg gtgaaggacc aggtgagaaa tttactgctg aaacaaaata caacccaagc + 18721 tctccgtact catcaaccaa ggcagcctca gatttgattg tcaaagcctg ggtgcgttct + 18781 tttggagtca aggcaacgat ttccaactgt tcaaataact acggtcctta tcaacatatc + 18841 gaaaaattca tcccacgtca gattactaac atcctaagtg gaattaagcc aaaactttac + 18901 ggtgaaggta agaatgttcg tgactggatt cataccaatg accattcttc aggagtttgg + 18961 acaatcttga caaaagggca aatcggtgaa acctacttga ttggggctga tggtgagaag + 19021 aacaataagg aagttttgga acttatcctt aaggaaatgg gacaagctac ggatgcctat + 19081 gatcatgtga ctgaccgtgc aggacatgac cttcgctatg cgattgatgc cagcaagctc + 19141 cgtgatgagt tggggtggaa acctgaattt accaactttg aagctgggct caaggcaaca + 19201 atcaagtggt atacagataa ccaagaatgg tggaaagcag aaaaagaagc tgttgaagcc + 19261 aattatgcta agactcagga gattattaca gtataaaaag caggaaatag ctgcttttta + 19321 ttgctatatt gggaagagtt acatattaga aaggtctaga gatgatttta attacagggg + 19381 caaatggcca attaggaacg gaacttcgct atttattgga tgaacgtaat gaagaatacg + 19441 tggcagtaga tgtggctgag atggacatta ccaatgaaga aatggttgag aaagtttttg + 19501 aagaggtgaa accgacttta gtctaccact gtgcagccta caccgctgtt gatgcagcag + 19561 aggatgaagg aaaagagttg gacttcgcca tcaatgtgac ggggacaaaa aatgtcgcaa + 19621 aagcatctga aaagcatggt gcaactctag tttatatttc tacggactat gtctttgacg + 19681 gtaaaaaacc agttggacaa gagtgggaag ttgatgaccg accagatcca cagacagaat + 19741 atggacgcac taagcgtatg ggggaagagt tagttgagaa gcatgtgtct aatttctata + 19801 ttatccgtac tgcctgggta tttggaaatt atggcaaaaa cttcgttttt accatgcaaa + 19861 atcttgcgaa aactcataag actttaacag ttgtaaatga ccagtacggt cgtccgactt + 19921 ggactcgtac cttggctgag ttcatgacct acctagctga aaatcgtaag gaatttggtt + 19981 attatcattt gtcaaatgat gcgacagaag acacaacatg gtatgatttt gcagttgaaa + 20041 ttttgaaaga tacagatgtc gaagtcaagc cagtagattc cagtcaattt ccagccaaag + 20101 ctaaacgtcc gctaaactca acgatgagcc tggccaaagc caaagctact ggatttgtca + 20161 ttccaacttg gcaagatgca ttgcaagaat 
tttacaaaca agaagtgaga taagtagtag + 20221 aatgattttc tagtctaata aaagagacag ataatgaact ccaaaggagc ttaagatgta + 20281 cgattatctt gttgttggtg cagtctttgc ccatgaagca gccttagaag gaaaaaaagt + 20341 aaaagttatt gaaaaacgaa atcatatcgc gggtaatatc tatactcgtg aagaggaagg + 20401 aattcaagtt catcaatatg gtgctcatat cttccatact tctgataagg agatctggga + 20461 ttatgtaaat cagtttgcag agtttaaccg ttataccaat tctcctgttg caaactataa + 20521 gggtgagatt tataaccttc cttttaatat gaataccttc aataaactct ggggagttgt + 20581 aacgccagca gaagtacagg ctaagattga tgaacaacgt gctattttaa atggtaaaac + 20641 tcctgaaaat ttggaagaac aggcgatttc tcttgtaggt acagacatct acgaaaaatt + 20701 aatcaaagac tatacagaga aacagtgggg gcaaaccaac tactgaactt ccatccttta + 20761 ttattcgctg tttaccagta cacctgacct atgataacaa ctattttaac gatacctatc + 20821 aagggattcc aattggtgga tacactcaaa tagttgaaaa atgttggatc atgaaaatat + 20881 tgatgtagaa acaaatgttg atttctttgt gaacaaagag caatatctga aagattttcc + 20941 taagattgtc tttactggta tgattgatga attctttgac tataagttgg gcgaactaga + 21001 gtaccgtagt cttcgttttg aaaatgagac cttggatatg gaaaattacc aaggaaatgc + 21061 agttgtgaac tatacggatg cagaaacccc atatactcgc attattgaac acaaacattt + 21121 tgagtttggg agtcaagcaa agactatcat tactaataga acattctaaa acatgggaaa + 21181 aaggtgatga gccttattat ccagttaata atgatcgtaa taatcatttg tataaatcat + 21241 ataaaaaact tgctgatgag caagggaatg ttatctttgg tggccgctta ggacactatc + 21301 gttattacga tatgcaccaa gtaattggag cagctttgca gtgcgtgaga aatgagttag + 21361 attcatactc aatgaaaatt aaagagcaaa ctaggaagct agccgcaggt tgctcaaagc + 21421 actgttttga ggttgcagat ggaagctgac gcggtttgaa gagattttcg acgagtataa + 21481 acaagtaaaa ctgactacca gttattattt agaaatagta ttaaaaattc cttgactata + 21541 tgatatagtt gagggatttt taaatgatat tcatattttt tgcaaagatg ttgtttgaaa + 21601 aataattttc aaaaattctg aaaattctgt tgacaacttt ctgaaaagag tctataatgg + 21661 agagaaagtt ttaaaggaga aaatgatgaa aagttcaaaa ctacttgccc ttgcgggcgt + 21721 gacattattg +// + diff --git a/public/res/serotype_genbank/serotype_16F.gb 
b/public/res/serotype_genbank/serotype_16F.gb new file mode 100644 index 0000000..4efd096 --- /dev/null +++ b/public/res/serotype_genbank/serotype_16F.gb @@ -0,0 +1,1004 @@ +LOCUS CR931668 21481 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain nr. 34361 (serotype 16f). +ACCESSION CR931668 +VERSION CR931668.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 21481) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 21481) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..21481 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="nr. 
34361" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC16F_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC16F_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI33453.1" + /db_xref="GOA:Q4K1G3" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K1G3" + /translation="SNEEQDLTVEGKVKSVLIENTAAKEVFEKQILVPWDAFCVELL" + gene 293..466 + /gene="aliB" + /locus_tag="SPC16F_0002" + /pseudo + CDS 293..466 + /gene="aliB" + /locus_tag="SPC16F_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + /db_xref="PSEUDO:CAI33454.1" + gene complement(order(459..995,997..1323)) + /gene="tnp" + /locus_tag="SPC16F_0003" + /pseudo + CDS complement(join(459..995,997..1323)) + /gene="tnp" + /locus_tag="SPC16F_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase (fragment)" + misc_feature complement(join(933..995,997..1305)) + /gene="tnp" + /locus_tag="SPC16F_0003" + /note="HMMPfam hit to PF01710, Transposase, score 3.8e-23" + /pseudo + gene 1558..3003 + /gene="wzg" + /locus_tag="SPC16F_0004" + CDS 1558..3003 + /gene="wzg" + /locus_tag="SPC16F_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33456.1" + /db_xref="GOA:Q4K1G2" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K1G2" + /translation="MSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSEIENVTQLTSVAAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGIDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + 
EALKNYSTIIDSLQDSIQTNMPLETMINLVNAQLESGGTYKVNSQDLKGTGRMDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1558..1674 + /gene="wzg" + /locus_tag="SPC16F_0004" + /note="Signal peptide predicted for SPC0793 by SignalP 2.0 + HMM (Signal peptide probability 0.993) with cleavage site + probability 0.538 between residues 39 and 40" + misc_feature 1762..2109 + /gene="wzg" + /locus_tag="SPC16F_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 3.1e-64" + misc_feature 2287..2730 + /gene="wzg" + /locus_tag="SPC16F_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 1.1e-69" + gene 3005..3736 + /gene="wzh" + /locus_tag="SPC16F_0005" + CDS 3005..3736 + /gene="wzh" + /locus_tag="SPC16F_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33457.1" + /db_xref="GOA:Q4K1G1" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K1G1" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAEAYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTLDALEKLEKKEIPTLNDS + RYALIEFSMHTSYRQIHTGLSNILMLGITPVIAHIERYNALENNEKRVRELIDMGCYT + QINSYHVSKPKFFGEKYKFMKKRARYFLERDLVHVVASDMHNLDSRPPYMQQAYDIIA + KKYGAKKAKELFVDNPRKIIMDQLI" + misc_feature 3008..3616 + /gene="wzh" + /locus_tag="SPC16F_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 1.7e-39" + gene 3745..4437 + /gene="wzd" + /locus_tag="SPC16F_0006" + CDS 3745..4437 + /gene="wzd" + /locus_tag="SPC16F_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33458.1" + /db_xref="GOA:Q4K1G0" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K1G0" + /translation="MKEQNTLEIDVLQLFRVLWKRKLVILLVAIITSSVAFAYSTFVI + KPEFTSTTRIYVVNRNQGEKSGLTNQDLQAGSYLVKDYREIILSQDVLEEVVSDLKLD + 
LTPKGLASKIKVTVPADTRIVSVSVNDRVPEEASRIANSLREVAAKKIISITRVSDVT + TLEEARPAISPSSPNLKRNTLIGFLAGVIGTSVIVLLLELLDTRVKRPEDIEDTLQMT + LLGVVPNLNKLK" + misc_feature 3763..4179 + /gene="wzd" + /locus_tag="SPC16F_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 9.5e-53" + misc_feature 4285..4362 + /gene="wzd" + /locus_tag="SPC16F_0006" + /note="PS00217 Sugar transport proteins signature 2." + gene 4447..5130 + /gene="wze" + /locus_tag="SPC16F_0007" + CDS 4447..5130 + /gene="wze" + /locus_tag="SPC16F_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33459.1" + /db_xref="GOA:Q4K1F9" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K1F9" + /translation="MPTLEIAQKKLEFIKKAEEYYNALCTNIQLSGDKLKVISVTSVS + PGEGKTTTSVNIAWSFARAGYKTLLIDGDIRNSVISGFFKSREKITGLTEFLSGTADL + SHGLCDTNIENLFVVQSGSVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTAPIGIVI + DAAIITQKCDASILVTATGEANKRDVQKAQQQLKQTGKLFLGVVFNKLDISVDKYGVY + GFYGNYGKK" + gene 5146..6513 + /gene="wchA" + /locus_tag="SPC16F_0008" + CDS 5146..6513 + /gene="wchA" + /locus_tag="SPC16F_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI33460.1" + /db_xref="GOA:Q4K1F8" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K1F8" + /translation="MDEKGLKIFLAVLQSIIVILLVYFLSFVRETELERSSMVILYLL + HFFVFYFSSYGNNFFKRGYLVEFNSTIRYIFFFAIAISVLNFFIAERFSISRRGMVYF + LTLEGISLYLLNFLVKKYWKHVFFNLKNSKKILLLTVTKNMEKVLDKLLESDELSWKL + VAVSVLDKSDFQHDKIPVIEKEKIIEFATHEVVDEVFVNLPGESYDIGEIISRFEKMG + MDVTVNLKAFDKNLGRNKQIHEMVGLNVVTFSTNFYKTSHVISKRILDICGATIGLIL + FAIVSLVLVPLIRKDGGPAIFAQTRIGKNGRHFTFYKFRSMQIDAEAIKEQLMDQNTM + QGGMFKIDNDPRVTKIGRFIRKTSLDELPQFWNVFIGDMSLVGTRPPTVDEYDQYTPE + 
QKRRLSFKPGITGLWQVSGRSKITDFDDVVKLDVAYIDNWTIWKDIEILLKTVKVVFM + RDGAK" + misc_feature 5929..6510 + /gene="wchA" + /locus_tag="SPC16F_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 3.7e-146" + gene 6544..7716 + /gene="wchF" + /locus_tag="SPC16F_0009" + CDS 6544..7716 + /gene="wchF" + /locus_tag="SPC16F_0009" + /note="member of homology group 15" + /codon_start=1 + /transl_table=11 + /product="putative rhamnosyl transferase WchF" + /protein_id="CAI33461.1" + /db_xref="GOA:Q4K1F7" + /db_xref="InterPro:IPR001296" + /db_xref="InterPro:IPR015393" + /db_xref="UniProtKB/TrEMBL:Q4K1F7" + /translation="MKKSVYIIGSKGIPAKYGGFETFVEKLTAFQQDKTIQYYVACMR + ENSAKSGTTEDVFEHNGAICYNVDVPNIGPARAIVYDIAAINRAIKIAKENKDEDPIF + YILACRIGPFIHGIKKKIQEIGGTLLVNPDGHEWLRAKWSAPVRRYWKISEGLMVKHA + DLLVCDSKNIEKYIQEDYIQYQPKTTYIAYGTDTTRSTLNSSDEKVRAWFKEKNVSEN + EYYLVVGRFVPENNYESMIRGFLASSSKKDFVLITNVEQNKFYNQLLASTGFDKDPRV + KFVGTVYDQELLKYIRENAFAYFHGHEVGGTNPSLLEALASTKLNLLLDVGFNREVGE + QSAIYWKKDELSQVIEKVEQFDAKIIDELDRQSNQRIVDFFTWEKIVTDYEKLFKK" + gene 7713..8984 + /gene="wciU" + /locus_tag="SPC16F_0010" + CDS 7713..8984 + /gene="wciU" + /locus_tag="SPC16F_0010" + /note="member of homology group 59" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33462.1" + /db_xref="GOA:Q4K1F6" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K1F6" + /translation="MKILHYTLGFQPQRTGGLVKYAEDLMLEQIAQGYQVAALYPGRI + KFFSKKIEIIKETSRQFECYELLNSLPMALFGGISDPTAFLTPCDKNVYRTFLEKVQP + DIIHIHSFMGLHKEFLEIAKSLNIRVVFTSHDYYGLAPVPHFYFNGVDYSDKSTNLTW + NIMSSNALSVKKLRLFQVSFYPTIRKLLKLLGKNPKSKKNLVIRDVIEEQDYSELRYY + YNEMFHLIDGYLFNSRLAKKVYEINEIKSANSIVLSITNSSINHHQRLTTTNNKIRVA + YIGPDEEYKGYFDFVDFVETLDRESYEVATYGHLPNEECPSFIEQKGYFTKEMIDSVY + ENIDILIVPSKWKETFGLITVEALSYGVNVFVSENVGSKDLLPESHVFKNQNDLIVKF + LKNDIENTKLKTLDEHSIEVIQYYERVINDS" + misc_feature 8487..8948 + /gene="wciU" + /locus_tag="SPC16F_0010" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 0.0011" 
+ gene 8974..9660 + /gene="wcxM" + /locus_tag="SPC16F_0011" + CDS 8974..9660 + /gene="wcxM" + /locus_tag="SPC16F_0011" + /note="member of homology group 105" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI33463.1" + /db_xref="GOA:Q4K1F5" + /db_xref="InterPro:IPR011004" + /db_xref="UniProtKB/TrEMBL:Q4K1F5" + /translation="MIVKSFIKKITGKTVDIHPDVPLSYILQRGINYSFGLFRGVVRG + IGFGQNDKRLFIGQGVSILAKRKLFVGKNVRIGKKVSIDALSKEGIHFADNVKIGDYS + QIIGTGSIKNMGIGLKIGKNSSFSEYSLFGSAGGITIGDNVIAGQNVRFHAENHNYSD + LDKLIVEQGVSRKGISVGDNCWIGAGSVFLDGSSIGSGCVVAANSVITKNFPDNVIVA + GVPAKIIKMK" + misc_feature 9172..9225 + /gene="wcxM" + /locus_tag="SPC16F_0011" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 16" + misc_feature 9238..9291 + /gene="wcxM" + /locus_tag="SPC16F_0011" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 13" + misc_feature 9379..9432 + /gene="wcxM" + /locus_tag="SPC16F_0011" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 10" + misc_feature 9493..9546 + /gene="wcxM" + /locus_tag="SPC16F_0011" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 11" + misc_feature 9547..9600 + /gene="wcxM" + /locus_tag="SPC16F_0011" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 1.7" + gene 9672..10577 + /gene="wcxN" + /locus_tag="SPC16F_0012" + CDS 9672..10577 + /gene="wcxN" + /locus_tag="SPC16F_0012" + /note="member of homology group 154" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33464.1" + /db_xref="GOA:Q4K1F4" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K1F4" + /translation="MRKEIKAVYAILNYNTWEDTARLAQKVATFQHIQSVIIVDNLST + DDSYHYLKRLEGEKISVYQTQRNGGYSVGNNFAARKAYNMGVDILFISNPDVDIDEKD + SLMIAQNLYKNSSYALLSGIEYNAMKEIDLPIVWHENSYYDDLLDCLFLTRKWRRKKE + 
DINLSMIKSSIIDVDLVKGSFFAVRLSDFHDVGYFDESVFLFCEERILAKKLQKVNKK + IGILPEAKYYHNHSTSINERYKKKKEQINLLYKSRYYYNVKYNNISFVKKLCLKSVMM + LSILEYIILDMMNLLYTKTNYKKIQ" + gene 10669..11136 + /gene="HG191" + /locus_tag="SPC16F_0013" + /pseudo + CDS join(10669..10824,10824..11136) + /gene="HG191" + /locus_tag="SPC16F_0013" + /note="member of homology group 191" + /pseudo + /codon_start=1 + /transl_table=11 + /product="hypothetical protein (pseudogene)" + gene 11267..12529 + /gene="wzy" + /locus_tag="SPC16F_0014" + CDS 11267..12529 + /gene="wzy" + /locus_tag="SPC16F_0014" + /note="member of homology group 234" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33466.1" + /db_xref="UniProtKB/TrEMBL:Q4K1F3" + /translation="MSKLILNLKLNSFLFVIILLLVVVTPTHTLIFDALIPTKIDNLW + REFLLVISFLCILKINAGKIKIGKLGGPIIVMGGIGLVYTICSDRPFTALNLFRIYMF + PAVIYFIIINCNFRKERLLILKQAHVYTACILALWGIFQAWVLKDQFLIKIGYPSQGN + FLKSTAFYIGGFFGQQRVTSTFSAPNLAGVYFGISLIILLSIFDTIKSNRLVLFSIVA + AFVLTFSRSAIISTLVGIVFFQRKKLFSTTKINVMTLVIFPLIFLIVLVIFYLYPENV + IINMLYSSYSSTLNLTDSSAVKHLEDLWLPLLKVIDYPLGLGFGNNGPIVLSLYHSAN + LVESSIYLLAYDFGILGMFIYLFPYFYTIFVYKKYLLSGAICCLVLITYLFLPNVENF + EIIFFIYLFIGMDELALYTKGMNVHEID" + misc_feature 11267..11368 + /gene="wzy" + /locus_tag="SPC16F_0014" + /note="Signal peptide predicted for SPC0803 by SignalP 2.0 + HMM (Signal peptide probability 0.888) with cleavage site + probability 0.749 between residues 34 and 35" + gene 12510..13676 + /gene="wcxP" + /locus_tag="SPC16F_0015" + CDS 12510..13676 + /gene="wcxP" + /locus_tag="SPC16F_0015" + /note="member of homology group 155" + /codon_start=1 + /transl_table=11 + /product="putative glycerol phosphotransferase" + /protein_id="CAI33467.1" + /db_xref="GOA:Q4K1F2" + /db_xref="InterPro:IPR007554" + /db_xref="UniProtKB/TrEMBL:Q4K1F2" + /translation="MYMKLIKLLKKYINLYISSSVPKTNKLLIFGSWLGEKYADNPRY + LFEYVIKNRPDLKAIWITSNQDVFKELQKKQYLVMMAEAPETRKIVKKAKYIFTATGI + FDIGEQNANFVGGAYLINLWHGIPLKKIMYDDKHSALHKRSKLVTWVEKIPLRNYFVI 
+ STSTAITQIYQSAFRVKKSNILELGQPRNDYFYDKSNPVSSLIQELKSKNIILYMPTH + RNEGKKQIDLDKLMDLEHLNNWCEETKSIFVIKKHFYHSKEKTIDKKYSSIIDVTNEK + VDVQELLKCSNVLITDYSSCYIDYLLLNRPIIFFNYDYDDYLRVDRSLYFPYENVTPG + EKCQNFDELLVTLQNLYVGKDDYREERENIKTFFYSSETQKSVSEKIINHVLNL" + misc_feature 13104..13670 + /gene="wcxP" + /locus_tag="SPC16F_0015" + /note="HMMPfam hit to PF04464, + CDP-Glycerol:Poly(glycerophosphate) gl, score 7.7e-34" + gene 13682..15133 + /gene="wzx" + /locus_tag="SPC16F_0016" + CDS 13682..15133 + /gene="wzx" + /locus_tag="SPC16F_0016" + /note="member of homology group 52" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33468.1" + /db_xref="GOA:Q4K1F1" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K1F1" + /translation="MESVMKKILNKYYSLSNPVKASIWFTICNVLQKGISMITVPVFT + RVLTTEQYGVYSVYQSWYSIIGVFATLNLYYGVFNNGMIKYEKDKNVFTSSMQGLTTT + VTAIFLLIYLIGIDFWNSLLGLPTLLILVMFFDLFFTPAYSFWVARQRFEYKYRNLVF + ITFIIAIGSPIIGISAVVLSTYKAEARVISFVLVQSCIGLYFYILNLYRGKHFFCKKY + WLYALNFNLPLIPHYLSQSVLNQSDRIMINSMVGMGEAAIYSVAYSISILMLLVTSAI + NSSFIPYTYKCIRDKKYTELGKSANLLITLVGIGSILTISLGPEIIQLFAPKQYYEAI + WIIPPVALSVYFMFLYPIFGNIEFYFEANHFVMWASIGGAIMNIFLNFIFLKHFGYIA + AGYTTLFCYILFALGHYIFMRRVLYQNLSGIQIYNSRYILFFSILLIILMLLIVIIYP + FILIRYLTISLILGGCFLKRKKIMSSIAIIKQQ" + misc_feature 13733..14545 + /gene="wzx" + /locus_tag="SPC16F_0016" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 1.9e-12" + gene 15143..15958 + /gene="wcxQ" + /locus_tag="SPC16F_0017" + CDS 15143..15958 + /gene="wcxQ" + /locus_tag="SPC16F_0017" + /note="member of homology group 156" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="CAI33469.1" + /db_xref="GOA:Q4K1F0" + /db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4K1F0" + /translation="MTETNKQLHETLIEILDFVKEICEKHELTYFLVFGTALGAKRHC + GFIPWDDDVDIALPREHYNIFIDALSETDQSIFSLQNEDNEPNYFLPFAKLRKNNTIF + IEKILDVEYENNGIYIDIFPLDFVENPDSFNFKIRRTTFNYIKHILKFSSCRSFYKNK + 
YSNVRYLIENIMSIPTLFFSNRRLLFLANSLISSTTKADFIGQYDQKSNKRAIMPSNY + YFPPRSAVFEGKTYSVPAKLEDYLKCFYGSDYMELPPIEKRVTHQPITLRFEK" + misc_feature 15209..15883 + /gene="wcxQ" + /locus_tag="SPC16F_0017" + /note="HMMPfam hit to PF04991, LICD Protein Family, score + 1.7e-34" + gene 15986..16378 + /gene="gct" + /locus_tag="SPC16F_0018" + CDS 15986..16378 + /gene="gct" + /locus_tag="SPC16F_0018" + /note="member of homology group 28" + /codon_start=1 + /transl_table=11 + /product="CDP-glycerol-1-phosphate biosynthetic protein + Gct" + /protein_id="CAI33470.1" + /db_xref="GOA:Q4K1E9" + /db_xref="InterPro:IPR004820" + /db_xref="InterPro:IPR004821" + /db_xref="InterPro:IPR006409" + /db_xref="InterPro:IPR014729" + /db_xref="UniProtKB/TrEMBL:Q4K1E9" + /translation="MKRVITYGTFDLLHHGHINLLRRAKELGDYLVVVVSSDEFNLIE + KNKVCYFNYEHRKSLVEAIRYVDLVIPETSWEQKRSDVKEYHIDTFVMGDDWIGEFDY + LKEEGVEVVYLPRTKEISTTKIKKDLSM" + misc_feature 15998..16366 + /gene="gct" + /locus_tag="SPC16F_0018" + /note="HMMPfam hit to PF01467, Cytidylyltransferase, score + 4.7e-27" + gene 16535..17404 + /gene="rmlA" + /locus_tag="SPC16F_0019" + CDS 16535..17404 + /gene="rmlA" + /locus_tag="SPC16F_0019" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI33471.1" + /db_xref="GOA:Q4K1E8" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q4K1E8" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLHRFQELLQDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFISDDSV + ALILGDNIYHGSGLSNMLQKAASKESGATVFGYHVKDPERFGVVEFDQDMKAISIEEK + PEQPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLTLAQPLKKN + EYGQYLLRLIGEA" + misc_feature 16538..17254 + /gene="rmlA" + /locus_tag="SPC16F_0019" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 6.5e-120" + gene 17405..17998 + /gene="rmlC" + /locus_tag="SPC16F_0020" + CDS 
17405..17998 + /gene="rmlC" + /locus_tag="SPC16F_0020" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI33472.1" + /db_xref="GOA:Q7BTQ6" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:Q7BTQ6" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKHHPLLKDVKPLKKEDL" + misc_feature 17441..17971 + /gene="rmlC" + /locus_tag="SPC16F_0020" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 8.8e-16" + gene 18011..19060 + /gene="rmlB" + /locus_tag="SPC16F_0021" + CDS 18011..19060 + /gene="rmlB" + /locus_tag="SPC16F_0021" + /EC_number="4.2.1.46" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI33473.1" + /db_xref="GOA:Q4K2P4" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K2P4" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPGVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAAD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 18026..18982 + /gene="rmlB" + /locus_tag="SPC16F_0021" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.0001" + misc_feature 18029..18769 + /gene="rmlB" + /locus_tag="SPC16F_0021" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 2.7e-76" + misc_feature 18032..18844 + /gene="rmlB" + 
/locus_tag="SPC16F_0021" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/iso, score 1.7e-05" + gene 19126..19977 + /gene="rmlD" + /locus_tag="SPC16F_0022" + CDS 19126..19977 + /gene="rmlD" + /locus_tag="SPC16F_0022" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI33474.1" + /db_xref="GOA:Q4K2P3" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K2P3" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITDAEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVNPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 19126..19974 + /gene="rmlD" + /locus_tag="SPC16F_0022" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 5.7e-148" + misc_feature 19129..19770 + /gene="rmlD" + /locus_tag="SPC16F_0022" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.0001" + misc_feature 19129..19758 + /gene="rmlD" + /locus_tag="SPC16F_0022" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 5.6e-19" + misc_feature 19132..19860 + /gene="rmlD" + /locus_tag="SPC16F_0022" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 1.9e-08" + gene order(20053..21006,21017..21235) + /gene="tnp" + /locus_tag="SPC16F_0023" + /pseudo + CDS join(20053..21006,21017..21235) + /gene="tnp" + /locus_tag="SPC16F_0023" + /note="member of homology group 12" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1670 transposase" + misc_feature 20059..20502 + /gene="tnp" + /locus_tag="SPC16F_0023" + /note="HMMPfam hit to PF03050, Transposase IS66 family, + score 0.00012" + /pseudo + gene 21434..>21481 + /gene="aliA" + /locus_tag="SPC16F_0024" + CDS 
21434..>21481 + /gene="aliA" + /locus_tag="SPC16F_0024" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33476.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ89" + /translation="MMKSSKLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acactgcggc taaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcata taaaaacaag + 181 ggaggactgt ataaaaagca gaaatccttt gttttttata accaaggttt ataaactttc + 241 attttcgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga agatgaacat + 301 aaagaagcgt gtccttagtg caggcctgac ttttgcatct gctttgcttt tagctgcttg + 361 cggccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaactat ctattaggct attacgctga taatatagtc aattgaaaca agaacaagac + 481 aaaagagcct cgtaaaaggt attgcaactt ggtaatacct ttttgaggtg ctttttgata + 541 tgagcccatg ttttctcaat aggattgtac tcaggcgagt agggaggaag aggtaaaagt + 601 ttatgcccaa actcttcgca taaaagttct agcttcccca ttctatggaa tcttacatta + 661 tccataataa taaccgatgg tgtgtttaat gttggtaaga gaaaattctg aaaccaagct + 721 tcaaaaaagt cgctcgtcat cgtctcttcg taagtcattg gagcgattaa ttcaccattt + 781 gttagacctg caaccaaaga aatcctctga tatcttcttc cagatacttt gcctcttctt + 841 aactgacctt ttaatgagcg accatattct cgataaaaat aagtatcgaa tcctgtttcg + 901 tcaatctaaa caggtgctag gtgctttaaa ctattaaaat tcttaagaaa taaggctact + 961 ttttctggct cttgttcata gtaggtgtgg ttcttttttt cgagtgtagc ccatagcttt + 1021 gagcgcatag tggatggtag ttggatgaca gccaaattca gaagctattt cagtcaaata + 1081 agcgtctgga ttgtcagtaa gatagttttt aagtctatct ctatcaacct ttcttggttt + 1141 tgttcctttt acttggtggt ttagctctcc tgttttctct tttagcttta accagccata + 1201 aatggtatta cgtgagattt ggaaaacgtg tgacgcttct gttatactac ctgttcgctc + 1261 acaataagag agaacttttt tacgaaaatc tattgaatat gccataaaaa gattatagca + 1321 cattgtgtac tatagtagat tgaaactaga atagtacacc tctgcttcta aaatattgtt + 1381 agaaatcgat ttgactgtcc tgatcgattt gtcatgttct tatttcattt tactatattt + 1441 ttggttcgcg ggaagtctac taagatactt aaagatgcag atagtgaaaa 
taaaggtgta + 1501 gacattaccg taaaaaagtg atataatcgt atgatgttca atgtataggt gttaatcatg + 1561 agtagacgtt ttaaaaaatc aggttcacag aaagtgaagc gaagtgttaa tatagttttg + 1621 ttgactattt atttattgtt agtttgtttt ttattgttct taatctttaa gtacaatatc + 1681 cttgctttta gatatcttaa tctagtggta actgcgttag tcctactagt tgccttggta + 1741 gggctactct tgattatcta taaaaaagct gaaaaattta ctatttttct gttggtgttc + 1801 tctatccttg tcagctctgt gtcgctcttt gcagtacagc agtttgttgg actgaccaat + 1861 cgtttaaatg cgacttctaa ttactcagaa tattcaatca gtgtcgctgt tttagcagat + 1921 agtgagatcg aaaatgttac gcaactgacg agtgtggcag caccgactgg gactgataat + 1981 gaaaatattc aaaaactact agctgatatc aagtcaagtc agaataccga tttgacggtc + 2041 aaccagagtt cgtcttactt ggcagcttac aagagtttga ttgcagggga gactaaggcc + 2101 attgtcctaa atagtgtctt tgaaaatatc atcgagtcag agtatccaga ctacgcatcg + 2161 aagataaaga agatttatac caagggattc actaaaaaag tagaagctcc taagacgtct + 2221 aagaatcagt ctttcaatat ctatgttagt ggaattgaca cctatggtcc tattagttcg + 2281 gtgtcgcgat cagatgtcaa tatcctgatg actgtcaatc gagataccaa gaaaatcctc + 2341 ttgaccacaa caccacgtga tgcctatgta ccaatcgcag atggtggaaa taatcaaaaa + 2401 gataaattaa cccatgcggg catttatgga gttgattcgt ccattcacac cttagaaaat + 2461 ctctatggag tggatatcaa ttactatgtg cgattgaact tcacttcttt cttgaaaatg + 2521 attgacttat tgggagggat agatgttcat aatgatcaag agttttcagc tctacatggg + 2581 aagttccatt tcccagtagg gaatgtccat ctagactctg agcaagcttt aggttttgtt + 2641 cgtgagcgct actccctagc agatggcgat cgtgaccgtg gtcgcaacca acaaaaggtg + 2701 attgtggcta tccttcaaaa attaacgtca accgaagcac tgaaaaatta tagtacgatc + 2761 attgatagct tgcaagattc tatccaaaca aatatgccac ttgagaccat gataaatttg + 2821 gtcaatgctc agttagaaag tggtggaact tacaaagtga attcgcaaga cttgaaaggt + 2881 acaggtcgga tggatcttcc ttcttatgca atgccagaca gtaacctcta tgtgatggaa + 2941 atagatgata gtagtttagc tgtagttaaa gcagctatac aggatgtgat ggagggtaga + 3001 tgaaatgata gacatccatt cgcatatcgt ttttgatgta gatgacggtc ccaaatcaag + 3061 agaggaaagc aaggctctct tggcagaagc ctacagacag ggggtgcgaa ccattgtctc + 3121 tacctctcac 
cgtcgcaagg gcatgtttga aactccggaa gagaagatag cagaaaactt + 3181 tcttcaggtt cgggaaattg caaaagaagt agcagatgat ttagtcattg cttatggcgc + 3241 agagatatac tatactctgg atgctctaga aaagctagaa aaaaaagaaa ttcctaccct + 3301 taatgatagt cgttatgcct tgattgagtt tagcatgcat acttcctatc gtcagattca + 3361 tacgggattg agcaatattt tgatgttggg aatcacgcca gtaattgctc atattgaacg + 3421 ttataatgct ttagagaata acgaaaaacg tgttcgtgaa ctgattgata tggggtgcta + 3481 tactcagata aatagttatc atgtttcaaa acctaagttc tttggtgaaa aatataaatt + 3541 catgaaaaag agagctcggt attttttgga acgtgattta gttcatgtag ttgcaagtga + 3601 catgcacaat ttagacagta gacctccata tatgcaacag gcatatgata tcattgctaa + 3661 gaaatatgga gcgaaaaaag cgaaagaact ttttgtagat aatcccagaa aaattataat + 3721 ggatcaatta atttaggaga aaatatgaag gaacaaaaca ctttggaaat cgatgtattg + 3781 caactattca gagttttatg gaaaaggaag ttggtcattt tattagtggc aattataact + 3841 tcttcagttg cttttgccta cagtactttt gttatcaaac ctgagtttac tagtacgact + 3901 cggatttatg tagttaaccg taatcaggga gagaagtctg gtttaaccaa tcaagacttg + 3961 caggcaggat cgtacttggt taaagactat cgtgaaatta tcctatcgca ggatgttttg + 4021 gaggaagttg tttctgattt gaaactagat ttgacgccaa aaggtttggc tagtaaaatc + 4081 aaagtaacag taccagctga tacccgtatt gtctctgttt cagttaatga tcgagttcct + 4141 gaagaggcaa gccgtatcgc taactctttg agagaagtag ctgctaaaaa aattatcagt + 4201 attactcgtg tttctgatgt gacaacactg gaggaggcaa gaccggcgat atcaccgtct + 4261 tcgccaaatc ttaaacgcaa tacactaatt ggttttttgg caggggtgat tggaactagt + 4321 gttatagttc ttcttcttga acttttggac actcgtgtga aacgtccgga agatatcgaa + 4381 gatacattac agatgacact tttgggagtt gtaccaaact tgaataagtt gaaataggag + 4441 agagagatgc cgacattaga aatagcacaa aaaaaactgg agttcattaa gaaggcagaa + 4501 gaatattaca atgccttgtg tacaaatata cagttgagcg gagataaact aaaagtaatt + 4561 tccgttactt ctgttagccc gggggaagga aaaacaacta cttccgtaaa tatagcatgg + 4621 tcgtttgcgc gtgcaggcta taaaactctt ttgatcgatg gcgatattcg aaattcagtc + 4681 atatcaggat tttttaaatc tcgtgaaaaa attacagggc taacagaatt tttatctggg + 4741 acagctgatt tatctcacgg tttatgtgat 
acaaatattg aaaatttatt tgtagttcaa + 4801 tcgggctctg tatcaccaaa ccctacagcc ttgttacaaa gtaaaaattt taatgatatg + 4861 attgaaacat tgcgtaaata ttttgattat atcattgttg atacagcacc tattggaatt + 4921 gttattgatg cggcaattat cactcaaaag tgtgatgcgt ccatcttggt aacagcaaca + 4981 ggtgaggcga ataaacgtga tgtccaaaaa gcgcaacaac aattaaaaca aacagggaaa + 5041 ctgttcctag gagttgtttt taataaatta gatatctcgg ttgataagta tggagtttac + 5101 ggtttctatg gaaattatgg taaaaaataa cttaggaaag attttatgga tgaaaaagga + 5161 ttgaaaattt ttctggcagt attacagagt attattgtca ttttattggt ttattttctt + 5221 agctttgtta gagagacaga acttgaacgt tcttcgatgg ttatactata ccttctccac + 5281 ttttttgtat tctattttag ttcctatggt aacaattttt ttaaaagagg gtacctagtt + 5341 gagtttaata gtactataag atatattttt ttctttgcaa tagctataag tgtattaaac + 5401 ttttttatag cggaacggtt tagcatctct agaagaggaa tggtatactt cttaacttta + 5461 gaaggaatat ccttatactt gttaaatttc ttagtaaaga aatattggaa gcatgtgttt + 5521 tttaatctaa aaaatagcaa gaaaatttta ctgttaacag taacgaaaaa tatggaaaaa + 5581 gttcttgata aattgctaga atctgatgaa ctttcatgga aattggtagc agtaagtgtt + 5641 ttggataaat ctgattttca acatgataaa atacctgtaa ttgaaaagga aaaaattatt + 5701 gaatttgcaa cgcatgaagt tgtggatgag gtgtttgtca atcttccagg agagagctac + 5761 gatattggag aaattatctc taggtttgag aaaatgggga tggatgtaac tgtaaatctt + 5821 aaagcatttg ataagaattt gggtcgcaat aaacaaattc atgagatggt aggattgaat + 5881 gtagtcactt tctctacaaa tttttataaa actagtcatg tgatttcaaa gagaattctc + 5941 gatatttgtg gtgccactat tggccttatt ctttttgcta tagttagtct agttttagtt + 6001 ccattgattc gtaaagatgg cggaccagct atttttgctc aaactcgtat agggaaaaat + 6061 ggtcgacatt ttacctttta taaattccgt tcgatgcaga tcgatgctga agctatcaaa + 6121 gaacagttga tggatcaaaa tacgatgcaa ggtggtatgt ttaagataga caatgatcct + 6181 cgtgttacaa aaattggtcg ctttattcgt aaaaccagtt tagatgagtt accccagttt + 6241 tggaatgtct ttataggaga tatgagtttg gtgggaacac gtccacctac agtagacgag + 6301 tatgatcagt atactccaga acagaaacgt cgactcagct ttaaacccgg tattacaggt + 6361 ttatggcagg ttagcggccg tagtaaaata accgattttg acgatgttgt 
aaaattagat + 6421 gtggcttata ttgataattg gacaatctgg aaagatattg aaattttgct taaaactgtt + 6481 aaagttgtat ttatgagaga tggagcgaag taatttctgt atatccatca tattaggaga + 6541 gaaatgaaaa agtcagttta tatcattggt tcaaaaggaa ttcctgctaa gtatggagga + 6601 tttgaaactt ttgttgaaaa attaacagcc ttccaacaag ataagactat ccaatattat + 6661 gtggcttgta tgcgtgaaaa ctctgcaaaa tcagggacta ctgaggatgt ttttgaacat + 6721 aatggtgcta tctgttataa cgtcgatgtt cctaatattg gtccagcgcg agccatagta + 6781 tatgatatcg cggcaattaa cagagctatt aaaattgcca aagaaaataa ggatgaagat + 6841 ccaatcttct atattctagc ttgtcgaatc ggtccgttca tccatggaat taagaaaaaa + 6901 atccaggaga taggtgggac tcttctagtt aatccagatg gtcacgagtg gttacgagct + 6961 aagtggagcg ctccagttcg tcgttattgg aaaatttccg aaggtcttat ggtcaaacat + 7021 gcagatcttt tagtgtgtga tagtaagaat attgaaaaat atatccaaga agattatata + 7081 cagtatcaac ctaagacaac ctatatcgct tatgggacag atacaacacg ctccacatta + 7141 aatagcagtg atgaaaaagt gcgtgcttgg ttcaaggaga aaaatgtttc tgaaaacgag + 7201 tattacctag ttgtaggacg ttttgttcca gaaaataatt atgagtctat gatacgtggt + 7261 ttcttggcgt ctagctctaa gaaggatttt gtcctaatca caaatgtaga acagaataaa + 7321 ttttataatc agctattagc aagtactgga tttgataaag atccacgagt gaaatttgtt + 7381 ggaacagtct acgaccaaga acttctgaag tatattcgag aaaatgcttt tgcttacttc + 7441 cacggacatg aagttggtgg aacaaatcct tcgttacttg aagcattagc atccacaaag + 7501 ttaaacttac tactcgatgt tggttttaac cgcgaagttg gggagcaaag tgcgatctat + 7561 tggaaaaaag atgagctttc ccaagtaatc gagaaagttg aacaatttga tgcaaaaatt + 7621 attgatgagt tagatagaca atcaaatcag agaattgtgg attttttcac ttgggaaaag + 7681 attgtcacag actacgagaa attatttaaa aaatgaaaat attacattat actttaggat + 7741 ttcaacccca gcgaacaggt ggtttggtta aatatgctga ggatttaatg ctagagcaaa + 7801 ttgctcaagg ttatcaagtg gctgccctat atccaggaag aattaagttc ttttcaaaaa + 7861 aaatagaaat aattaaagag acgtcaagac agtttgagtg ttatgagctg cttaatagct + 7921 tacctatggc tttatttgga gggatatccg atccaactgc tttcctgaca ccttgtgaca + 7981 aaaatgttta tcgtactttt ttagaaaaag tacaacccga cattatacat attcactcgt + 8041 ttatgggatt 
gcataaagaa ttcctcgaaa ttgctaaaag cttgaatatt agagttgttt + 8101 ttacgagcca tgattattat ggattagcac ccgtacctca tttctatttt aatggggtgg + 8161 attatagtga taaaagtaca aacttaacat ggaatattat gtcttccaat gctttaagtg + 8221 tgaaaaaact aagacttttt caggtttcat tttatcctac tattcgtaaa cttttgaaac + 8281 tattagggaa aaatccaaaa tctaaaaaga atttagttat tcgagatgtt attgaggagc + 8341 aagattatag tgagcttcga tactattata atgagatgtt tcacttaata gatggttatt + 8401 tgtttaatag tagacttgca aagaaggtat atgagataaa tgagattaag tcagctaata + 8461 gtatagtatt atctataaca aatagttcaa ttaatcatca tcagagattg acaactacaa + 8521 ataataaaat tagagttgct tatattggtc cagatgaaga atataaagga tattttgatt + 8581 ttgttgactt tgttgaaact ttagatcgag agtcctatga agtggcaact tatggccatt + 8641 taccaaatga agagtgtcct tcattcattg aacaaaaagg atattttact aaggaaatga + 8701 ttgacagtgt ctatgaaaat attgatattc ttattgttcc aagtaagtgg aaggaaacat + 8761 ttggattgat aacagtagaa gcattatcct atggggtaaa tgttttcgtg agtgaaaatg + 8821 ttgggtcaaa agacttactt ccagaatcgc atgtttttaa aaatcagaat gatttaatag + 8881 ttaaattttt aaaaaatgat atagaaaata caaaattgaa aactttagat gaacactcga + 8941 tagaagtgat tcagtattat gaaagagtga taaatgatag ttaagagttt cataaaaaag + 9001 attactggaa aaacagtaga cattcatcca gatgtacctt tgtcgtatat actacaaaga + 9061 ggtataaact atagtttcgg actctttcgt ggggttgtac gtggaatcgg atttggtcaa + 9121 aacgacaaac gtttattcat tggacaagga gtttctatct tagcaaagcg taaattattt + 9181 gttggaaaaa atgttcgaat tggtaaaaag gtgtctatag atgcactgtc aaaagaagga + 9241 atccattttg cagataatgt aaagattgga gattattctc aaattattgg cacaggttct + 9301 ataaaaaata tggggattgg cttgaaaatc ggtaagaact catctttttc agaatatagt + 9361 ttatttggtt ctgctggagg tatcacaatt ggtgataatg ttatcgcagg tcagaatgtt + 9421 cgttttcatg ctgaaaatca taattatagt gatttagata aactcattgt tgaacaaggg + 9481 gtatctcgaa agggaatttc agtaggtgat aattgttgga ttggtgctgg atctgttttt + 9541 ttggatgggt ccagcattgg ttcaggttgt gttgtagctg caaattctgt aattacgaaa + 9601 aactttccag ataacgttat tgttgctgga gtaccagcta aaattataaa aatgaaatga + 9661 taggatgtta aatgaggaaa gaaattaaag 
ctgtttatgc gatattaaat tacaatactt + 9721 gggaagatac tgcgcgttta gcacagaaag ttgcaacatt tcagcatatt caatctgtga + 9781 taatagtgga taatctatca acagatgatt cataccatta tttaaaaaga cttgagggag + 9841 agaaaatttc agtttatcaa acacaaagaa atggtggata ttctgttgga aataattttg + 9901 cagcacgaaa agcttataat atgggagttg atattctttt catttcaaat ccagacgttg + 9961 atattgatga aaaagattcc ttgatgattg cacaaaattt gtataaaaat agttcatatg + 10021 cactgctatc aggtatagaa tataatgcta tgaaggagat agatttgcca attgtctggc + 10081 atgaaaattc ctattacgat gacttacttg attgtttgtt tttaaccaga aaatggcgaa + 10141 gaaaaaaaga agatatcaat ttgtcaatga ttaaatcatc tataatagat gtagatcttg + 10201 ttaaaggatc gttttttgct gtaagactgt ctgattttca tgatgttggt tattttgatg + 10261 aatctgtatt tcttttttgt gaagagagaa tattagctaa aaagttacaa aaagtaaata + 10321 aaaaaatagg tattctgcct gaagcgaaat attaccacaa tcattcaact tctataaatg + 10381 agagatataa aaagaaaaaa gaacagatta atttattata taagtctcga tactactata + 10441 atgtaaagta taataatatt agttttgtca aaaaactatg tttaaaatct gtcatgatgc + 10501 tatccatttt agaatatata atcttagata tgatgaattt attatataca aagactaact + 10561 ataagaaaat tcaatagttt aatctgaaat acttcttgtt tcaaagtgga tgattttaga + 10621 gcacggcaaa atgtccttga aaaagtttat tttttcaaag gttatcttgt ggcaaattca + 10681 ggagttagaa cacttttttt cgtcaaatgc tagcttgttt tttaggagat aaaacagatt + 10741 tctaataagt tttttggcaa ggtgaatgat ggctacattg taatgctttc tttgttacaa + 10801 cttagtccta agataggctt taaaaacagg cgaaaagcga gcatatgctt tggtagcttg + 10861 tatgagtgcc caacgtagat gaggggaacc cagtttgacc attttccctg ctaaatcgat + 10921 ttgacctgac tggtaaatag aaggattcgg tccagcaaaa gcttgtaatt gatgaggctt + 10981 atcgaagata tgaatacttc gaatctcaac taagataacg tcacctaaac gattcccaag + 11041 ctcacttggt tatccacgaa ctttgtgcct tgttacctta cacaatataa aacgtttatg + 11101 cgctatcaaa ctcattacca attgaaacaa aaagctgtgg ttagagcctt tcagaaatcg + 11161 tcaagcgatt ggaggaaatg aactaatcca cagtggctta ttccaagtgt accacttgga + 11221 ctttagcagt agcgaactac actaaatata atataaggag aaataggtga gtaaattaat + 11281 attgaacttg aaattaaatt cttttttatt 
tgttataatt ttacttttag ttgttgttac + 11341 tccgactcat accttaattt ttgatgcact aattccaacg aaaattgata atttatggag + 11401 agagtttctt ctagtaattt cttttctatg tattctaaag ataaatgcag gaaaaattaa + 11461 aattggaaag ctagggggcc caataattgt tatgggagga attggtttag tttatactat + 11521 ctgttcagat aggccattta cagctttaaa tctttttaga atttatatgt ttcctgctgt + 11581 aatatatttt ataataataa attgtaattt tcgcaaggag agattactga tattgaagca + 11641 agcgcatgta tatactgctt gcatattagc tttatgggga atttttcagg cgtgggtgtt + 11701 aaaagatcag tttttgatta aaataggata tccttcccaa ggaaattttc taaagagtac + 11761 agctttttat attggtggtt ttttcggtca acaacgagtt actagcactt tttctgctcc + 11821 taatttagct ggagtttatt ttggaatatc tttgatcatt ttactctcta tatttgatac + 11881 tataaagagt aatagattgg tattgttttc aattgtagca gcttttgttc ttacatttag + 11941 ccgtagtgct attataagta ctcttgtagg aatcgtattc tttcaacgta agaaattgtt + 12001 ttcaacgacg aagattaatg ttatgacctt ggtaatcttc cccttaattt ttttgattgt + 12061 tttagttata ttttatcttt atcctgagaa tgttattata aatatgctct atagcagtta + 12121 ttcttcaaca cttaatttga cagattcttc agcggttaag catttggaag acttatggct + 12181 tcctcttcta aaagttattg attatccttt gggacttgga tttggtaata atggcccaat + 12241 tgttctgtca ctctatcact cagcaaattt agtagaatct tctatttatc ttcttgcata + 12301 tgattttggt attttaggaa tgttcatata tttgttccct tatttttata cgatttttgt + 12361 atataaaaaa tatttgctta gcggtgctat atgctgctta gttcttataa cttatctatt + 12421 tcttccaaat gtagaaaatt ttgaaatcat attttttatt taccttttca ttgggatgga + 12481 tgaactagca ctatatacaa aaggaatgaa tgtacatgaa attgattaaa ttattgaaaa + 12541 aatatataaa tttatacatt agtagttcgg tgcctaagac aaataaattg ttaatttttg + 12601 gatcatggtt aggtgaaaaa tatgcagaca atccaagata tttgtttgag tatgtgatta + 12661 agaatcgtcc cgatttaaaa gctatatgga ttacaagtaa tcaagatgtt tttaaagaat + 12721 tacagaagaa acaatatctc gtgatgatgg cagaggcacc tgaaactcgg aaaattgtta + 12781 aaaaagcaaa gtatattttt acagcaactg gtatttttga tattggagaa caaaatgcta + 12841 acttcgttgg aggtgcctat ctaattaatc tatggcatgg cattcctttg aaaaaaatca + 12901 tgtatgatga taaacattca gcacttcaca 
aacgtagtaa actagtgact tgggtagaaa + 12961 aaattcctct tcgaaactat tttgttattt ctactagtac ggcaataact caaatttatc + 13021 agtctgcttt tcgcgtaaag aaatctaata tattagaact tggtcaacct aggaatgact + 13081 atttttatga taagtctaat ccagtgagtt cattaataca ggaattaaaa agtaaaaata + 13141 ttatcttata tatgccgaca catcgcaatg aaggaaagaa acaaatagat ctagataagt + 13201 taatggattt agaacactta aataattggt gtgaagaaac aaagtcaatt tttgtaatta + 13261 aaaagcattt ctatcattca aaagaaaaaa ctatcgataa gaaatattct tcgataattg + 13321 acgtgacaaa tgagaaggtg gatgttcaag aattactcaa atgttcaaat gttttaataa + 13381 ctgactactc aagctgctat attgactact tattgttgaa tcgtccaatt atatttttta + 13441 attatgatta tgatgattac ttgcgggtgg atcgttcgct atattttcca tatgagaatg + 13501 ttactccagg ggagaaatgt caaaactttg atgaattatt agtgactttg caaaatctat + 13561 atgtaggaaa agatgattat agagaagaac gtgaaaatat caaaactttc ttttattcta + 13621 gtgaaactca gaagtcagtt tctgaaaaaa taattaatca cgtactaaat ctataacttt + 13681 attggaatct gtcatgaaaa aaatattaaa taagtattat tctttatcta atcctgtaaa + 13741 agcttcaatt tggtttacta tttgcaatgt tcttcaaaaa ggaatttcaa tgattactgt + 13801 tccagttttt actagagtat tgacaacgga acaatatggt gtatactctg tatatcaatc + 13861 atggtattca ataattggag tttttgcaac actaaaccta tattatggag tctttaataa + 13921 tggaatgatt aaatacgaga aagataaaaa tgtctttact tcctctatgc agggactaac + 13981 aacaacagtt acagctatat ttttactgat atatttaata gggattgatt tttggaactc + 14041 gttgttaggc ttacctacac tactaatctt agtgatgttc tttgatttgt tttttacccc + 14101 tgcttattct ttttgggttg ctcgtcagag atttgaatat aaatatagaa acttagtatt + 14161 tatcacattt attatagcga ttggaagtcc tattattggt atttctgcag ttgttttatc + 14221 gacttataaa gcggaggcta gagttatctc atttgtgtta gttcaatctt gtatagggtt + 14281 atatttctat attttgaacc tttaccgagg taaacatttt ttttgtaaaa aatattggct + 14341 ctatgctttg aattttaatt tacctcttat tcctcattat ttatcgcaat cagttttaaa + 14401 ccaatcggat agaataatga ttaattcaat ggtaggaatg ggagaagcag caatatatag + 14461 tgttgcttac agcatatcaa ttttgatgct tttagtgaca agtgctataa acagctcttt + 14521 tattccttac acatataagt gtattcgaga 
taagaaatat actgaactag ggaaaagtgc + 14581 aaatctttta attactctgg taggcattgg ttcgatttta actatttctc ttggaccaga + 14641 aatcattcaa ttatttgcac caaaacaata ttacgaagca atatggatta ttcctcctgt + 14701 tgctctgtca gtatatttca tgttcttata tcccattttt ggtaacattg agttttactt + 14761 tgaagcaaat cattttgtaa tgtgggcttc aatcggtgga gcaattatga atattttttt + 14821 gaattttatt tttttaaaac actttggata tattgcggca ggctatacaa ctttattctg + 14881 ttatatttta tttgcgttgg gacattacat ttttatgagg agagtactgt atcagaatct + 14941 ttcgggtatc caaatttata attccagata tattttattt ttttcgattc ttcttattat + 15001 tctaatgcta ctaatcgtga ttatttatcc atttatactg attcgttatc ttactatctc + 15061 actcatccta ggaggatgtt ttttaaagag gaaaaagata atgagttcga tagctatcat + 15121 taaacaacag tgaggtacaa gaatgacaga aacaaataaa cagttacatg aaacattaat + 15181 cgaaatttta gactttgtaa aagaaatttg tgaaaaacat gaattaactt attttttggt + 15241 ctttgggaca gctcttggag caaaacgcca ttgtggattt attccatggg atgatgatgt + 15301 tgatattgct ttgccacgag agcactacaa tatatttatc gatgcattat ctgagacgga + 15361 tcaatctata tttagtcttc aaaatgaaga taacgagccg aattattttt taccatttgc + 15421 taaattaaga aaaaacaata cgatttttat tgagaagatt cttgatgttg aatatgagaa + 15481 taacggcatt tacattgata tttttccact agatttcgta gagaatccgg actctttcaa + 15541 ttttaagatt aggagaacta catttaatta tataaagcat attttaaaat tttcaagttg + 15601 cagaagtttt tataaaaata aatacagtaa tgtgcgttat ttgattgaaa atattatgag + 15661 tattcctacc ctgttttttt caaataggag attattattc ttagcgaata gtttaatttc + 15721 atcaacgact aaagctgatt ttattggtca atatgatcag aaaagtaaca aaagagctat + 15781 tatgccttca aactattatt ttccacctag gtccgctgtg tttgaaggaa agacctatag + 15841 tgttcctgcg aaattagaag attatttaaa atgtttttat ggctcggatt atatggaatt + 15901 accaccaata gaaaaaagag tcactcatca accaataaca cttagattcg aaaaataatt + 15961 tgctattctg tagaaggaga atataatgaa aagagtaatt acatatggaa cgtttgattt + 16021 acttcatcat ggacatatca atttattgcg acgtgcaaaa gaattaggtg actatctagt + 16081 ggtagttgtt tcaagtgatg aattcaacct aattgaaaaa aataaagttt gttatttcaa + 16141 ttatgagcat agaaaaagtc tagttgaagc 
tattagatat gttgaccttg ttattcctga + 16201 aacgagttgg gaacaaaaac gcagtgatgt caaagagtat catattgata cttttgtgat + 16261 gggggatgat tggattggag aatttgatta tctaaaagaa gaaggagttg aagtcgttta + 16321 cttacctcgg acgaaagaaa tttcgacaac taaaataaaa aaagatttat caatgtaata + 16381 ttcgtaaata agcattgttc tgttattgtt ctcgaataga ccactgtatt tttaagtaga + 16441 aatgctaaaa tcgatagaaa agagaaaaat gataggacac taccaatata ggtaaaaaat + 16501 atcgtaatta gataaataag aaaggtaccc tactatgaaa ggtattattc tagcaggtgg + 16561 ttcggggaca cgtttatatc ctttgactcg cgctgcatca aaacaactta tgccggttta + 16621 tgataaaccg atgatttact acccactttc aacattgatg ttggctggga ttagggatat + 16681 tttgattatt tccactccac aggatttaca tcgatttcaa gagcttcttc aagacggatc + 16741 tgagtttggg atcaaacttt cttatgcaga gcaaccaagt ccagatggtt tggcacaagc + 16801 ctttatcatt ggggaagagt ttatttctga tgatagcgtt gcgctaatct taggtgataa + 16861 tatctaccat ggttctgggc tttccaatat gctacaaaag gcagcgagta aggagtcggg + 16921 agcaactgtt tttggctacc atgtcaagga tccagagcgc tttggtgtgg ttgagtttga + 16981 tcaggatatg aaggctattt ctattgaaga aaagccagag caacctcgtt caaactatgc + 17041 agttacaggt ctctatttct atgataatga tgtagtagag attgccaaga gtattaaacc + 17101 aagtcctcgt ggtgaactgg aaattacaga tgtaaacaaa gcttacctag atcgtggtga + 17161 tttgtctgtt gagcttatgg gacgtggctt tgcttggctg gatactggaa ctcatgaaag + 17221 tttactagag gcttcacagt acatcgaaac agtgcaacgg atgcaaaatg ttcaggtagc + 17281 aaacttagaa gaaattgcct atcgcatggg ttatatcagt cgtgaagatg tattgacctt + 17341 agcccaacca cttaagaaaa atgaatacgg acagtatctg ctccgtttga ttggagaagc + 17401 atagatgaca gataattttt tcggtaagac gcttgcggca cgcaaggttg aagctattcc + 17461 aggcatgttg gagtttgata tccccgttca tggagataat cgtggctggt ttaaagaaaa + 17521 tttccaaaag gaaaaaatgc ttccacttgg atttccagag tctttctttg cagaaggaaa + 17581 attgcaaaac aatgtatcct tctcacgtaa aaatgtcctt cgaggcctcc acgcagagcc + 17641 ttgggataag tacatctctg tagcagatgg agggaaagtt ctgggttctt gggttgatct + 17701 acgcgagggt gaaacctttg ggaataccta tcagacagta attgatgcaa gcaagggaat + 17761 ctttgttcct cgaggcgtag ctaatggctt 
ccaagttcta tcagatacag tgtcatatag + 17821 ctatctggtc aatgattact gggctctcga gctcaaaccc aagtatgcct ttgtgaacta + 17881 cgctgatcca agccttggta ttgaatggga aaatattgca gaagcagagg tttcagaagc + 17941 agataaacat catcccctac ttaaggatgt aaaacctttg aaaaaagaag atttgtaaaa + 18001 aggaaagaat atgactgaat acaaaaatat tatcgtgaca ggtggagctg gctttatcgg + 18061 ttctaacttt gtccattatg tttacgagaa ctttccaggt gttcacgtga cagtcctaga + 18121 taagttgact tatgctggaa atcgcgcgaa tattgaggaa attttaggta atcgtgttga + 18181 gttagttgtt ggtgacattg ctgatgcgga gttggtagac aagttggctg ctcaagcaga + 18241 tgctatcgtt cattatgcag cggaaagcca caatgataat tcgctcaatg atccatcgcc + 18301 atttattcat actaacttca tcggaaccta tactctttta gaagctgctc gtaagtatga + 18361 tattcgcttc caccatgtat cgacagatga agtttatggg gatctccctt tacgcgaaga + 18421 tttgccaggt catggtgaag gaccaggtga gaaatttact gctgaaacca agtacaatcc + 18481 aagctcgcct tactcatcaa ccaaggcagc atcagatttg attgtcaaag cctgggtccg + 18541 ttcttttgga gtcaaggcaa cgatttccaa ctgttcaaat aactacggtc cttatcaaca + 18601 tatcgaaaaa ttcatcccac gtcagattac taacatccta agtggaatta agccaaaact + 18661 ttacggtgaa ggtaagaacg ttcgtgactg gattcatacc aatgaccatt cttcaggagt + 18721 ttggacaatc ttgacaaaag ggcaaattgg tgaaacctac ttgattgggg ctgatggtga + 18781 gaagaacaat aaggaagttt tggaacttat ccttaaggaa atgggacaag ctgcggatgc + 18841 ctatgatcat gtgactgacc gtgcaggaca tgaccttcgc tatgcgattg atgctagcaa + 18901 gctccgtgat gagttggggt ggaaacctga atttaccaac tttgaagctg ggctcaaggc + 18961 aacaatcaag tggtatacag ataaccaaga atggtggaaa gcagaaaaag aagctgttga + 19021 agccaattat gctaagactc aggagattat tacagtataa aaagcaggaa atagctgctt + 19081 tttattgcta tattgggaag agttacatat tagaaaggtc tagagatgat tttaattaca + 19141 ggggcaaatg gccaattagg aacggaactt cgctatttat tggatgaacg taatgaagaa + 19201 tacgtggcag tagatgtggc cgagatggac attaccgatg cagaaatggt tgagaaagtt + 19261 tttgaagagg tgaaaccgac tttagtctac cactgtgcag cctacaccgc tgttgatgca + 19321 gcagaggatg aaggaaaaga gttggacttc gccatcaatg tgacggggac aaaaaatgtc + 19381 gcaaaagcat ctgaaaagca tggtgcaact 
ctagtttata tttctacgga ctatgtcttt + 19441 gacggtaaga aaccagttgg acaagagtgg gaagttgatg accgaccaga tccacagaca + 19501 gaatatggcc gtactaagcg tatgggggaa gagttagttg agaagcatgt gtctaatttc + 19561 tatattatcc gtactgcctg ggtatttgga aattatggta aaaacttcgt ttttaccatg + 19621 caaaatcttg cgaaaactca taagacttta acagttgtaa atgaccagta cggtcgtccg + 19681 acttggactc gtaccttggc tgagttcatg acctacctag ctgaaaatcg taaggaattt + 19741 ggttattatc atttgtcaaa tgatgcgaca gaagacacaa catggtatga ttttgcagtt + 19801 gaaattttga aagatacaga tgtcgaagtc aatccagtag attccagtca atttccagcc + 19861 aaagctaaac gtccgctaaa ctcaacgatg agcctggcca aagccaaagc tactggattt + 19921 gttattccaa cttggcaaga tgcattgcaa gaattttaca aacaagaagt gagataagta + 19981 gtagaatgat tttctagtct aataaaagag gcagataatg aactccaaag gagcttaaga + 20041 tgtacgatta tcttgttgtt ggtgctggtc tctttggcgc atagctttgg ctcagtttct + 20101 attatcgctc acaccatcca tcagaagttt aatctgaagg tacccaatta tcgccaagaa + 20161 gaagattggg ctaggatggg tttaccaatc acacgtaagg aaatctctaa ttggcatatc + 20221 aaggcaagtc aatactattt agagtccctt tataagcttt tacgagaaaa gttgttagaa + 20281 caacctcttc ttcatgcgga tgaaacctct tatcgggtct tagaaagtga tagtcagctg + 20341 acctactatt ggaccttttt atctgggaaa gctgagaatc aagcaatcac gctgtaccac + 20401 catgatcagc gtcgaagtgg tttagtagta caagaattcc taggagatta ttctggctat + 20461 gtgcattgtg atatgttgcg gcagtaactt aggactttag tcctctagtt ctgcctatgc + 20521 gatagcagtc caaggtttag gagcaaggcg acgctaagct tggtaaactg cgaaccgcta + 20581 gaagcttatc gtcaactggc agaagctgaa cttgttggat gttgggcaca tgtgagaagg + 20641 aagttttttg aagcgacccc caagcaagcg gataaatcat cgttaggagc taaaggttta + 20701 gcttattgta atcagttatt ttccttggaa agagactggg aggctttgcc agctgatgaa + 20761 cgactacaga aacgtcaaga agagctccaa cccctaatgg aagacttctt tgcttggtgc + 20821 cggcgtcagt cagttttatc gggttcaaaa ctaggaaggg caattgaata cagcctcaag + 20881 tataaagaaa cctttaagac tattttgaaa gacggacatc tggtcctttc caataatcta + 20941 gctgaatgcg ccattaaatc attggttatg ggacggagta aaagagttca gtggactctt + 21001 ttagcctaag ctcagtttaa aaaagcgagg 
gtggttattt tctcaaaatt ttgaaggagc + 21061 taaagcaaga gctattatta tgagtttgtt ggaaacagct aaacgtcatc aattaaatag + 21121 cgagaaatat ctattctatc ttctagaatg tcttccaaac gaggaaactc tcgtaaacaa + 21181 agaggtttta gaggcttatt taccatggac taaagttgta caagaaaagt gcaaataaga + 21241 aatctccaga ttaggaacta tccgtgagtt ctctagtctg gagatttttc aatatacttc + 21301 gttattggac ggttacgata ttcatatttt ttgcaaagat gttgtttgaa aaatattttt + 21361 caaaaattct gaaaattctg ttgacaactt tctgaaaaga gtctataatg gagagaaagt + 21421 tttaaaggag aaaatgatga aaagttcaaa actacttgcc cttgcgggcg tgacattatt + 21481 g +// + diff --git a/public/res/serotype_genbank/serotype_16X.gb b/public/res/serotype_genbank/serotype_16X.gb new file mode 100755 index 0000000..c3fa0b8 --- /dev/null +++ b/public/res/serotype_genbank/serotype_16X.gb @@ -0,0 +1,975 @@ +LOCUS MK606430 25451 bp DNA linear BCT 30-SEP-2020 +DEFINITION Streptococcus pneumoniae strain GPS_ZA_carriage_SP1571 cps gene + cluster, complete sequence. +ACCESSION MK606430 +VERSION MK606430.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 25451) + AUTHORS van Tonder,A.J., Gladstone,R.A., Lo,S.W., Nahm,M.H., du Plessis,M., + Cornick,J., Kwambana-Adams,B., Madhi,S.A., Hawkins,P.A., + Benisty,R., Dagan,R., Everett,D., Antonio,M., Klugman,K.P., von + Gottberg,A., Breiman,R.F., McGee,L., Bentley,S.D. and The Global + Pneumococcal Sequencing,C.O. + TITLE Putative novel cps loci in a large global collection of pneumococci + JOURNAL Microb Genom 5 (7) (2019) + PUBMED 31184299 +REFERENCE 2 (bases 1 to 25451) + AUTHORS van Tonder,A.J. + TITLE Direct Submission + JOURNAL Submitted (06-MAR-2019) Parasites and Microbes, Wellcome Sanger + Institute, Wellcome Genome Campus, Hinxton, Cambridge CB10 1SA, + United Kingdom +COMMENT ##Assembly-Data-START## + Assembly Method :: Velvet v. 
1.2 + Sequencing Technology :: Illumina + ##Assembly-Data-END## +FEATURES Location/Qualifiers + source 1..25451 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="GPS_ZA_carriage_SP1571" + /isolation_source="nasopharyngeal swab" + /host="Homo sapiens" + /db_xref="taxon:1313" + /geo_loc_name="South Africa" + /collection_date="2010" + misc_feature 1..25451 + /note="cps gene cluster" + gene 1..1611 + /gene="dexB" + CDS 1..1611 + /gene="dexB" + /EC_number="3.2.1.70" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3280" + /inference="protein motif:CLUSTERS:PRK10933" + /inference="protein motif:Pfam:PF00128.18" + /inference="protein motif:TIGRFAMs:TIGR02403" + /inference="similar to AA sequence:RefSeq:YP_004326655.1" + /inference="similar to AA sequence:UniProtKB:Q99040" + /note="trehalose-6-phosphate hydrolase; maltooligosyl + trehalose synthase; alpha,alpha-phosphotrehalase; alpha + amylase catalytic domain protein" + /codon_start=1 + /transl_table=11 + /product="glucan 1,6-alpha-glucosidase" + /protein_id="QCO91882.1" + /translation="MQEKWWHNAVVYQVYPKSFMDSNGDGIGDLPGITSKLDYLAKLG + ITAIWLSPVYDSPMDDNGYDIADYQAIATIFGTMEDMDQLIAEAKKRDIRIIMDLVVN + HTSDEHAWFVEACENPNSPERDYYIWRDEPNDLDSIFSGSAWEYDEKSGQYYLHFFSK + KQPDLNWENEKLRQKIYEMMNFWIDKGIGGFRMDVIDMIGKIPDEKVVNNGPMLHPYL + KEMNQATFGDKDLLTVGETWGATPEIAKLYSDPKGQELSMVFQFEHIGLQYQEGQPKW + HYQKELNIAKLKEIFNKWQTELGVEDGWNSLFWNNHDLPRIVSIWGNDQEYREKSAKA + FAILLHLMRGTPYIYQGEEIGMTNYPFETLDQVEDIESLNYAREALEKGVPIEEIMDS + IRVIGRDNARTPMQWDESKNAGFSTGQPWLAVNPNYEMINVQEALANPDSIFYTYQKL + VQIRKENSWLIRADFELLDTADKVFAYIRKDGDRRFLVVANLSNEEQDLTVEGKVKSV + LIENTAAKEVLEKQVLAPWDAFCVEMTD" + CDS complement(1862..2044) + /inference="ab initio prediction:Prodigal:2.60" + /codon_start=1 + /transl_table=11 + /product="hypothetical protein" + /protein_id="QCO91883.1" + /translation="MGSFSLKEVTLSLTFRREKVRSVRQAFHLIRGLELLGWRAKAKT + SLGLADKTASRIPRVK" + CDS complement(2060..3457) + /gene="tnp" + /inference="ab initio 
prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3415" + /inference="protein motif:Pfam:PF00665.20" + /inference="similar to AA sequence:RefSeq:YP_006065738.1" + /note="integrase core domain protein" + /codon_start=1 + /transl_table=11 + /product="IS1202 transposase" + /protein_id="QCO91884.1" + /translation="MNETKKYLVIKAIAQGKKTKKRACVELNLSERQINRLLLAYQQK + GKEAFRHGNRNRKPKHAIPDEIKERVLKKYLSYETYKPNVLHFCELLAEEEGIKLSDT + TVRKILYKKNILSPKSHRKTKKRVRKQAKLNLNQPLDNPILPTAKDFLENPKKVHPSR + PRKKFAGELIQMDASPHAWFGPETTNLHLAIDDASGNILGAYFDKQETLNAYYHVLEQ + ILVNHGIPLQMKTDKRTVFTYQASNSKKMEDDTYTQFGYACHQLGILLETTSIPQAKG + RVERLNQTLQSRLPIELERNKIHTLEEANTFLLSYIQTFNEQFGNKTKLSVFEEAPNL + SERNLILARLAERVVDSGHHIRFQNRYYIPTEQGKEVYFIRKTKALVIKAFDGDIYLN + IADKIYHTKELLDYELYSKNFEQEPEQKKERRKYIPPQTHPWKLTSFKQYLHKNKKDY + EEFTSEELHSPQLQV" + gene 3608..5053 + /gene="wzg" + CDS 3608..5053 + /gene="wzg" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK09379" + /inference="protein motif:Pfam:PF03816.8" + /inference="protein motif:TIGRFAMs:TIGR00350" + /inference="similar to AA sequence:RefSeq:YP_001835063.1" + /inference="similar to AA sequence:UniProtKB:Q7WY78" + /note="putative transcriptional regulator ywtF; + membrane-bound transcriptional regulator LytR; cell + envelope-related function transcriptional attenuator + common domain; cell envelope-related transcriptional + attenuator domain protein" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + wzg" + /protein_id="QCO91885.1" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSVSVAVLADSEIEDVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSTLHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + 
EALKNYSTIIDSLQDSIQTNMPLETMINLVNAQLESGGSYKVNSQDLKGTGRTDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + gene 5055..5786 + /gene="wzh" + CDS 5055..5786 + /gene="wzh" + /EC_number="3.1.3.48" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG4464" + /inference="protein motif:Pfam:PF02811.13" + /inference="similar to AA sequence:RefSeq:YP_003878593.1" + /inference="similar to AA sequence:UniProtKB:Q9AHD4" + /note="capsular polysaccharide biosynthesis protein; PHP + domain protein" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein phosphatase wzh" + /protein_id="QCO91886.1" + /translation="MIDIHSHIVFDVDDGPKSIEDSKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREMAKEVASDLVIAYGAEIYYTPDVLEKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEQDLVHVIASDMHNLDGRPPHMAEAYGLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + gene 5795..6487 + /gene="wzd" + CDS 5795..6487 + /gene="wzd" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3944" + /inference="protein motif:Pfam:PF02706.9" + /inference="protein motif:TIGRFAMs:TIGR01006" + /inference="similar to AA sequence:RefSeq:NP_344881.1" + /inference="similar to AA sequence:UniProtKB:P72367" + /note="capsular polysaccharide type 8 biosynthesis protein + cap8A; capsular polysaccharide biosynthesis protein; MPA1 + family polysaccharide export protein; chain length + determinant protein" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + wzd" + /protein_id="QCO91887.1" + /translation="MKEQNTIEIDVFQLFKTLWKRKLMILIVALVTGAGAFAYSAFIV + KPEYTSTTRIYVVNRNQGDKPGLTNQDLQAGSYLVKDYREIILSQDVLEEVISDLKLD + LTPKGLANKIKVTVPVDTRIVSISVNNRVPEEASRIANSLREVAAQKIISITRVSDVT + TLEEARPAISPSSPNIKRNTLIGFLAGGIGTGVIVLLLELLDTHVKRPEDIEDTLQMP + LLGVVPNFNKLK" + gene 6497..7180 + /gene="wze" + CDS 6497..7180 + /gene="wze" + /EC_number="2.7.10.2" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein 
motif:Cdd:COG3944" + /inference="protein motif:CLUSTERS:PRK11519" + /inference="protein motif:Pfam:PF01656.17" + /inference="protein motif:TIGRFAMs:TIGR01007" + /inference="similar to AA sequence:RefSeq:YP_001835066.1" + /inference="similar to AA sequence:UniProtKB:Q54520" + /note="tyrosine-protein kinase CpsD; tyrosine kinase; + capsular polysaccharide biosynthesis protein; capsular + exopolysaccharide family protein; CobQ/CobB/MinD/ParA + nucleotide binding domain" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Cps14D" + /protein_id="QCO91888.1" + /translation="MPTLEIAQKKMEFIKKAEEYYNALCTNIQLSGDKLKVISITSVN + AGEGKTTTSVNIARSFARAGYKTLLIDGDTRNSVMSGVFKSREKITGLTEFLSGTADL + SHGLCDTNIENLFVVQSGSASPNPTALLQSKNFNDMIETLRKYFDYIIVDTAPIGIVI + DAAIITQKCDAFILVTATDEVNKRDVQKAKQQLEQTEKLFLGVILNKFDVQYEKYGSY + GDYGNYGKK" + gene 7196..8563 + /gene="wchA" + CDS 7196..8563 + /gene="wchA" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK15204" + /inference="protein motif:Pfam:PF02397.10" + /inference="protein motif:TIGRFAMs:TIGR03025" + /inference="similar to AA sequence:RefSeq:YP_001835067.1" + /inference="similar to AA sequence:UniProtKB:P71241" + /note="putative colanic biosynthesis UDP-glucose lipid + carrier transferase; undecaprenyl-phosphate galactose + phosphotransferase; exopolysaccharide biosynthesis + polyprenyl glycosylphosphotransferase; Bacterial sugar + transferase" + /codon_start=1 + /transl_table=11 + /product="glucosyl-1-phosphate transferase" + /protein_id="QCO91889.1" + /translation="MDEKGLKIFLAVLQSIIVILLVYFLSFVRETELERSSMVILYLL + HFFVFYFSSYGNNFFKRGRLVEFNSTIRYIFFFAIAISVLNFFIAERFSISRRGMVYF + LTLEGISLYLLNFLVKKYWKHVFFNLKNSKKILLLTVTKNMEKVLDKLLESDELSWKL + VAVSVLDKSDFQHDKIPVIEKEKIIEFATHEVVDEVFVNLPGESYDIGEIISRFETMG + IDVTVNLKAFDKNLGRNKQIYEMVGLNVVTFSTNFYKTSHVISKRILDICGAIIGLIL + FAIASLILVPLIRKDGGPAIFAQTRIGKNGRHFTFYKFRSMRIDAEAIKEQLMDQNTM + 
QGGMFKIDNDPRVTKIGRFIRKTSLDELPQFWNVFIGDMSLVGTRPPTVDEYDQYTPE + QKRRLSFKPGITGLWQVSGRSKITDFDDVVKLDVAYIDNWTIWKDIEILLKTVKVVFM + RDGAK" + gene 8594..9766 + /gene="wchF" + CDS 8594..9766 + /gene="wchF" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF09314.5" + /inference="protein motif:TIGRFAMs:TIGR03088" + /inference="similar to AA sequence:RefSeq:YP_002510379.1" + /note="PEP-CTERM/EpsH1 system-associated sugar + transferase; DUF1972 protein" + /codon_start=1 + /transl_table=11 + /product="rhamnosyltransferase WchF" + /protein_id="QCO91890.1" + /translation="MKKSVYIIGSKGIPAKYGGFETFVEKLTAFQQDKAIQYYVACMR + ENSAKSGTTEDIFEHNGAICYNVDVPNIGPARAIVYDIAAINRAIKIAKENKDEDPIF + YILACRIGPFIHGIKKKIQAIGGTLLVNPDGHEWLRAKWSAPVRRYWKISEGLMVKHA + DLLVCDSKNIEKYIQEDYKQYQPKTTYIAYGTDTTRSILKSSDEKVRSWFKEKNVSEN + EYYLVVGRFVPENNYEAMIRGFLASNSKKDFVLITNVEQNKFYNQLLASTGFDKDPRV + KFVGTVYDQELLKYIRENTFAYFHGHEVGGTNPSLLEALASTKLNLLLDVGFNREVGE + QSAIYWKKDELSQVIEKVEQFDAKMIDELDRQSNQRIVDSFTWEKIVTDYEKLFKK" + gene 9763..11034 + /gene="wciU" + CDS 9763..11034 + /gene="wciU" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF00534.14" + /codon_start=1 + /transl_table=11 + /product="glycosyl transferase group 1" + /protein_id="QCO91891.1" + /translation="MKILHYTLGFQPQRTGGLVKYAEDLMLEQIAQGYQVAALYPGRI + KFFSKKIEIIKATSRQFECYELLNSLPMALFGGISDPTAFLTPCDKNVYRTFLEKVQP + DIIHIHSFMGLHKEFLEIAKNLNIRVVFTSHDYYGLAPVPHFYFNGVDYSDKSTNLTW + NIMSSNALSVKKLRLFQLSFYPTIRKLLKLLGKNPKSKNNLVIRDVIEEQDYSELRYY + YNEMFHLIDGYLFNSRLAKKVYEINEIKSANSIVLSITNSSINHHQRLITTNNKIRVA + YIGPDEEYKGYFDFVDFVETLDRESYEVATYGHLPNEECPSFIEQKGYFTKEMIDSVY + ENIDILIVPSKWKETFGLITVEALSYGVSVFVSENVGSKDLLPESHVFKNQNDLVVKF + LKNDIENTKLKTLDEHSIEVIQYYERVINDS" + gene 11024..11710 + /gene="wcxM" + CDS 11024..11710 + /gene="wcxM" + /EC_number="2.3.1.-" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG0110" + /inference="protein motif:CLUSTERS:PRK09677" + /inference="protein 
motif:Pfam:PF00132.18" + /inference="protein motif:TIGRFAMs:TIGR03308" + /inference="similar to AA sequence:RefSeq:YP_008629857.1" + /inference="similar to AA sequence:UniProtKB:Q7A3E8" + /note="putative acetyltransferase SA2342; putative + lipopolysaccharide biosynthesis O-acetyl transferase WbbJ; + isoleucine patch superfamily acetyltransferase; + transferase hexapeptide repeat family phosphonate + metabolim protein; Bacterial transferase hexapeptide (six + repeats)" + /codon_start=1 + /transl_table=11 + /product="acetyltransferase" + /protein_id="QCO91892.1" + /translation="MIVKSFIKKITGKTVDIHPDVPLSYILQRGINYGFGLFRGVVRG + IGFGQNDKRLFIGQGVSILAKRKLFVGKNVRIGKKVSIDALSKEGIHFADNVKIGDYS + QIIGTGSIKNMGIGLKIGKNSSFSEYSLFGSAGGITIGDNVIAGQNVRFHAENHNYSD + LDKLIVEQGVSRKGISVGDNCWIGAGAVFLDGSSIGSGCVVAANSVITKNFPDNVIVA + GVPAKIIKMK" + gene 11722..12627 + /gene="wcxN" + CDS 11722..12627 + /gene="wcxN" + /EC_number="2.4.1.-" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF00535.20" + /inference="similar to AA sequence:RefSeq:YP_004622337.1" + /note="glycosyltransferase family 2" + /codon_start=1 + /transl_table=11 + /product="rhamnosyltransferase" + /protein_id="QCO91893.1" + /translation="MGKEIKAVYAILNYNTWEDTARLAQKVATFQHIQSVIIVDNLST + DDSYHYLKRLEGEKISVYQTQRNGGYSVGNNFAARKAYNMGVDILFISNPDVDIDEKD + SLMIAQNLYKNSSYALLSGIEYNAMKEIDLPIVWHENSYYDDLLDCLFLTRKWRRKKE + DINLSMIKSSIIDVDLVKGSFFAVRLSDFHDVGYFDESVFLFCEERILAKKLQKANKK + IGILPEAKYYHNHSTSINERYKKKKEQINLLYKSRYYYNVKYNNISFVKKLCLKSVMM + LSILEYIILDMMNLLYTKTNYKKIQ" + gene 13318..14580 + /gene="wzy" + CDS 13318..14580 + /gene="wzy" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3307" + /note="O-antigen ligase" + /codon_start=1 + /transl_table=11 + /product="lipid A core O-antigen ligase-related enzyme wzy" + /protein_id="QCO91894.1" + /translation="MSKLRLNLKLNSFLFVIILLLVVVTPTHTLIFDVLIRTKIDNLW + REFFLVISFLCILKINAGKIKIGKLGGPIIVMGGIGLVYTICSDRPFTALNLFRIYMF + 
PAVIYFIIINCNFRKERLLILKQAHVYTACILALWGIFQAWVLKDQFLIKIGYPSQGN + FLKSTAFYIGGFFGQQRVTSTFSAPNLAGVYFGISLIILLSIFDTIKSNRLVLFSIVA + ALVFTFSRSAIISTLVGIVFFQRKKLFSTMKINVMTLVIFPLIFLIVLVIFYLYPENT + IINMLYSSYSSTLNLTDSSAVKHLEDLWLPLLKVIDYPLGLGFGNNGPIVLSLYQSAN + LVESSIYLLAYDFGILGMFMYLFPYFYTIFVYKKYLLSGAICCLVLITYLFLPNVENF + EIIFFIYLFIGMDELALYTKGMNVHEID" + gene 14567..15727 + /gene="wchX" + CDS 14567..15727 + /gene="wchX" + /EC_number="2.7.8.12" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF04464.8" + /inference="similar to AA sequence:RefSeq:YP_002510384.1" + /inference="similar to AA sequence:UniProtKB:P13485" + /note="CDP-glycerol:poly(glycerophosphate) + glycerophosphotransferase" + /codon_start=1 + /transl_table=11 + /product="glycerol phosphotransferase WchX" + /protein_id="QCO91895.1" + /translation="MRLIKLLKKYINLYISSSVPKTSKLLIFGSWLGEKYADNPRYLF + EYVIKNRPDLKAIWITSNQDIFKELQKKQYLVMMAEAPETRKIVKKAKYIFTATGIFD + IGEQNANFVGGAYLINLWHGIPLKKIMYDDKHSALHKRSKLVTWVEKIPLRNYFVIST + STAITQIYQSAFRVKKSNILELGQPRNDYFYDKSNPVSSLIQELKSKNIILYMPTHRN + EGKKQIDLDKLMDLEHLNNWCEETKSIFVIKKHFYHSKEKTIDKKYSSIIDVTNEKVD + VQELLKYSNVLITDYSSCYIDYLLLNRPIIFFNYDYDDYLRVDRSLYFPYENVTPGEK + CQNFDELLVTLQNLYVGKDDYREERENIKTFFYSSETQKSVSEKIINHVLNL" + gene 15745..17184 + /gene="wzx" + CDS 15745..17184 + /gene="wzx" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF01943.11" + /inference="similar to AA sequence:RefSeq:YP_003875982.1" + /note="polysaccharide biosynthesis protein" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="QCO91896.1" + /translation="MKKILNKYYSLSNPVKASIWFTICNVLQKGISMITVPVFTRVLT + TEQYGVYSVYQSWYSIIGVFATLNLYYGVFNNGMIKYEKDKNVFTSSMQGLTTTVTAI + FLLIYLIGIDFWNSLLGLPTLLILVMFFDLFFTPAYSFWVARQRFEYKYRNLVFITFI + IAIGSPIIGISAVVLSTYKAEARVISFVLVQSCIGLYFYILNLYRGKHFFCKKYWRYA + LNFNLPLIPHYLSQSVLNQSDRIMINSMVGMGEAAIYSVAYSISILMLLVTSAINSSF + IPYTYKCIRDKKYTELGKSANLLITLVGIGSILTISLGPEIIQLFAPKQYYEAIWIIP + 
PVALSVYFMFLYPIFGNIEFYFEANHFVMWASIGGAIMNIFLNFIFLKHFGYIAAGYT + TLFCYILFALGHYIFMRRVLYQNLSGIQIYNSRYILFFSILLIILMLLIVIIYPFILI + RYLTISLILGGCFLKRKKIMSSIAIIKQQ" + gene 17194..18009 + /gene="wcxQ" + CDS 17194..18009 + /gene="wcxQ" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3475" + /inference="protein motif:Pfam:PF04991.7" + /inference="similar to AA sequence:RefSeq:YP_004326645.1" + /note="LPS biosynthesis protein" + /codon_start=1 + /transl_table=11 + /product="LicD superfamily protein" + /protein_id="QCO91897.1" + /translation="MTETNKQLHETLIEILDFVKEICEKHELTYFLVFGTALGAKRHC + GFIPWDDDVDIALPREHYNIFIDALSETDQSIFSLQNEDNEPNYFLPFAKLRKNNTIF + IEKILDVEYENNGIYIDIFPLDFVENPDSFNFKIRRTTFNYIKHILKFSSCRSFYKNK + YSNVRYLIENIMSIPTLFFSNRRLLFLANSLISSTTKADFIGQYDQKSNKRAIMPSNY + YFPPRSAVFEGKTYSVPAKLEDYLKCFYGSDYMELPPIEKRVTHQPITLRFEK" + gene 18037..18429 + /gene="gct" + CDS 18037..18429 + /gene="gct" + /EC_number="2.7.7.39" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG0615" + /inference="protein motif:CLUSTERS:PRK11316" + /inference="protein motif:Pfam:PF01467.1" + /inference="protein motif:TIGRFAMs:TIGR01518" + /inference="similar to AA sequence:RefSeq:YP_003875983.1" + /inference="similar to AA sequence:UniProtKB:P27623" + /note="glycerol-3-phosphate cytidylyltransferase; + bifunctional heptose 7-phosphate kinase/heptose + 1-phosphate adenyltransferase; cytidylyltransferase" + /codon_start=1 + /transl_table=11 + /product="CDP-glycerol-1-phosphate biosynthetic protein + Gct" + /protein_id="QCO91898.1" + /translation="MKRVITYGTFDLLHHGHINLLRRAKELGDYLVVVVSSDEFNLIE + KNKVCYFNYEHRKSLVEAIRYVDLVIPETSWEQKRSDVKEYHIDTFVMGDDWIGEFDY + LKEEGVEVVYLPRTKEISTTKIKKDLSM" + gene 18587..19456 + /gene="rmlA" + CDS 18587..19456 + /gene="rmlA" + /EC_number="2.7.7.24" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG4750" + /inference="protein motif:CLUSTERS:PRK15480" + /inference="protein 
motif:Pfam:PF00483.17" + /inference="protein motif:TIGRFAMs:TIGR01207" + /inference="similar to AA sequence:RefSeq:YP_815843.1" + /inference="similar to AA sequence:UniProtKB:P26393" + /note="glucose-1-phosphate thymidylyltransferase RfbA; + CTP:phosphocholine cytidylyltransferase; nucleotidyl + transferase" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase" + /protein_id="QCO91899.1" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLHRFQELLQDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFISDDSV + ALILGDNIYHGSGLSKMLQKAASKESGATVFGYHVKDPERFGVVEFDQDMKAISIEEK + PEQPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLTLAQPLKKN + EYGQYLLRLIGEA" + gene 19457..20050 + /gene="rmlC" + CDS 19457..20050 + /gene="rmlC" + /EC_number="5.1.3.13" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF00908.11" + /inference="protein motif:TIGRFAMs:TIGR01221" + /inference="similar to AA sequence:RefSeq:YP_003878604.1" + /inference="similar to AA sequence:UniProtKB:Q5XCG7" + /note="putative dTDP-4-dehydrorhamnose 3,5-epimerase" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-dehydrorhamnose 3,5-epimerase" + /protein_id="QCO91900.1" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVYGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTIIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKNHPLLKDVKPLKKEDL" + gene 20063..21112 + /gene="rmlB" + CDS 20063..21112 + /gene="rmlB" + /EC_number="4.2.1.46" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK10084" + /inference="protein motif:Pfam:PF01370.15" + /inference="protein motif:TIGRFAMs:TIGR01181" + /inference="similar to AA sequence:RefSeq:YP_006742612.1" + /inference="similar to AA sequence:UniProtKB:P95780" + /note="dTDP-glucose 4,6 dehydratase; NAD-dependent + epimerase/dehydratase family protein" + 
/codon_start=1 + /transl_table=11 + /product="dTDP-glucose 4,6-dehydratase" + /protein_id="QCO91901.1" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPDVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAAD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + gene 21178..22029 + /gene="rmlD" + CDS 21178..22029 + /gene="rmlD" + /EC_number="1.1.1.133" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK09987" + /inference="protein motif:Pfam:PF04321.11" + /inference="protein motif:TIGRFAMs:TIGR01214" + /inference="similar to AA sequence:RefSeq:YP_141831.1" + /inference="similar to AA sequence:UniProtKB:P29781" + /note="dTDP-4-dehydrorhamnose reductase; RmlD + substrate-binding domain protein" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase" + /protein_id="QCO91902.1" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITDAEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTQNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + gene 22092..22538 + /gene="tnp" + CDS 22092..22538 + /gene="tnp" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3436" + /inference="protein motif:Pfam:PF03050.8" + /inference="similar to AA sequence:RefSeq:YP_002037044.1" + /note="transposase IS66 Orf2-like protein" + /codon_start=1 + /transl_table=11 + /product="IS66-Spn1 transposase" + /protein_id="QCO91903.1" + /translation="MYDYLVVVLVSLVHSFGSVSIIAHTIHQKFNLKVPNYRQEEDWA + RMGLPITRKEISNWHIKASQYYLESLYNLLREKLLEQPLLHADETSYRVLESDSHLTY + YWTFLSGKDENQAITLYHHDQRRSGLVVQEFLGDYSGYVHCDMLRQ" + gene 22807..23049 + 
/gene="tnp" + CDS 22807..23049 + /gene="tnp" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF03050.8" + /inference="similar to AA sequence:RefSeq:YP_003879023.1" + /note="transposase IS66 family protein" + /codon_start=1 + /transl_table=11 + /product="transposase" + /protein_id="QCO91904.1" + /translation="MNDYRNVQPLMEDFFAWCRRQSVLAGSKPGRAIEYSLKYEETFK + TILKDGHLVLSNNLAERAIKSLVMGRSKRVHWTLLA" + gene 23120..23278 + /gene="tnp" + CDS 23120..23278 + /gene="tnp" + /inference="ab initio prediction:Prodigal:2.60" + /inference="similar to AA sequence:RefSeq:YP_003878609.1" + /codon_start=1 + /transl_table=11 + /product="transposase" + /protein_id="QCO91905.1" + /translation="MSLLETAKRHQLNSEKYLFYLLECLPNEETLVNKEVLEAYLPWT + KVVQEKCK" +ORIGIN + 1 atgcaagaaa aatggtggca taatgccgta gtctatcaag tctatccaaa gagttttatg + 61 gatagtaatg gagatggaat tggcgatttg ccaggaatta ccagtaagtt ggactatcta + 121 gccaagctag gaatcacagc aatttggctt tctcccgttt atgacagccc tatggatgat + 181 aatggctacg atattgctga ttatcaagcg attgcaacga tttttggaac catggaggat + 241 atggatcaac tgattgcgga agctaagaag cgtgatatcc gtatcatcat ggacttggtg + 301 gtcaatcata cctcggatga gcatgcctgg tttgtagagg cctgtgaaaa tcctaatagc + 361 cctgagcgag actactatat ctggcgcgat gaacccaatg acctagattc tatctttagt + 421 gggtctgctt gggaatacga tgaaaagtca ggtcaatact atctccactt tttcagcaag + 481 aaacagccgg atctcaactg ggaaaatgaa aaacttcgcc agaaaattta tgagatgatg + 541 aacttctgga ttgataaggg tattggtggt ttccgtatgg atgttattga catgattggc + 601 aaaattcctg acgagaaggt agtcaataat ggtcctatgc tccatcccta tctcaaggaa + 661 atgaatcagg cgacctttgg agataaggat ctcttgacag taggggagac ttggggagca + 721 acgccagaga ttgccaagct ctactctgat ccaaaggggc aagaattgtc tatggtcttc + 781 cagtttgaac atatcggtct tcagtatcag gaaggtcagc ctaaatggca ctatcaaaaa + 841 gagctgaata tcgctaagtt aaaagaaatc ttcaacaaat ggcagacaga gttaggagtt + 901 gaggacggct ggaattccct cttctggaac aaccatgacc tccctcgtat tgtctcaatc + 961 tggggaaatg accaagaata ccgcgaaaaa tctgccaaag cctttgcaat cttacttcat + 
1021 ctcatgagag gaactcctta tatctaccaa ggtgaggaaa ttgggatgac caactatccg + 1081 tttgaaacac tggatcaagt agaagatatt gaatccctca actatgcgcg tgaggctctt + 1141 gaaaaaggtg ttccgattga agaaatcatg gacagtatcc gtgttattgg acgtgacaat + 1201 gcccgtaccc ctatgcaatg ggacgagagc aaaaacgctg gtttctcaac aggtcaacct + 1261 tggttggcgg ttaatccaaa ttacgagatg atcaatgtcc aagaagcgct ggcaaatcca + 1321 gattctattt tctataccta tcagaaactg gtccaaattc gcaaggagaa tagctggcta + 1381 attcgagctg actttgaatt gcttgatacg gctgataagg tatttgctta tatacgtaag + 1441 gatggcgacc gtcgcttcct agttgtggct aacttgtcca atgaagagca agacttgaca + 1501 gtagaaggaa aagtcaaatc tgtcttgatt gaaaacactg cggctaaaga agtacttgaa + 1561 aaacaggtct tggctccatg ggatgctttc tgtgtggaaa tgactgacta gaatgagcaa + 1621 acctcaagtt tttgaagctt gaggtttttt actatagtgg attgaaacta gaatagtgca + 1681 cctctacttc taaaacattg ttagaaatcg atttgtcctg ttcttatttc attttactat + 1741 atttttgttt cgcgggaagt ctactaagat atttaaagat gcagatagta aaaaaagatg + 1801 tgtcaatcga aagtgattat gtcccccaaa aatggagagt ttgagggcaa ttattttgat + 1861 ttcatttgac acgaggaatc cttgaagctg ttttgtcagc taaaccaagg ctagtcttag + 1921 ccttggctct ccagcctaac agctccaagc ctcttatcaa atgaaatgct tgtcttacac + 1981 tcctcacttt ctctctccta aatgtaaggg atagagtgac ttcctttaag gaaaagcttc + 2041 ccatttagcg agaaatagat tatacttgta gttgaggaga atgaagctcc tcactagtaa + 2101 actcttcata atccttttta tttttatgaa ggtattgttt gaaagatgtg agtttccacg + 2161 gatgggtttg tggagggata tacttgcgtc tttctttttt ttgttctggt tcttgttcaa + 2221 agtttttcga atagagttca taatctagta gctcctttgt gtgatagatt ttgtcagcga + 2281 tattgaggta gatgtcacca tcaaatgctt ttataactaa tgctttcgtc tttctgatga + 2341 aatagacttc ttttccttgt tcggtaggaa tatagtaacg attttggaat cggatatggt + 2401 gtccactatc gacgactctc tccgccagtc tagctagaat gagattccgt tcagagaggt + 2461 taggagcctc ctcaaaaaca gagagttttg tcttgtttcc aaactgttca ttaaaggttt + 2521 ggatgtagga aagaaggaaa gtattggctt cttctaatgt atgaatcttg tttcgttcca + 2581 gttcgatagg caggcgtgat tgtagtgtct gattgagtct ttcgaccctc cctttagctt + 2641 gagggataga ggtggtctca 
aggagaatcc ctagttggtg acaggcgtat ccaaattgtg + 2701 tataggtgtc gtcctccatt ttcttagagt tggatgcttg ataggtaaag accgttctct + 2761 tatcagtttt catttgaagg ggaatgccgt gattgactaa gatttgttcg aggacatggt + 2821 agtaggcatt caaggtctct tgtttgtcaa aataagcgcc taggatattg ccagaagcat + 2881 catcaatggc taagtgtaag ttggtggttt ctggtccaaa ccaggcatga gggctggcat + 2941 ccatttgaat gagttctcca gcaaatttct ttctgggtct actaggatgt acctttttag + 3001 ggttttccag gaagtcttta gccgtcggta agattggatt gtctaggggt tgattcaggt + 3061 tcagtttagc ttgttttctt actctcttct ttgtctttct gtgagactta ggagaaagga + 3121 tgtttttctt atagagtatt tttctaacag ttgtatcaga gagcttaatt ccctcttctt + 3181 cagctagtaa ttcacagaaa tgaaggacat ttggtttata tgtttcatag gagaggtatt + 3241 tctttaggac acgttctttg atttcatcag ggattgcatg ttttggtttt cgatttctgt + 3301 ttccgtgtct gaaggcttct tttcctttct gttgataggc tagtagcaga cgattgattt + 3361 gtctttcaga aagattgagt tcgacacagg cccgtttctt tgttttcttt ccttgggcta + 3421 tagcttttat tacaagatat tttttcgttt cattcatatt cagttggatc cttttcatat + 3481 gactattcta tcaaatggga cattatcaca ttcgaattac aaaaagatgc ggatagtaaa + 3541 aaaaggtgta gacattaccg taaaaaagtg atataatcgt atgatgttca atgtataggt + 3601 gttaatcatg agtagacgtt ttaaaaaatc acgttcacag aaagtgaagc gaagtgttaa + 3661 tatagttttg ttgactattt atttattgtt agtttgtttt ttattgttct taatctttaa + 3721 gtacaatatc cttgctttta gatatcttaa tctagtggta actgcgttag tcctactagt + 3781 tgccttggta gggctactcc tgattatcta taaaaaagct gaaaaattta ctatttttct + 3841 gttggtgttc tctatccttg tcagctctgt gtcgctcttt gcagtacagc agtttgttgg + 3901 actgaccaat cgtttaaatg cgacttctaa ttactcagaa tattcggtca gtgtcgctgt + 3961 tttagcagat agtgagatcg aagatgttac gcaactgacg agtgtgacag caccgactgg + 4021 gactgataat gaaaatattc aaaaactact agctgatatc aagtcaagtc agaataccga + 4081 tttgacggtc aaccagagtt cgtcttactt ggcagcttac aagagtttga ttgcagggga + 4141 gactaaggcc attgtcctaa atagtgtctt tgaaaatatc atcgagtcag agtatccaga + 4201 ctacgcatcg aagataaaaa agatttatac caagggattc actaaaaaag tagaagctcc + 4261 taagacgtct aagaatcagt ctttcaatat ctatgttagt 
ggaattgaca cctatggtcc + 4321 tattagttcg gtgtcgcgat cagatgtcaa tatcctgatg actgtcaatc gagataccaa + 4381 gaaaatcctc ttgaccacaa caccacgtga tgcctatgta ccaatcgcag atggtggaaa + 4441 taatcaaaaa gataaattaa cccatgcggg tatttatgga gttgattcgt ccattcacac + 4501 cttagaaaat ctttatggag tggatatcaa ttactatgtg cgattgaact tcacttcttt + 4561 cttgaaaatg attgacttat tgggaggggt agatgttcat aatgatcaag agttttcaac + 4621 tctacatggg aagttccatt tcccagtagg gaatgttcat ctagactctg agcaggctct + 4681 aggttttgta cgtgaacgct actcactagc cgatggagac cgtgaccgtg gtcgcaacca + 4741 acaaaaggtc attgtggcta tccttcaaaa attaacgtca accgaagcac tgaaaaatta + 4801 tagtacgatc attgatagct tgcaagattc tatccaaaca aatatgccac ttgagactat + 4861 gataaatttg gtcaatgctc agttagaaag tggagggagt tataaagtaa attctcaaga + 4921 tttaaaaggt acaggtcgga cggatcttcc ttcttatgca atgccagaca gtaacctcta + 4981 tgtgatggaa atagatgata gtagtttagc tgtagttaaa gcagctatac aggatgtgat + 5041 ggagggtaga tgaaatgata gacatccatt cgcatatcgt ttttgatgta gatgacggtc + 5101 ccaagtcaat agaggatagc aaggctctct tggcagaatc ctacaggcag ggggtgcgaa + 5161 ccattgtctc tacctctcac cgtcgcaagg gcatgtttga aactccggaa gagaagatag + 5221 cagaaaactt tcttcaggtt cgggaaatgg ctaaggaagt ggcgagtgac ttggtcattg + 5281 cttacggggc tgaaatttac tacacaccag atgttctgga aaagctggaa aaaaagcgga + 5341 ttccgaccct caatgatagt cgttatgcct tgatagagtt tagtatgaac actccttatc + 5401 gcgatattca tagcgccttg agcaagatct tgatgttggg aattactcca gtcattgccc + 5461 acattgagcg ctatgatgct cttgaaaata atgaaaaacg cgttcgagaa ctaatcgata + 5521 tgggctgtta cacgcaagta aatagttcac atgtcctcaa acccaaactt tttggcgaac + 5581 gttataaatt catgaaaaaa agagctcagt attttttaga gcaggatttg gttcatgtca + 5641 ttgcaagtga tatgcacaat ctagacggta gacctcctca tatggcagaa gcatatggcc + 5701 ttgttaccca aaaatacgga gaagcgaagg ctcaggaact ttttatagac aatcctcgaa + 5761 aaattgtaat ggatcaacta atttaggaga aatgatgaaa gaacaaaaca cgatagaaat + 5821 cgatgtattt caattattta aaaccttgtg gaaacgcaag ctaatgattt taatagtggc + 5881 acttgtgaca ggtgcggggg cttttgcata tagcgctttt attgttaagc cagaatatac + 5941 
gagtaccacg cgaatttacg tagtgaatcg caatcaagga gacaagccgg ggctgacaaa + 6001 tcaggatttg caggcaggat cttatctagt aaaagactac cgtgagatta tcctttcgca + 6061 ggatgttttg gaggaagtta tttctgattt gaaactagat ttgacgccaa aaggtttggc + 6121 taataaaatt aaagtaacag taccagttga tacccgtatt gtctctattt cagttaataa + 6181 tcgagttcct gaagaggcaa gccgtatcgc taactctttg agagaagtag ctgctcaaaa + 6241 aattatcagt attactcgtg tttctgatgt gacaacactg gaggaggcaa gaccggcgat + 6301 atccccgtct tcgccaaata ttaaacgcaa tacactaatt ggttttttgg caggggggat + 6361 tggaactggt gttatagttc ttcttcttga acttttggac actcatgtga aacgtccgga + 6421 agatatcgaa gatacactgc agatgccact tttgggagtt gtaccaaact ttaataagtt + 6481 gaaataggag agaggaatgc cgacattaga aatagcacaa aaaaaaatgg agttcattaa + 6541 gaaggcagaa gaatattaca atgccttgtg tacaaatata cagttgagcg gagataaact + 6601 aaaagtaatt tccattactt ctgttaacgc tggggaagga aaaacaacta cttccgtaaa + 6661 tatagcaagg tcgtttgcgc gtgcaggcta taaaactctt ttgatcgatg gcgatactcg + 6721 aaattcagtt atgtcaggag tttttaaatc tcgtgaaaaa attacagggc taacagaatt + 6781 tttatctggg acagctgatt tatctcacgg tttatgtgat acaaatattg aaaatttatt + 6841 tgtagttcaa tcgggatctg catcaccaaa ccctacagcc ttgttacaaa gtaaaaattt + 6901 taatgacatg attgaaacat tgcgtaaata ttttgattat atcattgttg atacagcacc + 6961 tattggaatt gttattgatg cggcaattat cactcaaaag tgtgatgcgt tcatcttggt + 7021 aacagcaaca gatgaggtga ataaacgtga tgttcaaaaa gcgaaacaac aattagaaca + 7081 aacagagaaa ctgtttttag gtgtcattct caataaattt gatgttcaat atgaaaaata + 7141 tggttcttac ggtgactatg gtaattatgg taaaaaataa cttaggaaag attttatgga + 7201 tgaaaaagga ttgaaaattt ttctggcagt attacagagt attattgtca ttttattggt + 7261 ttattttctt agctttgtta gagagacaga acttgaacgt tcttcgatgg ttatactata + 7321 ccttctccac ttttttgtat tctattttag ttcctatggt aacaattttt ttaaaagagg + 7381 gcgcttagtt gagtttaata gtactataag atatattttt ttctttgcaa tagctataag + 7441 tgtattaaac ttttttatag cggaacggtt tagtatctct agaagaggaa tggtatactt + 7501 cttaacttta gaaggaatat ccttatactt gttaaatttc ttagtaaaga aatattggaa + 7561 gcatgtgttt tttaatctaa 
aaaatagcaa gaaaatttta ctgttaacag taacgaaaaa + 7621 tatggaaaaa gttcttgata aattgctaga atctgatgaa ctttcatgga aattggtagc + 7681 agtaagtgtt ttggacaaat ctgattttca acatgataaa atacctgtaa ttgaaaagga + 7741 aaaaattatt gaatttgcaa cgcatgaagt tgtggatgag gtgtttgtca atcttccagg + 7801 agagagctac gatattggag aaattatctc taggtttgag acaatgggga tagatgtaac + 7861 tgtaaatctt aaagcatttg ataagaattt gggtcgcaat aaacaaattt atgagatggt + 7921 aggattgaat gtagtcactt tctctacaaa tttttataaa actagtcatg tgatttcaaa + 7981 gagaattctc gatatttgtg gtgccattat tggccttatt ctttttgcta tagctagtct + 8041 aattttagtt ccattgattc gtaaagatgg cggaccagct atttttgctc aaactcgtat + 8101 agggaaaaat ggtcgacatt ttacctttta taaattccgt tcgatgcgga tcgatgctga + 8161 agctatcaaa gaacagttga tggatcaaaa tacgatgcaa ggtggtatgt ttaagataga + 8221 caatgatcct cgtgttacaa aaattggtcg ctttattcgc aaaaccagtt tggatgaatt + 8281 gccacaattt tggaatgtct ttataggaga tatgagtttg gtgggaacac gtccacctac + 8341 agtagacgag tatgatcagt atactccaga acagaaacgt cgactcagtt ttaaacctgg + 8401 gattacaggt ttatggcagg ttagcggccg tagtaaaata accgattttg acgatgttgt + 8461 aaaattagat gtggcttata ttgataattg gacaatctgg aaagatattg aaattttgct + 8521 taaaactgtt aaagttgtat ttatgagaga tggagcgaag taatttctgt atatccatca + 8581 tattaggaga gaaatgaaaa aatcagttta tatcattggt tcaaaaggaa ttcctgctaa + 8641 gtatggaggc tttgaaactt ttgttgaaaa attaacagcc ttccaacaag ataaggctat + 8701 ccaatattat gtggcttgta tgcgtgaaaa ctctgcaaaa tcagggacta ctgaggatat + 8761 ttttgaacat aatggtgcta tctgttataa cgtcgatgtt cctaatattg gtccagcgcg + 8821 agccatagta tatgatatcg cggcaattaa cagagctatt aaaattgcca aagaaaataa + 8881 ggatgaagat ccaatcttct atattctagc ttgtcgaatc ggtccgttca tccatggaat + 8941 taagaaaaaa atccaggcga taggtgggac tcttctagtt aatccagatg gtcacgagtg + 9001 gttacgagct aagtggagcg ctccagttcg tcgttattgg aaaatttccg aaggtcttat + 9061 ggtcaaacat gcagatcttt tagtgtgtga tagtaagaat attgaaaaat atatccaaga + 9121 agattataaa cagtatcaac ctaagacaac ctatatcgct tatgggactg atacaacacg + 9181 ctccatatta aagagtagtg atgaaaaagt acgttcttgg 
ttcaaagaga agaatgtttc + 9241 tgaaaacgag tattacctag ttgtaggacg ttttgttcca gaaaataact atgaggctat + 9301 gatacgtggg tttttagcat ctaattctaa gaaggacttt gtcctaataa caaatgtaga + 9361 acagaataaa ttttataatc agctattagc aagtactggc tttgataaag atccacgagt + 9421 aaaatttgtt ggaacagtct acgatcaaga acttctgaag tatattcgtg aaaacacctt + 9481 tgcttacttc catggacatg aagttggagg aaccaatcct tcgcttttag aagctctggc + 9541 atcaactaaa ctgaatttat tgctagatgt tggctttaac cgagaagttg gggagcaaag + 9601 tgcgatctat tggaaaaaag atgagctttc ccaagtaatc gagaaagttg aacaatttga + 9661 tgcaaaaatg attgatgagt tagatagaca atcaaatcag agaattgtgg attctttcac + 9721 ttgggaaaag attgtcacag actacgagaa attatttaaa aaatgaaaat attacattat + 9781 actttaggat ttcaacccca gcgaacaggt ggtttggtta aatatgctga ggatttaatg + 9841 ctagagcaaa ttgctcaagg ttatcaagtg gctgccctat atccaggaag aattaagttc + 9901 ttttcaaaaa aaatagaaat aattaaagcg acgtcaagac agtttgagtg ttatgaactg + 9961 cttaatagct tacctatggc tttatttgga ggtatatccg atccaactgc tttcctgaca + 10021 ccttgtgaca aaaatgttta tcgtactttt ttagaaaaag tacaacccga cattatacat + 10081 attcactcgt ttatgggatt gcataaagaa ttcctcgaaa ttgctaaaaa cttgaatatt + 10141 agagtggttt ttacgagcca tgattattat ggattagcac ccgtacctca tttctatttt + 10201 aatggggtgg attatagtga taaaagtaca aacttaacat ggaatattat gtcttccaat + 10261 gctttaagtg tgaaaaaact aagacttttt cagctttcat tttatcctac tattcgtaaa + 10321 cttttgaaac tattagggaa aaatccaaaa tctaaaaata atttagttat tcgggatgtt + 10381 attgaggagc aagattatag tgagcttcga tactattata atgagatgtt tcacttaata + 10441 gatggttatt tgtttaatag tagacttgca aagaaggtat atgagataaa tgagattaag + 10501 tcagctaata gtatagtatt atctataaca aatagttcaa ttaatcatca tcagagattg + 10561 ataactacaa ataataaaat tagagttgct tatattggtc cagatgaaga atataaagga + 10621 tattttgatt ttgttgactt tgttgaaact ttagatcgag agtcctatga agtggcaact + 10681 tatggccatt taccaaatga agagtgtcct tcattcattg aacaaaaagg atattttact + 10741 aaggaaatga ttgacagtgt ctatgaaaat attgatattc ttattgttcc aagtaagtgg + 10801 aaggaaacat ttggattgat aacagtagaa gcgttatcct atggggtaag 
tgttttcgtg + 10861 agtgaaaatg ttggatcaaa agacttactt ccagaatcgc atgtttttaa aaatcagaat + 10921 gatttagtag ttaaattttt aaaaaatgat atagaaaata caaaattgaa aactttagat + 10981 gaacactcga tagaagtgat tcagtattat gaaagagtga taaatgatag ttaagagttt + 11041 cataaaaaag attactggaa aaacagtaga cattcatcca gatgtacctt tgtcgtatat + 11101 actacaaaga ggtataaact atggtttcgg actctttcgt ggggttgtac gtggaatcgg + 11161 atttggtcaa aacgacaaac gtttattcat tggacaagga gtttctatct tagcaaagcg + 11221 taaattattt gttggaaaaa atgttcgaat tggtaaaaag gtgtctatag atgcactgtc + 11281 aaaagaagga atccattttg cagataatgt aaagattgga gattattctc aaattattgg + 11341 cacaggttct ataaaaaata tggggattgg cttgaaaatc ggtaagaact catctttttc + 11401 agaatatagt ttatttggtt ctgctggagg tatcacaatt ggtgataatg ttatcgcagg + 11461 tcagaatgtt cgttttcatg ctgaaaatca taattatagt gatttagata aactcattgt + 11521 tgaacaaggg gtatctcgaa agggaatttc agtaggtgat aattgttgga ttggtgctgg + 11581 agctgttttt ttggatgggt ccagcattgg ttcaggttgt gttgtagctg caaattctgt + 11641 aattacgaaa aactttccag ataacgttat tgttgctgga gtaccagcta aaattataaa + 11701 aatgaaatga taggatgtta aatggggaaa gaaattaaag ctgtttatgc gatattaaat + 11761 tacaatactt gggaagatac tgcgcgttta gcacagaaag ttgcaacatt tcagcatatt + 11821 caatctgtga taatagtgga taatctatca acagatgatt cataccatta tttaaaaaga + 11881 cttgagggag agaaaatttc agtttatcaa acacaaagaa atggtggata ttctgttgga + 11941 aataattttg cagcacgaaa agcttataat atgggagttg atattctttt catttcaaat + 12001 ccagacgttg atattgatga aaaagattcc ttgatgattg cacaaaattt gtataaaaat + 12061 agttcatatg cactgctatc aggtatagaa tataatgcta tgaaggagat agatttgcca + 12121 attgtctggc atgaaaattc ctattacgat gacttacttg attgtttgtt tttaaccaga + 12181 aaatggcgaa gaaaaaaaga agatatcaat ttatcaatga ttaaatcatc tataatagat + 12241 gtagatcttg ttaaaggatc gttttttgct gtaagactgt ctgattttca tgatgttggt + 12301 tattttgatg aatctgtatt tcttttttgt gaagagagga tattagctaa aaagttacaa + 12361 aaagcaaata aaaaaatagg tattctgcct gaagcgaaat attaccacaa tcattcaact + 12421 tctataaatg agagatataa aaagaaaaaa gaacagatta atttattata 
taagtctcga + 12481 tactactata atgtaaagta taataatatt agttttgtca aaaaactatg tttaaaatct + 12541 gtcatgatgc tatccatttt agaatatata atcttagata tgatgaattt attatataca + 12601 aagactaact ataagaaaat tcaatagttt aatctgaaat acttcttgtt tcaaagtgga + 12661 tgattttaga gcacggcaaa atgtccttga aaaagtctgt tttttcaaag gttatcttgt + 12721 ggcaaattca ggagttagat cacttttttc gtcaaatggt agcttgtttt ttaggagata + 12781 aaacagattt ctaataagtt ttttggcaag gtgaatgatg gctacattgt aatgctttcc + 12841 ttgttacaac ttagtcctaa gatagacttt aaaagcaggc gaaaagcgag cacatgcttt + 12901 ggtagcttgt atgagtgccc aacgtagatg aggggaaccc agtttgacca ttttccctgc + 12961 taaatcgatt tgacctgact agtaaataga aggatccggt ccagcaaaag cttgtaattg + 13021 atgaggctta tcgaagatat gaatatttcg aatctcaact aagataacgt cacctaaacg + 13081 attcccaagt tcacttgggg ttatccacga actttgtgcc ttgttacctt acacgagata + 13141 aaacgtctat gcgttatcaa actcattacc aattgaaaca aaaagctgta gttagatcct + 13201 ttcagaaatc gtcaagcgat tggaggaaat aaactaatcc acagtggctt attccaagtg + 13261 taccacttgg acttcagcag tagcgaacta cactaaatat aatataagga gaaataggtg + 13321 agtaaattaa gattgaactt gaaattaaat tcttttttat ttgttataat tttactttta + 13381 gttgttgtta ctccgactca taccttaatt tttgatgtac taattcgaac gaaaattgat + 13441 aatttatgga gagagttttt tctagtaatt tcttttctat gtattctaaa gataaatgca + 13501 ggaaaaatta aaattggaaa gctagggggc cccataattg ttatgggagg aattggttta + 13561 gtttatacta tctgttcaga taggccattt acagctttaa atctttttag aatttatatg + 13621 tttcctgctg taatatattt tataataata aattgtaatt ttcgcaagga gagattactg + 13681 atattgaagc aagcgcatgt atatactgct tgcatattag ctttatgggg aatttttcag + 13741 gcgtgggtgt taaaagatca gtttttgatt aaaataggat atccttccca aggaaatttt + 13801 ctaaagagta cagcttttta tattggtggt tttttcggtc aacaacgagt tactagcact + 13861 ttttctgctc ctaatttagc tggagtttat tttggaatat ctttgatcat tttactctct + 13921 atatttgata ctataaagag taatagattg gtattatttt caattgtagc agctttagtt + 13981 tttacattta gccgtagtgc tattataagt actcttgtag gaatcgtatt ctttcaacgt + 14041 aagaaattgt tttcaacgat gaagattaat gttatgacct tggtaatctt 
ccccttaatt + 14101 tttttgattg ttttagttat attttatctt tatcctgaaa atacgattat aaatatgctc + 14161 tatagcagtt attcttcaac acttaatttg acagattctt cagcagttaa gcatttggaa + 14221 gacttatggc ttcctcttct aaaagttatt gattatcctt tgggacttgg atttggtaat + 14281 aatggcccaa ttgttctgtc actctatcag tcagcaaatt tagtagaatc ttccatttat + 14341 cttcttgcat atgattttgg tattttagga atgttcatgt atttgttccc ttatttttat + 14401 acgatttttg tatataaaaa atatttgctt agcggtgcta tatgttgctt agttcttata + 14461 acttatctat ttcttccaaa tgtagaaaat tttgaaatca tattttttat ttaccttttc + 14521 attgggatgg atgaactagc actatataca aaaggaatga atgtacatga gattgattaa + 14581 attattgaaa aaatatataa atttatacat tagcagttcg gtgcctaaga caagtaaatt + 14641 gttaattttt ggatcatggt taggtgaaaa atatgcagac aatccaagat atttgtttga + 14701 gtatgtgatt aagaatcgtc ccgatttaaa agctatatgg attacaagta atcaagatat + 14761 ttttaaagaa ttacagaaga aacaatatct cgtgatgatg gcagaggcac ctgaaactcg + 14821 gaaaattgtt aaaaaagcaa agtatatttt tacagcaact ggtatttttg atattggaga + 14881 acaaaatgct aacttcgttg gaggtgccta tctaattaat ctatggcatg gcattccttt + 14941 gaaaaaaatc atgtatgatg ataaacattc agcacttcac aaacgtagta aactagtgac + 15001 ttgggtagaa aaaattcctc ttcgaaacta ttttgttatt tctactagta cggcaataac + 15061 tcaaatttat cagtctgctt ttcgcgtaaa gaaatctaat atattagaac ttggtcaacc + 15121 taggaatgac tatttttatg ataagtctaa tccagtgagt tcattaatac aggaattaaa + 15181 aagtaaaaat attatcttat atatgccgac acatcgcaat gaaggaaaga aacaaataga + 15241 tctagataag ttaatggatt tagaacactt aaataattgg tgtgaagaaa caaagtcaat + 15301 ttttgtaatt aaaaagcact tctatcattc aaaagaaaaa actattgata agaaatattc + 15361 ttcgataatt gatgtgacaa atgagaaggt ggatgttcaa gaattactca aatattcaaa + 15421 tgttttaata actgactact caagctgcta tattgactac ttattgttga atcgtccaat + 15481 tatatttttt aattatgatt atgatgatta cttacgggtg gatcgttcgc tatattttcc + 15541 atatgagaat gttactccag gggagaaatg tcaaaacttt gatgaattat tagtgacttt + 15601 gcaaaatcta tatgtaggaa aagatgatta tagagaagaa cgtgaaaata tcaaaacttt + 15661 cttttattct agtgaaactc agaagtcagt ttctgaaaaa ataattaatc 
acgtactaaa + 15721 tctataattt tattggaatc tgtcatgaaa aaaatattaa ataagtatta ttctttatct + 15781 aatcctgtaa aagcttcaat ttggtttact atttgcaatg ttcttcaaaa aggaatttca + 15841 atgattactg ttccagtttt tactagagta ttgacaacgg aacaatatgg tgtatactct + 15901 gtatatcaat catggtattc aataattgga gtttttgcaa cactaaacct atattatgga + 15961 gtctttaata atggaatgat taaatacgag aaagataaaa atgtctttac ttcctctatg + 16021 cagggactaa caacaacagt tacagctata tttttactga tatatttaat agggattgat + 16081 ttttggaact cgttgttagg cttacctaca ctactaatct tagtgatgtt ctttgatttg + 16141 ttttttaccc ctgcttattc tttttgggtt gctcgtcaga gatttgaata taaatataga + 16201 aacttagtat ttatcacatt tattatagcg attggaagtc ctattattgg tatttctgca + 16261 gttgttttat cgacttataa agcggaggct agagttatct catttgtgtt agttcaatct + 16321 tgtatagggt tatatttcta tattttgaac ctttaccgag gtaaacattt tttttgtaaa + 16381 aaatattggc gctatgcttt gaattttaat ttacctctta ttcctcatta tttatcgcaa + 16441 tcagttttaa accaatcgga tagaataatg attaattcaa tggtaggaat gggagaagca + 16501 gcaatatata gtgttgctta cagcatatca attttgatgc ttttagtgac aagtgctata + 16561 aacagctctt ttattcctta cacatataag tgtattcgag ataagaaata tactgaacta + 16621 gggaaaagtg caaatctttt aattactctg gtaggcattg gttcgatttt aactatttct + 16681 cttggaccag aaatcattca attatttgca ccaaaacaat attacgaagc aatatggatt + 16741 attcctcctg ttgctctgtc agtatatttc atgttcttat atcccatttt tggtaacatt + 16801 gagttttact ttgaagcaaa tcattttgta atgtgggctt caatcggtgg agcaattatg + 16861 aatatttttt tgaattttat ttttttaaaa cactttggat atattgcggc aggctataca + 16921 actttattct gttatatttt atttgcgttg ggacattaca tttttatgag gagagtactg + 16981 tatcagaatc tttcgggtat ccaaatttat aattccagat atattttatt tttttcgatt + 17041 cttcttatta ttctaatgct actaatcgtg attatttatc catttatact gattcgttat + 17101 cttactatct cactcatcct aggaggatgt tttttaaaga ggaaaaagat aatgagttcg + 17161 atagctatca ttaaacaaca gtgaggtaca agaatgacag aaacaaataa acagttacat + 17221 gaaacattaa tcgaaatttt agactttgta aaagaaattt gtgaaaaaca tgaattaact + 17281 tattttttgg tctttgggac agcacttgga gcaaaacgcc attgtggatt 
tattccatgg + 17341 gatgatgatg ttgatattgc tttgccacga gagcactaca atatatttat cgatgcatta + 17401 tctgagacgg atcaatctat atttagtctt caaaatgaag ataacgagcc gaattatttt + 17461 ttaccatttg ctaaattaag aaaaaacaat acgattttta ttgagaagat ccttgatgtt + 17521 gaatatgaga ataacggtat ttacattgat atttttccac tagatttcgt agagaatccg + 17581 gactctttca attttaagat taggagaact acatttaatt atataaagca tattttaaaa + 17641 ttttcaagtt gcagaagttt ttataaaaat aaatacagta atgtgcgtta tttgattgaa + 17701 aatattatga gtattcctac cctgtttttt tcaaatagga gattactatt cttagcaaat + 17761 agtttaattt catcaacgac taaagctgat tttattggtc aatatgatca aaaaagtaac + 17821 aaaagagcta tcatgccttc aaactattat tttccaccta ggtccgctgt gtttgaagga + 17881 aagacctata gtgttcctgc gaaattagaa gattatttaa aatgttttta tggttcggat + 17941 tatatggaat taccaccaat agaaaaaaga gtcactcatc aaccaataac acttagattc + 18001 gaaaaataat ttgctattct gtagaaggag aatataatga aaagagtaat tacatatgga + 18061 acgtttgatt tacttcatca tggccatatc aatttattgc gacgtgcaaa agaattaggt + 18121 gactatctag tggtagttgt ttcaagtgat gaattcaacc taattgaaaa aaataaagtt + 18181 tgttatttca attatgagca tagaaaaagt ctagttgaag ctattagata tgttgacctt + 18241 gttattcctg aaacgagttg ggaacaaaaa cgcagtgatg tcaaagagta tcatattgat + 18301 acttttgtga tgggggatga ttggattgga gaatttgatt atctaaaaga agaaggagtt + 18361 gaagtcgttt acttacctcg gacgaaagaa atttcgacaa ctaaaataaa aaaagattta + 18421 tcaatgtaat attcgtaaat aagcattgtt ctgttattgt tctcgaatag accactgtat + 18481 ttttaagtag aaatgctaaa gtcgatagaa aagagaaaaa tgataggaca ataccaatat + 18541 aggtaaaaaa tatcgtaatt agataaataa gaaaggtacc ccttttatga aaggtattat + 18601 tctagcaggt ggttcgggaa ctcgcttgta tcctttgact cgagccgcat caaaacaact + 18661 tatgccggtt tatgataaac cgatgattta ctacccactt tcaacattga tgttggctgg + 18721 gattagggat attttgatta tttccactcc acaggattta catcgatttc aagagcttct + 18781 tcaagacgga tctgagtttg ggatcaaact ttcttatgca gagcaaccaa gtccagatgg + 18841 tttggcacaa gcctttatca ttggggaaga gtttatttct gatgatagcg ttgcgctaat + 18901 cttaggtgat aatatctacc atggttctgg gctttccaag atgctacaaa 
aggcagcgag + 18961 taaggagtcg ggagcaactg tttttggcta ccatgtcaag gatccagagc gctttggtgt + 19021 ggttgagttt gatcaggata tgaaggctat ttctattgaa gaaaagccag agcaacctcg + 19081 ttcaaactat gcagtgacag gactctattt ctatgataat gatgtagtag agattgccaa + 19141 aagtattaaa ccaagtcctc gtggtgaatt ggaaattaca gacgttaaca aggcttatct + 19201 agatcgtgga gacttatccg ttgagcttat gggacgtggc tttgcttggt tggatactgg + 19261 aacacatgaa agtttactag aggcttcaca gtacatcgaa acagtccaac ggatgcaaaa + 19321 tgttcaggta gcaaacttag aagaaattgc ctatcgcatg ggttatatca gtcgtgaaga + 19381 tgtattgacc ttagcccaac cacttaagaa aaatgaatac ggacagtatc tgctccgttt + 19441 gattggagaa gcatagatga cagataattt tttcggtaag acgcttgcgg cacgcaaggt + 19501 tgaagctatt ccaggcatgt tggagtttga tatccccgtt tatggagata atcgtggctg + 19561 gtttaaagaa aatttccaaa aggaaaaaat gcttccactt ggatttccag agtctttctt + 19621 tgcagaagga aaattgcaaa acaatgtatc cttctcacgt aaaaatgtcc ttcgaggcct + 19681 ccacgcagag ccttgggata agtacatctc tgtagcagat ggagggaaag ttctgggttc + 19741 ttgggttgat ctacgcgagg gtgaaacctt tgggaatacc tatcagacaa taattgatgc + 19801 aagcaaggga atctttgttc ctcgaggcgt agctaatggc ttccaagttt tatcagatac + 19861 agtgtcatat agctatctgg tcaatgatta ctgggcgctt gaactcaaac ccaagtatgc + 19921 ctttgtgaac tacgctgatc caagccttgg tattgaatgg gaaaatattg cagaagcaga + 19981 ggtttcagaa gcagataaaa atcatccact acttaaggat gtaaaacctt tgaaaaaaga + 20041 agatttgtaa aaaggaaaga atatgactga atacaaaaat attatcgtga caggtggagc + 20101 tggctttatc ggttctaact ttgtccatta tgtttacgag aactttccag atgttcacgt + 20161 gacagtccta gataagttga cttatgctgg aaaccgcgcg aatattgagg aaattttagg + 20221 taatcgtgtt gagttagttg ttggtgacat tgctgatgcg gagttggtag acaagttggc + 20281 tgctcaagca gatgctatcg ttcattatgc agcggaaagc cacaatgata attcgctcaa + 20341 tgatccatcg ccatttattc atactaactt catcggaacc tatactcttt tagaagctgc + 20401 tcgtaagtat gatattcgct tccatcatgt atcgacagat gaagtttatg gggatctccc + 20461 tttacgagaa gatttgccag gtcatggaga aggaccaggt gagaaattta ctgctgaaac + 20521 aaaatacaac ccaagctctc cgtactcatc aaccaaggcc gcatcagact 
tgattgtcaa + 20581 agcctgggtg cgttcttttg gagtcaaggc aacgatttcc aactgttcaa ataactacgg + 20641 tccttatcaa catatcgaaa aattcatccc acgtcagatt actaacatcc taagtggaat + 20701 taagccaaaa ctttacggtg aaggtaagaa tgttcgtgac tggattcata ccaatgacca + 20761 ttcttcagga gtttggacaa tcttgacaaa agggcaaatc ggtgaaacct acttgattgg + 20821 ggctgatggt gagaagaaca ataaggaagt tttggaactt atccttaagg aaatgggaca + 20881 agctgcggat gcctatgatc atgtgactga ccgtgcagga catgaccttc gctatgcgat + 20941 tgatgctagc aagctccgtg atgagttggg atggaaacct gaatttacca actttgaagc + 21001 tgggctcaag gcaacaatca agtggtatac agataaccaa gaatggtgga aagcagagaa + 21061 agaagctgtt gaagccaatt atgctaagac tcaggagatt attacagtat aaaaagcagg + 21121 aaatagctgc tttttattgc tatattggga agagttacat attagaaagg tctagagatg + 21181 attttaatta caggggcaaa tggccaatta ggaacggaac ttcgctattt attggatgag + 21241 cgtaatgaag aatacgtggc agtagatgtg gctgagatgg acattaccga tgcagaaatg + 21301 gttgagaaag tttttgaaga ggtgaaaccg actttagtct accactgtgc agcctacacc + 21361 gctgttgatg cagcagagga tgaaggaaaa gagttggact tcgccatcaa tgtgacgggg + 21421 acacaaaatg tcgcaaaagc atctgaaaag catggtgcaa ctctagttta tatttctacg + 21481 gactatgtct ttgacggtaa gaaaccagtt ggacaagagt gggaagttga tgaccgacca + 21541 gatccacaga cagaatatgg acgcactaaa cgtatggggg aagagttagt tgagaagcat + 21601 gtgtctaatt tctatattat ccgtactgcc tgggtatttg gaaattatgg caaaaacttc + 21661 gtttttacca tgcaaaatct tgcgaaaact cataaaactt taacagttgt aaatgaccag + 21721 tacggtcgtc cgacttggac tcgtaccttg gctgagttca tgacctacct agctgaaaac + 21781 cgcaaggaat ttggttatta tcatttgtca aatgatgcga cagaagacac aacatggtat + 21841 gattttgcag ttgaaatttt gaaggataca gatgtcgaag tcaagccagt agattccagt + 21901 caatttccag ccaaagctaa acgtccgcta aactcaacga tgagcctggc caaagccaaa + 21961 gctactggat ttgttattcc aacttggcaa gatgcattgc aagaatttta caaacaagaa + 22021 gtgagataag tagtagaatg attttcttgt ctaataaaag aggcagataa tgaactccaa + 22081 aggagcttaa gatgtacgat tatcttgttg tggtgctggt ctctttggtg catagctttg + 22141 gctcagtttc tattatcgct cacaccatcc atcagaagtt taatctgaag 
gtacccaatt + 22201 atcgccaaga agaagattgg gctaggatgg gtttaccaat cacacgtaag gaaatctcta + 22261 attggcatat caaggcaagt caatactatt tagagtccct ttataacctt ttacgagaaa + 22321 agttgttaga acaacctctt cttcatgcgg atgaaacctc ttatcgggtt ctagagagtg + 22381 atagccatct tacctactat tggacctttt tgtctgggaa agatgagaat caagcaatca + 22441 cgctgtacca tcatgatcag cgtcggagtg gtttagtagt acaagaattc ctaggagatt + 22501 attctggcta tgtgcattgt gatatgttgc ggcagtaact taggacttta gtcctctagt + 22561 tctgcctatg cgatagcagt ccaaggttta ggagcaaggc gacgctaagc ttggtaaact + 22621 gcgaaccgct agaagcttat cgtcaactgg aagaagctga acttgttgga tgttgggcgc + 22681 atgtgagaag gaaatttttt gaagcgaccc ccaagcaagc agataaatca tccttaggag + 22741 ctaaaggttt agcctatcgt gaccagttat ttgccttgga aagagactgg gaggctttgc + 22801 cagctgatga acgactacag aaacgtccag cccttaatgg aagacttctt tgcttggtgc + 22861 cgccgtcagt cagttttagc aggttcaaaa ccaggaaggg caattgaata cagcctcaag + 22921 tatgaagaaa cctttaagac cattttaaaa gacggacatc tggtcctttc caataatcta + 22981 gctgaacgcg ccattaaatc attggttatg ggacggagta aaagagtcca ctggactctt + 23041 ttagcctaag ctcagtttaa aaaagcgagg gtggttattt tctcaaaatt ttgaaggagc + 23101 taaagcaaga gctattatta tgagtttgtt ggaaacagct aaacgtcatc aattaaatag + 23161 cgagaaatat ctattctatc ttctagaatg tcttccaaac gaggaaactc tcgtaaacaa + 23221 agaggtttta gaggcttatt taccatggac taaagttgta caagaaaagt gcaaataaga + 23281 aatctccaga ttaggaacta tccgtgagtt ctctagtctg gagatttttc aatatacttc + 23341 gttattggac ggttacgata ttcatatttt ttgcaaagat gttgtttgaa aaataatttt + 23401 caaaaattct gaaaattctg ttgacaactt tctgaaaaga gtctataatg gagagaaagt + 23461 tttaaaggag aaaatgatga aaagttcaaa actatttgcc cttgcgggcg tgacattatt + 23521 ggcggcgact actttagctg catgctctgg attaggttca agcactaaag gtgagaagac + 23581 attctcatac atttatgaga cagaccctga taacctcaac tatttgacaa ctgctaagac + 23641 tgcgacagca aatattacca gtaacgtggt tgatggtttg ctagaaaatg atcgctacgg + 23701 gaactttgtg ccgtctatgg ctgaggattg gtctgtatcc aaggatggat tgacttacac + 23761 ttatactatc cgtaaggatg caaaatggta tacttctgaa ggtgaagaat 
acgcggcagt + 23821 caaagctcaa gactttgtaa caggactaaa atatgctgct gataaaaaat cagatgctct + 23881 ttaccttgtt caagaatcaa tcaaagggtt ggatgcctat gtaaaagggg aaatcaaaga + 23941 tttctcacaa gtaggaatta aggttctgga tgaacagaca gttcagtaca ctttgaacaa + 24001 accagaaagc ttctggaatt ctaagacaac catgggtgtg cttgcgccag ttaatgaaga + 24061 gtttttgaat tcaaaaggag atgattttgc caaagctacg gatccaagta gtctcttgta + 24121 taacggtcct tatttgttga aatccattgt gaccaaatcc tctgttgaat ttgcgaaaaa + 24181 tccgaactac tgggataagg acaatgtgca tattgacaaa gttaaattgt cattctggga + 24241 tggtcaagat accagcaaac ctgcagaaaa ctttaaagat ggtagcctta cagcagctcg + 24301 tctctatcca acaagtgcaa gtttcgcaga gcttgagaag agtatgaagg acaatattgt + 24361 ctatactcaa caagactcta ttacgtatct agttggtaca aatattgacc gtcagtccta + 24421 taaatacaca tctaagacca gcgacgaaca aaaggcatcg actaaaaagg ctctcttaaa + 24481 caaggatttc cgtcaggcta ttgcatttgg atttgaccgt acagcctatg cctctcagtt + 24541 gaatggacaa actggagcaa gtaaaatctt gcgtaatctc tttgtgccac caacatttgt + 24601 tcaagcagat ggtaaaaact ttggcgatat ggtcaaagag aaattggtca cttatgggga + 24661 tgaatggaag gatgttaatc ttgcagattc tcaggatggt ctttacaatc cagaaaaagc + 24721 caaggctgaa tttgctaaag ctaaatcagc cttacaagca gaaggtgtga cattcccaat + 24781 tcatttggat atgccagttg accagacagc aactacaaaa gttcagcgcg tccaatctat + 24841 gaaacaatcc ttggaagcaa ctttaggagc tgataatgtc attattgata ttcaacaact + 24901 acaaaaagac gaagtaaaca atattacata ttttgctgaa aatgctgctg gcgaagactg + 24961 ggatttatca gataatgtcg gttggggtcc agactttgcc gatccatcaa cctaccttga + 25021 tatcatcaaa ccatctgtag gagaaagtac taaaacatat ttagggtttg actcagggga + 25081 agataatgta gctgctaaaa aagtaggtct atatgactac gaaaaattgg ttactgaggc + 25141 tggtgatgag actacagatg ttgctaaacg ctatgataaa tacgctgcag cccaagcttg + 25201 gttgacagat agtgctttga ttattccaac tacatctcgt acagggcgtc caatcttgtc + 25261 taagatggta ccatttacaa taccatttgc attgtcagga aataaaggta caagtgaacc + 25321 agtcttatat aaatacttgg aacttcaaga caaggcagtc actgtagatg aataccaaaa + 25381 agctcaggaa aaatggatga aagaaaaaga agagtctaat aaaaaggctc 
aagaagatct + 25441 cgcaaaacat g +// + diff --git a/public/res/serotype_genbank/serotype_17A.gb b/public/res/serotype_genbank/serotype_17A.gb new file mode 100644 index 0000000..f8b104e --- /dev/null +++ b/public/res/serotype_genbank/serotype_17A.gb @@ -0,0 +1,1081 @@ +LOCUS CR931669 23198 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain nr. 4704 (serotype 17a). +ACCESSION CR931669 +VERSION CR931669.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 23198) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 23198) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..23198 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="nr. 
4704" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC17A_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC17A_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI33477.1" + /db_xref="UniProtKB/TrEMBL:Q4JZI8" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVELL" + gene complement(262..453) + /gene="tnp" + /locus_tag="SPC17A_0002" + /pseudo + CDS complement(262..453) + /gene="tnp" + /locus_tag="SPC17A_0002" + /note="Lone member of homology group 0235" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase (fragment)" + /db_xref="PSEUDO:CAI33478.1" + gene 695..2140 + /gene="wzg" + /locus_tag="SPC17A_0003" + CDS 695..2140 + /gene="wzg" + /locus_tag="SPC17A_0003" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33479.1" + /db_xref="GOA:Q4K1E2" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K1E2" + /translation="MSRRFKKSSSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + IDQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKRILLTTTPRDSYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGIDVYNDQ + EFTAHTNGKYYPAGNVHLDSEQAIGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 695..811 + /gene="wzg" + /locus_tag="SPC17A_0003" + /note="Signal peptide predicted for SPC0817 by SignalP 2.0 + HMM (Signal peptide probability 0.997) with cleavage site + probability 0.540 between residues 39 and 40" + misc_feature 899..1246 + /gene="wzg" + /locus_tag="SPC17A_0003" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 3.7e-63" + misc_feature 1424..1867 + /gene="wzg" + /locus_tag="SPC17A_0003" 
+ /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 2.3e-67" + gene 2142..2873 + /gene="wzh" + /locus_tag="SPC17A_0004" + CDS 2142..2873 + /gene="wzh" + /locus_tag="SPC17A_0004" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33480.1" + /db_xref="GOA:Q4JZG9" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4JZG9" + /translation="MIDIHSHIVFDVDDGPKSREESKTLLAEAYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMHTSYREIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRVQYFLEQDLVHVIASDMHNLDSRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRRIVMDQLI" + misc_feature 2145..2753 + /gene="wzh" + /locus_tag="SPC17A_0004" + /note="HMMPfam hit to PF02811, PHP domain, score 1.4e-38" + gene 2879..3574 + /gene="wzd" + /locus_tag="SPC17A_0005" + CDS 2879..3574 + /gene="wzd" + /locus_tag="SPC17A_0005" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33481.1" + /db_xref="GOA:Q4K1E0" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K1E0" + /translation="MMKEQNTTEIDVFQLVKTLWKRKLMILLVALVTGAGAFAYSTFI + VKPEYTSTTRIYVVNRNQGDKPGLTNQDLQAGSYLVKDYREIVLSQDVLEKVVTNLKL + DMPAKTLASKVQVTVPADTRIVSISVKDKQPEEASRIANFLREVAAEKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIELLDTRVKRPEDVEDVLKI + PLLGLVPDFDKIK" + misc_feature 2879..2995 + /gene="wzd" + /locus_tag="SPC17A_0005" + /note="Signal peptide predicted for SPC0819 by SignalP 2.0 + HMM (Signal peptide probability 0.614) with cleavage site + probability 0.407 between residues 39 and 40" + misc_feature 2900..3316 + /gene="wzd" + /locus_tag="SPC17A_0005" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 5.5e-54" + misc_feature 3422..3499 + /gene="wzd" + 
/locus_tag="SPC17A_0005" + /note="PS00217 Sugar transport proteins signature 2." + gene 3584..4273 + /gene="wze" + /locus_tag="SPC17A_0006" + CDS 3584..4273 + /gene="wze" + /locus_tag="SPC17A_0006" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33482.1" + /db_xref="GOA:Q4JZK1" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4JZK1" + /translation="MPTLEISQAKLDSVKKAEEYYNALCTNLQLSGDGLKVFSITSVK + IGEGKSTTSANIAWAFARAGYKTLLIDGDIRNSVMLGVFKARNKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFTTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRNCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGIVLNKFDTSVDKYGSY + GNYGDYGKNKK" + gene 4288..5655 + /gene="wchA" + /locus_tag="SPC17A_0007" + CDS 4288..5655 + /gene="wchA" + /locus_tag="SPC17A_0007" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI33483.1" + /db_xref="GOA:Q4K1D8" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K1D8" + /translation="MNGKILRSSLAIIQSFLVILLTYLLSAVRETEIVSTTAIALYIL + HYFVFYISDYGQDFFKRGYLIELIQTLKYILFFALAISISNFFLEDQFSISRRGMIYF + LTLHALLVYGLNLFIKWYWKRAYPNFKGSKKILLLTATFRVEKVLDRLIESNEVVGEL + VAVSVLDKPDFQHDCLKVVAEGEIVNFVTNEVVDEVFINLPSEKYNIGELVSQFETMG + IDVTVNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHVIAKRIIDIMGALVGLIL + CGLVSIVLVPLIRKDGGSAIFAQTRIGKNGRRFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVLM + KDGAK" + misc_feature 4288..4374 + /gene="wchA" + /locus_tag="SPC17A_0007" + /note="Signal peptide predicted for SPC0821 by SignalP 2.0 + HMM (Signal peptide probability 0.844) with cleavage site + probability 0.429 between residues 29 and 30" + misc_feature 5071..5652 + /gene="wchA" + /locus_tag="SPC17A_0007" + 
/note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 3.3e-157" + gene 5642..6448 + /gene="wciB" + /locus_tag="SPC17A_0008" + CDS 5642..6448 + /gene="wciB" + /locus_tag="SPC17A_0008" + /note="member of homology group 16" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33484.1" + /db_xref="GOA:Q4K1D7" + /db_xref="UniProtKB/TrEMBL:Q4K1D7" + /translation="MERSRLIDVKIIVATHKEVKMPQDSSLYLPIHVGRDGKSDIGFI + GDNTGDNISSLNPYYCELTGLYWAWKNLDYNYLGLVHYRRYFTNKSQGYNENINMDDV + ILSRSNVEILLEKSDIIVPKKRKYYIETLYSHYAHTLNGEHLDLARKIIEQNSSEYLS + SFDKVMKQRSGYMFNMFIMKKELLDDYLPWLFSILDTMYEQMDLTDYTPFESRLFGRV + SELLFNVWLCKKGITPKEVPFMYMERVDLFEKGKSFLMAKFFGKKYGQSF" + gene 6432..7529 + /gene="wcrP" + /locus_tag="SPC17A_0009" + CDS 6432..7529 + /gene="wcrP" + /locus_tag="SPC17A_0009" + /note="member of homology group 89" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33485.1" + /db_xref="GOA:Q4K1D6" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K1D6" + /translation="MDRVFEMLEKESPLFSVIVPTYKISESNLRQCIDSLLYDSQDVE + IILVDDNKNLDICGKVLDEYAEKYNNISVIHQENQGVSVARNAGMSIAVGKYLIFVDP + DDWVAENFYSQMTLAVQKNPSSDVIILAAIVDYNGKQFTNHFWHTSRSFQGTDKDDLE + LQLIAKGATSYFPTEIGVGVPWAKIYRNEFVRENGLDFNPSLRRMQDNIFNMYAFEFA + NEIVYIDEPIYYYRKSMDSVTNKKNDKVIYYFDLVNDEVEKFIQKFNKPKIFEDALHI + KRLIGINSYYKLYFKFASTSSEKKKMRQEFRELLEREEYVNSLKKVNTAYLLPKEKIF + ISILKQKDLRIFSLLQKLEKLSVMLKSRQFS" + misc_feature 6477..7016 + /gene="wcrP" + /locus_tag="SPC17A_0009" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 1.6e-30" + gene 7537..8454 + /gene="wcrQ" + /locus_tag="SPC17A_0010" + CDS 7537..8454 + /gene="wcrQ" + /locus_tag="SPC17A_0010" + /note="member of homology group 106" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33486.1" + /db_xref="GOA:Q4K1D5" + /db_xref="InterPro:IPR008441" + /db_xref="UniProtKB/TrEMBL:Q4K1D5" + 
/translation="MRQLALELVSIIYKVTKRIPISFISNLGEKIYSFKDPYVFNVLS + TLGVDKESAYDLIPPNLFLNKIWICWFQGEDKAPDLVKKCIDSVRKHASGYDVIILTE + GNIEEYVTLPNIVLIKYKNGLFSRTHFSDIVRMNLLAQQGGLWIDATIFVTRDLDLSI + FFKNDFVSLRTTMKSSPLFITGYWTTYFVYTPSNFKLVQYTALLLNKYTEKYDRFIDY + FLQDYIITKAIKDLNYESYMEERPVLGNQRWLLADLANKVMTSDLLQQFKQDTVGIYK + LTYKSKYIREKNGRETVYKKIVEDGEYLE" + misc_feature 7588..8427 + /gene="wcrQ" + /locus_tag="SPC17A_0010" + /note="HMMPfam hit to PF05704, Capsular polysaccharide + synthesis protein, score 1.3e-45" + gene 8435..9334 + /gene="wcrR" + /locus_tag="SPC17A_0011" + CDS 8435..9334 + /gene="wcrR" + /locus_tag="SPC17A_0011" + /note="member of homology group 90" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33487.1" + /db_xref="GOA:Q4K1D4" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K1D4" + /translation="MENILNKKIGIVILNYLNWEDTLDCISSLRLQSNQNFEAVIVEN + GSPNESVSRIRDFIKNDKNIHLYVVENNLGYANGNNMGILYLKNKYSINRIILTNNDV + IFDDKNYISKLIDIEYDGNIGAIGTKIIGSDGLNQNPAYFPISFSSSIKSLIINLLAF + SKVIASIKKRFLSSWAKKANDFSSPKTSKQKYFLHGSVIFLTENYLDKFMGLYGGTFL + YYEEVILGIIFEKAGLDMLYIPEFSIYHKEDQSSIRSFNNDDLVRRRYLLNSIWSSFK + VYLANQEELPNIVSDSIYKHIKE" + misc_feature 8462..8962 + /gene="wcrR" + /locus_tag="SPC17A_0011" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 4.3e-13" + gene 9343..10443 + /gene="wcrT" + /locus_tag="SPC17A_0012" + CDS 9343..10443 + /gene="wcrT" + /locus_tag="SPC17A_0012" + /note="member of homology group 157" + /codon_start=1 + /transl_table=11 + /product="conserved hypothetical protein" + /protein_id="CAI33488.1" + /db_xref="UniProtKB/TrEMBL:Q4K1D3" + /translation="MVKKIAFYLPQFHTIPENDKWWGKDFTEWTNVKKSQPQYRGHIQ + PEVPLNEEYYNLLDTEVQEKQAKLALEYGIDGFCYYHYWFDGKLLLEKPMENMLQNEN + ITLPFCICWANESWSRTWDGAESKVLIMQNYSDTLDGWKRHFDYLLPFFKDERYIKVD + EKPMMIIYKPQLIENLEEMTVYWNQLAKQNGFKGIHFGHQHVSSFEDSKVIENFDFGI + EFEPIYTVSEMHKSTRSKSEKLKRAIKNPKWFSRNISHKYFGRSLLFDYDEVWSAILR + 
REGRKNISPGAFVSWDNTPRRGNRSLVFDGANPKKFEKYFAKQVQRAKEEYHSDFIFI + NAWNEWAEGAHLEPDEQYGYGYLEAVRAVKEE" + gene 10445..11071 + /gene="wcrU" + /locus_tag="SPC17A_0013" + CDS 10445..11071 + /gene="wcrU" + /locus_tag="SPC17A_0013" + /note="member of homology group 158" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI33489.1" + /db_xref="GOA:Q4K1D2" + /db_xref="InterPro:IPR011004" + /db_xref="InterPro:IPR018357" + /db_xref="UniProtKB/TrEMBL:Q4K1D2" + /translation="MLIGRLKQRLKIEKFRRSWREKNTHNTTMASSIFDIDKVSVGNY + TYGNIDILDFGTNEKLSIGSFCSIAPNVKFILNADHCTNYFTTFPLKVKVLQNQDKEG + ISKGDIIVGDDVWLGLNAVILSGVTIGQGAIIAAGAVVTKNVPPYAIVGGNPARIIKY + RFEAEIIDKLLKVNFSKLSKYDIEKHIKQMYIPLVEVKQLDWIDDLLH" + misc_feature 10763..10816 + /gene="wcrU" + /locus_tag="SPC17A_0013" + /note="HMMPfam hit to PF00132, no description, score 29" + misc_feature 10790..10876 + /gene="wcrU" + /locus_tag="SPC17A_0013" + /note="PS00101 Hexapeptide-repeat containing-transferases + signature." + misc_feature 10817..10870 + /gene="wcrU" + /locus_tag="SPC17A_0013" + /note="HMMPfam hit to PF00132, no description, score 0.93" + gene 11084..13039 + /gene="wcrV" + /locus_tag="SPC17A_0014" + CDS 11084..13039 + /gene="wcrV" + /locus_tag="SPC17A_0014" + /note="member of homology group 159" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33490.1" + /db_xref="GOA:Q4K1D1" + /db_xref="InterPro:IPR001173" + /db_xref="InterPro:IPR008441" + /db_xref="UniProtKB/TrEMBL:Q4K1D1" + /translation="MKSEIKVSVVIPIYNQEIYLRKSIHSVLTQSYQNLEIIAVNDGS + IDSSQQIMEEFANQDSRIFLYEKSNGGLVDATIYGVEKATGDYIVFLDPDDYIGENYI + QKFVSYLDHDYDFVAMGFYYDDNDKVTPYRLKENLILNKTHIEVLKSTFLTNFDLGTI + SNQIFISRWNKLYRCDIVKSVISEFKSYKNVTLGEDTIFAALLLKYSQSAKILQQANT + YFYNIANQNSMMKSSDLDKYLNKCYQVFMSFSKLLEEQELDKTQAYYLYFFLTNTLFN + RLRTNDPKQFYGLFDKLKREPVYIKTLNMVRKNTKSKFISFDLFLRLYTTCSQYIYIK + DSIERTKTFVRNFKYFSRQVRKNNIIKAYQLLNFFRSRQNAFYELKNQLPKIEGEINN + 
ILLQHDSNEFNEEEGIEEKIFVFWWDGFNDLPEIVAECFKSLKKQYQEYQIIPISKDN + FEEYTDIHPVLLKEFKAGKISIQTFSDILRFNLLKNNGGMWVDATIYFTRKVDLFSQL + ERQSFATISFSTSKDFLEYKGEFCSWTGYFIASRKNGRFVQMMDMLFREYYLKYRNFQ + IYFFIDALFMICKVNKIDSGVLDNPLYIEGNMWTLSNLLKSKYDDQLLTLIKKIPQKL + AWFFEPLSDSTDTFYNQLISEKIKQKE" + misc_feature 11105..11629 + /gene="wcrV" + /locus_tag="SPC17A_0014" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 5.2e-39" + misc_feature 12140..13009 + /gene="wcrV" + /locus_tag="SPC17A_0014" + /note="HMMPfam hit to PF05704, Capsular polysaccharide + synthesis pro, score 7.7e-22" + gene 13044..14201 + /gene="wzy" + /locus_tag="SPC17A_0015" + CDS 13044..14201 + /gene="wzy" + /locus_tag="SPC17A_0015" + /note="member of homology group 160" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33491.1" + /db_xref="InterPro:IPR007016" + /db_xref="UniProtKB/TrEMBL:Q4K1D0" + /translation="MIKVSKQNAILFLLLLPFFMPTYFEILPFGYLLYRLGMMFSIGY + ISLSYLILKKNFSSITWLIVIYEILVVSLTILQKGEIYTAIWNAEKIIGLVLLVDYYQ + ENIISFLKVVLVHFEWLIYINFITILLFSERFFSRFTSAYGFTQEWFLGSVNNFIFWF + FPALVVAWLYYFLSGKIFRTCSLTVVIALTELIRGSATGRIAVFLFILFVTSSWLRKI + ISPKLVFIGVTVLGIFVVFLQNVDFLEPIVVQLLGKKMTFSNRTYIWSNAVTVIQKNF + VGLGLQSSDYVIRLLGNINGYLQPTVTHAHNEFLQVAFQTGILGFILYCWIYIKVLIN + AVKLSGPIAQTVMLFFAVYNVIAITETLELSQIYMLFPLIYFVMQYTAERK" + misc_feature 13806..14009 + /gene="wzy" + /locus_tag="SPC17A_0015" + /note="HMMPfam hit to PF04932, O-Antigen Polymerase, score + 6.3e-10" + gene 14206..15648 + /gene="wzx" + /locus_tag="SPC17A_0016" + CDS 14206..15648 + /gene="wzx" + /locus_tag="SPC17A_0016" + /note="member of homology group 236" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33492.1" + /db_xref="GOA:Q4K1C9" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K1C9" + /translation="MNNEKSLSSKIISGSFWKFGERMSAQAVSFFVSLILTRILSPSD + YGIIAIINIFIAIADVLLASGLNTALIQKKNSTRLDYNTIFWCNIILGCVLYLVLFLV + 
APVLADFYNISILTPVIRIFALRLPISSFQSIQNAFVSKHMQFKKFFYATFLGSLVSA + VVGITMAYTGFGVWALVAQYLVNTVVGTATLFAIISWRPKFEFSLESAKPLVQYGWKI + MFTDLTGTIFNNLGDFIIGAYYNSSSLAFYSKGRQLPYLIRNNIFTSLISVLFPGMSQ + VNDDIERIKSFSRKSVSILSFLIFPTMVGLIVTAEPLTILMYTEKWLPIIPFVVIVCS + EAILSVIPTVTMQTIKALGRSDLTLKIEFIKKPIYLLTIFVSLNFGIVAIAFTLIINA + IIEMIINGLIVQRLIKYSLWEQFNDIFGSLMISIMMGLLSYLVIFLNLNIYLTLLLQV + VTGVSSYLILAIVFKNESFIELKNRFLSTE" + misc_feature 14236..15039 + /gene="wzx" + /locus_tag="SPC17A_0016" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 2.9e-30" + gene 15869..17089 + /gene="ugd" + /locus_tag="SPC17A_0017" + CDS 15869..17089 + /gene="ugd" + /locus_tag="SPC17A_0017" + /note="member of homology group 20" + /codon_start=1 + /transl_table=11 + /product="UDP-glucose 6-dehydrogenase Ugd" + /protein_id="CAI33493.1" + /db_xref="GOA:Q4K1C8" + /db_xref="InterPro:IPR001732" + /db_xref="InterPro:IPR008927" + /db_xref="InterPro:IPR013328" + /db_xref="InterPro:IPR014026" + /db_xref="InterPro:IPR014027" + /db_xref="InterPro:IPR014028" + /db_xref="InterPro:IPR016040" + /db_xref="InterPro:IPR017476" + /db_xref="UniProtKB/TrEMBL:Q4K1C8" + /translation="MKLAVVGTGYVGLSISVLLSQHHEVVAVDIIPEKVNLINEGKSP + IKDDYIEEYLANKSLNLVATLDASKAYTDADFVIIAAPTNYDSEKNFFDTSAVEKVIE + TVLEINPNAVMVIKSTVPVGYTQWVRNKYKTNNILFSPEFLRESKALYDNLYPSRIIV + GLDMDDAYLRERAETFAKLLQEGAIKEAIETLYMGFTEAEAVKLFANTYLALRVSYFN + ELDTYAEVKGLDTKAIIEGIGLDPRIGNQYNNPSFGYGGYCLPKDSKQLLANYKDVPQ + NMITAIVESNRTRKDFIAEQILKFAEVSSNGDIHTKDVIIGLYRLTMKSNSDNFRQSS + IQGVMKRLKAEGVNVIIYEPTLSDNETFWGSKIVNDLEYFKSISNVIVANRYDDLLKD + VSDKVYSRDIFKRD" + misc_feature 15869..16426 + /gene="ugd" + /locus_tag="SPC17A_0017" + /note="HMMPfam hit to PF03721, UDP-glucose/GDP-mannose + dehydrogenase, score 5.2e-50" + misc_feature 16454..16735 + /gene="ugd" + /locus_tag="SPC17A_0017" + /note="HMMPfam hit to PF00984, UDP-glucose/GDP-mannose + dehydrogenase, score 2.4e-36" + misc_feature 16817..17068 + /gene="ugd" + /locus_tag="SPC17A_0017" + /note="HMMPfam hit to 
PF03720, UDP-glucose/GDP-mannose + dehydrogenase, score 5.1e-06" + gene 17102..18202 + /gene="glf" + /locus_tag="SPC17A_0018" + CDS 17102..18202 + /gene="glf" + /locus_tag="SPC17A_0018" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI33494.1" + /db_xref="GOA:Q4K1C7" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR006076" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K1C7" + /translation="MYDYLIVGAGLSGAIFAYEATKRGKKVKVIDKRNHIGGNIYCED + VEGINVHKYGAHIFHTSNKKVWDYVNQFAEFNNYINSPIANYKGSLYNLPFNMNTFYA + MWGTKTPQEVKDKIAEQTAHMKDVEPKNLEEQAIKLIGPDIYEKLIKGYTEKQWGRSA + TDLPPFIIKRLPVRLTFDNNYFNDRYQGIPIGGYNVIIENMLKDVEVELGVDFFANRQ + ELETSAEKVVFTGMIDQYFDYKHGELEYRSLRFEHEILDEENYQGNAVVNYTEREIPY + TRIIEHKHFEYGMQPKTVITHEYPADWKRGDEPYYPINDEKNNAMFAKYQEEAAQNDK + VIFCGRLADYKYYDMHVVIERALEVVEKEFSN" + misc_feature 17537..18139 + /gene="glf" + /locus_tag="SPC17A_0018" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 7.4e-136" + gene 18230..19099 + /gene="rmlA" + /locus_tag="SPC17A_0019" + CDS 18230..19099 + /gene="rmlA" + /locus_tag="SPC17A_0019" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI33495.1" + /db_xref="GOA:Q4K1C6" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q4K1C6" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLT + GIKDILIISTPQDLPRFKDLLLDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFIGDDSV + ALILGDNIYHGPGLSTMLQKAASKESGATVFGYHVKDPERFGVVEFDQDMKAISIEEK + PEQPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLALAQPLKKN + EYGQYLLRLIGEA" + misc_feature 18233..18949 + /gene="rmlA" + /locus_tag="SPC17A_0019" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 3.3e-118" + 
gene 19100..19696 + /gene="rmlC" + /locus_tag="SPC17A_0020" + CDS 19100..19696 + /gene="rmlC" + /locus_tag="SPC17A_0020" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI33496.1" + /db_xref="GOA:Q4K1C5" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:Q4K1C5" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPASFFTEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKHHPLLKDVKPLKKEDLE" + misc_feature 19136..19666 + /gene="rmlC" + /locus_tag="SPC17A_0020" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 1.1e-15" + gene 19706..20755 + /gene="rmlB" + /locus_tag="SPC17A_0021" + CDS 19706..20755 + /gene="rmlB" + /locus_tag="SPC17A_0021" + /EC_number="4.2.1.46" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI33497.1" + /db_xref="GOA:O54546" + /db_xref="HSSP:1KEP" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:O54546" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPDVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAAD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 19721..20677 + /gene="rmlB" + /locus_tag="SPC17A_0021" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.00012" + misc_feature 19724..20464 + /gene="rmlB" + /locus_tag="SPC17A_0021" + /note="HMMPfam hit to PF01370, NAD dependent + 
epimerase/dehydratase fam, score 5.4e-77" + misc_feature 19727..20539 + /gene="rmlB" + /locus_tag="SPC17A_0021" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/iso, score 1.4e-05" + gene 20821..21672 + /gene="rmlD" + /locus_tag="SPC17A_0022" + CDS 20821..21672 + /gene="rmlD" + /locus_tag="SPC17A_0022" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI33498.1" + /db_xref="GOA:Q4K1C3" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K1C3" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITDAEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELNFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 20821..21669 + /gene="rmlD" + /locus_tag="SPC17A_0022" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 8e-147" + misc_feature 20824..21465 + /gene="rmlD" + /locus_tag="SPC17A_0022" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.0001" + misc_feature 20824..21453 + /gene="rmlD" + /locus_tag="SPC17A_0022" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 5.2e-19" + misc_feature 20827..21555 + /gene="rmlD" + /locus_tag="SPC17A_0022" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 1.4e-08" + gene order(21717..21830,21834..22917) + /gene="glf" + /locus_tag="SPC17A_0023" + /pseudo + CDS join(21717..21830,21834..22253,22220..22354,22330..22917) + /gene="glf" + /locus_tag="SPC17A_0023" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /pseudo + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + misc_feature join(22170..22220,22253..22330,22354..22773) + /gene="glf" + 
/locus_tag="SPC17A_0023" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 1.4e-95" + /pseudo + gene 23151..>23198 + /gene="aliA" + /locus_tag="SPC17A_0024" + CDS 23151..>23198 + /gene="aliA" + /locus_tag="SPC17A_0024" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33500.1" + /db_xref="UniProtKB/TrEMBL:Q4K1C2" + /translation="MMKSSKLFALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcgta taaaaacaag + 181 ggaggactgt ataaaagaca gaaatccttt gttttttata accaaggttt ataaactttc + 241 attatcgaaa ttcaattaac tttacaaatt cccactattt acttggtggt ttagctctcc + 301 tgttttctct tttagcttta accagccata aatggtatta cgcgagattt ggaaaacgtg + 361 tgatgcttct gttatactac ctgttcgctc acaataagag agaacttttt tacgaaaatc + 421 tattgaatat gccataaaaa gattatacca cattgtgtac tatattatat attatattga + 481 aactagaata gtacacatct gcttctaaaa tattgttaga aaacgatttg actgtcctga + 541 tcaatttgtc atgttcttat ttcattttac tatatttttg gttcgcggga agtctactaa + 601 gatacttaaa gatgcagata gtgaaaataa aggtgtagac attaccgtaa aaaagtgata + 661 taattgtatg atgttcaatg tataggtgtt aatcatgagt agacgtttta aaaaatcaag + 721 ttcacagaaa gtgaagcgaa gtgttaatat agttttgctg actatttatt tattgttagt + 781 ttgtttttta ttattcttaa tctttaagta caatatcctt gcttttagat atcttaatct + 841 agtggtaact gcgttagtcc tactagttgc cttggtaggg ctactcttga ttatctataa + 901 aaaagctgaa aaatttacta tttttctgtt ggtgttctct atccttgtca gctctgtgtc + 961 gctctttgca gtacagcagt ttgttggact gaccaatcgt ttaaatgcga cttctaatta + 1021 ctcagaatat tcaatcagtg tcgctgtttt agcagatagt gagatcgaaa atgttacgca + 1081 actgacgagt gtgacagcac cgactgggac tgataatgaa aatattcaaa aactactagc + 1141 tgatatcaag tcaagtcaga ataccgattt gacgatcgac cagagttcgt cttacttggc + 1201 agcttataag agtttgattg caggggagac taaggccatt gtcttaaata gtgtctttga + 1261 aaatatcatc gagtcagagt atccagacta tgcatcgaag ataaaaaaga tttataccaa + 1321 gggattcact aaaaaagtag 
aagctcctaa aacgtctaag aatcagtctt tcaatatcta + 1381 tgttagtgga attgacacct atggtcctat tagttcggtg tcgcgatcag atgtcaatat + 1441 cctgatgact gtcaataggg atacgaagag aatccttctt acaacaactc ctcgagattc + 1501 atatgttcct attgctgatg gtggaaataa tcaaaaagat aaattgactc atgcgggcat + 1561 ttatggagtt gattcgtcca ttcacacctt agaaaatctc tatggagtgg atatcaatta + 1621 ctatgtgcga ttgaacttca cttcgttttt gaaattgatt gatttgttgg gtggaattga + 1681 tgtttataat gatcaagaat ttactgccca tacgaatgga aagtattatc ctgcaggcaa + 1741 tgttcatctt gattcagaac aggctatcgg ttttgttcgt gagcgctact ccctagcaga + 1801 tggcgatcgt gaccgtggtc gcaaccaaca aaaggtgatt gtggctatcc ttcaaaaatt + 1861 aacgtcaacc gaagcactga aaaattatag tacgatcatt aatagcttgc aagattctat + 1921 ccaaacaaat atgccacttg agactatgat aaatttggtc aatgctcagt tagaaagtgg + 1981 agggaattat aaagtaaatt ctcaagattt aaaaggtaca ggtcggacgg atcttccttc + 2041 ttatgcaatg ccagacagta acctctatgt gatggaaata gatgatagta gtttagctgt + 2101 agttaaagca gctatacagg atgtgatgga gggtagatga aatgatagac atccattcgc + 2161 acatcgtctt tgatgtagat gatggtccca agtcaaggga ggaaagcaag actctcttgg + 2221 cagaagccta cagacagggg gtgcgaacca ttgtctctac ctctcaccgt cgcaagggca + 2281 tgtttgaaac tccggaagag aagatagcag aaaactttct tcaggttcgg gaaatagcta + 2341 aggaagtggc gagtgacttg gtcattgctt acggggctga aatttactac acaccagatg + 2401 ttctggataa gctggaaaaa aagcggattc cgaccctcaa tgatagtcgt tatgctttga + 2461 ttgagtttag catgcatact tcctatcgtg agattcatag cgccttgagc aagatcttga + 2521 tgttgggaat tactccagtc attgcccaca ttgagcgcta tgatgctctt gaaaataatg + 2581 aaaaacgcgt tcgggaactg atcgatatgg gctgttacac gcaagtaaat agttcacatg + 2641 tcctcaaacc caaacttttt ggcgaacgtt ataaattcat gaaaaaaaga gttcagtatt + 2701 ttttagagca ggatttggtt catgtcattg caagtgatat gcacaatcta gacagtagac + 2761 ctcctcatat ggcagaagca tatgaccttg ttacccaaaa atacggagaa gcgaaggctc + 2821 aggaactttt tatagacaat cctcgaagaa ttgtaatgga tcaactaatt taggagaaat + 2881 gatgaaagaa caaaacacga cagaaatcga tgtatttcaa ttagttaaaa ccttgtggaa + 2941 acgcaagcta atgattttat tagtggcact tgtgacaggt 
gcgggggctt ttgcatatag + 3001 cacttttatt gttaagccag aatatacgag taccacgcga atttacgtag tgaatcgaaa + 3061 tcaaggagac aagccggggc tgacaaatca ggatttgcag gcaggatctt atctggtaaa + 3121 agactaccgt gagattgtcc tttcgcagga tgtattggaa aaagtagtga caaatttgaa + 3181 gttggatatg ccagcaaaaa cgttagccag caaagttcaa gtgactgtac cagctgacac + 3241 tcgtatcgtc tcaatctctg tcaaggataa acagccagag gaagccagtc gtatcgctaa + 3301 ttttctacga gaagttgctg cagaaaagat cgtcgctgta acgcgagtat ctgatgtaac + 3361 gacacttgaa gaagcgcgac cagctacaac tccctcttct ccaaatgttc gacgcaattc + 3421 cttgtttggt tttcttggag gagcagtcgt aacagtaatt gctgttcttt tgattgagtt + 3481 gctcgacacc cgtgtgaaac gtcctgaaga tgttgaagat gtactgaaaa ttccactttt + 3541 agggctcgtt ccagattttg acaaaataaa ataggaggaa gttatgccaa cattagaaat + 3601 ctcacaggca aaattggatt ctgtaaaaaa ggcagaggaa tattataacg ctttgtgcac + 3661 gaacctacag ttaagtggag atggtttgaa agtattttct atcacttctg tgaaaatagg + 3721 agaaggaaaa tcaacgactt ccgccaatat cgcttgggct tttgcgcgtg caggttacaa + 3781 aacgctgctg attgatggag atattcgcaa ttctgttatg ttaggtgtct ttaaagcaag + 3841 gaataagatt acaggcctga cagaattttt atcaggaact acagacctat cacaagggct + 3901 ttgtgatacc aatatcgaaa atctctttgt aattcaggct ggctctgtgt caccgaatcc + 3961 gacagctctt cttcaaagta agaatttcac tacaatgctt gaaaccttgc gtaaatattt + 4021 tgactacatc attgtagata ctgctcctgt tggtgtcgtg attgatgcgg ctattattac + 4081 gcgaaactgc gatgcttcta ttttagtgac ggaggcaggt gaaataaatc gtcgggatat + 4141 tcaaaaagca aaagaacagt tggaacacac aggaaagccg tttttgggaa ttgtgttgaa + 4201 taaattcgat acttcagtag acaaatacgg ttcttatgga aattatggag attacgggaa + 4261 aaataaaaaa taggtcgggg gatagagatg aatggaaaaa tattaaggtc ttcattggcc + 4321 ataatccaga gttttcttgt tattttattg acttatctac ttagtgctgt gagagaaacg + 4381 gagattgttt caacaacagc tattgcactt tatatcctcc attattttgt cttttatatc + 4441 agtgattatg gacaggattt ctttaaaagg ggatatttga ttgaacttat ccagacattg + 4501 aaatatatcc tattctttgc actagcgatt agtatttcta attttttctt agaggatcaa + 4561 tttagtattt ccagacgagg catgatttac ttcctaacat tacatgctct cttagtctat + 4621 
gggctaaacc tatttatcaa gtggtattgg aagcgggctt atcccaactt taaaggaagt + 4681 aagaagattc tcctacttac agcaactttt cgtgtcgaaa aggtactgga tagattaata + 4741 gaatcaaatg aggttgttgg ggagttggta gctgtcagtg tcttagataa accagatttt + 4801 cagcatgatt gtttaaaggt agtagcagag ggggagatag taaactttgt gactaatgag + 4861 gtggtcgatg aagtctttat caatcttcca agtgaaaaat acaatattgg agagcttgtc + 4921 tctcagtttg aaacgatggg aattgatgta acagtcaatc taaatgcttt tgatcgtagt + 4981 ttggcacgta acaagcaaat tcgtgagatg gcaggattaa acgttgtgac tttttctaca + 5041 acattttata agactagtca tgtaatcgct aagcggatta ttgatatcat gggtgcattg + 5101 gtagggctga tactatgtgg tttagtcagt attgtactgg ttcctttgat tcgaaaggat + 5161 gggggctctg ctatttttgc tcagacgcgt ataggaaaaa atggtcgtcg gttcactttt + 5221 tataagtttc gctctatgtg tgtagatgcc gaggcgaaaa aaagagaact catggaacaa + 5281 aataccatgc agggtggaat gtttaaggtg gacgatgatc ctcgtatcac gaaaattggt + 5341 cgttttatac ggaagactag cttggacgag ctaccacagt tttataatgt tctaaaggga + 5401 gatatgagtt tggttggcac acgaccacca acagtggacg agtatgaaca ctatacccca + 5461 gaacaaaaac gtcgtctgag ttttaaacct ggcataacag ggttatggca ggtcagtgga + 5521 cgaagtgaga ttaagaattt tgatgaagtt gtcaaattag atgtagccta tatagacgat + 5581 tggacaattt ggaaagatat tgagatttta ttgaagacag ttaaagttgt attgatgaag + 5641 gatggagcga agtagattga tagatgtaaa aatcattgtg gcaacacata aagaagttaa + 5701 aatgcctcaa gacagtagtc tttaccttcc aatacatgtt gggagagacg gtaaatcaga + 5761 tattggtttt atcggtgata atactggcga taatatatcc tctctaaatc catattattg + 5821 tgagttgacg ggactttatt gggcatggaa aaatcttgat tataattact taggtttagt + 5881 tcattaccgt cgttatttta caaataaatc tcaagggtat aatgaaaata tcaatatgga + 5941 tgacgtcatt ttgtctcgat ctaatgttga aatattatta gagaaatctg acataatagt + 6001 tccaaagaag cgaaagtatt atattgaaac tctttattca cattatgccc atacccttaa + 6061 cggcgaacat ctggatcttg ctaggaaaat tattgagcaa aatagttcag agtatctttc + 6121 atcctttgat aaagtgatga aacaaagaag cggttatatg ttcaatatgt ttatcatgaa + 6181 aaaagaacta ttagatgatt atttaccgtg gcttttttct attctggata ctatgtacga + 6241 acagatggac ttgaccgact 
atactccatt tgagtcacgt ttgttcgggc gagttagtga + 6301 gttgttgttt aatgtttggt tatgtaaaaa aggaataacg cctaaagagg taccatttat + 6361 gtacatggag agagtggatt tatttgaaaa aggaaaatct tttttaatgg ctaaattttt + 6421 tggaaagaag tatggacaga gtttttgaaa tgttagaaaa agaatctcca ctttttagtg + 6481 ttattgttcc aacctataag atatcagaat ctaatctacg ccaatgtata gactctctgt + 6541 tatatgatag tcaagatgtt gagattattt tggtagatga caataaaaac ttggatatat + 6601 gtggaaaagt gttggacgaa tatgctgaaa aatataataa tatttcagtt attcatcaag + 6661 aaaaccaagg tgtgtcagtc gcaagaaatg ctggtatgtc aattgctgta ggaaagtatc + 6721 ttatttttgt agatcccgat gattgggttg ctgaaaattt ttatagtcaa atgacccttg + 6781 cggttcaaaa aaatccttca agcgatgtga ttatattagc tgctattgta gactacaatg + 6841 gtaaacaatt tacgaatcat ttttggcaca cctctcgttc ttttcaggga acagataaag + 6901 atgatctgga acttcaattg attgctaaag gagcaacgag ttatttccca actgagatag + 6961 gggttggtgt tccctgggca aaaatttatc gtaatgagtt tgtgcgagaa aatggcttag + 7021 attttaatcc ttctcttcgc cgaatgcaag ataatatttt caatatgtat gcatttgaat + 7081 ttgcgaatga aatcgtctac attgatgagc cgatttacta ttatagaaag agtatggata + 7141 gtgtaactaa taagaaaaat gataaagtaa tttattattt cgacttagtt aatgatgagg + 7201 ttgaaaaatt tattcaaaaa tttaataaac ctaaaatatt tgaagatgct ctacatataa + 7261 aaagacttat aggtatcaat tcgtattata agttgtattt taagtttgca tctacttcaa + 7321 gcgagaaaaa gaaaatgcga caagaatttc gtgaactttt agaaagggaa gaatatgtaa + 7381 attcgttaaa aaaagtgaat acagcttatc ttcttccaaa agaaaaaatt tttataagca + 7441 ttttaaagca gaaagactta cggatattct cattgttaca aaaacttgaa aagttgtctg + 7501 tgatgttgaa gagtcgtcag tttagttaga ggggatatga gacagttagc attagaatta + 7561 gtcagtatca tttataaagt aacaaagcga atacctatat cttttatttc taatttaggt + 7621 gagaagattt attcattcaa ggatccctat gtttttaacg tattaagtac attgggagtg + 7681 gataaagaga gcgcctatga tttgatacct ccaaatttat ttttgaataa aatttggatt + 7741 tgctggtttc agggtgagga taaagcacca gatttagtaa aaaagtgtat tgatagtgtt + 7801 cgaaaacatg cctcaggcta cgatgtcatt atcttaacag aaggtaatat agaagaatat + 7861 gttacacttc caaatattgt tttaataaaa tataaaaatg 
gattatttag ccgaactcat + 7921 ttttcggata tagttcgaat gaatcttctt gcacaacagg gggggctttg gattgatgca + 7981 acgatttttg tgactaggga tttagatttg tctatatttt tcaaaaatga ttttgtaagc + 8041 ttgagaacca caatgaaatc tagtcctctt tttattacgg gatactggac gacatacttt + 8101 gtatatacgc cctctaattt taaattggtt caatatactg ctttattatt aaataaatac + 8161 actgagaaat atgatcgctt tatagattat ttcttacaag attatataat tactaaagca + 8221 attaaagatt tgaattatga atcatacatg gaagaacggc ctgtattggg aaatcaacga + 8281 tggcttttag cagatttggc taataaagtt atgacttcgg atcttcttca acaatttaaa + 8341 caagatacag tgggaattta taaattgaca tataaatcca agtacattag agaaaaaaat + 8401 ggtagggaaa cggtttataa aaaaattgta gaggatggag aatatcttga ataaaaaaat + 8461 aggaattgtt attttaaatt atcttaattg ggaggatact ttagattgca taagtagttt + 8521 gcgattgcaa agtaatcaaa actttgaagc tgtcatagta gaaaatggtt ctcccaatga + 8581 atccgtttct aggattagag attttataaa aaatgacaag aatattcatc tttatgtagt + 8641 agagaataac ttaggttatg caaatggaaa taatatgggc atcctctact taaaaaataa + 8701 atactctata aatagaatta tattaactaa taatgatgtt atatttgatg ataaaaatta + 8761 tataagtaaa ttaatagaca ttgaatatga tgggaatatt ggagctattg gaacaaaaat + 8821 tattggttct gatggtttaa accaaaatcc agcttatttt ccaatttctt ttagttctag + 8881 tataaaatca cttattatta atttattggc attttctaaa gttattgctt ctatcaaaaa + 8941 gcgttttcta tcttcatggg cgaaaaaagc taatgatttt tcaagtccaa agactagtaa + 9001 acaaaaatac tttctacatg gatcggttat ttttcttacg gaaaattatt tagataagtt + 9061 tatggggttg tatggtggga cttttcttta ctatgaagaa gtaatcctag gtattatatt + 9121 tgaaaaggca ggtcttgata tgctgtatat acctgagttt tcaatttacc ataaagagga + 9181 ccaatcttca attcgaagct ttaataatga tgacttagta cgacgtcgtt atttgttgaa + 9241 tagcatttgg tctagtttta aagtttatct tgctaaccag gaagaactcc cgaatattgt + 9301 tagtgactct atatataaac atattaagga ataggaatta ttatggtcaa aaaaattgct + 9361 ttctatcttc ctcagtttca taccattcca gaaaacgata agtggtgggg aaaagatttt + 9421 actgaatgga ctaatgtgaa gaaatctcag ccccaataca gaggacatat tcagcctgaa + 9481 gttccattaa atgaagaata ctataacctc ttagatacag aagttcaaga aaaacaagca + 9541 
aaattagctt tagagtacgg tattgatggt ttttgctatt atcattattg gtttgatgga + 9601 aagctccttc tggagaaacc tatggagaat atgctgcaaa atgagaatat aactttaccc + 9661 ttttgtattt gttgggctaa tgagagctgg tcgagaactt gggatggtgc tgaaagtaag + 9721 gtcttaatta tgcaaaatta ctcagatact ttggatggat ggaagaggca ttttgattat + 9781 cttttaccct tttttaaaga tgaacgttat atcaaggttg atgaaaaacc aatgatgatt + 9841 atttacaagc ctcaactaat tgagaactta gaagagatga ctgtttattg gaaccaattg + 9901 gctaaacaaa atggttttaa gggtattcat tttggacatc agcatgtttc atcttttgaa + 9961 gattcaaaag taatagaaaa ctttgatttt ggtattgaat ttgaaccaat ctatacggta + 10021 tctgagatgc ataaaagtac aagaagtaag tcagaaaaat taaagcgggc aataaaaaat + 10081 cctaaatggt tttcaagaaa tatcagccat aaatattttg gccgttcgct cttatttgac + 10141 tatgatgaag tatggtcagc tattttacgg cgtgaaggaa gaaaaaatat ttcaccaggt + 10201 gcctttgtgt catgggataa tactccgaga cgcgggaacc gctctctagt atttgatggt + 10261 gcaaatccta aaaagtttga gaaatatttt gctaagcaag tacaacgtgc gaaagaagaa + 10321 tatcattctg atttcatatt tattaacgct tggaatgaat gggcagaagg ggctcattta + 10381 gagcctgatg agcagtatgg ttacggttat ttagaagcgg tgagagctgt aaaggaggaa + 10441 tagtgtgtta attggtcgtc tgaaacaaag gctgaagatt gaaaaattta ggagatcatg + 10501 gcgagaaaaa aatacgcata atactacaat ggcgagtagt atttttgata tagataaagt + 10561 ttcagtggga aattacactt atggaaatat cgatatccta gattttggaa ctaatgaaaa + 10621 acttagtata ggaagttttt gttcaatagc gccgaatgtt aaatttattc tgaatgctga + 10681 ccactgcacc aattacttca ctacctttcc attaaaggta aaagttctac aaaatcaaga + 10741 taaagaagga atttcaaagg gtgatattat cgtgggtgat gatgtatggt tggggcttaa + 10801 tgcagtcatt ctttcaggtg taacgattgg acaaggagct ataattgcgg caggagcagt + 10861 ggtaaccaaa aatgttccac cttatgctat cgtcggtggc aatccagcac gaataataaa + 10921 gtatagattt gaagctgaaa taattgataa actgttaaaa gttaattttt caaaattatc + 10981 taagtatgat atagaaaaac atataaaaca aatgtatata ccattagttg aggtaaaaca + 11041 actagattgg atagacgact tattacatta agaggtagaa taagtgaaat ctgaaattaa + 11101 agtttctgta gtaattccaa tatataatca agagatttac ttaaggaagt caatacattc + 11161 
agtactgact cagagttatc aaaatttgga aattatagcc gttaatgacg gttcaattga + 11221 ttcaagtcaa caaattatgg aagaatttgc aaatcaggat agcaggattt ttctttatga + 11281 aaaatcaaat ggtggattag ttgatgcaac aatatatggt gtagaaaagg ctacggggga + 11341 ttatatagtc tttcttgatc cagatgatta cattggggaa aattatattc aaaagtttgt + 11401 atcttacctc gaccatgact atgattttgt agctatggga ttttattatg atgataacga + 11461 taaggttact ccatacagat taaaagagaa tctaattcta aataagactc atatagaagt + 11521 attaaaatca accttcttaa ctaattttga tttagggact atttcgaatc agatatttat + 11581 ttcaagatgg aataaacttt accgctgtga tattgtcaaa agtgttattt cggagtttaa + 11641 gtcatataag aatgtaactc tcggagaaga tacaattttt gctgctctgt tacttaaata + 11701 ttctcagtca gctaaaattt tgcaacaagc taatacttat ttctataata ttgcaaatca + 11761 gaattctatg atgaaaagta gcgatttaga taagtatttg aacaaatgtt atcaagtatt + 11821 tatgagtttt agtaaattac ttgaagagca agaattagat aaaactcaag cttactatct + 11881 gtattttttc ttaactaata ctctttttaa cagattaagg actaatgatc caaaacagtt + 11941 ttatggttta tttgataaac ttaagagaga accagtatat ataaaaacat taaatatggt + 12001 tcgaaaaaat acgaaaagta agtttataag tttcgatctg tttttaagac tctatacgac + 12061 ttgttcacaa tatatatata taaaggatag tattgaacgt actaagacct ttgtacggaa + 12121 ttttaaatat tttagtcggc aagtcagaaa aaataatatt attaaggcct atcagctatt + 12181 gaattttttt aggagtcgtc aaaatgcttt ttatgagtta aaaaatcaac ttcctaagat + 12241 tgagggagaa ataaataaca ttttacttca acatgatagt aatgaattta atgaagaaga + 12301 aggcatagaa gaaaagattt ttgttttttg gtgggatgga tttaatgatt taccagaaat + 12361 tgttgcagaa tgttttaagt ctttgaagaa gcagtatcag gaatatcaga ttattcctat + 12421 ttctaaagac aattttgaag agtatacgga tattcatcct gtgttgttaa aagagtttaa + 12481 agctggtaaa atttctatac agactttttc tgatattttg aggtttaatt tattgaaaaa + 12541 taatggtggt atgtgggtag atgcaacaat ctactttacg aggaaagttg atttgttttc + 12601 acagttagaa agacaatcat ttgctacaat aagtttttcc acaagcaaag attttttgga + 12661 gtataaagga gagttttgca gttggacagg ctattttatt gcttcacgga aaaatggccg + 12721 ctttgttcaa atgatggata tgttatttag agagtattat ctcaaataca gaaattttca + 12781 
aatttatttt tttattgatg cattgtttat gatttgtaaa gttaataaaa ttgatagtgg + 12841 tgttttggat aatccattat atattgaagg gaatatgtgg acgctgtcaa acttactaaa + 12901 atcaaaatat gatgatcaat tattaacttt gattaaaaaa attccccaaa agttagcttg + 12961 gttttttgaa ccacttagcg atagcacgga tactttctat aatcaattaa tttcagaaaa + 13021 aatcaagcaa aaggagtaga actatgatta aagtgtctaa acagaatgct atattattct + 13081 tattactgct cccgtttttt atgccaactt attttgaaat tttaccattt ggatacttgt + 13141 tgtatagatt aggcatgatg tttagcatag gatatatttc tttatcttac ctaatattaa + 13201 agaaaaattt ttcttccatc acctggttga ttgttatcta tgagatatta gtagtttctt + 13261 taacaatttt acaaaaaggt gaaatctata ctgcaatatg gaatgcagaa aaaattattg + 13321 gactggtttt attagtagat tactaccaag aaaatattat tagcttctta aaagttgtac + 13381 tggtacattt tgagtggttg atttatatca attttattac aattttatta ttttcagagc + 13441 gctttttttc tagattcact tctgcttatg gttttaccca agaatggttt ctaggttccg + 13501 tcaataactt tattttctgg ttttttccag ctcttgtagt agcgtggttg tattattttt + 13561 tgtcaggtaa aatttttaga acgtgtagtt taacagttgt tattgcttta acagaattaa + 13621 ttagaggctc agcaacgggg aggattgcag tatttctatt tatcttattt gttacctcgt + 13681 cttggttacg taagattatt tcgccaaagt tagtatttat aggtgttact gtcctaggaa + 13741 tttttgttgt atttctccaa aatgtagact tcttagagcc tattgtggta cagttacttg + 13801 gtaaaaaaat gacatttagc aatcgtacct atatctggtc gaatgctgtg acagtaattc + 13861 aaaagaattt cgttggtcta ggtttacaat catctgatta tgtcattcga ttgcttggaa + 13921 atattaatgg ttatttacaa cctacggtaa cccacgccca taatgagttt ttacaagttg + 13981 cttttcaaac aggaatttta ggatttattc tttattgttg gatatatatt aaagtcttga + 14041 tcaatgcagt aaagttgagt ggaccaatag cgcaaactgt tatgctgttt tttgctgttt + 14101 ataatgttat tgctataaca gaaacgttag aactgagtca aatatatatg ttatttcctt + 14161 tgatttattt tgtaatgcaa tatactgcag aaagaaagta aggtaatgaa taacgaaaaa + 14221 agtttaagct ccaagataat atcaggaagt ttttggaaat tcggagaaag aatgagtgca + 14281 caggcggttt ctttttttgt ttctctgatt ttaacacgaa tcttatcccc aagtgattac + 14341 gggattattg cgattattaa tatttttata gctattgctg atgtactttt agctagtggt + 14401 
ttaaatactg ctttgataca gaaaaaaaat tcaacgagac tagattataa tacgattttt + 14461 tggtgtaata ttatactggg ttgtgttctg tatctagtat tatttttagt agcaccagtc + 14521 cttgcagatt tttataatat ttctatactt acaccagtca ttcgaatttt tgcactgcgg + 14581 ttacccattt cttcttttca atcaattcaa aacgcatttg tttctaagca tatgcagttt + 14641 aagaagtttt tttacgccac ctttttgggt tcgctagtat ctgctgttgt tggaattaca + 14701 atggcttata caggttttgg tgtatgggca cttgtagcac aatatttagt aaatacggtt + 14761 gttggaacag ctacactatt tgctatcatt agttggcgtc caaaatttga attttctttg + 14821 gaaagtgcca aacccttagt ccaatatggc tggaagataa tgtttacaga ccttacaggt + 14881 acgattttca acaatttagg agactttatc attggcgcat actataattc atcttcactt + 14941 gctttttatt ctaaagggcg ccaattaccc tatctaatta gaaataatat ttttacttct + 15001 ttgataagtg tactcttccc aggaatgtct caggttaatg atgatattga acgtattaaa + 15061 tctttttcac gtaagagtgt ctcaatctta tcttttttaa tttttccaac aatggttggt + 15121 ttaattgtga ctgctgaacc actaactatc ttaatgtata ctgaaaaatg gctacctatt + 15181 attcccttcg ttgtgattgt atgttcggaa gcaattttat cagttatacc aacggtaaca + 15241 atgcagacaa ttaaagcatt aggacgtagt gatttaacac taaaaataga atttataaaa + 15301 aagcccattt atctattaac gatttttgta tctttaaact ttggaatagt ggctattgcc + 15361 tttacattaa ttattaatgc gattattgaa atgattatta atggtttaat tgtacaaaga + 15421 ctaatcaagt actctttgtg ggaacaattt aatgatatat ttggttcatt aatgatttca + 15481 attatgatgg gcttattatc atatttagtg atttttttaa atttaaacat ttatctcaca + 15541 ttattgttac aagttgttac tggtgtctct agttatctca ttttagctat tgtatttaaa + 15601 aacgaatcat tcattgagtt gaaaaataga tttttgagca ctgagtagta ttaagtctaa + 15661 gaattatcct gcgggaatag ctggtgaatt tttgggggtg aaaaggactt gggtaagata + 15721 ttttataatg aagccctagc aataatgtgt ttatttcatg cccccatttg ttctggaaaa + 15781 acttgtaata gttaagtgat aactaatagc caatgaaact tgggattgaa attattccca + 15841 tgaatatgta taatgaggag gagttaaggt gaaacttgca gttgttggaa ccggatacgt + 15901 tggattgtct atctcagttc tattatctca gcatcatgag gtggtggctg tcgatattat + 15961 tccagaaaaa gttaatctaa ttaatgaagg gaagtcccct attaaagatg attatattga + 16021 
agaatattta gcaaataagt ctcttaattt ggtagcgacg ttagatgcat ctaaggcata + 16081 tactgatgct gattttgtaa ttattgcagc gccaacaaat tatgattcgg aaaagaactt + 16141 ttttgataca tctgctgtag agaaagttat tgaaacagtg ttagagataa atcctaacgc + 16201 tgttatggtt attaaaagta cagttcctgt aggatatact caatgggttc gtaataaata + 16261 taaaacaaat aatattttat ttagtccaga atttctgcgt gaatcaaagg ctttatatga + 16321 caatttatat cctagccgta taattgttgg acttgatatg gacgatgcat atttgaggga + 16381 gagggccgaa acttttgcaa aactgcttca agaaggagct attaaagagg ctatagaaac + 16441 tctttatatg ggatttacag aagctgaagc agttaaactc tttgcaaata catacttggc + 16501 cttacgagtt tcgtatttca atgagttgga tacttatgca gaagttaaag ggttagatac + 16561 caaagctatt attgagggta ttggcttaga tccacgtatc ggaaaccaat ataataatcc + 16621 ttcttttgga tatgggggat attgccttcc aaaagatagc aaacaattac tggcaaacta + 16681 taaagatgtt ccacagaata tgataacagc tattgttgag agtaatcgta ctagaaaaga + 16741 ttttattgca gagcagattt tgaaatttgc agaagtgtca agtaatgggg acattcatac + 16801 aaaagatgta ataataggtc tttatcggtt aactatgaag agtaattccg ataattttcg + 16861 tcaatcttct attcaaggtg ttatgaaacg attaaaggca gaaggtgtaa atgtcataat + 16921 ttatgaacca accctcagtg acaatgagac attttggggt agtaagattg taaacgattt + 16981 ggagtatttt aaatcaatta gtaatgttat cgtggcaaat cgttatgatg atttgcttaa + 17041 agatgtgagt gacaaggttt atagtcgtga tatttttaag agagattagg tagaagttac + 17101 aatgtatgat tatttaatcg ttggtgctgg tttgtcggga gcaatttttg cttatgaagc + 17161 aaccaagcgt gggaaaaaag taaaagtgat tgataagcgt aatcatattg gtggtaatat + 17221 ctactgtgag gacgttgaag gtatcaacgt tcacaagtac ggtgcccaca ttttccatac + 17281 ttcaaacaaa aaagtctggg attatgtaaa tcaatttgct gaatttaaca actatatcaa + 17341 ctcgcctata gccaattaca agggcagtct ttacaatctt ccttttaaca tgaatacttt + 17401 ctatgctatg tggggaacca agactcctca agaagtgaaa gataagatag ctgaacaaac + 17461 ggctcatatg aaagatgttg agcctaaaaa cttggaagaa caagctatta agttgattgg + 17521 tccggatatc tatgaaaagt tgattaaggg atatactgaa aaacaatggg gacgttctgc + 17581 gacagacctc ccaccattta tcattaaacg tctaccagtt cgtttaacct ttgataataa + 17641 
ttattttaat gaccgttatc aagggattcc aattgggggt tacaacgtta tcatcgaaaa + 17701 tatgctgaag gatgtagaag tagaacttgg cgttgacttt tttgccaatc gtcaagaatt + 17761 agagacttct gctgaaaaag ttgtcttcac agggatgatt gaccaatact ttgattataa + 17821 gcatggtgag ttagaatacc gtagtcttcg ttttgagcat gagattttag acgaggaaaa + 17881 ttatcaaggg aatgctgtag tgaactatac agagcgtgag atcccttata ctcgtatcat + 17941 cgaacacaaa cattttgaat atggaatgca gccaaagaca gttatcacgc atgaatatcc + 18001 agctgactgg aagcgtgggg acgagcccta ctatcctatt aacgatgaga aaaataatgc + 18061 tatgtttgct aaataccaag aagaagcagc gcagaatgat aaagttatct tttgtgggcg + 18121 tttagcagac tataaatatt acgatatgca tgtggtgatt gaacgggcgc ttgaggttgt + 18181 ggagaaagaa tttagtaatt gaaaaacaac gaagaaaggt tgcttatata tgaaaggtat + 18241 tattcttgca ggtggttcgg ggacacgatt atatcctttg actcgggctg catcaaaaca + 18301 acttatgccg gtttatgata aacccatgat ttactatcct ttgtcaaccc tgatgttgac + 18361 tggaataaag gacattttga ttatctcaac accacaggat ttgccccgtt ttaaggactt + 18421 gctcttggat ggttccgaat ttgggatcaa gctttcctat gcggaacaac ctagtcccga + 18481 tggacttgct caggctttta ttatcggtga agagtttatc ggtgacgata gcgttgcctt + 18541 gattttaggt gacaatatct accatggtcc tggtctgagc acaatgctac aaaaggcagc + 18601 gagtaaggag tcgggagcaa ctgtttttgg ctaccatgtc aaggatccag agcgctttgg + 18661 tgtggttgag tttgatcagg atatgaaggc tatttctatt gaagaaaagc cagagcaacc + 18721 tcgttcaaac tatgcagtta caggtctcta tttctatgat aatgatgtag tagagattgc + 18781 caagagtatt aaaccaagtc ctcgtggtga actggaaatt acagatgtaa acaaggctta + 18841 cctagatcgt ggtgatttgt ctgttgagct tatgggacgt ggctttgctt ggttggatac + 18901 tggcactcat gaaagtttac tagaggcttc gcagtacatc gaaacagtcc aacggatgca + 18961 aaatgttcag gtagcaaact tagaagaaat tgcttaccgt atgggctata tcagtcgaga + 19021 agatgtattg gccttagccc aaccacttaa gaaaaatgaa tacggacagt atctgctccg + 19081 tttgattgga gaagcataga tgacagataa ttttttcggt aagacgcttg cggcacgcaa + 19141 ggttgaagct attccaggca tgttggagtt tgatatcccc gttcatggag ataatcgtgg + 19201 ctggtttaaa gaaaatttcc aaaaggaaaa aatgcttcca cttggatttc cagcgtcttt + 19261 
ctttacagaa ggaaaattgc aaaacaatgt atccttctca cgtaaaaatg tccttcgagg + 19321 cctccacgca gagccttggg ataagtacat ctctgtagca gatggaggga aagttctggg + 19381 ttcttgggtt gatctacgcg agggtgaaac ctttgggaat acctatcaga cagtaattga + 19441 tgcaagcaag ggaatctttg ttcctcgagg cgtagctaat ggcttccaag ttttatcaga + 19501 tacagtgtca tatagctatc tggtcaatga ttactgggcg cttgaactca aacccaagta + 19561 tgcctttgtg aactacgctg atccaagcct tggtattgaa tgggaaaata ttgcagaagc + 19621 agaggtttca gaagcagata aacatcatcc cctacttaag gacgtgaagc ctttgaaaaa + 19681 agaagatttg gaataaggaa agaatatgac tgaatacaaa aatattatcg tgacaggtgg + 19741 agctggcttt atcggttcta actttgtcca ttatgtttac gagaactttc cagatgttca + 19801 cgtgacagtc ctagataagt tgacttatgc tggaaaccgc gcgaatattg aggaaatttt + 19861 aggtaatcgt gttgagttag ttgttggtga cattgctgat gcggagttgg tagacaagtt + 19921 ggctgctcaa gcagatgcta tcgttcatta tgcagcggaa agccacaatg ataattcgct + 19981 caatgatcca tcgccattta ttcatactaa cttcatcgga acctatactc ttttagaagc + 20041 tgctcgtaag tatgatattc gcttccacca tgtatcgaca gatgaagttt atggggatct + 20101 ccctttacgc gaagatttgc caggtcatgg tgaaggacca ggtgagaaat ttactgctga + 20161 aacaaaatac aacccaagct ctccgtactc atcaaccaag gcagcctcag atttgattgt + 20221 caaagcctgg gtgcgttctt ttggagtcaa agcaacgatt tccaactgtt caaataacta + 20281 cggtccttat caacatatcg aaaaattcat cccacgtcag attactaaca tcctaagtgg + 20341 tatcaagcca aaactttacg gtgaaggtaa gaacgttcgt gattggattc ataccaatga + 20401 ccattcttca ggagtttgga caatcttgac aaaagggcaa atcggtgaaa cctacttgat + 20461 tggggctgat ggtgagaaga acaataagga agttttggaa cttatcctta aggaaatggg + 20521 acaagctgcg gatgcctatg atcatgtgac tgaccgtgca ggacatgacc ttcgctatgc + 20581 gattgatgct agcaagctcc gtgatgagtt ggggtggaaa cctgaattta ccaactttga + 20641 agctgggctc aaggcaacaa tcaagtggta tacagataac caagaatggt ggaaagcaga + 20701 gaaagaagct gttgaagcca attatgctaa gactcaggag attattacag tataaaaagc + 20761 aggaaatagc tgctttttat tgctatattg ggaagagtta catattagaa aggtctagag + 20821 atgattttaa ttacaggggc aaatggccaa ttaggaacgg aacttcgcta tttattggat + 20881 
gaacgtaatg aagaatacgt ggcagtagat gtggctgaga tggacattac cgatgcagaa + 20941 atggttgaga aagtttttga agaggtgaaa ccgactttag tctaccactg tgcagcctac + 21001 accgctgttg atgcagcaga ggatgaagga aaagagttga acttcgccat caatgtgacg + 21061 gggacaaaaa atgtcgcaaa agcatctgaa aagcatggtg caactctagt ttatatttct + 21121 acggactatg tctttgacgg taagaaacca gttggacaag agtgggaagt tgatgaccga + 21181 ccagatccac agacagaata tgggcgtact aagcgtatgg gggaagagtt agttgagaag + 21241 catgtgtcta atttctatat tatccgtact gcctgggtat ttggaaatta tggcaaaaac + 21301 ttcgttttta ccatgcaaaa tcttgcgaaa actcataaga ctttaacagt tgtaaatgac + 21361 cagtacggtc gtccgacttg gactcgtacc ttggctgagt tcatgaccta cctagctgaa + 21421 aatcgtaagg aatttggtta ttatcatttg tcaaatgatg cgacagaaga cacaacatgg + 21481 tatgattttg cagttgaaat tttgaaagat acagatgtcg aagtcaagcc agtagattcc + 21541 agtcaatttc cagccaaagc taaacgtccg ctaaactcaa cgatgagcct ggccaaagcc + 21601 aaagctactg gatttgttat tccaacttgg caagatgcat tgcaagaatt ttacaaacaa + 21661 gaagtgagat aagtagtaga atgattttct agtctaataa aagaggcaga taatgaactc + 21721 caaaggagct taagatatac aattatcttg ttgttggtgc tggtctcttt ggtgcagtct + 21781 ttgcccatga agcggcctta aaaggaaaaa aagtaaaagt tattgaaaaa tgaaatcata + 21841 tcgcgggtaa tatctatact cgtgaagagg aaggaattca agtttatcaa tatggtgctc + 21901 atatcttcca tacttctgat aaggagatct gggattatgt aaatcagttt gcagagttta + 21961 accgttacat aaattctcct gttgcaaact ataagggtga gatttataac cttcctttta + 22021 atatgaatac tttcaataaa ctctggggag ttgtaacgcc agcagaagca caagctaaga + 22081 ttgatgaaca acgtgctatt ttaaatggta aaactcctga aaatttggaa gaacaggcga + 22141 tttctcttgt agctacagac atctacgaaa aattaatcaa agactataca gagaaacagt + 22201 ggggcaaacc aactactgaa cttccatcct ttattattgt ttgccagtac gcctgaccta + 22261 tgataacaac tattttaacg atacctatca agggattcca attggtgaat acactcaaat + 22321 agttgaaaaa tgttggatca tgaaaatatt gatgtagaaa caaacgttga tttctttgtg + 22381 aataaagagc aatatctgaa agattttcct aagattgtct ttactggtat gattgatgaa + 22441 ttctttgact ataagttggg cgaactagag taccgtagtc ttcgttttga aaatgagacc + 22501 
ttggatatgg aaaattacca aggaaatgca gttgtgaact atacggatgc agaaacccca + 22561 tatactcgca ttattgaaca caaacatttt gagtttggga gtcaagcaaa gactatcatt + 22621 actaaagaac attctaaaac atgggaaaaa ggtgatgagc cttattatcc agttaataat + 22681 gatcgtaata atcatttgta taaatcatat aaaaaacttg ctgatgagca agggaatgtt + 22741 atctttggtg gccgcttagg acactatcgt tattacgata tgcaccaagt aattggagca + 22801 gctttgcagt gcgtgagaaa tgagttagat tcatactcaa tgaaaatcaa agagcaaact + 22861 aggaagctag ccgcaggttg ctcaaaacac tgttttgagg ttgcagatgg aagctgacgc + 22921 ggtttgaaga gattttcgaa gagtataaac aagtaaaact gactaccagt tattatttag + 22981 aaatagtatt aaaaattcct tgactatgtg atatagttga gggattttta aatgatattc + 23041 atattttttg caaagatgtt gtttgaaaaa taattttcaa aaattctgaa aattctgttg + 23101 acaactttct gaaaagagtc tataatggag agaaagtttt aaaggagaaa atgatgaaaa + 23161 gttcaaaact atttgccctt gcgggcgtga cattattg +// + diff --git a/public/res/serotype_genbank/serotype_17F.gb b/public/res/serotype_genbank/serotype_17F.gb new file mode 100644 index 0000000..d4f4998 --- /dev/null +++ b/public/res/serotype_genbank/serotype_17F.gb @@ -0,0 +1,1041 @@ +LOCUS CR931670 22896 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain Rose (serotype 17f). +ACCESSION CR931670 +VERSION CR931670.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 22896) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 22896) + AUTHORS Bentley,S.D. 
+ TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..22896 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="Rose" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC17F_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC17F_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI33501.1" + /db_xref="UniProtKB/TrEMBL:Q4JZI8" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVELL" + gene complement(order(462..995,997..1323)) + /gene="tnp" + /locus_tag="SPC17F_0002" + /pseudo + CDS complement(join(462..995,997..1323)) + /gene="tnp" + /locus_tag="SPC17F_0002" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(join(933..995,997..1305)) + /gene="tnp" + /locus_tag="SPC17F_0002" + /note="HMMPfam hit to PF01710, Transposase, score 3.1e-23" + /pseudo + gene 1539..2984 + /gene="wzg" + /locus_tag="SPC17F_0003" + CDS 1539..2984 + /gene="wzg" + /locus_tag="SPC17F_0003" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33503.1" + /db_xref="GOA:Q4K1C0" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K1C0" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLLFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + 
VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGIDVYNDQ + EFTAHTNGKYYPAGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1539..1655 + /gene="wzg" + /locus_tag="SPC17F_0003" + /note="Signal peptide predicted for SPC0841 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 39 and 40" + misc_feature 1743..2090 + /gene="wzg" + /locus_tag="SPC17F_0003" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 8.6e-63" + misc_feature 2268..2711 + /gene="wzg" + /locus_tag="SPC17F_0003" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 2.5e-69" + gene 2986..3717 + /gene="wzh" + /locus_tag="SPC17F_0004" + CDS 2986..3717 + /gene="wzh" + /locus_tag="SPC17F_0004" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33504.1" + /db_xref="GOA:O86886" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:O86886" + /translation="MIDIHSHIVFDVDDGPKSREESKALLTESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDRGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEQDLVHIIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 2989..3597 + /gene="wzh" + /locus_tag="SPC17F_0004" + /note="HMMPfam hit to PF02811, PHP domain, score 4.6e-36" + gene 3723..4418 + /gene="wzd" + /locus_tag="SPC17F_0005" + CDS 3723..4418 + /gene="wzd" + /locus_tag="SPC17F_0005" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33505.1" + 
/db_xref="GOA:Q4K1B8" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K1B8" + /translation="MMKEQNTIEIDVFQLLKTLWKRKLMILIVALVTGAGAFAYSTFI + VKPEYTSTTRIYVVNRNQGDKPGLTNQDLQAGSYLVKDYREIILSQDALEKVATNLKL + DMPAKTLASKVQVTVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIELLDTRVKRPEDVEDVLKI + PLLGLVPDFDKIK" + misc_feature 3744..4160 + /gene="wzd" + /locus_tag="SPC17F_0005" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 6.2e-55" + misc_feature 4266..4343 + /gene="wzd" + /locus_tag="SPC17F_0005" + /note="PS00217 Sugar transport proteins signature 2." + gene 4428..5117 + /gene="wze" + /locus_tag="SPC17F_0006" + CDS 4428..5117 + /gene="wze" + /locus_tag="SPC17F_0006" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33506.1" + /db_xref="GOA:Q4K1B7" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K1B7" + /translation="MPTLEISQAKLDSVKKAEEYYNALCTNLQLSGDGLKVFSITSVK + IGEGKSTTSANIAWAFARAGYKTLLIDGDIRNSVMLGVFKARNKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFTTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRNCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGVVLNKFDTSVDKYGSY + GNYGDYGKNKK" + gene 5132..6499 + /gene="wchA" + /locus_tag="SPC17F_0007" + CDS 5132..6499 + /gene="wchA" + /locus_tag="SPC17F_0007" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI33507.1" + /db_xref="GOA:Q4K1B6" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K1B6" + /translation="MNGKIVKSSLAIIQSFLVILLTYLLSAVREAEIVSTTAIALYIL + HYFVFYISDYGQDFFKRGYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYF + LTLHALLVYVLNLFIKWYWKRAYPNFKGSKKILLLTATSRVEKVLDRLIESNEVVGEL + 
VAVSVLDKPDFQHDCLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + IDVTVNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHVIAKRIIDIVGALVGLIL + CGLVSIVLVPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYIDGWTIWKDIEILLKTVKVVFM + RDGAK" + misc_feature 5132..5224 + /gene="wchA" + /locus_tag="SPC17F_0007" + /note="Signal peptide predicted for SPC0845 by SignalP 2.0 + HMM (Signal peptide probability 0.902) with cleavage site + probability 0.355 between residues 31 and 32" + misc_feature 5915..6496 + /gene="wchA" + /locus_tag="SPC17F_0007" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 2.5e-160" + gene 6530..7702 + /gene="wchF" + /locus_tag="SPC17F_0008" + CDS 6530..7702 + /gene="wchF" + /locus_tag="SPC17F_0008" + /note="member of homology group 15" + /codon_start=1 + /transl_table=11 + /product="putative rhamnosyl transferase WchF" + /protein_id="CAI33508.1" + /db_xref="GOA:Q4K1B5" + /db_xref="InterPro:IPR001296" + /db_xref="InterPro:IPR015393" + /db_xref="UniProtKB/TrEMBL:Q4K1B5" + /translation="MKKSVYIIGSKGIPAKYGGFETFVEKLTAFQQDKAIQYYVACMR + ENSAKSGTTEDVFEHNGAICYNVDVPNIGPARAIAYDIAAINRAIEIAKENKDEDPIF + YILACRIGPFIHGIKKKIQAIGGTLLVNPDGHEWLRAKWSAPVRRYWKISEGLMVKHA + ALLVCDSKNIEKYIQEDYIQYQPKTTYIAYGTDTTRSTLKSSDEKVRSWFKEKNVSEN + EYYLVVGRFVPENNYESMIRGFLASNSKKDFVLITNVEQNKFYNQLLAKTGFDKDPRV + KFVGTVYEQELLKYIRENAFAYFHGHEVGGTNPSLLEALASTKLNLLLDVGFNREVGE + QSAIYWKKDELSQVIEKVEQFDAKMIDELDRQSNQRIADYFTWEKIVTDYEKVFKG" + gene 7708..8604 + /gene="wcxG" + /locus_tag="SPC17F_0009" + CDS 7708..8604 + /gene="wcxG" + /locus_tag="SPC17F_0009" + /note="member of homology group 79" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="CAI33509.1" + /db_xref="GOA:Q4K1B4" + /db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4K1B4" + /translation="MAVKLKYDKSDITFLDDDGLKKYQSELLKMISDVFTFFDENGIA + 
YSLSGGSILGAIRHKGFIPWDDDVDINIPRESYDKLFSLFESDNSLSRKYYLQSAKSH + PELGLHVSQIRKKGTVARRKYDHSAEECGISIDLYIVENVYNNPVKRFFQGYTSMFLT + FALASVRETKNHALMKEMFRLEGRKLNYSTGKLMVGWFFGIIPIEKWLNWLDKCNSSC + KDSHTKYVSIPTGRKHFRRETYLRENMNIYKKVPFETLMVNVPVWSEEYLEMFYGKDY + MVVPPVDKREQHLFLELSYGEE" + misc_feature 7825..8526 + /gene="wcxG" + /locus_tag="SPC17F_0009" + /note="HMMPfam hit to PF04991, LICD Protein Family, score + 2.2e-21" + gene 8605..9324 + /gene="abp1" + /locus_tag="SPC17F_0010" + CDS 8605..9324 + /gene="abp1" + /locus_tag="SPC17F_0010" + /note="member of homology group 57" + /codon_start=1 + /transl_table=11 + /product="putative IspD-family transferase (arabinitol) + Abp1" + /protein_id="CAI33510.1" + /db_xref="GOA:Q4K1B3" + /db_xref="InterPro:IPR001228" + /db_xref="UniProtKB/TrEMBL:Q4K1B3" + /translation="MKVAILTASGIGSRIGQDIPKQFIHVENKPVIIYTLEKFQNHPE + IDEICIVILKGWEQMVKAYAEQFGITKLKMITLGGKSGQESIYNGLREVKKAHPNEDV + TVLIHDGNRPLVSNDIISNALATYQQFGNAVAAIPTTEVVFVLENPQSTSSTEALNRD + LLRRTQTPHVYHLDNILSLHEKALENGITDVAASCQLMQLFGEKSYFSLGTEKNLKIT + TVEDLDIFKALLSSTRDKWIK" + misc_feature 8611..9300 + /gene="abp1" + /locus_tag="SPC17F_0010" + /note="HMMPfam hit to PF01128, Uncharacterized protein + family UPF0007, score 2e-15" + gene 9327..10382 + /gene="abp2" + /locus_tag="SPC17F_0011" + CDS 9327..10382 + /gene="abp2" + /locus_tag="SPC17F_0011" + /note="member of homology group 58" + /codon_start=1 + /transl_table=11 + /product="putative dehydratase/epimerase (arabinitol) + Abp2" + /protein_id="CAI33511.1" + /db_xref="GOA:Q4K1B2" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K1B2" + /translation="MTLLLNKIYRQDVESSLETIVNINDLNGKSILITGASGLIGSSV + IDQLLLLNEIRNFNIKIFCCGRKFESLEKRFGRQTEYLRFVFYDATKAPHFDFAVDYI + IHAASPASPELYVNQPVETMASNFLGMYNLLTYAKNAKVSNLVYISSSEVYGIGTSNN + PLEESYIGTVDHLSVRSSYASSKRATETLCASFASEYGIKIMIVRPGHIYGPSAKKSD + NRVSSFFMIEAIAGRDIIMKSTGSQLRSYCYSLDCASAILSVLLSGESGQAYNVSNPN + SIITIKQMAEIISRVGNVKLTMDIPSDQDIKQTNPMQNAGLSSDKLEELGWQGHFTAE + 
ESFQHTFNILKELSSEK" + misc_feature 9414..10364 + /gene="abp2" + /locus_tag="SPC17F_0011" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.00091" + misc_feature 9417..10175 + /gene="abp2" + /locus_tag="SPC17F_0011" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.001" + misc_feature 9417..10145 + /gene="abp2" + /locus_tag="SPC17F_0011" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 3.7e-44" + misc_feature 9420..10232 + /gene="abp2" + /locus_tag="SPC17F_0011" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 0.00011" + gene 10372..11355 + /gene="wciP" + /locus_tag="SPC17F_0012" + CDS 10372..11355 + /gene="wciP" + /locus_tag="SPC17F_0012" + /note="member of homology group 97" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33512.1" + /db_xref="GOA:Q4K1B1" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K1B1" + /translation="MKSDSILIMMATYNGEEFLREQLDSILCQTISTWELLIRDDNSN + DQTRAIIKEYEEKDRRIKLIENISEYHGAYYNFWGLLNDVRQNENPFDFYMFADQDDI + WDVDKLERLISYYYRKVKTEEPVLIYADMRIIDANGKVIANSMDQLMGIRYTNPISTF + MAHKVYGCNTLFNHELFEILPLLPCYAPELAFLSHDNFTTKIAALKGHVYFYDEPTMS + YRRYGHNVTSKHEYNFTLKRILKRISKIDELAKDHALTYKQTLVATNLLHQQTSIDTE + LLFLDKVEKIIKKGGLNAVKMVWKEKIDWGNRVKTISRSLILASKLYKKYL" + misc_feature 10390..10911 + /gene="wciP" + /locus_tag="SPC17F_0012" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 9.5e-18" + gene 11451..12596 + /gene="wcrT" + /locus_tag="SPC17F_0013" + CDS 11451..12596 + /gene="wcrT" + /locus_tag="SPC17F_0013" + /note="member of homology group 157" + /codon_start=1 + /transl_table=11 + /product="conserved hypothetical protein" + /protein_id="CAI33513.1" + /db_xref="UniProtKB/TrEMBL:Q4K1B0" + /translation="MSKKEIKPICFYLPQFHPIPENDEAHGEGFTEWTNVKKAYPLYD + GHNQPRVPYNNNYYSLLDKEVLIQQAELAKKYGIYGFCYYHYWFKNGKKLLEKPVEMM + LENKDVDIPFCLSWANENWTRRWDGGNHEIIVEQNYDDLNDLEKHVDYLCQFFKDDRY + 
IKIDGKPLLLIYKPELIPNLVKTMEIIRNRARKNGFKDLEIIVQFPKFLLNNHQLELF + DGFAEFQPIFEIHMEKHERKNPVYRSVKSFLLKVGARNLVQKLEIRGEKKVHNKALLD + RRDYDATWTNIINRPIKDNKMIAGAFVDWDNTARNKNGRVFDGANPEKFEGYMRQLIE + KIQKEYQSEIVFINAWNEWAEGAYLEPDKKHGYGYLEALKTVIDETR" + gene 12605..13219 + /gene="wcrU" + /locus_tag="SPC17F_0014" + CDS 12605..13219 + /gene="wcrU" + /locus_tag="SPC17F_0014" + /note="member of homology group 158" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI33514.1" + /db_xref="GOA:Q4K1A9" + /db_xref="InterPro:IPR011004" + /db_xref="InterPro:IPR018357" + /db_xref="UniProtKB/TrEMBL:Q4K1A9" + /translation="MNIRYKLQFRRCKKEWRKKNLHNETTPRTMFPIELVSVGEKTYG + GLYVLSFNKESKLKIGNFCSIAPEVAFILSADHYINQFSTYPFKSKVFDQGDEGVSKG + DIIIEDDVWIGFRSTILSGVTIGQGAIVGAGSVVTKSVPPYAIVGGVPAKVISYRFET + EIREEMKKIDFSEFKLEKFKKVTEELYQPISSIRQINNINEKLK" + misc_feature 12938..13024 + /gene="wcrU" + /locus_tag="SPC17F_0014" + /note="PS00101 Hexapeptide-repeat containing-transferases + signature." + gene 13235..14428 + /gene="wzy" + /locus_tag="SPC17F_0015" + CDS 13235..14428 + /gene="wzy" + /locus_tag="SPC17F_0015" + /note="member of homology group 160" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33515.1" + /db_xref="InterPro:IPR007016" + /db_xref="UniProtKB/TrEMBL:Q4K1A8" + /translation="MFRFQNGTVSINMRGFLMFIAMLIYCQPEYLKSIPVTGRIYRDF + MHVGIMFVTFSYISKKRFPKFFVWLVLLYNSWLTFLTIQNNGDIKRAIFQLLLFTGFV + SMIDIFSENMQDLIESLLFTFEMVVYLNFVTVLFFPDGFFHRVNDAYGITKEWFLGAD + NNFLFTLFPATLIALLYKNLGGVKIRAYSLISIILATQLIKGSGTAKVGIVALILFDL + VPLVKYILTPYRGLVISSTLSFLIVVTGKVEFLRGIVEGILEKDLTFTSRTFIWDNAM + SAIREKPFGYGMMMFTDNVHILGNFPGWIWKGATHAHNNFLQVLFQGGYLGFGVYFLI + ILKGAMLCRKYWDDRNARLLFYGLFIFTIISITENLEMQMMYLVIILPFLLPNILVKE + RGKNE" + misc_feature 14018..14221 + /gene="wzy" + /locus_tag="SPC17F_0015" + /note="HMMPfam hit to PF04932, O-Antigen Polymerase, score + 1.9e-08" + gene 14421..16367 + /gene="wcrV" + /locus_tag="SPC17F_0016" + CDS 
14421..16367 + /gene="wcrV" + /locus_tag="SPC17F_0016" + /note="member of homology group 159" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33516.1" + /db_xref="GOA:Q4K1A7" + /db_xref="InterPro:IPR001173" + /db_xref="InterPro:IPR008441" + /db_xref="UniProtKB/TrEMBL:Q4K1A7" + /translation="MNRGILVSIIVPIYNQEEYLNISLPTLKQQTYKNLEFILVDDGS + TDSSKQIINEYLNADSRFKYVYKENGGLVSATIAGVKEASGDYLAFLDPDDKLGLDYI + ENFIKELDCDYDFIAAGFFYDDGKLIKPYYLKENSVLTQSDIKKLRTDFLSDTGGLAI + SNRVFISRWNKLYKTNLVKEIVKEFRKFEMVSLGEDTIFTFLLLQKAQLGKTIALSNS + YFYNVGNPNSMMKEGAIINYVEKCRIAYQSLTKLLIERNLTNEMSCQLYYFLVLSFFN + RLEKEDMESFKKIYDILKRDSLFLKILFSLQKKANKKQKLQLLMIRLCKSGKQYLNIK + RVVSKLHAKLKLFCQNFKLVRKQIFRKNLVQLAYFLKFQQQRKIGFDDMKVFLPIIEE + RLKEDLLEFQKLEVLPSTIEKNIFVFWWDGFDEIPEIVSICLASLKKNYPECKLHLIY + KDNYQDYTNIHPNILNDFNKGKISVQTFSDVLRFNLLKNNGGMWVDSTIYFTKKIDLF + QELEKCSFSTLNFSTSKDFMSYKGEVCTWSGFMIASHKQGRLVSIINELFERYYLKYN + TFSTYFFIDIVFMLCKVYKLDDNVLDQIILKDGNMFQLASVLDQPFNKSLLPYIEKLP + QKLFLHYEDNNLDNFYKYFKEIVS" + misc_feature 14442..14966 + /gene="wcrV" + /locus_tag="SPC17F_0016" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 2.4e-36" + misc_feature 15510..16358 + /gene="wcrV" + /locus_tag="SPC17F_0016" + /note="HMMPfam hit to PF05704, Capsular polysaccharide + synthesis pro, score 4e-12" + gene 16370..17887 + /gene="wzx" + /locus_tag="SPC17F_0017" + CDS 16370..17887 + /gene="wzx" + /locus_tag="SPC17F_0017" + /note="member of homology group 56" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33517.1" + /db_xref="UniProtKB/TrEMBL:Q4K1A6" + /translation="MSNRLVNTRRNIVWGTLNKLIAIALPFLVRTTLIYQLGIQYVGI + SGLFASILQVLSLADLGFANAIVYSMYKPLAHGDNDTVGALLGFYKKIYRVVGVVILI + AGLLIVPFINYLVKGSYPADINIQLIYLIYLANTVVSYFLFAYKRSLLLASQRKDIFD + NIDSVARIILSGLQILLLFLFPDFYVFALVIPCMTILNNVFNEIVTKKNYNYIVENSN + LDKKVKQEIIEKTKGLFVYKVCGITRNSLDNIFISTFLGITTVGIYSNYYYIMISVKG + FLDVVSTGMSASVGHSVATESVEKNHRDLENLTFGFSWLATWFMTCLLCLFQPFMLLW + 
VGQANILPFSVVVALCFYFYVLAAGDMRSQYIDASGLWDKEKLRSIAETVGNVVLNYI + LVQFLGVLGIVLATALTILFIGIPWSTKIVFDNYFKNGYKKYLWNQAVYAIVTIIVAS + ITYLICTLVGGNNIVVLIIRGIICLFVPNILYYLFFLKNEQTRLFFKIIKSKLLK" + gene 17943..18812 + /gene="rmlA" + /locus_tag="SPC17F_0018" + CDS 17943..18812 + /gene="rmlA" + /locus_tag="SPC17F_0018" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI33518.1" + /db_xref="GOA:Q4K1A5" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q4K1A5" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLHRFQELLQDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFISDDSV + ALILGDNIYHGSGLSKMLQKAASKESGATVFGYHVKDPERFGVVEFDQDMKAISIEEK + PEQPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLTLAQPLKKN + EYGQYLLRLIGEA" + misc_feature 17946..18662 + /gene="rmlA" + /locus_tag="SPC17F_0018" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 4.9e-120" + gene 18813..19406 + /gene="rmlC" + /locus_tag="SPC17F_0019" + CDS 18813..19406 + /gene="rmlC" + /locus_tag="SPC17F_0019" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI33519.1" + /db_xref="GOA:Q7BTQ6" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:Q7BTQ6" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKHHPLLKDVKPLKKEDL" + misc_feature 18849..19379 + /gene="rmlC" + /locus_tag="SPC17F_0019" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 8.8e-16" + gene 19419..20468 + /gene="rmlB" + /locus_tag="SPC17F_0020" + CDS 
19419..20468 + /gene="rmlB" + /locus_tag="SPC17F_0020" + /EC_number="4.2.1.46" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI33520.1" + /db_xref="GOA:Q4K2P4" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K2P4" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPGVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAAD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 19434..20390 + /gene="rmlB" + /locus_tag="SPC17F_0020" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.0001" + misc_feature 19437..20177 + /gene="rmlB" + /locus_tag="SPC17F_0020" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 2.7e-76" + misc_feature 19440..20252 + /gene="rmlB" + /locus_tag="SPC17F_0020" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/iso, score 1.7e-05" + gene 20534..21385 + /gene="rmlD" + /locus_tag="SPC17F_0021" + CDS 20534..21385 + /gene="rmlD" + /locus_tag="SPC17F_0021" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI33521.1" + /db_xref="GOA:Q4K1A2" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K1A2" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAKMDITNEEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAKNRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 
20534..21382 + /gene="rmlD" + /locus_tag="SPC17F_0021" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 1.3e-145" + misc_feature 20537..21172 + /gene="rmlD" + /locus_tag="SPC17F_0021" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.00012" + misc_feature 20537..21166 + /gene="rmlD" + /locus_tag="SPC17F_0021" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 7.7e-18" + misc_feature 20540..21268 + /gene="rmlD" + /locus_tag="SPC17F_0021" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 4.8e-08" + gene order(21448..21528,21532..22615) + /gene="glf" + /locus_tag="SPC17F_0022" + CDS join(21448..21528,21532..21918,21918..22052,22052..22615) + /gene="glf" + /locus_tag="SPC17F_0022" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI33522.1" + /db_xref="GOA:Q4K1A1" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K1A1" + /translation="MYDYLVVGAVFAHEAVLKGKKVKVIEKNHIAGNIYTREEEGIQV + HQYGAHIFHTSDKEIWDYVNQFADFNRYTNSPVANYKGEIYNLPFNMNTFNKLWGVVT + PAEAQAKIDEQRAILNGKTPENLEEQAISLVGTDIYEKLIKDYTEKQWGKPTTETSSL + YYCLPVRLTYDNNYFNDTYQGIPIGGYTQIVEKCWIMKILMVETNVDFFVNKEQYLKD + FPKIVFTGMIDEFFDYKLGELEYRSLRFENETLDMENYQGNAVVNYTDAEIPYTRIIE + HKHFEFGSQAKTIITKEHSKTWEKGDEPYYPVNNDRNNHLYKSYKKLADEQGNVIFGG + RLGHYRYYDMHQVIGAALQCVRNELDSYSMKIKEQTRKLAAGCSKHCFEVADGS" + misc_feature join(21868..21918,21918..22052,22052..22471) + /gene="glf" + /locus_tag="SPC17F_0022" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 3e-90" + gene 22849..>22896 + /gene="aliA" + /locus_tag="SPC17F_0023" + CDS 22849..>22896 + /gene="aliA" + /locus_tag="SPC17F_0023" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33523.1" + /db_xref="UniProtKB/TrEMBL:Q4K1C2" + /translation="MMKSSKLFALAGVTLL" +ORIGIN + 1 
tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcata taaaaacaag + 181 ggatgattgt ataaaaggta gaaatccttt gttttttata accaaggttt ataaactttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga agatgaacat + 301 aaagaagcgt gtccttagtg caggcctgac ttttgcatct gctttgcttt tagctgcttg + 361 cggctaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaactat ctattagact attacgctga taatacagtc aattgaaaca agaacaagac + 481 aaaagaacct cgtaaaaggt attgtaactt ggtaatacct ttttgaggtg ctttttgata + 541 tgagcccatg ttttctcaat aggattgtac tcaggtgagt agggaggaag aggtaaaagt + 601 ttatgcccaa actcttcaca caagagttct aacttaccca ttctatggaa tcttgcatta + 661 tccataataa taaccgatgg tgtggttaat gttggtaaga gaaacttctg aaaccaagct + 721 tcaaaaaagt cgctcgtcat cgtctcttcg taagtcattg gaacgattaa ttcaccattt + 781 gttagacctg caaccaaaga aattctctga tatcttcttc cagatacttt gcctcttatt + 841 aactgacctt ttaatgagcg accatattct cgataaaaat aagtatcgaa tcctgtttcg + 901 tcaatctaaa caggtgctag gtgctttaaa ctattaaaat tcttaagaaa taaggctact + 961 ttttctgggt cttgttcata gtaggtgtgg ttcttttttt cgagtgtagc ccatagcttt + 1021 gagcgcatag tggatggtag ttggatgaca gccaaattca gaagctattt cagtcaaata + 1081 agcgtctgga ttgtcagtaa gatagttttt aagtctatct ctatcaactt ttcttggttt + 1141 tgttcctttt acttggtggt ttagctctcc tgttttctct tttagcttta accagccata + 1201 aatggtatta cgtgagattt ggaaaacgtg tgacgcttct gttatactac ctgttcgctc + 1261 acaataagag agaacttttt tacgaaaatc tattgaatat gccataaaaa gattatacca + 1321 cattgtgtac tatattagat tgaaactaga atagtacaca tctgcttcta aaacattgtt + 1381 agaaatcgat ttgactgtcc ttatttcatt ttattatatt tttggttcgc gggaagtcta + 1441 ctaagatact taaagatgca gatagtgaaa ataaaggtgt agacattacc gtaaaaaagt + 1501 gatataatcg tatgatgttc aatgtatagg tgttaatcat gagtagacgt tttaaaaaat + 1561 cacgttcaca gaaagtgaag cgaagtgtta atatagtttt gctgactatt tatttattgt + 1621 tagtttgttt tttattgttc ttaatcttta agtacaatat 
ccttgctttt agatatctta + 1681 atctagtggt aactgcgtta gtcctactag ttgccttggt agggctactc ttgattatct + 1741 ataaaaaagc tgaaaaattt actatttttc tgttgctgtt ctctatcctt gtcagctctg + 1801 tgtcgctctt tgcagtacag cagtttgttg gactgaccaa tcgtttaaat gcgacttcta + 1861 attactcaga atattcaatc agtgtcgctg ttttagcaga tagtgatatc gaaaatgtta + 1921 cgcaactgac gagtgtgaca gcaccgactg ggactgataa tgaaaatatt caaaaactac + 1981 tagctgatat caagtcaagt cagaataccg atttgacggt caaccagagt tcgtcttact + 2041 tggcagctta caagagtttg attgcagggg agactaaggc cattgtccta aatagtgtct + 2101 ttgaaaatat catcgagtca gagtatccag actacgcatc gaagataaaa aagatttata + 2161 ccaagggatt cactaaaaaa gtagaagctc ctaagacgtc taaaaatcag tctttcaata + 2221 tctatgttag tggaattgac acctatggcc ctattagttc ggtgtcgcga tcagatgtca + 2281 atatcctgat gactgtcaat cgagatacca agaaaatcct cttgaccaca acgccacgtg + 2341 atgcctatgt accaatcgca gatggtggaa ataatcaaaa agataaatta acccatgcgg + 2401 gcatttatgg agttgattcg tccattcaca ccttagaaaa tctctatgga gtggatatca + 2461 attactatgt gcgattgaac ttcacttcgt ttttgaaatt gattgatttg ttgggtggaa + 2521 ttgatgttta taatgatcaa gaatttactg cccatacgaa tggaaagtat taccctgcag + 2581 gcaatgttca tcttgattca gaacaggctc tcggttttgt tcgtgagcgc tactcactag + 2641 cagatggcga tcgtgaccgc gggcgcaatc aacaaaaggt gattgtagct atccttcaaa + 2701 aattaacgtc aaccgaagca ctgaaaaatt atagcacgat cattaatagc ttgcaagatt + 2761 ctatccaaac aaatatgcca cttgagacta tgataaattt ggtcaatgct cagttagaaa + 2821 gtggagggaa ttataaagta aattctcaag atttaaaagg tacaggtcgg acggatcttc + 2881 cttcttatgc aatgccagac agtaacctct atgtgatgga aatagatgat agtagtttag + 2941 ctgtagttaa agcagctata caggatgtga tggagggtag atgaaatgat agacatccat + 3001 tcgcatatcg tttttgatgt agatgacggt cccaagtcaa gagaggaaag caaggctctc + 3061 ttgacagaat cctacaggca gggggtgcga accattgtct ctacctctca ccgtcgcaag + 3121 ggcatgtttg aaactccgga agagaagata gcagaaaact ttcttcaggt tcgggaaata + 3181 gctaaggaag tggcgagtga cttggtcatt gcttacgggg ctgaaattta ctacacacca + 3241 gatgttctgg ataagctgga aaaaaagcgg attccgaccc tcaatgatag tcgttatgcc + 3301 
ttgatagagt tcagtatgaa cactccttat cgcgatattc atagcgcctt gagcaagatc + 3361 ttgatgttgg gaattactcc agtcattgcc cacattgagc gctatgatgc tcttgaaaat + 3421 aatgaaaaac gcgttcgaga actgattgat aggggctgtt acacgcaagt aaatagttca + 3481 catgtcctca aacccaaact ttttggcgaa cgttataaat tcatgaaaaa aagagctcag + 3541 tattttttag agcaggattt ggttcatatc attgcaagtg atatgcacaa tctagacggt + 3601 agacctcctc atatggcaga agcatatgac cttgttaccc aaaaatacgg agaagcgaag + 3661 gctcaggaac tttttataga caatcctcga aaaattgtaa tggatcaact aatttaggag + 3721 aaatgatgaa agaacaaaac acgatagaaa tcgatgtatt tcaattactt aaaaccttgt + 3781 ggaaacgcaa gctaatgatt ttaatagtgg cacttgtgac aggtgcgggg gcttttgcat + 3841 atagcacttt tattgttaag ccagaatata cgagtaccac gcgaatttac gtagtgaatc + 3901 gcaatcaagg agacaagccg gggctgacaa atcaggattt gcaggcagga tcttatctgg + 3961 taaaagacta ccgtgagatt atcctttcgc aggatgcatt ggaaaaagta gcgacaaatt + 4021 tgaagttgga tatgccagca aaaacgttag ccagcaaagt tcaagtgact gtaccagctg + 4081 acactcgtat cgtctcaatc tctgtcaagg ataaacagcc agaggaagcc agtcgtatcg + 4141 ctaattctct acgagaagtt gctgcagaaa agatcgtcgc tgtaacgcga gtatctgatg + 4201 taacgacact tgaagaagcg cgaccagcta cgactccctc ttctccaaat gttcgacgca + 4261 attccttgtt tggttttctt ggaggagcag tcgtaacagt aattgctgtt cttttgattg + 4321 agttgctgga cacccgtgtg aaacgtcctg aagatgttga agatgtactg aaaattccac + 4381 ttttagggct cgttccagat tttgacaaaa taaaatagga ggaagttatg ccaacattag + 4441 aaatctcaca ggcaaaattg gattctgtaa aaaaggcaga ggaatattat aacgctttgt + 4501 gcacgaacct acagttaagt ggagatggtt tgaaagtatt ttctatcact tctgtgaaaa + 4561 taggagaagg aaaatcaacg acttccgcca atatcgcttg ggcttttgcg cgtgcaggtt + 4621 acaaaacgct gctgattgat ggagatattc gcaattctgt tatgttaggt gtctttaaag + 4681 caaggaataa gattacaggc ctgacagaat ttttatcagg aactacagac ttatcacaag + 4741 ggctttgtga taccaatatc gaaaatctct ttgtaattca ggctggctct gtgtcaccga + 4801 atccgacagc tcttcttcaa agtaagaatt tcactacaat gcttgaaacc ttgcgtaaat + 4861 attttgacta catcattgta gatactgctc ctgttggtgt cgtgattgat gcggctatta + 4921 ttacgcgaaa ctgcgatgct 
tctattttag tgacggaggc aggtgaaata aatcgacggg + 4981 atattcaaaa agcaaaagaa cagttggaac acacagggaa gccgtttttg ggagttgtgt + 5041 tgaataaatt cgatacttca gtagacaaat acggttctta tggaaattat ggagattacg + 5101 ggaaaaataa aaaataggtc gggggataga gatgaatgga aaaatagtaa agtcttcatt + 5161 ggccataatc cagagttttc ttgttatttt attgacttat ctacttagtg ctgtgagaga + 5221 agcggagatt gtttcaacaa cagctattgc actttatatc ctccattatt ttgtctttta + 5281 tatcagtgat tatggacagg atttctttaa aaggggatat ttgattgaac ttgtccagac + 5341 attgaaatat atcctattct ttgcactagc gattagtatt tctaattttt tcttagagga + 5401 tcgatttagt atttccagac gaggcatgat ttacttcctc acattacatg ctctcttagt + 5461 ctatgtgcta aacctattta tcaagtggta ttggaagcgg gcttatccca actttaaagg + 5521 aagtaagaag attctcctac ttacagcaac ttctcgtgtc gaaaaggtac tggatagatt + 5581 aatagaatca aatgaggttg ttggggagtt ggtagccgtc agtgtcttag ataaaccaga + 5641 ttttcagcat gattgtttaa aggtagtagc agagggggag atagtaaact ttgcgactca + 5701 tgaggtggtc gatgaagtct ttatcaatct tccaagtgaa aaatacaata ttggagagct + 5761 tgtctctcag tttgaaacga tgggaattga tgtaacagtc aatctaaatg cttttgatcg + 5821 tagtttagca cgtaacaagc aaattcgtga gatggcagga ttaaacgttg tgactttttc + 5881 tacaacattt tataagacta gtcatgtaat tgctaagcgg attattgata tcgtgggtgc + 5941 attggtaggg ctgatactat gtggtttagt cagtattgta ctggttcctt tgattcgaaa + 6001 ggatgggggc tctgctattt ttgctcagac gcgtatagga aaaaatggtc gtcagttcac + 6061 tttttataag tttcgctcta tgtgtgtaga tgccgaggcg aaaaaaagag aactcatgga + 6121 acaaaatacc atgcagggtg gaatgtttaa ggtggacgat gatcctcgta tcacgaaaat + 6181 tggtcgtttt atacggaaga ctagcttgga cgagctacca cagttttaca atgttctaaa + 6241 gggagatatg agcttggtag gtacacgacc accaacagtg gacgagtatg agcactatac + 6301 cccagaacaa aaacgccgac taagttttaa acctggcata acaggtttat ggcaggtcag + 6361 cggacgaagt gaaatcaaga atttcgatga agttgtcaaa ttagatgtgg cctatattga + 6421 tggttggaca atctggaaag atattgaaat tttattgaaa acagttaaag ttgtatttat + 6481 gagagatgga gcgaagtaat ttctgtatat ccatcatatt aggagagaaa tgaaaaagtc + 6541 agtttatatc attggttcaa aaggaattcc tgctaagtat 
ggaggatttg aaacttttgt + 6601 tgaaaaatta acagccttcc aacaagataa ggctatccaa tattatgtgg cttgtatgcg + 6661 tgaaaactct gcaaaatcag ggactactga ggatgttttt gaacataatg gtgctatctg + 6721 ttataacgtc gatgttccta atattggtcc agcgcgagct atagcgtatg atatcgctgc + 6781 aattaacaga gctattgaaa ttgccaaaga aaataaggat gaagatccaa tcttctatat + 6841 tttagcttgt cgaatcggtc cgttcatcca tggaattaag aaaaaaatcc aggcgatagg + 6901 tgggactctt ctagttaatc cagatggtca cgagtggtta cgagctaagt ggagcgctcc + 6961 agttcgtcgt tattggaaaa tttccgaagg tcttatggtc aaacatgcag ctcttttagt + 7021 gtgtgatagt aagaatattg aaaaatatat ccaagaagat tatatacagt atcaacctaa + 7081 gacaacctat atcgcttatg ggaccgatac aacacgctct acattaaaga gtagtgatga + 7141 aaaagtacgt tcttggttca aagagaagaa tgtttctgag aacgagtatt atctagttgt + 7201 aggacgtttt gtaccagaaa acaactatga atctatgatt cgtggctttt tggcgtctaa + 7261 ctctaagaag gactttgtct taatcacaaa tgtagaacag aataaatttt ataatcagtt + 7321 gttggcaaaa actggttttg ataaggaccc acgagtaaaa tttgtaggta cagtctatga + 7381 gcaagagctt ctgaagtata ttcgagaaaa tgcttttgct tacttccacg gacatgaagt + 7441 tggtggaaca aatccttcgt tacttgaagc attagcatcc acaaagttaa acttactact + 7501 cgatgttggt tttaaccgcg aagttgggga gcaaagtgcg atctattgga aaaaagatga + 7561 gctttcccaa gtaatcgaga aagttgaaca atttgatgca aaaatgattg atgagttaga + 7621 tagacaatca aatcagagaa ttgcggatta tttcacttgg gaaaagattg tcacagacta + 7681 cgagaaagta tttaaaggtt agagttaatg gcagtaaaat taaaatatga taaatcagat + 7741 attacatttt tagatgatga cggattgaaa aaataccaat cagaattgtt gaaaatgata + 7801 tcagatgtgt ttactttttt tgatgaaaat gggatagcgt attctttaag tggaggtagc + 7861 attttagggg caatccgtca taaagggttt atcccttggg atgatgatgt tgatatcaat + 7921 attccgaggg aaagttacga taaactattt tctctatttg agtcagacaa tagtcttagt + 7981 cgtaaatatt atcttcaatc agcaaaaagt catccagaat tgggacttca tgtttctcaa + 8041 attagaaaaa aaggaacagt tgctcgtagg aaatacgatc attcggctga ggagtgcggt + 8101 atttctatag atctttacat tgtagaaaat gtatacaata atccagtgaa acgattcttt + 8161 caaggttata caagtatgtt tttgactttt gccttggctt ctgtacgaga aacaaagaat + 8221 
catgccctga tgaaggaaat gtttagactg gaaggtagaa aactaaatta ttcaactgga + 8281 aagttaatgg ttggttggtt ttttggaatt attccaattg aaaagtggtt gaattggctt + 8341 gataaatgta attcaagctg taaggattca catacaaaat atgtatccat acctacagga + 8401 aggaaacact ttagacgcga gacttacttg cgagagaata tgaatattta taaaaaggtt + 8461 ccttttgaaa ctttgatggt gaatgttcct gtttggtcag aagagtattt agaaatgttt + 8521 tacggtaaag attatatggt cgttcctcct gttgataaga gagagcaaca tttgttttta + 8581 gagttgagtt acggagaaga ataaatgaaa gtagcgattt taacagcttc aggcattgga + 8641 agccgaattg gtcaagatat ccctaaacaa tttattcatg ttgaaaataa gccagtcatt + 8701 atctataccc ttgaaaaatt tcaaaatcat ccagaaattg atgaaatctg tattgtcatt + 8761 ttaaaaggct gggagcagat ggttaaagct tatgcggaac aatttggaat tacaaagtta + 8821 aagatgataa ctttgggagg gaagtctggt caagaatcaa tttataacgg tcttagagaa + 8881 gttaagaaag ctcatcccaa tgaggatgtg actgtattaa ttcatgacgg gaatcgtcct + 8941 ttagtgagca atgatattat tagcaacgct ttagcaacat accaacagtt tggaaatgct + 9001 gttgcagcga taccaacgac tgaggtagta tttgttttag aaaacccaca atcaacttcg + 9061 tccacagaag cattgaatcg tgacttgttg agacgaacac aaactcctca tgtttaccat + 9121 cttgataata ttctatcgct tcatgaaaaa gcattagaaa atgggataac tgatgttgca + 9181 gcatcatgcc aactcatgca actatttggt gaaaagagtt atttctctct tggaacagag + 9241 aaaaacttga aaattacgac tgtagaagat ctcgatattt ttaaagcctt attgagttca + 9301 actcgagata agtggattaa atagtaatga cattattatt aaataaaata tatagacaag + 9361 atgtagaatc ttctctagaa acaatcgtca atattaatga cttgaatggc aagtcaattt + 9421 taattactgg agcttctggt ttgattggtt caagtgtcat tgaccagtta ttattgctaa + 9481 atgaaataag gaattttaac attaaaattt tttgttgtgg aagaaagttt gaatcattag + 9541 aaaaacgatt tggtagacaa acagagtatt tacgctttgt gttctatgat gcgactaaag + 9601 cacctcactt tgattttgca gtggactaca ttattcatgc tgctagtcct gctagtcctg + 9661 aattatatgt taatcagcct gtagaaacaa tggctagtaa ttttctgggc atgtataatc + 9721 tactgacata cgcaaaaaat gctaaagttt caaatctagt ttatatctca tctagtgaag + 9781 tttatggaat tggcaccagt aataatcctt tggaggagag ttatattgga actgttgatc + 9841 atcttagcgt acgttcttcg 
tatgctagtt ctaagagagc tactgaaaca ctttgtgcta + 9901 gttttgcttc cgagtacggg atcaaaatca tgatagtaag accaggacac atatatggcc + 9961 ctagtgccaa gaaaagtgat aatcgtgtat catcattttt tatgatagaa gcgattgctg + 10021 gtcgtgatat cattatgaaa agtacaggga gtcagttgag atcgtattgt tatagtttgg + 10081 attgtgctag tgctatttta agtgttctcc tttcgggtga atcagggcaa gcttataatg + 10141 tttccaatcc aaattcaatt attactataa aacagatggc tgaaattatt tctcgagttg + 10201 gcaatgtgaa actcaccatg gatattccta gtgaccaaga tattaagcag actaatccta + 10261 tgcagaacgc cggtctaagc agtgataagc tagaagaatt aggatggcaa ggacatttta + 10321 cagctgagga aagttttcaa catacattta atattttaaa ggagttatcc agtgaaaagt + 10381 gatagcattt taatcatgat ggctacctac aacggagaag aatttcttcg tgaacagttg + 10441 gatagtatcc tttgtcaaac catctcaact tgggaactac tgattcgtga tgataattcc + 10501 aatgatcaaa caagagcaat tattaaagaa tacgaagaaa aagatagacg gattaaattg + 10561 attgaaaaca tatcggaata tcatggagcc tattataatt tttgggggtt attaaacgat + 10621 gttagacaaa acgaaaatcc atttgatttc tatatgtttg ctgatcagga tgatatctgg + 10681 gatgtggaca aattagaacg tttaattagt tattactata gaaaagttaa aacagaagaa + 10741 ccggtattga tttacgctga tatgcggatt atagatgcta acggtaaagt gatagctaat + 10801 agtatggatc aattgatggg aattcggtat accaatccta tctcaacttt tatggctcat + 10861 aaggtttatg gatgtaatac gttatttaat catgaattat ttgaaatctt acccctcctt + 10921 ccatgttatg ctccagaatt agccttccta tcacatgata actttacaac aaaaattgct + 10981 gcattgaaag ggcatgtgta tttttatgat gagcctacta tgagttatag acgatatggg + 11041 cataatgtta caagtaaaca tgagtataac tttacattga agcgaatctt aaaacgtatc + 11101 tcgaaaattg atgaattagc taaagatcat gccttgactt acaagcagac cttagtcgct + 11161 acaaatttgt tacatcaaca aacaagtatt gacactgaac tcctattttt agataaggta + 11221 gaaaaaataa tcaaaaaagg tggattaaat gctgtaaaaa tggtttggaa agaaaaaatt + 11281 gattggggaa atcgtgttaa gactataagc aggtctctga ttttagcgtc aaaattatat + 11341 aagaaatatt tataaaagat atttaaatac aaaaactctg ttttttatat gtcacaacta + 11401 agaacaactt tcaaattaaa gtgatttaat aaaaatttaa aggaataata atgtcaaaaa + 11461 aagaaatcaa accaatttgt 
ttttacttac cgcaatttca tcccatccca gagaatgatg + 11521 aggctcatgg agaaggattt actgaatgga ctaatgtaaa gaaagcctat ccactttatg + 11581 acgggcataa tcaaccacga gttccataca ataataatta ttatagtcta ttagataaag + 11641 aagtcttgat tcaacaggca gaattggcta aaaagtatgg aatttacgga ttttgttatt + 11701 atcattactg gtttaaaaat ggtaaaaaac tattagaaaa accagtagaa atgatgctag + 11761 aaaacaagga tgttgatata cctttttgtt tgagttgggc aaatgaaaac tggactaggc + 11821 gttgggatgg agggaatcat gaaatcattg ttgaacaaaa ctatgacgac ttaaatgatt + 11881 tggagaaaca tgtggattat ctgtgtcaat tttttaaaga tgaccgatat attaagattg + 11941 acgggaaacc gctcttgttg atttataagc cagagctaat tccaaattta gtaaagacaa + 12001 tggaaattat cagaaatcgt gctcgaaaga atggctttaa ggatttagag attattgtac + 12061 agtttccaaa gttcttgtta aataatcatc agcttgagtt atttgatgga tttgcagaat + 12121 tccaaccgat ttttgagatt catatggaaa agcacgagag aaaaaatcca gtttaccgat + 12181 ctgtgaaatc ttttctactt aaagttgggg ctcgaaattt agtacaaaaa cttgagatta + 12241 gaggtgaaaa aaaggtgcat aataaagctc tcttagatag gagagattat gatgcaacat + 12301 ggactaatat tattaatcgc ccgattaagg ataataagat gattgctggt gcttttgttg + 12361 attgggataa taccgctaga aataagaatg ggcgagtttt cgatggagct aatccagaaa + 12421 aatttgaagg ttacatgcga caactaattg aaaaaattca aaaagagtat caatcagaaa + 12481 ttgtttttat aaacgcatgg aatgaatggg cggaaggagc ataccttgag cctgataaaa + 12541 aacatggata tggctatcta gaggccttga agacagttat agacgagaca aggtaggaaa + 12601 agctatgaat attcgttata aacttcaatt tcgacgatgt aaaaaagagt ggcgaaaaaa + 12661 gaaccttcat aatgaaacaa cgcctcgaac tatgttccca atagaattgg tttcagtagg + 12721 ggaaaaaacc tatggtggtt tgtatgtttt gtccttcaat aaagagtcaa aattaaaaat + 12781 tggaaatttc tgctccattg caccagaggt tgcttttatt ctcagtgctg atcattatat + 12841 caatcagttc tctacgtatc cgttcaaatc taaagtattt gatcaaggtg atgaaggggt + 12901 ttcgaaaggg gatattatca ttgaggatga tgtatggatt ggttttcgtt ctacaattct + 12961 ttcgggagtt acaattggtc agggagctat tgttggagca ggatctgtgg taactaaatc + 13021 agttcctcct tacgctattg taggtggagt tccagcaaaa gtgatttctt atcgattcga + 13081 aacagagatt cgtgaagaaa 
tgaaaaaaat tgacttttcg gagttcaaat tagagaaatt + 13141 taaaaaggtt acggaagagt tgtatcagcc aatttcgtca ataagacaaa ttaataacat + 13201 aaatgaaaaa ttgaaataga gtcggaggag ttgcatgttt cgttttcaga atgggacagt + 13261 atcaataaac atgagaggat ttctgatgtt cattgcaatg ctcatttact gtcaaccaga + 13321 atatttgaaa tcaattccag ttacgggacg tatttataga gatttcatgc atgtaggaat + 13381 tatgtttgtg acgttttcgt acatttcaaa aaaacggttt ccaaaatttt ttgtatggct + 13441 agttcttcta tataactctt ggcttacttt tttaactatt caaaataacg gagatataaa + 13501 aagggcgata tttcaactct tgctgtttac aggctttgta tctatgatag acatattctc + 13561 tgaaaatatg caggatttaa tagaatcatt gttattcact tttgagatgg ttgtgtatct + 13621 aaactttgtc actgtactat ttttcccaga tggttttttc catcgtgtaa atgatgcata + 13681 cggaataaca aaagaatggt ttttgggagc tgataataat tttctattta ccttgtttcc + 13741 tgcaacactt atagctttat tgtataagaa tttaggtgga gtaaaaatca gagcatattc + 13801 attgatttca atcattttag ctactcaatt gattaaagga tcgggaacgg caaaggttgg + 13861 gattgttgcg ttgatactat ttgatttagt acctcttgtc aaatacatac ttacccctta + 13921 cagaggtttg gttatatcgt ctacgttgag ttttctaatt gtagttactg gtaaagtgga + 13981 atttttaaga gggattgttg aaggtattct agaaaaagat ttgacgttca cttcccgaac + 14041 ttttatttgg gataacgcta tgtcagcaat tcgagagaag ccatttggtt acggaatgat + 14101 gatgttcact gataacgtcc atatattagg gaattttcct ggttggattt ggaaaggagc + 14161 cacccatgct cataataact ttcttcaagt tttatttcag ggaggatatt taggatttgg + 14221 tgtttatttt ttaataattc taaagggagc aatgctatgt cgcaaatatt gggatgatag + 14281 aaatgcgaga ctactctttt atggactttt tatttttaca ataatatcta taacagaaaa + 14341 cttagagatg cagatgatgt atttggtgat tatactaccg tttttattgc ctaatatatt + 14401 ggttaaagaa aggggaaaaa atgaatagag gtattttggt atcaataatt gttcctatct + 14461 ataatcaaga agaatattta aatatttctt tacctacttt gaagcagcag acgtataaga + 14521 atttagaatt tatcttagta gatgatggtt cgacagatag tagcaaacag ataattaacg + 14581 agtatcttaa tgcagacagt agatttaaat atgtgtataa agaaaatgga ggcttagtat + 14641 ctgctacaat tgcaggggtg aaagaggctt cgggagacta tcttgctttt ttagatccag + 14701 atgataagtt aggattggac 
tatatagaaa acttcatcaa agaattggat tgtgactatg + 14761 atttcatagc ggcaggtttt ttctatgacg atggtaagtt aattaaacca tattacttga + 14821 aagagaattc agtcttgact caatcagata taaagaagtt aagaacggac tttttgtcgg + 14881 atacaggcgg gttagctatt tcaaatcgtg tttttatctc aagatggaat aaattatata + 14941 agacaaatct tgtaaaagaa attgtcaaag agtttcgtaa atttgaaatg gttagcttgg + 15001 gtgaagatac tatttttaca tttttacttc tacaaaaggc tcaattaggg aaaaccattg + 15061 ccctatctaa ttcttatttt tataatgtag gtaatcctaa ctcaatgatg aaggaaggag + 15121 ctattataaa ctatgttgaa aaatgtagga tagcatatca gagtcttact aagctactta + 15181 tagaaagaaa tttgactaat gaaatgagtt gtcaacttta ctatttctta gtgctttctt + 15241 tcttcaatcg cttagagaaa gaagatatgg agtctttcaa aaaaatatat gatattttga + 15301 aaagggattc actattttta aaaattctat tttcacttca aaagaaagca aataaaaaac + 15361 aaaaacttca gctattgatg attcgtctat gcaaaagtgg gaaacagtac ttaaacatta + 15421 aaagagtagt ttcaaaactc catgcaaaac ttaagttgtt ctgtcagaat tttaagttag + 15481 tgaggaaaca gatttttagg aagaatctag ttcaattagc ttatttttta aagttccaac + 15541 aacaacggaa aattggtttt gatgatatga aggtgttttt accgataatt gaagaaagat + 15601 taaaagaaga tttattggaa tttcaaaaat tagaagtatt accttcaaca attgaaaaga + 15661 atatttttgt tttttggtgg gatggctttg atgagatacc tgaaatagta agtatttgct + 15721 tagcatcttt aaaaaagaat tatccagagt gtaagttaca tctaatttat aaagataatt + 15781 atcaagatta cactaacatt catccaaata tattgaatga tttcaataaa ggaaaaattt + 15841 ctgttcaaac tttttcagat gtactccgat ttaatctact aaaaaataac ggaggaatgt + 15901 gggttgactc cactatatat tttactaaga aaatagattt attccaagaa ttggaaaaat + 15961 gttcattttc aacattgaat ttttcaacta gtaaagattt catgtcctat aagggagaag + 16021 tttgtacatg gtctggattt atgattgctt ctcataaaca gggacgccta gttagtatca + 16081 tcaatgaact ttttgaacgc tactatttaa agtataatac attttctaca tacttcttta + 16141 tagatattgt tttcatgctc tgtaaagttt acaaactaga tgacaatgtg ttagatcaaa + 16201 tcattttgaa ggatggaaac atgttccaat tagcttcagt tttagatcag ccgttcaata + 16261 aatctctatt gccatacata gaaaaactcc cgcaaaaact atttttgcat tacgaggata + 16321 ataatttgga taatttttac 
aaatacttta aagaaatagt gagttaacca tgagtaatag + 16381 acttgttaat actagaagaa atattgtttg gggaacatta aataagctta ttgcgattgc + 16441 tttaccattt ttagttcgaa caactttgat ttatcaatta gggatacaat atgtcggtat + 16501 tagtggactt tttgcatcta ttttacaagt tcttagttta gctgatttag gtttcgctaa + 16561 tgcaattgta tatagtatgt ataaacctct tgcccatggg gataatgaca ctgtcggtgc + 16621 acttctagga ttttataaaa aaatatatcg agtcgtcggg gtggtaatat taattgcggg + 16681 ccttttaatt gtgcccttta taaattactt agtaaagggt tcctatcctg cagatatcaa + 16741 tatacaacta atttacttaa tttatctggc aaatacagtt gttagttact ttctttttgc + 16801 ttataaacgc tctttattgt tagctagtca acgaaaagat atatttgaca acattgattc + 16861 agttgctcgc ataattttaa gtggattaca aattttatta ttgtttcttt ttcctgattt + 16921 ctatgttttt gctttagtaa ttccctgtat gacaatcctt aataatgtat ttaacgaaat + 16981 cgtgactaag aaaaattaca attatatcgt tgaaaatagt aacttagata aaaaagttaa + 17041 acaagaaatt attgaaaaaa caaagggatt atttgtctac aaagtatgtg ggattacaag + 17101 aaattccctc gataacatct ttatttctac ttttttaggg attacgacag tgggaattta + 17161 tagtaattat tattacatta tgatatcagt aaaaggtttt ttggatgtgg tttctacagg + 17221 aatgagtgct agtgttggac atagtgttgc tactgaaagt gttgaaaaaa atcatcgtga + 17281 cttagaaaat cttacatttg gtttctcttg gttagctacc tggtttatga catgtttatt + 17341 atgtctgttc caaccattta tgcttttgtg ggtaggacaa gctaatattt taccattttc + 17401 agtcgttgtt gctctctgtt tttactttta tgttcttgct gcaggtgata tgcggagcca + 17461 atatattgac gcctcaggtt tatgggataa agaaaaacta cggtcaattg cagaaacggt + 17521 aggtaatgtt gttttgaatt atattttggt tcaattttta ggtgttttag gaatagtgct + 17581 agctactgca ctaacaattt tgtttattgg aattccatgg agtacaaaaa ttgtgtttga + 17641 taattatttt aaaaatggtt ataaaaagta tttgtggaat caagcagtat atgctatagt + 17701 aactataatt gttgctagta ttacttatct aatctgtaca ctagttggtg gcaataacat + 17761 cgtggtttta attataagag gaataatttg tttatttgtc cccaatattt tatattactt + 17821 attcttttta aaaaatgaac agacgcgtct gtttttcaaa ataatcaagt cgaaattatt + 17881 aaaataattc tatgaaaaat atgtgaatta ccttatgatt aaataataga aggagtttca + 17941 ttatgaaagg tattattcta 
gcaggtggtt cggggacacg tttatatcct ttgactcgcg + 18001 ctgcatcaaa acaacttatg ccggtttatg ataaaccgat gatttactac ccactttcaa + 18061 cattgatgtt ggctgggatt agggatattt tgattatttc cactccacag gatttacatc + 18121 gatttcaaga gcttcttcaa gacggatctg agtttgggat caaactttct tatgcagagc + 18181 aaccaagtcc agatggtttg gcacaagcct ttatcattgg ggaagagttt atttctgatg + 18241 atagcgttgc gctaatctta ggtgataata tctaccatgg ttctgggctt tccaagatgc + 18301 tacaaaaggc agcgagtaag gagtcgggag caactgtttt tggctaccat gtcaaggatc + 18361 cagagcgctt tggtgtggtt gagtttgatc aggatatgaa ggctatttct attgaagaaa + 18421 agccagagca acctcgttca aactatgcag ttacaggtct ctatttctat gataatgatg + 18481 tagtagagat tgccaagagt attaaaccaa gtcctcgtgg tgaactggaa attacagatg + 18541 taaacaaagc ttacctagat cgtggtgatt tgtctgttga gcttatggga cgtggctttg + 18601 cttggctgga tactggaact catgaaagtt tactagaggc ttcacagtac atcgaaacag + 18661 tgcaacggat gcaaaatgtt caggtagcaa acttagaaga aattgcctat cgcatgggtt + 18721 atatcagtcg tgaagatgta ttgaccttag cccaaccact taagaaaaat gaatacggac + 18781 agtatctgct ccgtttgatt ggagaagcat agatgacaga taattttttc ggtaagacgc + 18841 ttgcggcacg caaggttgaa gctattccag gcatgttgga gtttgatatc cccgttcatg + 18901 gagataatcg tggctggttt aaagaaaatt tccaaaagga aaaaatgctt ccgcttggat + 18961 ttccagagtc tttctttgca gaaggaaaat tgcaaaacaa tgtatccttc tcacgtaaaa + 19021 atgtccttcg agggctccac gcagagcctt gggataagta catctctgta gcagatggag + 19081 ggaaagttct gggttcttgg gttgatctac gcgagggtga aacctttggg aatacctatc + 19141 agacagtaat tgatgcaagc aagggaatct ttgttcctcg aggcgtagct aatggcttcc + 19201 aagttctatc agatacagtg tcatatagct atctggtcaa tgattactgg gctctcgagc + 19261 tcaaacccaa gtatgccttt gtgaactacg ctgatccaag ccttggtatt gaatgggaaa + 19321 atattgcaga agcagaggtt tcagaagcag ataaacatca tcccctactt aaggatgtaa + 19381 aacctttgaa aaaagaagat ttgtaaaaag gaaagaatat gactgaatac aaaaatatta + 19441 tcgtgacagg tggagctggc tttatcggtt ctaactttgt ccattatgtt tacgagaact + 19501 ttccaggtgt tcacgtgaca gtcctagata agttgactta tgctggaaat cgcgcgaata + 19561 ttgaggaaat tttaggtaat 
cgtgttgagt tagttgttgg tgacattgct gatgcggagt + 19621 tggtagacaa gttggctgct caagcagatg ctatcgttca ttatgcagcg gaaagccaca + 19681 atgataattc gctcaatgat ccatcgccat ttattcatac taacttcatt ggaacctata + 19741 ctcttttaga agctgctcgt aagtatgata ttcgcttcca ccatgtatcg acagatgaag + 19801 tttatgggga tctcccttta cgcgaagatt tgccaggtca tggagaaggg ccgggtgaga + 19861 aatttacggc tgaaaccaag tacaatccaa gctcgcctta ctcatcaacc aaggcagcct + 19921 cagatttgat tgtcaaagcc tgggtgcgtt cttttggagt caaggcaacg atttccaact + 19981 gttcaaataa ctacggtcct tatcaacata tcgaaaaatt catcccacgt cagattacta + 20041 acatcctaag tggtattaag ccaaaacttt acggtgaagg taaaaacgtt cgtgactgga + 20101 ttcataccaa tgaccattct tcaggagttt ggacaatctt gacaaaaggg caaatcggtg + 20161 aaacctactt gattggggct gatggtgaga agaacaataa ggaagttttg gaacttatcc + 20221 ttaaggaaat gggacaagct gcggatgcct atgatcatgt gactgaccgt gcaggacatg + 20281 accttcgcta tgcgattgat gctagcaagc tccgtgatga gttggggtgg aaacctgaat + 20341 ttaccaactt tgaagctggg ctcaaggcaa caatcaagtg gtatacagat aaccaagaat + 20401 ggtggaaagc agaaaaagaa gctgttgaag ccaattatgc taagactcag gagattatta + 20461 cagtataaaa agcaggaaat agctgctttt tattgctata ttgggaagag ttacatatta + 20521 gaaaggtcta gagatgattt taattacagg ggcaaatggc caattaggaa cggaacttcg + 20581 ctatttattg gatgaacgta atgaagaata cgtggcagta gatgtggcta agatggacat + 20641 taccaatgaa gaaatggttg agaaagtttt tgaagaggtg aaaccgactt tagtctacca + 20701 ttgtgcagcc tacaccgctg ttgatgcagc agaggatgaa ggaaaagagt tggacttcgc + 20761 catcaatgtg acggggacaa aaaatgtcgc aaaagcatct gaaaagcatg gtgcaactct + 20821 agtttatatt tctacggact atgtctttga tggtaagaaa ccagttggac aagagtggga + 20881 agttgatgac cgaccagatc cacagacaga atatggacgc actaagcgta tgggggaaga + 20941 gttagttgag aagcatgtgt ctaatttcta tattatccgt actgcctggg tatttggaaa + 21001 ttatggcaaa aacttcgttt ttaccatgca aaatcttgcg aaaactcata agactttaac + 21061 agttgtaaat gatcagtacg gtcgtccgac ttggactcgt accttggctg agttcatgac + 21121 ctacctagct aaaaatcgta aggaatttgg ttattatcat ttgtcaaatg atgcgacaga + 21181 agatacaaca tggtatgatt 
ttgcagttga aattttgaaa gatacagatg tcgaagtcaa + 21241 gccagtagat tccagtcaat ttccagccaa agctaaacgt ccgctaaact caacgatgag + 21301 cctggccaaa gccaaagcta ctggatttgt tattccaact tggcaagatg cattgcaaga + 21361 attttacaaa caagaagtga gataagtagt agaatgattt tctagtctaa taaaagaggc + 21421 agagaatgaa ctccaaagga gcttaagatg tacgattatc ttgttgttgg tgcagtcttt + 21481 gcccatgaag cagtcttaaa aggaaaaaaa gtaaaagtta ttgaaaaatg aaatcatatc + 21541 gcgggtaata tctatactcg tgaagaggaa ggaattcaag ttcatcaata tggtgctcat + 21601 atcttccata cttctgataa ggagatctgg gattatgtaa atcagtttgc agactttaac + 21661 cgttatacca attctcctgt tgcaaactat aagggtgaga tttataacct tccttttaat + 21721 atgaatacct tcaataaact ctggggagtt gtgacgccag cagaagcaca agctaagatt + 21781 gatgaacaac gtgctatttt aaatggtaaa actcctgaaa atttggaaga acaggcgatt + 21841 tctcttgtag gtacagacat ctacgaaaaa ttaatcaaag actatacaga gaaacagtgg + 21901 ggcaaaccaa ctactgaact tccagccttt attattgttt gccagtacgc ctgacctatg + 21961 ataacaacta ttttaacgat acctatcaag ggattccaat tggtggatac actcaaatag + 22021 ttgaaaaatg ttggatcatg aaaatattga tgtagaaaca aatgttgatt tctttgtgaa + 22081 taaagagcaa tatctgaaag attttcctaa gattgtcttt actggtatga ttgatgaatt + 22141 ctttgactat aagttgggcg aactagagta ccgtagtctt cgttttgaaa atgagacctt + 22201 ggatatggaa aattaccaag gaaatgcagt tgtgaactat acggatgcag aaatcccata + 22261 tactcgcatt attgaacaca aacattttga gtttgggagt caagcaaaga ctatcattac + 22321 taaagaacat tctaaaacat gggaaaaagg tgatgagcct tattatccag ttaataatga + 22381 tcgtaataat catttgtata aatcgtataa aaaacttgct gatgagcaag ggaatgttat + 22441 ctttggtggc cgcttaggac actatcgtta ttacgatatg caccaagtaa ttggagcagc + 22501 tttgcagtgc gtgagaaatg agttagattc atactcaatg aaaattaaag agcaaactag + 22561 gaagctagcc gcaggttgct caaaacactg ttttgaggtt gcagatggaa gctgacgcgg + 22621 tttgaagaga ttttcgaaga gtataaacaa gtaaaactga ctactagtta ttatttagaa + 22681 atagtattaa aaattccttg actatatgat atagttgagg gatttttaaa tgatattcat + 22741 attttttgca aagatgttgt ttgaaaaata attttcaaaa attctgaaaa ttctgttgac + 22801 aactttctga aaagagttta 
taatggagag aaagttttaa aggagaaaat gatgaaaagt + 22861 tcaaaactat ttgcccttgc gggcgtgaca ttattg +// + diff --git a/public/res/serotype_genbank/serotype_18A.gb b/public/res/serotype_genbank/serotype_18A.gb new file mode 100644 index 0000000..ca3eff8 --- /dev/null +++ b/public/res/serotype_genbank/serotype_18A.gb @@ -0,0 +1,985 @@ +LOCUS CR931671 21887 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 8609/43 (serotype 18a). +ACCESSION CR931671 +VERSION CR931671.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 21887) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 21887) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..21887 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="8609/43" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC18A_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC18A_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI33524.1" + /db_xref="UniProtKB/TrEMBL:Q4JZI8" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVELL" + gene 294..467 + /gene="aliB" + /locus_tag="SPC18A_0002" + /pseudo + CDS 294..467 + /gene="aliB" + /locus_tag="SPC18A_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + /db_xref="PSEUDO:CAI33525.1" + gene complement(460..1086) + /gene="tnp" + /locus_tag="SPC18A_0003" + /pseudo + CDS complement(460..1086) + /gene="tnp" + /locus_tag="SPC18A_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase (fragment)" + gene 1297..2742 + /gene="wzg" + /locus_tag="SPC18A_0004" + CDS 1297..2742 + /gene="wzg" + /locus_tag="SPC18A_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33527.1" + /db_xref="GOA:Q4K198" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K198" + /translation="MSRRFKKSRSQKVKRSINIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALFLLVALVGLLLIIYKKAEEFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSEFENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYRSLIAGETKAIVLSSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KMSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTATPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSDLHGKFHFPVGNAHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAIIQKLTST + EVLKDYSSILQGLQDSLQTNMPIETMMDLVNTQLESGGNYKVNSQDLKGTGRMDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1297..1413 + /gene="wzg" + /locus_tag="SPC18A_0004" + /note="Signal 
peptide predicted for SPC0865 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.553 between residues 39 and 40" + misc_feature 1501..1848 + /gene="wzg" + /locus_tag="SPC18A_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 1.3e-60" + misc_feature 2026..2469 + /gene="wzg" + /locus_tag="SPC18A_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 3.8e-69" + gene 2744..3475 + /gene="wzh" + /locus_tag="SPC18A_0005" + CDS 2744..3475 + /gene="wzh" + /locus_tag="SPC18A_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33528.1" + /db_xref="GOA:Q4K197" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K197" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAEAYRQGVRTIVSTSHRR + KGMFETPEEKIATNFIKVREIAKEVADDLVIAYGAEIYYTLDALEKLEKKEIPTLNDS + RYALIEFSMHTSYRQIHTGLSNILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QINSHHVSKPKFFGEKYKFMKKRARYFLERDLVHVVASDMHNLDSRPPYMQQAYDIIA + KKYGAKKAKELFVDNPRKIIMDQLI" + misc_feature 2747..3355 + /gene="wzh" + /locus_tag="SPC18A_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 8.7e-40" + gene 3484..4176 + /gene="wzd" + /locus_tag="SPC18A_0006" + CDS 3484..4176 + /gene="wzd" + /locus_tag="SPC18A_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33529.1" + /db_xref="GOA:Q4K196" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K196" + /translation="MKEQNTLEIDGLQLFRALWKRKLVILLVAIITSSVAFTYSTFVI + KPEFTSTTRIYVVNRNQEEKPGLTNQDLQAGSYLVKDYREIILSQDVLEEVVSGLKLD + LTPKGLANKIEVTVPVDTRIVSVSVNDRVPEEASRIANSLREVAAQKIISITRVSDVT + TLEEARPAISPSSPNIKRNTLIGFLAGGIGTSVIVFLLELLDTRVKRPEDIEDTLQMT + LLGVVPNLNKLK" + misc_feature 3502..3918 + /gene="wzd" + 
/locus_tag="SPC18A_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 6.1e-49" + misc_feature 4024..4101 + /gene="wzd" + /locus_tag="SPC18A_0006" + /note="PS00217 Sugar transport proteins signature 2." + gene 4186..4869 + /gene="wze" + /locus_tag="SPC18A_0007" + CDS 4186..4869 + /gene="wze" + /locus_tag="SPC18A_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33530.1" + /db_xref="GOA:Q4K195" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K195" + /translation="MPTLEIAQKKLEFIKKAEEHYNALCTNIQLSGDKLKVISVTSVS + PGEGKTTTSVNIAWSFARAGYKTLLIDGDTRNSVISGFFKSREKITGLTEFLSGTADL + SHGLCDTNIENLFVVQSGAVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTAPIGIVI + DAAIITQKCDASILVTATGETNKRDVQKAKQQLKQTGKLFLGVVLNKLDISVDKYGVY + GFYGNYGKK" + gene 4885..6252 + /gene="wchA" + /locus_tag="SPC18A_0008" + CDS 4885..6252 + /gene="wchA" + /locus_tag="SPC18A_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI33531.1" + /db_xref="GOA:Q4K194" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K194" + /translation="MDEKGLKIFLAVLQSIVVILLIYFLSFVRETELERSSMVILYLL + HFFVFYFSSYGNNFFKRGYLVEFNSTIRYIFFFAIAISVLNFFIAERFSVSRRGMVYF + LTLEGISLYLLNFLVKKYWKHVFFNLKNSKKILLLTVTKNMEKVLDKLLESDELSWKL + VAVSVLDKSDFQHDKIPVIEKEKIIEFATHEVVDEVFVNLPGESYDIGEIISRFETMG + IDVTVNLNAFDKNLGRNKQIHEMVGLNVVTFSKNLYKTSHVISKRILDICGATIGLIL + FAIASLVLVPLIRKDGGPAIFSQTRIGKNGRHFTFYKFRSMRIDAEAIKEQLMDQNTM + QGGMFKINNDPRVTKIGRFIRKTSLDELPQFWNVFIGDMSLVGTRPPTVDEYDQYTPE + QKRRLSFKPGITGLWQVSGRSKITDFDAVVKLDVAYIDNWTIWKDIEILLKTVKVVFM + RDGAK" + misc_feature 5668..6249 + /gene="wchA" + /locus_tag="SPC18A_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 1.9e-146" + gene 6283..7455 
+ /gene="wchF" + /locus_tag="SPC18A_0009" + CDS 6283..7455 + /gene="wchF" + /locus_tag="SPC18A_0009" + /note="member of homology group 15" + /codon_start=1 + /transl_table=11 + /product="putative rhamnosyl transferase WchF" + /protein_id="CAI33532.1" + /db_xref="GOA:Q4K193" + /db_xref="InterPro:IPR001296" + /db_xref="InterPro:IPR015393" + /db_xref="UniProtKB/TrEMBL:Q4K193" + /translation="MKKSVYIIGSKGIPAKYGGFETFVEKLTAFQQDKAIQYYVACMR + ENSAKSGTTEDVFEHNGAICYNVDVPNIGPARAIAYDIAAINRAIEIAKENNGEDPIF + YILACRIGPFIHGIKKRIQAIGGALLVNPDGHEWLREKWSLPVRKYWKYSERLMVKHA + DLLVCDSKNIEKYIQEDYKQYQPKTTYIAYGTDTTRSILKSSDEKVRSWFKEKNVSEN + EYYLVVGRFVPENNYEAMIRGFLASNSKKDFVLITNVEQNKFYNQLLAKTGFDKDPRV + KFVGTVYEQELLKYIRENAFAYFHGHEVGGTNPSLLEALASTKLNLLLDVGFNREVGE + QSAIYWKKDELSQVIEKVEQFDAKMIDELDRQSNQRITDSFTWEKIVTDYEKLFKK" + gene 7452..8723 + /gene="wciU" + /locus_tag="SPC18A_0010" + CDS 7452..8723 + /gene="wciU" + /locus_tag="SPC18A_0010" + /note="member of homology group 59" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33533.1" + /db_xref="GOA:Q4K192" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K192" + /translation="MKILHYTLGFQPQRTGGLVKYAEDLMIEQIAQGYQVAALCPGRI + KFFSKKIEIIKATSRQFECYELLNSLPIALFGGISDPTAFMTPCDKNVYRTFLEKVQP + DIIHIHSFMGLHKEFLEIAKNLNIRVVFTSHDYYGLAPVPHFYFNGVDYSDKNTNLTW + NIMSSNALSVKKLRLFQVSFYPTIRKLLKLLGKNPKSKKNLVIRDVIEEQDYSELRYY + YNEMFHLIDGYLFNSRLAKKVYEINEIQPANSVVLSITSSSIKHHQRLTTTNNKIRVS + YIGSDEEYKGYFDFIDFAGTLEQESYEVVTYGHLPNEECPSFIEQKGYFTKETIDSVY + ENIDILIIASKCKETFGLITVEALSYGVNVFVSENVGSKDLLPETHVFKDKEDLLAKI + INNQLEKVPLKTMEKHVEEVISYYKQVRSNN" + misc_feature 8226..8696 + /gene="wciU" + /locus_tag="SPC18A_0010" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 0.0002" + gene 8729..9793 + /gene="wciV" + /locus_tag="SPC18A_0011" + CDS 8729..9793 + /gene="wciV" + /locus_tag="SPC18A_0011" + /note="member of homology group 91" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl 
transferase" + /protein_id="CAI33534.1" + /db_xref="GOA:Q4K191" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K191" + /translation="MIKDMSCPEISVIVPVYNVERYLRQCMDSLINQTYRDFEIILVN + DGSTDSSGILCEEWAKKDERIHVVHKKNEGLGFARNTGVEHAKGKYITFVDSDDYVSL + DMLQTLYNAVQEYDVEVVYSAGYYRSFSNGEIKKTDVGTKKPQLFEGGDVASELLPNV + ISAPPEYPNDGKVGVSAWKVLYKANLFKDKGLLFHSEREFISEDAIFQIDCLKLATSA + LVIPDILYYYRENFGSLSMKYKEDRFELDKILYNEQLKRVEGLPNQEILEERIERILI + ANIRLCVFQESLHKSSRIHKRLQRIRQICKDPVSKVVLHHYPIHRLPFPKRLICVLAK + YNMSLFLLALTLLKYRNRSV" + misc_feature 8759..9301 + /gene="wciV" + /locus_tag="SPC18A_0011" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 2.2e-45" + gene 9799..10710 + /gene="wciW" + /locus_tag="SPC18A_0012" + CDS 9799..10710 + /gene="wciW" + /locus_tag="SPC18A_0012" + /note="member of homology group 92" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33535.1" + /db_xref="GOA:Q4K190" + /db_xref="InterPro:IPR008441" + /db_xref="UniProtKB/TrEMBL:Q4K190" + /translation="MGMNIEKLKLSLKNRTFFPVVIHALRNRWPLWWIRSKAIREVQL + EDRAYRILKKKYGSLISNSFDKAYLSEKVPKQIWICWFQGMENAPDLVKSCYRSLKKQ + FPEYVITVISSENIFEYVEIPDILYEKWVNGVIGNAHFSDILRVELLRKFGGIWIDST + VYCTGITTIQIIGKNPFFMYKSVSSVEERISSSNWMIASVPNHPFMITMSKLLQSYWS + KEVIAIHYYLFHILFTIMIESLPELWQLVPTYTNAAPHIMIDELNNVFSKERYQQLCQ + ISDFHKLNYKKNYNDKSESLYSYLLNQ" + misc_feature 9880..10698 + /gene="wciW" + /locus_tag="SPC18A_0012" + /note="HMMPfam hit to PF05704, Capsular polysaccharide + synthesis protein, score 6.1e-139" + gene 10722..12179 + /gene="wzx" + /locus_tag="SPC18A_0013" + CDS 10722..12179 + /gene="wzx" + /locus_tag="SPC18A_0013" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33536.1" + /db_xref="GOA:Q4K189" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K189" + /translation="MPSLKKNIVYNVLYQILAVIVPFITSPYLARVLGAEQIGVYSFT + YSIAFYFMILSMLGISNYGNRTIARVRTSREHLNQEFSNIYAVQLTCSLVMTISYLIY + 
ATVFVNSFQIVAYIQVLHVLSYATDVSWFFYGLEEFRITVARNSFVKLLTLISIFTFV + KSPNDIYLYTFIMAGGTLLGQLITWPFLLKQVNFVCPSLGKIKKHMKPIIILFFPVLA + VSIFSFLDKIMLGMYSSLKETAFYENSDKIISIPKALIQAFGAVMLPRTVHLLSIGDE + QKSLEYVDKTMWAVLVITMGCAFGLAGVSATFAPVYWGEEFRASSQIIAGMTPALVFS + AFGNVIRTQFLIPRSFDKEYTVSLLYGAVVNILINILLIPKIGAMGAVIGTIVAELVL + CCYQTWIARNYLHIREYLINAGILFLIGSVMYMVLILISSILPTSLLTLIIEIIVAAF + IYISLLILHIFSSKNRVIIGLRTNFLERTHLFKRK" + misc_feature 10731..11534 + /gene="wzx" + /locus_tag="SPC18A_0013" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 8.6e-59" + gene 12182..13453 + /gene="wzy" + /locus_tag="SPC18A_0014" + CDS 12182..13453 + /gene="wzy" + /locus_tag="SPC18A_0014" + /note="member of homology group 93" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33537.1" + /db_xref="InterPro:IPR007016" + /db_xref="UniProtKB/TrEMBL:Q4K188" + /translation="MKFKFKFNPIAILYILLVYLELATDRQHLYPVTYMTKYYIGILI + TVLFVLLLVGRGKLIFVNKKLLYLAKILAIPTIVLFLYSVLLDVMNPVEFDGYFSRLS + STTIFGLLAIFQAIVVFQFFGQKVVDYTFTAISLSYLTSIIVAFRQGGLSQFILMLTD + DSFNGSVLEMHEVAPITALFILYYLYKYFIKENSFSSVFRNILIALIILFLSLKRIVF + LSVLIIIPVFLIIYWYDKKVSKLGKERKILSLLNSFSLIFITGIFLYVYSVKSGFIYT + FIQEHNINSMARTDLWKGIESTYSFAPIFMGRGIGFVTKWMDNNWMTLNINGLTESTG + LHNDILKYYIEIGFVGLFIYFYTLLYRNAKRIFVKIGHKESFIYFVLIMFQMLIWFTD + NISTYHNFLWILNLLLFSLTNTDAELETQKL" + misc_feature 13025..13237 + /gene="wzy" + /locus_tag="SPC18A_0014" + /note="HMMPfam hit to PF04932, O-Antigen Polymerase, score + 1.7e-09" + gene 13533..14693 + /gene="wciY" + /locus_tag="SPC18A_0015" + CDS 13533..14693 + /gene="wciY" + /locus_tag="SPC18A_0015" + /note="member of homology group 78" + /codon_start=1 + /transl_table=11 + /product="putative glycerol phosphotransferase" + /protein_id="CAI33538.1" + /db_xref="GOA:Q4K187" + /db_xref="InterPro:IPR007554" + /db_xref="UniProtKB/TrEMBL:Q4K187" + /translation="MKFYIKNLLKKVFTLPLHLLPIQSNKIIFDNFGGRGFGDNPKYI + LEELVSREKNLNLVWVTKDREISIPEGVRVVKYGSYRSFYEWLTARVWVDNIRNSDRP + 
WKRKGQIYLQTWHGSDGVKLIEKSVAGNLKKTYLRMAKYDGKITDGIVSSRHFQTLGM + QNNFWLTENVEFLEFGLPRNDDFFKSEKIKTTNIKFRTLFDIDLDELVVLYMPTFRDD + GSLNAYNLDYSKLIHVFQNKFRKNVKILVRFHPNVDSNFINLQDTDCINVSTYSNPQD + LMMSADVMITDYSSASIDFMLLNRPVFLYLPDYQSYVNDRPLDDNFDKLPFPRAYHNN + ELTEIIRDFERSKYDEKVRLYELEDVRFDRGKASVQCANWIEEKIKNNKVID" + misc_feature 14118..14663 + /gene="wciY" + /locus_tag="SPC18A_0015" + /note="HMMPfam hit to PF04464, + CDP-Glycerol:Poly(glycerophosphate) gl, score 3.3e-68" + gene 14735..15127 + /gene="gct" + /locus_tag="SPC18A_0016" + CDS 14735..15127 + /gene="gct" + /locus_tag="SPC18A_0016" + /note="member of homology group 28" + /codon_start=1 + /transl_table=11 + /product="CDP-glycerol-1-phosphate biosynthetic protein + Gct" + /protein_id="CAI33539.1" + /db_xref="GOA:Q4K186" + /db_xref="InterPro:IPR004820" + /db_xref="InterPro:IPR004821" + /db_xref="InterPro:IPR006409" + /db_xref="InterPro:IPR014729" + /db_xref="UniProtKB/TrEMBL:Q4K186" + /translation="MKRIITYGTFDLLHYGHISLLKRAKQLGDYLIVVVSSDEFNLKE + KNKVCYFNYEHRKNLVEAIRYVDLVIPETSWEQKKSDVKEYHIDTFVMGDDWKGKFDY + LEEEGVEVVYLPRTKEISTTKIKEDLSE" + misc_feature 14747..15115 + /gene="gct" + /locus_tag="SPC18A_0016" + /note="HMMPfam hit to PF01467, Cytidylyltransferase, score + 3.4e-29" + gene 15180..15856 + /gene="HG94" + /locus_tag="SPC18A_0017" + /pseudo + CDS join(15180..15350,15340..15594,15521..15856) + /gene="HG94" + /locus_tag="SPC18A_0017" + /note="member of homology group 94" + /pseudo + /codon_start=1 + /transl_table=11 + /product="hypothetical protein (pseudogene)" + gene complement(order(15740..16110,16139..16444)) + /gene="tnp" + /locus_tag="SPC18A_0018" + /pseudo + CDS complement(join(15740..16066,16063..16110,16139..16444)) + /gene="tnp" + /locus_tag="SPC18A_0018" + /note="member of homology group 19; + member of homology group 19" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1381 transposase" + misc_feature complement(join(15752..16066,16063..16110,16139..16201)) + /gene="tnp" + 
/locus_tag="SPC18A_0018" + /note="HMMPfam hit to PF01609, Transposase DDE domain, + score 7.5e-05" + /pseudo + gene 16838..17707 + /gene="rmlA" + /locus_tag="SPC18A_0019" + CDS 16838..17707 + /gene="rmlA" + /locus_tag="SPC18A_0019" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI33542.1" + /db_xref="GOA:Q4K185" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q4K185" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLPRFKELLQDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFIGDDSV + ALILGDNIYHGPGLSKMLQKAAGKESGATVFGYHVKDPERFGVVEFDQDMKAISIEEK + PEQPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLTLAQPLKKN + EYGQYLLRLIGEA" + misc_feature 16841..17557 + /gene="rmlA" + /locus_tag="SPC18A_0019" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 4.1e-120" + gene 17708..18301 + /gene="rmlC" + /locus_tag="SPC18A_0020" + CDS 17708..18301 + /gene="rmlC" + /locus_tag="SPC18A_0020" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI33543.1" + /db_xref="GOA:Q7BTQ6" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:Q7BTQ6" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKHHPLLKDVKPLKKEDL" + misc_feature 17744..18274 + /gene="rmlC" + /locus_tag="SPC18A_0020" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 8.8e-16" + gene 18314..19363 + /gene="rmlB" + /locus_tag="SPC18A_0021" + CDS 18314..19363 + /gene="rmlB" + /locus_tag="SPC18A_0021" + 
/EC_number="4.2.1.46" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI33544.1" + /db_xref="GOA:Q4K2P4" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K2P4" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPGVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAAD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 18329..19285 + /gene="rmlB" + /locus_tag="SPC18A_0021" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.0001" + misc_feature 18332..19072 + /gene="rmlB" + /locus_tag="SPC18A_0021" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 2.7e-76" + misc_feature 18335..19147 + /gene="rmlB" + /locus_tag="SPC18A_0021" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/iso, score 1.7e-05" + gene 19429..20280 + /gene="rmlD" + /locus_tag="SPC18A_0022" + CDS 19429..20280 + /gene="rmlD" + /locus_tag="SPC18A_0022" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI33545.1" + /db_xref="GOA:Q4K182" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K182" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVTEMDITNEEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 19429..20277 + /gene="rmlD" + /locus_tag="SPC18A_0022" + 
/note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 1.6e-146" + misc_feature 19432..20073 + /gene="rmlD" + /locus_tag="SPC18A_0022" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.00012" + misc_feature 19432..20061 + /gene="rmlD" + /locus_tag="SPC18A_0022" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 1.4e-18" + misc_feature 19435..20163 + /gene="rmlD" + /locus_tag="SPC18A_0022" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 2.9e-08" + gene order(20356..21309,21326..21541) + /gene="tnp" + /locus_tag="SPC18A_0023" + /pseudo + CDS join(20356..21309,21326..21541) + /gene="tnp" + /locus_tag="SPC18A_0023" + /note="member of homology group 12" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1670 transposase" + misc_feature 20362..20805 + /gene="tnp" + /locus_tag="SPC18A_0023" + /note="HMMPfam hit to PF03050, Transposase IS66 family, + score 5.5e-05" + /pseudo + gene 21840..>21887 + /gene="aliA" + /locus_tag="SPC18A_0024" + CDS 21840..>21887 + /gene="aliA" + /locus_tag="SPC18A_0024" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33547.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ89" + /translation="MMKSSKLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcgta taaaaacaag + 181 ggaggactgt ataaaagaca gaaatccttt gttttttata actaaggttt ataaactttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactattt aaggagaaag aagatgaaca + 301 taaagaagcg tgtccttagt gcaggcctga cttttgcatc tgctttgctt ttagctgctt + 361 gcggccaatc aggttcagat acaaaaactt actcatcaac ctttggtgga aatccaacta + 421 catttaacta tctattagac tattacgctg ataacatagt caattgaaac aagaacagga + 481 caaaagagcc tcgtaaaagg tatggcaact tggtaatacc tttttgaggt gctttttgat + 541 ataagcccat gttttctcaa taggattgta ctcaggtgag tagggaggaa gaggtaaaag + 601 
tttatgccca gactcttcgc ataaaagttc tagcttcccc attctatgga atcttgcatt + 661 atccataata tagtagattg aaactagaat agtacacctc tacttctaaa acattgttag + 721 aattcgattt tactgtcctg atcgatttat cttattctta tttcatttta ctataataac + 781 cgatggtatg gttaatgttg gtaagaaaaa cttctgaaac caagcttcaa aaaagtcgct + 841 cgtcatcgtc tcttcgtaag tcattggagc aattaactca ccatttgtta gccctgcaac + 901 caaagaaatc ctctgatatc ttcttccaga tactttgcct cttattaact gaccttttaa + 961 tgagcgacca tattctcgat aaaaataagt atcgaatcct gtttcgtcaa tataaacagg + 1021 tgctaggtgc tttaaactat taaaattctt aagaaataag gctacttttt ctgggtcttg + 1081 ttcataatta gattgaaact agagtagtac acctctgctt ctaaaacgtt gttagaaatc + 1141 ggtttaaccg tcctgttctt atttcatttt actatatttt tgtttcgcgg gaagtctact + 1201 aagatactta aagatgcaga tagtgaaaat aaaagtgtag acattaccgt aaaaaagtga + 1261 tataatcgta taatgttgaa tgtataggtg ttaatcatga gtagacgttt taaaaaatca + 1321 cgttcacaga aagtgaagcg aagtattaat atagttttgc tgactattta tttattgtta + 1381 gtttgttttt tattgttctt aatctttaag tacaatatcc ttgcttttag atatcttaat + 1441 ctagtggtaa ctgcgttatt cctactagtt gccttggtag ggctactctt gattatctat + 1501 aaaaaagctg aagaatttac tatttttctg ttggtattct ctatccttgt cagctctgtg + 1561 tcgctctttg cagtacagca gtttgttgga ctgaccaatc gtttaaatgc gacttctaat + 1621 tactcagaat attcaatcag tgtcgctgtt ttagcagata gtgagttcga aaatgttacg + 1681 caactgacga gtgtgacagc accgactggg actgataatg aaaatattca aaaactacta + 1741 gctgatatca agtcaagtca gaataccgat ttgacggtca accagagttc gtcttacttg + 1801 gcagcttaca ggagtttgat tgcaggggag actaaggcca ttgtcctaag tagtgtcttt + 1861 gaaaacatca tcgagtcaga gtatccagac tacgcatcga agataaagaa gatttatacc + 1921 aagggattca ctaaaaaagt agaagctcct aagatgtcta agaatcagtc tttcaatatc + 1981 tatgttagtg gaattgacac ctatggtcct attagttcgg tgtcgcgatc agatgtcaat + 2041 atcctgatga ctgtcaatcg agataccaag aaaatcctct tgaccgcaac gccacgtgat + 2101 gcctatgtac caatcgcaga tggtggaaat aatcaaaaag ataaattaac ccatgcgggc + 2161 atttatggag ttgattcgtc cattcacacc ttagaaaatc tctatggagt ggatatcaat + 2221 tactatgtgc gattgaactt cacttctttc 
ttgaaaatga ttgacttatt gggaggggta + 2281 gatgttcata atgatcaaga gttttcagat ctacatggga agttccattt cccagtaggg + 2341 aatgcccatc tagactctga gcaagcttta ggttttgtac gtgaacgcta ctcactagcc + 2401 gatggagacc gtgaccgtgg tcgcaatcaa caaaaggtca ttgtagcgat tattcagaag + 2461 ttaacttcta cagaggtctt gaaagactat agtagtattc ttcaaggatt gcaggattct + 2521 cttcaaacaa atatgccgat tgagactatg atggatttag tgaataccca gttggaaagc + 2581 ggagggaatt ataaagtaaa ttctcaagat ttaaaaggga caggtcggat ggatcttcct + 2641 tcctatgcaa tgccagacag taacctctat gtgatggaaa tagatgatag tagtttagct + 2701 gtagttaaag cagctataca ggatgtgatg gagggtagat gaaatgatag acatccattc + 2761 gcatatcgtc tttgatgtag atgatggtcc caagtcaaga gaggaaagta aggctctctt + 2821 ggcagaagcc tacagacagg gggtgcgaac cattgtctct acctctcacc gtcgcaaggg + 2881 catgtttgaa actccagaag aaaaaattgc aacaaatttt attaaggttc gtgaaattgc + 2941 aaaagaagta gcagatgatt tagtcattgc ttatggcgca gagatatact atactctgga + 3001 tgctctagaa aagctagaaa aaaaagaaat tcctaccctt aatgatagtc gttatgcttt + 3061 gattgagttt agcatgcata cttcctatcg tcagattcat acgggattga gcaatatttt + 3121 gatgttggga atcacgccag taattgctca tattgaacgt tatgatgctt tagagaataa + 3181 cgaaaaacgt gttcgtgaac tgattgatat ggggtgctat actcagataa atagccatca + 3241 tgtttcaaaa cctaagttct ttggtgaaaa atataaattc atgaaaaaga gagctcggta + 3301 ttttttggaa cgtgatttag ttcatgtagt tgcaagtgac atgcacaatt tagacagtag + 3361 acctccatat atgcaacagg catatgatat cattgctaag aaatatggag cgaaaaaagc + 3421 gaaagaactt tttgtagata atcccagaaa aattataatg gatcaattaa tttaggagaa + 3481 aatatgaagg aacaaaacac tttggaaatc gatggattgc aactattcag agctttatgg + 3541 aaaagaaagt tagtcatttt attagtggca attataactt cttcagttgc ttttacctac + 3601 agtacttttg ttatcaaacc tgagtttact agtacgactc ggatttatgt agttaaccgt + 3661 aatcaggaag agaagcctgg tttaaccaat caagacttgc aggcaggatc atacttggtt + 3721 aaagactatc gtgaaattat cctatcgcag gatgttttgg aggaagttgt ttctggtttg + 3781 aaactagatt tgacgccaaa aggtttggct aataaaattg aagtaacagt accagttgat + 3841 acccgtattg tctctgtttc agttaatgat cgagttcctg aagaggcgag 
ccgtatcgct + 3901 aactctttga gagaagtagc tgctcaaaaa attattagta ttactcgtgt ttctgatgtg + 3961 acaacactgg aggaggcaag accggcgata tcaccgtctt caccaaatat taaacgcaat + 4021 acactaattg gttttttggc aggggggatt ggaactagtg ttatagtttt tcttcttgaa + 4081 cttttggaca ctcgtgtgaa acgtccggaa gatatcgaag atacactgca gatgacactt + 4141 ttgggagttg taccaaactt gaataagttg aaataggaga gagagatgcc gacattagaa + 4201 atagcacaaa aaaaactgga gttcattaag aaggcagaag aacattacaa tgctttgtgt + 4261 acaaatatac agttgagcgg agataaacta aaagtaattt ccgttacttc tgttagccct + 4321 ggggaaggaa aaacaactac ttccgtaaat atagcatggt cgtttgcgcg tgcaggctat + 4381 aaaactcttt tgattgatgg cgatactcga aattcggtta tatcaggatt ttttaaatct + 4441 cgtgaaaaaa ttacagggct aacagaattt ttatctggga cagctgattt atctcacggt + 4501 ttatgtgata caaacattga aaatttattt gtagttcaat cgggagctgt atcaccaaac + 4561 cctacagcct tgttacaaag taaaaatttt aatgatatga ttgaaacatt gcgtaaatat + 4621 tttgattata tcattgttga tacagcacct attggaattg ttattgatgc ggcaattatc + 4681 actcaaaagt gtgatgcgtc catcttggta acagcaacag gtgagacgaa taaacgtgat + 4741 gtccaaaaag cgaaacaaca attaaaacaa acagggaaac tgttcctagg agttgtttta + 4801 aataaattag atatctcggt tgataagtat ggagtttacg gtttctatgg aaattatggt + 4861 aaaaaataac ttaggaaaga ttttatggat gaaaaaggat tgaaaatttt tctggcagta + 4921 ttacagagta ttgttgtcat tttattgatt tattttctta gctttgttag agagacagaa + 4981 cttgaacgtt cttcgatggt tatactatac cttctccact tttttgtatt ctattttagt + 5041 tcctatggta acaatttttt taaaagaggg tacctagttg agtttaatag tactataaga + 5101 tatatttttt tctttgcaat agctataagt gtattaaact tttttatagc ggaacggttt + 5161 agtgtctcta gaagaggaat ggtatacttc ttaactttag aaggaatatc cttatacttg + 5221 ttaaatttct tagtaaagaa atattggaag catgtgtttt ttaatctaaa aaatagcaag + 5281 aaaattttac tgttaacagt aacgaaaaat atggaaaaag ttcttgataa attgttagaa + 5341 tctgatgaac tttcatggaa attggtagca gtaagtgttt tggataaatc tgattttcaa + 5401 catgataaaa tacctgtaat tgaaaaggaa aaaattattg aatttgcaac gcatgaagtt + 5461 gtggatgagg tgtttgtcaa tcttccagga gagagctacg atattggaga aattatctct + 5521 aggtttgaga 
caatggggat agatgtaact gtaaatctta atgcatttga taagaatttg + 5581 ggtcgcaata aacaaattca tgagatggta ggattgaatg tagtcacttt ctctaaaaat + 5641 ctttataaaa ctagtcatgt gatttcaaag agaattctcg atatttgtgg tgccactatt + 5701 ggccttattc tttttgctat agctagtcta gttttagttc cattgattcg taaagatggc + 5761 ggaccagcta ttttttctca aactcgtata gggaaaaatg gtcgacattt taccttttat + 5821 aaattccgtt cgatgcggat cgatgctgaa gctatcaaag aacagttgat ggatcaaaat + 5881 acgatgcaag gtggtatgtt taagataaac aatgatcctc gtgttacaaa aattggtcgc + 5941 tttattcgta aaaccagttt agatgagtta ccccagtttt ggaatgtctt tataggagat + 6001 atgagcttgg tgggaacacg tccacctaca gtagacgagt atgatcagta tactccagaa + 6061 cagaaacgtc gactcagctt taaacctggt attacaggtt tatggcaggt tagcggccgt + 6121 agtaaaataa ccgattttga cgctgttgta aaattagatg tggcttatat tgataattgg + 6181 acaatctgga aagatattga aattttgctt aaaactgtta aagttgtatt tatgagagat + 6241 ggagcgaagt aatttctgta tatccatcct attaggagag aaatgaaaaa gtcagtttat + 6301 atcattggtt caaaaggaat tcctgctaag tatggaggat ttgaaacttt tgttgaaaaa + 6361 ttaacagcct tccaacaaga taaggctatc caatattatg tggcttgtat gcgtgaaaac + 6421 tctgcaaaat cagggactac tgaggatgtt tttgaacata atggtgctat ctgttataat + 6481 gtcgatgttc ctaatattgg tccagcgcga gctatagcgt atgatatcgc tgcaattaac + 6541 agagctattg aaattgctaa agaaaataat ggtgaagatc caatcttcta tattttagct + 6601 tgtcgaattg gtccgttcat ccatggaatt aagaaaagaa ttcaagcaat aggtggggct + 6661 cttctggtta atccggatgg tcatgaatgg ctacgagaaa aatggagttt acctgttcgc + 6721 aaatattgga aatactctga aagacttatg gtcaaacatg cagatctttt agtgtgtgat + 6781 agtaagaata ttgaaaaata tatccaagaa gattataaac agtatcaacc taagacaacc + 6841 tatatcgctt atgggactga tacaacacgc tccatattaa agagtagtga cgaaaaagta + 6901 cgttcttggt tcaaagagaa gaatgtttct gaaaacgagt attacctagt tgtaggacgt + 6961 tttgttccag aaaataacta tgaggctatg atacgtgggt ttttagcatc taattctaag + 7021 aaggactttg tcttaatcac aaatgtagaa cagaataaat tttataatca gttgttggca + 7081 aaaactggtt ttgataagga cccacgagta aaatttgtag gtacagtcta tgagcaagag + 7141 cttcttaaat atattcgtga aaacgccttt 
gcttacttcc acgggcatga agttggtgga + 7201 accaatcctt cgcttttaga agctctggca tcaactaaac tgaatttatt gctagatgtt + 7261 ggctttaacc gagaagttgg ggagcaaagt gcgatctatt ggaaaaaaga tgagctttcc + 7321 caagtaatcg agaaagttga gcaatttgat gcaaaaatga ttgatgagtt agatagacaa + 7381 tcaaatcaga gaattacgga ttctttcact tgggaaaaga ttgtcacaga ctacgagaaa + 7441 ttatttaaaa aatgaaaata ctacattata ctttaggatt tcaaccccag cgaacaggtg + 7501 gtttggttaa atatgctgag gatttaatga tagagcaaat tgctcaaggt tatcaagtag + 7561 ccgccctatg tccagggaga attaagttct tttcaaaaaa aatagaaata attaaagcga + 7621 cgtcaaggca gtttgagtgt tatgaactgc ttaatagctt acctatagct ttatttggag + 7681 gtatatccga tccaactgct ttcatgacac cttgtgacaa aaatgtttat cgtacttttt + 7741 tagaaaaagt acaacccgac attatacata ttcactcgtt tatgggattg cataaagaat + 7801 tcctcgaaat tgctaaaaac ttgaatatta gagtggtttt tacgagccat gattattatg + 7861 gattagcacc cgtacctcat ttctatttta atggggtgga ttatagtgat aaaaatacaa + 7921 acttaacatg gaatattatg tcttccaatg ctttaagtgt gaaaaaacta agactttttc + 7981 aagtttcatt ttatcctact attcgtaaac ttttgaaact attagggaaa aatccaaaat + 8041 ctaaaaagaa tttagttatt cgagatgtta ttgaggaaca agattatagt gaacttcgat + 8101 actattataa tgagatgttt cacttaatag atggttattt gtttaatagt agacttgcaa + 8161 agaaggtata tgagataaac gagattcaac cagctaatag tgtagtatta tctataacaa + 8221 gtagttcaat taaacatcat cagagattaa cgactacaaa taataagatt agggtttctt + 8281 atattggttc agacgaagaa tataaaggtt actttgattt tattgacttt gctggaactt + 8341 tagaacaaga atcatatgaa gtggtaactt atggtcattt accaaatgaa gagtgccctt + 8401 cattcattga acaaaaagga tattttacca aggaaacgat tgacagtgtc tatgaaaata + 8461 ttgatatttt gattatagca agcaaatgta aagaaacctt tggattgata acagtagaag + 8521 cattatccta tggggtaaat gtttttgtga gtgaaaatgt tggatcaaaa gacttgcttc + 8581 cagaaacaca tgtttttaaa gacaaggaag atttgttggc taaaatcatc aataatcagt + 8641 tggagaaagt tccgcttaaa acgatggaaa aacatgtaga agaagttatt agttattaca + 8701 aacaggttag aagcaacaat taaggagaat gattaaagat atgtcctgtc cagaaattag + 8761 cgtaattgta ccagtttata atgtggaacg atatttaaga cagtgtatgg 
attcattgat + 8821 aaatcaaact tatagggatt ttgaaataat tttagtaaac gatggatcaa cggattcttc + 8881 tgggattctc tgtgaagagt gggcaaaaaa agatgaaaga attcatgtag ttcacaaaaa + 8941 aaatgagggg cttggcttcg ctcgtaatac aggggttgaa cacgcaaagg ggaaatacat + 9001 aacctttgta gattcagatg actatgtttc tctagatatg ctgcaaactc tatataatgc + 9061 tgttcaagaa tatgatgtcg aagttgtata cagtgcggga tattatcgtt cctttagtaa + 9121 tggagaaata aagaagacag atgtaggaac aaaaaagcct caacttttcg aaggaggaga + 9181 tgttgcctct gaattactcc ctaatgtaat ttctgctcct cctgaatatc cgaatgatgg + 9241 gaaagttgga gtgtcggcat ggaaggttct ctataaagct aatttattta aggataaagg + 9301 gctattattt cattcggaaa gagaattcat ttcagaagat gctatttttc aaattgattg + 9361 tttaaaatta gcaacatctg cccttgttat cccagatatt ttatactact atcgtgaaaa + 9421 ctttggttct ttaagtatga aatataaaga agatcggttt gagttggata agatcttgta + 9481 taacgagcaa ttaaaaagag ttgaggggtt acctaatcaa gaaattttgg aagaaagaat + 9541 cgagagaatt ttaattgcta atattcgttt atgtgtcttt caggaatctt tacataaaag + 9601 ttctagaata cataaacgct tgcaaagaat tagacagatt tgtaaggatc cagtctcaaa + 9661 agtagtttta caccactatc caatccatcg cttacctttt cctaaacgtt tgatctgtgt + 9721 attagctaag tataatatgt cgctgtttct tttagcttta accctattaa aatatcggaa + 9781 tcggagtgta taacttttat ggggatgaat atagaaaaat taaaactatc tttgaaaaat + 9841 agaacgtttt ttcctgttgt tattcatgcc ttacgtaacc gttggccctt gtggtggatt + 9901 cggagtaagg ctattcgaga agtacaactt gaagataggg cctacagaat actaaaaaag + 9961 aaatacggtt ccttaatttc aaactctttt gataaagcat acttatcaga aaaagttccc + 10021 aagcaaatct ggatttgctg gtttcaaggt atggagaatg ctccagattt ggtgaaatca + 10081 tgttatagat cacttaaaaa gcaatttcct gaatatgtca ttacggttat ttcttcagag + 10141 aatatttttg aatatgtaga gatacctgat attctatatg aaaagtgggt gaatggtgta + 10201 ataggcaatg ctcatttttc tgatatcctt cgggtagagt tgttacgtaa gtttggagga + 10261 atatggattg actctacagt gtattgtaca ggaattacta ccatacagat aattggaaaa + 10321 aatccatttt ttatgtataa aagtgtatct tcggtcgagg agaggatctc ctcttccaac + 10381 tggatgattg cttctgttcc taatcatcca ttcatgatta cgatgagcaa acttttgcaa + 10441 
tcttattggt caaaagaagt tatagcaatt cattattatc tatttcatat tctttttacg + 10501 attatgatag aatcacttcc tgagttgtgg cagcttgtac ccacctatac gaacgcagca + 10561 ccacatataa tgattgatga attaaataat gttttttcaa aggaacgtta ccagcaattg + 10621 tgtcaaattt cagattttca taaattaaat tataaaaaaa attacaatga taaatcagag + 10681 agtttgtaca gttatttact gaatcagtag aggggagaat cttgcctagt ttaaagaaaa + 10741 atattgttta caatgtctta tatcagatct tagctgtaat agtaccattt attacctcac + 10801 cttacttagc gcgtgtgtta ggtgcagagc aaattggagt ttattctttt acttattcca + 10861 ttgcttttta ctttatgatt ctgtccatgt tggggatttc taattatggg aatcggacaa + 10921 tagcacgggt acgaacaagt agagaacatt tgaatcagga attttcgaat atttacgcgg + 10981 ttcagttgac gtgttcacta gtaatgacca tctcatattt gatttatgca acagtatttg + 11041 tgaatagttt tcagattgta gcctatatcc aagtattaca tgttttatcg tatgcaacag + 11101 atgttagttg gtttttttat ggtcttgaag agtttcgtat tacggttgct aggaattcat + 11161 ttgttaagtt attaacttta atatctatct ttacatttgt aaaaagccct aatgatatct + 11221 atttatatac ctttataatg gcagggggta ccctgcttgg tcagttgatt acatggccat + 11281 ttttgctaaa acaagtaaac tttgtgtgcc ctagtcttgg aaaaataaag aaacacatga + 11341 aacctattat tattttattt ttccccgtct tagcggttag tattttttcg tttctagata + 11401 aaataatgct tgggatgtat agtagtttga aggaaactgc tttttatgag aattcagata + 11461 agatcattag tattccaaaa gctctgattc aagcctttgg agctgtaatg ttgcctcgaa + 11521 cagtacattt actgagtata ggtgatgaac aaaaaagttt agaatatgtt gataaaacga + 11581 tgtgggctgt tttagtgatt acaatgggct gtgctttcgg tttagcagga gtttctgcaa + 11641 cctttgctcc tgtttattgg ggtgaagaat ttagagccag tagccaaatt attgcaggaa + 11701 tgacaccggc tttagtattt tcggcttttg gaaatgtcat ccgaacccag tttttaattc + 11761 cacgaagttt tgacaaggaa tatacggtat ctttacttta tggagccgtt gttaatattt + 11821 tgattaatat tcttttaatt ccgaagatag gagcaatggg agctgttatc ggaacaattg + 11881 ttgcagagtt agttctatgt tgctatcaaa catggattgc tagaaattat ttacatatca + 11941 gagaatatct gataaatgct gggatattat ttcttatcgg ttcagtaatg tatatggttt + 12001 taattcttat ttcaagtatt ttacctactt cgttacttac acttattatt gaaattatag + 12061 
tcgcagcttt catttatatt agtttactga ttctgcatat cttttcttca aaaaacaggg + 12121 taattattgg tttacgaaca aattttttag aacgtactca tttatttaaa aggaagtaat + 12181 agtgaaattt aaatttaaat ttaatccaat cgcgatactg tatatattgc tagtatactt + 12241 agagttagct acagataggc aacatctgta tcctgtaacg tacatgacaa aatattatat + 12301 tggtatttta atcactgtgt tgtttgtttt gttattagta ggccgtggga agcttatttt + 12361 tgttaataaa aaattattat atcttgctaa gatattagct ataccaacaa ttgttctttt + 12421 cctgtactca gtcttactag acgtaatgaa cccagttgaa tttgatggat attttagtag + 12481 gttatcaagt acgactattt ttggtttgtt agctatcttt caagctatag ttgtttttca + 12541 attttttgga caaaaagtag tagattacac ttttacagct atctccctca gctacttaac + 12601 cagtatcatt gttgccttta ggcagggagg acttagtcaa tttatcttga tgctaacaga + 12661 tgatagtttc aatggttcgg tactagaaat gcatgaagtt gcacctatta cagctctctt + 12721 tattctgtac tatttgtaca aatattttat aaaagaaaat agtttttctt cagtatttcg + 12781 taatatctta atagctctca ttattctttt tttaagcctt aaacgaatcg tttttttgag + 12841 tgtattaatt atcataccag tatttttgat aatttattgg tatgataaaa aagtaagcaa + 12901 actagggaaa gaacgaaaaa ttttaagttt attaaatagc ttttccttaa tatttataac + 12961 aggaatattc ctttatgttt atagtgtaaa atctggtttt atatatacat ttattcaaga + 13021 acataatatt aattcgatgg ctagaacaga tttatggaag ggaattgaat caacctatag + 13081 tttcgcccct atatttatgg ggagagggat agggtttgta acaaaatgga tggataataa + 13141 ttggatgact ttgaatatca atggtcttac agagtcaacg gggctccata atgatatttt + 13201 gaagtactac attgagatag gatttgtagg attatttatt tatttttaca ctcttcttta + 13261 tagaaatgct aaacgtatat ttgtaaaaat tggtcataaa gaatcattta tatattttgt + 13321 attgataatg tttcagatgc tgatatggtt tacagataat atttcaactt accataattt + 13381 tttatggatt ctaaatctac tgctcttttc tttaactaat acggatgcag aattggaaac + 13441 tcagaaatta taaaatattt atttcttgaa tttatggtct tacgccgtaa atttgatttc + 13501 actaatgact aatactaatt tataaaaata atatgaaatt ttatataaaa aatttattaa + 13561 aaaaagtctt tacattaccg ttgcatttat tgcctattca gtctaataag ataatatttg + 13621 ataattttgg tggtagaggt tttggggaca atcctaagta tatacttgaa gaacttgtct + 13681 
ctcgagaaaa gaatctaaat cttgtgtggg taacaaaaga tagagaaatt tctatccctg + 13741 aaggcgttcg agtagtaaaa tacggcagtt accgttcttt ttatgaatgg ttaacagcta + 13801 gagtttgggt agataatatt cgtaattctg atcgaccttg gaagcgaaaa ggacagattt + 13861 atcttcaaac ttggcatggt tcagatgggg taaagttaat tgaaaaaagt gttgcaggga + 13921 atctaaaaaa aacatatctt agaatggcga agtatgatgg aaagattaca gacggtatcg + 13981 tatcaagtcg gcactttcaa actttgggta tgcaaaataa tttttggctg acagagaatg + 14041 tggaatttct ggaatttgga ttacctcgaa atgatgattt ttttaaaagt gaaaaaatca + 14101 aaaccacaaa tataaaattt agaacattat ttgatatcga tttagacgaa ctggtagttt + 14161 tgtatatgcc gacgttcaga gatgatggat cgttgaatgc ctataattta gattactcga + 14221 aactaataca tgtttttcaa aataaattta gaaaaaatgt aaaaatatta gttcgttttc + 14281 atccaaatgt tgattctaat tttataaatt tacaggatac agactgtata aatgtgtcga + 14341 cctattcaaa tcctcaggat ctgatgatga gtgcggatgt gatgattacg gattattcat + 14401 cggcttctat tgattttatg ttattaaatc gtccagtatt tctgtattta ccagattatc + 14461 aaagttatgt gaatgataga ccattggatg ataactttga taaattgcca tttccaagag + 14521 catatcataa caatgagttg acagaaatta ttagagactt tgaaagaagt aaatatgatg + 14581 aaaaagttcg tctgtatgaa ttagaggatg ttcgttttga tagaggaaaa gcatcagtac + 14641 agtgtgctaa ttggattgaa gaaaaaataa aaaacaataa agttattgat tgaaataatt + 14701 atatttattg aatgataaat aaggaggcct ttagatgaaa agaattataa catatggtac + 14761 atttgattta ttgcattatg gtcatatcag tcttttgaaa cgtgctaaac agctaggtga + 14821 ttatttgatt gtagttgttt caagtgatga gtttaattta aaagaaaaga ataaagtatg + 14881 ttactttaac tacgaacaca gaaaaaattt agtagaagct attcgatatg tcgatttagt + 14941 aatccctgaa actagttggg aacagaaaaa gtcagatgtt aaagagtacc atattgacac + 15001 ttttgtaatg ggtgatgatt ggaaaggtaa atttgattat cttgaagaag aaggtgttga + 15061 agtagtctat ttgcctagaa caaaggaaat atcaaccaca aagataaaag aagatttatc + 15121 ggaataaaat attattaaaa aatgctgaca taagaaattg tggcttttgt gtatagtttt + 15181 tgatagaata aagtaacaac actttaacca atgaggtgtg aataatggca gtaattttta + 15241 aagatgtact tgttgaagag aagactgatg aagaaaaaca acatatttta tctattttag + 15301 
atgatgagaa tgttagagct tttgattgtg gatattaaga attgaatgat gttttttgat + 15361 atttagaaca aatacgatga agaaacaggc catgtattgc ctattgtaaa tcaaaatttt + 15421 gaattattag gttttatttc ttgtagacta gtatcatttt ctttcatagc tcgggttaaa + 15481 gagatgggaa ttagcataga ttatcttggt gtttataagg attgccagaa aatgggggat + 15541 cggttcgctt ttggtgacct ttgcacttcg attatcttta actattgact gttgattacc + 15601 aataaaaggt gtaatagttc atgctttaga ggatgttgta gaattctatg acaaactggg + 15661 ttttattgac cctagagata tagtgattta taatggcaaa ccggttacta tatattttag + 15721 taatagactt cctgcaaaac tagaatccta gttcatgatt gataatacca gcattcaaat + 15781 tcattcgtaa tccgaagcgt ttacgatgat ttcgataggt tgttgaaaac attttaaaca + 15841 tttttacttt ggcaaagatg ttctcaacct tgcttctctc cttagatagc gcatggttac + 15901 aggctttatc ttcagctgtt agtggcttga gtttgctgga tttacgtgga gtttgtgctt + 15961 gaggatatat cttcatgagc ccttgataat cactgtcagc caagatttta ccagcttgtc + 16021 cgatatttct gcgactcatt ttgaacaact tcatatcatg gcaatagaaa caattctccc + 16081 ttgacttgtg acaatcgctt gagccttcat agcgtggcat ttctttttac cagaatcatt + 16141 cgctaattgt ttttttaggt cgattgattt ttacttccgt cgcatcaatc attaccgtgt + 16201 cctcaaaact aagaggagtt cttgaaatcg taacaccact ttgaacaaga gttacttcaa + 16261 cccattggct ccgacggatt aagttgcttt cgtggatacc aaaatcagcc gcaatttctt + 16321 cataagttca atattctcgc acatattgaa gagtggccat aagaaggtct tctaggctta + 16381 atttaggttt tcgtccacct tttgcgtgtt taagttgata agctgttttt aatacagcta + 16441 acatctcttt aaaagtcgtg cgctgaacac caacaagacg cttaaatcgt gtatcagtta + 16501 attgtttact tgcttcataa ttcatagaac tactatacca tattttgttt cgcaggaagt + 16561 ctattgaaaa attaagaaat ggtgaaatta ttcctcacac acagttattt gaaacatcct + 16621 tagaaaatga tttttaattg tatgcaaaca aagtagaatt cacttatttt atcttatgct + 16681 aaatgtaata tgaaacaagt gaatttttat agacaaagaa gaatttttct gtaattttta + 16741 gataataatt ttaaaaaatg tgatgattat tttcttttta gagcagtaca gaattaatag + 16801 taattgactc taaatcaata aagaaaggta ccctattatg aaaggtatta ttctagcagg + 16861 tggttcggga actcgcttgt atcctttgac tcgcgctgca tcaaaacaac tgatgccggt + 16921 
ttatgataaa cccatgattt actatccact ttcaacattg atgttggctg ggattaggga + 16981 tattttgata atctcaactc ctcaagattt gcctcgtttt aaagagcttc ttcaagacgg + 17041 atctgagttt gggatcaagc tttcttatgc agagcaacca agtccagatg gtttggcaca + 17101 agcctttatc attggggaag agtttattgg tgatgatagc gttgctctaa tcttaggcga + 17161 caatatctat cacggacctg gcctttctaa gatgttacaa aaggcagcag gtaaggagtc + 17221 gggagcaact gtttttggct accatgtcaa ggatccagag cgctttggtg tggttgagtt + 17281 tgatcaggat atgaaggcta tttctattga agaaaagcca gagcaacctc gttcaaacta + 17341 tgcagttaca ggtctctatt tctatgataa tgatgtagta gagattgcca agagtattaa + 17401 accaagtcct cgtggtgaac tggaaattac agatgtaaac aaagcttacc tagatcgtgg + 17461 tgatttgtct gttgagctta tgggacgtgg ctttgcttgg ctggatactg gaactcatga + 17521 aagtttacta gaggcttcac agtacatcga aacagtgcaa cggatgcaaa atgttcaggt + 17581 agcaaactta gaagaaattg cctatcgcat gggttatatc agtcgtgaag atgtattgac + 17641 cttagcccaa ccacttaaga aaaatgaata cggacagtat ctgctccgtt tgattggaga + 17701 agcatagatg acagataatt ttttcggtaa gacgcttgcg gcacgcaagg ttgaagctat + 17761 tccaggcatg ttggagtttg atatccccgt tcatggagat aatcgtggct ggtttaaaga + 17821 aaatttccaa aaggaaaaaa tgcttccact tggatttcca gagtctttct ttgcagaagg + 17881 aaaattgcaa aacaatgtat ccttctcacg taaaaatgtc cttcgagggc tccacgcaga + 17941 gccttgggat aagtacatct ctgtagcaga tggagggaaa gttctgggtt cttgggttga + 18001 tctacgcgag ggtgaaacct ttgggaatac ctatcagaca gtaattgatg caagcaaggg + 18061 aatctttgtt cctcgaggcg tagctaatgg cttccaagtt ctatcagata cagtgtcata + 18121 tagctatctg gtcaatgatt actgggctct cgagctcaaa cccaagtatg cctttgtgaa + 18181 ctacgctgat ccaagccttg gtattgaatg ggaaaatatt gcagaagcag aggtttcaga + 18241 agcagataaa catcatcccc tacttaagga tgtaaaacct ttgaaaaaag aagatttgta + 18301 aaaaggaaag aatatgactg aatacaaaaa tattatcgtg acaggtggag ctggctttat + 18361 cggttctaac tttgtccatt atgtttacga gaactttcca ggtgttcacg tgacagtcct + 18421 agataagttg acttatgctg gaaatcgcgc gaatattgag gaaattttag gtaatcgtgt + 18481 tgagttagtt gttggtgaca ttgctgatgc ggagttggta gacaagttgg ctgctcaagc + 18541 
agatgctatc gttcattatg cagcggaaag ccacaatgat aattcactca atgatccatc + 18601 gccatttatt catactaact tcatcggaac ctatactctt ttagaagctg ctcgtaagta + 18661 tgatattcgc ttccaccatg tatcgacaga tgaagtttat ggggatctcc ctttacgcga + 18721 agatttgcca ggtcatggtg aaggaccagg tgagaaattt actgctgaaa caaaatacaa + 18781 cccaagctct ccgtactcat caaccaaggc agcctcagat ttgattgtca aagcttgggt + 18841 gcgttctttt ggagtcaagg caacgatttc caactgttca aataactacg gtccttatca + 18901 acatatcgaa aaattcatcc cacgtcagat tactaacatc ctaagtggaa ttaagccaaa + 18961 actttacggt gaaggtaaga acgttcgtga ctggattcat accaatgacc attcttcagg + 19021 agtttggaca atcttgacaa aagggcaaat cggtgaaacc tacttgattg gggctgatgg + 19081 tgagaagaac aataaggaag ttttggaact tatccttaag gaaatgggac aagctgcgga + 19141 tgcctatgat catgtgactg accgtgcagg acatgacctt cgctatgcga ttgatgccag + 19201 caagctccgt gatgagttgg ggtggaaacc tgaatttact aactttgaag ctgggctcaa + 19261 ggcaacaatc aagtggtata cagataacca agaatggtgg aaagcagaaa aagaagctgt + 19321 tgaagccaat tatgctaaga ctcaggagat tattacagta taaaaagcag gaaatagctg + 19381 ctttttattg ctatattggg aagagttaca tattagaaag gtctagagat gattttaatt + 19441 acaggggcaa atggccaatt aggaacggaa cttcgctatt tattggatga acgtaatgaa + 19501 gaatacgtgg cagtagatgt gactgagatg gacattacca atgaagaaat ggttgagaaa + 19561 gtttttgaag aggtgaaacc gactttagtc taccattgtg cagcctacac cgctgttgat + 19621 gcagcagagg atgaaggaaa agagttggac ttcgccatca atgtgacggg gacaaaaaat + 19681 gtcgcaaaag catctgaaaa gcatggtgca actctagttt atatttctac ggactatgtc + 19741 tttgacggta agaaaccagt tggacaagag tgggaagttg atgaccgacc agatccacag + 19801 acagaatatg gacgcactaa gcgtatgggg gaagagttag ttgagaagca tgtgtctaat + 19861 ttctatatta tccgtactgc ctgggtattt ggaaattatg gcaaaaactt cgtttttacc + 19921 atgcaaaatc ttgcgaaaac tcataagact ttaacagttg taaatgacca gtacggtcgt + 19981 ccgacttgga ctcgtacctt ggctgagttc atgacctacc tagctgaaaa tcgtaaggaa + 20041 tttggttatt atcatttgtc aaatgatgcg acagaagaca caacatggta tgattttgca + 20101 gttgaaattt tgaaagatac agatgtcgaa gtcaagccag tagattccag tcaatttcca + 20161 
gccaaagcta aacgtccgct aaactcaacg atgagcctgg ccaaagccaa agctactgga + 20221 tttgttattc caacttggca agatgcattg caagaatttt acaaacaaga agtgagataa + 20281 gtagtagaat gattttctag tctaataaaa gaggcagata atgaactcca aaggagctta + 20341 agatgtacga ttatcttgtt gttggtgctg gtctctttgg cgcatagctt tggctcagtt + 20401 tctattatcg ctcacaccat ccatcagaag tttaatctga aggtacccaa ttatcgtcaa + 20461 gaagaagatt gggctaggat gggtttacca atcacacgta aggaaatctc taattggcat + 20521 atcaaggcaa gtcaatacta tttagagtcc ctttataacc ttttacgaga aaagttgtta + 20581 gaacaacctc ttcttcatgc ggatgaaacc tcttatcggg ttctagggag tgatagccat + 20641 ctgacctact attggacctt tttgtctggg aaagctgaga atcaagcaat cacgctgtac + 20701 catcatgatc agcgtcggag tggttcggta gtgcaagaat tcctaggaga ttattctggc + 20761 tatgtgcatt gtgatatgtt gcggcagtaa cttaggactt tagtcctcta gttctgccta + 20821 tgcgatagca gtccaaggtt taggagcaag gcgacgctaa gcttggtaaa ctgcgaaccg + 20881 ctagaagctt atcgtcaact ggaagaagct gaacttgttg gatgttgggc acatgtgaga + 20941 aggaagtttt ttgaagcgac ccccaagcaa gcagataaat catccttagg agctaaaggt + 21001 ttagcttatt gtgatcagtt attttccctg gaaagagact gggaggcttt gccagctgat + 21061 gaacgactac agaaacgtca agaacatctc cagcccttaa tggaagactt ctttgcttag + 21121 tgccggcgtc agtcagtttt agcaggttca aaactaggaa gggcaattga atacagcctc + 21181 aagtatgaag aaacctttaa gactattttg aaagacggac atctggtcct ttccaataat + 21241 ctagctgaac gcgccattaa atcattggtt atgggacgga gtaaaagagt ccagtggact + 21301 cttttagcct aagctaaatt ttaaaaagcg agggtggtta ttttctcaaa gttttgaagg + 21361 agctaaagca agaactatta ttatgagttt gttggaaaca gctaaacgtc atcaattaaa + 21421 tagcgagaaa tatctattct atcttctaga atgtctttca aacgaggaaa ctctcgtaaa + 21481 caaagaggtt ttagaggctt atttaccatg gactaaagtt gtacaagaaa agtgcaaata + 21541 agaaatctcc agattaggaa ctatccgtga gttctctagt ctggagattt ttcggctctt + 21601 tgtcaactgt agtgggttga aaaaaagcta agctcgagaa aggacaaatt ttgtcctttc + 21661 tttttttaga aatagtatta aaaattcctt gactatgtga tatagttgag ggatttttaa + 21721 atgatattca tattttttgc aaagatgttg tttgaaaaat aattttcaaa aattctgaaa + 21781 
attctgttga catctttctg aaaagagtct ataatggaga gaaagtttta aaggagaaaa + 21841 tgatgaaaag ttcaaaacta cttgcccttg cgggcgtgac attattg +// + diff --git a/public/res/serotype_genbank/serotype_18B.gb b/public/res/serotype_genbank/serotype_18B.gb new file mode 100644 index 0000000..c0cc3ee --- /dev/null +++ b/public/res/serotype_genbank/serotype_18B.gb @@ -0,0 +1,1008 @@ +LOCUS CR931672 21819 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 1033/41 (serotype 18b). +ACCESSION CR931672 +VERSION CR931672.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 21819) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 21819) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..21819 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="1033/41" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC18B_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC18B_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI33548.1" + /db_xref="GOA:Q4K1T1" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K1T1" + /translation="SNEEQDLTVEGKVKSVLIENTAAKEVLEKQVLAPWDAFCVELL" + gene 293..466 + /gene="aliB" + /locus_tag="SPC18B_0002" + /pseudo + CDS 293..466 + /gene="aliB" + /locus_tag="SPC18B_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + /db_xref="PSEUDO:CAI33549.1" + gene complement(459..980) + /gene="tnp" + /locus_tag="SPC18B_0003" + /pseudo + CDS complement(459..980) + /gene="tnp" + /locus_tag="SPC18B_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase (fragment)" + gene 1203..2648 + /gene="wzg" + /locus_tag="SPC18B_0004" + CDS 1203..2648 + /gene="wzg" + /locus_tag="SPC18B_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33551.1" + /db_xref="GOA:Q9AH98" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q9AH98" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILVF + RYLNLVVTVLVLLVALIGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VDQSSSYLAAYKSLIAGDTKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPIGSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNKKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRGRYSLADGDRDRGRNQQKVIVAIIQKLTST + EVLKNYSSILQGLQDSLQTNMPIETMIDLVNTQLESGGNYKVNSQDLKGTGRMDLPSY + AMPDSNLYVMEIDDSSLAVAKAAIQDVMEGR" + misc_feature 1203..1319 + 
/gene="wzg" + /locus_tag="SPC18B_0004" + /note="Signal peptide predicted for SPC0890 by SignalP 2.0 + HMM (Signal peptide probability 0.996) with cleavage site + probability 0.577 between residues 39 and 40" + misc_feature 1407..1754 + /gene="wzg" + /locus_tag="SPC18B_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 2.1e-64" + misc_feature 1932..2375 + /gene="wzg" + /locus_tag="SPC18B_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 8.8e-69" + gene 2650..3381 + /gene="wzh" + /locus_tag="SPC18B_0005" + CDS 2650..3381 + /gene="wzh" + /locus_tag="SPC18B_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33552.1" + /db_xref="GOA:Q4K157" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K157" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAEAYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTMDALEKLEKKEIPTLNDS + RYALIEFSMHTSYRQIHTGLSNILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QINSYHVSKPKFFGEKYKFMKKRARYFLERDLVHVIASDMHNLDSRPPYMQQAYDIIA + KKYGAKKAKELFVDNPIKIIMDQLI" + misc_feature 2653..3261 + /gene="wzh" + /locus_tag="SPC18B_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 1.1e-38" + gene 3390..4082 + /gene="wzd" + /locus_tag="SPC18B_0006" + CDS 3390..4082 + /gene="wzd" + /locus_tag="SPC18B_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33553.1" + /db_xref="GOA:Q4K177" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K177" + /translation="MQDQNTLEIDVFQLFRALWKRKLVILLVAIITSSVAFAYSTFVI + KPEFTSTTRIYVVNRNKEEKSGLTNQDLQAGSYLVKDYREIILSQDVLEEVVSDLKLD + LTPKGLANKIKVTVPVDTRIVSISVNDRVPEEASRIANSLRKVAAQKIISITRVSDVT + TLEEARPAISPSSPNIKRNTLIGFLAGVIGTSVIVLLLELLDTRVKRPEDIENTLQMT + LLGVVPNLGKLK" + 
misc_feature 3408..3824 + /gene="wzd" + /locus_tag="SPC18B_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 4.5e-53" + misc_feature 3930..4007 + /gene="wzd" + /locus_tag="SPC18B_0006" + /note="PS00217 Sugar transport proteins signature 2." + gene 4092..4775 + /gene="wze" + /locus_tag="SPC18B_0007" + CDS 4092..4775 + /gene="wze" + /locus_tag="SPC18B_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33554.1" + /db_xref="GOA:Q9AH95" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q9AH95" + /translation="MPTLEIAQKKLEFIKKAEEYYNALCTNIQLSGDKLKVISVTSVN + PGEGKTTTSINIAWSFARAGYKTLLIDGDTRQSVMSGVFKSREKITGLTEFLSGTADL + SHGLCDTNIENLFVVQSGSVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTPPIGIVI + DAAIITQKCDASILITATGEVNKRDVQKAKQQLEQTGKLFLGVVLNKLDISVDKYGAY + GSYGNYGKK" + gene 4791..6158 + /gene="wchA" + /locus_tag="SPC18B_0008" + CDS 4791..6158 + /gene="wchA" + /locus_tag="SPC18B_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI33555.1" + /db_xref="GOA:Q9AH94" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q9AH94" + /translation="MDEKGLKIFLAVLQSIIVILLIYFLNFVRETELERSSMVILYLL + HFFVFYFSSYGNNFFKRGYLVEFNSTIRYIFFFAIAISVLNLFIAERFSISRRGMVYF + LTLEGISLYLLNFLVKKYWKHVFFNLKNSKKILLLTVTKNMEKVLDKLLESDEPSWKL + VAVSVLDKSDFQHDKIPVIEKEKIIEFATHEVVDEVFVNLPGESYDIGEIISRFETMG + IDVTVNLKAFDKNFGRNKQIHEMVGLDVVTFSTNFYKTSHVISKRILDICGATIGLIL + FAIASLVLVPLIRKDGGPAIFAQTRIGKNGRHFTFYKFRSMRIDAEAIKEQLMDQNTM + QGGMFKIDNDPRVTKIGRFIRKTSLDELPQFWNVFIGDMSLVGTRPPTVDEYDQYTPE + QKRRLSFKPGITGLWQISGRSKITDFDAVVKLDVAYIDNWTIWKDIEILLKTVKVVFM + RDGAK" + misc_feature 5574..6155 + /gene="wchA" + /locus_tag="SPC18B_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + 
transferase, score 2.3e-146" + gene 6189..7361 + /gene="wchF" + /locus_tag="SPC18B_0009" + CDS 6189..7361 + /gene="wchF" + /locus_tag="SPC18B_0009" + /note="member of homology group 15" + /codon_start=1 + /transl_table=11 + /product="putative rhamnosyl transferase WchF" + /protein_id="CAI33556.1" + /db_xref="GOA:Q9AH93" + /db_xref="InterPro:IPR001296" + /db_xref="InterPro:IPR015393" + /db_xref="UniProtKB/TrEMBL:Q9AH93" + /translation="MKKSVYIIGSKGIPAKYGGFETFVEKLTAFQQDKAIQYYVACMR + ENSAKSGTTEDVFEHNGAICYNVDVPNIGPARAIAYDIAAINRAIEIAKENKDEAPIF + YILACRIGPFIHGIKKKIQAIGGTLLVNPDGHEWLRAKWSAPVRRYWKISEGLMVKHA + DLLVCDSKNIEKYIQEDYIQYQPKTTYIAYGTDTTRSTLNSSDEKVRAWFKEKNVSEN + EYYLVVGRFVPENNYESMIRGFLASSSKKDFVLITNVEQNKFYNQLLASTGFDKDPRV + KFVGTVYDQELLKYIRENAFAYFHGHEVGGTNPSLLEALASTKLNLLLDVGFNREVGE + QSAIYWKKDELSQVIEKVEQFDAKMIDELDRQSNQRIGDYFTWEKIVTDYEKLFKK" + gene 7358..8629 + /gene="wciU" + /locus_tag="SPC18B_0010" + CDS 7358..8629 + /gene="wciU" + /locus_tag="SPC18B_0010" + /note="member of homology group 59" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33557.1" + /db_xref="GOA:Q9AH92" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q9AH92" + /translation="MKILHYTLGFQPQRTGGLVKYAEDLMIEQIAQGYQVAALYPGRI + KFFSKEIEIIKATSRQFECYELLNSLPMALFGGISDPTAFLTPCDKNVYRTFLEKVQP + DIIHIHSFMGLHKEFLEIAKNLNIRVVFTSHDYYGLAPVPHFYFNGVDYSDKNTNLTW + NIMSSNALSVKKLRLFQVSFYPTIRKLLKLLGKNPKSKKNLVIRDVIEEQDYSDLRYY + YNEMFHLIDGYLFNSRLAKKVYEINEIKSANSIVLSITNSSINHHQRLTTANNKIRVA + YIGPDEEYKGYFDFIDFVETLDRESYEVATYGHLPNEECPSFIEQKGYFTKEMIDSVY + ENIDILIVPSKWKETFGLITVEALSYGVNVFVSENVGSKDLFPETHVFKDKEDLLAKI + INNQLKKIPLKTIEEHVEEVIGYYKQVRSNN" + misc_feature 8132..8602 + /gene="wciU" + /locus_tag="SPC18B_0010" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 0.00023" + gene 8635..9699 + /gene="wciV" + /locus_tag="SPC18B_0011" + CDS 8635..9699 + /gene="wciV" + /locus_tag="SPC18B_0011" + /note="member of homology group 91" + /codon_start=1 + 
/transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33558.1" + /db_xref="GOA:Q9AH91" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q9AH91" + /translation="MIKDMSCPEISVIVPVYNVERYLRQCMDSLINQTYRDFEIILVN + DGSTDSSGVLCEDWAKKDERIHVVHKKNEGLGFARNTGVEHAKGKYITFVDSDDYVSL + DMLQTLYNAVQEYDVEVVYSAGYYRSFSNGEIKKTDVETKKPQLFEGGDVASKLLPDV + ISAPPEYPNDGKVGVSAWKVLYEANLFKEKGLLFHSEREFISEDAIFQIDCLKLATSA + LVIPDILYYYRENFGSLSMKYKEERFELDKILYNEQLKRVEGLPNQEILEERIERILI + ANIRLCIFQESLYKSSRIHKRLQRIRQICKDPISKSVLRHYPIHRLPFTKRLICVLAK + YNMSLLLLVLTSLKYRNRSV" + misc_feature 8665..9207 + /gene="wciV" + /locus_tag="SPC18B_0011" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 2.6e-45" + gene 9705..10616 + /gene="wciW" + /locus_tag="SPC18B_0012" + CDS 9705..10616 + /gene="wciW" + /locus_tag="SPC18B_0012" + /note="member of homology group 92" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33559.1" + /db_xref="GOA:Q9AH90" + /db_xref="InterPro:IPR008441" + /db_xref="UniProtKB/TrEMBL:Q9AH90" + /translation="MGMNIEKLKLSFKNGTFFPVVIHALRNRWPLWWIRSKAIREVQL + EDRAYRILKKKYGSLISNSFDKSYLSEEVPKQIWICWFQGMENAPELVKSCYRSLKKQ + FPEYVITVISSENISEYVEISDIIYKKWGNGVIGNAHFSDILRVELLRKFGGIWIDST + VYCTGITTIETIEKNTFFMYKSLYSVEERISSSNWMIASVPNHPFMVTMSTLLQSYWS + KEVIAIHYYLFHILFTIMIESLSELWQLVPTYTNATPHIMVDELNNVFSKERYQQLCQ + ISDFHKLNYKKNYNDKSESLYSHLLNQ" + misc_feature 9786..10604 + /gene="wciW" + /locus_tag="SPC18B_0012" + /note="HMMPfam hit to PF05704, Capsular polysaccharide + synthesis protein, score 1.1e-149" + gene 10628..12085 + /gene="wzx" + /locus_tag="SPC18B_0013" + CDS 10628..12085 + /gene="wzx" + /locus_tag="SPC18B_0013" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33560.1" + /db_xref="GOA:Q4K149" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K149" + /translation="MPNLKKNIVYNVLYQILAVIVPFITSPYLARVLGAEQIGVYSFT + 
YSIAFYFMILSMLGISNYGNRTIAQVRTSREHLNQEFSNIYAVQLTCSLVMTVSYLIY + ATVFVNSFQIVAYIQVLHVLSYATDVSWFFYGLEEFRITVARNSFVKLLTLISIFTFV + KSPNDIYLYTFIMAGSTLLGQLITWQFLLKQVNFVRPNLGKIKKHMKPIIILFFPVLA + VSIFSFLDKIMLGMYSSLKETAFYENSDKIISIPKALIQAFGAVMLPRTVHLLSIGDE + QKSLEYVDKTMWVVLVITMGCAFGLAGVSATFAPVYWGEEFRASSQIIAGMTPALVFS + AFGNVIRTQFLIPRSFDKEYTVSLLYGAVVNILINILLIPKMGAMGAVIGIIVAELVL + CCYQTWIARNYLHIREYLINAGILFLIGSVMYMVLILISSILPTSLLTLIIEIIVGAF + IYISLLVLYIFSSKNRVIIGLRTNFLEHTHLFKRK" + misc_feature 10637..11440 + /gene="wzx" + /locus_tag="SPC18B_0013" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 4.7e-56" + gene 12088..13362 + /gene="wzy" + /locus_tag="SPC18B_0014" + CDS 12088..13362 + /gene="wzy" + /locus_tag="SPC18B_0014" + /note="member of homology group 93" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33561.1" + /db_xref="InterPro:IPR007016" + /db_xref="UniProtKB/TrEMBL:Q4K148" + /translation="MKFKFNPIAILYILLVYLELATDRQHLYPVTYMTKYYIGILIIV + LFVLLLVGRGKLIFVNKKLLYLAKILAIPTIVLFLYSVLLDVMNPVEFNGYFSRLSST + TIFGLLAIFQAIVVFQFFGQKVVDYTFTAISLSYLTSIIVAFRQGGLSQFILILTDDS + FNGSVLEMHEVAPITALFILYYLYKYFIKENSFSSVFYNILIALIILFLSLKRIVLLS + VLIIIPVFLVIYWYDKKVSKLGKERKILSLLNIFSLIFITGIFLYVYSVKSDFIYTFI + QEHNINSMARTDLWKGVESTYNFAPIFMGRGIGFVTKWMDNNWMTLNINGLTGTMGIH + NDILKYYIEIGFVGLFIYFYTLLYRNAKRIFVKIGHKESFIYFVLIMFQMLIWFTDNI + SIYHNFLWILNLLLFSLTNSDTELENLDFKNF" + misc_feature 12925..13137 + /gene="wzy" + /locus_tag="SPC18B_0014" + /note="HMMPfam hit to PF04932, O-Antigen Polymerase, score + 7.3e-10" + gene order(13416..13583,13587..14417) + /gene="wciX" + /locus_tag="SPC18B_0015" + CDS join(13416..13583,13587..14417) + /gene="wciX" + /locus_tag="SPC18B_0015" + /note="member of homology group 107" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI33562.1" + /db_xref="GOA:Q4K168" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q4K168" + 
/translation="MKTDARTKKRENETLYILKVWATFSVIAIHFGFLGQIGVFYKVL + ARFAVPLFFMISFYSFSISEEKLKKRIKNLSLLIISSTSFYFLLDVFLQLTQGNLRVV + FERFTFNNIFNFLVFNQISALIGSLATPLWFLYALLYVYIYLFFSNKKWIFNTILTVI + ILCCSFIIELKANSALFYRNFLFMGVPFFSFGMYFAQIQRKIINYKHFKELFIIGIMI + SGFLTLIEYTFLGANFELYVSSVIISCMLMVFSIKYPQLWTLDFAVNIAKKNATFIYI + SHQFVILLFKTYVRDGIAYKIGTFLIFLACVIMSIIFNYIVDIISRCCIKEKQDII" + gene 14414..15574 + /gene="wciY" + /locus_tag="SPC18B_0016" + CDS 14414..15574 + /gene="wciY" + /locus_tag="SPC18B_0016" + /note="member of homology group 78" + /codon_start=1 + /transl_table=11 + /product="putative glycerol phosphotransferase" + /protein_id="CAI33563.1" + /db_xref="GOA:Q4K146" + /db_xref="InterPro:IPR007554" + /db_xref="UniProtKB/TrEMBL:Q4K146" + /translation="MKFYIKNLLKKVFTLPLHLLPIQSNKIIFDNFGGRGFGDNPKYI + LEELVSREKNLDLVWVTKDREISIPEGVRVVKYGSYRSFYEWLTARVWVDNIRNSDRP + WKRKGQIYLQTWHGSDGVKLIEKSVAGNLKKTYLRMAKYDGKITDGIVSSRHFQTLGM + QNNFWLAENVEFLEFGLPRNDDFFKSEKIKTTNIKFRTLFDIDLDELVVLYMPTFRDD + GSLNAYNLDYSKLIHVFQNKFRKNVKILVRFHPNVDSSFINLQDTDCINVSTYSNPQD + LMMSADVMITDYSSASIDFMLLNRPVFLYLPDYQSYVNDRPLDDNFDKLPFPRAYHNN + ELTEIIRDFERSKYDEKVRLYELEDVRFDRGKASVQCANWIEEKIKNNKVID" + misc_feature 14999..15544 + /gene="wciY" + /locus_tag="SPC18B_0016" + /note="HMMPfam hit to PF04464, + CDP-Glycerol:Poly(glycerophosphate) gl, score 2.3e-68" + gene 15616..16008 + /gene="gct" + /locus_tag="SPC18B_0017" + CDS 15616..16008 + /gene="gct" + /locus_tag="SPC18B_0017" + /note="member of homology group 28" + /codon_start=1 + /transl_table=11 + /product="CDP-glycerol-1-phosphate biosynthetic protein + Gct" + /protein_id="CAI33564.1" + /db_xref="GOA:Q9AH85" + /db_xref="HSSP:1COZ" + /db_xref="InterPro:IPR004820" + /db_xref="InterPro:IPR004821" + /db_xref="InterPro:IPR006409" + /db_xref="InterPro:IPR014729" + /db_xref="UniProtKB/TrEMBL:Q9AH85" + /translation="MKRVITYGTFDLLHYGHINLLKRAKQLGDYLIVVVSSDEFNLKE + KNKVCYFNYEHRKNLVEAIRYVDLVIPETSWEQKKSDVKDYHIDTFVMGDDWKGKFDY + LEEEGVEVVYLPRTKEISTTKIKEDLSE" + misc_feature 15628..15996 + 
/gene="gct" + /locus_tag="SPC18B_0017" + /note="HMMPfam hit to PF01467, Cytidylyltransferase, score + 4.8e-29" + gene 16105..16649 + /gene="HG94" + /locus_tag="SPC18B_0018" + /pseudo + CDS join(16105..16215,16277..16465,16476..16649) + /gene="HG94" + /locus_tag="SPC18B_0018" + /note="member of homology group 94" + /pseudo + /codon_start=1 + /transl_table=11 + /product="hypothetical protein (pseudogene)" + gene 16848..17717 + /gene="rmlA" + /locus_tag="SPC18B_0019" + CDS 16848..17717 + /gene="rmlA" + /locus_tag="SPC18B_0019" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI33566.1" + /db_xref="GOA:Q9AH84" + /db_xref="HSSP:1H5R" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q9AH84" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLPRFKELLQDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFIGDDSV + ALILGDNIYHGPGLSKMLQKAAKKEKGATVFGYHVKDPERFGVVEFDENMNAISIEEK + PEQPCSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLTLAQPLKKN + EYGQYLLRLIGEV" + misc_feature 16851..17567 + /gene="rmlA" + /locus_tag="SPC18B_0019" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 2.2e-120" + gene 17718..18311 + /gene="rmlC" + /locus_tag="SPC18B_0020" + CDS 17718..18311 + /gene="rmlC" + /locus_tag="SPC18B_0020" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI33567.1" + /db_xref="GOA:Q9AH83" + /db_xref="HSSP:1NXM" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:Q9AH83" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + 
ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSFGIEWENIAEAEVSEADKHHPLLKDVKPLKKEDL" + misc_feature 17754..18284 + /gene="rmlC" + /locus_tag="SPC18B_0020" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 1.2e-15" + gene 18324..19373 + /gene="rmlB" + /locus_tag="SPC18B_0021" + CDS 18324..19373 + /gene="rmlB" + /locus_tag="SPC18B_0021" + /EC_number="4.2.1.46" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI33568.1" + /db_xref="GOA:Q9AH82" + /db_xref="HSSP:1KEP" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q9AH82" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPDVHVTVLDKLTYAGN + RANIEEVLGNRVELVIGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQATD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 18339..19295 + /gene="rmlB" + /locus_tag="SPC18B_0021" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 5.4e-05" + misc_feature 18342..19178 + /gene="rmlB" + /locus_tag="SPC18B_0021" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.0028" + misc_feature 18342..19082 + /gene="rmlB" + /locus_tag="SPC18B_0021" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 3.5e-78" + misc_feature 18345..19157 + /gene="rmlB" + /locus_tag="SPC18B_0021" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 7.5e-06" + gene 19439..20290 + /gene="rmlD" + /locus_tag="SPC18B_0022" + CDS 19439..20290 + /gene="rmlD" + /locus_tag="SPC18B_0022" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose 
reductase RmlD" + /protein_id="CAI33569.1" + /db_xref="GOA:Q9AH81" + /db_xref="HSSP:1N2S" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q9AH81" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAKMDITNEEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 19439..20287 + /gene="rmlD" + /locus_tag="SPC18B_0022" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 4.3e-146" + misc_feature 19442..20083 + /gene="rmlD" + /locus_tag="SPC18B_0022" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.00011" + misc_feature 19442..20071 + /gene="rmlD" + /locus_tag="SPC18B_0022" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 2e-18" + misc_feature 19445..20173 + /gene="rmlD" + /locus_tag="SPC18B_0022" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 3.6e-08" + gene 20353..21454 + /gene="glf" + /locus_tag="SPC18B_0023" + CDS join(20353..20427,20427..20975,20951..21454) + /gene="glf" + /locus_tag="SPC18B_0023" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI33570.1" + /db_xref="GOA:Q4K161" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K161" + /translation="MYDYLVVGAGLFSAVFAHEVALKGKKVKVIEKRNHIVGNIYTRE + EEGIQVHQYGAHIFHTSDKESWDYVNQFAGFNRYTNSPVANYKGEIYNLPFNMNTFNK + LWGVVTPAEAQAKIEEQRAILNGKTPENLEEQAISLVGTDIYEKLIKDYTEKQWGKPT + TELPSFIIRRLPVHLTYDNNYFNDTYQGIPIGGYTQIVEKCWIMKILMMLDYENIDVE + TNVDFFVNKEQYLKDFPKIVFTGMIDEFFDYKLGELEYRSLRFENETLDMENYQGNAV + VNYTDAETPYTRIIEHKHFEFGSQAKTIITKEHSKTWEKGDEPYYPVNNDRNNHLYKS + 
YKKFADEQGNVIFGGRLGHYRYYDMHQVIGAALQCVRNELD" + misc_feature join(20787..20951,20975..21394) + /gene="glf" + /locus_tag="SPC18B_0023" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 6.9e-102" + gene 21772..>21819 + /gene="aliA" + /locus_tag="SPC18B_0024" + CDS 21772..>21819 + /gene="aliA" + /locus_tag="SPC18B_0024" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33571.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ89" + /translation="MMKSSKLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acactgcggc taaagaagta cttgaaaaac aggtcttggc tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcata taaaaacaag + 181 ggaggactgt ataaaagaca gaaatccttt gttttttata accaaggttt ataaactttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga aaatgaacat + 301 aaagaagcgt gtccttagtg caggtctgac ttttgcatct gctttgcttt tagctgcttg + 361 cgaccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaactat ctattagact attacgctga taatatagtc aattgaaaca agagaaagac + 481 aaaagagcct cgtaaaaggt attgcaactt ggtaatacct ttttgaggtg ctttttgata + 541 tgagcccatg ttttctcaat aggattgtac tcaggtgagt agggaggaag aggtaaaagt + 601 ttatgcccaa actcttcgca taaaagttct agcttcccca ttctatggaa tcttgcatta + 661 tccataataa taaccgatgg tgtggttaat gttggtaaga aaaacttctg aaaccaagct + 721 tcaaaaaagt cgctcgtcat cgtctcttcg taagtcattg gaacgattaa ctcaccattt + 781 gttagacctg caaccaaaga aatcctctga tatcttcttc cagatacttt gcctcttctt + 841 aactgacctt ttaatgagcg accatattct cgataaaaat aagtatcgaa tcctgtttca + 901 tcaatctaaa caggtgctag gtgctttaaa ctattaaaat tcttaagaaa taaggctact + 961 ttttctgggt cttgttcata attagattga aactagaata gtacacctct gcttctaaaa + 1021 cattgttaga aatcgatttg actgtcctga tcgatttgtc atgttcttat ttcattttac + 1081 tatatttttg tttcgcggga agtctactaa gatacttaaa gatgcagata gtaaaaaaag + 1141 atgtagacat taccgtaaaa aagtgatata atcgtatgat attgaatgta taggtgttaa + 1201 tcttgagtag acgttttaaa aaatcacgtt cacagaaagt gaagcgaagt gttaatatag + 1261 
ttttactgac tatttattta ttgttagttt gttttttatt gttcttaatc tttaagtaca + 1321 atatccttgt ttttagatat cttaatctag tggtaactgt gttagtccta ctagttgcct + 1381 tgatagggct actcttgatt atctataaaa aagctgaaaa gtttactatt tttctgttgg + 1441 tgttctctat ccttgtcagc tctgtgtcgc tctttgcagt acagcagttt gttggactga + 1501 ccaatcgttt aaatgcgact tctaattact cagaatattc aatcagtgtc gctgttttag + 1561 cagatagtga gatcgaaaat gttacgcaac tgacgagtgt gacagcaccg actgggactg + 1621 ataatgaaaa tattcaaaaa ctattagctg atatcaagtc aagtcagaat accgatttga + 1681 cggtcgacca gagttcgtct tacttggcag cttacaagag tttgattgca ggtgacacca + 1741 aggccattgt cttaaatagt gtctttgaaa atatcatcga gtcagagtat ccagactacg + 1801 catcgaagat aaaaaagatt tataccaagg gattcactaa aaaagtagaa gctcctaaga + 1861 cgtctaagaa tcagtctttc aatatctatg ttagtggaat tgacacctat ggtcctattg + 1921 gttcggtgtc gcgatcagat gtcaatatct tgatgactgt caatcgagat accaagaaaa + 1981 tcctcttgac cacaacgccg cgtgatgcct atgtaccaat cgcagatggt ggaaataata + 2041 aaaaagataa attgactcac gcgggcattt atggagttga ttcatccatt cacaccttag + 2101 aaaatctcta tggagtggat atcaattact atgtgcgatt gaacttcact tctttcttga + 2161 aaatgattga cttattggga ggggtagatg ttcataatga tcaagagttt tcagctctac + 2221 atgggaagtt ccatttccca gtagggaatg tccatctaga ctctgagcag gctctaggtt + 2281 ttgtacgtgg acgctactca ctagccgatg gagaccgtga ccgtggtcgc aaccaacaaa + 2341 aggtcattgt agcaattatt cagaagttaa cttctacaga ggttttgaaa aactatagta + 2401 gtattcttca aggattgcag gattctcttc aaacaaatat gccgattgag actatgatag + 2461 atttagtgaa tactcagttg gaaagtggag ggaattataa agtaaattct caagatttaa + 2521 aagggacagg tcggatggat cttccttctt atgcaatgcc agacagtaac ctctatgtga + 2581 tggaaataga tgatagtagt ttagctgtag ctaaagcagc tatacaggac gtgatggagg + 2641 gtagatgaaa tgatagatat ccattcgcat atcgtttttg atgtagatga cggtcccaag + 2701 tcaagagagg aaagcaaggc tctcttggca gaagcctaca ggcagggggt gcgaaccatt + 2761 gtctctacct ctcaccgtcg caagggcatg tttgaaactc cggaagagaa gatagcagaa + 2821 aactttcttc aggttcggga aattgcaaaa gaagtagcag atgatttagt cattgcttat + 2881 ggcgcagaga tatactatac 
tatggatgct ctagaaaagc tagaaaaaaa agaaattcct + 2941 acccttaatg atagtcgtta tgctttgatt gagtttagca tgcatacttc ctatcgtcag + 3001 attcatacgg gattgagcaa tattttgatg ttgggaatca cgccagtaat tgctcatatt + 3061 gaacgttatg atgctttaga gaataacgaa aaacgtgttc gtgaactgat tgatatgggg + 3121 tgctatactc agataaatag ttatcatgtt tcaaaaccta agttctttgg tgaaaaatat + 3181 aaattcatga aaaagagagc tcggtatttt ttggaacgtg atttagttca tgtcattgca + 3241 agtgacatgc acaatttaga cagtagacct ccatatatgc aacaggcata tgatatcatt + 3301 gctaagaaat atggagcgaa aaaagcgaaa gaactttttg tagataatcc cataaaaatt + 3361 ataatggatc aattaattta ggagaaaata tgcaagatca aaacactttg gaaatcgatg + 3421 tatttcaact attcagagct ttatggaaaa gaaagttggt tattttatta gtggcaatta + 3481 taacttcttc agttgctttt gcctacagta cttttgttat caaacctgag tttactagta + 3541 cgactcggat ttatgtagtt aaccgtaata aggaagagaa gtctggttta accaatcaag + 3601 acttgcaggc aggatcatac ttggttaaag actatcgtga aattatccta tcgcaggatg + 3661 ttttggagga agttgtttct gatttgaaac tagatttgac gccaaaaggt ttggctaata + 3721 aaattaaagt gacagtacca gttgataccc gtattgtctc tatttcagtt aatgatcgag + 3781 ttcctgaaga ggcaagccgt atcgctaact ctttgagaaa agtagctgct caaaaaatta + 3841 tcagtattac tcgtgtttct gatgtgacaa cactggagga ggcaagaccg gcgatatcgc + 3901 cgtcttcgcc aaatattaaa cgcaatacac taattggttt tttggcaggg gtgattggaa + 3961 ctagtgttat agttcttctt cttgaacttt tggacactcg tgtgaaacgt ccggaagata + 4021 tcgaaaatac attgcagatg acacttttgg gagttgtacc aaacttaggt aagttgaaat + 4081 aggagagaag gatgccgaca ttagaaatag cacaaaaaaa actggagttc attaagaagg + 4141 cagaagaata ttacaatgcc ttgtgtacaa atatacagtt gagcggagat aaactaaaag + 4201 taatttccgt tacttctgtt aaccctgggg aaggaaaaac aactacttcc ataaatatag + 4261 catggtcgtt tgcgcgtgca ggctataaaa ctcttttgat cgatggcgat actcgacaat + 4321 cagttatgtc aggagttttt aaatctcgtg aaaaaattac agggctaaca gaatttttat + 4381 ctgggacagc tgatttatct cacggtttat gtgatacaaa tattgaaaat ttatttgtag + 4441 ttcaatcggg atctgtatca ccaaacccta cagccttgtt acaaagtaaa aattttaatg + 4501 atatgattga aacattgcgt aaatattttg attatatcat 
tgttgataca ccacctattg + 4561 gaattgttat tgatgcggca attatcactc aaaagtgtga tgcgtccatc ttgataacag + 4621 caacaggtga ggtgaataaa cgtgatgtcc aaaaagcgaa acaacaatta gaacaaacag + 4681 ggaaactgtt cctgggagtt gttttaaata aattggatat ctcggttgat aagtatggag + 4741 cttacggttc ctatggaaat tatggtaaaa aataacttag aaaagatttt atggatgaaa + 4801 aaggattgaa aatttttctg gcagtattgc agagtattat tgtcatttta ttgatttatt + 4861 ttcttaactt tgttagagag acagaacttg aacgttcttc gatggttata ctataccttc + 4921 tccacttttt tgtattttat tttagttcct atggtaacaa tttttttaaa agagggtacc + 4981 tagttgagtt taatagtact ataagatata tttttttctt tgcaatagct ataagtgtat + 5041 taaacctttt tatagcggaa cggtttagta tctctagaag aggaatggta tacttcttaa + 5101 ctttagaagg aatatcctta tacttgttaa atttcttagt aaaaaaatat tggaagcatg + 5161 tgttttttaa tctaaaaaat agcaagaaaa ttttactgtt aacagtaacg aaaaatatgg + 5221 aaaaagttct tgataaattg ctagaatctg atgaaccttc atggaaattg gtagcagtaa + 5281 gtgttttgga taaatctgat tttcaacatg ataaaatacc tgtaattgaa aaggaaaaaa + 5341 ttattgaatt tgcaacgcat gaagttgtgg atgaggtgtt tgtcaatctt ccaggagaga + 5401 gctacgatat tggagaaatt atctctaggt ttgagacaat ggggatagat gtaactgtaa + 5461 atcttaaagc atttgataag aattttggtc gcaataaaca aattcatgag atggtaggac + 5521 tggatgtagt cactttctct acaaattttt ataaaactag tcatgtgatt tcaaagagaa + 5581 ttctcgatat ttgtggtgcc actattggcc ttattctttt tgctatagct agtctagttt + 5641 tagttccatt gattcgtaaa gatggcggac cagctatttt tgctcaaact cgtataggga + 5701 aaaatggtcg acatttcaca ttttataaat tccgttcgat gcggatcgat gctgaagcta + 5761 tcaaagaaca gttgatggat caaaatacga tgcaaggtgg tatgtttaag atagacaatg + 5821 atcctcgtgt tacaaaaatt ggtcgcttta ttcgtaaaac cagtttggat gaattgccgc + 5881 agttttggaa tgtatttata ggagatatga gtttggtagg aacacgtcca cctacagtag + 5941 acgagtatga tcagtatact ccagaacaga aacgtcgact cagctttaaa cctgggatta + 6001 caggcttatg gcagattagt ggccgaagta aaataaccga ttttgacgct gttgtaaaat + 6061 tagatgtggc ttatattgat aattggacaa tctggaaaga tattgaaatt ttgcttaaaa + 6121 ctgttaaagt tgtatttatg agagatggag cgaagtaatt tctgtatatc catcatatta + 6181 
ggagagaaat gaaaaagtca gtttatatca ttggttcaaa aggaattcct gctaagtatg + 6241 gaggatttga aacttttgtt gaaaaattaa cagccttcca acaagataag gctatccaat + 6301 attatgtagc ttgtatgcgt gaaaactctg caaaatcagg gactactgag gatgtttttg + 6361 aacataatgg tgctatctgt tataacgtcg atgttcctaa tattggtcca gcgcgagcta + 6421 tagcgtatga tatcgctgca attaacagag ctattgaaat tgccaaagaa aataaggatg + 6481 aagctccaat cttctatatt ttagcttgtc gaatcggtcc gttcatccat ggaattaaga + 6541 aaaaaatcca ggcgataggt gggactcttc tagttaatcc agatggtcac gagtggttac + 6601 gagctaagtg gagcgctcca gttcgtcgtt attggaaaat ttccgaaggt cttatggtca + 6661 aacatgcaga tcttttagtg tgtgatagta agaatattga aaaatatatc caagaagatt + 6721 atatacagta tcaacctaag acaacctata tcgcttatgg gacagataca acacgctcca + 6781 cattaaatag cagtgatgaa aaagtgcgtg cttggttcaa ggagaaaaat gtttctgaaa + 6841 acgagtatta cctagttgta ggacgttttg ttccagaaaa taattatgag tctatgatac + 6901 gtggtttctt ggcgtctagc tctaagaagg attttgtcct aatcacaaat gtagaacaga + 6961 ataaatttta taatcagcta ttagcaagta ctggatttga taaagatcca cgagtgaaat + 7021 ttgttggaac agtctacgac caagaacttc tgaagtatat tcgagaaaat gcttttgctt + 7081 acttccacgg acatgaagtt ggtggaacaa atccttcgtt acttgaagca ttagcatcca + 7141 caaagttaaa cttactactc gatgttggtt ttaaccgcga agttggggag caaagtgcga + 7201 tctattggaa aaaagatgag ctttcccaag taatcgagaa agttgaacaa tttgatgcaa + 7261 aaatgattga tgagttagat agacaatcaa atcagagaat tggggattat ttcacttggg + 7321 aaaagattgt cacagactac gagaaattat ttaaaaaatg aaaatattac attatacttt + 7381 aggatttcaa ccccagcgaa caggtggttt ggttaaatat gctgaggatt taatgataga + 7441 gcaaattgct caaggttatc aagtagctgc cttatatcca ggaagaatta agttcttttc + 7501 aaaagaaata gaaataatta aagcgacgtc aagacagttt gagtgttatg aactgcttaa + 7561 tagcttacct atggctttat ttggaggtat atccgatcca actgctttcc tgacaccttg + 7621 tgacaaaaat gtttatcgta cttttttaga aaaagtacaa cccgacatta tacatattca + 7681 ctcgtttatg ggattgcata aagaattcct cgaaattgct aaaaacttga atattagagt + 7741 ggtttttacg agccatgatt attatggatt agcacccgta cctcatttct attttaatgg + 7801 ggtggattat agtgataaaa 
atacaaattt aacatggaat attatgtctt ccaatgcttt + 7861 aagtgtgaaa aaactaagac tttttcaggt ttcattttat ccgactattc gtaaactttt + 7921 gaaactatta gggaaaaatc caaaatctaa aaagaattta gttattcgag atgttattga + 7981 ggagcaagat tatagtgatc ttcgatacta ttataatgag atgtttcact taatagatgg + 8041 ttatttgttt aatagtagac ttgcaaagaa ggtatatgag ataaatgaga ttaagtcagc + 8101 taatagtata gtattatcta taacaaatag ttcaattaat catcatcaga gattgacaac + 8161 tgcaaataat aaaattagag ttgcttatat tggtccagat gaagaatata aaggatattt + 8221 tgattttatt gactttgttg aaactttaga tcgagagtcc tatgaagtgg caacttatgg + 8281 ccatttacca aatgaagagt gcccttcatt cattgaacaa aaaggatatt ttactaagga + 8341 aatgattgac agtgtctatg aaaatattga tattcttatt gttccaagta agtggaagga + 8401 aacatttgga ttgataacag tagaagcatt atcctatggg gtaaatgttt tcgtgagtga + 8461 aaatgttgga tcaaaagact tgtttccaga aacacatgtt tttaaagaca aggaagattt + 8521 gttggctaaa atcatcaata atcagttgaa gaaaattccg cttaaaacga tagaagaaca + 8581 tgtagaagaa gttattggtt attacaaaca ggttagaagt aacaattaag gagaatgatt + 8641 aaagatatgt cctgtccaga aattagcgta attgtaccag tttataatgt ggaacgatat + 8701 ttaaggcagt gtatggattc attgataaat caaacttata gggattttga aataatttta + 8761 gtaaacgatg gatcaacgga ttcttctggg gttctctgtg aggattgggc aaaaaaagat + 8821 gaaagaattc atgtagttca caaaaaaaat gaggggcttg gcttcgctcg taatacaggg + 8881 gttgaacacg caaaggggaa atacataacc tttgtagatt cagatgacta tgtttctcta + 8941 gatatgctgc aaactctata taatgctgtt caagaatatg atgtcgaagt tgtatacagt + 9001 gcgggatatt atcgttcctt tagtaatggg gaaataaaga agacagatgt agaaacaaaa + 9061 aaacctcaac ttttcgaagg aggagatgtt gcctctaaat tactccctga tgtaatttct + 9121 gctcctcctg agtatccgaa tgatgggaaa gttggagtgt cggcatggaa ggttctctac + 9181 gaagctaatt tgtttaagga aaaaggctta ttatttcatt cagaaagaga attcatttca + 9241 gaagatgcta tttttcaaat tgattgttta aaattagcaa catctgccct tgttatccca + 9301 gatattttat actactatcg tgaaaacttt ggttctttaa gtatgaaata taaagaagaa + 9361 cggtttgagt tggataaaat cttgtataac gagcaattaa aaagagttga ggggttacct + 9421 aatcaagaaa ttttggaaga aagaatagag agaattttaa 
ttgctaatat tcgtttatgt + 9481 atctttcagg aatccttata taaaagttct agaattcata aacgtttgca aagaattaga + 9541 cagatttgta aggacccaat atcaaaatca gtattacgtc attatccaat ccatcgttta + 9601 ccttttacta aacgtttgat ctgtgtatta gctaagtata atatgtcgtt gttgctttta + 9661 gttttaacct cattaaaata tcggaatcgg agtgtgtaac ttttatgggg atgaatatag + 9721 aaaaattaaa actatctttt aaaaatggaa cgttttttcc tgttgttatt cacgccttac + 9781 gtaaccgttg gcccttgtgg tggattcgga gtaaggctat tcgagaagtg caacttgaag + 9841 atagggccta cagaatacta aaaaagaaat acggttcttt aatttcaaac tcttttgata + 9901 aatcatactt atcagaagaa gttcccaagc aaatctggat ttgctggttt caaggtatgg + 9961 agaatgctcc agagttggtg aaatcatgtt atagatcact aaaaaaacaa tttcctgaat + 10021 atgtcattac ggttatttct tcagaaaata tttccgaata tgtagaaata tctgatatta + 10081 tttataaaaa atggggaaat ggtgtaatag gaaatgctca tttttctgat atccttcggg + 10141 tagagctgtt acgtaagttt gggggaatat ggattgactc aacagtgtat tgtacaggaa + 10201 ttactaccat agagacaatt gaaaaaaata cattttttat gtataaaagt ttatattcag + 10261 ttgaggagag aatttcctct tccaactgga tgattgcttc tgttcccaat catccattta + 10321 tggttacgat gagcacactc ttgcaatctt attggtcaaa agaagttata gcaattcatt + 10381 attatctatt tcatattctt tttacgatta tgattgaatc actttctgag ttgtggcagc + 10441 ttgtacccac ctatacgaac gcaacaccac atataatggt tgatgaatta aataatgttt + 10501 tttcaaagga acgttatcag caattgtgtc aaatttcaga ttttcataaa ttaaattata + 10561 aaaaaaatta caatgataaa tcagagagtt tgtacagtca cttactgaat cagtagaggg + 10621 gagaatcttg cctaatttaa agaaaaacat tgtttacaat gtcttatatc agatcttagc + 10681 tgtaatagta ccgtttatta cctcacctta cttagcgcgt gtgttaggtg cagagcaaat + 10741 tggagtttat tcttttactt attccattgc tttttacttt atgattctgt ccatgttggg + 10801 aatttctaat tatgggaatc ggacaatagc acaggtacga acaagtagag aacatttgaa + 10861 tcaagaattt tcgaatattt acgcagttca gttgacgtgt tcactagtaa tgaccgtctc + 10921 atatttgatt tatgcaacag tatttgtgaa tagttttcag attgtagcct atatccaagt + 10981 attacatgtt ttatcgtatg caacagatgt tagttggttt ttttatggtc ttgaagagtt + 11041 tcgtattacg gttgctagga attcatttgt taagttatta actttaatat 
ctatctttac + 11101 atttgtaaaa agccctaatg atatctattt atataccttt ataatggcag ggagtaccct + 11161 gcttggtcag ttgattacat ggcaattttt gctaaaacaa gtaaactttg tgcgccctaa + 11221 tcttggaaaa ataaagaaac acatgaaacc tattattatt ttatttttcc ccgtcttagc + 11281 ggttagtatt ttttcgtttc tagataaaat aatgcttggg atgtatagta gtttgaagga + 11341 aactgctttt tatgagaatt cagataagat aattagtatt ccaaaagctc tgattcaagc + 11401 ctttggagct gtaatgttgc ctcgaacagt acatttactg agtataggtg atgaacaaaa + 11461 aagtttagaa tatgttgata aaacgatgtg ggttgtttta gtgattacaa tgggctgtgc + 11521 tttcggttta gcaggagttt ctgcaacctt tgctcctgtt tattggggtg aagaatttag + 11581 ggccagtagc caaattattg caggaatgac accggcttta gtattttcgg cttttggaaa + 11641 tgtcatccga acccagtttt taattccacg aagttttgac aaggaatata cggtatcttt + 11701 gctttatgga gccgtagtta atatcttgat taatattctt ttgattccga agatgggagc + 11761 aatgggagct gttatcggaa taattgttgc agagttagtt ctatgttgct atcaaacatg + 11821 gattgctaga aattatttac atatcagaga atatctgata aatgctggga tattatttct + 11881 tattggttca gtaatgtata tggttttaat tcttatttca agtattttac ctacatcgtt + 11941 acttacactt attattgaaa ttatagtcgg agctttcatt tatattagtt tactggttct + 12001 gtatatcttt tcttcaaaaa acagggtaat tattggttta cgaacaaatt ttttagaaca + 12061 tactcattta tttaaaagga aataatagtg aaatttaaat ttaatccaat cgcgatactg + 12121 tatatattgc tagtatactt agagttggct acagataggc aacatctgta tcctgtaacg + 12181 tacatgacaa aatattatat tggtatttta atcattgtgt tgtttgtttt attattagta + 12241 ggccgtggga agcttatttt tgttaataaa aaattattat atcttgctaa gatattagct + 12301 ataccaacaa ttgttctttt cctgtactca gtcttactag acgtaatgaa cccagttgaa + 12361 tttaatggat attttagtag attatcaagt acgactattt ttggtttgtt agctatcttt + 12421 caagctatag ttgtttttca attttttgga caaaaagtag tagattacac ttttacagct + 12481 atctccctca gctacttaac cagtatcatt gttgccttta ggcagggagg acttagtcaa + 12541 tttatcttga tactaacaga tgatagtttc aatggttcgg tactagaaat gcatgaagtt + 12601 gcacctatta cagctctctt tattctgtac tatttgtaca aatattttat aaaagaaaat + 12661 agtttttctt cagtatttta taatatctta atagctctca ttattctttt 
tttaagcctt + 12721 aaacgaatcg ttcttttgag tgtattaatt atcataccag tatttttggt aatttattgg + 12781 tatgataaaa aagtaagtaa actagggaaa gaacgaaaaa ttttaagttt attaaatatc + 12841 ttttccttaa tatttataac aggaatattc ctttatgttt atagtgtaaa atctgatttt + 12901 atatatacat ttattcaaga acataatatt aattcgatgg ctagaacaga tttatggaag + 12961 ggagttgaat caacctataa tttcgcccct atatttatgg ggagagggat agggtttgta + 13021 acaaaatgga tggataataa ttggatgact ttgaatatca atggtcttac agggacaatg + 13081 gggatccata atgatatttt gaagtactac attgagatag gatttgtagg attatttatt + 13141 tatttttaca ctcttcttta tagaaatgct aaacgtatat ttgtaaaaat tggtcataaa + 13201 gaatcattca tatattttgt attgataatg tttcagatgc tgatatggtt tacagataat + 13261 atttcaattt accataattt tttatggatc ctaaatctac tactcttttc tttaactaat + 13321 tcggatacag aattggaaaa tttagatttt aaaaattttt aatgtgtaag tagtaactac + 13381 taattttatt aaaaaatcag aatataggtg tatttatgaa gacagatgct aggactaaaa + 13441 agagagagaa tgaaacgtta tatattctaa aagtttgggc aacatttagt gtgattgcta + 13501 tacattttgg ttttttgggc caaattggag tgttttacaa agtattagct cgatttgctg + 13561 tacctttatt tttcatgatt tcatgatttt attcgtttag tatttcagaa gaaaaactga + 13621 agaaaagaat taaaaatctg agtttattga taatttccag tacaagtttt tattttttac + 13681 tggatgtttt tcttcaatta acacaaggaa atctaagagt tgtatttgaa agatttactt + 13741 ttaataatat ttttaatttt ttggtattca atcaaatttc tgctctaatt ggctcgttag + 13801 caacaccact atggttctta tatgcattac tgtatgttta tatttatcta tttttttcaa + 13861 ataaaaaatg gatatttaat actattttga ctgtgatcat actctgttgt tcatttataa + 13921 tcgagttaaa agcaaatagt gctttatttt atagaaactt cttatttatg ggagttccct + 13981 tcttttcttt tgggatgtat tttgctcaaa ttcagagaaa aattataaat tataagcact + 14041 tcaaagaact ttttataatt ggaattatga tttcaggatt tctaactctg attgaatata + 14101 cctttttagg agcaaatttt gaactttatg taagttcggt gataatatct tgtatgctta + 14161 tggtcttttc gattaaatat cctcaactct ggacgttaga ttttgctgtc aatattgcta + 14221 aaaaaaatgc gacgtttatt tatattagtc atcaatttgt gattttatta tttaaaacat + 14281 acgttagaga tggaattgct tataaaattg gaactttctt gatattttta 
gcatgtgtta + 14341 ttatgagtat tattttcaac tatatagtcg atataatcag tcgttgttgc ataaaagaaa + 14401 aacaagatat aatatgaaat tttatataaa aaatttatta aaaaaagtct ttacattacc + 14461 gttgcattta ttgcctattc agtctaataa gataatattt gataattttg gtggtagagg + 14521 ttttggggac aatcctaagt atatacttga agaacttgtc tctcgagaaa agaatctaga + 14581 tcttgtgtgg gtaacaaaag atagagaaat ttctatccct gaaggcgttc gagtagtaaa + 14641 atacggcagt taccgttctt tttatgaatg gttaacagct agagtttggg tagataatat + 14701 tcgtaattct gatcgacctt ggaagcgaaa aggacagatt tatcttcaaa cttggcatgg + 14761 ttcagatggg gtaaagttaa ttgaaaaaag tgttgcaggg aacctaaaaa aaacatatct + 14821 tagaatggcg aagtatgatg gaaagattac agacggtatc gtatcaagtc ggcattttca + 14881 aactttgggt atgcaaaata atttttggct ggcagagaat gtggaatttc tggaatttgg + 14941 attacctcga aatgatgatt tttttaaaag tgaaaaaatc aaaaccacaa atataaaatt + 15001 tagaacatta tttgatatcg atttagacga actggtagtt ttgtatatgc cgacgttcag + 15061 agatgatgga tcgttgaatg cctataattt agattactcg aaactaatac atgtttttca + 15121 aaataaattt agaaaaaatg taaaaatatt agttcgtttt catccaaatg ttgattctag + 15181 ttttataaat ttacaggata cagactgtat aaatgtgtcg acctattcaa atcctcagga + 15241 tctgatgatg agtgcagatg tgatgattac ggattattca tcggcttcta ttgattttat + 15301 gttattaaat cgtccagtat ttctgtattt accagattat caaagttatg tgaatgatag + 15361 accattggat gataactttg ataaattgcc atttccaaga gcatatcata acaatgagtt + 15421 gacagaaatt attagagact ttgaaagaag taaatatgat gaaaaagttc gtctgtatga + 15481 attagaggat gttcgttttg atagaggaaa agcatcagta cagtgtgcta attggattga + 15541 agaaaaaata aaaaacaata aagttattga ttgaaataat tatatttatt gaattataaa + 15601 taaggaggtc tttagatgaa aagagttata acatatggta catttgattt attgcattat + 15661 ggtcatatca atcttttgaa acgtgctaaa cagctaggtg attatttgat tgtagttgtt + 15721 tcaagtgatg agtttaattt aaaagaaaag aataaagtat gttactttaa ctacgaacac + 15781 agaaaaaatt tagtagaagc tattcgatat gtcgatttag taatccctga aactagttgg + 15841 gaacagaaaa agtcagatgt taaagactac catattgaca cttttgtaat gggtgatgat + 15901 tggaaaggta aatttgatta tcttgaagaa gaaggtgttg aagtagtcta 
tttgcctaga + 15961 acaaaggaaa tatcaaccac aaagataaaa gaagatttat cggaatgaaa tattattaaa + 16021 aatgctgaca taagaaattg tggcttttgt gtctagtttt tgatagaata aagtaacaac + 16081 actttaacca atgaggtgtg aataatggca gtaattttta aagatgtact tgttgaagag + 16141 aaaactgatg aagaaaaaca acatatttta tctattttaa atgatgagaa tgttagagct + 16201 tttgattgtg gatattaaga attgaatgat gttttttgat atttagaaca aatacgatga + 16261 agaaacaggc catgtattgc ctattgtaaa tcaaaatttt gaattattag gttttatttc + 16321 ttgtagacta gtatcatttt ctttcatagc tcaggttaaa gagatgggaa ttagcataga + 16381 ttatcttggt attcataagg attgccagaa aatgggggat cggttcgctt ttggtgctct + 16441 ttgcgcttcg attatcttta actattgact gttgattacc aataaaaggt gtaatagttc + 16501 atgctctaga ggatgttgta gaattctatg acaaactggg ttttattgac cctagagata + 16561 tagttattta taatggcaaa ccggttacta tatattttag tattgaaaaa ctaagaaatg + 16621 gtgaaaatta ttcctctcac acagttattt gaaacatcct tagaaaatga tttttaattg + 16681 tatgcaaaca aagtagaatt cgcttatttc atcttatgct aaatgtaata tgaaacaagt + 16741 gaatttttat agataaagaa gaattttaaa aaatgtgatg attattttta gagcagtaca + 16801 gaattaatag taattgactc taaatcaata aagaaaggta ccctattatg aaaggtatta + 16861 ttctagcagg tggttcgggg acacgtttat atcctttgac tcgagctgca tcaaaacaac + 16921 tgatgccggt ttatgataaa ccgatgattt actatccact ttcaacattg atgttggctg + 16981 ggattaggga tattttgata atctcaactc ctcaagattt gcctcgtttt aaagagcttc + 17041 ttcaagacgg atctgagttt gggattaaac tttcttatgc agagcaacca agtccagatg + 17101 gtttggcaca agcctttatc attggggaag agtttattgg tgatgatagt gttgctttga + 17161 tcttggggga caatatctat cacggccctg gtttgagcaa aatgcttcaa aaagcagcca + 17221 agaaagagaa aggtgcgact gtctttggct accatgtcaa ggatccagaa cgctttggtg + 17281 ttgtagaatt tgatgaaaat atgaatgcta tctccatcga agaaaaacca gaacagccgt + 17341 gctctaacta tgcagtgaca ggactgtatt tctatgataa cgatgttgtc gagattgcca + 17401 aaagtattaa accaagtcct cgtggtgaat tggaaattac agatgtaaac aaagcttacc + 17461 tagatcgtgg tgatttgtct gttgagctta tgggacgcgg ctttgcttgg ttggatactg + 17521 gaacacatga aagtttactg gaggcttcac agtacatcga aacagtgcaa 
cggatgcaaa + 17581 atgttcaggt agcaaacttg gaagaaattg cctatcgcat gggttatatc agtcgtgaag + 17641 atgtattgac cttagcccaa ccacttaaga aaaatgaata cggacagtat ctgctccgtt + 17701 tgattggaga agtctagatg acagataatt ttttcggtaa gacgcttgcg gcacgcaagg + 17761 ttgaagctat tccaggcatg ttggagtttg atatccccgt tcatggagat aatcgtggct + 17821 ggtttaaaga aaatttccaa aaggaaaaaa tgcttccact tggatttcca gagtctttct + 17881 ttgcagaagg aaaattgcaa aacaatgtat ccttctcacg taaaaatgtc cttcgaggcc + 17941 tccacgcaga gccttgggat aagtacatct ctgtagcaga tggagggaaa gttctgggtt + 18001 cttgggttga tctacgcgag ggtgaaacct ttgggaatac ctatcagaca gtaattgatg + 18061 caagcaaggg aatctttgtt cctcgtggcg tagctaatgg cttccaagtt ttatcagata + 18121 cagtgtcata tagctatctg gtcaatgatt actgggcgct tgaactcaaa cccaagtatg + 18181 cctttgtgaa ctacgctgat ccaagctttg gtattgaatg ggaaaatatt gcagaagcag + 18241 aggtttcaga agcagataaa catcatcccc tacttaagga cgtgaagcct ttgaaaaaag + 18301 aagatttgta aaaaggaaag aatatgactg aatacaaaaa tattatcgtg acaggtggag + 18361 ctggctttat cggttctaac tttgtccatt atgtttacga gaactttcca gatgttcatg + 18421 tgacagtcct agataagttg acttatgctg gaaaccgcgc gaatattgag gaagttttag + 18481 gtaatcgtgt tgagttagtt attggtgaca ttgctgatgc ggagttggta gacaagttgg + 18541 ctgctcaagc agatgctatc gttcattatg cagcggaaag ccacaatgat aattcgctca + 18601 atgatccatc gccatttatt catactaact tcatcggaac ctatactctt ttagaagctg + 18661 ctcgtaagta tgatattcgc ttccaccatg tatcgacaga tgaagtttat ggggatctcc + 18721 ctttacgcga agatttgcca ggtcatggtg aaggaccagg tgagaaattt actgctgaaa + 18781 caaaatacaa cccaagctct ccgtactcat caaccaaggc agcctcagat ttgattgtca + 18841 aagcctgggt gcgttctttt ggagtcaagg caacgatttc caactgttca aataactacg + 18901 gtccttatca acatatcgaa aaattcatcc cacgtcagat tactaacatc ctaagtggaa + 18961 ttaagccaaa actttacggt gaaggtaaga atgttcgtga ctggatccat accaatgacc + 19021 attcttcagg agtttggaca atcttgacaa aagggcaaat cggtgaaacc tacttgattg + 19081 gggctgatgg tgagaagaac aataaggaag ttttggaact tatccttaag gaaatgggac + 19141 aagctacgga tgcctatgat catgtgactg accgtgcagg acatgacctt 
cgctatgcga + 19201 ttgatgccag caagctccgt gatgagttgg ggtggaaacc tgaatttacc aactttgaag + 19261 ctgggctcaa ggcaacaatc aagtggtata cagataacca agaatggtgg aaagcagaaa + 19321 aagaagctgt tgaagccaat tatgctaaga ctcaggagat tattacagta taaaaagcag + 19381 gaaatagctg ctttttattg ctatattggg aagagttaca tattagaaag gtctagagat + 19441 gattttaatt acaggggcaa atggccaatt aggaacggaa cttcgctatt tattggatga + 19501 acgtaatgaa gaatacgtgg cagtagatgt ggctaagatg gacattacca atgaagaaat + 19561 ggttgagaaa gtttttgaag aggtgaaacc gactttagtc taccattgtg cagcctacac + 19621 cgctgttgat gcagcagagg atgaaggaaa agagttggac ttcgccatca atgtgacggg + 19681 gacaaaaaat gtcgcaaaag catctgaaaa gcatggtgca actctagttt atatttctac + 19741 ggactatgtc tttgacggta agaaaccagt tggacaagag tgggaagttg atgaccgacc + 19801 agatccacag acagaatatg gacgcactaa gcgtatgggg gaagagttag ttgagaagca + 19861 tgtgtctaat ttctatatta tccgtactgc ctgggtattt ggaaattatg gcaaaaactt + 19921 cgtttttacc atgcaaaatc ttgcgaaaac tcataagact ttaacagttg taaatgacca + 19981 gtacggtcgt ccgacttgga ctcgtacctt ggctgagttc atgacctacc tagctgaaaa + 20041 tcgtaaggaa tttggttatt atcatttgtc aaatgatgcg acagaagaca caacatggta + 20101 tgattttgca gttgaaattt tgaaagatac agatgtcgaa gtcaagccag tagattccag + 20161 tcaatttcca gccaaagcta aacgtccgct aaactcaacg atgagcctgg ccaaagccaa + 20221 agctactgga tttgttattc caacttggca agatgcattg caagaatttt acaaacaaga + 20281 agtgagataa gtagtagaat gattttctag tctaataaaa gaggcagata atgaactcaa + 20341 aaggagctta aggtgtacga ttatcttgtt gttggtgctg gtctctttag tgcagtcttt + 20401 gcccatgaag tagccttaaa aggaaaaaag taaaagtcat tgaaaaacgg aatcatatcg + 20461 tgggtaatat ctatactcgt gaagaggaag gaattcaagt tcatcaatat ggtgctcata + 20521 tcttccatac ttctgataag gagagctggg attatgtaaa tcagtttgca gggtttaacc + 20581 gttacaccaa ttctcctgtt gcaaactata agggtgagat ttataacctt ccttttaata + 20641 tgaatacttt caataaactc tggggagttg taacgccagc agaagcacaa gctaagattg + 20701 aggaacaacg tgctatttta aatggtaaaa ctcctgaaaa tttggaagaa caggcgattt + 20761 ctcttgtagg tacagacatc tacgaaaaat taatcaaaga ctatacagag 
aaacagtggg + 20821 gcaaaccaac tactgaactt ccatccttta ttattcgccg tttaccagta cacctgacct + 20881 atgataacaa ctattttaac gatacctatc aagggattcc aattggtgga tacactcaaa + 20941 tagttgaaaa atgttggatt atgaaaatat tgatgtagaa acaaatgttg atttctttgt + 21001 gaacaaagag caatatctga aagattttcc taagattgtc tttactggta tgattgatga + 21061 attctttgac tataagttgg gcgaactaga gtaccgtagt cttcgttttg aaaatgagac + 21121 cttggatatg gaaaattacc aaggaaatgc agttgtgaac tatacggatg cagaaacccc + 21181 atatactcgc attattgaac acaaacattt tgagtttggg agtcaagcaa agactatcat + 21241 tactaaagaa cattctaaaa catgggaaaa aggtgatgag ccttattatc cagttaataa + 21301 tgatcgtaat aatcatttgt ataaatcgta taaaaaattt gctgatgagc aagggaatgt + 21361 tatctttggt ggccgcttag gacactatcg ttattacgat atgcaccaag taattggagc + 21421 agctttgcag tgcgtgagaa atgagttaga ttaatactca atgaaaatca aagagcaaac + 21481 taggaagcta gccacaggtt gctcaaaata ctgttttgag gttgcagatg gaagctgacg + 21541 cggtttgaag agattttcga agagtataaa caagtaaaac tgactaccag ttattattta + 21601 gaaatagtat taaaaattcc ttgactatgt gatatagttg agggattttt aaatgatatt + 21661 catatttttt gcaaagatgt tgtttgaaaa ataattttca aaaattctga aaattctgtt + 21721 gacatctttc tgaaaagagt ttataatgga gagaaagttt taaaggagaa aatgatgaaa + 21781 agttcaaaac tacttgccct tgcgggcgtg acattattg +// + diff --git a/public/res/serotype_genbank/serotype_18C.gb b/public/res/serotype_genbank/serotype_18C.gb new file mode 100644 index 0000000..6e1f5c7 --- /dev/null +++ b/public/res/serotype_genbank/serotype_18C.gb @@ -0,0 +1,997 @@ +LOCUS CR931673 21819 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 4593/40 (serotype 18c). +ACCESSION CR931673 +VERSION CR931673.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. 
+REFERENCE 1 (bases 1 to 21819) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 21819) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..21819 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="4593/40" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC18C_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC18C_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI33572.1" + /db_xref="GOA:Q4K1T1" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K1T1" + /translation="SNEEQDLTVEGKVKSVLIENTAAKEVLEKQVLAPWDAFCVELL" + gene 293..466 + /gene="aliB" + /locus_tag="SPC18C_0002" + /pseudo + CDS 293..466 + /gene="aliB" + /locus_tag="SPC18C_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + /db_xref="PSEUDO:CAI33573.1" + gene complement(459..980) + /gene="tnp" + /locus_tag="SPC18C_0003" + /pseudo + CDS complement(459..980) + /gene="tnp" + /locus_tag="SPC18C_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 
transposase (fragment)" + gene 1203..2648 + /gene="wzg" + /locus_tag="SPC18C_0004" + CDS 1203..2648 + /gene="wzg" + /locus_tag="SPC18C_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33575.1" + /db_xref="GOA:Q9AH98" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q9AH98" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILVF + RYLNLVVTVLVLLVALIGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VDQSSSYLAAYKSLIAGDTKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPIGSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNKKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRGRYSLADGDRDRGRNQQKVIVAIIQKLTST + EVLKNYSSILQGLQDSLQTNMPIETMIDLVNTQLESGGNYKVNSQDLKGTGRMDLPSY + AMPDSNLYVMEIDDSSLAVAKAAIQDVMEGR" + misc_feature 1203..1319 + /gene="wzg" + /locus_tag="SPC18C_0004" + /note="Signal peptide predicted for SPC0914 by SignalP 2.0 + HMM (Signal peptide probability 0.996) with cleavage site + probability 0.577 between residues 39 and 40" + misc_feature 1407..1754 + /gene="wzg" + /locus_tag="SPC18C_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 2.1e-64" + misc_feature 1932..2375 + /gene="wzg" + /locus_tag="SPC18C_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 8.8e-69" + gene 2650..3381 + /gene="wzh" + /locus_tag="SPC18C_0005" + CDS 2650..3381 + /gene="wzh" + /locus_tag="SPC18C_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33576.1" + /db_xref="GOA:Q4K157" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K157" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAEAYRQGVRTIVSTSHRR + 
KGMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTMDALEKLEKKEIPTLNDS + RYALIEFSMHTSYRQIHTGLSNILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QINSYHVSKPKFFGEKYKFMKKRARYFLERDLVHVIASDMHNLDSRPPYMQQAYDIIA + KKYGAKKAKELFVDNPIKIIMDQLI" + misc_feature 2653..3261 + /gene="wzh" + /locus_tag="SPC18C_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 1.1e-38" + gene 3390..4082 + /gene="wzd" + /locus_tag="SPC18C_0006" + CDS 3390..4082 + /gene="wzd" + /locus_tag="SPC18C_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33577.1" + /db_xref="GOA:Q9AH96" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q9AH96" + /translation="MQDQNALEIDVFQLFRALWKRKLVILLVAIITSSVAFAYSTFVI + KPEFTSTTRIYVVNRNKEEKSGLTNQDLQAGSYLVKDYREIILSQDVLEEVVSDLKLD + LTPKGLANKIKVTVPVDTRIVSISVNDRVPEEASRIANSLRKVAAQKIISITRVSDVT + TLEEARPAISPSSPNIKRNTLIGFLAGVIGTSVIVLLLELLDTRVKRPEDIENTLQMT + LLGVVPNLGKLK" + misc_feature 3408..3824 + /gene="wzd" + /locus_tag="SPC18C_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 4.5e-53" + misc_feature 3930..4007 + /gene="wzd" + /locus_tag="SPC18C_0006" + /note="PS00217 Sugar transport proteins signature 2." 
+ gene 4092..4775 + /gene="wze" + /locus_tag="SPC18C_0007" + CDS 4092..4775 + /gene="wze" + /locus_tag="SPC18C_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33578.1" + /db_xref="GOA:Q9AH95" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q9AH95" + /translation="MPTLEIAQKKLEFIKKAEEYYNALCTNIQLSGDKLKVISVTSVN + PGEGKTTTSINIAWSFARAGYKTLLIDGDTRQSVMSGVFKSREKITGLTEFLSGTADL + SHGLCDTNIENLFVVQSGSVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTPPIGIVI + DAAIITQKCDASILITATGEVNKRDVQKAKQQLEQTGKLFLGVVLNKLDISVDKYGAY + GSYGNYGKK" + gene 4791..6158 + /gene="wchA" + /locus_tag="SPC18C_0008" + CDS 4791..6158 + /gene="wchA" + /locus_tag="SPC18C_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI33579.1" + /db_xref="GOA:Q9AH94" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q9AH94" + /translation="MDEKGLKIFLAVLQSIIVILLIYFLNFVRETELERSSMVILYLL + HFFVFYFSSYGNNFFKRGYLVEFNSTIRYIFFFAIAISVLNLFIAERFSISRRGMVYF + LTLEGISLYLLNFLVKKYWKHVFFNLKNSKKILLLTVTKNMEKVLDKLLESDEPSWKL + VAVSVLDKSDFQHDKIPVIEKEKIIEFATHEVVDEVFVNLPGESYDIGEIISRFETMG + IDVTVNLKAFDKNFGRNKQIHEMVGLDVVTFSTNFYKTSHVISKRILDICGATIGLIL + FAIASLVLVPLIRKDGGPAIFAQTRIGKNGRHFTFYKFRSMRIDAEAIKEQLMDQNTM + QGGMFKIDNDPRVTKIGRFIRKTSLDELPQFWNVFIGDMSLVGTRPPTVDEYDQYTPE + QKRRLSFKPGITGLWQISGRSKITDFDAVVKLDVAYIDNWTIWKDIEILLKTVKVVFM + RDGAK" + misc_feature 5574..6155 + /gene="wchA" + /locus_tag="SPC18C_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 2.3e-146" + gene 6189..7361 + /gene="wchF" + /locus_tag="SPC18C_0009" + CDS 6189..7361 + /gene="wchF" + /locus_tag="SPC18C_0009" + /note="member of homology group 15" + /codon_start=1 + /transl_table=11 + /product="putative rhamnosyl transferase WchF" + 
/protein_id="CAI33580.1" + /db_xref="GOA:Q9AH93" + /db_xref="InterPro:IPR001296" + /db_xref="InterPro:IPR015393" + /db_xref="UniProtKB/TrEMBL:Q9AH93" + /translation="MKKSVYIIGSKGIPAKYGGFETFVEKLTAFQQDKAIQYYVACMR + ENSAKSGTTEDVFEHNGAICYNVDVPNIGPARAIAYDIAAINRAIEIAKENKDEAPIF + YILACRIGPFIHGIKKKIQAIGGTLLVNPDGHEWLRAKWSAPVRRYWKISEGLMVKHA + DLLVCDSKNIEKYIQEDYIQYQPKTTYIAYGTDTTRSTLNSSDEKVRAWFKEKNVSEN + EYYLVVGRFVPENNYESMIRGFLASSSKKDFVLITNVEQNKFYNQLLASTGFDKDPRV + KFVGTVYDQELLKYIRENAFAYFHGHEVGGTNPSLLEALASTKLNLLLDVGFNREVGE + QSAIYWKKDELSQVIEKVEQFDAKMIDELDRQSNQRIGDYFTWEKIVTDYEKLFKK" + gene 7358..8629 + /gene="wciU" + /locus_tag="SPC18C_0010" + CDS 7358..8629 + /gene="wciU" + /locus_tag="SPC18C_0010" + /note="member of homology group 59" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33581.1" + /db_xref="GOA:Q9AH92" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q9AH92" + /translation="MKILHYTLGFQPQRTGGLVKYAEDLMIEQIAQGYQVAALYPGRI + KFFSKEIEIIKATSRQFECYELLNSLPMALFGGISDPTAFLTPCDKNVYRTFLEKVQP + DIIHIHSFMGLHKEFLEIAKNLNIRVVFTSHDYYGLAPVPHFYFNGVDYSDKNTNLTW + NIMSSNALSVKKLRLFQVSFYPTIRKLLKLLGKNPKSKKNLVIRDVIEEQDYSDLRYY + YNEMFHLIDGYLFNSRLAKKVYEINEIKSANSIVLSITNSSINHHQRLTTANNKIRVA + YIGPDEEYKGYFDFIDFVETLDRESYEVATYGHLPNEECPSFIEQKGYFTKEMIDSVY + ENIDILIVPSKWKETFGLITVEALSYGVNVFVSENVGSKDLFPETHVFKDKEDLLAKI + INNQLKKIPLKTIEEHVEEVIGYYKQVRSNN" + misc_feature 8132..8602 + /gene="wciU" + /locus_tag="SPC18C_0010" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 0.00023" + gene 8635..9699 + /gene="wciV" + /locus_tag="SPC18C_0011" + CDS 8635..9699 + /gene="wciV" + /locus_tag="SPC18C_0011" + /note="member of homology group 91" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33582.1" + /db_xref="GOA:Q9AH91" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q9AH91" + /translation="MIKDMSCPEISVIVPVYNVERYLRQCMDSLINQTYRDFEIILVN + 
DGSTDSSGVLCEDWAKKDERIHVVHKKNEGLGFARNTGVEHAKGKYITFVDSDDYVSL + DMLQTLYNAVQEYDVEVVYSAGYYRSFSNGEIKKTDVETKKPQLFEGGDVASKLLPDV + ISAPPEYPNDGKVGVSAWKVLYEANLFKEKGLLFHSEREFISEDAIFQIDCLKLATSA + LVIPDILYYYRENFGSLSMKYKEERFELDKILYNEQLKRVEGLPNQEILEERIERILI + ANIRLCIFQESLYKSSRIHKRLQRIRQICKDPISKSVLRHYPIHRLPFTKRLICVLAK + YNMSLLLLVLTSLKYRNRSV" + misc_feature 8665..9207 + /gene="wciV" + /locus_tag="SPC18C_0011" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 2.6e-45" + gene 9705..10616 + /gene="wciW" + /locus_tag="SPC18C_0012" + CDS 9705..10616 + /gene="wciW" + /locus_tag="SPC18C_0012" + /note="member of homology group 92" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33583.1" + /db_xref="GOA:Q9AH90" + /db_xref="InterPro:IPR008441" + /db_xref="UniProtKB/TrEMBL:Q9AH90" + /translation="MGMNIEKLKLSFKNGTFFPVVIHALRNRWPLWWIRSKAIREVQL + EDRAYRILKKKYGSLISNSFDKSYLSEEVPKQIWICWFQGMENAPELVKSCYRSLKKQ + FPEYVITVISSENISEYVEISDIIYKKWGNGVIGNAHFSDILRVELLRKFGGIWIDST + VYCTGITTIETIEKNTFFMYKSLYSVEERISSSNWMIASVPNHPFMVTMSTLLQSYWS + KEVIAIHYYLFHILFTIMIESLSELWQLVPTYTNATPHIMVDELNNVFSKERYQQLCQ + ISDFHKLNYKKNYNDKSESLYSHLLNQ" + misc_feature 9786..10604 + /gene="wciW" + /locus_tag="SPC18C_0012" + /note="HMMPfam hit to PF05704, Capsular polysaccharide + synthesis protein, score 1.1e-149" + gene 10628..12085 + /gene="wzx" + /locus_tag="SPC18C_0013" + CDS 10628..12085 + /gene="wzx" + /locus_tag="SPC18C_0013" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33584.1" + /db_xref="GOA:Q4K149" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K149" + /translation="MPNLKKNIVYNVLYQILAVIVPFITSPYLARVLGAEQIGVYSFT + YSIAFYFMILSMLGISNYGNRTIAQVRTSREHLNQEFSNIYAVQLTCSLVMTVSYLIY + ATVFVNSFQIVAYIQVLHVLSYATDVSWFFYGLEEFRITVARNSFVKLLTLISIFTFV + KSPNDIYLYTFIMAGSTLLGQLITWQFLLKQVNFVRPNLGKIKKHMKPIIILFFPVLA + VSIFSFLDKIMLGMYSSLKETAFYENSDKIISIPKALIQAFGAVMLPRTVHLLSIGDE + 
QKSLEYVDKTMWVVLVITMGCAFGLAGVSATFAPVYWGEEFRASSQIIAGMTPALVFS + AFGNVIRTQFLIPRSFDKEYTVSLLYGAVVNILINILLIPKMGAMGAVIGIIVAELVL + CCYQTWIARNYLHIREYLINAGILFLIGSVMYMVLILISSILPTSLLTLIIEIIVGAF + IYISLLVLYIFSSKNRVIIGLRTNFLEHTHLFKRK" + misc_feature 10637..11440 + /gene="wzx" + /locus_tag="SPC18C_0013" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 4.7e-56" + gene 12088..13362 + /gene="wzy" + /locus_tag="SPC18C_0014" + CDS 12088..13362 + /gene="wzy" + /locus_tag="SPC18C_0014" + /note="member of homology group 93" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33585.1" + /db_xref="InterPro:IPR007016" + /db_xref="UniProtKB/TrEMBL:Q4K148" + /translation="MKFKFNPIAILYILLVYLELATDRQHLYPVTYMTKYYIGILIIV + LFVLLLVGRGKLIFVNKKLLYLAKILAIPTIVLFLYSVLLDVMNPVEFNGYFSRLSST + TIFGLLAIFQAIVVFQFFGQKVVDYTFTAISLSYLTSIIVAFRQGGLSQFILILTDDS + FNGSVLEMHEVAPITALFILYYLYKYFIKENSFSSVFYNILIALIILFLSLKRIVLLS + VLIIIPVFLVIYWYDKKVSKLGKERKILSLLNIFSLIFITGIFLYVYSVKSDFIYTFI + QEHNINSMARTDLWKGVESTYNFAPIFMGRGIGFVTKWMDNNWMTLNINGLTGTMGIH + NDILKYYIEIGFVGLFIYFYTLLYRNAKRIFVKIGHKESFIYFVLIMFQMLIWFTDNI + SIYHNFLWILNLLLFSLTNSDTELENLDFKNF" + misc_feature 12925..13137 + /gene="wzy" + /locus_tag="SPC18C_0014" + /note="HMMPfam hit to PF04932, O-Antigen Polymerase, score + 7.3e-10" + gene 13416..14417 + /gene="wciX" + /locus_tag="SPC18C_0015" + CDS 13416..14417 + /gene="wciX" + /locus_tag="SPC18C_0015" + /note="member of homology group 107" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI33586.1" + /db_xref="GOA:Q9AH87" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q9AH87" + /translation="MKTDARTKKRENETLYILKVWATFSVIAIHFGFLGQIGVFYKVL + ARFAVPLFFMISGFYSFSISEEKLKKRIKNLSLLIISSTSFYFLLDVFLQLTQGNLRV + VFERFTFNNIFNFLVFNQISALIGSLATPLWFLYALLYVYIYLFFSNKKWIFNTILTV + IILCCSFIIELKANSALFYRNFLFMGVPFFSFGMYFAQIQRKIINYKHFKELFIIGIM + ISGFLTLIEYTFLGANFELYVSSVIISCMLMVFSIKYPQLWTLDFAVNIAKKNATFIY + 
ISHQFVILLFKTYVRDGIAYKIGTFLIFLACVIMSIIFNYIVDIISRCCIKEKQDII" + gene 14414..15574 + /gene="wciY" + /locus_tag="SPC18C_0016" + CDS 14414..15574 + /gene="wciY" + /locus_tag="SPC18C_0016" + /note="member of homology group 78" + /codon_start=1 + /transl_table=11 + /product="putative glycerol phosphotransferase" + /protein_id="CAI33587.1" + /db_xref="GOA:Q4K146" + /db_xref="InterPro:IPR007554" + /db_xref="UniProtKB/TrEMBL:Q4K146" + /translation="MKFYIKNLLKKVFTLPLHLLPIQSNKIIFDNFGGRGFGDNPKYI + LEELVSREKNLDLVWVTKDREISIPEGVRVVKYGSYRSFYEWLTARVWVDNIRNSDRP + WKRKGQIYLQTWHGSDGVKLIEKSVAGNLKKTYLRMAKYDGKITDGIVSSRHFQTLGM + QNNFWLAENVEFLEFGLPRNDDFFKSEKIKTTNIKFRTLFDIDLDELVVLYMPTFRDD + GSLNAYNLDYSKLIHVFQNKFRKNVKILVRFHPNVDSSFINLQDTDCINVSTYSNPQD + LMMSADVMITDYSSASIDFMLLNRPVFLYLPDYQSYVNDRPLDDNFDKLPFPRAYHNN + ELTEIIRDFERSKYDEKVRLYELEDVRFDRGKASVQCANWIEEKIKNNKVID" + misc_feature 14999..15544 + /gene="wciY" + /locus_tag="SPC18C_0016" + /note="HMMPfam hit to PF04464, + CDP-Glycerol:Poly(glycerophosphate) gl, score 2.3e-68" + gene 15616..16008 + /gene="gct" + /locus_tag="SPC18C_0017" + CDS 15616..16008 + /gene="gct" + /locus_tag="SPC18C_0017" + /note="member of homology group 28" + /codon_start=1 + /transl_table=11 + /product="CDP-glycerol-1-phosphate biosynthetic protein + Gct" + /protein_id="CAI33588.1" + /db_xref="GOA:Q9AH85" + /db_xref="HSSP:1COZ" + /db_xref="InterPro:IPR004820" + /db_xref="InterPro:IPR004821" + /db_xref="InterPro:IPR006409" + /db_xref="InterPro:IPR014729" + /db_xref="UniProtKB/TrEMBL:Q9AH85" + /translation="MKRVITYGTFDLLHYGHINLLKRAKQLGDYLIVVVSSDEFNLKE + KNKVCYFNYEHRKNLVEAIRYVDLVIPETSWEQKKSDVKDYHIDTFVMGDDWKGKFDY + LEEEGVEVVYLPRTKEISTTKIKEDLSE" + misc_feature 15628..15996 + /gene="gct" + /locus_tag="SPC18C_0017" + /note="HMMPfam hit to PF01467, Cytidylyltransferase, score + 4.8e-29" + gene 16105..16649 + /gene="HG94" + /locus_tag="SPC18C_0018" + /pseudo + CDS join(16105..16215,16247..16465,16476..16649) + /gene="HG94" + /locus_tag="SPC18C_0018" + /note="member of homology 
group 94" + /pseudo + /codon_start=1 + /transl_table=11 + /product="hypothetical protein (pseudogene)" + gene 16848..17717 + /gene="rmlA" + /locus_tag="SPC18C_0019" + CDS 16848..17717 + /gene="rmlA" + /locus_tag="SPC18C_0019" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI33590.1" + /db_xref="GOA:Q9AH84" + /db_xref="HSSP:1H5R" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q9AH84" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLPRFKELLQDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFIGDDSV + ALILGDNIYHGPGLSKMLQKAAKKEKGATVFGYHVKDPERFGVVEFDENMNAISIEEK + PEQPCSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLTLAQPLKKN + EYGQYLLRLIGEV" + misc_feature 16851..17567 + /gene="rmlA" + /locus_tag="SPC18C_0019" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 2.2e-120" + gene 17718..18311 + /gene="rmlC" + /locus_tag="SPC18C_0020" + CDS 17718..18311 + /gene="rmlC" + /locus_tag="SPC18C_0020" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI33591.1" + /db_xref="GOA:Q9AH83" + /db_xref="HSSP:1NXM" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:Q9AH83" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSFGIEWENIAEAEVSEADKHHPLLKDVKPLKKEDL" + misc_feature 17754..18284 + /gene="rmlC" + /locus_tag="SPC18C_0020" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 1.2e-15" + gene 18324..19373 + /gene="rmlB" + /locus_tag="SPC18C_0021" + CDS 18324..19373 + /gene="rmlB" + 
/locus_tag="SPC18C_0021" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI33592.1" + /db_xref="GOA:Q9AH82" + /db_xref="HSSP:1KEP" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q9AH82" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPDVHVTVLDKLTYAGN + RANIEEVLGNRVELVIGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQATD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 18339..19295 + /gene="rmlB" + /locus_tag="SPC18C_0021" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 5.4e-05" + misc_feature 18342..19178 + /gene="rmlB" + /locus_tag="SPC18C_0021" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.0028" + misc_feature 18342..19082 + /gene="rmlB" + /locus_tag="SPC18C_0021" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 3.5e-78" + misc_feature 18345..19157 + /gene="rmlB" + /locus_tag="SPC18C_0021" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 7.5e-06" + gene 19439..20290 + /gene="rmlD" + /locus_tag="SPC18C_0022" + CDS 19439..20290 + /gene="rmlD" + /locus_tag="SPC18C_0022" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI33593.1" + /db_xref="GOA:Q9AH81" + /db_xref="HSSP:1N2S" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q9AH81" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAKMDITNEEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + 
FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 19439..20287 + /gene="rmlD" + /locus_tag="SPC18C_0022" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 4.3e-146" + misc_feature 19442..20083 + /gene="rmlD" + /locus_tag="SPC18C_0022" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.00011" + misc_feature 19442..20071 + /gene="rmlD" + /locus_tag="SPC18C_0022" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 2e-18" + misc_feature 19445..20173 + /gene="rmlD" + /locus_tag="SPC18C_0022" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 3.6e-08" + gene order(20335..20430,20460..21454) + /gene="glf" + /locus_tag="SPC18C_0023" + /pseudo + CDS join(20335..20430,20460..20975,20951..21454) + /gene="glf" + /locus_tag="SPC18C_0023" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /pseudo + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + misc_feature join(20787..20951,20975..21394) + /gene="glf" + /locus_tag="SPC18C_0023" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 6.9e-102" + /pseudo + gene 21772..>21819 + /gene="aliA" + /locus_tag="SPC18C_0024" + CDS 21772..>21819 + /gene="aliA" + /locus_tag="SPC18C_0024" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33595.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ89" + /translation="MMKSSKLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acactgcggc taaagaagta cttgaaaaac aggtcttggc tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcata taaaaacaag + 181 ggaggactgt ataaaagaca gaaatccttt gttttttata accaaggttt ataaactttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga aaatgaacat + 301 aaagaagcgt gtccttagtg caggtctgac ttttgcatct gctttgcttt tagctgcttg + 361 cgaccaatca ggttcagata 
caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaactat ctattagact attacgctga taatatagtc aattgaaaca agagaaagac + 481 aaaagagcct cgtaaaaggt attgcaactt ggtaatacct ttttgaggtg ctttttgata + 541 tgagcccatg ttttctcaat aggattgtac tcaggtgagt agggaggaag aggtaaaagt + 601 ttatgcccaa actcttcgca taaaagttct agcttcccca ttctatggaa tcttgcatta + 661 tccataataa taaccgatgg tgtggttaat gttggtaaga aaaacttctg aaaccaagct + 721 tcaaaaaagt cgctcgtcat cgtctcttcg taagtcattg gaacgattaa ctcaccattt + 781 gttagacctg caaccaaaga aatcctctga tatcttcttc cagatacttt gcctcttctt + 841 aactgacctt ttaatgagcg accatattct cgataaaaat aagtatcgaa tcctgtttca + 901 tcaatctaaa caggtgctag gtgctttaaa ctattaaaat tcttaagaaa taaggctact + 961 ttttctgggt cttgttcata attagattga aactagaata gtacacctct gcttctaaaa + 1021 cattgttaga aatcgatttg actgtcctga tcgatttgtc atgttcttat ttcattttac + 1081 tatatttttg tttcgcggga agtctactaa gatacttaaa gatgcagata gtaaaaaaag + 1141 atgtagacat taccgtaaaa aagtgatata atcgtatgat attgaatgta taggtgttaa + 1201 tcttgagtag acgttttaaa aaatcacgtt cacagaaagt gaagcgaagt gttaatatag + 1261 ttttactgac tatttattta ttgttagttt gttttttatt gttcttaatc tttaagtaca + 1321 atatccttgt ttttagatat cttaatctag tggtaactgt gttagtccta ctagttgcct + 1381 tgatagggct actcttgatt atctataaaa aagctgaaaa gtttactatt tttctgttgg + 1441 tgttctctat ccttgtcagc tctgtgtcgc tctttgcagt acagcagttt gttggactga + 1501 ccaatcgttt aaatgcgact tctaattact cagaatattc aatcagtgtc gctgttttag + 1561 cagatagtga gatcgaaaat gttacgcaac tgacgagtgt gacagcaccg actgggactg + 1621 ataatgaaaa tattcaaaaa ctattagctg atatcaagtc aagtcagaat accgatttga + 1681 cggtcgacca gagttcgtct tacttggcag cttacaagag tttgattgca ggtgacacca + 1741 aggccattgt cttaaatagt gtctttgaaa atatcatcga gtcagagtat ccagactacg + 1801 catcgaagat aaaaaagatt tataccaagg gattcactaa aaaagtagaa gctcctaaga + 1861 cgtctaagaa tcagtctttc aatatctatg ttagtggaat tgacacctat ggtcctattg + 1921 gttcggtgtc gcgatcagat gtcaatatct tgatgactgt caatcgagat accaagaaaa + 1981 tcctcttgac cacaacgccg cgtgatgcct atgtaccaat cgcagatggt 
ggaaataata + 2041 aaaaagataa attgactcac gcgggcattt atggagttga ttcatccatt cacaccttag + 2101 aaaatctcta tggagtggat atcaattact atgtgcgatt gaacttcact tctttcttga + 2161 aaatgattga cttattggga ggggtagatg ttcataatga tcaagagttt tcagctctac + 2221 atgggaagtt ccatttccca gtagggaatg tccatctaga ctctgagcag gctctaggtt + 2281 ttgtacgtgg acgctactca ctagccgatg gagaccgtga ccgtggtcgc aaccaacaaa + 2341 aggtcattgt agcaattatt cagaagttaa cttctacaga ggttttgaaa aactatagta + 2401 gtattcttca aggattgcag gattctcttc aaacaaatat gccgattgag actatgatag + 2461 atttagtgaa tactcagttg gaaagtggag ggaattataa agtaaattct caagatttaa + 2521 aagggacagg tcggatggat cttccttctt atgcaatgcc agacagtaac ctctatgtga + 2581 tggaaataga tgatagtagt ttagctgtag ctaaagcagc tatacaggac gtgatggagg + 2641 gtagatgaaa tgatagatat ccattcgcat atcgtttttg atgtagatga cggtcccaag + 2701 tcaagagagg aaagcaaggc tctcttggca gaagcctaca ggcagggggt gcgaaccatt + 2761 gtctctacct ctcaccgtcg caagggcatg tttgaaactc cggaagagaa gatagcagaa + 2821 aactttcttc aggttcggga aattgcaaaa gaagtagcag atgatttagt cattgcttat + 2881 ggcgcagaga tatactatac tatggatgct ctagaaaagc tagaaaaaaa agaaattcct + 2941 acccttaatg atagtcgtta tgctttgatt gagtttagca tgcatacttc ctatcgtcag + 3001 attcatacgg gattgagcaa tattttgatg ttgggaatca cgccagtaat tgctcatatt + 3061 gaacgttatg atgctttaga gaataacgaa aaacgtgttc gtgaactgat tgatatgggg + 3121 tgctatactc agataaatag ttatcatgtt tcaaaaccta agttctttgg tgaaaaatat + 3181 aaattcatga aaaagagagc tcggtatttt ttggaacgtg atttagttca tgtcattgca + 3241 agtgacatgc acaatttaga cagtagacct ccatatatgc aacaggcata tgatatcatt + 3301 gctaagaaat atggagcgaa aaaagcgaaa gaactttttg tagataatcc cataaaaatt + 3361 ataatggatc aattaattta ggagaaaata tgcaagatca aaacgctttg gaaatcgatg + 3421 tatttcaact attcagagct ttatggaaaa gaaagttggt tattttatta gtggcaatta + 3481 taacttcttc agttgctttt gcctacagta cttttgttat caaacctgag tttactagta + 3541 cgactcggat ttatgtagtt aaccgtaata aggaagagaa gtctggttta accaatcaag + 3601 acttgcaggc aggatcatac ttggttaaag actatcgtga aattatccta tcgcaggatg + 3661 ttttggagga 
agttgtttct gatttgaaac tagatttgac gccaaaaggt ttggctaata + 3721 aaattaaagt gacagtacca gttgataccc gtattgtctc tatttcagtt aatgatcgag + 3781 ttcctgaaga ggcaagccgt atcgctaact ctttgagaaa agtagctgct caaaaaatta + 3841 tcagtattac tcgtgtttct gatgtgacaa cactggagga ggcaagaccg gcgatatcgc + 3901 cgtcttcgcc aaatattaaa cgcaatacac taattggttt tttggcaggg gtgattggaa + 3961 ctagtgttat agttcttctt cttgaacttt tggacactcg tgtgaaacgt ccggaagata + 4021 tcgaaaatac attgcagatg acacttttgg gagttgtacc aaacttaggt aagttgaaat + 4081 aggagagaag gatgccgaca ttagaaatag cacaaaaaaa actggagttc attaagaagg + 4141 cagaagaata ttacaatgcc ttgtgtacaa atatacagtt gagcggagat aaactaaaag + 4201 taatttccgt tacttctgtt aaccctgggg aaggaaaaac aactacttcc ataaatatag + 4261 catggtcgtt tgcgcgtgca ggctataaaa ctcttttgat cgatggcgat actcgacaat + 4321 cagttatgtc aggagttttt aaatctcgtg aaaaaattac agggctaaca gaatttttat + 4381 ctgggacagc tgatttatct cacggtttat gtgatacaaa tattgaaaat ttatttgtag + 4441 ttcaatcggg atctgtatca ccaaacccta cagccttgtt acaaagtaaa aattttaatg + 4501 atatgattga aacattgcgt aaatattttg attatatcat tgttgataca ccacctattg + 4561 gaattgttat tgatgcggca attatcactc aaaagtgtga tgcgtccatc ttgataacag + 4621 caacaggtga ggtgaataaa cgtgatgtcc aaaaagcgaa acaacaatta gaacaaacag + 4681 ggaaactgtt cctgggagtt gttttaaata aattggatat ctcggttgat aagtatggag + 4741 cttacggttc ctatggaaat tatggtaaaa aataacttag aaaagatttt atggatgaaa + 4801 aaggattgaa aatttttctg gcagtattgc agagtattat tgtcatttta ttgatttatt + 4861 ttcttaactt tgttagagag acagaacttg aacgttcttc gatggttata ctataccttc + 4921 tccacttttt tgtattttat tttagttcct atggtaacaa tttttttaaa agagggtacc + 4981 tagttgagtt taatagtact ataagatata tttttttctt tgcaatagct ataagtgtat + 5041 taaacctttt tatagcggaa cggtttagta tctctagaag aggaatggta tacttcttaa + 5101 ctttagaagg aatatcctta tacttgttaa atttcttagt aaaaaaatat tggaagcatg + 5161 tgttttttaa tctaaaaaat agcaagaaaa ttttactgtt aacagtaacg aaaaatatgg + 5221 aaaaagttct tgataaattg ctagaatctg atgaaccttc atggaaattg gtagcagtaa + 5281 gtgttttgga taaatctgat tttcaacatg 
ataaaatacc tgtaattgaa aaggaaaaaa + 5341 ttattgaatt tgcaacgcat gaagttgtgg atgaggtgtt tgtcaatctt ccaggagaga + 5401 gctacgatat tggagaaatt atctctaggt ttgagacaat ggggatagat gtaactgtaa + 5461 atcttaaagc atttgataag aattttggtc gcaataaaca aattcatgag atggtaggac + 5521 tggatgtagt cactttctct acaaattttt ataaaactag tcatgtgatt tcaaagagaa + 5581 ttctcgatat ttgtggtgcc actattggcc ttattctttt tgctatagct agtctagttt + 5641 tagttccatt gattcgtaaa gatggcggac cagctatttt tgctcaaact cgtataggga + 5701 aaaatggtcg acatttcaca ttttataaat tccgttcgat gcggatcgat gctgaagcta + 5761 tcaaagaaca gttgatggat caaaatacga tgcaaggtgg tatgtttaag atagacaatg + 5821 atcctcgtgt tacaaaaatt ggtcgcttta ttcgtaaaac cagtttggat gaattgccgc + 5881 agttttggaa tgtatttata ggagatatga gtttggtagg aacacgtcca cctacagtag + 5941 acgagtatga tcagtatact ccagaacaga aacgtcgact cagctttaaa cctgggatta + 6001 caggcttatg gcagattagt ggccgaagta aaataaccga ttttgacgct gttgtaaaat + 6061 tagatgtggc ttatattgat aattggacaa tctggaaaga tattgaaatt ttgcttaaaa + 6121 ctgttaaagt tgtatttatg agagatggag cgaagtaatt tctgtatatc catcatatta + 6181 ggagagaaat gaaaaagtca gtttatatca ttggttcaaa aggaattcct gctaagtatg + 6241 gaggatttga aacttttgtt gaaaaattaa cagccttcca acaagataag gctatccaat + 6301 attatgtagc ttgtatgcgt gaaaactctg caaaatcagg gactactgag gatgtttttg + 6361 aacataatgg tgctatctgt tataacgtcg atgttcctaa tattggtcca gcgcgagcta + 6421 tagcgtatga tatcgctgca attaacagag ctattgaaat tgccaaagaa aataaggatg + 6481 aagctccaat cttctatatt ttagcttgtc gaatcggtcc gttcatccat ggaattaaga + 6541 aaaaaatcca ggcgataggt gggactcttc tagttaatcc agatggtcac gagtggttac + 6601 gagctaagtg gagcgctcca gttcgtcgtt attggaaaat ttccgaaggt cttatggtca + 6661 aacatgcaga tcttttagtg tgtgatagta agaatattga aaaatatatc caagaagatt + 6721 atatacagta tcaacctaag acaacctata tcgcttatgg gacagataca acacgctcca + 6781 cattaaatag cagtgatgaa aaagtgcgtg cttggttcaa ggagaaaaat gtttctgaaa + 6841 acgagtatta cctagttgta ggacgttttg ttccagaaaa taattatgag tctatgatac + 6901 gtggtttctt ggcgtctagc tctaagaagg attttgtcct aatcacaaat 
gtagaacaga + 6961 ataaatttta taatcagcta ttagcaagta ctggatttga taaagatcca cgagtgaaat + 7021 ttgttggaac agtctacgac caagaacttc tgaagtatat tcgagaaaat gcttttgctt + 7081 acttccacgg acatgaagtt ggtggaacaa atccttcgtt acttgaagca ttagcatcca + 7141 caaagttaaa cttactactc gatgttggtt ttaaccgcga agttggggag caaagtgcga + 7201 tctattggaa aaaagatgag ctttcccaag taatcgagaa agttgaacaa tttgatgcaa + 7261 aaatgattga tgagttagat agacaatcaa atcagagaat tggggattat ttcacttggg + 7321 aaaagattgt cacagactac gagaaattat ttaaaaaatg aaaatattac attatacttt + 7381 aggatttcaa ccccagcgaa caggtggttt ggttaaatat gctgaggatt taatgataga + 7441 gcaaattgct caaggttatc aagtagctgc cttatatcca ggaagaatta agttcttttc + 7501 aaaagaaata gaaataatta aagcgacgtc aagacagttt gagtgttatg aactgcttaa + 7561 tagcttacct atggctttat ttggaggtat atccgatcca actgctttcc tgacaccttg + 7621 tgacaaaaat gtttatcgta cttttttaga aaaagtacaa cccgacatta tacatattca + 7681 ctcgtttatg ggattgcata aagaattcct cgaaattgct aaaaacttga atattagagt + 7741 ggtttttacg agccatgatt attatggatt agcacccgta cctcatttct attttaatgg + 7801 ggtggattat agtgataaaa atacaaattt aacatggaat attatgtctt ccaatgcttt + 7861 aagtgtgaaa aaactaagac tttttcaggt ttcattttat ccgactattc gtaaactttt + 7921 gaaactatta gggaaaaatc caaaatctaa aaagaattta gttattcgag atgttattga + 7981 ggagcaagat tatagtgatc ttcgatacta ttataatgag atgtttcact taatagatgg + 8041 ttatttgttt aatagtagac ttgcaaagaa ggtatatgag ataaatgaga ttaagtcagc + 8101 taatagtata gtattatcta taacaaatag ttcaattaat catcatcaga gattgacaac + 8161 tgcaaataat aaaattagag ttgcttatat tggtccagat gaagaatata aaggatattt + 8221 tgattttatt gactttgttg aaactttaga tcgagagtcc tatgaagtgg caacttatgg + 8281 ccatttacca aatgaagagt gcccttcatt cattgaacaa aaaggatatt ttactaagga + 8341 aatgattgac agtgtctatg aaaatattga tattcttatt gttccaagta agtggaagga + 8401 aacatttgga ttgataacag tagaagcatt atcctatggg gtaaatgttt tcgtgagtga + 8461 aaatgttgga tcaaaagact tgtttccaga aacacatgtt tttaaagaca aggaagattt + 8521 gttggctaaa atcatcaata atcagttgaa gaaaattccg cttaaaacga tagaagaaca + 8581 tgtagaagaa 
gttattggtt attacaaaca ggttagaagt aacaattaag gagaatgatt + 8641 aaagatatgt cctgtccaga aattagcgta attgtaccag tttataatgt ggaacgatat + 8701 ttaaggcagt gtatggattc attgataaat caaacttata gggattttga aataatttta + 8761 gtaaacgatg gatcaacgga ttcttctggg gttctctgtg aggattgggc aaaaaaagat + 8821 gaaagaattc atgtagttca caaaaaaaat gaggggcttg gcttcgctcg taatacaggg + 8881 gttgaacacg caaaggggaa atacataacc tttgtagatt cagatgacta tgtttctcta + 8941 gatatgctgc aaactctata taatgctgtt caagaatatg atgtcgaagt tgtatacagt + 9001 gcgggatatt atcgttcctt tagtaatggg gaaataaaga agacagatgt agaaacaaaa + 9061 aaacctcaac ttttcgaagg aggagatgtt gcctctaaat tactccctga tgtaatttct + 9121 gctcctcctg agtatccgaa tgatgggaaa gttggagtgt cggcatggaa ggttctctac + 9181 gaagctaatt tgtttaagga aaaaggctta ttatttcatt cagaaagaga attcatttca + 9241 gaagatgcta tttttcaaat tgattgttta aaattagcaa catctgccct tgttatccca + 9301 gatattttat actactatcg tgaaaacttt ggttctttaa gtatgaaata taaagaagaa + 9361 cggtttgagt tggataaaat cttgtataac gagcaattaa aaagagttga ggggttacct + 9421 aatcaagaaa ttttggaaga aagaatagag agaattttaa ttgctaatat tcgtttatgt + 9481 atctttcagg aatccttata taaaagttct agaattcata aacgtttgca aagaattaga + 9541 cagatttgta aggacccaat atcaaaatca gtattacgtc attatccaat ccatcgttta + 9601 ccttttacta aacgtttgat ctgtgtatta gctaagtata atatgtcgtt gttgctttta + 9661 gttttaacct cattaaaata tcggaatcgg agtgtgtaac ttttatgggg atgaatatag + 9721 aaaaattaaa actatctttt aaaaatggaa cgttttttcc tgttgttatt cacgccttac + 9781 gtaaccgttg gcccttgtgg tggattcgga gtaaggctat tcgagaagtg caacttgaag + 9841 atagggccta cagaatacta aaaaagaaat acggttcttt aatttcaaac tcttttgata + 9901 aatcatactt atcagaagaa gttcccaagc aaatctggat ttgctggttt caaggtatgg + 9961 agaatgctcc agagttggtg aaatcatgtt atagatcact aaaaaaacaa tttcctgaat + 10021 atgtcattac ggttatttct tcagaaaata tttccgaata tgtagaaata tctgatatta + 10081 tttataaaaa atggggaaat ggtgtaatag gaaatgctca tttttctgat atccttcggg + 10141 tagagctgtt acgtaagttt gggggaatat ggattgactc aacagtgtat tgtacaggaa + 10201 ttactaccat agagacaatt gaaaaaaata 
cattttttat gtataaaagt ttatattcag + 10261 ttgaggagag aatttcctct tccaactgga tgattgcttc tgttcccaat catccattta + 10321 tggttacgat gagcacactc ttgcaatctt attggtcaaa agaagttata gcaattcatt + 10381 attatctatt tcatattctt tttacgatta tgattgaatc actttctgag ttgtggcagc + 10441 ttgtacccac ctatacgaac gcaacaccac atataatggt tgatgaatta aataatgttt + 10501 tttcaaagga acgttatcag caattgtgtc aaatttcaga ttttcataaa ttaaattata + 10561 aaaaaaatta caatgataaa tcagagagtt tgtacagtca cttactgaat cagtagaggg + 10621 gagaatcttg cctaatttaa agaaaaacat tgtttacaat gtcttatatc agatcttagc + 10681 tgtaatagta ccgtttatta cctcacctta cttagcgcgt gtgttaggtg cagagcaaat + 10741 tggagtttat tcttttactt attccattgc tttttacttt atgattctgt ccatgttggg + 10801 aatttctaat tatgggaatc ggacaatagc acaggtacga acaagtagag aacatttgaa + 10861 tcaagaattt tcgaatattt acgcagttca gttgacgtgt tcactagtaa tgaccgtctc + 10921 atatttgatt tatgcaacag tatttgtgaa tagttttcag attgtagcct atatccaagt + 10981 attacatgtt ttatcgtatg caacagatgt tagttggttt ttttatggtc ttgaagagtt + 11041 tcgtattacg gttgctagga attcatttgt taagttatta actttaatat ctatctttac + 11101 atttgtaaaa agccctaatg atatctattt atataccttt ataatggcag ggagtaccct + 11161 gcttggtcag ttgattacat ggcaattttt gctaaaacaa gtaaactttg tgcgccctaa + 11221 tcttggaaaa ataaagaaac acatgaaacc tattattatt ttatttttcc ccgtcttagc + 11281 ggttagtatt ttttcgtttc tagataaaat aatgcttggg atgtatagta gtttgaagga + 11341 aactgctttt tatgagaatt cagataagat aattagtatt ccaaaagctc tgattcaagc + 11401 ctttggagct gtaatgttgc ctcgaacagt acatttactg agtataggtg atgaacaaaa + 11461 aagtttagaa tatgttgata aaacgatgtg ggttgtttta gtgattacaa tgggctgtgc + 11521 tttcggttta gcaggagttt ctgcaacctt tgctcctgtt tattggggtg aagaatttag + 11581 ggccagtagc caaattattg caggaatgac accggcttta gtattttcgg cttttggaaa + 11641 tgtcatccga acccagtttt taattccacg aagttttgac aaggaatata cggtatcttt + 11701 gctttatgga gccgtagtta atatcttgat taatattctt ttgattccga agatgggagc + 11761 aatgggagct gttatcggaa taattgttgc agagttagtt ctatgttgct atcaaacatg + 11821 gattgctaga aattatttac atatcagaga 
atatctgata aatgctggga tattatttct + 11881 tattggttca gtaatgtata tggttttaat tcttatttca agtattttac ctacatcgtt + 11941 acttacactt attattgaaa ttatagtcgg agctttcatt tatattagtt tactggttct + 12001 gtatatcttt tcttcaaaaa acagggtaat tattggttta cgaacaaatt ttttagaaca + 12061 tactcattta tttaaaagga aataatagtg aaatttaaat ttaatccaat cgcgatactg + 12121 tatatattgc tagtatactt agagttggct acagataggc aacatctgta tcctgtaacg + 12181 tacatgacaa aatattatat tggtatttta atcattgtgt tgtttgtttt attattagta + 12241 ggccgtggga agcttatttt tgttaataaa aaattattat atcttgctaa gatattagct + 12301 ataccaacaa ttgttctttt cctgtactca gtcttactag acgtaatgaa cccagttgaa + 12361 tttaatggat attttagtag attatcaagt acgactattt ttggtttgtt agctatcttt + 12421 caagctatag ttgtttttca attttttgga caaaaagtag tagattacac ttttacagct + 12481 atctccctca gctacttaac cagtatcatt gttgccttta ggcagggagg acttagtcaa + 12541 tttatcttga tactaacaga tgatagtttc aatggttcgg tactagaaat gcatgaagtt + 12601 gcacctatta cagctctctt tattctgtac tatttgtaca aatattttat aaaagaaaat + 12661 agtttttctt cagtatttta taatatctta atagctctca ttattctttt tttaagcctt + 12721 aaacgaatcg ttcttttgag tgtattaatt atcataccag tatttttggt aatttattgg + 12781 tatgataaaa aagtaagtaa actagggaaa gaacgaaaaa ttttaagttt attaaatatc + 12841 ttttccttaa tatttataac aggaatattc ctttatgttt atagtgtaaa atctgatttt + 12901 atatatacat ttattcaaga acataatatt aattcgatgg ctagaacaga tttatggaag + 12961 ggagttgaat caacctataa tttcgcccct atatttatgg ggagagggat agggtttgta + 13021 acaaaatgga tggataataa ttggatgact ttgaatatca atggtcttac agggacaatg + 13081 gggatccata atgatatttt gaagtactac attgagatag gatttgtagg attatttatt + 13141 tatttttaca ctcttcttta tagaaatgct aaacgtatat ttgtaaaaat tggtcataaa + 13201 gaatcattca tatattttgt attgataatg tttcagatgc tgatatggtt tacagataat + 13261 atttcaattt accataattt tttatggatc ctaaatctac tactcttttc tttaactaat + 13321 tcggatacag aattggaaaa tttagatttt aaaaattttt aatgtgtaag tagtaactac + 13381 taattttatt aaaaaatcag aatataggtg tatttatgaa gacagatgct aggactaaaa + 13441 agagagagaa tgaaacgtta tatattctaa 
aagtttgggc aacatttagt gtgattgcta + 13501 tacattttgg ttttttgggc caaattggag tgttttacaa agtattagct cgatttgctg + 13561 tacctttatt tttcatgatt tcaggatttt attcgtttag tatttcagaa gaaaaactga + 13621 agaaaagaat taaaaatctg agtttattga taatttccag tacaagtttt tattttttac + 13681 tggatgtttt tcttcaatta acacaaggaa atctaagagt tgtatttgaa agatttactt + 13741 ttaataatat ttttaatttt ttggtattca atcaaatttc tgctctaatt ggctcgttag + 13801 caacaccact atggttctta tatgcattac tgtatgttta tatttatcta tttttttcaa + 13861 ataaaaaatg gatatttaat actattttga ctgtgatcat actctgttgt tcatttataa + 13921 tcgagttaaa agcaaatagt gctttatttt atagaaactt cttatttatg ggagttccct + 13981 tcttttcttt tgggatgtat tttgctcaaa ttcagagaaa aattataaat tataagcact + 14041 tcaaagaact ttttataatt ggaattatga tttcaggatt tctaactctg attgaatata + 14101 cctttttagg agcaaatttt gaactttatg taagttcggt gataatatct tgtatgctta + 14161 tggtcttttc gattaaatat cctcaactct ggacgttaga ttttgctgtc aatattgcta + 14221 aaaaaaatgc gacgtttatt tatattagtc atcaatttgt gattttatta tttaaaacat + 14281 acgttagaga tggaattgct tataaaattg gaactttctt gatattttta gcatgtgtta + 14341 ttatgagtat tattttcaac tatatagtcg atataatcag tcgttgttgc ataaaagaaa + 14401 aacaagatat aatatgaaat tttatataaa aaatttatta aaaaaagtct ttacattacc + 14461 gttgcattta ttgcctattc agtctaataa gataatattt gataattttg gtggtagagg + 14521 ttttggggac aatcctaagt atatacttga agaacttgtc tctcgagaaa agaatctaga + 14581 tcttgtgtgg gtaacaaaag atagagaaat ttctatccct gaaggcgttc gagtagtaaa + 14641 atacggcagt taccgttctt tttatgaatg gttaacagct agagtttggg tagataatat + 14701 tcgtaattct gatcgacctt ggaagcgaaa aggacagatt tatcttcaaa cttggcatgg + 14761 ttcagatggg gtaaagttaa ttgaaaaaag tgttgcaggg aacctaaaaa aaacatatct + 14821 tagaatggcg aagtatgatg gaaagattac agacggtatc gtatcaagtc ggcattttca + 14881 aactttgggt atgcaaaata atttttggct ggcagagaat gtggaatttc tggaatttgg + 14941 attacctcga aatgatgatt tttttaaaag tgaaaaaatc aaaaccacaa atataaaatt + 15001 tagaacatta tttgatatcg atttagacga actggtagtt ttgtatatgc cgacgttcag + 15061 agatgatgga tcgttgaatg cctataattt 
agattactcg aaactaatac atgtttttca + 15121 aaataaattt agaaaaaatg taaaaatatt agttcgtttt catccaaatg ttgattctag + 15181 ttttataaat ttacaggata cagactgtat aaatgtgtcg acctattcaa atcctcagga + 15241 tctgatgatg agtgcagatg tgatgattac ggattattca tcggcttcta ttgattttat + 15301 gttattaaat cgtccagtat ttctgtattt accagattat caaagttatg tgaatgatag + 15361 accattggat gataactttg ataaattgcc atttccaaga gcatatcata acaatgagtt + 15421 gacagaaatt attagagact ttgaaagaag taaatatgat gaaaaagttc gtctgtatga + 15481 attagaggat gttcgttttg atagaggaaa agcatcagta cagtgtgcta attggattga + 15541 agaaaaaata aaaaacaata aagttattga ttgaaataat tatatttatt gaattataaa + 15601 taaggaggtc tttagatgaa aagagttata acatatggta catttgattt attgcattat + 15661 ggtcatatca atcttttgaa acgtgctaaa cagctaggtg attatttgat tgtagttgtt + 15721 tcaagtgatg agtttaattt aaaagaaaag aataaagtat gttactttaa ctacgaacac + 15781 agaaaaaatt tagtagaagc tattcgatat gtcgatttag taatccctga aactagttgg + 15841 gaacagaaaa agtcagatgt taaagactac catattgaca cttttgtaat gggtgatgat + 15901 tggaaaggta aatttgatta tcttgaagaa gaaggtgttg aagtagtcta tttgcctaga + 15961 acaaaggaaa tatcaaccac aaagataaaa gaagatttat cggaatgaaa tattattaaa + 16021 aatgctgaca taagaaattg tggcttttgt gtctagtttt tgatagaata aagtaacaac + 16081 actttaacca atgaggtgtg aataatggca gtaattttta aagatgtact tgttgaagag + 16141 aaaactgatg aagaaaaaca acatatttta tctattttaa atgatgagaa tgttagagct + 16201 tttgattgtg gatattaaga attgaatgat gttttttgat atttagaaca aatacgatga + 16261 agaaacaggc catgtattgc ctattgtaaa tcaaaatttt gaattattag gttttatttc + 16321 ttgtagacta gtatcatttt ctttcatagc tcaggttaaa gagatgggaa ttagcataga + 16381 ttatcttggt attcataagg attgccagaa aatgggggat cggttcgctt ttggtgctct + 16441 ttgcgcttcg attatcttta actattgact gttgattacc aataaaaggt gtaatagttc + 16501 atgctctaga ggatgttgta gaattctatg acaaactggg ttttattgac cctagagata + 16561 tagttattta taatggcaaa ccggttacta tatattttag tattgaaaaa ctaagaaatg + 16621 gtgaaaatta ttcctctcac acagttattt gaaacatcct tagaaaatga tttttaattg + 16681 tatgcaaaca aagtagaatt cgcttatttc 
atcttatgct aaatgtaata tgaaacaagt + 16741 gaatttttat agataaagaa gaattttaaa aaatgtgatg attattttta gagcagtaca + 16801 gaattaatag taattgactc taaatcaata aagaaaggta ccctattatg aaaggtatta + 16861 ttctagcagg tggttcgggg acacgtttat atcctttgac tcgagctgca tcaaaacaac + 16921 tgatgccggt ttatgataaa ccgatgattt actatccact ttcaacattg atgttggctg + 16981 ggattaggga tattttgata atctcaactc ctcaagattt gcctcgtttt aaagagcttc + 17041 ttcaagacgg atctgagttt gggattaaac tttcttatgc agagcaacca agtccagatg + 17101 gtttggcaca agcctttatc attggggaag agtttattgg tgatgatagt gttgctttga + 17161 tcttggggga caatatctat cacggccctg gtttgagcaa aatgcttcaa aaagcagcca + 17221 agaaagagaa aggtgcgact gtctttggct accatgtcaa ggatccagaa cgctttggtg + 17281 ttgtagaatt tgatgaaaat atgaatgcta tctccatcga agaaaaacca gaacagccgt + 17341 gctctaacta tgcagtgaca ggactgtatt tctatgataa cgatgttgtc gagattgcca + 17401 aaagtattaa accaagtcct cgtggtgaat tggaaattac agatgtaaac aaagcttacc + 17461 tagatcgtgg tgatttgtct gttgagctta tgggacgcgg ctttgcttgg ttggatactg + 17521 gaacacatga aagtttactg gaggcttcac agtacatcga aacagtgcaa cggatgcaaa + 17581 atgttcaggt agcaaacttg gaagaaattg cctatcgcat gggttatatc agtcgtgaag + 17641 atgtattgac cttagcccaa ccacttaaga aaaatgaata cggacagtat ctgctccgtt + 17701 tgattggaga agtctagatg acagataatt ttttcggtaa gacgcttgcg gcacgcaagg + 17761 ttgaagctat tccaggcatg ttggagtttg atatccccgt tcatggagat aatcgtggct + 17821 ggtttaaaga aaatttccaa aaggaaaaaa tgcttccact tggatttcca gagtctttct + 17881 ttgcagaagg aaaattgcaa aacaatgtat ccttctcacg taaaaatgtc cttcgaggcc + 17941 tccacgcaga gccttgggat aagtacatct ctgtagcaga tggagggaaa gttctgggtt + 18001 cttgggttga tctacgcgag ggtgaaacct ttgggaatac ctatcagaca gtaattgatg + 18061 caagcaaggg aatctttgtt cctcgtggcg tagctaatgg cttccaagtt ttatcagata + 18121 cagtgtcata tagctatctg gtcaatgatt actgggcgct tgaactcaaa cccaagtatg + 18181 cctttgtgaa ctacgctgat ccaagctttg gtattgaatg ggaaaatatt gcagaagcag + 18241 aggtttcaga agcagataaa catcatcccc tacttaagga cgtgaagcct ttgaaaaaag + 18301 aagatttgta aaaaggaaag aatatgactg 
aatacaaaaa tattatcgtg acaggtggag + 18361 ctggctttat cggttctaac tttgtccatt atgtttacga gaactttcca gatgttcatg + 18421 tgacagtcct agataagttg acttatgctg gaaaccgcgc gaatattgag gaagttttag + 18481 gtaatcgtgt tgagttagtt attggtgaca ttgctgatgc ggagttggta gacaagttgg + 18541 ctgctcaagc agatgctatc gttcattatg cagcggaaag ccacaatgat aattcgctca + 18601 atgatccatc gccatttatt catactaact tcatcggaac ctatactctt ttagaagctg + 18661 ctcgtaagta tgatattcgc ttccaccatg tatcgacaga tgaagtttat ggggatctcc + 18721 ctttacgcga agatttgcca ggtcatggtg aaggaccagg tgagaaattt actgctgaaa + 18781 caaaatacaa cccaagctct ccgtactcat caaccaaggc agcctcagat ttgattgtca + 18841 aagcctgggt gcgttctttt ggagtcaagg caacgatttc caactgttca aataactacg + 18901 gtccttatca acatatcgaa aaattcatcc cacgtcagat tactaacatc ctaagtggaa + 18961 ttaagccaaa actttacggt gaaggtaaga atgttcgtga ctggatccat accaatgacc + 19021 attcttcagg agtttggaca atcttgacaa aagggcaaat cggtgaaacc tacttgattg + 19081 gggctgatgg tgagaagaac aataaggaag ttttggaact tatccttaag gaaatgggac + 19141 aagctacgga tgcctatgat catgtgactg accgtgcagg acatgacctt cgctatgcga + 19201 ttgatgccag caagctccgt gatgagttgg ggtggaaacc tgaatttacc aactttgaag + 19261 ctgggctcaa ggcaacaatc aagtggtata cagataacca agaatggtgg aaagcagaaa + 19321 aagaagctgt tgaagccaat tatgctaaga ctcaggagat tattacagta taaaaagcag + 19381 gaaatagctg ctttttattg ctatattggg aagagttaca tattagaaag gtctagagat + 19441 gattttaatt acaggggcaa atggccaatt aggaacggaa cttcgctatt tattggatga + 19501 acgtaatgaa gaatacgtgg cagtagatgt ggctaagatg gacattacca atgaagaaat + 19561 ggttgagaaa gtttttgaag aggtgaaacc gactttagtc taccattgtg cagcctacac + 19621 cgctgttgat gcagcagagg atgaaggaaa agagttggac ttcgccatca atgtgacggg + 19681 gacaaaaaat gtcgcaaaag catctgaaaa gcatggtgca actctagttt atatttctac + 19741 ggactatgtc tttgacggta agaaaccagt tggacaagag tgggaagttg atgaccgacc + 19801 agatccacag acagaatatg gacgcactaa gcgtatgggg gaagagttag ttgagaagca + 19861 tgtgtctaat ttctatatta tccgtactgc ctgggtattt ggaaattatg gcaaaaactt + 19921 cgtttttacc atgcaaaatc ttgcgaaaac 
tcataagact ttaacagttg taaatgacca + 19981 gtacggtcgt ccgacttgga ctcgtacctt ggctgagttc atgacctacc tagctgaaaa + 20041 tcgtaaggaa tttggttatt atcatttgtc aaatgatgcg acagaagaca caacatggta + 20101 tgattttgca gttgaaattt tgaaagatac agatgtcgaa gtcaagccag tagattccag + 20161 tcaatttcca gccaaagcta aacgtccgct aaactcaacg atgagcctgg ccaaagccaa + 20221 agctactgga tttgttattc caacttggca agatgcattg caagaatttt acaaacaaga + 20281 agtgagataa gtagtagaat gattttctag tctaataaaa gaggcagata atgaactcaa + 20341 aaggagctta aggtgtacga ttatcttgtt gttggtgctg gtctctttag tgcagtcttt + 20401 gcccatgaag tagccttaaa aggaaaaaag taaaagtcat tgaaaaacgg aatcatatcg + 20461 tgggtaatat ctatactcgt gaagaggaag gaattcaagt tcatcaatat ggtgctcata + 20521 tcttccatac ttctgataag gagagctggg attatgtaaa tcagtttgca gggtttaacc + 20581 gttacaccaa ttctcctgtt gcaaactata agggtgagat ttataacctt ccttttaata + 20641 tgaatacttt caataaactc tggggagttg taacgccagc agaagcacaa gctaagattg + 20701 aggaacaacg tgctatttta aatggtaaaa ctcctgaaaa tttggaagaa caggcgattt + 20761 ctcttgtagg tacagacatc tacgaaaaat taatcaaaga ctatacagag aaacagtggg + 20821 gcaaaccaac tactgaactt ccatccttta ttattcgccg tttaccagta cacctgacct + 20881 atgataacaa ctattttaac gatacctatc aagggattcc aattggtgga tacactcaaa + 20941 tagttgaaaa atgttggatt atgaaaatat tgatgtagaa acaaatgttg atttctttgt + 21001 gaacaaagag caatatctga aagattttcc taagattgtc tttactggta tgattgatga + 21061 attctttgac tataagttgg gcgaactaga gtaccgtagt cttcgttttg aaaatgagac + 21121 cttggatatg gaaaattacc aaggaaatgc agttgtgaac tatacggatg cagaaacccc + 21181 atatactcgc attattgaac acaaacattt tgagtttggg agtcaagcaa agactatcat + 21241 tactaaagaa cattctaaaa catgggaaaa aggtgatgag ccttattatc cagttaataa + 21301 tgatcgtaat aatcatttgt ataaatcgta taaaaaattt gctgatgagc aagggaatgt + 21361 tatctttggt ggccgcttag gacactatcg ttattacgat atgcaccaag taattggagc + 21421 agctttgcag tgcgtgagaa atgagttaga ttaatactca atgaaaatca aagagcaaac + 21481 taggaagcta gccacaggtt gctcaaaata ctgttttgag gttgcagatg gaagctgacg + 21541 cggtttgaag agattttcga agagtataaa 
caagtaaaac tgactaccag ttattattta + 21601 gaaatagtat taaaaattcc ttgactatgt gatatagttg agggattttt aaatgatatt + 21661 catatttttt gcaaagatgt tgtttgaaaa ataattttca aaaattctga aaattctgtt + 21721 gacatctttc tgaaaagagt ttataatgga gagaaagttt taaaggagaa aatgatgaaa + 21781 agttcaaaac tacttgccct tgcgggcgtg acattattg +// + diff --git a/public/res/serotype_genbank/serotype_18F.gb b/public/res/serotype_genbank/serotype_18F.gb new file mode 100644 index 0000000..49af2cf --- /dev/null +++ b/public/res/serotype_genbank/serotype_18F.gb @@ -0,0 +1,1066 @@ +LOCUS CR931674 22849 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain Gethens (serotype 18f). +ACCESSION CR931674 +VERSION CR931674.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 22849) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 22849) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..22849 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="Gethens" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC18F_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC18F_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI33596.1" + /db_xref="UniProtKB/TrEMBL:Q4JZI8" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVELL" + gene 293..461 + /gene="aliB" + /locus_tag="SPC18F_0002" + /pseudo + CDS 293..461 + /gene="aliB" + /locus_tag="SPC18F_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(459..1325) + /gene="tnp" + /locus_tag="SPC18F_0003" + /pseudo + CDS complement(459..1325) + /gene="tnp" + /locus_tag="SPC18F_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(930..1307) + /gene="tnp" + /locus_tag="SPC18F_0003" + /note="HMMPfam hit to PF01710, Transposase, score 9.3e-21" + /pseudo + gene 1560..3005 + /gene="wzg" + /locus_tag="SPC18F_0004" + CDS 1560..3005 + /gene="wzg" + /locus_tag="SPC18F_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33599.1" + /db_xref="GOA:Q4K240" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K240" + /translation="MSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGIDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIIDSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDLPSY + 
AMPDSNLYVMEINDSSLASVKTAIQDVLEGR" + misc_feature 1560..1676 + /gene="wzg" + /locus_tag="SPC18F_0004" + /note="Signal peptide predicted for SPC0938 by SignalP 2.0 + HMM (Signal peptide probability 0.993) with cleavage site + probability 0.538 between residues 39 and 40" + misc_feature 1764..2111 + /gene="wzg" + /locus_tag="SPC18F_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 2.3e-64" + misc_feature 2289..2732 + /gene="wzg" + /locus_tag="SPC18F_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 1.1e-69" + gene 3007..3738 + /gene="wzh" + /locus_tag="SPC18F_0005" + CDS 3007..3738 + /gene="wzh" + /locus_tag="SPC18F_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33600.1" + /db_xref="GOA:Q4K239" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K239" + /translation="MIDIHSHIVFDVDDGPKSREESKALLTEAYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKNRIPTLNNS + RYALIEFSMNTPYRDIHSALIKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKSKLFGERYKFMKKRAQYFLERDLVHVIASDMHNVDSRPPHMAEAYDLVS + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 3010..3618 + /gene="wzh" + /locus_tag="SPC18F_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 6.8e-38" + gene 3747..4439 + /gene="wzd" + /locus_tag="SPC18F_0006" + CDS 3747..4439 + /gene="wzd" + /locus_tag="SPC18F_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33601.1" + /db_xref="GOA:Q4K238" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K238" + /translation="MKEQNTIEIDVFQSLKTLWKYKLIILLVALVTGAGAFAYSTFIV + KPEYTSTTRIYVVNRNQGDKPGLTNQDLQAGTYLVKDYREIILSQDVLEKVATNLKLD + IPAKTLTSKVQVTVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIIAVTRVSDVT + 
TLEEARPATTPSSPNVRRNTLVGFLGGAAVTVITVLLIELLDTRVKRPEDVEDVLQMP + LLGVVPDFDKMK" + misc_feature 3765..4181 + /gene="wzd" + /locus_tag="SPC18F_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 4.7e-51" + misc_feature 4287..4364 + /gene="wzd" + /locus_tag="SPC18F_0006" + /note="PS00217 Sugar transport proteins signature 2." + gene 4449..5132 + /gene="wze" + /locus_tag="SPC18F_0007" + CDS 4449..5132 + /gene="wze" + /locus_tag="SPC18F_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33602.1" + /db_xref="GOA:Q4K135" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K135" + /translation="MPTLEISQVKLELAKKAEEYYNALCTNLQLSGDDLKVFSITSVK + AGEGKTTTSTNIAWAFARAGYKTLLIDADMRNSVMSGVFKSRERITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLGTLRKYFDYIIVDTPPIGIVI + DAAIITQKCDASILITATGEVNKRDVQKAKQQLEQTGKLFLGVVLNKLDISVDKYGAY + GSYGNYGKK" + gene 5148..6515 + /gene="wchA" + /locus_tag="SPC18F_0008" + CDS 5148..6515 + /gene="wchA" + /locus_tag="SPC18F_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI33603.1" + /db_xref="GOA:Q4K134" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K134" + /translation="MDEKGLKIFLAVLQSIIVILLIYFLSFVRETELERSSMVILYLL + HFFVFYFSSYGNNFFKRGYLVEFNSTIRYIFFFAIAISVLNFFIAERFSISRRGMVYF + LTLEGISLYLLNFLVKKYWKHVFFNLKNSKKILLLTVTKNMEKVLDKLLESDELSWKL + VAVSVLDKSDFQHDKIPVIEKEKIIEFATHEVVDEVFVNLPGESYDIGEIISRFETMG + IDVTVNLKAFDKDFGRNKQIHEMVGLDVVTFSTNFYKTSHVISKRILDICGATIGLIL + FAIASLVLVPLIRKDGGPAIFAQTRIGKNGRHFTFYKFRSMRIDAESIKEQLMDQNTM + QGGMFKIDNDPRVTKIGRFIRKTSLDELPQFWNVFIGDMSLVGTRPPTVDEYDQYTPE + QKRRLSFKPGITGLWQVSGRSKITDFDDVVKLDVAYIDNWTIWKDIEILLKTVKVVFM + RDGAK" + misc_feature 5931..6512 + /gene="wchA" + 
/locus_tag="SPC18F_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 4.1e-146" + gene 6546..7718 + /gene="wchF" + /locus_tag="SPC18F_0009" + CDS 6546..7718 + /gene="wchF" + /locus_tag="SPC18F_0009" + /note="member of homology group 15" + /codon_start=1 + /transl_table=11 + /product="putative rhamnosyl transferase WchF" + /protein_id="CAI33604.1" + /db_xref="GOA:Q4K133" + /db_xref="InterPro:IPR001296" + /db_xref="InterPro:IPR015393" + /db_xref="UniProtKB/TrEMBL:Q4K133" + /translation="MKKSVYIIGSKGIPAKYGGFETFVEKLTAFQQDKAIQYYVACMR + ENSAKSGTTEDVFEHNGAICYNVDVPNIGPARAIVYDIAAINRAIKIAKENKDEDPIF + YILACRIGPFIHGIKKKIQEIGGTLLVNPDGHEWLRAKWSAPVRRYWKISEGLMVKHA + DLLVCDSKNIEKYIQEDYKQYQPKTTYIAYGTDTTRSILKSSDEKVRSWFKKKNVSEN + EYYLVVGRFVPENNYEAMIRGFLASNSKKDFVLITNVEQNKFYNQLLASTGFDKDPRV + KFVGTVYDQELLKYIRENTFAYFHGHEVGGTNPSLLEALASTKLNLLLDVGFNREVGE + QSAIYWKKDELSQVIEKVEQFDAKMIDELDRQSNQRIVDFFTWEKIVTDYEKLFKK" + gene 7715..8986 + /gene="wciU" + /locus_tag="SPC18F_0010" + CDS 7715..8986 + /gene="wciU" + /locus_tag="SPC18F_0010" + /note="member of homology group 59" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33605.1" + /db_xref="GOA:Q4K132" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K132" + /translation="MKILHYTLGFQPQRTGGLVKYAEDLMLEQIAQGYQVAALYPGRI + KFFSKKIEIIKATSRQFECYELLNSLPMALFGGISDPTAFLTPCDKNVYRTFLEKVQP + DIIHIHSFMGLHKEFLEIAKNLNIRVVFTSHDYYGLAPVPHFYFNGVDYSDKSTNLTW + NIMSSNALSVKKLRLFQVSFYPTIRKLLKLLGKNPKSKKNLVIRDVIEEQDYSELRYY + YNEMFHLIDGYLFNSRLAKKVYEINEIKSANSIVLSITNSSINHHQRLTTTNNKIRVA + YIGPDEEYKGYFDFVDFVETLDRESYEVATYGHLPNEECPSFIEQKGYFTKEMIDSVY + ENIDILIVPSKWKETFGLITVEALSYGVNVFVSENVGSKDLLPESHVFKNQNDLVVKF + LKNDIENTKLKTLDEHSIEVIQYYERVINDS" + misc_feature 8489..8950 + /gene="wciU" + /locus_tag="SPC18F_0010" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 0.0015" + gene 8976..9662 + /gene="wcxM" + /locus_tag="SPC18F_0011" + CDS 8976..9662 + /gene="wcxM" + 
/locus_tag="SPC18F_0011" + /note="member of homology group 105" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI33606.1" + /db_xref="GOA:Q4K131" + /db_xref="InterPro:IPR011004" + /db_xref="UniProtKB/TrEMBL:Q4K131" + /translation="MIVKSFIKKITGKTVDIHPDVPLSYILQRGINYGFGLFRGVVRG + IGFGQNDKRLFIGQGVSILAKRKLFVGKNVRIGKKVSIDALSKEGIHFADNVKIGDYS + QIIGTGSIKNMGIGLKIGKNSSFSEYSLFGSAGGITIGDNVIAGQNVRFHAENHNYSD + LDKLIVEQGVSRKGISVGDNCWIGAGSVFLDGSSIGSGCVVGANAVVTKQFPDNVIIG + GVPARILAYR" + misc_feature 9174..9227 + /gene="wcxM" + /locus_tag="SPC18F_0011" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 16" + misc_feature 9240..9293 + /gene="wcxM" + /locus_tag="SPC18F_0011" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 13" + misc_feature 9381..9434 + /gene="wcxM" + /locus_tag="SPC18F_0011" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 10" + misc_feature 9495..9548 + /gene="wcxM" + /locus_tag="SPC18F_0011" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 11" + misc_feature 9549..9602 + /gene="wcxM" + /locus_tag="SPC18F_0011" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 0.77" + gene 9694..10740 + /gene="wciV" + /locus_tag="SPC18F_0012" + CDS 9694..10740 + /gene="wciV" + /locus_tag="SPC18F_0012" + /note="member of homology group 91" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33607.1" + /db_xref="GOA:Q4K130" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K130" + /translation="MPTFSVVVPVYNVENYLSQCLNALVNQSFKDFELILVNDGSTDT + SGSLCEEWGKKDHRIKVIHKTNEGLGFARNTGIENCTGDYIVFVDSDDYVSYEMLEIY + DTYLQRFNADVIYSENFYRVDNKGNIIEPLDQSLDSIFYKNDSIFTELLPDVISSPPE + FIGDGKIGVSVWKGVYKRSLFKDKGLLFHSEREFISEDAIFQIDCLKLAISALVIPDI + LYYYRENFGSLSMKYKEDRFELNKILYNEQLKRVEGLPNQEILEERIERILIANIRLC + 
IFQESLYKNSRIHKRLQRIRQICKDPISKSVLRHYPIRRLPFSKRLICVLAKYNMPLM + LLVLTLLKYRNRSV" + misc_feature 9706..10248 + /gene="wciV" + /locus_tag="SPC18F_0012" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 2.7e-41" + gene 10746..11657 + /gene="wciW" + /locus_tag="SPC18F_0013" + CDS 10746..11657 + /gene="wciW" + /locus_tag="SPC18F_0013" + /note="member of homology group 92" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33608.1" + /db_xref="GOA:Q4K129" + /db_xref="InterPro:IPR008441" + /db_xref="UniProtKB/TrEMBL:Q4K129" + /translation="MGMNIEKLKLSLKNGTFFSVVIHALRNRWPLWWIGNKAIREVQL + EDRAYRILKKKYGSLISSSFDKSYLSEEVPKQIWICWLQGMENAPELVKSCYRSLKKQ + FPEYVITVISSENISEYVEIPDIIYKKWGNGVIGNAHFSDILRVELLRKFGGIWIDST + VYCTGITTIETIEKNPFFMYKSLSSVEERISSSNWMIASVPNHPFMITMSTLLQSYWS + KEVIAIHYYLFHILFTIMIESLPELWQLVPTYTNATPHIMVDELNNIFSKERYQQLCQ + ISDFHKLNYKKNYNDKSESLYSHLLNQ" + misc_feature 10827..11645 + /gene="wciW" + /locus_tag="SPC18F_0013" + /note="HMMPfam hit to PF05704, Capsular polysaccharide + synthesis protein, score 1.8e-144" + gene 11669..13126 + /gene="wzx" + /locus_tag="SPC18F_0014" + CDS 11669..13126 + /gene="wzx" + /locus_tag="SPC18F_0014" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33609.1" + /db_xref="GOA:Q4K128" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K128" + /translation="MPNLKKNIVYNVLYQILAVIVPFITSPYLARVLGAEQIGVYSFT + YSIAFYFMILSMLGISNYGNRTIAQVRTSREHLNQEFSNIYAVQLTCSLVMTVSYLIY + ATVFVNSFQIVAYIQVLHVLSYATDVSWFFYGLEEFRITVARNSFVKLLTLISIFTFV + KSPNDIYLYTFIMAGSTLLGQLITWPFLLKQVNFVRPSLGKIKKHMKPIIILFFPVLA + ISIFSFIDKIMLGMYSSLRETAFYENSDKIISIPKALIQAFGAVMLPRTVHLLSIGDE + QKSLEYVDKTMWVVLVITMGCAFGLAGVSATFAPVYWGEEFRASSQIIAGMTPALVFS + AFGNVIRTQFLIPRSFDKEYTVSLLYGAVVNILINILLIPKIGAMGAVIGIIVAELVL + CCYQTWIARNYLHIREYLINAGILFLIGSVMYMVLILISSILPTSLLTLIIEIIVGAF + IYISLLILYIFSSKNRVIIGLRTNFLEHTHLFKRK" + misc_feature 11678..12481 + /gene="wzx" + 
/locus_tag="SPC18F_0014" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 1.9e-56" + gene 13129..14403 + /gene="wzy" + /locus_tag="SPC18F_0015" + CDS 13129..14403 + /gene="wzy" + /locus_tag="SPC18F_0015" + /note="member of homology group 93" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33610.1" + /db_xref="InterPro:IPR007016" + /db_xref="UniProtKB/TrEMBL:Q4K127" + /translation="MKFKFNPIAILYILLVYLELATDRQHLYPVTYMTKYYIGILIIV + LFVLLLVGRGKLIFVNKKLLYLAKILAIPTIVLFLYSVLLDVMNPVEFNGYFSRLSST + TIFGLLAIFQAIVVFQFFGQKVVDYTFTAISLSYLTSIIVAFRQGGLSQFILILTDDS + FNGSVLEMHEVAPITALFILYYLYKYFIKENSFSSVFHNILIALIILFLSLKRIVFLS + VLIIIPVFLVIYWYDKKVSKLGKERKILSLLNIFSLIFITGIFFYVYSVKSDFIYTFI + QEHNINSMARTDLWKGVESTYNFAPIFMGRGIGFVTKWMDNNWMTLNINGLTGSMGIH + NDILKYYIEIGFVGLFIYFYTLLYRNAKRIFVKIGHKESFIYFVLIMFQMLIWFTDNI + SIYHNFLWILNLLLFSLTNSDTELENLDFKNF" + misc_feature 13966..14178 + /gene="wzy" + /locus_tag="SPC18F_0015" + /note="HMMPfam hit to PF04932, O-Antigen Polymerase, score + 2.1e-09" + gene 14457..15458 + /gene="wciX" + /locus_tag="SPC18F_0016" + CDS 14457..15458 + /gene="wciX" + /locus_tag="SPC18F_0016" + /note="member of homology group 107" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI33611.1" + /db_xref="GOA:Q4K126" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q4K126" + /translation="MKTDARTKKRENETLYILKVWATFSVIAIHFGFLGQIGVFYKVL + ARFAVPLFFMISGFYSFSISEEKLKKRIKNLSLLIISSTSFYFLLDVFLQLTQGNLRV + VFERFTFNNIFNFLVFNQISALIGSLATPLWFLYALLYVYIYLFFSNKKWIFNTILTV + IILCCSFIIELKANSALFYRNFLFMGVPFFSFGMYFAQIQRKIINYKHFKELFIIGIM + ISGFLTLIEYTFLGANFELYISSVIISCMLMVFSIKYPQLWTLDFAVNIAKKNATFIY + ISHQFVILLFKTYVRDGIAYKIGTFLIFLACVIMSIIFNYIVDIISRCCIKEKQDII" + gene 15455..16615 + /gene="wciY" + /locus_tag="SPC18F_0017" + CDS 15455..16615 + /gene="wciY" + /locus_tag="SPC18F_0017" + /note="member of homology group 78" + /codon_start=1 + /transl_table=11 + 
/product="putative glycerol phosphotransferase" + /protein_id="CAI33612.1" + /db_xref="GOA:Q4K125" + /db_xref="InterPro:IPR007554" + /db_xref="UniProtKB/TrEMBL:Q4K125" + /translation="MKFYIKNLLKKVFTLPLHLLPIQSNKIIFDNFGGRGFGDNPKYI + LEELVSREKNLDLVWVTKDREISIPEGVRVVKYGSYRSFYEWLTARVWVDNIRNSDRP + WKRNGQIYLQTWHGSDGVKLIEKSVAGNLKKTYIRMAKYDGKITDGIVSSRHFQTLGM + QNNFWLTENVEFLEFGLPRNDDFFKSEKIKTTNIKFRTLFDIDLDELVVLYMPTFRDD + GSLNAYNLDYSKLIHVFQNKFRKNVRILVRFHPNVDSSFINLQDTDCINVSTYSNPQD + LMMSADVMITDYSSASIDFMLLNRPVFLYLPDYQSYVNDRPLDDNFDKLPFPRAYHNN + ELTEIIRDFERSKYDEKVRLYELEDVRFDRGKASVQCANWIEEKIKNNKVID" + misc_feature 16040..16585 + /gene="wciY" + /locus_tag="SPC18F_0017" + /note="HMMPfam hit to PF04464, + CDP-Glycerol:Poly(glycerophosphate) gl, score 8.2e-68" + gene 16657..17049 + /gene="gct" + /locus_tag="SPC18F_0018" + CDS 16657..17049 + /gene="gct" + /locus_tag="SPC18F_0018" + /note="member of homology group 28" + /codon_start=1 + /transl_table=11 + /product="CDP-glycerol-1-phosphate biosynthetic protein + Gct" + /protein_id="CAI33613.1" + /db_xref="GOA:Q4K124" + /db_xref="InterPro:IPR004820" + /db_xref="InterPro:IPR004821" + /db_xref="InterPro:IPR006409" + /db_xref="InterPro:IPR014729" + /db_xref="UniProtKB/TrEMBL:Q4K124" + /translation="MKRVITYGTFDLLHYGHINLLKRAKQLGDYLIVVVSSDEFNLKE + KNKVCYFNYEHRKNLVEAIRYVDLVIPETSWEQKKSDVKEYRIDTFVMGDDWKGKFDY + LEEEGVEVVYLPRTKEISTTKIKEDLSE" + misc_feature 16669..17037 + /gene="gct" + /locus_tag="SPC18F_0018" + /note="HMMPfam hit to PF01467, Cytidylyltransferase, score + 3.9e-29" + gene 17147..17691 + /gene="HG94" + /locus_tag="SPC18F_0019" + /pseudo + CDS join(17147..17257,17319..17507,17518..17691) + /gene="HG94" + /locus_tag="SPC18F_0019" + /note="member of homology group 94" + /pseudo + /codon_start=1 + /transl_table=11 + /product="hypothetical protein (pseudogene)" + gene 17896..18765 + /gene="rmlA" + /locus_tag="SPC18F_0020" + CDS 17896..18765 + /gene="rmlA" + /locus_tag="SPC18F_0020" + /EC_number="2.7.7.24" + /note="member of homology group 
10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI33615.1" + /db_xref="GOA:Q4K123" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q4K123" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLPRFKELLQDGYEFGIKLSYAEQPSPDGLAQAFIIGEKFIGDDSV + ALILGDNIYHGPGLSKMLQKVSSKESGATVFGYHVKDPERFGVVEFDKDMNAISIEEK + PEHPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVEVMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLTLAQPLKKN + EYGQYLLRLIGEA" + misc_feature 17899..18615 + /gene="rmlA" + /locus_tag="SPC18F_0020" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 4e-119" + gene 18766..19359 + /gene="rmlC" + /locus_tag="SPC18F_0021" + CDS 18766..19359 + /gene="rmlC" + /locus_tag="SPC18F_0021" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI33616.1" + /db_xref="GOA:Q7BTQ6" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:Q7BTQ6" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKHHPLLKDVKPLKKEDL" + misc_feature 18802..19332 + /gene="rmlC" + /locus_tag="SPC18F_0021" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 8.8e-16" + gene 19372..20421 + /gene="rmlB" + /locus_tag="SPC18F_0022" + CDS 19372..20421 + /gene="rmlB" + /locus_tag="SPC18F_0022" + /EC_number="4.2.1.46" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI33617.1" + /db_xref="GOA:Q4K121" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + 
/db_xref="UniProtKB/TrEMBL:Q4K121" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPGVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQATD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 19387..20343 + /gene="rmlB" + /locus_tag="SPC18F_0022" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 7.1e-05" + misc_feature 19390..20226 + /gene="rmlB" + /locus_tag="SPC18F_0022" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.0039" + misc_feature 19390..20130 + /gene="rmlB" + /locus_tag="SPC18F_0022" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 2.7e-76" + misc_feature 19393..20205 + /gene="rmlB" + /locus_tag="SPC18F_0022" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 1.6e-05" + gene 20487..21338 + /gene="rmlD" + /locus_tag="SPC18F_0023" + CDS 20487..21338 + /gene="rmlD" + /locus_tag="SPC18F_0023" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI33618.1" + /db_xref="GOA:Q4K1G6" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K1G6" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITNEEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 20487..21335 + /gene="rmlD" + /locus_tag="SPC18F_0023" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 4e-147" + misc_feature 20490..21131 + /gene="rmlD" + 
/locus_tag="SPC18F_0023" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.00013" + misc_feature 20490..21119 + /gene="rmlD" + /locus_tag="SPC18F_0023" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 9.9e-19" + misc_feature 20493..21221 + /gene="rmlD" + /locus_tag="SPC18F_0023" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 2.9e-08" + gene order(21401..21580,21584..22568) + /gene="glf" + /locus_tag="SPC18F_0024" + CDS join(21401..21481,21485..21580,21584..22249,22248..22568) + /gene="glf" + /locus_tag="SPC18F_0024" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI33619.1" + /db_xref="GOA:Q4K119" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K119" + /translation="MYDYLVVGAVFAHEAVLKGKKVKVIEKNHIAGNIYTREEEGIQV + HQYGAHIFHTSDKEIDYVNQFAEFNRYTNSPVANYKGEIYNLPFNMNTFNKLWGVVTP + AEAQAKIDEQRAILNGKTPENLEEQAISLVGTDIYEKLIKDYTEKQWGKPTTELPSFI + IRRLPVHLTYDNNYFNDTYQGIPIGGYNVIIENMLKDVEVELGVNFFANRQELEASAE + KVVFTGMIDQSFDYKHGELEYCSLRFDHEVLDEENYQGNAVVNYMDAETPYTRIIEHK + HFEFGGVKQRLSLLIEHSKTWEKGDEPYYPVNNDRNNHLYKSYKKLADEQGNVIFGGR + LGHYRYYDMHQVIGAALQCVRNELDSYSMKIKEQTRKLAVGCSKHCFEVADGS" + misc_feature order(21821..22248,22249..22424) + /gene="glf" + /locus_tag="SPC18F_0024" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 8.1e-107" + gene 22802..>22849 + /gene="aliA" + /locus_tag="SPC18F_0025" + CDS 22802..>22849 + /gene="aliA" + /locus_tag="SPC18F_0025" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33620.1" + /db_xref="UniProtKB/TrEMBL:Q4K1C2" + /translation="MMKSSKLFALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat 
tgaaatcgta taaaaacaag + 181 ggagaactgt ataaaaagca gaaatccttt gttttttata accaaggttt ataaactttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactattg aggagaaaga agatgaacat + 301 aaagaagcgt gtccttagtg caggcctgac ttttgcatct gttttgcttt tagttgcttg + 361 cggccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaactat ctattagact attacgctga taatatagtc aattgaaaca agagcaggat + 481 aaaaaagcct cgtaaaaggt attgcaactt ggtaatacct ttttgaggtg ctttttgata + 541 tgagcccatg ttttctcaat aggattgtat tcaggcgagt agggaggaag aggtaaaagt + 601 ttatgcccaa actcttcgca caagagttct agcttcccca ttctatggaa tcttacatta + 661 tccataataa taaccgatag tgtggttaat gttggtaaga gaaacttctg aaaccaagct + 721 tcaaaaaagt cgctcgtcat cgtctcttcg taagtcattg gagcgattaa ctcaccattc + 781 atttgttaga cctgcaacca aagaaatcct ctgatatctt cttccagata ctttgcctct + 841 tcttaactga ccttttaatg agcgaccata ttctcgataa aaataagtat cgaatcctgt + 901 ttccaatata aacaggtgct aggtgcttta aactattaaa attcttaaga aataaggcta + 961 ctttttctgg ctcttgttca tagtaggtgt ggttcttttt ttcgagtgta gcccatagct + 1021 ttgagtgcat agtggatggt agttggatga cagccaaatt cagaagctat ttcagtcaaa + 1081 taagcgtctg gattatcagt aagatagttt ttaagtctat ctctatcaac ttttcttggt + 1141 tttgttcctt ttacttggtg gtttagctct cctgttttct cttttagctt taaccagcca + 1201 taaatggtat tacgtgagat ttggaaaacg tgtgatgctt ctgttatact acctgttcgc + 1261 tcacaataag agagaacttt tttacgaaaa tctattgaat atgccataag aagattatac + 1321 cacattgtgt actataatta tattgaaact agaatagtac gcctctgctt ctaaaacatt + 1381 gttagaaatc gatttgactg tcctgatcga tttgtcatgt tcttatttca ttttactata + 1441 tttttggttc gcgggaagtc tactaagata cttaaagatg cagatagtga aaaaaaggtg + 1501 tagacattac cgtaaaaaag tgatataatc gtatgatgtt caatgtatag gtgttaatca + 1561 tgagtagacg ttttaaaaaa tcaggttcac agaaagtgaa gcgaagtgtt aatatagttt + 1621 tgttgactat ttatttattg ttagtttgtt ttttattgtt cttaatcttt aagtacaata + 1681 tccttgcttt tagatatctt aatctagtgg taactgcgtt agtcctacta gttgccttgg + 1741 tagggctact cttgattatc tataaaaaag ctgaaaaatt tactattttt ctgttggtgt + 1801 tctctatcct 
tgtcagctct gtgtcgctct ttgcagtaca gcagtttgtt ggactgacca + 1861 atcgtttaaa tgcgacttct aattactcag aatattcaat cagtgtcgct gttttagcag + 1921 atagtgagat cgaaaatgtt acgcaactga cgagtgtgac agcaccgact gggactgata + 1981 atgaaaatat tcaaaaacta ctagctgata tcaagtcaag tcagaatacc gatttgacgg + 2041 tcaaccagag ttcgtcttac ttggcagctt acaagagttt gattgcaggg gagactaagg + 2101 ccattgtcct aaatagtgtc tttgaaaaca tcatcgagtc agagtatcca gactacgcat + 2161 cgaagataaa gaagatttat accaagggat tcactaaaaa agtagaagct cctaagacgt + 2221 ctaagaatca gtctttcaat atctatgtta gtggaattga cacctatggt cctattagtt + 2281 cggtgtcgcg atcagatgtc aatatcctga tgactgtcaa tcgagatacc aagaaaatcc + 2341 tcttgaccac aacaccacgt gatgcctatg taccaatcgc agatggtgga aataatcaaa + 2401 aagataaatt aacccatgcg ggcatttatg gagttgattc gtccattcac accttagaaa + 2461 atctctatgg agtggatatc aattactatg tgcgattgaa cttcacttct ttcttgaaaa + 2521 tgattgactt attgggaggg atagatgttc ataatgatca agagttttca gctctacatg + 2581 ggaagttcca tttcccagta gggaatgtcc atctagactc tgagcaagct ttaggttttg + 2641 ttcgtgagcg ctactcccta gcagatggcg atcgtgaccg tggtcgcaac caacaaaagg + 2701 tgattgtggc tatccttcaa aaattaacgt caaccgaagc gctgaaaaat tatagtacga + 2761 tcattgatag cttgcaagat tctatccaaa caaatatgcc acttgagacc atgataaatt + 2821 tggtcaatgc tcagttagaa agtggaggga attataaagt aaattctcaa gatttaaaag + 2881 ggacaggtcg gacggatctt ccttcctatg cgatgccaga tagtaacctc tatgtgatgg + 2941 aaattaacga cagtagcctt gcatctgtca aaactgctat tcaggacgtg ttggagggca + 3001 gatgaaatga ttgatattca ttcgcacatt gtctttgatg tagatgatgg tcccaagtca + 3061 agagaggaaa gcaaggctct cttgacagaa gcctacaggc agggggtgcg aaccattgtc + 3121 tctacctctc accgtcgcaa gggcatgttt gaaactccag aagagaagat agcagaaaac + 3181 tttcttcagg ttcgggaaat agctaaggaa gtcgcgagtg acttagtcat tgcttatggg + 3241 gctgaaattt actacacacc agatgttttg gataagctgg aaaaaaatcg gattccgacc + 3301 ctcaataata gtcgttatgc cttgatagag tttagtatga acacccctta tcgcgatatt + 3361 catagtgcct tgattaaaat attgatgttg ggaattactc cagtcattgc ccacatcgag + 3421 cgctatgatg cacttgaaaa caatgaaaaa 
cgcgttcgag agctgatcga tatgggctgt + 3481 tacacgcaag taaatagttc acatgtcctc aaatccaaac tttttggaga acggtataaa + 3541 ttcatgaaaa aaagagcgca gtatttcttg gagcgtgatt tggttcatgt gattgcaagt + 3601 gatatgcata atgtggacag cagacctccc catatggcag aagcatatga ccttgtttct + 3661 caaaaatacg gagaagcgaa ggctcaggaa ctttttatag ataatcctcg aaaaattgta + 3721 atggatcaac taatttagga gaaataatga aagaacaaaa tacgatagaa atcgatgtat + 3781 ttcaatcact taaaacctta tggaaataca agctaatcat tttattagtg gcacttgtga + 3841 caggggcggg agcttttgca tatagcactt ttattgttaa gccagaatat acaagtacca + 3901 cgcgtattta cgtagtcaac cgtaatcaag gagataagcc gggactgacg aatcaggact + 3961 tgcaggcagg aacttatctg gtaaaagact accgcgaaat tatcctttcg caagatgtat + 4021 tggaaaaggt agcgacaaat ttgaaattgg atattccagc aaaaacgtta actagcaaag + 4081 tgcaagtgac tgtaccagcc gacactcgta tcgtctcaat ctctgtcaag gataaacaac + 4141 cagaggaagc cagtcgcatt gctaattctc tacgagaagt tgctgcagaa aagatcatcg + 4201 ctgtaacgcg agtatctgat gtaacgacgc ttgaagaagc gcgaccagct acgactccct + 4261 cttctccaaa tgttcgacgc aacaccttag ttggttttct tggaggagcc gccgtaacag + 4321 taattactgt tcttttgatt gagttgctcg atacccgtgt aaaacgtcct gaagatgttg + 4381 aagatgtact gcaaatgcca cttctaggag tcgttccaga ttttgataaa atgaaatagg + 4441 aggaagttat gccaacgtta gaaatctcac aggtgaaatt agaacttgcg aaaaaggcag + 4501 aggaatatta taatgctttg tgcacgaacc tacagttaag tggagatgat ttgaaagtat + 4561 tttctatcac ttctgtgaaa gcaggagaag gaaaaacaac gacttccacc aatatcgctt + 4621 gggcttttgc gcgtgcaggt tacaaaacgc tgctgattga tgcagacatg cgtaactccg + 4681 ttatgtcagg tgtctttaaa tcaagggaaa ggattactgg actaacagaa tttctatcag + 4741 ggacaacaga cctgtcacag gggctttgcg ataccaatat tgagaatctc tttgtgattc + 4801 aggctggctc tgtgtcacca aatccgacag cccttcttca aagtaagaat ttcagcacaa + 4861 tgcttggaac cttgcgtaaa tattttgatt atatcattgt tgatacacca cctattggaa + 4921 ttgttattga tgcggcaatt atcactcaaa agtgtgatgc gtccatcttg ataacagcaa + 4981 caggtgaggt gaataaacgt gatgtccaaa aagcgaaaca acaattagaa caaacaggga + 5041 aactgttcct gggagttgtt ttaaataaat tggatatctc ggttgataag 
tatggagctt + 5101 acggttccta tggaaattat ggcaaaaaat aacttagaaa agattttatg gatgaaaaag + 5161 gattgaaaat ttttctggca gtattgcaga gtattattgt cattttattg atttattttc + 5221 ttagctttgt tagagagaca gaacttgaac gttcttcgat ggttatacta taccttctcc + 5281 acttttttgt attttatttt agttcctatg gtaacaattt ttttaaaaga gggtacctag + 5341 ttgagtttaa tagtactata agatatattt ttttctttgc aatagctata agtgtattaa + 5401 acttttttat agcggaacgg tttagtatct ctagaagagg aatggtatac ttcttaactt + 5461 tagaaggaat atccttatac ttgttaaatt tcttagtaaa aaaatattgg aagcatgtgt + 5521 tttttaatct aaaaaatagc aagaaaattt tactgttaac agtaacgaaa aatatggaaa + 5581 aagttcttga taaattgcta gaatctgatg aactttcatg gaaattggta gcagtaagtg + 5641 ttttggataa atctgatttt caacatgata aaatacctgt aattgaaaag gaaaaaatta + 5701 ttgaatttgc aacgcatgaa gttgtggatg aggtgtttgt caatcttcca ggagagagct + 5761 acgatattgg agaaattatc tctaggtttg agacaatggg gatagatgta actgtaaatc + 5821 ttaaagcatt tgataaggat tttggtcgca ataaacaaat tcatgagatg gtaggattgg + 5881 atgtagtcac tttctctaca aatttttata aaactagtca tgtgatttca aagagaattc + 5941 tcgatatttg tggtgccact attggcctta ttctttttgc tatagctagt ctagttttag + 6001 ttccattgat tcgtaaagat ggcggaccag ctatttttgc tcaaactcgt atagggaaaa + 6061 atggtcgaca ttttaccttt tataaattcc gttcgatgcg gatcgatgct gaatctatca + 6121 aagaacagtt gatggatcaa aatacgatgc aaggtggtat gtttaagata gacaatgatc + 6181 ctcgtgttac aaaaattggt cgctttattc gtaaaaccag tttagatgag ttaccccagt + 6241 tttggaatgt atttatagga gatatgagtt tggtgggaac acgtccacct acagtagacg + 6301 agtatgatca gtatactcca gaacagaaac gtcgactcag ctttaaacct ggtattacag + 6361 gtttatggca ggttagcggc cgtagtaaaa taaccgattt tgacgatgtt gtaaaattag + 6421 atgtggctta tattgataat tggacaatct ggaaagatat tgaaattttg cttaaaactg + 6481 ttaaagttgt atttatgaga gatggagcga agtaatttct gtatatccat catattagga + 6541 gagaaatgaa aaagtcagtt tatatcattg gttcaaaagg aattcctgct aagtatggag + 6601 gatttgaaac ttttgttgaa aaattaacag ccttccaaca agataaggct atccaatatt + 6661 atgtggcttg tatgcgtgaa aactctgcaa aatcagggac tactgaggat gtttttgaac + 6721 ataatggtgc 
tatctgttat aacgtcgatg ttcctaatat tggtccagcg cgagccatag + 6781 tatatgatat cgcggcaatt aacagagcta ttaaaattgc caaagaaaat aaggatgaag + 6841 atccaatctt ctatattcta gcttgtcgaa tcggtccgtt catccatgga attaagaaaa + 6901 aaatccagga gataggtggg actcttctag ttaatccaga tggtcacgag tggttacgag + 6961 ctaagtggag cgctccagtt cgtcgttatt ggaaaatttc cgaaggtctt atggtcaaac + 7021 atgcagatct tttagtgtgt gatagtaaga atattgaaaa atatatccaa gaagattata + 7081 aacagtatca acctaagaca acctatatcg cttatgggac tgatacaaca cgctccatat + 7141 taaagagtag tgacgaaaaa gtacgttctt ggttcaaaaa gaagaatgtt tctgaaaacg + 7201 agtattacct agttgtagga cgttttgttc cagaaaataa ctatgaggct atgatacgtg + 7261 ggtttttagc atctaattct aagaaggact ttgtcctaat aacaaatgta gaacagaata + 7321 aattttataa tcaactatta gcaagtactg gctttgataa agatccacga gtgaaatttg + 7381 ttggaacagt ctacgatcaa gaacttctga agtatattcg agaaaacacc tttgcttact + 7441 tccatggaca tgaagttgga ggaaccaatc cttcgctttt agaagctctg gcatcaacta + 7501 aactgaattt attgctagat gttggcttta accgagaagt tggggagcaa agtgcaatct + 7561 attggaaaaa agatgagctt tcccaagtaa tcgagaaagt tgaacaattt gatgcaaaaa + 7621 tgattgatga gttagataga caatcaaatc agagaattgt ggattttttc acttgggaaa + 7681 agattgtcac agactacgag aaattattta aaaaatgaaa atattacatt atactttagg + 7741 atttcaaccc cagcgaacag gtggtttggt taaatatgct gaggatttaa tgctagagca + 7801 aattgctcaa ggttatcaag tggctgccct atatccagga agaattaagt tcttttcaaa + 7861 aaaaatagaa ataattaaag cgacgtcaag acagtttgag tgttatgagc tgcttaatag + 7921 cttacctatg gctttatttg gaggtatatc cgatccaact gctttcctga caccttgtga + 7981 caaaaatgtt tatcgtactt ttttagaaaa agtacaaccc gacattatac atattcactc + 8041 gtttatggga ttgcataaag aattcctcga aattgctaaa aacttgaata ttagagtggt + 8101 ttttacgagc catgattatt atggattagc acccgtacct catttctatt ttaatggggt + 8161 ggattatagt gataaaagta caaacttaac atggaatatt atgtcttcca atgctttaag + 8221 tgtgaaaaaa ctaagacttt ttcaggtttc attttatcct actattcgta aacttttgaa + 8281 actattaggg aaaaatccaa aatctaaaaa gaatttagtt attcgagatg ttattgagga + 8341 gcaagattat agtgagcttc gatactatta 
taatgagatg tttcacttaa tagatggtta + 8401 tttgtttaat agtagacttg caaagaaggt atatgagata aatgagatta agtcagctaa + 8461 tagtatagta ttatctataa caaatagttc aattaatcat catcagagat tgacaactac + 8521 aaataataaa attagagttg cttatattgg tccagatgaa gaatataaag gatattttga + 8581 ttttgttgac tttgttgaaa ctttagatcg agagtcctat gaagtggcaa cttatggcca + 8641 tttaccaaat gaagagtgtc cttcattcat tgaacaaaaa ggatatttta ctaaggaaat + 8701 gattgacagt gtctatgaaa atattgatat tcttattgtt ccaagtaagt ggaaggaaac + 8761 atttggattg ataacagtag aagcattatc ctatggggta aatgttttcg tgagtgaaaa + 8821 tgttggatca aaagacttac ttccagaatc gcatgttttt aaaaatcaga atgatttagt + 8881 agttaaattt ttaaaaaatg atatagaaaa tacaaaattg aaaactttag atgaacactc + 8941 gatagaagtg attcagtatt atgaaagagt gataaatgat agttaagagt ttcataaaaa + 9001 agattactgg aaaaacagta gacattcatc cagatgtacc tttgtcgtat atactacaaa + 9061 gaggtataaa ctatggtttc ggactctttc gtggggttgt acgtggaatc ggatttggtc + 9121 aaaacgacaa acgtttattc attggacaag gagtttctat cttagcaaag cgtaaattat + 9181 ttgttggaaa aaatgttcga attggtaaaa aggtgtctat agatgcactg tcaaaagaag + 9241 gaatccattt tgcagataat gtaaagattg gagattattc tcaaattatt ggcacaggtt + 9301 ctataaaaaa tatggggatt ggcttgaaaa tcggtaagaa ttcatctttt tcagaatata + 9361 gtttatttgg ttctgctgga ggtatcacaa ttggtgataa tgttatcgca ggtcagaatg + 9421 ttcgttttca tgctgaaaat cataattata gtgatttaga taaactcatt gttgaacaag + 9481 gggtatctcg aaagggaatt tcagtaggtg ataattgttg gattggtgct ggatctgttt + 9541 ttttggatgg gtccagcatc ggttcaggtt gtgttgttgg agcgaatgct gtcgtcacta + 9601 agcagtttcc agataatgtt atcataggtg gagtaccagc taggatactg gcctatagat + 9661 agtgtttaac tatttctgaa aggaagaaaa tttatgccta catttagtgt agttgttcca + 9721 gtttataatg tagagaatta tttatcgcaa tgtttaaatg ctcttgtaaa tcagtctttt + 9781 aaagattttg aacttatctt ggtaaatgat ggttctactg acacatctgg aagtctttgt + 9841 gaagaatggg gaaaaaaaga tcatcggata aaagtaatac ataaaaccaa tgaaggtctt + 9901 ggttttgcac gtaacacagg tattgaaaac tgtacaggag attatattgt ctttgttgat + 9961 tcggatgatt atgtctcata tgagatgctt gaaatttatg atacatactt 
acaacgtttt + 10021 aatgcagacg tgatttatag tgaaaatttt tatcgagtgg ataataaagg aaatattata + 10081 gaaccacttg atcagagcct agattccatt ttttataaaa atgattcaat tttcacagaa + 10141 cttttaccag atgtaatatc ttcaccacca gaatttattg gagatggaaa gataggtgtt + 10201 tcagtgtgga aaggggtata taaacgttct ttgtttaagg ataaggggct attatttcat + 10261 tcagaaagag aattcatttc agaagatgct atttttcaaa ttgattgttt aaaattagca + 10321 atatctgccc ttgttatccc agatatttta tattactatc gtgaaaactt tggttcttta + 10381 agtatgaaat ataaagaaga tcggtttgag ttgaataaaa tcttgtataa cgagcaatta + 10441 aaaagagttg aggggttacc taatcaagaa attttggaag aaagaattga gagaatttta + 10501 attgctaata ttcgtttatg tatctttcag gaatccttat ataaaaattc tagaattcat + 10561 aaacgtttgc aaagaattag acagatttgt aaggacccaa tatcaaaatc agtattacgt + 10621 cattatccaa tccgtcgttt acctttttct aaacgcttga tctgcgtatt agctaagtat + 10681 aatatgccgt tgatgctttt agttttaacc ttattaaaat atcggaatcg gagcgtataa + 10741 cttttatggg gatgaatata gaaaaattaa aactatcttt gaaaaatgga acgttttttt + 10801 ctgttgttat tcacgcctta cgaaatcgtt ggcctttatg gtggattggg aacaaggcta + 10861 ttcgagaagt gcaacttgaa gatagggcct acagaatact aaaaaagaaa tacggctcct + 10921 taatttcaag ctcttttgat aaatcatatt tatcagaaga agttcccaag caaatctgga + 10981 tttgttggct tcaaggtatg gagaatgctc cagagttggt gaaatcatgt tatagatcac + 11041 taaaaaaaca atttcctgaa tatgtcatta cggttatttc ttcagaaaat atttccgaat + 11101 atgtagaaat acctgatatt atttataaaa aatggggaaa tggtgtaata ggaaatgctc + 11161 atttttctga tatccttcgg gtagagctgt tacgtaagtt tgggggaata tggattgact + 11221 caacagtgta ttgtacagga attactacca tagagacaat tgaaaaaaat ccatttttta + 11281 tgtataaaag tttatcttca gttgaggaga gaatttcctc ttccaactgg atgattgctt + 11341 ctgttcccaa tcatccattt atgattacga tgagcacact cttgcaatct tattggtcaa + 11401 aagaagttat agcaattcat tattatctat ttcatattct ttttacgatt atgattgaat + 11461 cacttcctga gttgtggcag cttgtaccca cctatacgaa cgcaacacca catataatgg + 11521 ttgatgaatt aaataatatt ttttcaaagg aacgttacca gcaattgtgt caaatttcag + 11581 attttcataa attaaattat aaaaaaaatt acaatgataa atcagagagt 
ttgtacagtc + 11641 acttactgaa tcagtagagg ggagaatctt gcctaattta aagaaaaaca ttgtttacaa + 11701 tgtcttatat cagatcttag ctgtaatagt accgtttatt acctcacctt acttagcgcg + 11761 tgtgttaggt gcagagcaaa ttggagttta ttcttttact tattccattg ctttttactt + 11821 tatgattctg tccatgttgg gaatttctaa ttatgggaat cggacaatag cacaggtacg + 11881 aacaagtaga gaacatttga atcaagaatt ttcgaatatt tacgcggttc aattgacgtg + 11941 ttcactagta atgaccgtct catatttgat ttatgcaaca gtatttgtga atagttttca + 12001 gattgtagcc tatatccaag tattacatgt tttatcgtat gcaacagatg ttagttggtt + 12061 tttttatggt cttgaagagt ttcgtattac ggttgctagg aattcatttg ttaagttatt + 12121 aactttaata tctatcttta catttgtaaa aagccctaat gatatctatt tatatacctt + 12181 tataatggca gggagtaccc tgcttggtca gttgattaca tggccatttt tgctaaaaca + 12241 agtaaacttt gtgcgcccta gtcttggaaa aataaagaaa cacatgaaac ctattattat + 12301 tttatttttt cccgtcttag cgattagtat tttttcgttt atagataaaa taatgcttgg + 12361 gatgtatagt agtttgaggg aaactgcttt ttatgagaat tcagataaga tcattagtat + 12421 tccaaaagct ctgattcaag cctttggagc tgtaatgttg cctcgaacag tacatttact + 12481 gagtataggt gatgaacaaa aaagtttaga atatgttgat aaaacgatgt gggttgtttt + 12541 agtgattaca atgggctgtg ctttcggttt agcaggagtt tctgcaacct ttgctcctgt + 12601 ttattggggt gaagaattta gggccagtag ccaaattatt gcaggaatga caccggcttt + 12661 agtattttcg gcttttggaa atgtcatccg aacccagttt ttaattccac gaagttttga + 12721 caaggaatat acggtatctt tgctttatgg agccgtagtt aatatcttga ttaatattct + 12781 tttgattccg aagataggag caatgggagc tgttatcgga ataattgttg cagagttagt + 12841 tctatgttgc tatcaaacgt ggattgctag aaattattta catatcagag aatatctgat + 12901 aaatgctggg atattgtttc ttattggttc agtaatgtat atggttttaa ttcttatttc + 12961 aagtatttta cctacatcgt tacttacact tattattgaa attatagtcg gagctttcat + 13021 ttatattagt ttactgattc tgtatatctt ttcttcaaaa aacagggtaa ttattggttt + 13081 acgaacaaat tttttagaac atactcattt atttaaaagg aagtaatagt gaaatttaaa + 13141 tttaatccaa tcgcgatact gtatatattg ctagtatact tagagttggc tacagatagg + 13201 caacatctgt atcctgtaac gtacatgaca aaatattata ttggtatttt 
aattattgtg + 13261 ttgtttgttt tattattagt aggccgtggg aagcttattt ttgttaataa aaaattatta + 13321 tatcttgcta agatattagc tataccaaca attgttcttt tcctgtactc agtcttacta + 13381 gacgtaatga acccagttga atttaatgga tattttagta ggttatcaag tacgactatt + 13441 tttggtttgt tagctatctt tcaagctata gttgtttttc aattttttgg acaaaaagta + 13501 gtagattaca cttttacagc tatctccctc agctacttaa ccagtatcat tgttgccttt + 13561 aggcagggag gacttagtca atttatcttg atactaacag atgatagttt caatggttcg + 13621 gtactagaaa tgcatgaagt tgcacctatt acagccctct ttattctgta ctatttgtac + 13681 aaatatttta taaaagaaaa tagtttttct tcagtatttc ataatatctt aatagctctc + 13741 attattcttt ttttaagcct taaacgaatc gtttttttga gtgtattaat tatcatacca + 13801 gtatttttgg taatttattg gtatgataaa aaagtaagca aactagggaa agaacgaaaa + 13861 attttaagtt tattaaatat cttttcctta atatttataa caggaatatt cttttatgtt + 13921 tatagtgtaa aatctgattt tatatataca tttattcaag aacataatat taattcgatg + 13981 gctagaacag atttatggaa gggagttgaa tcaacctata atttcgcccc tatatttatg + 14041 gggagaggga tagggtttgt aacaaaatgg atggataata attggatgac tttgaatatc + 14101 aatggtctta caggatcaat ggggatccat aatgatattt tgaagtacta cattgagata + 14161 ggatttgtag gattatttat ttatttttac actcttcttt atagaaatgc taaacgtata + 14221 tttgtaaaaa ttggtcataa agaatcattc atatattttg tattgataat gtttcagatg + 14281 ctgatatggt ttacagataa tatttcaatt taccataatt ttttatggat cctaaatcta + 14341 ctactctttt ctttaactaa ttcggataca gaattggaaa atttagattt taaaaatttt + 14401 taatgtgtaa gtagtaacta ctaattttat taaaaaatca gaatataggt gtatttatga + 14461 agacagatgc taggactaaa aagagagaga atgaaacgtt atatattcta aaagtttggg + 14521 caacatttag tgtgattgct atacattttg gttttttggg ccaaattgga gtgttttaca + 14581 aagtattagc tcgatttgct gtacctttat ttttcatgat ttcaggattt tattcgttta + 14641 gtatttcaga agaaaaactg aagaaaagaa ttaaaaatct gagtttattg ataatttcca + 14701 gtacaagttt ttatttttta ctggatgttt ttcttcaatt aacacaagga aatctaagag + 14761 ttgtatttga aagatttact tttaataata tttttaattt tttggtattc aatcaaattt + 14821 ctgctctaat tggctcgtta gcaacaccac tatggttctt atatgcatta 
ctgtatgttt + 14881 atatttatct atttttttca aataaaaaat ggatatttaa tactatcttg actgtgatca + 14941 tactctgttg ttcatttata atcgagttaa aagcaaatag tgctttattt tatagaaact + 15001 tcttatttat gggagttccc ttcttttctt ttgggatgta ttttgctcaa attcagagaa + 15061 aaattataaa ttataagcac ttcaaagaac tttttataat tggaattatg atttcaggat + 15121 ttctaactct gattgaatat acctttttag gagcaaattt tgaactttat ataagttcgg + 15181 tgataatatc ttgtatgctt atggtctttt cgattaaata tcctcaactc tggacgctag + 15241 attttgctgt caatattgct aaaaaaaatg cgacgtttat ttatattagt catcaatttg + 15301 tgattttatt atttaaaaca tacgttaggg atggaattgc ttataaaatt ggaactttct + 15361 tgatattttt agcatgtgtt attatgagta ttattttcaa ctatatagtc gatataatca + 15421 gtcgttgttg cataaaagaa aaacaagata taatatgaaa ttttatataa aaaatttact + 15481 aaaaaaagtc tttacattac cgttgcattt attgcctatt cagtctaata agataatatt + 15541 tgataatttt ggtggtagag gttttgggga caatcctaag tatatacttg aagaacttgt + 15601 ctctcgagaa aagaatctag atcttgtgtg ggtaacaaaa gatagagaaa tttctatccc + 15661 tgaaggcgtt cgagtagtaa aatacggcag ttaccgttct ttttatgaat ggttaacagc + 15721 tagagtttgg gtagataata ttcgtaattc tgatcgacct tggaagcgaa acggacagat + 15781 ttatcttcaa acttggcatg gttcagatgg ggtaaagtta attgaaaaaa gtgttgcagg + 15841 gaacctaaaa aaaacatata ttagaatggc gaagtatgat ggaaagatta cagacggtat + 15901 cgtatcaagt cggcactttc aaactttggg tatgcaaaat aatttttggc tgacagagaa + 15961 tgtggaattt ctggaatttg gattacctcg aaatgatgat ttttttaaaa gtgaaaaaat + 16021 caaaaccaca aatataaaat ttagaacatt atttgatatc gatttagacg aactggtagt + 16081 tttgtatatg ccgacgttca gagatgatgg atcgttgaat gcctataatt tagattactc + 16141 gaaactaata catgtttttc aaaataaatt tagaaaaaat gtaagaatat tagttcgttt + 16201 tcatccaaat gttgattcta gttttataaa tttacaggat acagactgta taaatgtgtc + 16261 gacctattca aatcctcagg atctgatgat gagtgcggat gtgatgatta cggattattc + 16321 atcggcttct attgatttta tgttattaaa tcgtccagta tttctgtatt taccagatta + 16381 tcaaagttat gtgaatgata gaccattgga tgataacttt gataaattgc catttccaag + 16441 agcatatcat aacaatgagt tgacagaaat tattagagac tttgaaagaa 
gtaaatatga + 16501 tgaaaaagtt cgtctgtatg aattagagga tgttcgtttt gatagaggaa aagcatcagt + 16561 acagtgtgct aattggattg aagaaaaaat aaaaaacaat aaagttattg attgaaataa + 16621 ttatatttat tgaatgataa ataaggaggc ctttagatga aaagagttat aacatatggt + 16681 acatttgatt tattgcatta tggtcatatc aatcttttga aacgtgctaa acagctaggt + 16741 gattatttga ttgtagttgt ttcaagtgat gagtttaatt taaaagaaaa gaataaagta + 16801 tgttacttta actacgaaca cagaaaaaat ttagtagaag ctattcgata tgtcgattta + 16861 gtaatccctg aaactagttg ggaacagaaa aagtcagatg ttaaagagta ccgtattgac + 16921 acttttgtaa tgggtgatga ttggaaaggt aaatttgatt atcttgaaga agaaggtgtt + 16981 gaagtagtct atttgcctag aacaaaggaa atatcaacca caaagataaa agaagattta + 17041 tcggaatgaa atattattaa aaaatgctga cataagaaat tgtgactttt gtgtctagtt + 17101 tttgatagaa taaagtaaca acactttaac caatgaggtg tgaataatgg tagtaatttt + 17161 taaagatgta cttgttgaag agaaaactga tgaagaaaaa caacatattt tatctatttt + 17221 aaatgatgag aatgttagag cttttgattg tggatattaa gaattgaatg atgttttttg + 17281 atatttagaa caaatacgat gaagaaacag gccatgtatt gcctattgta aatcaaaatt + 17341 ttgaattatt aggttttatt tcttgtagac tagtatcatt ttctttcata gctcaggtta + 17401 aagagatggg aattagcata gattatcttg gtattcataa ggattgccag aaaatgggtg + 17461 atcggttcgc ttttggtgct ctttgcgctt cgattatctt taactattga ctgttgatta + 17521 ccaataaaag gtgtaatagt tcatgctttc gaggatgttg tagaattcta tgacaaactg + 17581 ggttttattg accctagaga tatagtgatt tataatggca aaccggttac tatatatttt + 17641 agtattgaaa aactaagaaa tggtgaaaat tattcctctc acacagttat ttgaaacatc + 17701 cttagaaaat gatttttaat tgtatgcaaa caaagtagaa ttcgcttatt tcatcttatg + 17761 ctaaatgtaa tatgaaacaa gtgaattttt atagataaag aagaatttta aaaaatgtga + 17821 tgattatttt ctttttagag cagtacagaa ttaatagtaa ttgactctaa atcaataaag + 17881 aaaggtaccc cttttatgaa aggtattatt ctagcaggtg gttcgggaac tcgcttgtat + 17941 cctttgactc gcgctgcatc aaaacaactt atgccggttt atgataaacc gatgatttac + 18001 tacccacttt caacattaat gttggctggg attagggata ttttgattat ctcaactcct + 18061 caagatttgc ctcgttttaa agagcttctt caagatggtt atgagtttgg 
tattaaactt + 18121 tcttatgctg agcaaccaag tccagatggt ttggcacaag cctttatcat tggggaaaag + 18181 tttattggtg atgatagtgt tgcgctaatc ttaggcgaca atatctacca tgggcctggt + 18241 ctttctaaga tgctacaaaa ggtatcaagt aaggagtcgg gagcaactgt ttttggctac + 18301 catgtcaagg atccagagcg ctttggtgta gttgagtttg acaaggatat gaacgctatt + 18361 tctatcgaag aaaagccaga gcaccctcgt tcaaactatg cagttacagg actctatttc + 18421 tatgataatg atgtagtaga gattgccaaa agtataaaac caagccctcg tggtgaactg + 18481 gaaattacag atgtaaacaa ggcttaccta gatcgtggag atttatccgt tgaggttatg + 18541 ggacgaggct ttgcttggct ggatactgga actcatgaaa gtttattaga ggcttcacag + 18601 tacatcgaga cagtgcaacg gatgcaaaat gttcaggtgg caaacttaga agaaattgcc + 18661 tatcgcatgg gttatatcag tcgtgaagat gtattgacct tagctcaacc acttaagaaa + 18721 aatgaatacg gacagtatct gctccgtttg attggagaag catagatgac agataatttt + 18781 ttcggtaaga cgcttgcggc acgcaaggtt gaagctattc caggcatgtt ggagtttgat + 18841 atccccgttc atggagataa tcgtggctgg tttaaagaaa atttccaaaa ggaaaaaatg + 18901 cttccacttg gatttccaga gtctttcttt gcagaaggaa aattgcaaaa caatgtatcc + 18961 ttctcacgta aaaatgtcct tcgagggctc cacgcagagc cttgggataa gtacatctct + 19021 gtagcagatg gagggaaagt tctgggttct tgggttgatc tacgcgaggg tgaaaccttt + 19081 gggaatacct atcagacagt aattgatgca agcaagggaa tctttgttcc tcgaggcgta + 19141 gctaatggct tccaagttct atcagataca gtgtcatata gctatctggt caatgattac + 19201 tgggctctcg agctcaaacc caagtatgcc tttgtgaact acgctgatcc aagccttggt + 19261 attgaatggg aaaatattgc agaagcagag gtttcagaag cagataaaca tcatccccta + 19321 cttaaggatg taaaaccttt gaaaaaagaa gatttgtaaa aaggaaagaa tatgactgaa + 19381 tacaaaaata ttatcgtgac aggtggagct ggctttatcg gttctaactt tgtccattat + 19441 gtttacgaga actttccagg tgttcacgtg acagtcctag ataagttgac ttatgctgga + 19501 aatcgcgcga atattgagga aattttaggt aatcgtgttg agttagttgt tggtgacatt + 19561 gctgatgcgg agttggtaga caagttggct gctcaagcag atgctatcgt tcattatgca + 19621 gcggaaagcc acaatgataa ttcgctcaat gatccatcgc catttattca tactaacttc + 19681 atcggaacct atactctttt agaagctgct cgtaagtatg atattcgctt 
ccaccatgta + 19741 tcgacagatg aagtttatgg ggatctccct ttacgcgaag atttgccagg tcatggtgaa + 19801 ggaccaggtg agaaatttac tgctgaaaca aaatacaacc caagctctcc gtactcatca + 19861 accaaggcag cctcagattt gattgtcaaa gcctgggtgc gttcttttgg agtcaaggca + 19921 acgatttcca actgttcaaa taactacggt ccttatcaac atatcgaaaa attcatccca + 19981 cgtcagatta ctaacatcct aagtggaatt aagccaaaac tttacggtga aggtaagaat + 20041 gttcgtgact ggattcatac caatgaccat tcttcaggag tttggacaat cttgacaaaa + 20101 gggcaaatcg gtgaaaccta cttgattggg gctgatggtg agaagaacaa taaggaagtt + 20161 ttggaactta tccttaagga aatgggacaa gctacggatg cctatgatca tgtgactgac + 20221 cgtgcaggac atgaccttcg ctatgcgatt gatgccagca agctccgtga tgagttgggg + 20281 tggaaacctg aatttaccaa ctttgaagct gggctcaagg caacaatcaa gtggtataca + 20341 gataaccaag aatggtggaa agcagaaaaa gaagctgttg aagccaatta tgctaagact + 20401 caggagatta ttacagtata aaaagcagga aatagctgct ttttattgct atattgggaa + 20461 gagttacata ttagaaaggt ctagagatga ttttaattac aggggcaaat ggccaattag + 20521 gaacggaact tcgctattta ttggatgaac gtaatgaaga atacgtggca gtagatgtgg + 20581 ctgagatgga cattaccaat gaagaaatgg ttgagaaagt ttttgaagag gtgaaaccga + 20641 ctttagtcta ccattgtgca gcctacaccg ctgttgatgc agcagaggat gaaggaaaag + 20701 agttggactt cgccatcaat gtgacgggga caaaaaatgt cgcaaaagca tctgaaaagc + 20761 atggtgcaac tctagtttat atttctacgg actatgtctt tgacggtaag aaaccagttg + 20821 gacaagagtg ggaagttgat gaccgaccag atccacagac agaatatgga cgcactaagc + 20881 gtatggggga agagttagtt gagaagcatg tgtctaattt ctatattatc cgtactgcct + 20941 gggtatttgg aaattatggc aaaaacttcg tttttaccat gcaaaatctt gcgaaaactc + 21001 ataagacttt aacagttgta aatgaccagt acggtcgtcc gacttggact cgtaccttgg + 21061 ctgagttcat gacctaccta gctgaaaatc gtaaggaatt tggttattat catttgtcaa + 21121 atgatgcgac agaagacaca acatggtatg attttgcagt tgaaattttg aaagatacag + 21181 atgtcgaagt caagccagta gattccagtc aatttccagc caaagctaaa cgtccgctaa + 21241 actcaacgat gagcctggcc aaagccaaag ctactggatt tgttattcca acttggcaag + 21301 atgcattgca agaattttac aaacaagaag tgagataagt agtagaatga 
ttttctagtc + 21361 taataaaaga ggcagagaat gaactccaaa ggagcttaag atgtacgatt atcttgttgt + 21421 tggtgcagtc tttgcccatg aagcagtctt aaaaggaaaa aaagtaaaag ttattgaaaa + 21481 atgaaatcat atcgcgggta atatctatac tcgtgaagag gaaggaattc aagttcatca + 21541 atatggtgct catatcttcc atacttctga taaggagatc tgagattatg taaatcagtt + 21601 tgcagagttt aaccgttata ccaattctcc tgttgcaaac tataagggag agatttataa + 21661 cttacctttt aatatgaata ccttcaataa actctgggga gttgtgacgc cagcagaagc + 21721 acaagctaag attgatgaac aacgtgctat tttaaatggt aaaactcctg aaaatttgga + 21781 agaacaggcg atttctcttg taggtacaga catctacgaa aaattaatca aagactatac + 21841 agagaaacag tggggcaaac caactactga acttccatcc tttattattc gccgtttacc + 21901 agtacacctg acctatgata acaactattt taacgatacc tatcaaggga ttccaattgg + 21961 tggttataat gttatcatcg aaaatatgct gaaggatgta gaagtagaac ttggagtgaa + 22021 cttttttgcc aatcgtcaag aattagaggc ttctgctgaa aaggttgtct ttacagggat + 22081 gattgaccaa tcctttgatt ataaacatgg tgagttagaa tactgtagtc ttcgttttga + 22141 tcatgaagtt ctagatgagg aaaactatca aggaaacgca gttgtgaact atatggatgc + 22201 agaaacccca tatactcgca ttattgaaca caaacatttt gagtttggga gtcaagcaaa + 22261 gactatcatt actaatagaa cattctaaaa catgggaaaa aggtgatgag ccttattatc + 22321 cagttaataa tgatcgtaat aatcatttgt ataaatcata taaaaaactt gctgatgagc + 22381 aagggaatgt tatctttggt ggccgcttag gacactatcg ttattacgat atgcaccaag + 22441 taattggagc agctttgcag tgcgtgagaa atgagttaga ttcatactca atgaaaatca + 22501 aagagcaaac taggaagcta gccgtaggtt gctcaaaaca ctgttttgag gttgcagatg + 22561 gaagctgacg cggtttgaag agattttcga agagtataaa caagtaaaac tgactaccag + 22621 ttattattta gaaatagtat taaaaattcc ttgactatgt gatatagttg agggattttt + 22681 aaatgatatt catatttttt gcaaagatgt tgtttgaaaa ataattttca aaaattctga + 22741 aaattctgtt gacaactttc tgaaaagagt ctataatgga gagaaagttt taaaggagaa + 22801 aatgatgaaa agttcaaaac tatttgccct tgcgggcgtg acattattg +// + diff --git a/public/res/serotype_genbank/serotype_18X1.gb b/public/res/serotype_genbank/serotype_18X1.gb new file mode 100755 index 
0000000..8aa20ed --- /dev/null +++ b/public/res/serotype_genbank/serotype_18X1.gb @@ -0,0 +1,1177 @@ +LOCUS MK606431 29861 bp DNA linear BCT 30-SEP-2020 +DEFINITION Streptococcus pneumoniae strain GPS_IN_IIT_NP32 cps gene cluster, + complete sequence. +ACCESSION MK606431 +VERSION MK606431.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 29861) + AUTHORS van Tonder,A.J., Gladstone,R.A., Lo,S.W., Nahm,M.H., du Plessis,M., + Cornick,J., Kwambana-Adams,B., Madhi,S.A., Hawkins,P.A., + Benisty,R., Dagan,R., Everett,D., Antonio,M., Klugman,K.P., von + Gottberg,A., Breiman,R.F., McGee,L., Bentley,S.D. and The Global + Pneumococcal Sequencing,C.O. + TITLE Putative novel cps loci in a large global collection of pneumococci + JOURNAL Microb Genom 5 (7) (2019) + PUBMED 31184299 +REFERENCE 2 (bases 1 to 29861) + AUTHORS van Tonder,A.J. + TITLE Direct Submission + JOURNAL Submitted (06-MAR-2019) Parasites and Microbes, Wellcome Sanger + Institute, Wellcome Genome Campus, Hinxton, Cambridge CB10 1SA, + United Kingdom +COMMENT ##Assembly-Data-START## + Assembly Method :: Velvet v. 
1.2 + Sequencing Technology :: Illumina + ##Assembly-Data-END## +FEATURES Location/Qualifiers + source 1..29861 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="GPS_IN_IIT_NP32" + /isolation_source="nasopharyngeal swab" + /host="Homo sapiens" + /db_xref="taxon:1313" + /geo_loc_name="India" + /collection_date="2014" + misc_feature 1..29861 + /note="cps gene cluster" + gene 1..1611 + /gene="dexB" + CDS 1..1611 + /gene="dexB" + /EC_number="3.2.1.70" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3280" + /inference="protein motif:CLUSTERS:PRK10933" + /inference="protein motif:Pfam:PF00128.18" + /inference="protein motif:TIGRFAMs:TIGR02403" + /inference="similar to AA sequence:RefSeq:YP_004326655.1" + /inference="similar to AA sequence:UniProtKB:Q99040" + /note="trehalose-6-phosphate hydrolase; maltooligosyl + trehalose synthase; alpha,alpha-phosphotrehalase; alpha + amylase catalytic domain protein" + /codon_start=1 + /transl_table=11 + /product="glucan 1,6-alpha-glucosidase" + /protein_id="QCO91906.1" + /translation="MQEKWWHNAVVYQVYPKSFMDSNGDGVGDLPGITSKLDYLAKLG + ITAIWLSPVYDSPMDDNGYDIADYQAIAAIFGTMEDMDQLIAEAKKRDIRIIMDLVVN + HTSDEHAWFVEACENTDSPERDYYIWRDEPNDLDSIFSGSAWEYDEKSGQYYLHFFSK + KQPDLNWENEKLRQKIYEMMNFWIDKGIGGFRMDVIDMIGKIPDEKVVNNGPMLHPYL + KEMNQATFGDKELLTVGETWGATPEIAKLYSDPKGQELSMVFQFEHIGLQYQEGQPKW + HYQKELNIAKLKEIFNKWQTELGVEDGWNSLFWNNHDLPRIVSIWGNDQEYREKSAKA + FAILLHLMRGTPYIYQGEEIGMTNYPFETLDQVEDIESLNYAREALEKGVPIEEIMDS + IRVIGRDNARTPMQWDESKNAGFSTGQPWLAVNPNYEMINVQEALANPDSIFYTYQKL + VQIRKENSWLVRADFELLDTADKVFAYIRKDGDRRFLVVANLSNEEQDLTVEGKVKSV + LIENTAAKEVLEKQVLAPWDAFCVEMTD" + CDS complement(1742..3142) + /gene="tnp" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF00665.20" + /inference="similar to AA sequence:RefSeq:YP_006065738.1" + /note="integrase core domain protein" + /codon_start=1 + /transl_table=11 + /product="IS1202 transposase" + /protein_id="QCO91907.1" + 
/translation="MKKYLVIKAIAQGKKTKKRACAELNLSERQINRLLLAYQLKGKE + AFRHGNRNRKPKHAIPDEIKGRLLKKYLSYETYKPNVLHFCELLAEEEGIQLSDTTVR + KILYKENILSPKSHRKTKKRVRRQAKLNPKQPLDNPILPTAENFLEDPKKVHPSRPRK + KFAGELIQMDASPHAWFGAQTSNLHLAIDDASGNILGAYFDKQETLNTYYHVLEQILG + NHGIPLQIKTDKRTVFTYQVSNSKKMEDDTHTQFGYACHQLGILLETTSIPQAKGRVE + RLNQTLQSRLPIELERNNIHTLEEANTFLLSYIQTFNEQFGNKTKLSVFEEVPNPSER + NLILARLAERVVDSGHHIRFQNRYYIPTEQGKEVYFIRKTKALVIKAFNGDIYLNIAD + KIYRTKELLDHELYSKNFEQEPEQKKKDTSISLHKPIRGNSHLSNNIFIKIKRIMKSL + LVRSLILLNYKYSKMK" + gene 3327..4772 + /gene="wzg" + CDS 3327..4772 + /gene="wzg" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK09379" + /inference="protein motif:Pfam:PF03816.8" + /inference="protein motif:TIGRFAMs:TIGR00350" + /inference="similar to AA sequence:RefSeq:YP_001835063.1" + /inference="similar to AA sequence:UniProtKB:Q7WY78" + /note="putative transcriptional regulator ywtF; + membrane-bound transcriptional regulator LytR; cell + envelope-related function transcriptional attenuator + common domain; cell envelope-related transcriptional + attenuator domain protein" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Cps14A" + /protein_id="QCO91908.1" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLSVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLLFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSLSVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + ADHSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYIKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRGRYSLADGDRDRGRNQQKVIVAIIQKLTST + EVLENYSSILQGLQDSLQTNMPIETMIDLVNTQLESGGNYKVNSQDLKGTGRMDLPSY + AMPDSNLYVMEIDDSSLTVVKAAIQDVMEGR" + gene 4774..5505 + /gene="wzh" + CDS 4774..5505 + /gene="wzh" + /EC_number="3.1.3.48" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG4464" + /inference="protein motif:Pfam:PF02811.13" + 
/inference="similar to AA sequence:RefSeq:YP_002739714.1" + /inference="similar to AA sequence:UniProtKB:Q54518" + /note="capsular polysaccharide biosynthesis protein; PHP + domain protein" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein phosphatase wzh" + /protein_id="QCO91909.1" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAEAYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTLDTLEKLEKKEIPTLNDS + RYALIEFSMHTSYRQIHTGLSNILMLGITPVIAHIERYDALENNEKHVRELIDMGCYT + QINSYHVSKPKFFGEKYKFMKKRARYFLERDLVHVVASDMHNLDSRPPYMQQAYDIIA + KKYGAKKAKELFVDNPRKIIMDQLI" + gene 5514..6206 + /gene="wzd" + CDS 5514..6206 + /gene="wzd" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3944" + /inference="protein motif:Pfam:PF02706.9" + /inference="protein motif:TIGRFAMs:TIGR01006" + /inference="similar to AA sequence:RefSeq:YP_001835065.1" + /inference="similar to AA sequence:UniProtKB:P72367" + /note="capsular polysaccharide type 8 biosynthesis protein + cap8A; capsular polysaccharide biosynthesis protein; MPA1 + family polysaccharide export protein; chain length + determinant protein" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Cps14C" + /protein_id="QCO91910.1" + /translation="MKEQNTLEIDGLQLFRALWKRKLVILLVAIITSSVAFAYSTFVI + KPEFTSTTRIYVVNRNQEEKPGLTNQDLQAGSYLVKDYREIILSQDVLEEVVSDLKLD + LTPKGLANKIKVTVPVDTRIVSVSVNDRVPEEASRIANSLREVAAQKIISITRVSDVT + TLEEARPAISPSSPNIKRNTLIGFLAGGIGTSVIVFLLELLDTRVKRPEDIEDTLQMT + LLGVVPNLNKLK" + gene 6216..6899 + /gene="wze" + CDS 6216..6899 + /gene="wze" + /EC_number="2.7.10.2" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3944" + /inference="protein motif:CLUSTERS:PRK11519" + /inference="protein motif:Pfam:PF01656.17" + /inference="protein motif:TIGRFAMs:TIGR01007" + /inference="similar to AA sequence:RefSeq:YP_001835066.1" + /inference="similar to AA sequence:UniProtKB:Q54520" + /note="tyrosine-protein kinase CpsD; 
tyrosine kinase; + capsular polysaccharide biosynthesis protein; capsular + exopolysaccharide family protein; CobQ/CobB/MinD/ParA + nucleotide binding domain" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Cps14D" + /protein_id="QCO91911.1" + /translation="MPTLEIAQKKLEFIKKAEEYYNALCTNIQLSGDKLKVISVTSVS + PGEGKTTTSVNIAWSFARAGYKTLLIDGDTRNSVISGFFKSREKITGLTEFLSGTADL + SHGLCDTNIENLFVVQSGAVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTAPIGIVI + DAAIITQKCDASILVTATGETNKRDVQKAKQQLKQTGKLFLGVVLNKLDISVDKYGVY + GFYGNYGKK" + gene 6915..8282 + /gene="wchA" + CDS 6915..8282 + /gene="wchA" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK15204" + /inference="protein motif:Pfam:PF02397.10" + /inference="protein motif:TIGRFAMs:TIGR03025" + /inference="similar to AA sequence:RefSeq:YP_001835067.1" + /inference="similar to AA sequence:UniProtKB:P71241" + /note="putative colanic biosynthesis UDP-glucose lipid + carrier transferase; undecaprenyl-phosphate galactose + phosphotransferase; exopolysaccharide biosynthesis + polyprenyl glycosylphosphotransferase; Bacterial sugar + transferase" + /codon_start=1 + /transl_table=11 + /product="glucosyl-1-phosphate transferase" + /protein_id="QCO91912.1" + /translation="MDEKGLKIFLAVLQSIVVILLIYFLSFVRETEVERSSMVILYLL + HFFVFYFSSYGNNFFKRGHLVEFNSTIRYIFFFAIAISVLNFFIAERFSISRRGMVYF + LTLEGISLYLLNFLVKKYWKHVFFNLKNSKKILLLTVTKNMEKVLDKLLESDELSWKL + VAVSVLDKSDFQHDKIPVIEKEKIIEFATHEVVDEVFVNLPGESYDIGEIISRFETMG + IDVTVNLNAFDKNLGRNKQIHEMVGLNVVTFSKNLYKTSHVISKRILDICGATIGLIL + FAIASLVLVPLIRKDGGPAIFAQTRIGKNGRHFTFYKFRSMRIDAEAIKEQLMDQNTM + QGGMFKINNDPRVTKIGRFIRKTSLDEIPQFWNVFIGDMSLVGTRPPTVDEYDQYTPE + QKRRLSFKPGITGLWQVSGRSKITDFDAVVKLDVAYIDNWTIWKDIEILLKTVKVVFM + RDGAK" + gene 8313..9485 + /gene="wchF" + CDS 8313..9485 + /gene="wchF" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF09314.5" + /inference="protein motif:TIGRFAMs:TIGR03088" + /inference="similar to AA 
sequence:RefSeq:YP_002510379.1" + /note="PEP-CTERM/EpsH1 system-associated sugar + transferase; DUF1972 protein" + /codon_start=1 + /transl_table=11 + /product="rhamnosyltransferase WchF" + /protein_id="QCO91913.1" + /translation="MKKSVYIIGSKGIPAKYGGFETFVEKLTAFQQDKAIQYYVACMR + ENSAKSGTTEDVFEHNGAICYNVDVPNIGPARAIAYDIAAINRAIEIAKENKDEDPIF + YILACRIGPFIHGIKKRIQAIGGTLLVNPDGHEWLRAKWSAPVRRYWKISEGLMVKYA + DFLVCDSKNIEKYIQEDYKQYQPKTTYIAYGTDTTRSTLKSSDEKVRSWFKEKNVSEN + EYYLVVGRFVPENNYESMIRGFLASNSKKDFVLITNVEQNKFYNQLLAKTAFDKDPRV + KFVGTVYDQELLKYIRENTFAYFHGHEVGGTNPSLLEALASTKLNLLLDVGFNREVGE + QSAIYWKKDELSQVIEKVEQFDAKKIDELDRQSNQRIVDSFTWEKIVTDYEKLFKK" + gene 9482..10753 + /gene="wciU" + CDS 9482..10753 + /gene="wciU" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK15484" + /inference="protein motif:Pfam:PF00534.14" + /note="glycosyl transferase group 1 protein" + /codon_start=1 + /transl_table=11 + /product="lipopolysaccharide + 1,2-N-acetylglucosaminetransferase" + /protein_id="QCO91914.1" + /translation="MKILHYTLGFQPQRTGGLVKYAEDLMLEQIAQGYQVAALYSGRI + KFFSKKIEIIKATSRQFECYELLNSLPMALFGGISDPTAFLTPCDKNVYRTFLEKVQP + DIIHIHSFMGLHKEFLEIAKNLNIRVVFTSHDYYGLAPVPHFYFNGVDYSDKSTNLTW + NIMSSNALSVKKLRLFQVSFYPTIRKVLKLLGKNPKSKKNLVIRDVIEEQDYSELRYY + YNEMFHLIDGYLFNSRLAKKVYEINEIKSANSIVLSITNSSINHHQRLTTTNNKIRVA + YIGPDEEYKGYFDFVDFVETLDRESYEVATYGHLPNEECPSFIEQKGYFTKEMIDSVY + ENIDILIVPSKWKETFGLITVEALSYGVNVFVSENVGSKDLLPETHVFKDKEDLLAKI + INNQLEKVPLKTMEKHVEEVISYYKQVRSNN" + gene 10771..11823 + /gene="cpsJ" + CDS 10771..11823 + /gene="cpsJ" + /EC_number="2.4.1.212" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3858" + /inference="protein motif:CLUSTERS:PRK10073" + /inference="protein motif:Pfam:PF00535.20" + /inference="protein motif:TIGRFAMs:TIGR03937" + /inference="similar to AA sequence:RefSeq:YP_006033775.1" + /inference="similar to AA sequence:UniProtKB:Q7BLV3" + /note="hyaluronan synthase; putative glycosyl transferase; + 
putative glycosyl hydrolase; poly-beta-1,6 + N-acetyl-D-glucosamine synthase; Glycosyl transferase + family 2" + /codon_start=1 + /transl_table=11 + /product="family 2 glycosyl transferase" + /protein_id="QCO91915.1" + /translation="MSCPEISVIVPVYNVERYLRQCMDSLINQTYRDFEIILVNDGST + DSSGILCEEWAKKDERIHVVHKKNEGLGFARNTGVEHAKGKHITFVDSDDYVSLDMLQ + TLYNAVQEYDVEVVYSAGYYRSFSNGEIKKTDVGTKKPQLFEGGDVASELLPDVISAP + PEYPNDGKVGVSAWKVLYKANLFKDKGLLFHSEREFISEDAIFQIDCLKLATSALVIP + DILYYYRENFGSLSMKYKEDRFELDKILYNEQLKRVEGLPNQEILEERIERILIANIR + LCIFQESLHKSSRIHKRLQRIRQICKDPVSKVVLHHYPIHRLPFPKRLICVLAKYNMS + LFLLALTLLKYRNRSV" + gene 11835..12740 + /gene="wchN" + CDS 11835..12740 + /gene="wchN" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3774" + /inference="protein motif:Pfam:PF05704.6" + /inference="similar to AA sequence:RefSeq:YP_001835073.1" + /note="mannosyltransferase OCH1-related enzyme" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide synthesis protein" + /protein_id="QCO91916.1" + /translation="MNIEKLKLSLKNRTFFPVVIHALRNRWPLWWIRSKAIREVQLED + RAYRILKKKYGSLISNSFDKAYLSEKVPKQIWICWFQGMENAPDLVKSCYKSVKREFP + DYKITVLTAQTIQQHVTIPEEILYKWNKGIINNANFSDVLRVEILSKYGGIWLDATVY + CTGNTIKELIEKNPFFMYKSLSSIEENISASSWMIASTANHPLILSAKKLLVEYWCRE + NIAIHYFVFHLLFTIVAENYSDVWQSVPTYTNAAPHIMIDELNNVFSKERYQQLCQIS + DFHKLNYKKNYNDKSESLYSYLLNQ" + gene 12752..14209 + /gene="wzx" + CDS 12752..14209 + /gene="wzx" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF01943.11" + /inference="similar to AA sequence:RefSeq:YP_001835074.1" + /inference="similar to AA sequence:UniProtKB:P37746" + /note="putative O-antigen transporter; polysaccharide + biosynthesis protein" + /codon_start=1 + /transl_table=11 + /product="transporter" + /protein_id="QCO91917.1" + /translation="MPSLKKNIVYNILYQILAVIVPFITSPYLARVLGAEQIGVYSFT + YSIAFYFMILSMLGISNYGNRTIAQVRTSREHLNQEFSNIYAVQLTCSLVMTVSYLIY + ATVFVNSFQIVAYIQVLHVLSYATDVSWFFYGLEEFRITVARNSFVKLLTLISIFTFV + 
KSPNDIYLYTFIMAGSTLLGQLITWPFLLKQVNFVRPSLGKIKEHMKPIIILFFPVLA + VSIFSFLDKIMLGMYSSLKETAFYENSDKIISIPKALIQAFGAVMLPRTVHLLSIGDE + QKSLEYVDKTMWAVLVITMGCAFGLAGVSVTFAPVYWGEEFRASSQIIAGMTPALVFS + AFGNVIRTQFLIPRSFDKEYTVSLLYGAVVNILINILLIPKIGAMGAVIGTIVAELVL + CYYQTWIARNYLHIREYLINAGILFLIGSVMYMVLILVSSILPTSLLTLIIEIIVGAF + IYISLLILYIFSSKNRVIIGLRTNFLERTHLFKRK" + gene 14212..15477 + /gene="wzy" + CDS 14212..15477 + /gene="wzy" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF04932.9" + /codon_start=1 + /transl_table=11 + /product="O-antigen ligase" + /protein_id="QCO91918.1" + /translation="MKFKFNPIAILYILLVYLELATDRQHLYPVTYMTKYYIGILITV + LFVLLLVGRGKVIFVNKKLLYLAKILAIPTIVLFLYSVLLDVMNPVEFNGYFSRLSST + TIFGLLAIFQAIVVFQFFGQKVVDYTFTAISLSYLTSIIVAFREGGLSQFILMLTDDS + FNGSVLEMHEVAPITALFILYYLYKYFIKENSFSLVFRNILIALIILFLSLKRIVFLS + VLIIIPVFLVIYWYDKKVSKLGKERKILSLLNSFSLIFITGIFLYVYSVKSGFIYTFI + QEHNINSMARTDLWKGIESTYSFAPIFMGRGIGFVTKWMDNNWMTLNINGLTESTGLH + NDILKYYIEIGFVGLFIYFYTLLYRNAKRIFVKIGHKESFIYFVLIMFQVLIWFTDNI + STYHNFLWILNLLLFSLTNTDAELETQKL" + gene 15557..16717 + /gene="wchX" + CDS 15557..16717 + /gene="wchX" + /EC_number="2.7.8.12" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF04464.8" + /inference="similar to AA sequence:RefSeq:YP_002510384.1" + /inference="similar to AA sequence:UniProtKB:P13485" + /note="CDP-glycerol:poly(glycerophosphate) + glycerophosphotransferase" + /codon_start=1 + /transl_table=11 + /product="glycerol phosphotransferase WchX" + /protein_id="QCO91919.1" + /translation="MKFYIKNLLKKVFTLPLHLLPIQSNKIIFDNFGGRGFGDNPKYI + LEELVSREKNLNLVWVTKDREMSIPEGVRVVKYGSYRSFYEWLTARVWVDNIRNSDRP + WKRKGQIYLQTWHGSDGVKLIEKSVAGNLKKTYLRMAKYDGKITDGIVSSRHFQTLGM + QNNFWLAENVEFLEFGLPRNDDFFKSEKIKTTNIKFRTLFDIDLDELVVLYMPTFRDD + GSLNAYNLDYSKLIHVFQNKFRKNVKILVRFHPNVDSSFINLQDTDCINVSTYSNPQD + LMMSADVMITDYSSASIDFMLLNRPVFLYLPDYQSYVNDRPLDDNFDKLPFPRAYHNN + ELTEIIRDFERSKYDEKVRLYELEDVRFDRGKASVQCANWIEEKIKNNKVID" + gene 16759..17151 + /gene="gct" + 
CDS 16759..17151 + /gene="gct" + /EC_number="2.7.7.39" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG0615" + /inference="protein motif:CLUSTERS:PRK11316" + /inference="protein motif:Pfam:PF01467.1" + /inference="protein motif:TIGRFAMs:TIGR01518" + /inference="similar to AA sequence:RefSeq:YP_003875983.1" + /inference="similar to AA sequence:UniProtKB:P27623" + /note="glycerol-3-phosphate cytidylyltransferase; + bifunctional heptose 7-phosphate kinase/heptose + 1-phosphate adenyltransferase; cytidylyltransferase" + /codon_start=1 + /transl_table=11 + /product="CDP-glycerol-1-phosphate biosynthetic protein + Gct" + /protein_id="QCO91920.1" + /translation="MKRVITYGTFDLLHYGHINLLKRAKQLGDYLIVVVSSDEFNLKE + KNKVCYFNYEHRKNLVEAIRYVDLVIPETSWEQKKSDVKDYHIDTFVMGDDWKGKFDY + LEEEGVEVVYLPRTKEISTTKIKEDLSE" + CDS 17249..17362 + /inference="ab initio prediction:Prodigal:2.60" + /inference="similar to AA sequence:RefSeq:YP_006742607.1" + /codon_start=1 + /transl_table=11 + /product="heme-based aerotactic transducer" + /protein_id="QCO91921.1" + /translation="MAVIFKDVLVEEKTDEEKQHILSILNDENVRAFDCGY" + gene 17992..18861 + /gene="rmlA" + CDS 17992..18861 + /gene="rmlA" + /EC_number="2.7.7.24" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG4750" + /inference="protein motif:CLUSTERS:PRK15480" + /inference="protein motif:Pfam:PF00483.17" + /inference="protein motif:TIGRFAMs:TIGR01207" + /inference="similar to AA sequence:RefSeq:YP_815843.1" + /inference="similar to AA sequence:UniProtKB:P37744" + /note="glucose-1-phosphate thymidylyltransferase RfbA; + CTP:phosphocholine cytidylyltransferase; nucleotidyl + transferase" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase" + /protein_id="QCO91922.1" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLPRFKELLQDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFIGDDSV + ALILGDNIYHGPGLSKMLQKAAKKEKGATVFGYHVKDPERFGVVEFDENMNAISIEEK + 
PEQPCSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLNRGDLSVEVMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLALAQPLKKN + EYGQYLLRLIGEA" + gene 18862..19455 + /gene="rmlC" + CDS 18862..19455 + /gene="rmlC" + /EC_number="5.1.3.13" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF00908.11" + /inference="protein motif:TIGRFAMs:TIGR01221" + /inference="similar to AA sequence:RefSeq:YP_003878604.1" + /inference="similar to AA sequence:UniProtKB:Q5XCG7" + /note="putative dTDP-4-dehydrorhamnose 3,5-epimerase" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-dehydrorhamnose 3,5-epimerase" + /protein_id="QCO91923.1" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKNHPLLKDVKPLKKEDL" + gene 19468..20517 + /gene="rmlB" + CDS 19468..20517 + /gene="rmlB" + /EC_number="4.2.1.46" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK10084" + /inference="protein motif:Pfam:PF01370.15" + /inference="protein motif:TIGRFAMs:TIGR01181" + /inference="similar to AA sequence:RefSeq:YP_006742612.1" + /inference="similar to AA sequence:UniProtKB:P95780" + /note="dTDP-glucose 4,6 dehydratase; NAD-dependent + epimerase/dehydratase family protein" + /codon_start=1 + /transl_table=11 + /product="dTDP-glucose 4,6-dehydratase" + /protein_id="QCO91924.1" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPDVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQATD + AYDHVTDRAGHDLRYAIDASKLREELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + gene 20583..21434 + /gene="rmlD" + CDS 20583..21434 + /gene="rmlD" + /EC_number="1.1.1.133" + /inference="ab initio 
prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK09987" + /inference="protein motif:Pfam:PF04321.11" + /inference="protein motif:TIGRFAMs:TIGR01214" + /inference="similar to AA sequence:RefSeq:YP_141831.1" + /inference="similar to AA sequence:UniProtKB:P29781" + /note="dTDP-4-dehydrorhamnose reductase; RmlD + substrate-binding domain protein" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase" + /protein_id="QCO91925.1" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITDAEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + gene 21784..22446 + /gene="glf" + CDS 21784..22446 + /gene="glf" + /EC_number="5.4.99.9" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF03275.7" + /inference="protein motif:TIGRFAMs:TIGR00031" + /inference="similar to AA sequence:RefSeq:YP_004326638.1" + /inference="similar to AA sequence:UniProtKB:P37747" + /note="protoporphyrinogen oxidase" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase" + /protein_id="QCO91926.1" + /translation="MNTFNKLWGVVTPAGAQAKIEEQHAILNGKTPENLEAQAISLVG + TDIYEKLIKDYTEKQWGKPTTELPSFIIRRLPVHLTYDNNYFNDTYQGIPIGDYNVII + ENMLKDVEVELGVNFFANRQELEASAEKVVFTGMIDQYFDYKHGELEYRSLRFDHEVL + DEENYQGNAVVNYTEREIPYTRIIEHKHFEYGTQEKTVITREYPADFFLHYRKHYKSN + FK" + CDS 22443..23516 + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG4763" + /inference="protein motif:Pfam:PF01757.16" + /note="acyltransferase family protein" + /codon_start=1 + /transl_table=11 + /product="putative membrane protein" + /protein_id="QCO91927.1" + /translation="MTRISMKKIKEYEILKVIAIILVVVGHSTYYNIYTGYGGIEYQQ + YINNHLSLAVYKLLSKLTEIIYYFHMPLFMAISGAFFSIQVKNNRWHGIGSLLTNKFR + 
RLMIPFFVFTLVYTIPIKYISNYFDGINFWKAVSGQLFLLGNSHLWYLYALFIVFIVG + FYILKKRTLFDVYLLLYILHILSYSVHLTLVSAPLQYLFWFSMGFLFEFKRKQYNHYL + KNNKWLSFLLVLLFIACVALKFVLKDNHEVLNRIIMDLAAVLGSLICYNISYYLSDKR + ELTENRLFNVILINGLGIYIFSDTLNYLILNISYSISNRFMFTAFGILALFLIRIFFT + LFIGLGLTLLFKKIFKKHSWLVN" + gene 23764..24291 + /gene="tnp" + CDS complement(23764..24291) + /gene="tnp" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3464" + /inference="similar to AA sequence:RefSeq:YP_003878676.1" + /codon_start=1 + /transl_table=11 + /product="transposase" + /protein_id="QCO91928.1" + /translation="MSRVRVQIMNQFHRKSHEYKAIKRYWKLIQQDSRKLSDKRFYRP + TFRMHLTNKEILDKLLSYSQDLKHHYQLYQLLLFHFQNKKPEKFFGLIEDNLKQVHPL + FQTVFKTFLKDKEKIVNALQLPYSNAKLEATNNLIKLIKRNAFGFRNFENFKKRIFIA + LNIKKERTKFVLSQA" + gene 24288..25070 + /gene="tnp" + CDS complement(24288..25070) + /gene="tnp" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3464" + /inference="protein motif:Pfam:PF01610.11" + /inference="similar to AA sequence:RefSeq:YP_003878675.1" + /codon_start=1 + /transl_table=11 + /product="transposase" + /protein_id="QCO91929.1" + /translation="MEQLHFITKLLDIKDPNIQILDIINKDTHKEIIAKLDYDAPSCP + ECGNQLKKYDFQKPSKIPYLETTGMPTRILLRKRRFKCYHCSKMMVAETSIVKKNHQI + PRIINQKIAQKLIEKISMTDIAHQLSISTSTVIRKLNDFHFKHDFSCLPEIMSWDEYA + FTKGKMSFIAQDFNNLNIITVLEGRTQAIIRNHFLRYDRVVRCRVKIITMDMFSPYYD + LAKQLRFQISRLRLKQSPRLFHSRMLKSFLNAFILYNILAVL" + gene 25185..25472 + /gene="tnp" + CDS complement(25185..25472) + /gene="tnp" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF03050.8" + /inference="similar to AA sequence:RefSeq:YP_003879130.1" + /note="transposase IS66 family protein" + /codon_start=1 + /transl_table=11 + /product="transposase" + /protein_id="QCO91930.1" + /translation="MGLPITRKEISNWHIKTSQYYLESLYNLLREKLLEQALLHADET + SYRVLESDSQLTYYWTFLSGKSEKQGITLYHHDQCRSGSVVQEFLGDYSAL" + gene 25491..25958 + /gene="tnp" + CDS complement(25491..25958) + /gene="tnp" 
+ /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3436" + /inference="protein motif:Pfam:PF13005.1" + /inference="similar to AA sequence:RefSeq:YP_002738582.1" + /note="putative helix-turn-helix transposase IS66" + /codon_start=1 + /transl_table=11 + /product="transposase" + /protein_id="QCO91931.1" + /translation="MENPLRKVFALLDNSVFLKRNKIWKKTLTYPVEREEITYKRKKA + KGKRQAILAQFDSEEVHHQVEESICPDCQDDLKEIGASLQRQELVFIPAQLKRVDHIQ + HAYKCQACSDKNPSDKIVKAPVPKAPLAHSLGSASIIAHTIHQKFNLKVPNYR" + gene 26327..26575 + /gene="tnp" + CDS complement(26327..26575) + /gene="tnp" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3436" + /inference="protein motif:Pfam:PF05717.7" + /inference="similar to AA sequence:RefSeq:YP_002037914.1" + /note="transposase IS66 Orf2-like protein" + /codon_start=1 + /transl_table=11 + /product="IS66-Spn1 transposase" + /protein_id="QCO91932.1" + /translation="MTIHLSSLGQVYLVCGKTDMRQGIDSLAYLVKTHFELDPFSGQV + FLFCGGRKDRFKALYWDGQGFWLLYKRFENGRLTWSST" + gene 26556..26795 + /gene="tnp" + CDS complement(26556..26795) + /inference="ab initio prediction:Prodigal:2.60" + /inference="similar to AA sequence:RefSeq:YP_001836149.1" + /codon_start=1 + /transl_table=11 + /product="IS66 family Orf1" + /protein_id="QCO91933.1" + /translation="MELLLYTISKVKLLEDILMPQPIVPVEIPQSRPFDSKKRNDILL + KIRIGKLEVSFFQSLNLEMIEQLLDKVLLYDNSSI" + gene 26892..27071 + /gene="tnp" + CDS 26892..27071 + /gene="tnp" + /inference="ab initio prediction:Prodigal:2.60" + /inference="similar to AA sequence:RefSeq:YP_003876565.1" + /codon_start=1 + /transl_table=11 + /product="IS1381 ISSpn7 transposase-like protein" + /protein_id="QCO91934.1" + /translation="MLAVLKTAYQLKHAKGGRKPKLSLEDLLMATLQYVREYRTYEQI + AADFGIHESNLIRRS" + gene 27226..27615 + /gene="tnp" + CDS 27226..27615 + /gene="tnp" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3293" + /inference="protein motif:Pfam:PF01609.15" + /inference="similar 
to AA sequence:RefSeq:YP_007814220.1" + /note="transposase DDE domain protein" + /codon_start=1 + /transl_table=11 + /product="IS1381 orf A-B fusion protein" + /protein_id="QCO91935.1" + /translation="MKAQAIVTSQGRIVSLDITVNYCHDMKLFKMSCRNIGQAGKILA + DSGYQGLMKIYPQAQIPRKSSKLKPLIAEDKAYNHALSKDRSKVENIFAKVKTFKMFS + TTYRNHRKRFGLRMNLIAGIINHELGF" + gene 27879..29861 + /gene="aliA" + CDS 27879..29861 + /gene="aliA" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG4166" + /inference="protein motif:CLUSTERS:PRK15104" + /inference="protein motif:Pfam:PF00496.16" + /inference="protein motif:TIGRFAMs:TIGR02294" + /inference="similar to AA sequence:RefSeq:YP_001835080.1" + /inference="similar to AA sequence:UniProtKB:P31306" + /note="76 kDa cell surface lipoprotein; oligopeptide ABC + transporter substrate-binding protein OppA; ABC-type + oligopeptide transport system, periplasmic component; + nickel ABC transporter, nickel/metallophore periplasmic + binding protein; Bacterial extracellular solute-binding + proteins, family 5 Middle" + /codon_start=1 + /transl_table=11 + /product="oligopeptide ABC transporter + oligopeptide-binding protein AliA" + /protein_id="QCO91936.1" + /translation="MKSSKLFALAGVTLLAATTLAACSGSGSSTKGEKTFSYIYETDP + DNLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKDA + KWYTSEGEEYAAVKAQDFVTGLKYAADKKSDALYLVQESIKGLDGYVKGEIKDFSQVG + IKALDEQTVQYTLNKPESFWNSKTTMGVMAPVNEEFLNSKGDDFAKATDPSSLLYNGP + YLLKSIVTKSSVEFAKNPNYWDKDNVHIDKVKLSFWDGQDTSKPAENFKDGSLTAARL + YPTSASFAELEKSMKDNIVYTQQDSITYLVGTNIDRQSYKYTSKTSDEQKASTKKALL + NKDFRQAIAFGFDRTAYASQLNGQTGASKILRNIFVPPTFVQADGKNFGDMVKEKLVT + YGDEWKDVNLADSQDGLYNPEKAKAEFAKAKSALQAEGVTFPIHLDMPVDQTATTKVQ + RVQSMKQSLEATLGADNVVIDIQQLQKDEVNNITYFAENAAGEDWDLSDNVGWGPDFA + DPSTYLDIIKPSVGESTKTYLGFDSGEDNVAAKKVGLYDYEKLVTEAGDETTDVAKRY + DKYAAAQAWLTDSALIIPTTSRTGRPILSKMIPFTIPFALSGNKGTSEPILYKYLELQ + DKAVTVDEYQKAQEKWMKEKEESNKKAQEDLAKHVK" +ORIGIN + 1 atgcaagaaa aatggtggca taatgccgta gtctatcaag tctatccaaa gagttttatg + 
61 gatagtaatg gagatggagt tggtgatttg ccaggtatta ccagtaagtt ggactatcta + 121 gctaagttag gaatcacagc gatttggctt tctcccgttt atgacagccc tatggatgat + 181 aatggctacg atattgctga ttatcaagcg attgcggcta tttttggaac catggaggac + 241 atggatcagc tgattgcaga agctaagaag cgtgatatcc gtatcatcat ggacttggtg + 301 gtcaatcata cctcggatga gcatgcttgg tttgtcgaag cctgtgaaaa tactgacagc + 361 cctgagcgag actactatat ctggcgcgat gaacccaatg acctagattc tatctttagt + 421 gggtctgctt gggaatacga tgaaaagtca ggtcaatact atctccactt tttcagcaag + 481 aaacagccgg atctcaactg ggaaaatgaa aaacttcgcc agaaaattta tgagatgatg + 541 aacttctgga ttgataaagg tattggtggt ttccgtatgg atgttattga catgattggc + 601 aaaattcctg acgagaaggt agtcaataat ggtcctatgc tccatcccta tctcaaggaa + 661 atgaatcagg cgacctttgg agataaggag ctcttgacag taggggagac ttggggagca + 721 acgccagaga ttgccaagct ctactctgat ccaaaggggc aagaattgtc tatggtcttc + 781 cagtttgaac atatcggtct tcagtatcag gaaggtcagc ctaaatggca ctatcaaaaa + 841 gagctgaata tcgctaagtt aaaagaaatc ttcaacaaat ggcagacaga gttaggagtt + 901 gaggacggct ggaattccct cttctggaac aaccatgacc tccctcgtat tgtctcaatc + 961 tggggaaatg accaagaata ccgcgaaaaa tctgccaaag cctttgcaat cttacttcat + 1021 ctcatgagag gaactcctta tatctaccaa ggtgaggaga ttgggatgac caactatccg + 1081 tttgaaacac tggatcaagt agaagatatt gaatctctca actatgcgcg tgaggctctt + 1141 gaaaaaggtg ttccgattga agaaatcatg gacagtatcc gtgttattgg acgtgacaat + 1201 gcccgtaccc ctatgcaatg ggacgagagc aaaaacgctg gtttctcaac aggtcaacct + 1261 tggttggcgg ttaatccaaa ttacgagatg atcaatgtcc aagaagcgct ggcaaatcca + 1321 gattctattt tctataccta tcagaaactg gtccaaattc gcaaggagaa tagctggcta + 1381 gttcgagctg actttgaatt gcttgatacg gctgataagg tctttgctta tatacgtaag + 1441 gatggcgacc gtcgcttcct agttgtggct aacttgtcca atgaagagca agacttgaca + 1501 gtagaaggaa aagtcaaatc tgtcttgatt gaaaacactg cggctaaaga agtacttgaa + 1561 aaacaggtct tggctccatg ggatgctttc tgtgtggaaa tgactgacta gaatgagcaa + 1621 acctcaagtt tttgaagctt gaggtttttt actatagtgg attgaaacta gaatagtgca + 1681 cctctacttc taaaatattg ttagaaatcg 
atttgattgt cctgatcgat ttgtcctatt + 1741 cttatttcat tttactatac ttgtagttga ggagaattaa gctcctcact agtaaactct + 1801 tcataatcct ttttattttt atgaagatat tgtttgaaag atgtgagttt ccacggatgg + 1861 gtttgtggag ggatatactt gtgtctttct ttttttgttc tggttcttgt tcaaagtttt + 1921 tcgaatagag ttcatgatct agtagctcct ttgtgcgata gattttgtca gcgatattga + 1981 ggtagatgtc tccgttaaat gcttttataa ctaatgcttt cgtctttctg atgaaataga + 2041 cttcttttcc ttgttcggta gggatatagt aacgattttg gaatcggata tggtgtccac + 2101 tatcgacgac tctctccgcc agtctagcca gaatgagatt cctttcagaa gggttaggaa + 2161 cctcctcgaa gacagagagt tttgtcttgt ttccaaactg ttcattaaag gtttggatgt + 2221 aggaaagcag gaaggtattg gcttcttcca aggtatgaat attgtttcgt tccagttcga + 2281 taggcaggcg agattgtagt gtctgattaa gtctttcgac tctcccttta gcttgaggga + 2341 tagaggttgt ctccagaaga atccccagtt ggtgacaggc gtatccgaat tgtgtatgag + 2401 tgtcgtcctc cattttctta gagttggaga cttgataggt aaagactgtt cttttatctg + 2461 ttttgatttg aaggggaatg ccgtgattgc ctaaaatttg ttcgaggaca tgatagtaag + 2521 tattcaaggt ctcttgttta tcaaaataag cgcctaggat attgccagaa gcatcatcaa + 2581 tggctaagtg taagttagat gtttgtgctc caaaccaggc atgagggctg gcatccattt + 2641 gaatgagttc accagcaaat ttctttctgg gtctactagg atgtactttt ttagggtctt + 2701 caaggaagtt ttcagccgtc ggtaagattg gattatctag gggttgcttg gggttcagtt + 2761 tagcttgtct tcttactctc ttctttgtct ttctatgaga cttaggcgac aggatgtttt + 2821 ccttatagag tatttttcta acagttgtat cagagagctg aattccttct tcttcagcta + 2881 gcaattcaca gaaatgaagg acatttggtt tatatgtttc ataggagagg tattttttta + 2941 ggagacgtcc tttgatttca tcagggattg catgttttgg ttttcgattt ctgtttccgt + 3001 gtctgaaggc ttcttttcct ttcagttgat aggctagtag cagacgattg atttgccttt + 3061 cagaaagatt gagttcggca caggctcgtt tctttgtttt ctttccttgg gctatagctt + 3121 ttatcacaag atattttttc atttcattca tatttagttg gatccttttc atatgactat + 3181 tctaccaaat gggacatttt cacgttcgat ttactaaaga cattatcacc ttcgaatcac + 3241 aaagatgcag atagtgaaaa aaaggtgtag acattaccgt aaaaaagtga tataatcgta + 3301 agatgttcaa ggtataggtg ttaatcatga gtagacgttt taaaaaatca 
cgttcacaga + 3361 aagtgaagcg aagtgttaat atcgttttgc tgactattta tttattgtca gtttgttttt + 3421 tattgttctt aatctttaag tacaatatcc ttgcttttag atatcttaac ctagtggtaa + 3481 ctgcgttagt cctactagtt gccttggtag ggctactctt gattatctat aaaaaagctg + 3541 aaaaattcac tatttttctg ttgctgttct ctatccttgt cagctcagtg tcgctctttg + 3601 cagtacagca gtttgttgga ctgaccaatc gtttaaatgc gacttctaat tactcagaat + 3661 attcgctcag tgtcgctgtt ttagcagata gtgagatcga aaatgttacg caactgacga + 3721 gtgtgacagc accgactggg actgataatg aaaatattca aaaactacta gctgatatca + 3781 agtcaagtca gaataccgat ttgacggccg accatagttc gtcttacttg gctgcttaca + 3841 agagtctgat tgcaggggag actaaggcca ttgtcttaaa tagtgtcttt gaaaatatca + 3901 tcgagtcaga gtatccagac tacgcatcga agataaaaaa gatttatatc aagggattca + 3961 ctaaaaaagt agaagctcct aagacgtcta agaatcagtc tttcaatatc tatgttagtg + 4021 gaattgacac ctatggtcct attagttcgg tgtcgcgatc agatgtcaat atcctgatga + 4081 ctgtcaatcg agataccaag aaaatcctct tgaccacaac gccgcgtgat gcctatgtac + 4141 caatcgcaga tggtggaaat aatcaaaaag ataaattaac ccatgcgggc atttatggag + 4201 ttgattcgtc cattcacacc ttagaaaatc tctatggagt ggatatcaat tactatgtgc + 4261 gattgaactt cacttctttc ttaaaaatga ttgacttatt gggaggggta gatgttcata + 4321 atgatcaaga gttttcagct ctacatggga agttccattt cccagtaggg aatgtccatc + 4381 tagactctga gcaggctcta ggttttgtac gtggacgcta ctcactagcc gatggagacc + 4441 gtgaccgtgg tcgcaaccaa caaaaggtca ttgtagcaat tattcagaag ttaacttcta + 4501 cagaggtttt ggaaaactat agtagtattc ttcaaggatt gcaggattct cttcaaacaa + 4561 atatgccgat tgagactatg atagatttag tgaatactca gttggaaagt ggagggaatt + 4621 ataaagtaaa ttctcaagat ttaaaaggga caggtcggat ggatcttcct tcttatgcaa + 4681 tgccagacag taacctctat gtgatggaaa tagatgacag tagtttaact gtagttaaag + 4741 cagctataca ggatgtgatg gagggtagat gaaatgatag atatccattc gcatatcgtt + 4801 tttgatgtag atgacggtcc caagtcaaga gaggaaagca aggctctctt ggcagaagcc + 4861 tacaggcagg gggtgcgaac cattgtctct acctctcacc gtcgcaaggg catgtttgaa + 4921 actccggaag agaagatagc agaaaacttt cttcaggttc gggaaattgc aaaagaagta + 4981 gcagatgatt 
tagtcatcgc ttatggcgca gagatatact atactctgga tactctagaa + 5041 aagctagaaa aaaaagaaat tcctaccctt aatgatagtc gttatgcttt gattgagttt + 5101 agcatgcata cttcctatcg tcagattcat acgggattga gcaatatttt gatgttggga + 5161 atcacgccag taattgctca tattgaacgg tatgatgctt tagagaataa cgaaaaacat + 5221 gttcgtgaac tgattgatat ggggtgctat actcagataa atagttatca tgtttcaaaa + 5281 cctaagttct ttggtgaaaa atataaattc atgaaaaaga gagctcggta ttttttggaa + 5341 cgtgatttag ttcatgtagt tgcaagtgac atgcacaatt tagacagtag acctccatat + 5401 atgcaacaag catatgatat cattgctaag aaatatggag cgaaaaaagc gaaagaactt + 5461 tttgtagata atcccagaaa aattataatg gatcaattaa tttaggagaa aatatgaagg + 5521 aacaaaacac tttggaaatc gatggattgc aactattcag agctttatgg aaaagaaagt + 5581 tggtcatttt attagtggca attataactt cttcagttgc ttttgcctac agtacttttg + 5641 ttatcaaacc tgagtttact agtacgactc ggatttatgt agttaaccgt aatcaggaag + 5701 agaagcctgg tttaaccaat caagacttgc aggcaggatc atacttggtt aaagactatc + 5761 gtgaaattat cctatcgcag gatgttttgg aggaagttgt ttctgatttg aaactagatt + 5821 tgacgccaaa aggtttggct aataaaatta aagtaacagt accagttgat acccgtattg + 5881 tctctgtttc agttaatgat cgagttcctg aagaggcaag ccgtatcgct aactctttga + 5941 gagaagtagc tgctcaaaaa attatcagta ttactcgtgt ttctgatgtg acaacactgg + 6001 aggaggcaag accggcgata tcaccgtctt caccaaatat taaacgcaat acactaattg + 6061 gttttttggc aggggggatt ggaactagtg ttatagtttt tcttcttgaa cttttggaca + 6121 ctcgtgtgaa acgtccggaa gatatcgaag atacactgca gatgacactt ttgggagttg + 6181 taccaaactt gaataagttg aaataggaga gagagatgcc gacattagaa atagcacaaa + 6241 aaaaactgga gttcattaag aaggcagaag aatattacaa tgccttgtgt acaaatatac + 6301 agttgagcgg agataaacta aaagtaattt ccgttacttc tgttagccct ggggaaggaa + 6361 aaacaactac ttccgtaaat atagcatggt cgtttgcgcg tgcaggctat aaaactcttt + 6421 tgattgatgg cgatactcga aattcggtta tatcaggatt ttttaaatct cgtgaaaaga + 6481 ttacaggtct aacagaattt ttatctggga cagctgattt atctcacggt ttatgtgata + 6541 caaatattga aaatttattt gtagttcaat cgggagctgt atcaccaaac cctacagcct + 6601 tgttacaaag taaaaatttt aatgatatga 
ttgaaacatt gcgtaaatat tttgattata + 6661 tcattgttga tacagcacct attggaattg ttattgatgc ggcaattatc actcaaaagt + 6721 gtgatgcgtc catcttggta acagcaacag gtgagacgaa taaacgtgat gtccaaaaag + 6781 cgaaacaaca attaaaacaa acagggaaac tgttcctagg agttgtttta aataaattag + 6841 atatctcggt tgataagtat ggagtttacg gtttctatgg aaattatggt aaaaaataac + 6901 ttaggaaaga ttttatggat gaaaaaggat tgaaaatttt tctggcagta ttacagagta + 6961 ttgttgtcat tttattgatt tattttctta gctttgttag agagacagaa gttgaacgtt + 7021 cttcgatggt tatactatac cttctccact tttttgtatt ctattttagt tcctatggta + 7081 acaatttttt taaaagaggg cacctagttg agtttaatag tactataaga tatatttttt + 7141 tctttgcaat agctataagt gtattaaact tttttatagc ggaacggttt agtatctcta + 7201 gaagaggaat ggtatacttc ttaactttag aaggaatatc cttatacttg ttaaatttct + 7261 tagtaaagaa atattggaag catgtgtttt ttaatctaaa aaatagcaag aaaattttac + 7321 tgttaacagt aacgaaaaat atggaaaaag ttcttgataa attgttagaa tctgatgaac + 7381 tttcatggaa attggtagca gtaagtgttt tggataaatc tgattttcaa catgataaaa + 7441 tacctgtaat tgaaaaggaa aaaattattg aatttgcaac gcatgaagtt gtggatgagg + 7501 tgtttgtcaa tcttccagga gagagctacg atattggaga aattatctct aggtttgaga + 7561 caatggggat agatgtaact gtaaatctta atgcatttga taagaatttg ggtcgcaata + 7621 aacaaattca tgagatggta ggattgaatg tagtcacttt ctctaaaaat ctttataaaa + 7681 ctagtcatgt gatttcaaag agaattctcg atatttgtgg tgccactatt ggccttattc + 7741 tttttgctat agctagtcta gttttagttc cattgattcg taaagatggc ggaccagcta + 7801 tttttgctca gacgcgtata gggaaaaatg gtcgacattt taccttttat aaattccgtt + 7861 cgatgcggat cgatgctgaa gctatcaaag aacagttgat ggatcaaaat acgatgcaag + 7921 gtggtatgtt taagataaac aatgatcctc gtgttacaaa aattggccgc tttattcgta + 7981 aaaccagttt ggatgagata ccccagtttt ggaatgtctt tataggagat atgagtttgg + 8041 tgggaacacg tccacctaca gtagacgagt atgatcagta tactccagaa cagaaacgtc + 8101 gactcagctt taaacctggt attacaggtt tatggcaggt tagcggccgt agtaaaataa + 8161 ccgattttga cgctgttgta aaattagatg tggcttatat tgataattgg acaatctgga + 8221 aagatattga aattttgctt aaaactgtta aagttgtatt tatgagagat 
ggagcgaagt + 8281 aatttctgta tatccatcct attaggagag aaatgaaaaa gtcagtttat atcattggtt + 8341 caaaaggaat tcctgctaag tatggaggat ttgaaacttt tgttgaaaaa ttaacagcct + 8401 tccaacaaga taaggctatc caatattatg tggcttgtat gcgtgaaaac tctgcaaaat + 8461 cagggactac tgaggatgtt tttgaacata atggtgctat ctgttataac gtcgatgttc + 8521 ctaatattgg tccagcgcga gctatagcgt atgatatcgc tgcaattaac agagctattg + 8581 aaattgccaa agaaaataag gatgaagatc caatcttcta tattttagct tgtcgaattg + 8641 gtccgttcat ccatggaatt aagaaaagaa ttcaagcaat aggtgggact cttctggtta + 8701 atccagatgg tcacgagtgg ttacgagcca agtggagtgc tcctgttcgt cgctactgga + 8761 aaatttctga aggtcttatg gtcaaatatg cagatttttt agtgtgtgat agtaagaata + 8821 ttgaaaaata tatccaagaa gattataaac agtatcaacc taaaacaacc tatatcgctt + 8881 atggaacaga tacaacacgc tctacattaa aaagtagtga tgaaaaagta cgttcttggt + 8941 tcaaagagaa gaatgtttct gagaacgagt attatctagt tgtaggacgt tttgtaccag + 9001 aaaacaacta tgaatctatg attcgtggct ttttggcgtc taactctaag aaggactttg + 9061 ttttaatcac aaatgtagaa cagaataaat tttataatca gttgttggca aaaactgctt + 9121 ttgataagga cccacgagta aaatttgttg gaacagtcta cgatcaagaa cttctgaagt + 9181 atattcgaga aaacaccttt gcttacttcc atggacatga agttggagga accaatcctt + 9241 cgcttttaga agctctggca tcaactaaac tgaatttatt gctagatgtt ggctttaacc + 9301 gagaagttgg ggagcaaagt gcaatctatt ggaaaaaaga tgagctttcc caagtaatcg + 9361 agaaagttga acaatttgat gcaaaaaaga ttgatgagtt agatagacaa tcaaatcaga + 9421 gaattgtgga ttctttcact tgggaaaaga ttgtcacaga ctacgagaaa ttatttaaaa + 9481 aatgaaaata ttacattata ctttaggatt tcaaccccag cgaacaggtg gtttggttaa + 9541 atatgctgag gatttaatgc tagagcaaat tgctcaaggt tatcaagtgg ctgccctata + 9601 ttcaggaaga attaagttct tttcaaaaaa aatagaaata attaaagcga cgtcaagaca + 9661 gtttgagtgt tatgagctgc ttaatagctt acctatggct ttatttggag gtatatccga + 9721 tccaactgct ttcctgacac cttgtgacaa aaatgtttat cgtacttttt tagaaaaagt + 9781 acaacccgac attatacata ttcattcgtt tatgggattg cataaagaat tcctcgaaat + 9841 tgctaaaaac ttgaatatta gagtggtttt tacgagccat gattattatg gattagcacc + 9901 cgtacctcat 
ttctatttta atggggtgga ttatagtgat aaaagtacaa acttaacatg + 9961 gaatattatg tcttccaatg ctttaagtgt gaaaaaacta agactttttc aggtttcatt + 10021 ttatcctact attcgtaaag ttttgaaact attagggaaa aatccaaaat ctaaaaagaa + 10081 tttagttatt cgagatgtta ttgaggagca agattatagt gagcttcgat actattataa + 10141 tgagatgttt cacttaatag atggttattt gtttaatagt agacttgcaa agaaggtata + 10201 tgagataaat gagattaagt cagctaatag tatagtatta tctataacaa atagttcaat + 10261 taatcatcat cagagattga caactacaaa taataaaatt agagttgctt atattggtcc + 10321 agatgaagaa tataaaggat attttgattt tgttgacttt gttgaaactt tagatcgaga + 10381 gtcctatgaa gtggcaactt atggccattt accaaatgaa gagtgtcctt cattcattga + 10441 acaaaaagga tattttacta aggaaatgat tgacagtgtc tatgaaaata ttgatattct + 10501 tattgttcca agtaagtgga aggaaacatt tggattgata acagtagaag cattatccta + 10561 tggggtaaat gttttcgtga gtgaaaatgt tggatcaaaa gacttgcttc cagaaacaca + 10621 tgtttttaaa gacaaggaag atttgttggc taaaatcatc aataatcagt tggagaaagt + 10681 tccgcttaaa acgatggaaa aacatgtaga agaagttatt agttattaca aacaggttag + 10741 aagcaacaat taaggagaat gattaaagat atgtcctgtc cagaaattag cgtaattgta + 10801 ccagtttata atgtggaacg atatttaaga cagtgtatgg attcattgat aaatcaaact + 10861 tatagggatt ttgaaataat tttagtaaac gatggatcaa cggattcttc tgggattctc + 10921 tgtgaagagt gggcaaaaaa agatgaaaga attcatgtgg ttcataaaaa aaatgagggg + 10981 cttggcttcg ctcgtaatac aggggttgaa cacgcaaagg ggaaacacat aacctttgta + 11041 gattcagatg actatgtttc tctagatatg ctgcaaactc tatataatgc tgttcaagaa + 11101 tatgatgtcg aagttgtata cagtgcggga tattatcgtt cctttagtaa tggggaaata + 11161 aagaagacag atgtaggaac aaaaaagcct caacttttcg aaggaggaga tgttgcctct + 11221 gaattactcc ctgatgtaat ttctgctcct cctgaatatc caaatgatgg gaaagttgga + 11281 gtgtcggcat ggaaggttct ctacaaagct aatttattta aggataaagg gctattattt + 11341 cattcggaaa gagaattcat ttcagaagat gctatttttc aaattgattg tttaaaatta + 11401 gcaacatctg cccttgttat cccagatatt ttatactact atcgtgaaaa ctttggttct + 11461 ttaagtatga aatataaaga agatcggttt gagttggata aaatcttgta taacgagcaa + 11521 ttaaaaagag 
ttgaggggtt acctaatcaa gaaattttgg aagaaagaat cgagagaatt + 11581 ttaattgcta atattcgttt atgtatcttt caggaatctt tacataaaag ttctagaata + 11641 cataaacgct tgcaaagaat tagacagatt tgtaaggatc cagtctcaaa agtagtttta + 11701 caccactatc caatccatcg tttacctttt cctaaacgtt tgatctgtgt attagctaag + 11761 tataatatgt cgctgtttct tttagcttta accctattaa aatatcggaa tcggagtgta + 11821 taacttttat ggggatgaat atagaaaaat taaaactatc tttgaaaaat agaacgtttt + 11881 ttcctgttgt tattcatgcc ttacgtaacc gttggccctt gtggtggatt cggagtaagg + 11941 ctattcgaga agtacaactt gaagataggg cctacagaat actaaaaaag aaatacggtt + 12001 ccttaatttc aaactctttt gataaagcat acttatcaga aaaagttccc aagcaaatct + 12061 ggatttgctg gtttcaaggt atggagaatg ctccagattt ggtgaaatca tgttataagt + 12121 ctgttaaaag agaatttcca gattataaaa ttacagtatt aacggctcag actattcaac + 12181 agcatgtaac aattcctgaa gaaattttgt ataagtggaa taaaggtatc ataaataacg + 12241 caaatttttc agatgttttg cgtgttgaga ttttatctaa atatggaggt atttggttag + 12301 atgctacagt ttattgcact ggtaatacaa ttaaggaatt aattgagaaa aatccatttt + 12361 ttatgtataa gagtctatct tcaatcgaag aaaatatttc tgcatcaagc tggatgattg + 12421 cttcaacagc aaatcaccct ttaatactat ctgcgaagaa gttgctagta gaatattggt + 12481 gtagagaaaa tattgcaatc cattattttg tttttcattt gctgttcacg attgtagctg + 12541 aaaattattc ggatgtttgg cagtctgtac ccacctatac gaacgcagca ccacatataa + 12601 tgattgatga attaaataat gttttttcaa aggaacgtta ccagcaattg tgtcaaattt + 12661 cagattttca taaattgaat tataaaaaaa attacaatga taaatctgag agtttgtaca + 12721 gttacttact gaatcagtag aggggagaat cttgcctagt ttaaagaaaa acattgttta + 12781 caatatctta tatcagatct tagctgtaat agtaccgttt attacctcac cttatttagc + 12841 tcgtgtgtta ggtgcagagc aaattggagt ttattctttt acctattcca ttgcttttta + 12901 ctttatgatt ctgtccatgt tggggatttc taattatggg aatcggacaa tagcacaggt + 12961 acgaacaagt agagaacatt tgaatcagga attttcgaat atttacgcgg ttcagttgac + 13021 gtgttcacta gtaatgaccg tctcatattt gatttatgca acagtatttg tgaatagttt + 13081 tcagattgta gcctatatcc aagtattaca tgttttatcg tatgcaacag atgttagttg + 13141 gtttttttat 
ggtcttgaag agtttcgtat tacggttgct aggaattcat ttgttaaatt + 13201 attgacttta atatctatct ttacatttgt aaaaagccct aatgatatct atttatatac + 13261 ctttataatg gcagggagta ccctgcttgg tcagttgatt acatggccat ttttgctaaa + 13321 acaagtaaac tttgtgcgcc ctagtcttgg aaaaataaag gaacacatga aacctattat + 13381 tattttattt ttccccgtct tagcggttag tattttttcg tttttagata aaataatgct + 13441 tgggatgtat agtagtttga aggaaactgc tttttatgag aattcagata agatcattag + 13501 tattccaaaa gctctgattc aagcctttgg agctgtaatg ttgcctcgaa cagtacattt + 13561 actgagtata ggtgatgaac aaaaaagttt agaatatgtt gataaaacga tgtgggctgt + 13621 tttagtgatt acaatgggct gtgctttcgg tttagcagga gtttctgtaa cctttgctcc + 13681 tgtttattgg ggtgaagaat ttagggccag tagccaaatt attgcaggaa tgacaccggc + 13741 tttagtattt tcggcttttg gaaatgtcat ccgaacccag tttttaattc cacgaagttt + 13801 tgacaaggaa tatacggtat ctttgcttta tggagccgtt gttaatattt tgattaatat + 13861 tcttttgatt ccgaagatag gagcaatggg agctgttatt ggaacaattg ttgcagagtt + 13921 agttctatgt tactatcaaa catggattgc tagaaattat ttacatatca gagaatatct + 13981 gataaatgct gggatattat ttcttattgg ttcagtaatg tatatggttt taattcttgt + 14041 ttcaagtatt ttacctactt cgttacttac acttattatt gaaattatag tcggagcttt + 14101 catttatatt agtttactga ttctgtatat cttttcttca aaaaacaggg taattattgg + 14161 tttacgaaca aattttttag aacgtactca tttatttaaa aggaagtaat agtgaaattt + 14221 aaatttaatc caatcgcgat actgtatata ttgctagtat acttagagtt agctacagat + 14281 aggcaacatc tgtatccagt aacgtacatg acaaaatatt atattggtat tttaatcact + 14341 gtgttgtttg ttttgttatt agtaggccgt gggaaggtta tttttgttaa taaaaaatta + 14401 ttatatcttg ctaagatatt agctatacca acaattgttc ttttcctgta ctcagtctta + 14461 ctagacgtaa tgaacccagt tgaatttaat ggatatttta gtagattatc aagtacgact + 14521 atttttggtt tgttagctat ctttcaagct atagttgttt ttcaattttt tggacaaaaa + 14581 gtagtagatt acacttttac agctatctcc ctcagctact taaccagtat cattgttgcc + 14641 tttagggagg gaggacttag tcaatttatc ttgatgctaa cagatgatag tttcaatggt + 14701 tcggtactag aaatgcatga agttgcacct attacagctc tctttattct gtactatttg + 14761 tacaaatatt 
ttataaaaga aaatagtttt tctttagtat ttcgtaatat cttaatagct + 14821 ctcattattc tttttttaag ccttaaacga atcgtttttt tgagtgtatt aattatcata + 14881 ccagtatttt tggtaattta ttggtatgat aaaaaagtaa gcaaactagg gaaagaacga + 14941 aaaattttaa gtttattaaa tagcttttcc ttaatattta taacaggaat attcctttat + 15001 gtttatagtg taaaatctgg ttttatatat acatttattc aagaacataa tattaattcg + 15061 atggctagaa cagatttatg gaagggaatt gaatcaacct atagttttgc ccctatattt + 15121 atggggagag ggatagggtt tgtaacaaaa tggatggata ataattggat gactttgaat + 15181 atcaatggtc ttacagagtc aacggggctc cataatgata ttttgaagta ctacattgag + 15241 ataggatttg taggattatt tatttatttt tacactcttc tttatagaaa tgctaaacgt + 15301 atatttgtaa aaattggtca taaagaatca ttcatatatt ttgtattgat aatgtttcag + 15361 gtgctgatat ggtttacaga taatatttca acttaccata attttttatg gattctaaat + 15421 ctactgctct tttctttaac taatacggat gcagagttgg aaactcagaa attataaaat + 15481 atttatttct tgaatttatg gtcttacgcc gtaaatttga tttcactaat gaccaatact + 15541 aatttataaa agtaatatga aattttatat aaaaaattta ttaaaaaaag tctttacatt + 15601 accgttgcat ttattgccta ttcagtctaa taagataata tttgataatt ttggtggtag + 15661 aggttttggg gacaatccta agtatatact tgaagaactt gtctctcgag aaaagaatct + 15721 aaatcttgtg tgggtaacaa aagatagaga aatgtctatc cctgaaggcg ttcgagtagt + 15781 aaaatacggc agttaccgtt ctttttatga atggttaaca gctagagttt gggtagataa + 15841 tattcgtaat tctgatcgac cttggaagcg aaaaggacag atttatcttc aaacttggca + 15901 tggttcagat ggggtaaagt taattgaaaa aagtgttgca gggaatctaa aaaaaacata + 15961 tcttagaatg gcgaagtatg atggaaagat tacagacggt atcgtatcaa gtcggcactt + 16021 tcaaactttg ggtatgcaaa ataatttttg gctggcagag aatgtggaat ttctggaatt + 16081 tggattacct cgaaatgatg atttttttaa aagtgaaaaa atcaaaacca caaatataaa + 16141 atttagaaca ttatttgata tcgatttaga cgaactggta gttttgtata tgccgacgtt + 16201 cagagatgat ggatcgttga atgcctataa tttagattac tcgaaactaa tacatgtttt + 16261 tcaaaataaa tttagaaaaa atgtaaaaat attagttcgt tttcatccaa atgttgattc + 16321 tagttttata aatttacagg atacagactg tataaatgtg tcgacctatt caaatcctca + 16381 ggatctgatg 
atgagtgcag atgtgatgat tacggattat tcatcggctt ctattgattt + 16441 tatgttatta aatcgtccag tatttctgta tttaccagat tatcaaagtt atgtgaatga + 16501 tagaccattg gatgataact ttgataaatt gccatttcca agagcatatc ataacaatga + 16561 gttgacagaa attattagag actttgaaag aagtaaatat gatgaaaaag ttcgtctgta + 16621 tgaattagag gatgttcgtt ttgatagagg aaaagcatca gtacagtgtg ctaattggat + 16681 tgaagaaaaa ataaaaaaca ataaagttat tgattgaaat aattatattt attgaattat + 16741 aaataaggag gtctttagat gaaaagagtt ataacatatg gtacatttga tttattgcat + 16801 tatggtcata tcaatctttt gaaacgtgct aaacagctag gtgattattt gattgtagtt + 16861 gtttcaagtg atgagtttaa tttaaaagaa aagaataaag tatgttactt taactacgaa + 16921 cacagaaaaa atttagtaga agctattcga tatgtcgatt tagtaatccc tgaaactagt + 16981 tgggaacaga aaaagtcaga tgttaaagac taccatattg acacttttgt aatgggtgat + 17041 gattggaaag gtaaatttga ttatcttgaa gaagaaggtg ttgaagtagt ctatttgcct + 17101 agaacaaagg aaatatcaac cacaaagata aaagaagatt tatcggaatg aaatattatt + 17161 aaaaaatgct gacataagaa attgtggctt ttgtgtctag tttttgatag aataaagtaa + 17221 caacacttta accaatgagg tgtgaataat ggcagtaatt tttaaagatg tacttgttga + 17281 agagaaaact gatgaagaaa aacaacatat tttatctatt ttaaatgatg agaatgttag + 17341 agcttttgat tgtggatatt aagaattgaa tgatgttttt tgatatttag aacaaatacg + 17401 atgaagaaac aggccatgta ttgcctattg taaatcaaaa ttttgaatta ttaggtttta + 17461 tttcttgtag actagtatca ttttctttca tagctcaggt taaagagatg ggaattagca + 17521 tagattatct tggtattcat aaggattgcc agaaaatggg ggatcggttc gcttttggtg + 17581 ctctttgcgc ttcgattatc tttaactatt tactgttgat taccaataaa aggtgtaata + 17641 gttcatgctc tagaggatgt tgtagaattc tatgacaaac tgggttttat tgaccctaga + 17701 gatatagtta tttataatgg caaaccggtt actatatatt ttagtattga aaaactaaga + 17761 aatggtgaaa attattcctc tcacacagtt atttgaaaca tccttagaaa atgattttta + 17821 attgtatgca aacaaagtag aattcgctta tttcatctta tgctaaatgt aatatgaaac + 17881 aagtgaattt ttatagataa agaagaattt taaaaaatgt gatgattatt tttagagcag + 17941 tacagaatta atagtaattg actctaaatc aataaagaaa ggtaccctat tatgaaaggt + 18001 attattctag 
caggtggttc ggggacacgt ttatatcctt tgactcgagc tgcatcaaaa + 18061 caactgatgc cggtttatga taaaccgatg atttactatc cactttcaac attgatgttg + 18121 gctgggatta gggatatttt gataatctca actcctcaag atttgcctcg ttttaaagag + 18181 cttcttcaag acggatctga gtttgggatt aaactttctt atgcagagca accaagtcca + 18241 gatggtttgg cacaagcctt tatcattggg gaagagttta ttggtgatga tagtgttgct + 18301 ttgatcttgg gggacaatat ctatcacggc cctggtttga gcaaaatgct tcaaaaagca + 18361 gccaagaaag agaaaggtgc gactgtcttt ggctaccatg tcaaggatcc agaacgcttt + 18421 ggtgttgtag aatttgatga aaatatgaat gctatctcca tcgaagaaaa accagaacag + 18481 ccgtgctcta actatgcagt gacaggactg tatttctatg ataacgatgt tgtcgagatt + 18541 gccaaaagta ttaaaccaag tcctcgtggt gaattggaaa ttacagatgt aaacaaggct + 18601 tacctaaatc gtggagattt atccgttgag gttatgggac gcggctttgc ttggttggat + 18661 actggaacac atgaaagttt actggaggct tcacagtaca tcgaaacagt ccaacggatg + 18721 caaaatgttc aggtagcaaa cttagaagaa attgcttacc gtatgggcta tatcagtcga + 18781 gaagatgtat tggccttagc ccaaccactt aagaaaaatg aatacggaca gtatctgctc + 18841 cgtttgattg gagaagcata gatgacagat aattttttcg gtaagacgct tgcggcacgc + 18901 aaggttgaag ctattccagg catgttggag tttgatatcc ccgttcatgg agataatcgt + 18961 ggctggttta aagaaaattt ccaaaaggaa aaaatgcttc cacttggatt tccagagtct + 19021 ttctttgcag aaggaaaatt gcaaaacaat gtatccttct cacgtaaaaa tgtccttcga + 19081 ggcctccacg cagagccttg ggataagtac atctctgtag cagatggagg gaaagttctg + 19141 ggttcttggg ttgatctacg cgagggtgaa acctttggga atacctatca gacagtgatt + 19201 gatgcgagta agggaatctt tgttcctcga ggcgtagcta atggcttcca agttttatca + 19261 gatacagtgt catatagcta tctggtcaat gattactggg ctcttgaact caaacccaag + 19321 tatgcctttg tgaactacgc tgatccaagc cttggtattg aatgggaaaa tattgcagaa + 19381 gcagaggttt cagaagcaga taaaaatcat ccactactta aggatgtaaa acctttgaaa + 19441 aaagaagatt tgtaaaaagg aaagaatatg actgaataca aaaatattat cgtgacaggt + 19501 ggagctggct ttatcggttc taactttgtc cattatgttt acgagaactt tccagatgtt + 19561 catgtgacag tcctagataa gttgacttat gctggaaacc gcgcgaatat tgaggaaatt + 19621 ttaggtaatc 
gtgttgagtt agttgttggt gacattgctg atgcggagtt ggtagacaag + 19681 ttggctgctc aagcagatgc tatcgttcat tatgcagcgg aaagccacaa tgataattcg + 19741 ctcaatgatc catcgccatt tattcatact aacttcatcg gaacctatac tcttttagaa + 19801 gctgctcgta agtatgatat tcgcttccac catgtatcga cagatgaagt ttatggggat + 19861 ctccctttac gcgaggattt gccaggtcat ggtgaaggac caggtgagaa atttactgct + 19921 gaaacaaaat acaacccaag ctctccgtac tcatcaacca aggcagcctc agatttgatt + 19981 gtcaaagcct gggtgcgttc ttttggagtc aaggcaacga tttccaactg ttcaaataac + 20041 tacggtcctt atcaacatat cgaaaaattc atcccacgtc agattactaa catcctaagt + 20101 ggtatcaagc caaaacttta cggtgaaggt aagaacgttc gtgattggat tcataccaat + 20161 gaccattctt caggagtttg gacaatcttg acaaaagggc aaatcggtga aacctacttg + 20221 attggggctg atggtgagaa gaacaataag gaagttttgg aacttatcct taaggaaatg + 20281 ggacaagcta cggatgccta tgatcatgtg actgaccgtg caggacatga ccttcgctat + 20341 gcgattgatg ccagcaagct ccgtgaggag ttggggtgga aacctgaatt taccaacttt + 20401 gaagctgggc tcaaggcaac aatcaagtgg tatacagata accaagaatg gtggaaagca + 20461 gaaaaagaag ctgttgaagc caattatgct aaaactcagg agattattac agtataaaaa + 20521 gcaggaaata gctgcttttt attgctatat tgggaagagt tacatattag aaaggtctag + 20581 agatgatttt aattacaggg gcaaatggcc aattaggaac ggaacttcgc tatttattgg + 20641 atgaacgtaa tgaagaatac gtggcagtag atgtggctga gatggacatt accgatgcag + 20701 aaatggttga gaaagttttt gaagaggtga aaccgacttt agtctaccac tgtgcagcct + 20761 acaccgctgt tgatgcagca gaggatgaag gaaaagagtt ggacttcgcc atcaatgtga + 20821 cggggacaaa aaatgtcgca aaagcatctg aaaagcatgg tgcaactcta gtttatattt + 20881 ctacggacta tgtctttgac ggtaagaaac cagttggaca agagtgggaa gttgatgacc + 20941 gaccagatcc acagacagaa tatgggcgta ctaagcgtat gggggaagag ttagttgaga + 21001 agcatgtgtc taatttctat attattcgta ctgcctgggt atttggaaat tatggcaaaa + 21061 acttcgtttt taccatgcaa aatcttgcga aaactcataa gactttaaca gttgtaaatg + 21121 accagtacgg tcgtccgact tggactcgta ccttggctga gttcatgacc tacctagctg + 21181 aaaatcgtaa ggaatttggt tattatcatt tgtcaaatga tgcgacagaa gacacaacat + 21241 ggtatgattt 
tgcagttgaa attttgaaag atacagatgt cgaagtcaag ccagtagatt + 21301 ccagtcaatt tccagccaaa gctaaacgtc cgctaaactc aacgatgagc ctggccaaag + 21361 ccaaagctac tggatttgtt attccaactt ggcaagatgc attgcaagaa ttttacaaac + 21421 aagaagtgag ataagtagta gaatgatttt ctagtctaat aaaagaggca gataatgaac + 21481 tccaaaggag cttaagatgt acgattatct tgttgttggt gctggtctct ttggtgcagt + 21541 ctttgcccat gaagcagcct taaaaggaaa aaagtaaaag ttattgaaaa acgaaatcat + 21601 atcgcgggta atatctatac tcgtgaagag gaaggaattc aagtttatca atatggtgct + 21661 catatcttcc atacttctga taaggagatc tgggattatg taaatcagct tgcagagttt + 21721 aaccgttaca caaattctcc tgttgcaaac tataagggtg agatttataa ccttcctttt + 21781 aatatgaata ctttcaataa actctgggga gttgtaacgc cagcaggagc acaagctaag + 21841 attgaggaac aacatgctat tttaaatggt aaaactcctg aaaatttgga agcacaggcg + 21901 atttctcttg taggtacaga tatctacgaa aaattaatca aagactatac agagaaacag + 21961 tggggcaaac caactactga acttccatcc tttattattc gccgtttacc agtacacctg + 22021 acctatgata acaactattt taacgatacc tatcaaggga ttccaattgg tgattataat + 22081 gttatcatcg aaaatatgct gaaggatgta gaagtagaac ttggagtgaa cttttttgcc + 22141 aatcgtcaag aattagaggc ttctgctgaa aaggttgtct ttacaggaat gattgaccaa + 22201 tactttgatt ataaacatgg tgagttagaa taccgtagtc ttcgttttga tcatgaagtt + 22261 ctagatgagg aaaactatca aggaaacgca gttgtaaact atacagaacg agaaattcct + 22321 tatactcgta ttattgagca taaacacttt gagtatggta ctcaggagaa aacggttatt + 22381 actcgtgaat acccagctga tttctttttg cattatagga aacattataa gagtaacttt + 22441 aaatgacaag gattagtatg aaaaaaataa aagaatacga aattttaaaa gtaatagcca + 22501 ttatcttagt tgtggtagga cacagcacct actataatat ttatactggt tatggtggga + 22561 tagaatatca acaatacata aacaaccatt tatccttagc tgtatataag ttgttaagca + 22621 aattgacaga gattatttat tattttcata tgcctttatt catggctata tctggtgcgt + 22681 ttttctctat tcaggttaaa aataatcgat ggcatggtat tggctcatta ttaacaaata + 22741 agtttagaag gctaatgata ccattttttg tctttactct agtatataca ataccaataa + 22801 aatatatatc aaattacttt gatggtatca atttctggaa agcggtctct ggtcaattat + 22861 ttctacttgg 
gaattctcac ttgtggtatt tgtatgcatt gtttattgtc tttatagttg + 22921 gcttttatat tttgaaaaaa cgtactttat ttgatgttta tctactgcta tatattctac + 22981 acatcttgag ttactcagtt catttaacat tagtaagtgc accattacaa tatctatttt + 23041 ggttttctat gggcttctta tttgaattta agaggaagca gtataatcat tatttaaaga + 23101 ataataagtg gctaagcttt ttattggtgc tactatttat agcatgtgta gccctaaaat + 23161 ttgtgcttaa agataaccat gaagttttga ataggataat tatggatcta gcagctgtgc + 23221 taggctcact tatttgttat aatatatcgt attatctcag tgataaaaga gaattaacag + 23281 agaatagact atttaatgtt attttgatta acggattagg aatttacatc ttttctgata + 23341 ctttaaatta tttaatatta aatatctcat attcaatcag taatcgattc atgtttacag + 23401 catttggtat tctcgcatta tttttgatta gaattttctt tactttattt ataggattag + 23461 gtttaacact gctatttaaa aaaatattca aaaaacattc ctggttagta aactagccaa + 23521 atttggttaa tttattattg tcttgaggta atattcaaag agaacttttt gaaatttttc + 23581 tattactcta gaaatagata ctggaagatt atggtcacgt atttcttatc tattttgtaa + 23641 ccgtccaata acgaagtata ttgaaaaatc tccagactag agaactcacg gatagttcct + 23701 aatctggaga tttcttattt gcacttttcg gctctttgtc aactgtagtg ggttgaagaa + 23761 aagctaagct tgagaaagga caaatttcgt cctttctttt ttgatattca gagcgataaa + 23821 aatccgtttt ttgaagtttt caaagttccg aaaaccaaag gcattgcgct tgataagttt + 23881 gatgagatta ttggtcgctt ccaatttggc gtttgaatag ggtagttgaa gggcgttgac + 23941 gattttctct ttgtccttta gaaaggtttt aaagacagtc tgaaaaagag gatgaacctg + 24001 ctttagattg tcctcaatga gtccgaaaaa tttctccggt ttcttattct gaaagtgaaa + 24061 cagcaagagt tgatagagct gatagtgatg tttcaagtct tgtgaatagc tcaaaagctt + 24121 gtctaaaatc tctttattgg ttaagtgcat acgaaaagta ggacgataaa atcgcttatc + 24181 actcagttta cggctatcct gttgtatgag cttccagtag cgcttgatag ccttgtattc + 24241 atgggatttt cgatgaaact gattcatgat ttgaacacgc acacgactca tagcacggct + 24301 aagatgttgt acaatatgaa agcgttcaag aacgatttta gcattcggga gtgaaacagt + 24361 ctgggagact gtttcagcct gagcctagaa atttgaaagc gaagctgttt agccaagtca + 24421 tagtaagggc taaacatatc catagtaata attttgacgc gacatcggac aactctatcg + 24481 tagcgaagaa 
agtgatttcg aatgatagct tgtgttctac cctcaagaac agtgatgata + 24541 ttgagattgt taaaatcttg cgcaatgaag ctcatctttc cctttgtaaa agcatactca + 24601 tcccaagaca taatctcagg aagacaagaa aaatcatgtt taaagtgaaa atcattgagc + 24661 ttacgaataa cagttgaagt tgagatggaa agctgatggg caatatcagt catagaaatc + 24721 ttttcaatta acttttgagc aatcttttgg ttgatgatac gagggatttg gtgattcttc + 24781 ttgacgatag aagtttcagc gaccatcatt tttgaacagt gatagcactt gaaacgacgc + 24841 tttctaagga gaattctagt aggcatacca gtcgtttcaa gataaggaat tttagaaggt + 24901 ttttgaaagt catatttctt caattggttt ccgcactcag ggcaagatgg agcgtcgtag + 24961 tccagtttgg cgatgatttc cttgtgtgta tccttattga tgatgtctaa aatctggata + 25021 ttagggtctt taatgtctag taattttgtg ataaaatgta attgttccat atgaatcttt + 25081 ctaatgagtt gttttgtcgc ttttcattat aggtcatatg ggactttttt tctacaacaa + 25141 aataggctcc ataatatcta taagggattt acccactaca aatattatag agccgaataa + 25201 tctcctagga attcttgtac tactgaacca cttcgacact gatcatggtg gtaaagcgta + 25261 atcccttgtt tctctgattt acctgacaaa aaagtccaat agtaagtcag ctgactatca + 25321 ctttctaaga cccgataaga ggtttcatct gcatgaagaa gagcttgttc taacaacttt + 25381 tctcgtaaaa ggttataaag ggactctaaa tagtattgac tcgtcttgat atgccaatta + 25441 gaaatttcct tacgtgtgat tggtaaaccc atcttagccc aatcttcttc ttagcgataa + 25501 ttgggtacct tcagattaaa cttctgatgg atggtgtgag cgataataga ggctgaacca + 25561 aggctatgcg ccaaaggggc tttagggaca ggagctttta caattttatc acttggattt + 25621 ttatcactgc atgcttggca tttgtaagcg tgttggatat gatccactct ttttaattgc + 25681 gcaggaataa agaccaattc ttgtcgttga aggctcgctc caatctcttt taaatcgtcc + 25741 tgacaatcag ggcaaatgct ctcttctact tgatgatgaa cttcttctga atcaaattgg + 25801 gcaagaatag cttgacgttt ccctttagct ttcttacgtt tataggtgat ttcttctctt + 25861 tcaactgggt aagtcagagt cttcttccat attttgttcc tcttcaaaaa gactgagttg + 25921 tccaaaaggg caaacacttt tctcagagga ttttccatag agcttttgcg ttagataagc + 25981 cacttgttca cgcagaaggg aaagttcatt agtgagacta tcaattatag cactctgttg + 26041 ttgaatgatt ttcaatcttc tcccatagac tttcctcctt atttcctaac tttattatat + 26101 agtgtattga 
atctataaca gtacaccttg actgctaaaa tatttctata aattaatttg + 26161 actttcctga tagagatgtt catatcttat ttcaattcac tatactaaaa agaaagtcct + 26221 catttcaata gaaatcacga ctttctgata aatttatttt gggagtgata gaaaagccct + 26281 tcataagcca gtctatttgt tcaggtgtga gagctttgac atccttttat gtactggacc + 26341 aagtcagtct gccgttctca aagcgtttat atagtagcca aaatccttga ccatcccagt + 26401 aaagggcttt aaagcggtct ttacgtccac cacaaaagag aaaaacttga ccggagaaag + 26461 gatctaattc aaaatgggtt ttaaccagat aagccagtga atcaatgcct tgcctcatat + 26521 ccgttttccc acatacgaga taaacctgcc ctaggctaga tagatgaatt gtcatagagc + 26581 aacaccttat ccaaaagttg ttctatcatt tcgagattga gagattgaaa aaaacttact + 26641 tcaagcttgc caatacgaat tttaagcaga atatcatttc tctttttaga atcaaaagga + 26701 cgagattgtg gaatctctac aggaacaata ggttgtggca ttaaaatatc ctccaatagt + 26761 tttactttac taatagtata caggagaagc tccatgaatg atagatacct tgttatgacg + 26821 cgcttactaa acaactaact gatgcacgat ttaagcgcct tgttggtgtt cagcgcacga + 26881 cttttgaaga gatgttagct gtattaaaaa cagcttatca acttaaacac gcaaaaggtg + 26941 gacgaaaacc taaattaagc ctagaagacc ttcttatggc cactcttcaa tatgtgcgag + 27001 aatatcgaac ttatgaacaa attgcggctg attttggtat ccacgaaagc aacttaatcc + 27061 gtcggagcta atgggttgaa gtaactcttg ttcaaagtgg tgttacgatt tcaagaactc + 27121 ctctcagctc tgaggacacg gtaatgattg atgcgacgga agtaaaaatc aatcgcccta + 27181 aaaaaagaat tagcgaatga ttctggtaaa aagaaatgcc acgctatgaa ggctcaagcg + 27241 attgtcacaa gtcaagggag aattgtttct ttggatatca ctgtgaacta ttgtcatgat + 27301 atgaagttgt tcaaaatgag ttgcagaaat atcggacaag ctggtaaaat cttggctgac + 27361 agtggttatc aagggctcat gaagatatat cctcaagcac aaattccacg taaatccagc + 27421 aaactcaagc cgctaatagc tgaagataaa gcctataacc atgcgctatc taaggataga + 27481 agcaaggttg agaacatctt tgccaaagta aaaacgttta aaatgttttc aacaacctat + 27541 cgaaatcatc gtaaacgctt cggattacga atgaatttga ttgctggtat tatcaatcat + 27601 gaactaggat tctagttttg caggaagtct attgaaggat cttttgcttt agttccttgg + 27661 tcaagattga ttattttcac ggagcgcttc cgattgtttt cataaaccat ttgcgcatag + 27721 tcagcagaat 
aaatcttttt gaaacgtccc tttcctagac attatagaac tttcagattc + 27781 atctgaattt accaaattaa cacaaaaatt ccgaaaattc tgttgacaac tttctgaaaa + 27841 gagtctataa tggagagaaa gttttaaagg agaaaatgat gaaaagttca aaactatttg + 27901 cccttgcggg cgtgacatta ttggcggcga ctactttagc tgcatgctct ggatcaggtt + 27961 caagcactaa aggtgagaag acattctcat acatttatga gacagaccct gataacctca + 28021 actatttgac aactgctaag gctgcgacag caaatattac cagtaacgtg gttgatggtt + 28081 tgctagaaaa tgatcgctac gggaactttg tgccgtctat ggctgaggat tggtctgtat + 28141 ccaaggatgg attgacttac acttatacta tccgtaagga tgcaaaatgg tatacttctg + 28201 aaggtgaaga atacgcggca gtcaaagctc aagactttgt aacaggatta aaatatgctg + 28261 ctgataaaaa atcagatgct ctttaccttg ttcaagaatc aatcaaagga ttggatggct + 28321 atgtaaaagg ggaaatcaaa gatttctcac aagtaggaat taaggctctg gatgaacaga + 28381 cagttcagta cactttgaac aaaccagaaa gcttctggaa ttctaagaca acaatgggag + 28441 taatggctcc agttaatgaa gagtttttga attcaaaagg ggatgatttt gccaaagcta + 28501 cggatccaag tagtctcttg tataacggtc cttatttgtt gaaatccatt gtgaccaaat + 28561 cttctgttga atttgcgaaa aatccgaact actgggataa ggacaatgtg catattgaca + 28621 aagttaaatt gtcattctgg gatggtcaag ataccagcaa acctgcagaa aactttaaag + 28681 atggtagcct tacagcagct cgtctctatc caacaagtgc aagtttcgca gagcttgaga + 28741 agagtatgaa ggacaatatt gtctatactc aacaagactc tattacgtat ctagtcggta + 28801 caaatattga ccgtcagtcc tataaataca catctaagac cagcgacgaa caaaaggcat + 28861 cgactaaaaa ggctctctta aacaaggatt tccgtcaggc tattgccttt ggttttgatc + 28921 gtacagccta tgcctctcag ttgaatggac aaactggagc aagcaaaatc ttacgtaata + 28981 tctttgttcc accaacattt gttcaagcag atggtaaaaa ctttggcgat atggtcaaag + 29041 agaaattggt cacttatggg gatgaatgga aggatgttaa tcttgcagat tctcaggatg + 29101 gtctttacaa tccagaaaaa gccaaggctg aatttgctaa agctaaatca gccttacaag + 29161 cagaaggtgt gactttccca attcatttgg atatgccagt tgaccagaca gcaactacaa + 29221 aagttcagcg cgtccaatct atgaaacaat ccttggaagc aactttagga gcggataatg + 29281 tagtcattga tattcaacaa ctacaaaaag acgaagtaaa caatattaca tattttgctg + 29341 aaaatgctgc 
tggcgaagac tgggatttat cagataatgt cggttggggt ccagactttg + 29401 ccgatccatc aacctacctt gatatcatca aaccatctgt aggagaaagt actaaaacat + 29461 atttagggtt tgactcaggg gaagataatg tagctgctaa aaaagtaggt ctatatgact + 29521 acgaaaaatt ggttactgag gctggtgatg agactacaga tgttgctaaa cgctatgata + 29581 aatacgctgc agcccaagct tggttgacag atagtgcttt gattattcca actacatctc + 29641 gtacagggcg tccaatcttg tctaagatga taccatttac aataccattt gcattgtcag + 29701 gaaataaagg tacaagtgaa ccaatcttat ataaatactt ggaacttcaa gacaaggcag + 29761 tcactgtaga tgaataccaa aaagctcagg aaaaatggat gaaagaaaaa gaagagtcta + 29821 ataaaaaggc tcaagaagat ctcgcaaaac atgtgaaata a +// + diff --git a/public/res/serotype_genbank/serotype_18X2.gb b/public/res/serotype_genbank/serotype_18X2.gb new file mode 100755 index 0000000..773ff34 --- /dev/null +++ b/public/res/serotype_genbank/serotype_18X2.gb @@ -0,0 +1,976 @@ +LOCUS MK606432 24889 bp DNA linear BCT 30-SEP-2020 +DEFINITION Streptococcus pneumoniae strain GPS_IN_P54 cps gene cluster, + complete sequence. +ACCESSION MK606432 +VERSION MK606432.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 24889) + AUTHORS van Tonder,A.J., Gladstone,R.A., Lo,S.W., Nahm,M.H., du Plessis,M., + Cornick,J., Kwambana-Adams,B., Madhi,S.A., Hawkins,P.A., + Benisty,R., Dagan,R., Everett,D., Antonio,M., Klugman,K.P., von + Gottberg,A., Breiman,R.F., McGee,L., Bentley,S.D. and The Global + Pneumococcal Sequencing,C.O. + TITLE Putative novel cps loci in a large global collection of pneumococci + JOURNAL Microb Genom 5 (7) (2019) + PUBMED 31184299 +REFERENCE 2 (bases 1 to 24889) + AUTHORS van Tonder,A.J. + TITLE Direct Submission + JOURNAL Submitted (06-MAR-2019) Parasites and Microbes, Wellcome Sanger + Institute, Wellcome Genome Campus, Hinxton, Cambridge CB10 1SA, + United Kingdom +COMMENT ##Assembly-Data-START## + Assembly Method :: Velvet v. 
1.2 + Sequencing Technology :: Illumina + ##Assembly-Data-END## +FEATURES Location/Qualifiers + source 1..24889 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="GPS_IN_P54" + /isolation_source="blood" + /host="Homo sapiens" + /db_xref="taxon:1313" + /geo_loc_name="India" + /collection_date="2015" + misc_feature 1..24889 + /note="cps gene cluster" + gene 1..1611 + /gene="dexB" + CDS 1..1611 + /gene="dexB" + /EC_number="3.2.1.70" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3280" + /inference="protein motif:CLUSTERS:PRK10933" + /inference="protein motif:Pfam:PF00128.18" + /inference="protein motif:TIGRFAMs:TIGR02403" + /inference="similar to AA sequence:RefSeq:YP_004326655.1" + /inference="similar to AA sequence:UniProtKB:Q99040" + /note="trehalose-6-phosphate hydrolase; maltooligosyl + trehalose synthase; alpha,alpha-phosphotrehalase; alpha + amylase catalytic domain protein" + /codon_start=1 + /transl_table=11 + /product="glucan 1,6-alpha-glucosidase" + /protein_id="QCO91937.1" + /translation="MQEKWWHNAVVYQVYPKSFMDSNGDGVGDLPGITSKLDYLAKLG + ITAIWLSPVYDSPMDDNGYDIADYQAIAAIFGTMEDMDQLIAEAKKRDIRIIMDLVVN + HTSDEHAWFVEACENTDSPERDYYIWRDEPNDLDSIFSGSAWEYDEKSGQYYLHFFSK + KQPDLNWENEKLRQKIYEMMNFWIDKGIGGFRMDVIDMIGKIPDEKVVNNGPMLHPYL + KEMNQATFGDKELLTVGETWGATPEIAKLYSDPKGQELSMVFQFEHIGLQYQEGQPKW + HYQKELNIAKLKEIFNKWQTELGVEDGWNSLFWNNHDLPRIVSIWGNDQEYREKSAKA + FAILLHLMRGTPYIYQGEEIGMTNYPFETLDQVEDIESLNYAREALEKGVPIEEIMDS + IRVIGRDNARTPMQWDESKNAGFSTGQPWLAVNPNYEMINVQEALANPDSIFYTYQKL + VQIRKENSWLVRADFELLDTADKVFAYIRKDGDRRFLVVANLSNEEQDLTVEGKVKSV + LIENTAAKEVLEKQVLAPWDAFCVEMTD" + CDS complement(1742..3142) + /gene="tnp" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF00665.20" + /inference="similar to AA sequence:RefSeq:YP_006065738.1" + /note="integrase core domain protein" + /codon_start=1 + /transl_table=11 + /product="IS1202 transposase" + /protein_id="QCO91938.1" + 
/translation="MKKYLVIKAIAQGKKTKKRACAELNLSERQINRLLLAYQLKGKE + AFRHGNRNRKPKHAIPDEIKGRLLKKYLSYETYKPNVLHFCELLAEEEGIQLSDTTVR + KILYKENILSPKSHRKTKKRVRRQAKLNPKQPLDNPILPTAENFLEDPKKVHPSRPRK + KFAGELIQMDASPHAWFGAQTSNLHLAIDDASGNILGAYFDKQETLNTYYHVLEQILG + NHGIPLQIKTDKRTVFTYQVSNSKKMEDDTHTQFGYACHQLGILLETTSIPQAKGRVE + RLNQTLQSRLPIELERNNIHTLEEANTFLLSYIQTFNEQFGNKTKLSVFEEVPNPSER + NLILARLAERVVDSGHHIRFQNRYYIPTEQGKEVYFIRKTKALVIKAFNGDIYLNIAD + KIYRTKELLDHELYSKNFEQEPEQKKKDTSISLHKPIRGNSHLSNNIFIKIKRIMKSL + LVRSLILLNYKYSKMK" + gene 3327..4772 + /gene="wzg" + CDS 3327..4772 + /gene="wzg" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK09379" + /inference="protein motif:Pfam:PF03816.8" + /inference="protein motif:TIGRFAMs:TIGR00350" + /inference="similar to AA sequence:RefSeq:YP_001835063.1" + /inference="similar to AA sequence:UniProtKB:Q7WY78" + /note="putative transcriptional regulator ywtF; + membrane-bound transcriptional regulator LytR; cell + envelope-related function transcriptional attenuator + common domain; cell envelope-related transcriptional + attenuator domain protein" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Cps14A" + /protein_id="QCO91939.1" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLSVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLLFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSLSVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + ADHSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYIKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRGRYSLADGDRDRGRNQQKVIVAIIQKLTST + EVLENYSSILQGLQDSLQTNMPIETMIDLVNTQLESGGNYKVNSQDLKETGRMDLPSY + AMPDSNLYVMEIDDSSLTVVKAAIQYVMEGR" + gene 4774..5505 + /gene="wzh" + CDS 4774..5505 + /gene="wzh" + /EC_number="3.1.3.48" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG4464" + /inference="protein motif:Pfam:PF02811.13" + 
/inference="similar to AA sequence:RefSeq:YP_002739714.1" + /inference="similar to AA sequence:UniProtKB:Q54518" + /note="capsular polysaccharide biosynthesis protein; PHP + domain protein" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein phosphatase wzh" + /protein_id="QCO91940.1" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAEAYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTLDTLEKLEKKEIPTLNDS + RYALIEFSMHTSYRQIHTGLSNILMLGITPVIAHIERYDALENNEKHVRELIDMGCYT + QINSYHVSKPKFFGEKYKFMKKRARYFLERDLVHVVASDMHNLDSRPPYMQQAYDIIA + KKYGAKKAKELFVDNPRKIIMDQLI" + gene 5514..6206 + /gene="wzd" + CDS 5514..6206 + /gene="wzd" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3944" + /inference="protein motif:Pfam:PF02706.9" + /inference="protein motif:TIGRFAMs:TIGR01006" + /inference="similar to AA sequence:RefSeq:YP_001835065.1" + /inference="similar to AA sequence:UniProtKB:P72367" + /note="capsular polysaccharide type 8 biosynthesis protein + cap8A; capsular polysaccharide biosynthesis protein; MPA1 + family polysaccharide export protein; chain length + determinant protein" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Cps14C" + /protein_id="QCO91941.1" + /translation="MKEQNTLEIDGLQLFRALWKRKLVILLVAIITSSVAFAYSTFVI + KPEFTSTTRIYVVNRNQEEKPGLTNQDLQAGSYLVKDYREIILSQDVLEEVVSDLKLD + LTPKGLANKIKVTVPVDTRIVSVSVNDRVPEEASRIANSLREVAAQKIISITRVSDVT + TLEEARPAISPSSPNIKRNTLIGFLAGGIGTSVIVFLLELLDTRVKRPEDIEDTLQMT + LLGVVPNLNKLK" + gene 6216..6899 + /gene="wze" + CDS 6216..6899 + /gene="wze" + /EC_number="2.7.10.2" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3944" + /inference="protein motif:CLUSTERS:PRK11519" + /inference="protein motif:Pfam:PF01656.17" + /inference="protein motif:TIGRFAMs:TIGR01007" + /inference="similar to AA sequence:RefSeq:YP_001835066.1" + /inference="similar to AA sequence:UniProtKB:Q54520" + /note="tyrosine-protein kinase CpsD; 
tyrosine kinase; + capsular polysaccharide biosynthesis protein; capsular + exopolysaccharide family protein; CobQ/CobB/MinD/ParA + nucleotide binding domain" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Cps14D" + /protein_id="QCO91942.1" + /translation="MPTLEIAQKKLEFIKKAEEYYNALCTNIQLSGDKLKVISVTSVS + PGEGKTTTSVNIAWSFARAGYKTLLIDGDTRNSVISGFFKSREKITGLTEFLSGTADL + SHGLCDTNIENLFVVQSGAVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTAPIGIVI + DAAIITQKCDASILVTATGETNKRDVQKAKQQLKQTGKLFLGVVLNKLDISVDKYGVY + GFYGNYGKK" + gene 6915..8282 + /gene="wchA" + CDS 6915..8282 + /gene="wchA" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK15204" + /inference="protein motif:Pfam:PF02397.10" + /inference="protein motif:TIGRFAMs:TIGR03025" + /inference="similar to AA sequence:RefSeq:YP_001835067.1" + /inference="similar to AA sequence:UniProtKB:P71241" + /note="putative colanic biosynthesis UDP-glucose lipid + carrier transferase; undecaprenyl-phosphate galactose + phosphotransferase; exopolysaccharide biosynthesis + polyprenyl glycosylphosphotransferase; Bacterial sugar + transferase" + /codon_start=1 + /transl_table=11 + /product="glucosyl-1-phosphate transferase" + /protein_id="QCO91943.1" + /translation="MDEKGLKIFLAVLQSIVVILLIYFLSFVRETEVERSSMVILYLL + HFFVFYFSSYGNNFFKRGHLVEFNSTIRYIFFFAIAISVLNFFIAERFSISRRGMVYF + LTLEGISLYLLNFLVKKYWKHVFFNLKNSKKILLLTVTKNMEKVLDKLLESDELSWKL + VAVSVLDKSDFQHDKIPVIEKEKIIEFATHEVVDEVFVNLPGESYDIGEIISRFETMG + IDVTVNLNAFDKNLGRNKQIHEMVGLNVVTFSKNLYKTSHVISKRILDICGATIGLIL + FAIASLVLVPLIRKDGGPAIFAQTRIGKNGRHFTFYKFRSMRIDAEAIKEQLMDQNTM + QGGMFKINNDPRVTKIGRFIRKTSLDEIPQFWNVFIGDMSLVGTRPPTVDEYDQYTPE + QKRRLSFKPGITGLWQVSGRSKITDFDAVVKLDVAYIDNWTIWKDIEILLKTVKVVFM + RDGAK" + gene 8313..9485 + /gene="wchF" + CDS 8313..9485 + /gene="wchF" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF09314.5" + /inference="protein motif:TIGRFAMs:TIGR03088" + /inference="similar to AA 
sequence:RefSeq:YP_002510379.1" + /note="PEP-CTERM/EpsH1 system-associated sugar + transferase; DUF1972 protein" + /codon_start=1 + /transl_table=11 + /product="rhamnosyltransferase WchF" + /protein_id="QCO91944.1" + /translation="MKKSVYIIGSKGIPAKYGGFETFVEKLTAFQQDKAIQYYVACMR + ENSAKSGTTEDVFEHNGAICYNVDVPNIGPARAIAYDIAAINRAIEIAKENKDEDPIF + YILACRIGPFIHGIKKRIQAIGGTLLVNPDGHEWLRAKWSAPVRRYWKISEGLMVKYA + DFLVCDSKNIEKYIQEDYKQYQPKTTYIAYGTDTTRSTLKSSDEKVRSWFKEKNVSEN + EYYLVVGRFVPENNYESMIRGFLASNSKKDFVLITNVEQNKFYNQLLAKTAFDKDPRV + KFVGTVYDQELLKYIRENTFAYFHGHEVGGTNPSLLEALASTKLNLLLDVGFNREVGE + QSAIYWKKDELSQVIEKVEQFDAKKIDELDRQSNQRIVDSFTWEKIVTDYEKLFKK" + gene 9482..10753 + /gene="wciU" + CDS 9482..10753 + /gene="wciU" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF00534.14" + /codon_start=1 + /transl_table=11 + /product="glycosyl transferase group 1" + /protein_id="QCO91945.1" + /translation="MKILHYTLGFQPQRTGGLVKYAEDLMLEQIAQGYQVAALCPGRI + KFFSKKIEIIKATSRQFECYELLNSLPIALFGGISDPTAFMTPCDKNVYRTFLEKVQP + DIIHIHSFMGLHKEFLEIAKNLNIRVVFTSHDYYGLAPVPHFYFNGVDYSDKNTNLTW + NIMSSNALSVKKLRLFQVSFYPTIRKLLKLLGKNPKSKKNLVIRDVIEEQDYSELRYY + YNEMFHLIDGYLFNSRLAKKVYEINEIQPVNSVVLSITSSSIKHHQRLTTTNNKIRVS + YIGSDEEYKGYFDFIDFAGTLEQESYEVVTYGHLPNEECPSFIEQKGYFTKETIDSVY + ENIDILIIASKCKETFGLITVEALSYGVNVFVSENVGSKDLLPETHVFKDKEDLLAKI + INNQLEKVPLKTMEKHVEEVISYYKQVRSNN" + gene 10771..11823 + /gene="cpsJ" + CDS 10771..11823 + /gene="cpsJ" + /EC_number="2.4.1.212" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3858" + /inference="protein motif:CLUSTERS:PRK10073" + /inference="protein motif:Pfam:PF00535.20" + /inference="protein motif:TIGRFAMs:TIGR03937" + /inference="similar to AA sequence:RefSeq:YP_006033775.1" + /inference="similar to AA sequence:UniProtKB:Q7BLV3" + /note="hyaluronan synthase; putative glycosyl transferase; + putative glycosyl hydrolase; poly-beta-1,6 + N-acetyl-D-glucosamine synthase; Glycosyl transferase + family 2" + 
/codon_start=1 + /transl_table=11 + /product="family 2 glycosyl transferase" + /protein_id="QCO91946.1" + /translation="MSCPEISVIVPVYNVERYLRQCMDSLINQTYRNFEIILVNDGST + DSSGILCEEWAKKDERIHVVHKKNEGLGFARNTGVEHAKGKHITFVDSDDYVSLDMLQ + TLYNAVQEYDVEVVYSAGYYRSFSNGEIKKTDVGTKKPQLFEGGDVASELLPDVISAP + PEYPNDGKVGVSAWKVLYKANLFKDKGLLFHSEREFISEDAIFQIDCLKLATSALVIP + DILYYYRENFGSLSMKYKEDRFELDKILYNEQLKRVEGLPNQEILEERIERILIANIR + LCIFQESLHKSSRIHKRLQRIRQICKDPVSKVVLHHYPIHRLPFPKRLICVLAKYNMS + LFLLALTLLKYRNRSV" + gene 11835..12740 + /gene="wchN" + CDS 11835..12740 + /gene="wchN" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3774" + /inference="protein motif:Pfam:PF05704.6" + /inference="similar to AA sequence:RefSeq:YP_001835073.1" + /note="mannosyltransferase OCH1-related enzyme" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide synthesis protein" + /protein_id="QCO91947.1" + /translation="MNIEKLKLSLKNRTFFPVVIHALRNRWPLWWIRSKAIREVQLED + RAYRILKKKYGSLISNSFDKAYLSEKVPKQIWICWFQGMENAPDLVKSCYKSVKREFP + DYKITVLTAQTIQQHVTIPEEILYKWNKGIINNANFSDVLRVEILSKYGGIWLDATVY + CTGNTIKELIEKNPFFMYKSLSSIEENISASSWMIASTANHPLILSAKKLLVEYWCRE + NIAIHYFVFHLLFTIVAENYSDVWQSVPTYTNAAPHIMIDELNNVFSKERYQQLCQIS + DFHKLNYKKNYNDKSESLYSYLLNQ" + gene 12752..14209 + /gene="wzx" + CDS 12752..14209 + /gene="wzx" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF01943.11" + /inference="similar to AA sequence:RefSeq:YP_001835074.1" + /inference="similar to AA sequence:UniProtKB:P37746" + /note="putative O-antigen transporter; polysaccharide + biosynthesis protein" + /codon_start=1 + /transl_table=11 + /product="transporter" + /protein_id="QCO91948.1" + /translation="MPSLKKNIVYNILYQILAVIVPFITSPYLARVLGAEQIGVYSFT + YSIAFYFMILSMLGISNYGNRTIAQVRTSREHLNQEFSNIYAVQLTCSLVMTVSYLIY + ATVFVNSFQIVAYIQVLHVLSYATDVSWFFYGLEEFRITVARNSFVKLLTLISIFTFV + KSPNDIYLYTFIMAGSTLLGQLITWPFLLKQVNFVRPSLGKIKEHMKPIIILFFPVLA + 
VSIFSFLDKIMLGMYSSLKETAFYENSDKIISIPKALIQAFGAVMLPRTVHLLSIGDE + QKSLEYVDKTMWAVLVITMGCAFGLAGVSVTFAPVYWGEEFRASSQIIAGMTPALAFS + AFGNVIRTQFLIPRSFDKEYTVSLLYGAVVNILINILLIPKIGAMGAVIGTIVAELVL + CYYQTWIARNYLHIREYLINAGILFLIGSVMYMVLILVSSILPTSLLTLIIEIIVGAF + IYISLLILYIFSSKNRVIIGLRTNFLERTHLFKRK" + gene 14212..15477 + /gene="wzy" + CDS 14212..15477 + /gene="wzy" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF04932.9" + /codon_start=1 + /transl_table=11 + /product="O-antigen ligase" + /protein_id="QCO91949.1" + /translation="MKFKFNPIAILYILLVYLELATDRQHLYPVTYMTKYYIGILITV + LFVLLLVGRGKVIFVNKKLLYLAKILAIPTIVLFLYSVLLDVMNPVEFNGYFSRLSST + TIFGLLAIFQAIVVFQFFGQKVVDYTFTAISLSYLTSIIVAFREGGLSQFILMLTDAS + FNGSVLEMHEVAPITALFILYYLYKYFIKENSFSLVFRNILIALIILFLSLKRIVFLS + VLIIIPVFLVIYWYDKKVSKLGKERKILSLLNSFSLIFITGIFLYVYSVKSGFIYTFI + QEHNINSMARTDLWKGIESTYSFAPIFMGRGIGFVTKWMDNNWMTLNINGLTESTGLH + NDILKYYIEIGFVGLFIYFYTLLYRNAKRIFVKIGHKESFIYFVLIMFQVLIWFTDNI + STYHNFLWILNLLLFSLTNTDAELETQKL" + gene 15557..16717 + /gene="wchX" + CDS 15557..16717 + /gene="wchX" + /EC_number="2.7.8.12" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF04464.8" + /inference="similar to AA sequence:RefSeq:YP_002510384.1" + /inference="similar to AA sequence:UniProtKB:P13485" + /note="CDP-glycerol:poly(glycerophosphate) + glycerophosphotransferase" + /codon_start=1 + /transl_table=11 + /product="glycerol phosphotransferase WchX" + /protein_id="QCO91950.1" + /translation="MKFYIKNLLKKVFTLPLHLLPIQSNKIIFDNFGGRGFGDNPKYI + LEELVSREKNLNLVWVTKDREMSIPEGVRVVKYGSYRSFYEWLTARVWVDNIRNSDRP + WKRKGQIYLQTWHGSDGVKLIEKSVAGNLKKTYLRMAKYDGKITDGIVSSRHFQTLGM + QNNFWLAENVEFLEFGLPRNDDFFKSEKIKTTNIKFRTLFDIDLDELVVLYMPTFRDD + GSLNAYNLDYSKLIHVFQNKFRKNVKILVRFHPNVDSSFINLQDTDCINVSTYSNPQD + LMMSADVMITDYSSASIDFMLLNRPVFLYLPDYQSYVNDRPLDDNFDKLPFPRAYHNN + ELTEIIRDFERSKYDEKVRLYELEDVRFDRGKASVQCANWIEEKIKNNKVID" + gene 16759..17151 + /gene="gct" + CDS 16759..17151 + /gene="gct" + /EC_number="2.7.7.39" + 
/inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG0615" + /inference="protein motif:CLUSTERS:PRK11316" + /inference="protein motif:Pfam:PF01467.1" + /inference="protein motif:TIGRFAMs:TIGR01518" + /inference="similar to AA sequence:RefSeq:YP_003875983.1" + /inference="similar to AA sequence:UniProtKB:P27623" + /note="glycerol-3-phosphate cytidylyltransferase; + bifunctional heptose 7-phosphate kinase/heptose + 1-phosphate adenyltransferase; cytidylyltransferase" + /codon_start=1 + /transl_table=11 + /product="CDP-glycerol-1-phosphate biosynthetic protein + Gct" + /protein_id="QCO91951.1" + /translation="MKRVITYGTFDLLHYGHINLLKRAKQLGDYLIVVVSSDEFNLKE + KNKVCYFNYEHRKNLVEAIRYVDLVIPETSWEQKKSDVKDYHIDTFVMGDDWKGKFDY + LEEEGVEVVYLPRTKEISTTKIKEDLSE" + CDS 17249..17362 + /inference="ab initio prediction:Prodigal:2.60" + /inference="similar to AA sequence:RefSeq:YP_006742607.1" + /codon_start=1 + /transl_table=11 + /product="heme-based aerotactic transducer" + /protein_id="QCO91952.1" + /translation="MAVIFKDVLVEEKTDEEKQHILSILNDENVRAFDCGY" + gene 17992..18861 + /gene="rmlA" + CDS 17992..18861 + /gene="rmlA" + /EC_number="2.7.7.24" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG4750" + /inference="protein motif:CLUSTERS:PRK15480" + /inference="protein motif:Pfam:PF00483.17" + /inference="protein motif:TIGRFAMs:TIGR01207" + /inference="similar to AA sequence:RefSeq:YP_815843.1" + /inference="similar to AA sequence:UniProtKB:P37744" + /note="glucose-1-phosphate thymidylyltransferase RfbA; + CTP:phosphocholine cytidylyltransferase; nucleotidyl + transferase" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase" + /protein_id="QCO91953.1" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLPRFKELLQDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFIGDDSV + ALILGDNIYHGPGLSKMLQKAAKKEKGATVFGYHVKDPERFGVVEFDENMNAISIEEK + PEQPCSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLNRGDLSVEVMGRG 
+ FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISRENVLALAQPLKKN + EYGQYLLRLIGEA" + gene 18862..19455 + /gene="rmlC" + CDS 18862..19455 + /gene="rmlC" + /EC_number="5.1.3.13" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF00908.11" + /inference="protein motif:TIGRFAMs:TIGR01221" + /inference="similar to AA sequence:RefSeq:YP_003878604.1" + /inference="similar to AA sequence:UniProtKB:Q5XCG7" + /note="putative dTDP-4-dehydrorhamnose 3,5-epimerase" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-dehydrorhamnose 3,5-epimerase" + /protein_id="QCO91954.1" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKNHPLLKDVKPLKKEDL" + gene 19468..20517 + /gene="rmlB" + CDS 19468..20517 + /gene="rmlB" + /EC_number="4.2.1.46" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK10084" + /inference="protein motif:Pfam:PF01370.15" + /inference="protein motif:TIGRFAMs:TIGR01181" + /inference="similar to AA sequence:RefSeq:YP_006742612.1" + /inference="similar to AA sequence:UniProtKB:P95780" + /note="dTDP-glucose 4,6 dehydratase; NAD-dependent + epimerase/dehydratase family protein" + /codon_start=1 + /transl_table=11 + /product="dTDP-glucose 4,6-dehydratase" + /protein_id="QCO91955.1" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPDVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAAD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + gene 20583..21434 + /gene="rmlD" + CDS 20583..21434 + /gene="rmlD" + /EC_number="1.1.1.133" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK09987" + 
/inference="protein motif:Pfam:PF04321.11" + /inference="protein motif:TIGRFAMs:TIGR01214" + /inference="similar to AA sequence:RefSeq:YP_141831.1" + /inference="similar to AA sequence:UniProtKB:P29781" + /note="dTDP-4-dehydrorhamnose reductase; RmlD + substrate-binding domain protein" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase" + /protein_id="QCO91956.1" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITDAEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + gene 21872..22384 + /gene="glf_1" + CDS 21872..22384 + /gene="glf_1" + /EC_number="5.4.99.9" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF03275.7" + /inference="protein motif:TIGRFAMs:TIGR00031" + /inference="similar to AA sequence:RefSeq:YP_004326638.1" + /inference="similar to AA sequence:UniProtKB:P37747" + /note="protoporphyrinogen oxidase" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase" + /protein_id="QCO91957.1" + /translation="MEEQAISLVGTDIYEKLIKDYTEKQWGKPTTELPSFIIRRLPVH + LTYDNNYFNDTYQGIPIGGYNVIIENMLKDVEVELGVNFFANRQELEASAEKVVFTGM + IDQYFDYKHGELEYCSLRFDHEVLDEENYQGNAVVNYTDAETPYTRIIEHKHFEFGSQ + AKTIITNRTF" + gene 22335..22664 + /gene="glf_2" + CDS 22335..22664 + /gene="glf_2" + /EC_number="5.4.99.9" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF03275.7" + /inference="protein motif:TIGRFAMs:TIGR00031" + /inference="similar to AA sequence:RefSeq:YP_006252639.1" + /inference="similar to AA sequence:UniProtKB:P37747" + /note="UDP-galactopyranose mutase" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="QCO91958.1" + /translation="MSLGVKQRLSLLIEHSKTWEKGDEPYYPVNNDRNNHLYKSYKKL + 
ADEQGNVIFGGRLGHYRYYDMHQVIGAALQCVRNELDSYSMKIKEQTRKLAAGCSKHC + FEVADGS" + gene 22901..24889 + /gene="aliA" + CDS 22901..24889 + /gene="aliA" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG4166" + /inference="protein motif:CLUSTERS:PRK15104" + /inference="protein motif:Pfam:PF00496.16" + /inference="protein motif:TIGRFAMs:TIGR02294" + /inference="similar to AA sequence:RefSeq:YP_001835080.1" + /inference="similar to AA sequence:UniProtKB:P31306" + /note="76 kDa cell surface lipoprotein; oligopeptide ABC + transporter substrate-binding protein OppA; ABC-type + oligopeptide transport system, periplasmic component; + nickel ABC transporter, nickel/metallophore periplasmic + binding protein; Bacterial extracellular solute-binding + proteins, family 5 Middle" + /codon_start=1 + /transl_table=11 + /product="oligopeptide ABC transporter + oligopeptide-binding protein AliA" + /protein_id="QCO91959.1" + /translation="MKSSKLFALAGVTLLAATTLAACSGSGSSSSTKGEKTFSYIYET + DPDNLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRK + DAKWYTSEGEEYAAVKAQDFVTGLKYAADKKSDALYLVQESIKGLDAYVKGEIKDFSQ + VGIKVLDEQTVQYTLNKPESFWNSKTTMGVLAPVNEEFLNSKGDDFAKATDPSSLLYN + GPYLLKSIVTKSSVEFAKNPNYWDKDNVHIDKVKLSFWDGQDTSKPAENFKDGSLTAA + RLYPTSASFAELEKSMKDNIVYTQQDSITYLVGTNIDRQSYKYTSKTSDEQKASTKKA + LLNKDFRQAIAFGFDRTAYASQLNGQTGASKILRNIFVPPTFVQADGKNFGDMVKEKL + VTYGDEWKDVNLADSQDGLYNPEKAKAEFAKAKSALQAEGVTFPIHLDMPVDQTATTK + VQRVQSMKQSLEATLGADNVIIDIQQLQKDEVNNITYFAENAAGEDWDLSDNVGWGPD + FADPSTYLDIIKPSVGESTKTYLGFDSGEDNVAAKKVGLYDYEKLVTEAGDEATDVAK + RYDKYAAAQAWLTDSALIIPTTSRTGRPILSKMVPFTIPFALSGNKGTSEPILYKYLE + LQDKAVTVDEYQKAQEKWMKEKEESNKKAQEDLAKHVK" +ORIGIN + 1 atgcaagaaa aatggtggca taatgccgta gtctatcaag tctatccaaa gagttttatg + 61 gatagtaatg gagatggagt tggtgatttg ccaggtatta ccagtaagtt ggactatcta + 121 gctaagttag gaatcacagc gatttggctt tctcccgttt atgacagccc tatggatgat + 181 aatggctacg atattgctga ttatcaagcg attgcggcta tttttggaac catggaggac + 241 atggatcagc tgattgcaga agctaagaag cgtgatatcc 
gtatcatcat ggacttggtg + 301 gtcaatcata cctcggatga gcatgcttgg tttgtcgaag cctgtgaaaa tactgacagc + 361 cctgagcgag actactatat ctggcgcgat gaacccaatg acctagattc tatctttagt + 421 gggtctgctt gggaatacga tgaaaagtca ggtcaatact atctccactt tttcagcaag + 481 aaacagccgg atctcaactg ggaaaatgaa aaacttcgcc agaaaattta tgagatgatg + 541 aacttctgga ttgataaagg tattggtggt ttccgtatgg atgttattga catgattggc + 601 aaaattcctg acgagaaggt agtcaataat ggtcctatgc tccatcccta tctcaaggaa + 661 atgaatcagg cgacctttgg agataaggag ctcttgacag taggggagac ttggggagca + 721 acgccagaga ttgccaagct ctactctgat ccaaaggggc aagaattgtc tatggtcttc + 781 cagtttgaac atatcggtct tcagtatcag gaaggtcagc ctaaatggca ctatcaaaaa + 841 gagctgaata tcgctaagtt aaaagaaatc ttcaacaaat ggcagacaga gttaggagtt + 901 gaggacggct ggaattccct cttctggaac aaccatgacc tccctcgtat tgtctcaatc + 961 tggggaaatg accaagaata ccgcgaaaaa tctgccaaag cctttgcaat cttacttcat + 1021 ctcatgagag gaactcctta tatctaccaa ggtgaggaga ttgggatgac caactatccg + 1081 tttgaaacac tggatcaagt agaagatatt gaatctctca actatgcgcg tgaggctctt + 1141 gaaaaaggtg ttccgattga agaaatcatg gacagtatcc gtgttattgg acgtgacaat + 1201 gcccgtaccc ctatgcaatg ggacgagagc aaaaacgctg gtttctcaac aggtcaacct + 1261 tggttggcgg ttaatccaaa ttacgagatg atcaatgtcc aagaagcgct ggcaaatcca + 1321 gattctattt tctataccta tcagaaactg gtccaaattc gcaaggagaa tagctggcta + 1381 gttcgagctg actttgaatt gcttgatacg gctgataagg tctttgctta tatacgtaag + 1441 gatggcgacc gtcgcttcct agttgtggct aacttgtcca atgaagagca agacttgaca + 1501 gtagaaggaa aagtcaaatc tgtcttgatt gaaaacactg cggctaaaga agtacttgaa + 1561 aaacaggtct tggctccatg ggatgctttc tgtgtggaaa tgactgacta gaatgagcaa + 1621 acctcaagtt tttgaagctt gaggtttttt actatagtgg attgaaacta gaatagtgca + 1681 cctctacttc taaaatattg ttagaaatcg atttgattgt cctgatcgat ttgtcctatt + 1741 cttatttcat tttactatac ttgtagttga ggagaattaa gctcctcact agtaaactct + 1801 tcataatcct ttttattttt atgaagatat tgtttgaaag atgtgagttt ccacggatgg + 1861 gtttgtggag ggatatactt gtgtctttct ttttttgttc tggttcttgt tcaaagtttt + 1921 tcgaatagag 
ttcatgatct agtagctcct ttgtgcgata gattttgtca gcgatattga + 1981 ggtagatgtc tccgttaaat gcttttataa ctaatgcttt cgtctttctg atgaaataga + 2041 cttcttttcc ttgttcggta gggatatagt aacgattttg gaatcggata tggtgtccac + 2101 tatcgacgac tctctccgcc agtctagcca gaatgagatt cctttcagaa gggttaggaa + 2161 cctcctcgaa gacagagagt tttgtcttgt ttccaaactg ttcattaaag gtttggatgt + 2221 aggaaagcag gaaggtattg gcttcttcca aggtatgaat attgtttcgt tccagttcga + 2281 taggcaggcg agattgtagt gtctgattaa gtctttcgac tctcccttta gcttgaggga + 2341 tagaggttgt ctccagaaga atccccagtt ggtgacaggc gtatccgaat tgtgtatgag + 2401 tgtcgtcctc cattttctta gagttggaga cttgataggt aaagactgtt cttttatctg + 2461 ttttgatttg aaggggaatg ccgtgattgc ctaaaatttg ttcgaggaca tgatagtaag + 2521 tattcaaggt ctcttgttta tcaaaataag cgcctaggat attgccagaa gcatcatcaa + 2581 tggctaagtg taagttagat gtttgtgctc caaaccaggc atgagggctg gcatccattt + 2641 gaatgagttc accagcaaat ttctttcttg gtctactagg atgtactttt ttagggtctt + 2701 caaggaagtt ttcagccgtc ggtaagattg gattatctag gggttgcttg gggttcagtt + 2761 tagcttgtct tcttactctc ttctttgtct ttctatgaga cttaggcgac aggatgtttt + 2821 ccttatagag tatttttcta acagttgtat cagagagctg aattccttct tcttcagcta + 2881 gcaattcaca gaaatgaagg acatttggtt tatatgtttc ataggagagg tattttttta + 2941 ggagacgtcc tttgatttca tcagggattg catgttttgg ttttcgattt ctgtttccgt + 3001 gtctgaaggc ttcttttcct ttcagttgat aggctagtag cagacgattg atttgccttt + 3061 cagaaagatt gagttcggca caggctcgtt tctttgtttt ctttccttgg gctatagctt + 3121 ttatcacaag atattttttc atttcattca tatttagttg gatccttttc atatgactat + 3181 tctaccaaat gggacatttt cacgttcgat ttactaaaga cattatcacc ttcgaatcac + 3241 aaagatgcag atagtgaaaa aaaggtgtag acattaccgt aaaaaagtga tataatcgta + 3301 agatgttcaa ggtataggtg ttaatcatga gtagacgttt taaaaaatca cgttcacaga + 3361 aagtgaagcg aagtgttaat atcgttttgc tgactattta tttattgtca gtttgttttt + 3421 tattgttctt aatctttaag tacaatatcc ttgcttttag atatcttaac ctagtggtaa + 3481 ctgcgttagt cctactagtt gccttggtag ggctactctt gattatctat aaaaaagctg + 3541 aaaaatttac tatttttctg ttgctgttct 
ctatccttgt cagctcagtg tcgctctttg + 3601 cagtacagca gtttgttgga ctgaccaatc gtttaaatgc gacttctaat tactcagaat + 3661 attcgctcag tgtcgctgtt ttagcagata gtgagatcga aaatgttacg caactgacga + 3721 gtgtgacagc accgactggg actgataatg aaaatattca aaaactacta gctgatatca + 3781 agtcaagtca gaataccgat ttgacggccg accatagttc gtcttacttg gctgcttaca + 3841 agagtctgat tgcaggggag actaaggcca ttgtcttaaa tagtgtcttt gaaaatatca + 3901 tcgagtcaga gtatccagac tacgcatcga agataaaaaa gatttatatc aagggattca + 3961 ctaaaaaagt agaagctcct aagacgtcta agaatcagtc tttcaatatc tatgttagtg + 4021 gaattgacac ctatggtcct attagttcgg tgtcgcgatc agatgtcaat atcctgatga + 4081 ctgtcaatcg agataccaag aaaatcctct tgaccacaac gccgcgtgat gcctatgtac + 4141 caatcgcaga tggtggaaat aatcaaaaag ataaattaac ccatgcgggc atttatggag + 4201 ttgattcgtc cattcacacc ttagaaaatc tctatggagt ggatatcaat tactatgtgc + 4261 gattgaactt cacttctttc ttaaaaatga ttgacttatt gggaggggta gatgttcata + 4321 atgatcaaga gttttcagct ctacatggga agttccattt cccagtaggg aatgtccatc + 4381 tagactctga gcaggctcta ggttttgtac gtggacgcta ctcactagcc gatggagacc + 4441 gtgaccgtgg tcgcaaccaa caaaaggtca ttgtagcaat tattcagaag ttaacttcta + 4501 cagaggtttt ggaaaactat agtagtattc ttcaaggatt gcaggattct cttcaaacaa + 4561 atatgccgat tgagactatg atagatttag tgaatactca gttggaaagt ggagggaatt + 4621 ataaagtaaa ttctcaagat ttaaaagaga caggtcggat ggatcttcct tcttatgcaa + 4681 tgccagacag taacctctat gtgatggaaa tagatgacag tagtttaact gtagttaaag + 4741 cagctataca gtatgtgatg gagggtagat gaaatgatag atatccattc gcatatcgtt + 4801 tttgatgtag atgacggtcc caagtcaaga gaggaaagca aggctctctt ggcagaagcc + 4861 tacaggcagg gggtgcgaac cattgtctct acctctcacc gtcgcaaggg catgtttgaa + 4921 actccggaag agaagatagc agaaaacttt cttcaggttc gggaaattgc aaaagaagta + 4981 gcagatgatt tagtcatcgc ttatggcgca gagatatact atactctgga tactctagaa + 5041 aagctagaaa aaaaagaaat tcctaccctt aatgatagtc gttatgcttt gattgagttt + 5101 agcatgcata cttcctatcg tcagattcat acgggattga gcaatatttt gatgttggga + 5161 atcacgccag taattgctca tattgaacgg tatgatgctt tagagaataa 
cgaaaaacat + 5221 gttcgtgaac tgattgatat ggggtgctat actcagataa atagttatca tgtttcaaaa + 5281 cctaagttct ttggtgaaaa atataaattc atgaaaaaga gagctcggta ttttttggaa + 5341 cgtgatttag ttcatgtagt tgcaagtgac atgcacaatt tagacagtag acctccatat + 5401 atgcaacaag catatgatat cattgctaag aaatatggag cgaaaaaagc gaaagaactt + 5461 tttgtagata atcccagaaa aattataatg gatcaattaa tttaggagaa aatatgaagg + 5521 aacaaaacac tttggaaatc gatggattgc aactattcag agctttatgg aaaagaaagt + 5581 tggtcatttt attagtggca attataactt cttcagttgc ttttgcctac agtacttttg + 5641 ttatcaaacc tgagtttact agtacgactc ggatttatgt agttaaccgt aatcaggaag + 5701 agaagcctgg tttaaccaat caagacttgc aggcaggatc atacttggtt aaagactatc + 5761 gtgaaattat cctatcgcag gatgttttgg aggaagttgt ttctgatttg aaactagatt + 5821 tgacgccaaa aggtttggct aataaaatta aagtaacagt accagttgat acccgtattg + 5881 tctctgtttc agttaatgat cgagttcctg aagaggcaag ccgtatcgct aactctttga + 5941 gagaagtagc tgctcaaaaa attatcagta ttactcgtgt ttctgatgtg acaacactgg + 6001 aggaggcaag accggcgata tcaccgtctt caccaaatat taaacgcaat acactaattg + 6061 gttttttggc aggggggatt ggaactagtg ttatagtttt tcttcttgaa cttttggaca + 6121 ctcgtgtgaa acgtccggaa gatatcgaag atacactaca gatgacactt ttgggagttg + 6181 taccaaactt gaataagttg aaataggaga gagagatgcc gacattagaa atagcacaaa + 6241 aaaaactgga gttcattaag aaggcagaag aatattacaa tgccttgtgt acaaatatac + 6301 agttgagcgg agataaacta aaagtaattt ccgttacttc tgttagccct ggggaaggaa + 6361 aaacaactac ttccgtaaat atagcatggt cgtttgcgcg tgcaggctat aaaactcttt + 6421 tgattgatgg agatactcga aattcggtta tatcaggatt ttttaaatct cgtgaaaaga + 6481 ttacaggtct aacagaattt ttatctggga cagctgattt atctcacggt ttatgtgata + 6541 caaatattga aaatttattt gtagttcaat cgggagctgt atcaccaaac cctacagcct + 6601 tgttacaaag taaaaatttt aatgatatga ttgaaacatt gcgtaaatat tttgattata + 6661 tcattgttga tacagcacct attggaattg ttattgatgc ggcaattatc actcaaaagt + 6721 gtgatgcgtc catcttggta acagcaacag gtgagacgaa taaacgtgat gtccaaaaag + 6781 cgaaacaaca attaaaacaa acagggaaac tgttcctagg agttgtttta aataaattag + 6841 atatctcggt 
tgataagtat ggagtttacg gtttctatgg aaattatggt aaaaaataac + 6901 ttaggaaaga ttttatggat gaaaaaggat tgaaaatttt tctggcagta ttacagagta + 6961 ttgttgtcat tttattgatt tattttctta gctttgttag agagacagaa gttgaacgtt + 7021 cttcgatggt tatactatac cttctccact tttttgtatt ctattttagt tcctatggta + 7081 acaatttttt taaaagaggg cacctagttg agtttaatag tactataaga tatatttttt + 7141 tctttgcaat agctataagt gtattaaact tttttatagc ggaacggttt agtatctcta + 7201 gaagaggaat ggtatacttc ttaactttag aaggaatatc cttatacttg ttaaatttct + 7261 tagtaaagaa atattggaag catgtgtttt ttaatctaaa aaatagcaag aaaattttac + 7321 tgttaacagt aacgaaaaat atggaaaaag ttcttgataa attgttagaa tctgatgaac + 7381 tttcatggaa attggtagca gtaagtgttt tggataaatc tgattttcaa catgataaaa + 7441 tacctgtaat tgaaaaggaa aaaattattg aatttgcaac gcatgaagtt gtggatgagg + 7501 tgtttgtcaa tcttccagga gagagctacg atattggaga aattatctct aggtttgaga + 7561 caatggggat agatgtaact gtaaatctta atgcatttga taagaatttg ggtcgcaata + 7621 aacaaattca tgagatggta ggattgaatg tagtcacttt ctctaaaaat ctttataaaa + 7681 ctagtcatgt gatttcaaag agaattctcg atatttgtgg tgccactatt ggccttattc + 7741 tttttgctat agctagtcta gttttagttc cattgattcg taaagatggc ggaccagcta + 7801 tttttgctca gacgcgtata gggaaaaatg gtcgacattt taccttttat aaattccgtt + 7861 cgatgcggat cgatgctgaa gctatcaaag aacagttgat ggatcaaaat acgatgcaag + 7921 gtggtatgtt taagataaac aatgatcctc gtgttacaaa aattggccgc tttattcgta + 7981 aaaccagttt ggatgagata ccccagtttt ggaatgtctt tataggagat atgagtttgg + 8041 tgggaacacg tccacctaca gtagacgagt atgatcagta tactccagaa cagaaacgtc + 8101 gactcagctt taaacctggt attacaggtt tatggcaggt tagcggccgt agtaaaataa + 8161 ccgattttga cgctgttgta aaattagatg tggcttatat tgataattgg acaatctgga + 8221 aagatattga aattttgctt aaaactgtta aagttgtatt tatgagagat ggagcgaagt + 8281 aatttctgta tatccatcct attaggagag aaatgaaaaa gtcagtttat atcattggtt + 8341 caaaaggaat tcctgctaag tatggaggat ttgaaacttt tgttgaaaaa ttaacagcct + 8401 tccaacaaga taaggctatc caatattatg tggcttgtat gcgtgaaaac tctgcaaaat + 8461 cagggactac tgaggatgtt tttgaacata 
atggtgctat ctgttataac gtcgatgttc + 8521 ctaatattgg tccagcgcga gctatagcgt atgatatcgc tgcaattaac agagctattg + 8581 aaattgccaa agaaaataag gatgaagatc caatcttcta tattttagct tgtcgaattg + 8641 gtccgttcat ccatggaatt aagaaaagaa ttcaagcaat aggtgggact cttctggtta + 8701 atccagatgg tcacgagtgg ttacgagcca agtggagtgc tcctgttcgt cgctactgga + 8761 aaatttctga aggtcttatg gtcaaatatg cagatttttt agtgtgtgat agtaagaata + 8821 ttgaaaaata tatccaagaa gattataaac agtatcaacc taaaacaacc tatatcgctt + 8881 atggaacaga tacaacacgc tctacattaa aaagtagtga tgaaaaagta cgttcttggt + 8941 tcaaagagaa gaatgtttct gagaacgagt attatctagt tgtaggacgt tttgtaccag + 9001 aaaacaacta tgaatctatg attcgtggct ttttggcgtc taactctaag aaggactttg + 9061 ttttaatcac aaatgtagaa cagaataaat tttataatca gttgttggca aaaactgctt + 9121 ttgataagga cccacgagta aaatttgttg gaacagtcta cgatcaagaa cttctgaagt + 9181 atattcgaga aaacaccttt gcttacttcc atggacatga agttggagga accaatcctt + 9241 cgcttttaga agctctggca tcaactaaac tgaatttatt gctagatgtt ggctttaacc + 9301 gagaagttgg ggagcaaagt gcaatctatt ggaaaaaaga tgagctttcc caagtaatcg + 9361 agaaagttga acaatttgat gcaaaaaaga ttgatgagtt agatagacaa tcaaatcaga + 9421 gaattgtgga ttctttcact tgggaaaaga ttgtcacaga ctacgagaaa ttatttaaaa + 9481 aatgaaaata ttacattata ctttaggatt tcaaccccag cgaacaggtg gtttggttaa + 9541 atatgctgag gatttaatgc tagagcaaat tgctcaaggt tatcaagtag ccgccctatg + 9601 tccagggaga attaagttct tttcaaaaaa aatagaaata attaaagcga cgtcaaggca + 9661 gtttgagtgt tatgaactgc ttaatagctt acctatagct ttatttggag gtatatccga + 9721 tccaactgct ttcatgacac cttgtgacaa aaatgtttat cgtacttttt tagaaaaagt + 9781 acaacccgac attatacata ttcactcgtt tatgggattg cataaagaat tcctcgaaat + 9841 tgctaaaaac ttgaatatta gagtggtttt tacgagccat gattattatg gattagcacc + 9901 cgtacctcat ttctatttta atggggtgga ttatagtgat aaaaatacaa acttaacatg + 9961 gaatattatg tcttccaatg ctttaagtgt gaaaaaacta agactttttc aagtttcatt + 10021 ttatcctact attcgtaaac ttttgaaact attagggaaa aatccaaaat ctaaaaagaa + 10081 tttagttatt cgagatgtta ttgaggaaca agattatagt gaacttcgat 
actattataa + 10141 tgagatgttt cacttaatag atggttattt gtttaatagt agacttgcaa agaaggtata + 10201 tgagataaac gagattcaac cagttaatag tgtagtatta tctataacaa gtagttcaat + 10261 taaacatcat cagagattaa cgactacaaa taataagatt agggtttctt atattggttc + 10321 agacgaagaa tataaaggtt actttgattt tattgacttt gctggaactt tagaacaaga + 10381 atcatatgaa gtggtaactt atggtcattt accaaatgaa gagtgccctt cattcattga + 10441 acaaaaagga tattttacca aggaaacgat tgacagtgtc tatgaaaata ttgatatttt + 10501 gattatagca agcaaatgta aagaaacctt tggattgata acagtagaag cattatccta + 10561 tggggtaaat gtttttgtga gtgaaaatgt tggatcaaaa gacttgcttc cagaaacaca + 10621 tgtttttaaa gacaaggaag atttgttggc taaaatcatc aataatcagt tggagaaagt + 10681 tccgcttaaa acgatggaaa aacatgtaga agaagttatt agttattaca aacaggttag + 10741 aagcaacaat taaggagaat gattaaagat atgtcctgtc cagaaattag cgtaattgta + 10801 ccagtttata atgtggaacg atatttaaga cagtgtatgg attcattgat aaatcaaact + 10861 tataggaatt ttgaaataat tttagtaaac gatggatcaa cggattcttc tgggattctc + 10921 tgtgaagagt gggcaaaaaa agatgaaaga attcatgtgg ttcataaaaa aaatgagggg + 10981 cttggcttcg ctcgtaatac aggggttgaa cacgcaaagg ggaaacacat aacctttgta + 11041 gattcagatg actatgtttc tctagatatg ctgcaaactc tatataatgc tgttcaagaa + 11101 tatgatgtcg aagttgtata cagtgcggga tattatcgtt cctttagtaa tggggaaata + 11161 aagaagacag atgtaggaac aaaaaagcct caacttttcg aaggaggaga tgttgcctct + 11221 gaattactcc ctgatgtaat ttctgctcct cctgaatatc caaatgatgg gaaagttgga + 11281 gtgtcggcat ggaaggttct ctacaaagct aatttattta aggataaagg gctattattt + 11341 cattcggaaa gagaattcat ttcagaagat gctatttttc aaattgattg tttaaaatta + 11401 gcaacatctg cccttgttat cccagatatt ttatactact atcgtgaaaa ctttggttct + 11461 ttaagtatga aatataaaga agatcggttt gagttggata aaatcttgta taacgagcaa + 11521 ttaaaaagag ttgaggggtt acctaatcaa gaaattttgg aagaaagaat cgagagaatt + 11581 ttaattgcta atattcgttt atgtatcttt caggaatctt tacataaaag ttctagaata + 11641 cataaacgct tgcaaagaat tagacagatt tgtaaggatc cagtctcaaa agtagtttta + 11701 caccactatc caatccatcg tttacctttt cctaaacgtt tgatctgtgt 
attagctaag + 11761 tataatatgt cgctgtttct tttagcttta accctattaa aatatcggaa tcggagtgta + 11821 taacttttat ggggatgaat atagaaaaat taaaactatc tttgaaaaat agaacgtttt + 11881 ttcctgttgt tattcatgcc ttacgtaacc gttggccctt gtggtggatt cggagtaagg + 11941 ctattcgaga agtacaactt gaagataggg cctacagaat actaaaaaag aaatacggtt + 12001 ccttaatttc aaactctttt gataaagcat acttatcaga aaaagttccc aagcaaatct + 12061 ggatttgctg gtttcaaggt atggagaatg ctccagattt ggtgaaatca tgttataagt + 12121 ctgttaaaag agaatttcca gattataaaa ttacagtatt aacggctcag actattcaac + 12181 agcatgtaac aattcctgaa gaaattttgt ataagtggaa taaaggtatc ataaataacg + 12241 caaatttttc agatgttttg cgtgttgaga ttttatctaa atatggaggt atttggttag + 12301 atgctacagt ttattgcact ggtaatacaa ttaaggaatt aattgagaaa aatccatttt + 12361 ttatgtataa gagtctatct tcaatcgaag aaaatatttc tgcatcaagc tggatgattg + 12421 cttcaacagc aaatcaccct ttaatactat ctgcgaagaa gttgctagta gaatattggt + 12481 gtagagaaaa tattgcaatc cattattttg tttttcattt gctgttcacg attgtagctg + 12541 aaaattattc ggatgtttgg cagtctgtac ccacctatac gaacgcagca ccacatataa + 12601 tgattgatga attaaataat gttttttcaa aggaacgtta ccagcaattg tgtcaaattt + 12661 cagattttca taaattgaat tataaaaaaa attacaatga taaatctgag agtttgtata + 12721 gttacttact gaatcagtag aggggagaat cttgcctagt ttaaagaaaa acattgttta + 12781 caatatctta tatcagatct tagctgtaat agtaccgttt attacctcac cttatttagc + 12841 tcgtgtgtta ggtgcagagc aaattggagt ttattctttt acctattcca ttgcttttta + 12901 ctttatgatt ctgtccatgt tggggatttc taattatggg aatcggacaa tagcacaggt + 12961 acgaacaagt agagaacatt tgaatcagga attttcgaat atttacgcgg ttcagttgac + 13021 gtgttcacta gtaatgaccg tctcatattt gatttatgca acagtatttg tgaatagttt + 13081 tcagattgta gcctatatcc aagtattaca tgttttatcg tatgcaacag atgttagttg + 13141 gtttttttat ggtcttgaag agtttcgtat tacggttgct aggaattcat ttgttaaatt + 13201 attgacttta atatctatct ttacatttgt aaaaagccct aatgatatct atttatatac + 13261 ctttataatg gcagggagta ccctgcttgg tcagttgatt acatggccat ttttgctaaa + 13321 acaagtaaac tttgtgcgcc ctagtcttgg aaaaataaag gaacacatga 
aacctattat + 13381 tattttattt ttccccgtct tagcggttag tattttttcg tttttagata aaataatgct + 13441 tgggatgtat agtagtttga aggaaactgc tttttatgag aattcagata agatcattag + 13501 tattccaaaa gctctgattc aagcctttgg agctgtaatg ttgcctcgaa cagtacattt + 13561 actgagtata ggtgatgaac aaaaaagttt agaatatgtt gataaaacga tgtgggctgt + 13621 tttagtgatt acaatgggct gtgctttcgg tttagcagga gtttctgtaa cctttgctcc + 13681 tgtttattgg ggtgaagaat ttagggccag tagccaaatt attgcaggaa tgacaccggc + 13741 tttagcattt tcggcttttg gaaatgtcat ccgaacccag tttttaattc cacgaagttt + 13801 tgacaaggaa tatacggtat ctttgcttta tggagccgtt gttaatattt tgattaatat + 13861 tcttttgatt ccgaagatag gagcaatggg agctgttatt ggaacaattg ttgcagagtt + 13921 agttctatgt tactatcaaa catggattgc tagaaattat ttacatatca gagaatatct + 13981 gataaatgct gggatattat ttcttattgg ttcagtaatg tatatggttt taattcttgt + 14041 ttcaagtatt ttacctactt cgttacttac acttattatt gaaattatag tcggagcttt + 14101 catttatatt agtttactga ttctgtatat cttttcttca aaaaacaggg taattattgg + 14161 tttacgaaca aattttttag aacgtactca tttatttaaa aggaagtaat agtgaaattt + 14221 aaatttaatc caatcgcgat actgtatata ttgctagtat acttagagtt agctacagat + 14281 aggcaacatc tgtatccagt aacgtacatg acaaaatatt atattggtat tttaatcact + 14341 gtgttgtttg ttttgttatt agtaggccgt gggaaggtta tttttgttaa taaaaaatta + 14401 ttatatcttg ctaagatatt agctatacca acaattgttc ttttcctgta ctcagtctta + 14461 ctagacgtaa tgaacccagt tgaatttaat ggatatttta gtagattatc aagtacgact + 14521 atttttggtt tgttagctat ctttcaagct atagttgttt ttcaattttt tggacaaaaa + 14581 gtagtagatt acacttttac agctatctcc ctcagctact taaccagtat cattgttgcc + 14641 tttagggagg gaggacttag tcaatttatc ttgatgctaa cagatgctag tttcaatggt + 14701 tcggtactag aaatgcatga agttgcacct attacagctc tctttattct gtactatttg + 14761 tacaaatatt ttataaaaga aaatagtttt tctttagtat ttcgtaatat cttaatagct + 14821 ctcattattc tttttttaag ccttaaacga atcgtttttt tgagtgtatt aattatcata + 14881 ccagtatttt tggtaattta ttggtatgat aaaaaagtaa gcaaactagg gaaagaacga + 14941 aaaattttaa gtttattaaa tagcttttcc ttaatattta taacaggaat 
attcctttat + 15001 gtttatagtg taaaatctgg ttttatatat acatttattc aagaacataa tattaattcg + 15061 atggctagaa cagatttatg gaagggaatt gaatcaacct atagttttgc ccctatattt + 15121 atggggagag ggatagggtt tgtaacaaaa tggatggata ataattggat gactttgaat + 15181 atcaatggtc ttacagagtc aacggggctc cataatgata ttttgaagta ctacattgag + 15241 ataggatttg taggattatt tatttatttt tacactcttc tttatagaaa tgctaaacgt + 15301 atatttgtaa aaattggtca taaagaatca ttcatatatt ttgtattgat aatgtttcag + 15361 gtgctgatat ggtttacaga taatatttca acttaccata attttttatg gattctaaat + 15421 ctactgctct tttctttaac taatacggat gcagagttgg aaactcagaa attataaaat + 15481 atttatttct tgaatttatg gtcttacgcc gtaaatttga tttcactaat gaccaatact + 15541 aatttataaa agtaatatga aattttatat aaaaaattta ttaaaaaaag tctttacatt + 15601 accgttgcat ttattgccta ttcagtctaa taagataata tttgataatt ttggtggtag + 15661 aggttttggg gacaatccta agtatatact tgaagaactt gtctctcgag aaaagaatct + 15721 aaatcttgtg tgggtaacaa aagatagaga aatgtctatc cctgaaggcg ttcgagtagt + 15781 aaaatacggc agttaccgtt ctttttatga atggttaaca gctagagttt gggtagataa + 15841 tattcgtaat tctgatcgac cttggaagcg aaaaggacag atttatcttc aaacttggca + 15901 tggttcagat ggggtaaagt taattgaaaa aagtgttgca gggaatctaa aaaaaacata + 15961 tcttagaatg gcgaagtatg atggaaagat tacagacggt atcgtatcaa gtcggcactt + 16021 tcaaactttg ggtatgcaaa ataatttttg gctggcagag aatgtggaat ttctggaatt + 16081 tggattacct cgaaatgatg atttttttaa aagtgaaaaa atcaaaacca caaatataaa + 16141 atttagaaca ttatttgata tcgatttaga cgaactggta gttttgtata tgccgacgtt + 16201 cagagatgat ggatcgttga atgcctataa tttagattac tcgaaactaa tacatgtttt + 16261 tcaaaataaa tttagaaaaa atgtaaaaat attagttcgt tttcatccaa atgttgattc + 16321 tagttttata aatttacagg atacagactg tataaatgtg tcgacctatt caaatcctca + 16381 ggatctgatg atgagtgcag atgtgatgat tacggattat tcatcggctt ctattgattt + 16441 tatgttatta aatcgtccag tatttctgta tttaccagat tatcaaagtt atgtgaatga + 16501 tagaccattg gatgataact ttgataaatt gccatttcca agagcatatc ataacaatga + 16561 gttgacagaa attattagag actttgaaag aagtaaatat gatgaaaaag 
ttcgtctgta + 16621 tgaattagag gatgttcgtt ttgatagagg aaaagcatca gtacagtgtg ctaattggat + 16681 tgaagaaaaa ataaaaaaca ataaagttat tgattgaaat aattatattt attgaattat + 16741 aaataaggag gtctttagat gaaaagagtt ataacatatg gtacatttga tttattgcat + 16801 tatggtcata tcaatctttt gaaacgtgct aaacagctag gtgattattt gattgtagtt + 16861 gtttcaagtg atgagtttaa tttaaaagaa aagaataaag tatgttactt taactacgaa + 16921 cacagaaaaa atttagtaga agctattcga tatgtcgatt tagtaatccc tgaaactagt + 16981 tgggaacaga aaaagtcaga tgttaaagac taccatattg acacttttgt aatgggtgat + 17041 gattggaaag gtaaatttga ttatcttgaa gaagaaggtg ttgaagtagt ctatttgcct + 17101 agaacaaagg aaatatcaac cacaaagata aaagaagatt tatcggaatg aaatattatt + 17161 aaaaaatgct gacataagaa attgtggctt ttgtgtctag tttttgatag aataaagtaa + 17221 caacacttta accaatgagg tgtgaataat ggcagtaatt tttaaagatg tacttgttga + 17281 agagaaaact gatgaagaaa aacaacatat tttatctatt ttaaatgatg agaatgttag + 17341 agcttttgat tgtggatatt aagaattgaa tgatgttttt tgatatttag aacaaatacg + 17401 atgaagaaac aggccatgta ttgcctattg taaatcaaaa ttttgaatta ttaggtttta + 17461 tttcttgtag actagtatca ttttctttca tagctcaggt taaagagatg ggaattagca + 17521 tagattatct tggtattcat aaggattgcc agaaaatggg ggatcggttc gcttttggtg + 17581 ctctttgcgc ttcgattatc tttaactatt tactgttgat taccaataaa aggtgtaata + 17641 gttcatgctc tagaggatgt tgtagaattc tatgacaaac tgggttttat tgaccctaga + 17701 gatatagtta tttataatgg caaaccggtt actatatatt ttagtattga aaaactaaga + 17761 aatggtgaaa attattcctc tcacacagtt atttgaaaca tccttagaaa atgattttta + 17821 attgtatgca aacaaagtag aattcgctta tttcatctta tgctaaatgt aatatgaaac + 17881 aagtgaattt ttatagataa agaagaattt taaaaaatgt gatgattatt tttagagcag + 17941 tacagaatta atagtaattg actctaaatc aataaagaaa ggtaccctat tatgaaaggt + 18001 attattctag caggtggttc ggggacacgt ttatatcctt tgactcgagc tgcatcaaaa + 18061 caactgatgc cggtttatga taaaccgatg atttactatc cactttcaac attgatgttg + 18121 gctgggatta gggatatttt gataatctca actcctcaag atttgcctcg ttttaaagag + 18181 cttcttcaag acggatctga gtttgggatt aaactttctt atgcagagca 
accaagtcca + 18241 gatggtttgg cacaagcctt tatcattggg gaagagttta ttggtgatga tagtgttgct + 18301 ttgatcttgg gggacaatat ctatcacggc cctggtttga gcaaaatgct tcaaaaagca + 18361 gccaagaaag agaaaggtgc gactgtcttt ggctaccatg tcaaggatcc agaacgcttt + 18421 ggtgttgtag aatttgatga aaatatgaat gctatctcca tcgaagaaaa accagaacag + 18481 ccgtgctcta actatgcagt gacaggactg tatttctatg ataacgatgt tgtcgagatt + 18541 gccaaaagta ttaaaccaag tcctcgtggt gaattggaaa ttacagatgt aaacaaggct + 18601 tacctaaatc gtggagattt atccgttgag gttatgggac gcggctttgc ttggttggat + 18661 actggaacac atgaaagttt actggaggct tcacagtaca tcgaaacagt ccaacggatg + 18721 caaaatgttc aggtagcaaa cttagaagaa attgcttacc gtatgggcta tatcagtcga + 18781 gaaaatgtat tggccttagc ccaaccactt aagaaaaatg aatacggaca gtatctgctc + 18841 cgtttgattg gagaagcata gatgacagat aattttttcg gtaagacgct tgcggcacgc + 18901 aaggttgaag ctattccagg catgttggag tttgatatcc ccgttcatgg agataatcgt + 18961 ggctggttta aagaaaattt ccaaaaggaa aaaatgcttc cacttggatt tccagagtct + 19021 ttctttgcag aaggaaaatt gcaaaacaat gtatccttct cacgtaaaaa tgtccttcga + 19081 ggcctccacg cagagccttg ggataagtac atctctgtag cagatggagg gaaagttctg + 19141 ggttcttggg ttgatctacg cgagggtgaa acctttggga atacctatca gacagtgatt + 19201 gatgcgagta agggaatctt tgttcctcga ggcgtagcta atggcttcca agttttatca + 19261 gatacagtgt catatagcta tctggtcaat gattactggg ctcttgaact caaacccaag + 19321 tatgcctttg tgaactacgc tgatccaagc cttggtattg aatgggaaaa tattgcagaa + 19381 gcagaggttt cagaagcaga taaaaatcat ccactactta aggatgtaaa acctttgaaa + 19441 aaagaagatt tgtaaaaagg aaagaatatg actgaataca aaaatattat cgtgacaggt + 19501 ggagctggct ttatcggttc taactttgtc cattatgttt acgagaactt tccagatgtt + 19561 catgtgacag tcctagataa gttgacttat gctggaaacc gcgcgaatat tgaggaaatt + 19621 ttaggtaatc gtgttgagtt agttgttggt gacattgctg atgcggagtt ggtagacaag + 19681 ttggctgctc aagcagatgc tatcgttcat tatgcagcgg aaagccacaa tgataattcg + 19741 ctcaatgatc catcgccatt tattcatact aacttcatcg gaacctatac tcttttagaa + 19801 gctgctcgta agtatgatat tcgcttccac catgtatcga cagatgaagt 
ttatggggat + 19861 ctccctttac gcgaggattt gccaggtcat ggtgaaggac caggtgagaa atttactgct + 19921 gaaacaaaat acaacccaag ctctccgtac tcatcaacca aggcagcctc agatttgatt + 19981 gtcaaagcct gggtgcgttc ttttggagtc aaggcaacga tttccaactg ttcaaataac + 20041 tacggtcctt atcaacatat cgaaaaattc atcccacgtc agattactaa catcctaagt + 20101 ggtatcaagc caaaacttta cggtgaaggt aagaacgttc gtgattggat tcataccaat + 20161 gaccattctt caggagtttg gacaatcttg acaaaagggc aaatcggtga aacctacttg + 20221 attggggctg atggtgagaa gaacaataag gaagttttgg aacttatcct taaggaaatg + 20281 ggacaagctg cggatgccta tgatcatgtg actgaccgtg caggacatga ccttcgctat + 20341 gcgattgatg ctagcaagct ccgtgatgag ttggggtgga aacctgaatt taccaacttt + 20401 gaagctgggc tcaaggcaac aatcaagtgg tatacagata accaagaatg gtggaaagca + 20461 gagaaagaag ctgttgaagc caattatgct aagactcagg agattattac agtataaaaa + 20521 gcaggaaata gctgcttttt attgctatat tgggaagagt tacatattag aaaggtctag + 20581 agatgatttt aattacaggg gcaaatggcc aattaggaac ggaacttcgc tatttattgg + 20641 atgagcgtaa tgaagaatac gtggcagtag atgtggctga gatggacatt accgatgcag + 20701 aaatggttga gaaagttttt gaagaggtga aaccgacttt agtctaccac tgtgcagcct + 20761 acaccgctgt tgatgcagca gaggatgaag gaaaagagtt ggacttcgcc atcaatgtga + 20821 cggggacaaa aaatgtcgca aaagcatctg aaaagcatgg tgcaactcta gtttatattt + 20881 ctacggacta tgtctttgac ggtaagaaac cagttggaca agagtgggaa gttgatgacc + 20941 gaccagatcc acagacagaa tatggacgca ctaagcgtat gggggaagag ttagttgaga + 21001 agcatgtgtc taatttctat attatccgta ctgcctgggt atttggaaat tatggcaaaa + 21061 acttcgtttt taccatgcaa aatcttgcga aaactcataa gactttaaca gttgtaaatg + 21121 accagtacgg tcgtccgact tggactcgta ccttggctga gttcatgacc tacctagctg + 21181 aaaatcgtaa ggaatttggt tattatcatt tgtcaaatga tgcgacagaa gacacaacat + 21241 ggtatgattt tgcagttgaa attttgaaag atacagatgt cgaagtcaag ccagtagatt + 21301 ccagtcaatt tccagccaaa gctaaacgtc cgctaaactc aacgatgagc ctggccaaag + 21361 ccaaagctac tggatttgtt attccaactt ggcaagatgc attgcaagaa ttttacaaac + 21421 aagaagtgag ataagtagta gaatgatttt ctagtctaat aaaagaggca 
gagaatgaac + 21481 tccaaaggag cttaagatgt acgattatct tgttgttggt gcagtctttg cccatgaagc + 21541 agtcttaaaa ggaaaaaaag taaaagttat tgaaaaatga aatcatatcg cgggtaatat + 21601 ctatactcgt gaagaggaag gaattcaagt tcatcaatat ggtgctcata tcttccatac + 21661 ttctgataag gagatctggg attatgtaaa tcagtttgca gagtttaacc gttataccaa + 21721 ttctcctgtt gcaaactata agggagagat ttataactta ccttttaata tgaatacctt + 21781 caataaactc tggggagttg tgacgccagc agaagcataa gctaagattg atgaacaatg + 21841 tgctatttta aatggtaaaa ctcctgaaaa tttggaagaa caggcgattt ctcttgtagg + 21901 tacagacatc tacgaaaaat taatcaaaga ctatacagag aaacagtggg gcaaaccaac + 21961 tactgaactt ccatccttta ttattcgccg tttaccagta cacctgacct atgataacaa + 22021 ctattttaac gatacctatc aagggattcc aattggtggt tataatgtta tcatcgaaaa + 22081 tatgctgaag gatgtagaag tagaacttgg agtgaacttt tttgccaatc gtcaagaatt + 22141 agaggcttct gctgaaaagg ttgtctttac agggatgatt gaccaatact ttgattataa + 22201 acatggtgag ttagaatact gtagtcttcg ttttgatcat gaagttctag atgaggaaaa + 22261 ctatcaagga aacgcagttg tgaactatac ggatgcagaa accccatata ctcgcattat + 22321 tgaacacaaa cattttgagt ttgggagtca agcaaagact atcattacta atagaacatt + 22381 ctaaaacatg ggaaaaaggt gatgagcctt attatccagt taataatgat cgtaataatc + 22441 atttgtataa atcatataaa aaacttgctg atgagcaagg gaatgttatc tttggtggcc + 22501 gcttaggaca ctatcgttat tacgatatgc accaagtaat tggagcagct ttgcagtgcg + 22561 tgagaaatga gttagattca tactcaatga aaatcaaaga gcaaactagg aagctagccg + 22621 caggttgctc aaaacactgt tttgaggttg cagatggaag ctgacgcggt ttgaagagat + 22681 tttcgaagag tataaacaag taaaactgac taccagttat tatttagaaa tagtattaaa + 22741 aattccttga ctatgtgata tagttgaggg atttttaaat gatattcata ttttttgcaa + 22801 agatgttgtt tgaaaaataa ttttcaaaaa ttctgaaaat tctgttgaca actttctgaa + 22861 aagagtctat aatggagaga aagttttaaa ggagaaaatg atgaaaagtt caaaactatt + 22921 tgcccttgcg ggcgtgacat tattggcggc gactacttta gctgcatgct ctggatcagg + 22981 ttcaagttca agcactaaag gtgagaagac attctcatac atttatgaga cagaccctga + 23041 taacctcaac tatttgacaa ctgctaaggc tgcgacagca aatattacca 
gtaacgtggt + 23101 tgatggtttg ctagaaaatg atcgctacgg gaactttgtg ccgtctatgg ctgaggattg + 23161 gtctgtatcc aaggatggat tgacttacac ttatactatc cgtaaggatg caaaatggta + 23221 tacttctgaa ggtgaagaat acgcggcagt caaagctcaa gactttgtaa caggactaaa + 23281 atatgctgct gataaaaaat cagatgctct ttaccttgtt caagaatcaa tcaaagggtt + 23341 ggatgcctat gtaaaagggg aaatcaaaga tttctcacaa gtaggaatta aggttctgga + 23401 tgaacagaca gttcagtaca ctttgaacaa accagaaagc ttctggaatt ctaagacaac + 23461 catgggtgtg cttgcgccag ttaatgaaga gtttttgaat tcaaaaggag atgattttgc + 23521 caaagctacg gatccaagta gtctcttgta taacggtcct tatttgttga aatccattgt + 23581 gaccaaatcc tctgttgaat ttgcgaaaaa tccgaactac tgggataagg acaatgtgca + 23641 tattgacaaa gttaaattgt cattctggga tggtcaagat accagcaaac ctgcagaaaa + 23701 ctttaaagat ggtagcctta cagcagctcg tctctatcca acaagtgcaa gtttcgcaga + 23761 gcttgagaag agtatgaagg acaatattgt ctatactcaa caagactcta ttacgtatct + 23821 agttggtaca aatattgacc gtcagtccta taaatacaca tctaagacca gcgacgaaca + 23881 aaaggcatcg actaaaaagg ctctcttaaa caaggatttc cgtcaggcta ttgcctttgg + 23941 ttttgatcgt acagcctatg cctctcagtt gaatggacaa actggagcaa gcaaaatctt + 24001 acgtaatatc tttgtgccac caacatttgt tcaagcagat ggtaaaaact ttggcgatat + 24061 ggtcaaagag aaattggtca cttatgggga tgaatggaag gatgttaatc ttgcagattc + 24121 tcaggatggt ctttacaatc cagaaaaagc caaggctgaa tttgctaaag ctaaatcagc + 24181 cttacaagca gaaggtgtga ctttcccaat tcatttggat atgccagttg accagacagc + 24241 aactacaaaa gttcagcgcg tccaatctat gaaacaatcc ttggaagcaa ctttaggagc + 24301 tgataatgtc attattgata tccaacaact acaaaaagac gaagtaaaca atattacata + 24361 ttttgctgaa aatgctgctg gcgaagactg ggatttatca gataatgtcg gttggggtcc + 24421 agactttgcc gatccatcaa cctaccttga tatcatcaaa ccatctgtag gagaaagtac + 24481 taaaacatat ttagggtttg actcagggga agataatgta gctgctaaaa aagtaggtct + 24541 atatgactac gaaaaattgg ttactgaggc tggtgatgag gctacagatg ttgctaaacg + 24601 ctatgataaa tacgctgcag cccaagcttg gttgacagat agtgctttga ttattccaac + 24661 tacatctcgt acagggcgtc caatcttgtc taagatggta ccatttacaa 
taccatttgc + 24721 attgtcagga aataaaggta caagtgaacc aatcttatat aaatacttgg aacttcaaga + 24781 caaggcagtc actgtagatg aataccaaaa agctcaggaa aaatggatga aagaaaaaga + 24841 agagtctaat aaaaaggctc aagaagatct cgcaaaacat gtgaaataa +// + diff --git a/public/res/serotype_genbank/serotype_18X3.gb b/public/res/serotype_genbank/serotype_18X3.gb new file mode 100755 index 0000000..9439f2d --- /dev/null +++ b/public/res/serotype_genbank/serotype_18X3.gb @@ -0,0 +1,1062 @@ +LOCUS MK606433 26930 bp DNA linear BCT 30-SEP-2020 +DEFINITION Streptococcus pneumoniae strain D2310 cps gene cluster, complete + sequence. +ACCESSION MK606433 +VERSION MK606433.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 26930) + AUTHORS van Tonder,A.J., Gladstone,R.A., Lo,S.W., Nahm,M.H., du Plessis,M., + Cornick,J., Kwambana-Adams,B., Madhi,S.A., Hawkins,P.A., + Benisty,R., Dagan,R., Everett,D., Antonio,M., Klugman,K.P., von + Gottberg,A., Breiman,R.F., McGee,L., Bentley,S.D. and The Global + Pneumococcal Sequencing,C.O. + TITLE Putative novel cps loci in a large global collection of pneumococci + JOURNAL Microb Genom 5 (7) (2019) + PUBMED 31184299 +REFERENCE 2 (bases 1 to 26930) + AUTHORS van Tonder,A.J. + TITLE Direct Submission + JOURNAL Submitted (06-MAR-2019) Parasites and Microbes, Wellcome Sanger + Institute, Wellcome Genome Campus, Hinxton, Cambridge CB10 1SA, + United Kingdom +COMMENT ##Assembly-Data-START## + Assembly Method :: Velvet v. 
1.2 + Sequencing Technology :: Illumina + ##Assembly-Data-END## +FEATURES Location/Qualifiers + source 1..26930 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="D2310" + /isolation_source="blood" + /host="Homo sapiens" + /db_xref="taxon:1313" + /geo_loc_name="Malawi" + /collection_date="1999" + misc_feature 1..26930 + /note="cps gene cluster" + gene 1..1611 + /gene="dexB" + CDS 1..1611 + /gene="dexB" + /EC_number="3.2.1.70" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3280" + /inference="protein motif:CLUSTERS:PRK10933" + /inference="protein motif:Pfam:PF00128.18" + /inference="protein motif:TIGRFAMs:TIGR02403" + /inference="similar to AA sequence:RefSeq:YP_004326655.1" + /inference="similar to AA sequence:UniProtKB:Q99040" + /note="trehalose-6-phosphate hydrolase; maltooligosyl + trehalose synthase; alpha,alpha-phosphotrehalase; alpha + amylase catalytic domain protein" + /codon_start=1 + /transl_table=11 + /product="glucan 1,6-alpha-glucosidase" + /protein_id="QCO91960.1" + /translation="MQEKWWHNAVVYQVYPKSFMDSNEDGIGDLPGITSKLDYLAKLG + ITAIWLSPVYDSPMDDNGYDIADYQAIAAIFGTMEDMDQLIAEAKKRDIRIIMDLVVN + HTSDEHAWFVEACENPNSPERDYYIWRDEPNDLDSIFSGSAWEYDEKSGQYYLHFFSK + KQPDLNWENEKLRQKIYEMMNFWIDKGIGGFRMDVIDMIGKIPDEKVVNNGPMLHPYL + KEMNQATFGAKDLLTVGETWGATPEIAKLYSDPKGQELSMVFQFEHIGLQYQEGQPKW + HYQKELNIAKLKEIFNKWQTELGVEDGWNSLFWNNHDLPRIVSIWGNDQEYREKSAKA + FAILLHLMRGTPYIYQGEEIGMTNYPFETLDQVEDIESLNYAREALEKGVPIEEIMDS + IRVIGRDNARTPMQWDESKNAGFSTGQPWLAVNPNYKMINVQEALANPDSIFYTYQKL + VQIRKENSWLIRADFELLDTADKVFAYIRKDGDRRFLVVANLSNEEQDLTVEGKVKSV + LIENTAAKEVLEKQVLAPWDAFCVEMTD" + CDS complement(2060..3457) + /gene="tnp" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3415" + /inference="protein motif:Pfam:PF00665.20" + /inference="similar to AA sequence:RefSeq:YP_006065738.1" + /note="integrase core domain protein" + /codon_start=1 + /transl_table=11 + /product="IS1202 transposase" + 
/protein_id="QCO91961.1" + /translation="MNETKKYLVIKAIAQGKKTKKRACVELNLSERQINRLLLAYQQK + GKEAFRHGNRNRKPKHAIPDEIKERVLKKYLSYETYKPNVLHFCELLAEEEGIKLSDT + TVRKILYKKNILSPKSHRKTKKRVRKQAKLNLNQPLDNPILPTAKDFLENPKKVHPSR + PRKKFAGELIQMDASPHAWFGPETTNLHLAIDDASGNILGAYFDKQETLNAYYHVLEQ + ILANHGIPLQMKTDKRTVFTYQASNSKKMEDDTYTQFGYACHQLGILLETTSIPQAKG + RVERLNQTLQSRLPIELERNKIHTLEEANTFLLSYIQTFNEQFGNKTKLSVFEEAPNL + SERNLILARLAERVVDSGHHIRFQNRYYIPTEQGKEVYFIRKTKALVLKAFDGDIYLN + IADKIYHTKELLDYELYSKNFEQEPEQKKERRKYIPPQTHPWKLTSFKQYLHKNKKDY + EEFTSEELHSPQLQV" + gene 3608..5053 + /gene="wzg" + CDS 3608..5053 + /gene="wzg" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK09379" + /inference="protein motif:Pfam:PF03816.8" + /inference="protein motif:TIGRFAMs:TIGR00350" + /inference="similar to AA sequence:RefSeq:YP_001835063.1" + /inference="similar to AA sequence:UniProtKB:Q7WY78" + /note="putative transcriptional regulator ywtF; + membrane-bound transcriptional regulator LytR; cell + envelope-related function transcriptional attenuator + common domain; cell envelope-related transcriptional + attenuator domain protein" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Cps14A" + /protein_id="QCO91962.1" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSVSFAVLADSEIEDVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSTLHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIIDSLQDSIQTNMPLETMINLVNAQLESGGSYKVNSQDLKGTGRTDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + gene 5055..5786 + /gene="wzh" + CDS 5055..5786 + /gene="wzh" + /EC_number="3.1.3.48" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG4464" + /inference="protein 
motif:Pfam:PF02811.13" + /inference="similar to AA sequence:RefSeq:YP_003878593.1" + /inference="similar to AA sequence:UniProtKB:Q9AHD4" + /note="capsular polysaccharide biosynthesis protein; PHP + domain protein" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein phosphatase wzh" + /protein_id="QCO91963.1" + /translation="MIDIHSHIVFDVDDGPKSIEDSKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREMAKEVASDLVIAYGAEIYYTPDVLEKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEQDLVHVIASDMHNLDGRPPHMAEAYGLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + gene 5792..6487 + /gene="wzd" + CDS 5792..6487 + /gene="wzd" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3944" + /inference="protein motif:Pfam:PF02706.9" + /inference="protein motif:TIGRFAMs:TIGR01006" + /inference="similar to AA sequence:RefSeq:NP_344881.1" + /inference="similar to AA sequence:UniProtKB:P72367" + /note="capsular polysaccharide type 8 biosynthesis protein + cap8A; capsular polysaccharide biosynthesis protein; MPA1 + family polysaccharide export protein; chain length + determinant protein" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + wzd" + /protein_id="QCO91964.1" + /translation="MMKEQNTIEIDVFQLFKTLWKRKLMILIVALVTGAGAFAYSAFI + VKPEYTSTTRIYVVNRNQGDKPGLTNQDLQAGSYLVKDYREIILSQDVLEEVISDLKL + DLTPKGLANKIKVTVPVDTRIVSISVNNRVPEEASRIANSLREVAAQKIISITRVSDV + TTLEEARPAISPSSPNIKRNTLIGFLAGGIGTGVIVLLLELLDTHVKRPEDIEDTLQM + PLLGVVPNFNKLK" + gene 6497..7180 + /gene="wze" + CDS 6497..7180 + /gene="wze" + /EC_number="2.7.10.2" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3944" + /inference="protein motif:CLUSTERS:PRK11519" + /inference="protein motif:Pfam:PF01656.17" + /inference="protein motif:TIGRFAMs:TIGR01007" + /inference="similar to AA sequence:RefSeq:YP_001835066.1" + /inference="similar to AA sequence:UniProtKB:Q54520" + /note="tyrosine-protein 
kinase CpsD; tyrosine kinase; + capsular polysaccharide biosynthesis protein; capsular + exopolysaccharide family protein; CobQ/CobB/MinD/ParA + nucleotide binding domain" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Cps14D" + /protein_id="QCO91965.1" + /translation="MPTLEIAQKKMEFIKKAEEYYNALCTNIQLSGDKLKVISITSVN + AGEGKTTTSVNIARSFARAGYKTLLIDGDTRNSVMSGVFKSREKITGLTEFLSGTADL + SHGLCDTNIENLFVVQSGSVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTPPIGIVI + DAAIITQKCDASILITATGEVNKRDVQKAKQQLEQTGKLFLGVVLNKLDISVDKYGAY + GSYGNYGKK" + gene 7196..8563 + /gene="wchA" + CDS 7196..8563 + /gene="wchA" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK15204" + /inference="protein motif:Pfam:PF02397.10" + /inference="protein motif:TIGRFAMs:TIGR03025" + /inference="similar to AA sequence:RefSeq:YP_001835067.1" + /inference="similar to AA sequence:UniProtKB:P71241" + /note="putative colanic biosynthesis UDP-glucose lipid + carrier transferase; undecaprenyl-phosphate galactose + phosphotransferase; exopolysaccharide biosynthesis + polyprenyl glycosylphosphotransferase; Bacterial sugar + transferase" + /codon_start=1 + /transl_table=11 + /product="glucosyl-1-phosphate transferase" + /protein_id="QCO91966.1" + /translation="MDEKGLKIFLAVLQSIIVILLIYFLSFVRETELERSSMVILYLL + HFFAFYFSSYGNNFFKRGYLVEFNSTIRYIFFFAIAISILNFFIAERFSISRRGMVYF + LTLEGISLYLLNFLVKKYWKHVFFNLKNSKKILLLTVTKNMEKVLDKLLESDELSWKL + VAVSVLDKSDFQHDKIPVIEKEKIIEFATHEVVDEVFVNLPGESYDIGEIISRFETMG + IDVTVNLKAFDKDFGRNKQIHEMVGLDVVTFSTNFYKTSHVISKRILDICGATIGLIL + FAIASLVLVPLIRKDGGPAIFAQTRIGKNGRHFTFYKFRSMRIDAEAIKEQLMDQNTM + QGGMFKIDNDPRVTKIGRFIRKTSLDELPQFWNVFIGDMSLVGTRPPTVDEYDQYTPE + QKRRLSFKPGITGLWQISGRSKITDFDDVVKLDVAYIDNWTIWKDIEILLKTVKVVFM + RDGAK" + gene 8594..9766 + /gene="wchF" + CDS 8594..9766 + /gene="wchF" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF09314.5" + /inference="similar to AA sequence:RefSeq:YP_002510379.1" + 
/note="PEP-CTERM/EpsH1 system-associated sugar + transferase; DUF1972 protein" + /codon_start=1 + /transl_table=11 + /product="rhamnosyltransferase WchF" + /protein_id="QCO91967.1" + /translation="MKKSVYIIGSKGIPAKYGGFETFVEKLTAFQQDKAIQYYVACMR + ENSAKSGTTEDVFEHNGAICYNVDVSNIGPARAIAYDIAAINRAIEIAKENKDEAPIF + YILACRIGPFIHGIKKKIQAIGGTLLVNPDGHEWLRAKWSAPVRRYWKISEGLMVKHA + DLLVCDSKNIEKYIQEDYIQYQPKTTYIAYGTDTTRSTLNSGDEKVRAWFKEKNVSEN + EYYLVVGRFVPENNYESMIRGFLASSSKKDFVLITNVEQNKFYNQLLASTGFDKDPRV + KFVGTVYDQELLKYIRENAFAYFHGHEVGGTNPSLLEALAFTKLNLLLDVGFNREVGE + QSAIYWKKDELSQVIEKVEQFDAKMIDELDRQSNQRIADYFTWEKIVTDYEKLFKK" + gene 9763..11034 + /gene="wciU" + CDS 9763..11034 + /gene="wciU" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK15484" + /inference="protein motif:Pfam:PF00534.14" + /note="glycosyl transferase group 1 protein" + /codon_start=1 + /transl_table=11 + /product="lipopolysaccharide + 1,2-N-acetylglucosaminetransferase" + /protein_id="QCO91968.1" + /translation="MKILHYTLGFQPQRTGGLVKYAEDLMIEQIAQGYQVAALYPGRI + KFFSKKIEIIKATSRQFECYELLNSLPMALFGGISDPTAFLTPCDKNVYRTFLEKVQP + DIIHIHSFMGLHKEFLEIAKNLNIRVVFTSHDYYGLAPVPYFYFNGVDYSDKNTNLTW + NIMSSNALSVKKLRLFQVSFYPTIRKLLKLLGKNPKSKKNLVIRDVIEEQDYSELRYY + YNEMFHLIDGYLFNSRLAKKVYEINEIKSANSIVLSITNSSINHHQRLTTTNNKIRVV + YIGPDEEYKGYFDFVDFAETLDRESYEVATYGHLPNEECPSFIEQKGYFTKEMIDSVY + ENIDILIVPSKWKETFGLITVEALSYGVNVFVSENVGSKDLLPETHVFKNQNDLVVKI + IENDIENTKLKTIDEHSKEVIQYYERVINDS" + gene 11024..11710 + /gene="epsH" + CDS 11024..11710 + /gene="epsH" + /EC_number="2.3.1.-" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG0110" + /inference="protein motif:CLUSTERS:PRK09677" + /inference="protein motif:Pfam:PF00132.18" + /inference="protein motif:TIGRFAMs:TIGR03308" + /inference="similar to AA sequence:RefSeq:YP_141472.1" + /inference="similar to AA sequence:UniProtKB:Q7A3E8" + /note="putative acetyltransferase SA2342; putative + lipopolysaccharide biosynthesis O-acetyl transferase 
WbbJ; + isoleucine patch superfamily acetyltransferase; + phosphonate metabolim protein, transferase hexapeptide + repeat family protein; Bacterial transferase hexapeptide + (six repeats)" + /codon_start=1 + /transl_table=11 + /product="exopolysaccharide biosynthesis + acetyltransferase" + /protein_id="QCO91969.1" + /translation="MIVESLIKKITGKAVDIHPDVSMAYILQRGMNYGFGLFRGFVRG + IGFGQKGKRLFIGQGVSILAKRKLFVGKNVRIGKNVSIDALSKEGIHFADNVKIGDYS + QIIGTGTIKNMGIGLKVGKNSSFSEYSLFGSAGGITIGDNVIAGQNVRFHAENHNYSD + LDKLILEQGISRKGISVGHNCWIGAGAVFLDGSSIGSGCVVGANAVVTKQFPDNVIIG + GVPARILAYR" + gene 11742..12788 + /gene="cpsJ" + CDS 11742..12788 + /gene="cpsJ" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3858" + /inference="protein motif:CLUSTERS:PRK10073" + /inference="protein motif:Pfam:PF00535.20" + /inference="protein motif:TIGRFAMs:TIGR03937" + /inference="similar to AA sequence:RefSeq:YP_006033775.1" + /inference="similar to AA sequence:UniProtKB:Q8L0V4" + /note="hyaluronan synthase; putative glycosyl transferase; + putative glycosyl hydrolase; poly-beta-1,6 + N-acetyl-D-glucosamine synthase; Glycosyl transferase + family 2" + /codon_start=1 + /transl_table=11 + /product="family 2 glycosyl transferase" + /protein_id="QCO91970.1" + /translation="MPTFSVVVPVYNVENYLSQCLNALVNQSFKDFELILVNDGSTDT + SGSLCEEWGKKDHRIKVIHKTNEGLGFARNTGIENCTGDYIVFVDSDDYVSYEMLEIY + DTYLQRFNADVIYSENFYRVDNKGNIIEPLDQSLDSIFYKNDSIFTELLPDVISSPPE + FIGDGKIGVSVWKGVYKRSLFKDKGLLFHSEREFISEDAIFQIDCLKLATSALVIPDI + LYYYRENFGSLSMKYKEDRFELNKILYNEQLKRVEGLPNQEILEERIERILIANIRLC + IFQESLYKSSRIHKRLQRIRQICKDPISKSVLRHYPIRRLPFSKRLICVLAKYNMPLL + LLVLTLLKYRNRSV" + gene 12800..13705 + /gene="wchN" + CDS 12800..13705 + /gene="wchN" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3774" + /inference="protein motif:Pfam:PF05704.6" + /inference="similar to AA sequence:RefSeq:YP_001835073.1" + /note="mannosyltransferase OCH1-related enzyme" + /codon_start=1 + 
/transl_table=11 + /product="capsular polysaccharide synthesis protein" + /protein_id="QCO91971.1" + /translation="MNIEKLKLSLKNGTFFSVVIHALRNRWPLWWIGNKAIREVQLED + RAYRILKKKYGSLISSSFDKSYLSEEVPKQIWICWLQGMENAPELVKSCYRSLKKQFP + EYVITVISSENISEYVEIPDIIYKKWGNGVIGNAHFSDILRVELLRKFGGIWIDSTVY + CTGITTIETIEKNPFFMYKSLSSVEERISSSNWMIASVPNHPFMITMSTLLQSYWSKE + VIAIHYYLFHILFTIMIESLPELWQLVPTYTNATPHIMADELNNIFSKERYQQLCQIS + DFHKLNYKKNYNDQSESLYSHLLNQ" + gene 13717..15174 + /gene="wzx" + CDS 13717..15174 + /gene="wzx" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF01943.11" + /inference="similar to AA sequence:RefSeq:YP_001835074.1" + /inference="similar to AA sequence:UniProtKB:P37746" + /note="putative O-antigen transporter; polysaccharide + biosynthesis protein" + /codon_start=1 + /transl_table=11 + /product="transporter" + /protein_id="QCO91972.1" + /translation="MPNLKKNIVYNVLYQILAVIVPFITSPYLARVLGAEQIGVYSFT + YSIAFYFMILSMLGISNYGNRTMAQVRTSREHLNQEFSNIYAVQLTCSLVMTVSYLIY + ATVFVNSFQIVAYIQVLHVLSYATDVSWFFYGLEEFRITVARNSFVKLLTLISIFTFV + KSPNDIYLYTFIMAGSTLLGQLITWPFLLKQVNFVRPSLGKIKKHMKPIIILFFPVLA + ISIFSFIDKIMLGMYSSLKETAFYENSDKIISIPKALIQAFGAVMLPRTVHLLSIGDE + QKSLEYVDKTMWVVLVITMGCAFGLAGVSATFAPVYWGEEFRTSSQIIAGMTPALVFS + AFGNVIRTQFLIPRSFDKEYTVSLLYGAVVNILINILLIPKIGAMGAVIGIIVAELVL + CCYQTWIARNYLHIREYLINAGILFLIGSVMYMVLILISSILPTSLLTLIIEIIVGAF + IYISLLILYIFSSKNRVIIGLRTNFLEHTHLFKRK" + gene 15177..16451 + /gene="wzy" + CDS 15177..16451 + /gene="wzy" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF04932.9" + /codon_start=1 + /transl_table=11 + /product="O-antigen ligase" + /protein_id="QCO91973.1" + /translation="MKFKFNPIAILYILLVYLELATDRQHLYPVTYMTKYYIGILIIV + LFVLLLVGRGKLIFVNKKLLYLAKILAIPTIVLFLYSVLLDVMNPVEFNGYFSRLSST + TIFGLLAIFQAIVVFQFFGQKVVDYTFTAISLSYLTSIIVAFRQGGLSQFILILTDDS + FNGSVLEMHEVAPITALFILYYLYKYFIKENSFSSVFHNILIALIILFLSLKRIVFLS + VLIIIPVFLVIYWYDKKVSKLGKERKILSLLNIFSLIFITGIFLYVYSVKSDFIYTFI + 
QEHNINSMARTDLWKGVESTYNFAPIFMGRGIGFVTKWMDNNWMTLNINGLTGSMGIH + NDILKYYIEIGFVGLFIYFYTLLYRNAKRIFVKIGHKESFIYFVLIMFQMLIWFTDNI + SIYHNFLWILNLLLFSLTNSDTELENLDFKNF" + CDS 16505..17506 + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3274" + /inference="protein motif:Pfam:PF01757.16" + /inference="similar to AA sequence:RefSeq:YP_001036126.1" + /note="acyltransferase family protein" + /codon_start=1 + /transl_table=11 + /product="transmembrane protein" + /protein_id="QCO91974.1" + /translation="MKTDARTKKRENETLYILKVWATFSVIAIHFGFLGQIGVFYKVL + ARFAVPLFFMISGFYSFSISEEKLKKRIKNLSLLIISSTSFYFLLDVFLQLTQGNLRV + VFERFTFNNIFNFLVFNQISALIGSLATPLWFLYALLYVYIYLFFSNKKWIFNTILTV + IILCCSFIIELKANSALFYRNFLFMGVPFFSFGMYFAQIQRKIINYKHFKELFIIGIM + ISGFLTLFEYTFLGANFELYISSVIISCMLMVFSIKYPQLWTLDFAVNIAKKNATFIY + ISHQFVILLFKTYVRDGIAYKIGTFLIFLACVIMSIIFNYIVDIISRCCIKEKQDII" + gene 17503..18663 + /gene="wchX" + CDS 17503..18663 + /gene="wchX" + /EC_number="2.7.8.12" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF04464.8" + /inference="similar to AA sequence:RefSeq:YP_002510384.1" + /inference="similar to AA sequence:UniProtKB:P13485" + /note="CDP-glycerol:poly(glycerophosphate) + glycerophosphotransferase" + /codon_start=1 + /transl_table=11 + /product="glycerol phosphotransferase WchX" + /protein_id="QCO91975.1" + /translation="MKFYIKNLLKKVFTLPLHLLPIQSNKIIFDNFGGRGFGDNPKYI + LEELVSREKNLDLVWVTKDREISIPEGVRVVKYGSYRSFYEWLTARVWVDNIRNSDRP + WKRKGQIYLQTWHGSDGVKLIEKSVARNLKKTYLRMAKYDGKITDGIVSSRHFQTLGM + QNNFWLTENVEFLEFGLPRNDDFFKSEKIKTTNIKFRTLFDIDLDELVVLYMPTFRDD + GSLNAYNLDYSKLIHVFQNKFRKNVKILVRFHPNVDSSFINLQDTDCINVSTYSNPQD + LMMSADVMITDYSSASIDFMLLNRPVFLYLPDYQSYVNDRPLDDNFDKLPFPRAYHNN + ELTEIIRDFERSKYDEKVRLYELEDVRFDRGKASVQCANWIEEKIKNNKVID" + gene 18705..19097 + /gene="gct" + CDS 18705..19097 + /gene="gct" + /EC_number="2.7.7.39" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG0615" + /inference="protein 
motif:CLUSTERS:PRK11316" + /inference="protein motif:Pfam:PF01467.1" + /inference="protein motif:TIGRFAMs:TIGR01518" + /inference="similar to AA sequence:RefSeq:YP_003875983.1" + /inference="similar to AA sequence:UniProtKB:P27623" + /note="glycerol-3-phosphate cytidylyltransferase; + bifunctional heptose 7-phosphate kinase/heptose + 1-phosphate adenyltransferase; cytidylyltransferase" + /codon_start=1 + /transl_table=11 + /product="CDP-glycerol-1-phosphate biosynthetic protein + Gct" + /protein_id="QCO91976.1" + /translation="MKRVITYGTFDLLHYGHINLLKRAKQLGDYLIVVVSSDEFNLKE + KNKVCYFNYEHRKNLVEAIRYVDLVIPETSWEQKKSDVKKYHIDTFVMGDDWKGKFDY + LEEEGVEVVYLPRTKEISTTKIKEDLSE" + CDS 19195..19308 + /inference="ab initio prediction:Prodigal:2.60" + /inference="similar to AA sequence:RefSeq:YP_006742607.1" + /codon_start=1 + /transl_table=11 + /product="heme-based aerotactic transducer" + /protein_id="QCO91977.1" + /translation="MAVIFKDVLVEEKTDEEKQHILSILNDENVRAFDCGY" + gene 19943..20812 + /gene="rmlA" + CDS 19943..20812 + /gene="rmlA" + /EC_number="2.7.7.24" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG4750" + /inference="protein motif:CLUSTERS:PRK15480" + /inference="protein motif:Pfam:PF00483.17" + /inference="protein motif:TIGRFAMs:TIGR01207" + /inference="similar to AA sequence:RefSeq:YP_815843.1" + /inference="similar to AA sequence:UniProtKB:P26393" + /note="glucose-1-phosphate thymidylyltransferase RfbA; + CTP:phosphocholine cytidylyltransferase; nucleotidyl + transferase" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase" + /protein_id="QCO91978.1" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLHRFQELLQDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFISDDSV + ALILGDNIYHGSGLSKMLQKAASKESGATVFGYHVKDPERFGVVEFDQDMKAISIEEK + PEQPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLALAQPLKKN + EYGQYLLRLIGEA" + gene 20813..21406 + 
/gene="rmlC" + CDS 20813..21406 + /gene="rmlC" + /EC_number="5.1.3.13" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF00908.11" + /inference="protein motif:TIGRFAMs:TIGR01221" + /inference="similar to AA sequence:RefSeq:YP_003878604.1" + /inference="similar to AA sequence:UniProtKB:Q5XCG7" + /note="putative dTDP-4-dehydrorhamnose 3,5-epimerase" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-dehydrorhamnose 3,5-epimerase" + /protein_id="QCO91979.1" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKHHPLLKDVKPLKKEDL" + gene 21419..22468 + /gene="rmlB" + CDS 21419..22468 + /gene="rmlB" + /EC_number="4.2.1.46" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK10084" + /inference="protein motif:Pfam:PF01370.15" + /inference="protein motif:TIGRFAMs:TIGR01181" + /inference="similar to AA sequence:RefSeq:YP_006742612.1" + /inference="similar to AA sequence:UniProtKB:P95780" + /note="dTDP-glucose 4,6 dehydratase; NAD-dependent + epimerase/dehydratase family protein" + /codon_start=1 + /transl_table=11 + /product="dTDP-glucose 4,6-dehydratase" + /protein_id="QCO91980.1" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPGVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQATD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + gene 22534..23385 + /gene="rmlD" + CDS 22534..23385 + /gene="rmlD" + /EC_number="1.1.1.133" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK09987" + /inference="protein motif:Pfam:PF04321.11" + /inference="protein motif:TIGRFAMs:TIGR01214" + 
/inference="similar to AA sequence:RefSeq:YP_141831.1" + /inference="similar to AA sequence:UniProtKB:P29781" + /note="dTDP-4-dehydrorhamnose reductase; RmlD + substrate-binding domain protein" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase" + /protein_id="QCO91981.1" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITNEEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + gene 23470..23895 + /gene="tnp" + CDS 23470..23895 + /gene="tnp" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3436" + /inference="protein motif:Pfam:PF03050.8" + /inference="similar to AA sequence:RefSeq:YP_002037044.1" + /note="transposase IS66 Orf2-like protein" + /codon_start=1 + /transl_table=11 + /product="IS66-Spn1 transposase" + /protein_id="QCO91982.1" + /translation="MLVSLAHSFGSVSIIAHTIHQKFNLKVPNYRQEEDWARMGLPIT + RKEISNWHIKASQYYLESLYNLLREKLLEQPLLHADETSYRVLGSDSHLTYYWTFLSG + KAENQAITLYHHDQRRSGSVVQEFLGDYSGYVHCDMLRQ" + gene 23968..24225 + /gene="tnp" + CDS 23968..24225 + /gene="tnp" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3436" + /inference="protein motif:Pfam:PF03050.8" + /inference="similar to AA sequence:RefSeq:YP_003878608.1" + /note="transposase IS66 family protein" + /codon_start=1 + /transl_table=11 + /product="transposase" + /protein_id="QCO91983.1" + /translation="MVNCEPLEAYRQLEEAELVGCWAHVRRKFFEATPKQADKSSLGA + KGLAYCDQLFSLERDWEALPADERLQKRQEELQPLMEDFFA" + gene 23968..24225 + /gene="tnp" + CDS 24488..24646 + /gene="tnp" + /inference="ab initio prediction:Prodigal:2.60" + /inference="similar to AA sequence:RefSeq:YP_003878609.1" + /codon_start=1 + /transl_table=11 + /product="transposase" + /protein_id="QCO91984.1" + 
/translation="MSLLETAKRHQLNSEKYLFYLLECLSNEETLVNKEVLEAYLPWT + KVVQEKCK" + gene 24948..26930 + /gene="aliA" + CDS 24948..26930 + /gene="aliA" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG4166" + /inference="protein motif:CLUSTERS:PRK15104" + /inference="protein motif:Pfam:PF00496.16" + /inference="protein motif:TIGRFAMs:TIGR02294" + /inference="similar to AA sequence:RefSeq:YP_001835080.1" + /inference="similar to AA sequence:UniProtKB:P31306" + /note="76 kDa cell surface lipoprotein; oligopeptide ABC + transporter substrate-binding protein OppA; ABC-type + oligopeptide transport system, periplasmic component; + nickel ABC transporter, nickel/metallophore periplasmic + binding protein; Bacterial extracellular solute-binding + proteins, family 5 Middle" + /codon_start=1 + /transl_table=11 + /product="oligopeptide ABC transporter + oligopeptide-binding protein AliA" + /protein_id="QCO91985.1" + /translation="MKSSKLFALAGVTLLAATTLAACSGSGSSTKGEKTFSYIYETDP + DNLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKDA + KWYTSEGEEYAAVKAQDFVTGLKYAADKKSDALYLVQESIKGLDAYVKGEIKDFSQVG + IKALDDQTVQYTLNKPESFWNSKTTMGVLAPVNEEFLNSKGDDFAKATDPSSLLYNGP + YLLKSIVTKSSVEFAKNPNYWDKDNVHIDKVKLSFWDGQDTSKPAENFKDGSLTAARL + YPTSASFAELEKSMKDNIVYTQQDSITYLVGTNIDRQSYKYTSKTSDEQKASTKKALL + NKDFRQAIAFGFDRTAYASQLNGQTGASKILRNIFVPPTFVQADGKNFGDMVKEKLVT + YGDEWKDVNLADSQDGLYNPEKAKAEFAKAKSALQAEGVTFPIHLDMPVDQTATTKVQ + RVQSMKQSLEATLGADNVVIDIQQLQKDEVNNITYFAENAAGEDWDLSDNVGWGPDFA + DPSTYLDIIKPSVGESTKTYLGFDSGEDNVAAKKVGLYDYEKLVTEAGDETTDVAKRY + DKYAAAQAWLTDSALIIPTTSRTGRPILSKMVPFTIPFALSGNKGTSEPVLYKYLELQ + DKAVTVDEYQKAQEKWMKEKEESNKKAQEDLAKHVK" +ORIGIN + 1 atgcaagaaa aatggtggca taatgccgta gtctatcaag tctatccaaa gagttttatg + 61 gatagtaatg aagatggaat tggcgatttg ccaggtatta ccagtaagtt ggactatcta + 121 gccaagctag gaatcacagc gatttggctt tctcccgttt atgacagccc tatggatgat + 181 aatggctatg atattgctga ttatcaagcg attgcggcta tttttggaac catggaggat + 241 atggatcagc tgattgcaga agctaagaag cgtgatatcc 
gtatcatcat ggacttggtg + 301 gtcaatcata cctcggatga gcatgcctgg tttgtagagg cctgtgaaaa tcctaatagc + 361 cctgagcgag actactatat ctggcgggat gagcctaacg atttagattc tatctttagt + 421 gggtctgctt gggaatacga tgaaaagtca ggtcaatact atctccactt tttcagcaag + 481 aaacagccgg atctcaactg ggaaaatgaa aaacttcgcc agaaaattta tgagatgatg + 541 aacttctgga ttgataaagg tattggtggt ttccgtatgg atgttattga catgattggc + 601 aaaattcctg acgagaaggt agtcaataat ggtcctatgc tccatcccta tctcaaggaa + 661 atgaatcagg cgacctttgg agctaaggat ctcttgacag taggggagac ttggggagca + 721 acgccagaga ttgccaagct ctactctgat ccaaaggggc aagaattgtc tatggtcttc + 781 cagtttgaac atatcggtct tcagtatcag gaaggtcagc ctaaatggca ctatcaaaaa + 841 gagctgaata tcgctaagtt aaaagaaatc ttcaacaaat ggcagacaga gttaggagtt + 901 gaggacggct ggaattccct cttctggaac aaccatgacc tccctcgtat tgtctcaatc + 961 tggggaaatg accaagaata ccgcgaaaaa tctgccaaag cctttgcaat cttacttcat + 1021 ctcatgagag gaactcctta tatctaccaa ggtgaggaga ttgggatgac caactatccg + 1081 tttgaaacac tggatcaagt agaagatatt gaatctctca actatgcgcg tgaggctctt + 1141 gaaaaaggtg ttccgattga agaaatcatg gacagtatcc gtgttattgg acgtgacaat + 1201 gcccgtaccc ctatgcaatg ggacgagagc aaaaacgctg gtttctcaac aggtcaaccc + 1261 tggttggcgg ttaatccaaa ttacaagatg atcaatgtcc aagaagcgct ggcaaatcca + 1321 gattctattt tctataccta tcagaaactg gtccaaattc gcaaggagaa tagctggcta + 1381 attcgagctg actttgaatt gcttgatacg gctgataagg tatttgctta tatacgtaag + 1441 gatggcgacc gtcgcttcct agttgtggct aacttgtcca atgaagagca agacttgaca + 1501 gtagaaggaa aagtcaaatc tgtcttgatt gaaaacactg cggctaaaga agtacttgaa + 1561 aaacaggtct tggctccatg ggatgctttc tgtgtggaaa tgactgacta gaatgagcaa + 1621 acctcaagtt tttgaagctt gaggtttttt actatagtgg attgaaacta gaatagtgca + 1681 cctctacttc taaaacattg ttagaaatcg atttgtcctg ttcttatttc attttactat + 1741 atttttgttt cgcgggaagt ctactaagat atttaaagat gcagatagta aaaaaagatg + 1801 tgtcaatcga aagtgattat gtcccccaaa aatggagagt ttgagggcaa ttattttgat + 1861 ttcatttgac acgaggaatc cttgaagctg ttttgtcagc taaaccaagg ctagtcttag + 1921 ccttggctct 
ccagcctaac agctccaagc ctcttatcaa atgaaatgct tgtcttacac + 1981 tcctcacttt ctctctccta aatgtaaggg atagagtgac ttcctttaag gaaaagcttc + 2041 ccatttagcg agaaatagat tatacttgta gttgaggaga atgaagctcc tcactagtaa + 2101 actcttcata atccttttta tttttatgaa ggtattgttt gaaagatgtg agtttccacg + 2161 gatgggtttg tggagggata tacttgcgtc tttctttttt ttgttctggt tcttgttcaa + 2221 agtttttcga atagagttca taatctagta gctcctttgt gtgatagatt ttgtcagcga + 2281 tattgaggta gatgtcacca tcaaatgctt ttagaactaa tgctttcgtc tttctgatga + 2341 aatagacttc ttttccttgt tcggtaggaa tatagtaacg attttggaat cggatatggt + 2401 gtccactatc gacgactctc tccgccagtc tagctagaat gagattccgt tcagagaggt + 2461 taggagcctc ctcaaaaaca gagagttttg tcttgtttcc aaactgttca ttaaaggttt + 2521 ggatgtagga aagaaggaaa gtattggctt cttccaatgt atgaatcttg tttcgttcca + 2581 gttcgatagg caggcgtgat tgtagtgtct gattgagtct ttcgaccctc cctttagctt + 2641 gagggataga ggtggtctca aggagaatcc ctagttggtg acaggcgtat ccaaattgtg + 2701 tataggtgtc gtcctccatt ttcttagagt tggatgcttg ataggtaaag accgttctct + 2761 tatcagtttt catttgaagg ggaatgccgt gattggctaa gatttgttcg aggacatggt + 2821 agtaggcatt caaggtctct tgtttgtcaa aataagcgcc taggatattg ccggaagcat + 2881 catcaatggc taagtgtaag ttggtggttt ctggtccaaa ccaggcatga gggctggcat + 2941 ccatttgaat gagttctcca gcaaatttct ttctgggtct actaggatgt acctttttag + 3001 ggttttccag gaagtcttta gccgtcggta agattggatt gtctaggggt tgattcaggt + 3061 tcagtttagc ttgttttctt actctcttct ttgtctttct gtgagactta ggagaaagga + 3121 tgtttttctt atagagtatt tttctaacag ttgtatcaga gagcttaatt ccctcttctt + 3181 cagctagtaa ttcacagaaa tgaaggacat ttggtttata tgtttcatag gagaggtatt + 3241 tctttaggac acgttctttg atttcatcag ggattgcatg ttttggtttt ctatttctgt + 3301 ttccgtgtct gaaggcttct tttcctttct gttgataggc tagtagcaga cgattgattt + 3361 gtctttcaga aagattgagt tcgacacagg cccgtttctt tgttttcttt ccttgggcta + 3421 tagcttttat tacaagatat tttttcgttt cattcatatt cagttggatc cttttcatat + 3481 gactattcta tcaaatggga cattatcaca ttcgaattac aaaaagatgc ggatagtaaa + 3541 aaaaggtgta gacattaccg taaaaaagtg 
atataattgt acgatgttca atgtataggt + 3601 gttaatcatg agtagacgtt ttaaaaaatc acgttcacag aaagtgaagc gaagtgttaa + 3661 tatagttttg ttgactattt atttattgtt agtttgtttt ttattgttct taatctttaa + 3721 gtacaatatc cttgctttta gatatcttaa tctagtggta actgcgttag tcctactagt + 3781 tgccttggta gggctactcc tgattatcta taaaaaagct gaaaaattta ctatttttct + 3841 gttggtgttc tctatccttg tcagctctgt gtcgctcttt gcagtacagc agtttgttgg + 3901 actgaccaat cgtttaaatg cgacttctaa ttactcagaa tattcggtca gtttcgctgt + 3961 tttagcagat agtgagatcg aagatgttac gcaactgacg agtgtgacag caccgactgg + 4021 gactgataat gaaaatattc aaaaactact agctgatatc aagtcaagtc agaataccga + 4081 tttgacggtc aaccagagtt cgtcttactt ggcagcttac aagagtttga ttgcagggga + 4141 gactaaggcc attgtcctaa atagtgtctt tgaaaatatc atcgagtcag agtatccaga + 4201 ctacgcatcg aagataaaaa agatttatac caagggattc actaaaaaag tagaagctcc + 4261 taagacgtct aagaatcagt ctttcaatat ctatgttagt ggaattgaca cctatggtcc + 4321 tattagttcg gtgtcgcgat cagatgtcaa tatcctgatg actgtcaatc gagataccaa + 4381 gaaaatcctc ttgaccacaa caccacgtga tgcctatgta ccaatcgcag atggtggaaa + 4441 taatcaaaaa gataaattaa cccatgcggg tatttatgga gttgattcgt ccattcacac + 4501 cttagaaaat ctttatggag tggatatcaa ttactatgtg cgattgaact tcacttcttt + 4561 cttgaaaatg attgacttat tgggaggggt agatgttcat aatgatcaag agttttcaac + 4621 tctacatggg aagttccatt tcccagtagg gaatgttcat ctagactctg agcaggctct + 4681 aggttttgta cgtgaacgct actcactagc cgatggagac cgtgaccgtg gtcgcaacca + 4741 acaaaaggtc attgtggcta tccttcaaaa attaacgtca accgaagcac tgaaaaatta + 4801 tagtacgatc attgatagct tgcaagattc tatccaaaca aatatgccac ttgagactat + 4861 gataaatttg gtcaatgctc agttagaaag tggagggagt tataaagtaa attctcaaga + 4921 tttaaaaggt acaggtcgga cggatcttcc ttcttatgca atgccagaca gtaacctcta + 4981 tgtgatggaa atagatgata gtagtttagc tgtagttaaa gcagctatac aggatgtgat + 5041 ggagggtaga tgaaatgata gacatccatt cgcatatcgt ttttgatgta gatgacggtc + 5101 ccaagtcaat agaggatagc aaggctctct tggcagaatc ctacaggcag ggggtgcgaa + 5161 ccattgtctc tacctctcac cgtcgcaagg gcatgtttga aactccggaa 
gagaagatag + 5221 cagaaaactt tcttcaggtt cgggaaatgg ctaaggaagt ggcgagtgac ttggtcattg + 5281 cttacggggc tgaaatttac tacacaccag atgttctgga aaagctggaa aaaaagcgga + 5341 ttccgaccct caatgatagt cgttatgcct tgatagagtt tagtatgaac actccttatc + 5401 gcgatattca tagcgccttg agcaagatct tgatgttggg aattactcca gtcattgccc + 5461 acattgagcg ctatgatgct cttgaaaata atgaaaaacg cgttcgagaa ctaatcgata + 5521 tgggctgtta cacgcaagta aatagttcac atgtcctcaa acccaaactt tttggcgaac + 5581 gttataaatt catgaaaaaa agagctcagt attttttaga gcaggatttg gttcatgtca + 5641 ttgcaagtga tatgcacaat ctagacggta gacctcctca tatggcagaa gcatatggcc + 5701 ttgttaccca aaaatacgga gaagcgaagg ctcaggaact ttttatagac aatcctcgaa + 5761 aaattgtaat ggatcaacta atttaggaga aatgatgaaa gaacaaaaca cgatagaaat + 5821 cgatgtattt caattattta aaaccttgtg gaaacgcaag ctaatgattt taatagtggc + 5881 acttgtgaca ggtgcggggg cttttgcata tagcgctttt attgttaagc cagaatatac + 5941 gagtaccacg cgaatttacg tagtgaatcg caatcaagga gacaagccgg ggctgacaaa + 6001 tcaggatttg caggcaggat cttatctagt aaaagactac cgtgagatta tcctttcgca + 6061 ggatgttttg gaggaagtta tttctgattt gaaactagat ttgacgccaa aaggtttggc + 6121 taataaaatt aaagtaacag taccagttga tacccgtatt gtctctattt cagttaataa + 6181 tcgagttcct gaagaggcaa gccgtatcgc taactctttg agagaagtag ctgctcaaaa + 6241 aattatcagt attactcgtg tttctgatgt gacaacactg gaggaggcaa gaccggcgat + 6301 atccccgtct tcgccaaata ttaaacgcaa tacactaatt ggttttttgg caggggggat + 6361 tggaactggt gttatagttc ttcttcttga acttttggac actcatgtga aacgtccgga + 6421 agatatcgaa gatacactgc agatgccact tttgggagtt gtaccaaact ttaataagtt + 6481 gaaataggag agaggaatgc cgacattaga aatagcacaa aaaaaaatgg agttcattaa + 6541 gaaggcagaa gaatattaca atgccttgtg tacaaatata cagttgagcg gagataaact + 6601 aaaagtaatt tccattactt ctgttaacgc tggggaagga aaaacaacta cttccgtaaa + 6661 tatagcaagg tcgtttgcgc gtgcaggcta taaaactctt ttgatcgatg gcgatactcg + 6721 aaattcagtt atgtcaggag tttttaaatc tcgtgaaaaa attacagggc taacagaatt + 6781 tttatctggg acagctgatt tatctcacgg tttatgtgat acaaatattg aaaatttatt + 6841 tgtagttcaa 
tcgggatctg tatcaccaaa ccctacagcc ttgttacaaa gtaaaaattt + 6901 taatgatatg attgaaacat tgcgtaaata ttttgattat atcattgttg atacaccacc + 6961 tattggaatt gttattgatg cggcaattat cactcaaaag tgtgatgcgt ccatcttgat + 7021 aacagcaaca ggtgaggtga ataaacgtga tgtccaaaaa gcgaaacaac aattagaaca + 7081 aacagggaaa ctgttcctgg gagttgtttt aaataaattg gatatctcgg ttgataagta + 7141 tggagcttac ggttcctatg gaaattatgg taaaaaataa cttagaaaag attttatgga + 7201 tgaaaaagga ttgaaaattt ttctggcagt attgcagagt attattgtca ttttattgat + 7261 ttattttctt agctttgtta gagagacaga acttgaacgt tcttcgatgg ttatactata + 7321 ccttctccac ttttttgcat tttattttag ttcctatggt aacaattttt ttaaaagagg + 7381 gtacctagtt gagtttaata gtactataag atatattttt ttctttgcaa tagctataag + 7441 tatattaaac ttttttatag cggaacggtt tagtatctct agaagaggaa tggtatactt + 7501 cttaacttta gaaggaatat ccttatactt gttgaatttc ttagtaaaaa aatattggaa + 7561 gcatgtgttt tttaatctaa aaaatagcaa gaaaatttta ctgttaacag taacgaaaaa + 7621 tatggaaaaa gttcttgata aattgctaga atctgatgaa ctttcatgga aattggtagc + 7681 agtaagtgtt ttggataaat ctgactttca acatgataaa atacctgtaa ttgaaaagga + 7741 aaaaattatt gaatttgcaa cgcatgaagt tgtggatgag gtgtttgtca atcttccagg + 7801 agagagctac gatattggag aaattatctc taggtttgag acaatgggga tagatgtaac + 7861 tgtaaatctt aaagcatttg ataaggattt tggtcgcaat aaacaaattc atgagatggt + 7921 aggattggat gtagtcactt tctctacaaa tttttataaa actagtcatg tgatttcaaa + 7981 gagaattctc gatatttgtg gtgccactat tggccttatt ctttttgcta tagctagtct + 8041 agttttagtt ccattgattc gtaaagatgg cggaccagct atttttgctc aaactcgtat + 8101 agggaaaaat ggtcgacatt tcacctttta taaattccgt tcgatgcgga tcgatgctga + 8161 agctatcaaa gaacagttga tggatcaaaa tacgatgcaa ggtggtatgt ttaagataga + 8221 caatgatcct cgtgttacaa aaattggtcg ctttattcgt aaaaccagtt tggatgaatt + 8281 gccgcagttt tggaatgtct ttataggaga tatgagtttg gtaggaacac gtccacctac + 8341 agtagacgag tatgatcagt atactccaga acagaaacgt cgactcagct ttaaacctgg + 8401 gattacaggc ttatggcaga ttagtggccg aagtaaaata accgattttg acgatgttgt + 8461 aaaattagat gtggcttata ttgataattg 
gacaatctgg aaagatattg aaattttgct + 8521 taaaactgtt aaagttgtat ttatgagaga tggagcgaag taatttctgt atatccatca + 8581 tattaggaga gaaatgaaaa agtcagttta tatcattggt tcaaaaggaa ttcctgctaa + 8641 gtatggagga tttgaaactt ttgttgaaaa attaacagcc ttccaacaag ataaggctat + 8701 ccaatattat gtggcttgta tgcgtgaaaa ctctgcaaaa tcagggacta ctgaggatgt + 8761 ttttgaacat aatggtgcta tctgttataa cgtcgatgtt tctaatattg gtccagcgcg + 8821 agctatagcg tatgatatcg ctgcaattaa cagagctatt gaaattgcca aagaaaataa + 8881 ggatgaagct ccaatcttct atattttagc ttgtcgaatc ggtccgttca tccatggaat + 8941 taagaaaaaa atccaggcga taggtgggac tcttctagtt aatccagatg gtcacgagtg + 9001 gttacgagct aagtggagcg ctccagttcg tcgttattgg aaaatttccg aaggtcttat + 9061 ggtcaaacat gcagatcttt tagtgtgtga tagtaagaat attgaaaaat atatccaaga + 9121 agattatata cagtatcaac ctaagacaac ctatatcgct tatgggacag atacaacacg + 9181 ctccacatta aatagcggtg atgaaaaagt gcgtgcttgg ttcaaggaga aaaatgtttc + 9241 tgaaaacgag tattacctag ttgtaggacg ttttgttcca gaaaataatt atgagtctat + 9301 gatacgtggt ttcttggcgt ctagctctaa gaaggatttt gtcctaatca caaatgtaga + 9361 acagaataaa ttttataatc agctattagc aagtactgga tttgataaag atccacgagt + 9421 gaaatttgtt ggaacagtct acgaccaaga acttctgaag tatattcgag aaaatgcttt + 9481 tgcttacttc cacggacatg aagttggtgg aacaaatcct tcgttacttg aagcattagc + 9541 attcacaaag ttaaacttac tactcgatgt tggttttaac cgcgaagttg gggagcaaag + 9601 tgcgatctat tggaaaaaag atgagctttc ccaagtaatc gagaaagttg aacaatttga + 9661 tgcaaaaatg attgatgagt tagatagaca atcaaatcag agaattgcgg attatttcac + 9721 ttgggaaaag attgtcacag actacgagaa attatttaaa aaatgaaaat attacattat + 9781 actttaggat ttcaacccca gcgaacaggt ggtttggtta aatatgctga ggatttaatg + 9841 atagagcaaa ttgctcaagg ttatcaagta gctgccctat atccaggaag aattaagttc + 9901 ttttcaaaaa aaatagaaat aattaaagcg acgtcaagac agtttgaatg ttatgaactg + 9961 cttaatagct tacctatggc tttatttgga ggtatatccg atccaactgc tttcctgaca + 10021 ccttgtgaca aaaatgttta tcgtactttt ttagaaaaag tacaacccga cattatacat + 10081 attcactcgt ttatgggatt gcataaagaa ttcctcgaaa ttgctaaaaa 
cttgaatatt + 10141 agagtggttt ttacgagcca tgattattat ggattagcac ccgtacctta tttctatttt + 10201 aatggggtgg attatagtga taaaaataca aacttaacat ggaatattat gtcttccaat + 10261 gctttaagtg tgaaaaaact aagacttttt caggtttcgt tttatcctac tattcgtaaa + 10321 cttttgaaac tattagggaa aaatccaaaa tctaaaaaga atttagttat tcgagatgtt + 10381 attgaggagc aagattatag tgagcttcga tactattata atgagatgtt tcacttaata + 10441 gatggttatt tgtttaatag tagacttgca aagaaggtat atgagataaa tgagattaag + 10501 tcagctaata gtatagtatt atctataaca aatagttcaa ttaatcatca tcagagattg + 10561 acaactacaa ataataaaat tagagttgtt tatattggtc cagatgaaga atataaagga + 10621 tattttgatt ttgttgactt tgctgaaact ttagatcgag agtcctatga agtggcaact + 10681 tatggccatt taccaaatga agagtgtcct tcattcattg aacaaaaagg atattttact + 10741 aaggaaatga ttgacagtgt ctatgaaaat attgatattc ttattgttcc aagtaagtgg + 10801 aaggaaacat ttgggttgat aacagtagaa gcattatcct atggggtaaa tgttttcgtg + 10861 agtgaaaatg ttggatcaaa agacttgctt ccagaaacac atgtttttaa aaatcagaat + 10921 gacttagtag ttaaaattat agaaaatgat atagaaaata caaaattaaa aactatagat + 10981 gaacactcga aagaagtgat tcagtattat gaaagagtga taaatgatag ttgagagctt + 11041 aataaaaaag attactggaa aagcagtaga cattcaccct gatgtatcca tggcgtatat + 11101 actacaaaga ggcatgaact atggttttgg actttttcgt ggatttgtac gtggaatcgg + 11161 atttggtcaa aaagggaagc gtttattcat tggacaagga gtttctatct tagcaaagcg + 11221 taaattattt gttgggaaaa atgttcgaat tggtaaaaac gtgtctatag atgcactgtc + 11281 gaaagaagga atccattttg cagataatgt gaagattgga gattattctc aaattattgg + 11341 aacaggaact ataaaaaata tggggattgg cttgaaagtt ggtaagaact catctttttc + 11401 agaatatagt ttatttggtt ctgctggagg tatcacaatt ggtgataatg ttatcgcagg + 11461 tcagaatgtt cgttttcatg ctgaaaatca taattatagt gatttagata aactcattct + 11521 tgaacaaggg atatctcgaa agggaatttc agtaggacat aattgttgga ttggtgctgg + 11581 agctgttttt ttggatgggt ccagcatcgg ttcaggttgt gttgttggag cgaatgctgt + 11641 cgtcactaag cagtttccag ataatgttat cataggtgga gtaccagcta ggatactggc + 11701 ttatagatag tgtttaacta tttctgaaag gaagaaaatt tatgcctaca 
tttagtgtag + 11761 ttgttccagt ttataatgta gagaattatt tatcgcaatg tttaaatgct cttgtaaatc + 11821 agtcttttaa agattttgaa cttatcctgg taaacgatgg ttctactgac acatctggaa + 11881 gtctttgtga agaatggggg aaaaaagatc atcggataaa agtaatacat aaaaccaatg + 11941 aaggtcttgg ttttgcacgt aacacaggta ttgaaaactg tacaggagat tatattgtct + 12001 ttgttgattc ggatgattat gtctcatatg agatgcttga aatttatgat acatacttac + 12061 aacgttttaa tgcagacgtg atttatagtg aaaattttta tcgagtggat aataaaggaa + 12121 atattataga accacttgat cagagcctag attccatttt ttataaaaat gattcaattt + 12181 tcacagaact tttaccagat gtaatatctt caccaccaga atttattgga gatggaaaga + 12241 taggtgtttc agtgtggaaa ggggtatata aacgttcttt gtttaaggat aaggggctat + 12301 tatttcattc agaaagagaa ttcatttcag aagatgctat ttttcaaatt gattgtttaa + 12361 aattagcaac atctgccctt gttatcccag atattttata ctactatcgt gaaaactttg + 12421 gttctttaag tatgaaatat aaagaagatc ggtttgagtt gaataaaata ttgtataacg + 12481 agcaattaaa aagagttgag gggttaccta atcaagaaat tttggaagaa agaattgaga + 12541 gaattttaat tgctaatatc cgtttatgta tctttcagga atccctatat aaaagttcta + 12601 gaattcataa acgcttgcaa agaattagac agatttgtaa ggacccaata tcaaaatcag + 12661 tattacgtca ttatccaatc cgtcgtttac ctttttctaa acgcttgatc tgcgtattag + 12721 ctaagtataa tatgccgttg ttgcttttag ttttaacctt attaaaatat cggaatcgga + 12781 gtgtataact tttatgggga tgaatataga aaaattaaaa ctatctttga aaaatggaac + 12841 gtttttttct gttgttattc acgccttacg aaatcgttgg cctttatggt ggattgggaa + 12901 caaggctatt cgagaagtgc aacttgaaga tagggcttac agaatactaa aaaagaaata + 12961 cggctcctta atttcaagct cttttgataa atcatattta tcagaagaag ttcccaagca + 13021 aatctggatt tgttggcttc aaggtatgga gaatgctcca gagttggtga aatcatgtta + 13081 tagatcacta aaaaaacaat ttcctgaata tgtcattacg gttatttctt cagaaaatat + 13141 ttccgaatat gtagaaatac ctgatattat ttataaaaaa tggggaaatg gtgtaatagg + 13201 aaatgctcat ttttctgata tccttcgggt agagctgtta cgtaagtttg ggggaatatg + 13261 gattgactca acagtgtatt gtacaggaat tactaccata gagacaattg aaaaaaatcc + 13321 attttttatg tataaaagtt tatcttcagt tgaggagaga atttcctctt 
ccaactggat + 13381 gattgcttct gttcccaatc atccatttat gattacgatg agcacactct tgcaatctta + 13441 ttggtcaaaa gaagttatag caattcatta ttatctattt catattcttt ttacgattat + 13501 gattgaatca cttcctgagt tgtggcagct tgtacccacc tatacgaacg caacaccaca + 13561 tataatggct gatgaattaa ataatatttt ttcaaaggaa cgttaccagc aattgtgtca + 13621 aatttcagat tttcataaat taaattataa aaaaaattac aatgatcaat cagagagttt + 13681 gtacagtcac ttactgaatc agtagagggg agaatcttgc ctaatttaaa gaaaaacatt + 13741 gtttacaatg tcttatatca gatcttagct gtaatagtac cgtttattac ctcaccttac + 13801 ttagcgcgtg tgttaggtgc agagcaaatt ggagtttatt cttttactta ttccattgct + 13861 ttttacttta tgattctgtc catgttggga atttctaatt atgggaatcg gacaatggca + 13921 caggtacgaa caagtagaga acatttgaat caagaatttt cgaatattta cgcggttcag + 13981 ttgacgtgtt cactagtaat gaccgtctca tatttgattt atgcaacagt atttgtgaat + 14041 agttttcaga ttgtagccta tatccaagta ttacatgttt tatcgtatgc aacagatgtt + 14101 agttggtttt tttatggtct tgaagagttt cgtattacgg ttgctaggaa ttcatttgtt + 14161 aagttattaa ctttaatatc tatctttaca tttgtaaaaa gccctaatga tatctattta + 14221 tataccttta taatggcagg gagtaccctg cttggtcagt tgattacatg gccatttttg + 14281 ctaaaacaag taaactttgt gcgccctagt cttggaaaaa taaagaaaca catgaaacct + 14341 attattattt tatttttccc cgtcttagcg attagtattt tttcgtttat agataaaata + 14401 atgcttggga tgtatagtag tttgaaggaa actgcttttt atgagaattc agataagatc + 14461 attagtattc caaaagctct gattcaagcc tttggagctg taatgttgcc tcgaacagta + 14521 catttactga gtataggtga tgaacaaaaa agtttagaat atgttgataa aacgatgtgg + 14581 gttgttttag tgattacaat gggctgtgct ttcggtttag caggagtttc tgcaaccttt + 14641 gctcctgttt attggggtga agaatttagg accagtagcc aaattattgc aggaatgaca + 14701 ccggctttag tattttcggc ttttggaaat gtcatccgaa cccagttttt aattccacga + 14761 agttttgaca aggaatatac tgtatctttg ctttatggag ccgtagttaa tatcttgatt + 14821 aatattcttt tgattccgaa gataggagca atgggagctg ttatcggaat aattgttgca + 14881 gagttagttc tatgttgcta tcaaacatgg attgctagaa attatttaca tatcagagaa + 14941 tatctgataa atgctgggat attgtttctt attggttcag taatgtatat 
ggttttaatt + 15001 cttatttcaa gtattttacc tacatcgtta cttacactta ttattgaaat tatagtcgga + 15061 gctttcattt atattagttt actgattctg tatatctttt cttcaaaaaa cagggtaatt + 15121 attggtttac gaacaaattt tttagaacat actcatttat ttaaaaggaa gtaatagtga + 15181 aatttaaatt taatccaatc gcgatactgt atatattgct agtatactta gagttggcta + 15241 cagataggca acatctgtat cctgtaacgt acatgacaaa atattatatt ggtattttaa + 15301 tcattgtgtt gtttgtttta ttattagtag gccgtgggaa gcttattttt gttaataaaa + 15361 aattattata tcttgctaag atattagcta taccaacaat tgttcttttc ctgtactcag + 15421 tcttactaga cgtaatgaac ccagttgaat ttaatggata ttttagtagg ttatcaagta + 15481 cgactatttt tggtttgtta gctatctttc aagctatagt tgtttttcaa ttttttggac + 15541 aaaaagtagt agattacact tttacagcta tctccctcag ctacttaacc agtatcattg + 15601 ttgcctttag gcagggagga cttagtcaat ttatcttgat actaacagat gatagtttca + 15661 atggttcggt actagaaatg catgaagttg cacctattac agctctcttt attctgtact + 15721 atttgtacaa atattttata aaagaaaata gtttttcttc agtatttcat aatatcttaa + 15781 tagctctcat tattcttttt ttaagcctta aacgaatcgt ttttttgagt gtattaatta + 15841 tcataccagt atttttggta atttattggt atgataaaaa agtaagcaaa ctagggaaag + 15901 aacgaaaaat tttaagttta ttaaatatct tttccttaat atttataaca ggaatattcc + 15961 tttatgttta tagtgtgaaa tctgatttta tatatacatt tattcaagaa cataatatta + 16021 attcgatggc tagaacagat ttatggaagg gagttgaatc aacctataat ttcgccccta + 16081 tatttatggg gagagggata gggtttgtaa caaaatggat ggataataat tggatgactt + 16141 tgaatatcaa tggtcttaca gggtcaatgg ggatccataa tgatattttg aagtactaca + 16201 ttgagatagg atttgtagga ttatttattt atttttacac tcttctttat agaaatgcta + 16261 aacgtatatt tgtaaaaatt ggtcataaag aatcattcat atattttgta ttgataatgt + 16321 ttcagatgct gatatggttt acagataata tttcaattta ccataatttt ttatggatcc + 16381 taaatctact actcttttct ttaactaatt cggatacaga attggaaaat ttagatttta + 16441 aaaattttta atgtgtaagt agtaactact aattttatta gaaaatcaga atataggtgt + 16501 atttatgaag acagatgcta ggactaaaaa gagagagaat gaaacgttat atattctaaa + 16561 agtttgggca acatttagtg tgattgctat acattttggt tttttgggcc 
aaattggagt + 16621 gttttacaaa gtattagctc gatttgctgt acctttattt ttcatgattt caggatttta + 16681 ttcgtttagt atttcagaag aaaaactgaa gaaaagaatt aaaaatctga gtttattgat + 16741 aatttccagt acaagttttt attttttact ggatgttttt cttcaattaa cacaaggaaa + 16801 tctaagagtt gtatttgaaa gatttacttt taataatatt tttaattttt tggtattcaa + 16861 tcaaatttct gctctaattg gctcgttagc aacaccacta tggttcttat atgcattact + 16921 gtatgtttat atttatctat ttttttcaaa taaaaaatgg atatttaata ctattttgac + 16981 tgtgatcata ctctgttgtt catttataat cgagttaaaa gcaaatagtg ctttatttta + 17041 tagaaacttc ttatttatgg gagttccctt cttttctttt gggatgtatt ttgctcaaat + 17101 tcagagaaaa attataaatt ataagcactt caaagaactt tttataattg gaattatgat + 17161 ttcaggattt ctaactctgt ttgaatatac ctttttagga gcaaattttg aactttatat + 17221 aagttcggtg ataatatctt gtatgcttat ggtcttttcg attaaatatc ctcaactctg + 17281 gacgctagat tttgctgtca atattgctaa aaaaaatgcg acgtttattt atattagtca + 17341 tcaatttgtg attttattat ttaaaacata cgttagagat ggaattgctt ataaaattgg + 17401 aactttcttg atatttttag catgtgttat tatgagtatt attttcaact atatagtcga + 17461 tataatcagt cgttgttgca taaaagaaaa acaagatata atatgaaatt ttatataaaa + 17521 aatttattaa aaaaagtctt tacattaccg ttgcatttat tgcctattca gtctaataag + 17581 ataatatttg ataattttgg tggtagaggt tttggggaca atcctaagta tatacttgaa + 17641 gaacttgtct ctcgagaaaa gaatctagat cttgtgtggg taacaaaaga tagagaaatt + 17701 tctatccctg aaggcgttcg agtagtaaaa tacggcagtt accgttcttt ttatgaatgg + 17761 ttaacagcta gagtttgggt agataatatt cgtaattctg atcgaccttg gaagcgaaaa + 17821 ggacagattt atcttcaaac ttggcatggt tcagatgggg taaagttaat tgaaaaaagt + 17881 gttgcaagga acctaaaaaa aacatatctt agaatggcga agtatgatgg aaagattaca + 17941 gacggtatcg tatcaagtcg gcactttcaa actttgggta tgcaaaataa tttttggctg + 18001 acagagaatg tggaatttct ggaatttgga ttacctcgaa atgatgattt ttttaaaagt + 18061 gaaaaaatca aaaccacaaa tataaaattt agaacattat ttgatatcga tttagacgaa + 18121 ctggtagttt tgtatatgcc gacgttcaga gatgatggat cgttgaatgc ctataattta + 18181 gattactcga aactaataca tgtttttcaa aataaattta gaaaaaatgt 
aaaaatatta + 18241 gttcgttttc atccaaatgt tgattctagt tttataaatt tacaggatac agactgtata + 18301 aatgtgtcga cctattcaaa tcctcaggat ctgatgatga gtgcagatgt gatgattacg + 18361 gattattcat cggcttctat tgattttatg ttattaaatc gtccagtatt tctgtattta + 18421 ccagattatc aaagttatgt gaatgataga ccattggatg ataactttga taaattgcca + 18481 tttccaagag catatcataa caatgagttg acagaaatta ttagagactt tgaaagaagt + 18541 aaatatgatg aaaaagttcg tctgtatgaa ttagaggatg ttcgttttga tagaggaaaa + 18601 gcatcagtac agtgtgctaa ttggattgaa gaaaaaataa aaaacaataa agttattgat + 18661 tgaaataatt gtatttattg aattataaat aaggaggcct ttagatgaaa agagttataa + 18721 catatggtac atttgattta ttgcattatg gtcatatcaa tcttttaaaa cgtgctaaac + 18781 agctaggtga ttatttgatt gtagttgttt caagtgatga gtttaattta aaagaaaaga + 18841 ataaagtatg ttactttaac tacgaacaca gaaaaaattt agtagaagct attcgatatg + 18901 tcgatttagt aatccctgaa actagttggg aacagaaaaa gtcagatgtt aaaaagtacc + 18961 atattgacac ttttgtaatg ggtgatgatt ggaaaggtaa atttgattat cttgaagaag + 19021 aaggtgttga agtagtctat ttgcctagaa caaaggaaat atcaaccaca aagataaaag + 19081 aagatttatc ggaatgaaat attattaaaa aatgctgaca taagaaattg tggcttttgt + 19141 gtctagtttt tgatagaata aagtaacaac actttaacca atgaggtgtg aataatggca + 19201 gtaattttta aagatgtact tgttgaagag aaaactgatg aagaaaaaca acatatttta + 19261 tctattttaa atgatgagaa tgttagagct tttgattgtg gatattaaga attgaatgat + 19321 gttttttgat atttagaaca aatacgatga agaaacaggc catgtattgc ctattgtaaa + 19381 tcaaaatttt gaattattag gttttatttc ttgtagacta gtatcatttt ctttcatagc + 19441 tcaggttaaa gagatgggaa ttagcataga ttatcttggt attcataagg attgccagaa + 19501 aatgggggat cggttcgctt ttggtgctct ttgcgcttcg attatcttta actattgact + 19561 gttgattacc aataaaaggt gtaatagttc atgttttaga ggatgttgta gaattctatg + 19621 acaaactggg ttttattgac cctagagata tagtgattta taatggcaaa ccggttacta + 19681 tatattttag tattgaaaaa ctaagaaatg gtgaaaatta ttcctctcac acagttattt + 19741 gaaacatcct tagaaaatga tttttaattg tatgcaaaca aagtagaatt cgcttatttc + 19801 atcttatgct aaatgtaata tgaaacaagt gaatttttat agataaagaa 
gaattttaaa + 19861 aaatgtgatg attattttct ttttagagca gtacagaatt aatagtaatt gactctaaat + 19921 caataaagaa aggtacccta ctatgaaagg tattattcta gcaggtggtt cggggacacg + 19981 tttatatcct ttgactcgag ccgcatcaaa acaacttatg ccggtttatg ataaaccgat + 20041 gatttactac ccactttcaa cattgatgtt ggctgggatt agggatattt tgattatttc + 20101 cactccacag gatttacatc gatttcaaga gcttcttcaa gacggatctg agtttgggat + 20161 caaactttct tatgcagagc aaccaagtcc agatggtttg gcacaagcct ttatcattgg + 20221 ggaagagttt atttctgatg atagcgttgc gctaatctta ggtgataata tctaccatgg + 20281 ttctgggctt tccaagatgc tacaaaaggc agcgagtaag gagtcgggag caactgtttt + 20341 tggctaccat gtcaaggatc cagagcgctt tggtgtggtt gagtttgatc aggatatgaa + 20401 ggctatttct attgaagaaa agccagagca acctcgttca aactatgcag tgacaggact + 20461 ctatttctat gataatgatg tagtagagat tgccaagagt attaaaccaa gtcctcgtgg + 20521 tgaactggaa attacagatg taaacaaagc ttacctagat cgtggtgatt tgtctgttga + 20581 gcttatggga cgtggctttg cttggctgga tactggaact catgaaagtt tactagaggc + 20641 ttcacagtac atcgaaacag tccaacggat gcaaaatgtt caggtagcaa acttagaaga + 20701 aattgcttac cgtatgggct atatcagtcg agaagatgta ttggccttag cccaaccact + 20761 taagaaaaat gaatacggac agtatctgct ccgtttgatt ggagaagcat agatgacaga + 20821 taattttttc ggtaagacgc ttgcggcacg caaggttgaa gctattccag gcatgttgga + 20881 gtttgatata cccgttcatg gagataatcg tggctggttt aaagaaaatt tccaaaagga + 20941 aaaaatgctt ccacttggat ttccagagtc tttctttgca gaaggaaaat tgcaaaacaa + 21001 tgtatccttc tcacgtaaaa atgtccttcg aggcctccac gcagagcctt gggataagta + 21061 catctctgta gcagatggag ggaaagttct gggttcttgg gttgatctac gcgagggtga + 21121 aacctttggg aatacctatc agacagtaat tgatgcaagc aagggaatct ttgttcctcg + 21181 aggcgtagct aatggcttcc aagttctatc agatacagtg tcatatagct atctggtcaa + 21241 tgattactgg gctctcgagc tcaaacccaa gtatgccttt gtgaactacg ctgatccaag + 21301 ccttggtatt gaatgggaaa atattgcaga agcagaggtt tcagaagcag ataaacatca + 21361 tcccctactt aaggatgtaa aacctttgaa aaaagaagat ttgtaaaaag gaaagaatat + 21421 gactgaatac aaaaatatta tcgtgacagg tggagctggc tttatcggtt 
ctaactttgt + 21481 ccattatgtt tacgagaact ttccaggtgt tcacgtgaca gtcctagata agttgactta + 21541 tgctggaaat cgcgcgaata ttgaggaaat tttaggtaat cgtgttgagt tagttgttgg + 21601 tgacattgct gatgcggagt tggtagacaa gttggctgct caagcagatg ctatcgttca + 21661 ttatgcagcg gaaagccaca atgataattc gctcaatgat ccatcgccat ttattcatac + 21721 taacttcatc ggaacctata ctcttttaga agctgctcgt aagtatgata ttcgcttcca + 21781 ccatgtatcg acagatgaag tttatgggga tctcccttta cgcgaagatt tgccaggtca + 21841 tggtgaagga ccaggtgaga aatttactgc tgaaacaaaa tacaacccaa gctctccgta + 21901 ctcatcaacc aaggcagcct cagatttgat tgtcaaagcc tgggtgcgtt cttttggagt + 21961 caaggcaacg atttccaact gttcaaataa ctacggtcct tatcaacata tcgaaaaatt + 22021 catcccacgt cagattacta acattctaag tggaattaag ccaaaacttt acggtgaagg + 22081 taagaatgtt cgtgactgga ttcataccaa tgaccattct tcaggagttt ggacaatctt + 22141 gacaaaaggg caaatcggtg aaacctactt gattggggct gatggtgaga agaacaataa + 22201 ggaagttttg gaacttatcc ttaaggaaat gggacaagct acggatgcct atgatcatgt + 22261 gactgaccgt gcaggacatg accttcgcta tgcgattgat gccagcaagc tccgtgatga + 22321 gttggggtgg aaacctgaat ttaccaactt tgaagctggg ctcaaggcaa caatcaagtg + 22381 gtatacagat aaccaagaat ggtggaaagc agaaaaagaa gctgttgaag ccaattatgc + 22441 caagactcag gagattatta cagtataaaa agcaggaaat agctgctttt tattgctata + 22501 ttgggaagag ttacatatta gaaaggtcta gagatgattt taattacagg ggcaaatggc + 22561 caattaggaa cggaacttcg ctatttattg gatgaacgta atgaagaata cgtggcagta + 22621 gatgtggctg agatggacat taccaatgaa gaaatggttg agaaagtttt tgaagaggtg + 22681 aaaccgactt tagtctacca ttgtgcagcc tacaccgctg ttgatgcagc agaggatgaa + 22741 ggaaaagagt tggacttcgc catcaatgtg acggggacaa aaaatgtcgc aaaagcatct + 22801 gaaaagcatg gtgcaactct agtttatatt tctacggact atgtctttga cggtaagaaa + 22861 ccagttggac aagagtggga agttgatgac cgaccagatc cacagacaga atatggacgc + 22921 actaagcgta tgggggaaga gttagttgag aagcatgtgt ctaatttcta tattatccgt + 22981 actgcctggg tatttggaaa ttatggcaaa aacttcgttt ttaccatgca aaatcttgcg + 23041 aaaactcata agactttaac agttgtaaat gaccagtacg gtcgtccgac 
ttggactcgt + 23101 accttggctg agttcatgac ctacctagct gaaaatcgta aggaatttgg ttattatcat + 23161 ttgtcaaatg atgcgacaga agacacaaca tggtatgatt ttgcagttga aattttgaaa + 23221 gatacagatg tcgaagtcaa gccagtagat tccagtcaat ttccagccaa agctaaacgt + 23281 ccgctaaact caacgatgag cctggccaaa gccaaagcta ctggatttgt tattccaact + 23341 tggcaagatg cattgcaaga attttacaaa caagaagtga gataagtagt agaatgattt + 23401 tctagtctaa taaaagaggc agagaatgaa ctccaaagga gcttaagatg tacgattatc + 23461 ttgttgttgg tgctggtctc tttggcgcat agctttggct cagtttctat tatcgctcac + 23521 accatccatc agaagtttaa tctgaaggta cccaattatc gccaagaaga agattgggct + 23581 aggatgggtt taccaatcac acgtaaggaa atctctaatt ggcatatcaa ggcaagtcaa + 23641 tactatttag agtcccttta taacctttta cgagaaaagt tgttagaaca acctcttctt + 23701 catgcggatg aaacctctta tcgggttcta gggagtgata gccatctgac ctactattgg + 23761 acctttttgt ctgggaaagc tgagaatcaa gcaatcacgc tgtaccatca tgatcagcgt + 23821 cggagtggtt cggtagtgca agaattccta ggagattatt ctggctatgt gcattgtgat + 23881 atgttgcggc agtaacttag gactttagtc ctctagttct gcctatgcga tagcagtcca + 23941 aggtttagga gcaaggcgac gctaagcttg gtaaactgcg aaccgctaga agcttatcgt + 24001 caactggaag aagctgaact tgttggatgt tgggcacatg tgagaaggaa gttttttgaa + 24061 gcgaccccca agcaagcaga taaatcatcc ttaggagcta aaggtttagc ttattgtgat + 24121 cagttatttt ccctggaaag agactgggag gctttgccag ctgatgaacg actacagaaa + 24181 cgtcaagaag agctccagcc cttaatggaa gacttctttg cttagtgccg gcgtcagtca + 24241 gttttagcag gttcaaaact aggaagggca attgaataca gcctcaagta tgaagaaacc + 24301 tttaagacta ttttgaaaga cggacatctg gtcctttcca ataatctagc tgaacgcgcc + 24361 attaaatcat tggttatggg acggagtaaa agagtccagt ggactctttt agcctaagct + 24421 aaattttaaa aagcgagggt ggttattttc tcaaagtttt gaaggagcta aagcaagaac + 24481 tattattatg agtttgttgg aaacagctaa acgtcatcaa ttaaatagcg agaaatatct + 24541 attctatctt ctagaatgtc tttcaaacga ggaaactctc gtaaacaaag aggttttaga + 24601 ggcttattta ccatggacta aagttgtaca agaaaagtgc aaataagaaa tctccagatt + 24661 aggaactatc cgtgagttct ctagtctgga gatttttcgg ctctttgtca 
actgtagtgg + 24721 gttgaaaaaa agctaagctc gagaaaggac aaattttgtc ctttcttttt ttagaaatag + 24781 tattaaaaat tccttgacta tgtgatatag ttgagggatt tttaaatgat attcatattt + 24841 tttgcaaaga tgttgtttga aaaataattt tcaaaaattc tgaaaattct gttgacatct + 24901 ttctgaaaag agtctataat ggagagaaag ttttaaagga gaaaatgatg aaaagttcaa + 24961 aactatttgc ccttgcgggc gtgacattat tggcggcgac tactttagct gcatgctctg + 25021 gatcaggttc aagcactaaa ggtgagaaga cattctcata catttatgag acagaccctg + 25081 ataacctcaa ctatttgaca actgctaagg ctgcgacagc aaatattacc agtaacgtgg + 25141 ttgatggttt gctagaaaat gatcgctacg ggaactttgt gccgtctatg gctgaggatt + 25201 ggtctgtatc caaggatgga ttgacttaca cttatactat ccgtaaggat gcaaaatggt + 25261 atacttctga aggtgaagaa tacgcggcag tcaaagctca agactttgta acaggactaa + 25321 aatatgctgc tgataaaaaa tcagatgctc tttaccttgt tcaagaatca atcaaagggt + 25381 tggatgccta tgtaaaaggg gaaatcaaag atttctcaca agtaggaatt aaggctctgg + 25441 atgatcagac agttcagtac actttgaaca aaccagaaag cttctggaat tctaagacaa + 25501 ccatgggtgt gcttgcgcca gttaatgaag agtttttgaa ttcaaaaggg gatgattttg + 25561 ccaaagctac ggatccaagt agtctcttgt ataacggtcc ttatttgttg aaatccattg + 25621 tgaccaaatc ctctgttgaa tttgcgaaaa atccgaacta ctgggataag gacaatgtgc + 25681 atattgacaa agttaaattg tcattctggg atggtcaaga taccagcaaa cctgcagaaa + 25741 actttaaaga tggtagcctt acagcagctc gtctctatcc aacaagtgca agtttcgcag + 25801 agcttgagaa gagtatgaag gacaatattg tctatactca acaagactct attacgtatc + 25861 tagttggtac aaatattgac cgtcagtcct ataaatacac atctaagacc agcgacgaac + 25921 aaaaggcatc gactaaaaag gctctcttaa acaaggattt ccgtcaggct attgcttttg + 25981 gttttgatcg tacagcctat gcctctcagt tgaatggaca aactggagca agcaaaatct + 26041 tacgtaatat ctttgttcca ccaacatttg ttcaagcaga cggtaaaaac tttggcgata + 26101 tggtcaaaga gaaattggtc acttatgggg atgaatggaa ggatgttaat cttgcagatt + 26161 ctcaggatgg tctttacaat ccagaaaaag ccaaggctga atttgctaaa gctaaatcag + 26221 ccttacaagc agaaggtgtg acattcccaa ttcatttgga tatgccagtt gaccaaacag + 26281 caactacaaa agttcagcgc gtccaatcta tgaaacaatc cttggaagca 
actttaggag + 26341 cggataatgt agtcattgat attcaacaac tacaaaaaga cgaagtaaac aatattacat + 26401 attttgctga aaatgctgct ggcgaagact gggatttatc agataatgtc ggttggggtc + 26461 cagactttgc cgatccatca acctaccttg atatcatcaa accatctgta ggagaaagta + 26521 ctaaaacata tttagggttt gactcagggg aagataatgt agctgctaaa aaagtaggtc + 26581 tatatgacta cgaaaaattg gttactgagg ctggtgatga gactacagat gttgctaaac + 26641 gctatgataa atacgctgca gcccaagctt ggttgacaga tagtgctttg attattccaa + 26701 ctacatctcg tacagggcgt ccaatcttgt ctaagatggt accatttaca ataccatttg + 26761 cattgtcagg aaataaaggt acaagtgaac cagtcttgta taaatacttg gaacttcaag + 26821 acaaggcagt cactgtagat gaataccaaa aagctcagga aaaatggatg aaagaaaaag + 26881 aagagtctaa taaaaaggct caagaagatc tcgcaaaaca tgtgaaataa +// + diff --git a/public/res/serotype_genbank/serotype_19A.gb b/public/res/serotype_genbank/serotype_19A.gb new file mode 100644 index 0000000..5daef2e --- /dev/null +++ b/public/res/serotype_genbank/serotype_19A.gb @@ -0,0 +1,866 @@ +LOCUS CR931675 18617 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain Nr. 141/68 (serotype 19a). +ACCESSION CR931675 +VERSION CR931675.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 18617) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 18617) + AUTHORS Bentley,S.D. 
+ TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..18617 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="Nr. 141/68" + /db_xref="taxon:1313" + gene <1..136 + /gene="dexB" + /locus_tag="SPC19A_0001" + CDS <1..136 + /gene="dexB" + /locus_tag="SPC19A_0001" + /codon_start=2 + /transl_table=11 + /protein_id="CAI33621.1" + /db_xref="UniProtKB/TrEMBL:Q4K117" + /translation="ANEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVEMTD + " + gene complement(267..1697) + /gene="tnp" + /locus_tag="SPC19A_0002" + /pseudo + CDS complement(267..1697) + /gene="tnp" + /locus_tag="SPC19A_0002" + /note="member of homology group 17; + member of homology group 17" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1202 transposase" + misc_feature complement(693..1193) + /gene="tnp" + /locus_tag="SPC19A_0002" + /note="HMMPfam hit to PF00665, Integrase core domain, + score 1.8e-21" + /pseudo + gene 1852..3297 + /gene="wzg" + /locus_tag="SPC19A_0003" + CDS 1852..3297 + /gene="wzg" + /locus_tag="SPC19A_0003" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33623.1" + /db_xref="GOA:Q4K116" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K116" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSEIENVTQLMSVTAPTGTDNENIQKLLADIKSSQNTDLT + 
VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEHPDYASKIKKIYTKGFTKKVEAP + KTSKDQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGVDVYNDQ + DFTSLHGKFHFPVGNVHLDSEQALGFVRERYSLADGDHDRGRNQQKVIAAILQKLTSS + EALKNYSRIIDSLQDSIQTNMPLETMINLVNAQLESGGTYKVNSQDLKGMGRTDLPSY + AMPDSNLYMMEINDSSLASVKTAIQDVLEGR" + misc_feature 1852..1968 + /gene="wzg" + /locus_tag="SPC19A_0003" + /note="Signal peptide predicted for SPC0963 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 39 and 40" + misc_feature 2056..2403 + /gene="wzg" + /locus_tag="SPC19A_0003" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 2.7e-63" + misc_feature 2581..3024 + /gene="wzg" + /locus_tag="SPC19A_0003" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 3e-72" + gene 3299..4030 + /gene="wzh" + /locus_tag="SPC19A_0004" + CDS 3299..4030 + /gene="wzh" + /locus_tag="SPC19A_0004" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33624.1" + /db_xref="GOA:Q9ZFU0" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q9ZFU0" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTSDVLDKLEKNRIPTLNNS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELINMGCYT + QVNSSHVLKSKLFGERYKFMKKRAQYFLERDLVHIIASDMHNVDSRPPHMAEAYDLVS + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 3302..3910 + /gene="wzh" + /locus_tag="SPC19A_0004" + /note="HMMPfam hit to PF02811, PHP domain, score 5.8e-37" + gene 4036..4731 + /gene="wzd" + /locus_tag="SPC19A_0005" + CDS 4036..4731 + /gene="wzd" + /locus_tag="SPC19A_0005" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33625.1" + /db_xref="GOA:Q9ZFT9" 
+ /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q9ZFT9" + /translation="MMKEQNTIEIDVFQLLKTLWKHKLIILLVALVTGAGAFAYSTFI + VKPEYTSTTRIYVVNRNQGDKPGLTNQDLQAGTYLVKDYREIILSQDVLEKVATNLKL + DMPAKTLTSKVQVTVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIIAVTRVSDV + TTLEEARPAMTPSSPNVRRNTLVGFLGGAAVTVITVLLIELLDTRVKRPEDVEDVLQM + PLLGVVPDFDKMK" + misc_feature 4057..4473 + /gene="wzd" + /locus_tag="SPC19A_0005" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 1.8e-56" + misc_feature 4579..4656 + /gene="wzd" + /locus_tag="SPC19A_0005" + /note="PS00217 Sugar transport proteins signature 2." + gene 4741..5430 + /gene="wze" + /locus_tag="SPC19A_0006" + CDS 4741..5430 + /gene="wze" + /locus_tag="SPC19A_0006" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33626.1" + /db_xref="GOA:Q9ZFT8" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q9ZFT8" + /translation="MPTLEISQAKLELVKKAEEYYNALCTNLQLSGDDLKVFSITSVK + AGEGKTTTSTNIAWAFARAGYKTLLIDADMRNSVMSGVFKSRERITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFTTMLETLRKYFDYIVVDTAPVGVVI + DAAIIMQKCDASILVTKAGETKRRDLQKAKEQLEQTGKSCLGVVLNKLDTSVEKYGSY + GSYGNYRKQKK" + gene 5445..6806 + /gene="wchA" + /locus_tag="SPC19A_0007" + CDS 5445..6806 + /gene="wchA" + /locus_tag="SPC19A_0007" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI33627.1" + /db_xref="GOA:Q9ZFT7" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q9ZFT7" + /translation="MSEKLAKPSVAIVQSFLVILLTYLLSAVRETEIVSTTAIVLYIL + HYFVFYISDYGRNFFKRGYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYF + LLLHVFLVYVLNPFIKWYWKRAYPNFKGSKKILLLTATSRVEKVLDRLIESDDVVGEL + VAVSVLDKPDFQHDDLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + 
IDVTVNLNAFDWARNKQICEMAGLNVVTFSTTFYKTSHVIAKRIIDIVGSLVGLILCG + LVSIVLVPLIRKDGGSAFFAQTRIGKNGRHFTFYKFRSMCVDAEEKKRELMEQNTMQG + GMFKVDDDPRITKIGHFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPEQK + RRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYIDGWTIWKDIEILLKTVKVVLMKD + GAK" + misc_feature 6222..6803 + /gene="wchA" + /locus_tag="SPC19A_0007" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 1.8e-158" + gene 6812..7555 + /gene="wchO" + /locus_tag="SPC19A_0008" + CDS 6812..7555 + /gene="wchO" + /locus_tag="SPC19A_0008" + /note="member of homology group 33" + /codon_start=1 + /transl_table=11 + /product="putative WecB-family glycosyl transferase" + /protein_id="CAI33628.1" + /db_xref="GOA:Q9ZFT6" + /db_xref="InterPro:IPR004629" + /db_xref="UniProtKB/TrEMBL:Q9ZFT6" + /translation="MNERIQILGITIDPLTMKETVDAVEQYVLKKHPLHLMGVNADKI + NQCYEDEKIKKIVNESGIINADGASVVLASKFLGTPVPERVAGIDLMKHLLELSNEKG + YSVYFFGAKEDVLQDMLKIFEERYPALNVVGYRNGYFSPEDEKHIQEDIKEKKPDFVF + VGITSPKKEYIIQSFMDNGINAVFMGVGGSFDVLSGHIKRAPLWMQNAHLEWLFRVAN + EPKRLFKRYFVGNVSFIRKVLRAKRGYKL" + misc_feature 6974..7489 + /gene="wchO" + /locus_tag="SPC19A_0008" + /note="HMMPfam hit to PF03808, Glycosyl transferase + WecB/TagA/CpsF f, score 3.8e-91" + gene 7552..8376 + /gene="wchP" + /locus_tag="SPC19A_0009" + CDS 7552..8376 + /gene="wchP" + /locus_tag="SPC19A_0009" + /note="member of homology group 95" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="CAI33629.1" + /db_xref="GOA:Q4K110" + /db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4K110" + /translation="MNQTEIVKLIQKVELDAIKEFQKICKENNIDFFLRGGSVLGAVK + YDGFIPWDDDMDIAVPREGYDKLPGIFKDRIIAGKYQVLAYQYCDTLHCYFPRLFLLE + DERKRLGLPRNTNLGLHLIDIIPLDGAPNHSFLRKLYFGKVYWYRFLASLGTTYVGDH + VDMHSAKQKLIIGFFKKLGFAKLFPQNYVYRRLDNLYKKYDWKKQKYAGTINASLFAK + EVMPVEIWGEGVEKPFEDAFFKVPTEYDRYLKRLYGENYLHEEPSDDEKKSHLGGQ" + misc_feature 7624..8313 + /gene="wchP" + /locus_tag="SPC19A_0009" + /note="HMMPfam hit to PF04991, LICD Protein Family, score + 
1.2e-104" + gene 8378..9256 + /gene="wchQ" + /locus_tag="SPC19A_0010" + CDS 8378..9256 + /gene="wchQ" + /locus_tag="SPC19A_0010" + /note="member of homology group 43" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33630.1" + /db_xref="GOA:Q4K109" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K109" + /translation="MFCYIILHYKVLEETISCVKSIKEGNSNTKQIVIIDNFSNNGTG + EKLQELYESDSEIDVLINHENAGFARGNNVAYQFAKEKYKPDFMVIMNNDIEIETEEF + EKIVTDIYRKEKFHLLGPDIFSTTYQLHQNPKRLTHYTYEEVKALNEKFKKGSQVSLA + LKIKCWLKSSKVLRTAIYQNRRKKKSVDYRKQVENPILHGSFIVYSRDFIEKEEYAFN + PNTFFYYETEILDYEAELKGYKRIYTPKIKVLHHQNVATNQVYTNLVEKTLFSNKCNF + ESTSYFLKLMKENEGV" + misc_feature 8384..9019 + /gene="wchQ" + /locus_tag="SPC19A_0010" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 6.3e-10" + gene 9257..10591 + /gene="wzy" + /locus_tag="SPC19A_0011" + CDS 9257..10591 + /gene="wzy" + /locus_tag="SPC19A_0011" + /note="member of homology group 161" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33631.1" + /db_xref="UniProtKB/TrEMBL:Q9ZFT3" + /translation="MTYLFLLCLTLFLLTFFYFFAFNQDLIAPPVVMSVMFLISSVFA + LINVQNWNIEYSGLAYLLIISGIIVFSMPLLALNSPSLNTKIKVTDRLIDIQFWKIAL + TIIVDLIILYLYRREIHNLALSHGYTGSNFQWFFRNATSYEGELTVRTSIRVLIRIID + VSAYIFGYTFINNFFIYSHKRSKDLLLLVPFLIFISKTLLSGGRLDIIKILIAYVVMA + YIQQKRKVGWDKVISHKYMRLGFVGLIAGIPTFYYSLFLSGRSTTRTVFESISTYLGG + SIQHFNQYIQNPIGVAEVFGDESFVAIMNILGNLGFVNYNSTVHLEFRQLGITMGNVY + TFFRRPWHDFGLVGMYIFSFVVGVFFAIFYLKLRKSRAGFKLDIHTIIYSYFFYWIFL + SSIEQYSFTTISLFTLVFIVLVYLMAFFYWNLDFHRGKLVIKLSDTSIKSEN" + misc_feature 9257..9388 + /gene="wzy" + /locus_tag="SPC19A_0011" + /note="Signal peptide predicted for SPC0971 by SignalP 2.0 + HMM (Signal peptide probability 0.988) with cleavage site + probability 0.615 between residues 44 and 45" + gene 10619..12043 + /gene="wzx" + /locus_tag="SPC19A_0012" + CDS 10619..12043 + /gene="wzx" + /locus_tag="SPC19A_0012" + 
/note="member of homology group 82" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33632.1" + /db_xref="GOA:Q4K107" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K107" + /translation="MNSKIKNILTNFSYVISSNLLTVLTSSLVVLIFPKLMGVTEYSY + WQLYIFYLTYIGFFHLGWIDGIYLKYGGLEYNNLDRKQFYSQMILFSSFLMIISLLLF + GLNVLAVTDSNARYIYNMTIISMIITNLRTLYVYVLQMTNRLKDSSIILLSDRVLYVL + LLFLFIVFGWHEYKVMILADILGRSFSLILSFWICKDIVFQPLSKFIFNIKESFDNIR + VGINLMLSNIASSLIIGIVRLGIQWNWNIETFGKVSLTLSVSNLLMTFINAIGLVVFP + LLRRTKAENLPKIYSNLRNVLMLIMFAILLIYYPLKIVLDLWLPAYQDALIFMTLIFP + MSVYEGKMALVINTYLKALRMERDILRVNALVMLISMGVTLVTTYLLNSLELTVVSIV + VLLALRSIIAELILSKKLDVSVKKDIVLEFLLTLVFISSSWYLPIGLAVIVYTIAYGL + YLYLKHEDIKTYLAYFKASKKTSN" + misc_feature 10619..10738 + /gene="wzx" + /locus_tag="SPC19A_0012" + /note="Signal peptide predicted for SPC0972 by SignalP 2.0 + HMM (Signal peptide probability 0.731) with cleavage site + probability 0.397 between residues 40 and 41" + gene 12108..13196 + /gene="mnaA" + /locus_tag="SPC19A_0013" + CDS 12108..13196 + /gene="mnaA" + /locus_tag="SPC19A_0013" + /EC_number="5.1.3.14" + /note="member of homology group 23" + /codon_start=1 + /transl_table=11 + /product="UDP-N-acetylglucosamine-2-epimerase MnaA" + /protein_id="CAI33633.1" + /db_xref="GOA:Q4K106" + /db_xref="InterPro:IPR003331" + /db_xref="UniProtKB/TrEMBL:Q4K106" + /translation="MKKIMLVFGTRPEAIKMCPLVNELKKHEDMETIVCVTGQHKEMV + SPVLDLFGVVPDYDLEIMKANQTLFSITTSILEKIKPVLEKEQPDIVLVHGDTTTTYA + AALAAFYLGIKVGHVEAGLRTYNLQSPFPEEFNRQSTSIIATYHFAPTELAKENLLKE + GRENVYVTGNTVIDALTTTVQEDYTHTHLDLNANNRLILLTAHRRENLGEPMRHMFRA + VKRVLNEYEDVKVIYPIHKNPLVRETAAEIFGDTERIQIIEPLDVLDFHNFMNQSYMI + LTDSGGVQEEAPSLGKPVLVMRDTTERPEGVAAGTLKLVGTDEETIYQNFKLLLDDSG + EYKKMSQASNPYGNGDASQQIVQILRGI" + misc_feature 12171..13187 + /gene="mnaA" + /locus_tag="SPC19A_0013" + /note="HMMPfam hit to PF02350, UDP-N-acetylglucosamine + 2-epimerase, score 1.9e-193" + gene 13359..14228 + /gene="rmlA" + /locus_tag="SPC19A_0014" + CDS 
13359..14228 + /gene="rmlA" + /locus_tag="SPC19A_0014" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI33634.1" + /db_xref="GOA:Q4K105" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q4K105" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIKDILIISTPQDLPRFKDLLLDGSEFGIKLSYAEQPSPDGLAQAFLIGEEFIGDDSV + ALILGDNIYHGPGLSTMLQKAAKKEKGATVFGYQVKDPERFGVVEFDTDMNAISIEEK + PEYPRSNYAVTGLYFYDNDVVEIAKQIKPSARGELEITDVNKAYLNRGDLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEISYRMGYISREDVLELAQPLKKN + EYGQYLLRLIGEA" + misc_feature 13362..14078 + /gene="rmlA" + /locus_tag="SPC19A_0014" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 7.9e-118" + gene 14229..14825 + /gene="rmlC" + /locus_tag="SPC19A_0015" + CDS 14229..14825 + /gene="rmlC" + /locus_tag="SPC19A_0015" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI33635.1" + /db_xref="GOA:Q9ZFS9" + /db_xref="HSSP:1NYW" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:Q9ZFS9" + /translation="MSDNFFGKTLVVRKIDAIPGLLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAAGKLQNNVSFSRKNVLRGLHAEPWDKYISVADDGKVLGSWVDLREG + ETFGNVYQTEIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKNHPLLKDVKPLKKEDLE" + misc_feature 14262..14795 + /gene="rmlC" + /locus_tag="SPC19A_0015" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 2.6e-16" + gene 14835..15884 + /gene="rmlB" + /locus_tag="SPC19A_0016" + CDS 14835..15884 + /gene="rmlB" + /locus_tag="SPC19A_0016" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI33636.1" + 
/db_xref="GOA:Q9RQL6" + /db_xref="HSSP:1KEP" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q9RQL6" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPDVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQATD + AYDHVTDRAGHDLRYAIDASKLREELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 14850..15806 + /gene="rmlB" + /locus_tag="SPC19A_0016" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 5e-05" + misc_feature 14853..15689 + /gene="rmlB" + /locus_tag="SPC19A_0016" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.0045" + misc_feature 14853..15593 + /gene="rmlB" + /locus_tag="SPC19A_0016" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 5.4e-77" + misc_feature 14856..15668 + /gene="rmlB" + /locus_tag="SPC19A_0016" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 1.4e-05" + gene 15950..16801 + /gene="rmlD" + /locus_tag="SPC19A_0017" + CDS 15950..16801 + /gene="rmlD" + /locus_tag="SPC19A_0017" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI33637.1" + /db_xref="GOA:Q9RQL5" + /db_xref="HSSP:1N2S" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q9RQL5" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITDAEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGRELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 15950..16798 + /gene="rmlD" + 
/locus_tag="SPC19A_0017" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 1.1e-148" + misc_feature 15953..16594 + /gene="rmlD" + /locus_tag="SPC19A_0017" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 9.3e-05" + misc_feature 15953..16582 + /gene="rmlD" + /locus_tag="SPC19A_0017" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 1.4e-19" + misc_feature 15956..16684 + /gene="rmlD" + /locus_tag="SPC19A_0017" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 1.4e-08" + gene order(16877..17830,17841..18059) + /gene="tnp" + /locus_tag="SPC19A_0018" + /pseudo + CDS join(16877..17830,17841..18059) + /gene="tnp" + /locus_tag="SPC19A_0018" + /note="member of homology group 12" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1670 transposase" + misc_feature 16883..17326 + /gene="tnp" + /locus_tag="SPC19A_0018" + /note="HMMPfam hit to PF03050, Transposase IS66 family, + score 7.5e-05" + /pseudo + gene 18258..>18617 + /gene="aliA" + /locus_tag="SPC19A_0019" + CDS 18258..>18617 + /gene="aliA" + /locus_tag="SPC19A_0019" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33639.1" + /db_xref="GOA:Q4JZ60" + /db_xref="InterPro:IPR000914" + /db_xref="UniProtKB/TrEMBL:Q4JZ60" + /translation="MMKSSRLFALAGVTLLAATTLAACSGSGSSTKGEKTFSYIYETD + PDNLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKD + AKWYTSEGEEYAAVKAQD" + misc_feature 18258..18344 + /gene="aliA" + /locus_tag="SPC19A_0019" + /note="Signal peptide predicted for SPC0979 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.277 between residues 29 and 30" + misc_feature 18504..18572 + /gene="aliA" + /locus_tag="SPC19A_0019" + /note="PS01040 Bacterial extracellular solute-binding + proteins, family 5 signature." 
+ORIGIN + 1 tgccaatgaa gagcaagact tgacagtaga aggaaaagtc aaatctgtct tgattgaaaa + 61 caccctagct caagaagtct ttgaaaaaca aatcttagtt ccatgggatg ctttctgtgt + 121 ggaaatgact gactagaatg agcaaacctc aagtttttga agcttgaggt tttttactat + 181 agtggattga aactagaata gtgcacctct gcttctaaaa cattgttaga aatcgatttg + 241 actgtcccga tcgatttgtc ctattcttat ttcattttgc tatacttgta gttgaggaga + 301 attaagctcc tcactagtaa actcttcata atccttttta tttttatgaa gatattgttt + 361 gaaagatgtg agtttccacg gatgggtttg tggagggata tacttgcgtc tttctttttt + 421 tgttctggtt cttgttcaaa gtttttcgaa tagagttcat gatttagtag ctcctttgtg + 481 tgatagattt tgtcagcgat attgaggtag atgtctccgt caaatgcttt tataactaat + 541 gctttcgtct ttctgatgaa atagacttct tttccttgtt cggtagggat atagtaacga + 601 ttttggaatc ggatatggtg tccactatcg acgactctct ccgccagtct agccagaatg + 661 agattccttt cagaggggtt aggaacctcc tcgaagacag agagttttgt cttgtttcca + 721 aactgttcat taaaggtttg aatgtaggaa agcaggaagg tattggcttc ttccaaggta + 781 tgaatattgt tttgttccag ttcgataggc aggcgagatt gtagtgtctg attgagtctt + 841 tcgactctcc ctttagcttg agggatagag gttgtctcaa ggagaatccc tagttggtga + 901 caggcgtatc caaactgtgt atgggtatcg tcctccattt tcttagagtt ggaggcttga + 961 taggtaaaga ccgttctctt atctgtttta atttgaaggg gaatgccgtg attggctaag + 1021 atttgttcga ggacatgata gtaagcattc aagttctctt gtttatcaaa ataagcgcct + 1081 aggatattgc cggaagcatc atcaatggct aagtgtaagt tagatgtttg ggctccaaac + 1141 taggcatgag ggctggcatc catttgaatg agttcaccag caaatttctt tctgggtcta + 1201 ctaggatgta cttttttagg gtcttcaagg aagttttcag ccgtcggtaa gattggattg + 1261 tctaggggtt gattcaggtt cagtttagct tgttttctta ctctcttctt tgtctttcta + 1321 tgggacttag gcgacaggat atttttctta tagagtattt ttctaacagt agtatcagag + 1381 agctgaattc cttcttcttc agctagcaat tcacagaaat gaaggacatt tggtttatat + 1441 gtttcatagg agaggtattt ttttaggaga cgttctttga tttcatcagg gattgcatgt + 1501 tttggttttc gatttctgtt tccgtgtctg aaggcttctt ttcctttcag ttgataggct + 1561 agtagcagac gattgatttg tctttcagaa agattgagct cgacacaggc tcgtttcttt + 1621 gttttctttc cttgggctat agcttttatc 
acaagatatt ttttcgtttc attcatattc + 1681 agttggatcc ttttcatatg actattctac caaatgggac attttcacgt tcgatttact + 1741 aaagacatta tcacattcga attacacaag atgcagatag tgaaaaaagg tgtagacatt + 1801 accgtaaaaa agtgatataa tcgtatgatg ttcaaggtat aggtgttaat catgagtaga + 1861 cgttttaaaa aatcacgttc acagaaagtg aagcgaagtg ttaatatcgt tttgctgact + 1921 atttatttat tgttagtttg ttttttattg ttcttaatct ttaagtacaa tatccttgct + 1981 tttagatatc ttaacctagt ggtaactgcg ttagtcctac tagttgcctt ggtagggcta + 2041 ctcttgatta tctataaaaa agctgaaaag tttactattt ttctgttggt gttctctatc + 2101 cttgtcagct ctgtgtcgct ctttgcagta cagcagtttg tgggactgac caatcgttta + 2161 aatgcgactt ctaattactc agaatattcg atcagtgttg ctgttttagc agatagtgag + 2221 attgagaatg ttacgcaact gatgagtgtg acagcaccga ctgggactga taatgaaaat + 2281 attcaaaaac tactagctga tatcaaatca agtcagaata ccgatttgac ggtcaatcag + 2341 agttcgtctt acttggcagc ttataagagt ttgattgcag gagagactaa ggccattgtc + 2401 ttaaatagtg tctttgaaaa tatcatcgaa tcggagcatc cagattacgc atcgaagata + 2461 aaaaagattt ataccaaggg attcactaaa aaagtagaag ctcctaagac gtctaaggat + 2521 cagtctttca atatctatgt tagtggaatt gacacctatg gtcctattag ttcggtgtcg + 2581 cgttcagatg tcaatatcct gatgactgtc aatcgagata ccaagaaaat tctcttgacc + 2641 acaacgccac gtgatgctta tgtaccaatc gcagatggtg ggaataatca aaaagataaa + 2701 ttgacccatg cgggcatcta tggagttgat tcgtccatcc acactttaga aaatctctat + 2761 ggagtggata tcaattacta tgtgcgattg aacttcactt ctttcttgaa attgatcgat + 2821 ttgttgggtg gggtagatgt ttataatgac caagatttta catctctaca tgggaagttc + 2881 catttcccag ttggaaatgt ccacttagat tctgagcagg ctctgggatt tgttcgtgag + 2941 cgctattccc tagcggatgg tgatcatgac cgcgggcgca atcaacaaaa ggtgattgcg + 3001 gccatccttc aaaaattaac ttcgagcgaa gcgctgaaaa attatagtag gatcattgat + 3061 agcttgcaag attctatcca aacaaacatg ccacttgaga ccatgataaa cttggtcaat + 3121 gctcagttag aaagtggtgg aacgtacaaa gtgaattcgc aagacttgaa gggtatggga + 3181 cggacggatc ttccttccta tgcgatgcca gatagtaacc tctatatgat ggaaattaac + 3241 gacagtagcc ttgcatctgt caaaactgct attcaggatg tgttggaggg 
cagatgaaat + 3301 gattgatatt cattcgcaca tcgtctttga tgtagatgat ggtcccaagt caagagagga + 3361 aagcaaggct ctcttggcag aatcctacag gcagggggtg cgaaccattg tctctacctc + 3421 tcaccgtcgc aagggcatgt ttgaaactcc ggaagagaag atagcagaaa actttcttca + 3481 ggttcgggaa atagctaagg aagtggcgag tgacttggtc attgcttacg gggctgaaat + 3541 ttactacaca tcagatgttt tggataagct ggaaaaaaat cggattccga ccctcaataa + 3601 tagtcgttat gccttgatag agtttagtat gaacacccct tatcgcgata ttcatagtgc + 3661 cttgagtaaa atattgatgt tgggaattac tccagtcatt gcccacattg agcgctatga + 3721 tgcacttgaa aataatgaaa aacgcgttcg agagctgatc aatatgggct gttacacgca + 3781 agtaaatagt tcacatgtcc tcaaatccaa actttttgga gaacgttata aattcatgaa + 3841 aaaaagagct cagtattttt tggagcgtga cttggttcat atcattgcaa gtgatatgca + 3901 taatgtggac agcagacctc cccatatggc agaagcatat gaccttgttt cccaaaaata + 3961 cggagaagcg aaggctcagg aactttttat agacaatcct cgaaaaattg taatggatca + 4021 actaatttag gagaaatgat gaaagaacaa aacacgatag aaatcgatgt atttcaatta + 4081 cttaaaacct tgtggaaaca caagctaata attttattag tggcacttgt gacaggggcg + 4141 ggagcttttg catatagcac ttttattgtt aagccagaat atacaagcac cacgcgtatt + 4201 tacgtagtca accgtaatca aggagataag ccgggactga cgaatcagga cttgcaggca + 4261 ggaacttatc tggtaaaaga ctaccgcgaa attatccttt cgcaagatgt attggaaaag + 4321 gtagcgacaa atttgaagtt ggatatgcca gcaaaaacgt taactagcaa agtgcaagtg + 4381 actgtaccag ccgacactcg tatcgtctca atctctgtca aggataaaca accagaggaa + 4441 gccagtcgca ttgctaattc tctacgagaa gttgctgcag aaaagatcat cgctgtaacg + 4501 cgagtatctg atgtaacgac gcttgaagaa gcgcgaccag ctatgactcc ctcttctcca + 4561 aatgttcgac gcaacacctt agttggtttt cttggaggag ccgccgtaac agtaattact + 4621 gttcttttga ttgagttgct cgatacccgt gtaaaacgtc ctgaagatgt tgaagatgta + 4681 ctgcaaatgc cacttctagg agtcgttcca gattttgata aaatgaaata ggaggaagtt + 4741 atgccaacgt tagaaatctc acaggcgaaa ttagaacttg tgaaaaaggc agaggaatat + 4801 tataatgctt tgtgcacgaa cctacagtta agtggagatg atttgaaagt attttctatc + 4861 acttctgtga aagcaggaga aggaaaaaca acgacttcca ccaatatcgc ttgggctttt + 4921 gcgcgtgcag 
gttacaaaac gcttctgatt gatgcagaca tgcgtaactc cgttatgtca + 4981 ggtgtcttta aatcaaggga aaggattact ggactaacag aatttctatc agggacaaca + 5041 gacctgtcac aggggctttg cgataccaat attgagaatc tctttgtgat tcaggctggc + 5101 tctgtgtcac caaatccgac agcccttctt caaagtaaga atttcactac aatgcttgaa + 5161 accttgcgta aatattttga ctatatcgtc gtagacactg cccctgtcgg tgtcgtgatt + 5221 gatgcggcta tcattatgca gaaatgtgat gcttctattt tagtgacgaa ggcaggtgaa + 5281 acaaaacgac gggatcttca aaaagcgaaa gaacagttgg aacaaactgg gaagtcgtgt + 5341 ttaggagttg tgttgaataa actcgatact tcagtagaga aatacggttc ttatgggagt + 5401 tatgggaatt acaggaaaca gaaaaaatag gttgagggat agaaatgagt gaaaaactag + 5461 caaagccttc agtagccata gtccagagtt ttcttgttat tttattgact tatctactta + 5521 gtgctgtgag agaaacggag attgtttcaa caacagctat tgtactttat atcctccact + 5581 attttgtctt ttatatcagt gattatggac ggaatttctt taaaagggga tatttgattg + 5641 aacttgtcca gacattgaaa tatatcctat tctttgcgct agcgattagt atttctaatt + 5701 ttttcttaga agatcgattt agtatttcca gaagaggcat gatttacttc ctcttattac + 5761 atgttttctt agtctatgtg ctaaacccat ttatcaagtg gtattggaag cgggcttatc + 5821 ccaactttaa aggaagtaag aagattctcc tacttacagc aacttctcgt gttgaaaagg + 5881 tactggatag actaatagaa tcagatgatg ttgttgggga gttggtagcc gtcagtgttt + 5941 tagataaacc agattttcag catgatgatt taaaggttgt agcagagggg gagatagtaa + 6001 attttgcgac tcatgaggtg gtcgatgaag tctttatcaa tcttccaagt gaaaaataca + 6061 atattggaga gcttgtctct cagtttgaaa cgatgggaat tgatgtaaca gtcaatctaa + 6121 atgctttcga ttgggcacgt aacaagcaaa tttgtgagat ggcaggacta aatgttgtga + 6181 ctttttctac aacattttat aagactagcc atgtgattgc taagcggatt attgatattg + 6241 tcggttccct ggtaggtttg atattatgtg gtctagtcag tattgtgctg gttcctttga + 6301 ttcgaaagga tgggggttct gctttttttg ctcagacgcg tataggaaaa aatggccgcc + 6361 attttacttt ttataagttt cgctctatgt gtgtggatgc tgaggagaaa aaaagagaac + 6421 tcatggaaca aaataccatg caaggtggaa tgtttaaggt ggacgatgat cctcgtatca + 6481 cgaaaattgg tcattttata cggaagacga gcttggacga gctaccacag ttttataatg + 6541 ttctaaaggg agatatgagt ttggtaggta 
cacgaccacc aacagtggac gagtatgagc + 6601 actatacccc agaacaaaaa cgtcgcctaa gttttaaacc tggcataaca ggtttatggc + 6661 aggtcagcgg acgaagtgaa atcaaaaatt tcgatgaagt tgtcaaatta gatgtggcct + 6721 atattgatgg ttggacaatc tggaaagata ttgaaatttt attgaagaca gttaaggttg + 6781 tattgatgaa ggatggagcg aaatagttca tatgaatgag agaattcaaa tattaggaat + 6841 tactatagat ccattaacga tgaaagaaac agtggatgct gttgaacagt atgttttaaa + 6901 gaagcaccct ttgcacttga tgggagttaa cgcggataaa attaatcagt gctatgaaga + 6961 tgagaaaatc aaaaaaatcg ttaatgaatc aggaataatt aatgccgacg gtgcttcagt + 7021 agttttagcg agtaagtttt taggaacacc agttcctgag cgagttgctg gaatagactt + 7081 gatgaaacat ttactagagt tgtctaatga aaaaggatac tcggtctact tttttggagc + 7141 aaaagaagac gttttacaag atatgttaaa aatttttgaa gaaagatatc cagctctaaa + 7201 tgttgttggc tatagaaatg gatatttttc gcctgaagat gaaaaacata ttcaggaaga + 7261 tattaaagag aaaaaaccag attttgtgtt tgtaggaatt acttctccta agaaagaata + 7321 tattatccaa tcattcatgg ataatggaat taatgctgtg tttatggggg ttggtggaag + 7381 ttttgatgta ctatcagggc atatcaaacg agctccatta tggatgcaaa atgctcacct + 7441 agagtggttg tttcgtgtgg caaatgagcc taaacgtctc tttaagcgtt attttgtagg + 7501 gaatgtttca tttataagaa aagttttaag agcgaaaagg ggatataaac tttgaaccaa + 7561 acagaaatag ttaaattgat tcagaaagtt gaattggatg ctataaaaga gtttcaaaaa + 7621 atttgtaaag agaacaatat agatttcttc cttcgtgggg ggagtgtact tggggcagtc + 7681 aaatatgatg gctttattcc atgggatgat gacatggata ttgctgtgcc tcgtgaaggc + 7741 tacgataaac ttccaggtat ctttaaggat agaattatcg caggcaaata tcaggttctt + 7801 gcttatcaat attgcgatac tttacattgc tactttcctc gcttattcct tttagaagat + 7861 gaaagaaaac gtttgggatt gccacgaaat accaatttag gtttgcattt gattgatatc + 7921 attcctttgg atggtgcccc aaatcattca tttttaagaa agctttactt cggtaaagta + 7981 tactggtatc gttttttagc aagtttagga actacctatg ttggagacca tgtggatatg + 8041 cattccgcta agcaaaaact aatcattggt ttctttaaaa agctaggatt tgcaaaacta + 8101 ttccctcaaa attatgtgta cagacgcttg gataatctct ataaaaagta tgattggaaa + 8161 aagcagaagt atgctgggac aattaatgca tctctgtttg ccaaagaagt 
catgccagta + 8221 gagatttggg gagaaggagt agagaagcct tttgaggatg ccttctttaa agttcccacg + 8281 gagtatgacc gctatctgaa aagactttac ggagaaaact atcttcacga agagcctagt + 8341 gatgatgaaa agaaatcgca tttaggagga caataatttg ttttgttata ttattttgca + 8401 ttacaaagtc ttagaggaaa ctatttcttg tgttaaatca ataaaagaag gcaattccaa + 8461 tacaaagcag atcgttatta ttgataattt ttctaataac ggtacgggtg aaaaactaca + 8521 agagctgtat gagtcagatt cagagattga tgtcttgatt aaccatgaaa atgctggttt + 8581 cgctcgaggt aataatgtag catatcagtt tgctaaggaa aagtacaaac ctgattttat + 8641 ggttatcatg aataatgata ttgagataga aacagaagag tttgaaaaaa tcgtgacaga + 8701 tatctatcgg aaggaaaaat tccatttgtt aggaccagat atcttttcga cgacgtatca + 8761 gcttcaccaa aacccaaaac ggttgacgca ttatacttat gaagaggtta aggctctcaa + 8821 tgaaaaattt aagaaaggga gccaagttag tctagcatta aaaattaaat gttggttgaa + 8881 gtctagtaaa gttcttcgga cagcaatcta tcaaaatagg cgtaaaaaga aatcagtaga + 8941 ctatagaaaa caggtagaaa acccaattct tcatggttcg tttattgtat attctagaga + 9001 ttttattgag aaagaggagt atgcttttaa tcccaatacc ttcttctatt atgaaacaga + 9061 gatattagat tatgaagctg agttaaaagg atataagaga atttatacac cgaagattaa + 9121 ggtcttgcac catcaaaatg ttgcaaccaa tcaagtctat acaaacttag tagaaaaaac + 9181 cttgttttca aacaaatgca actttgaatc cactagttat tttttgaagt tgatgaaaga + 9241 aaacgagggt gtgtaaatga cttatttatt tttactctgc ctgaccttat tcttattaac + 9301 tttcttctat ttttttgctt tcaatcaaga tttgatagct ccgccagttg tcatgtctgt + 9361 tatgtttctc attagttctg tatttgccct tattaatgtg caaaactgga atattgagta + 9421 tagtggttta gcttatcttt tgattattag tggcattatt gttttttcaa tgcctctctt + 9481 ggctcttaat tcgcctagtc taaataccaa gattaaagtg acggatcggc tcattgatat + 9541 ccaattctgg aaaatagctc ttactattat agttgacctc attattctat atctttatag + 9601 gagagagatt cataatcttg cacttagcca tggttatacg ggttcaaatt ttcagtggtt + 9661 ctttagaaat gctaccagtt atgaaggtga gctaacagtg cgaacttcga ttcgggtcct + 9721 cattcgtatc attgacgtat ctgcttatat ttttggatat acttttatta ataatttctt + 9781 catttatagt cataaacgct ctaaagattt actgctctta gttccattct tgatttttat + 9841 ttctaaaacc 
ttattatctg ggggtagatt ggatattata aaaattttaa ttgcgtatgt + 9901 tgtaatggcc tatattcagc aaaaacgaaa agttggctgg gataaggtca tctcccataa + 9961 atatatgaga cttggttttg taggcttgat agctgggatt cctacctttt actattcttt + 10021 attcttatct ggacgttcta cgactagaac tgtatttgaa agtatttcaa cctatttagg + 10081 aggttcgatt cagcatttta atcagtatat tcaaaatcct attggagtag ctgaggtttt + 10141 tggcgatgag tcatttgtag ctattatgaa tattttgggt aatcttggct ttgtcaatta + 10201 caatagtacc gttcacttag aatttcggca gttagggatt actatgggta acgtttatac + 10261 tttctttaga agaccctggc atgactttgg gttagtcggt atgtatatct tttcctttgt + 10321 tgtcggtgtg ttttttgcta ttttttattt gaaattaaga aagagccgtg ctggttttaa + 10381 attggatatt catacaatta tttactctta tttcttttat tggatttttt tatcgtccat + 10441 tgagcaatac tcgtttacaa caatcagttt gtttacactt gtatttatag tcttggttta + 10501 cctaatggct ttcttctatt ggaatttgga tttccacaga ggaaaactag taattaaact + 10561 ctctgacaca agtattaaat cggaaaactg aaaacaataa aaatagagag gatagttgat + 10621 gaatagcaaa attaaaaata tactaactaa tttctcttat gtcatttctt caaatctttt + 10681 gacagtcttg acctcttcct tggttgtctt aattttcccc aaattaatgg gggtaacaga + 10741 gtacagttac tggcaacttt atatttttta tctgacctat atcggttttt tccacttggg + 10801 ttggattgat gggatttatc ttaaatatgg tggcttagaa tataataatt tagatagaaa + 10861 acagttttat tctcagatga ttctattttc tagcttctta atgattatct ccttgctatt + 10921 gtttggttta aatgtattag ctgtaacaga ttcgaatgca cgatatattt ataatatgac + 10981 tattataagt atgataatca caaatttaag aacgctctac gtgtatgttt tgcagatgac + 11041 aaaccgcttg aaggatagtt ccatcattct actcagtgat cgcgttttat atgtgctcct + 11101 tttattcctg tttattgtat ttggttggca tgaatacaag gttatgattt tggcagatat + 11161 tctaggtcga tcattttctc tcatactttc cttctggatt tgtaaagata ttgtgtttca + 11221 gcctttgtca aaattcatct ttaatataaa agagtctttt gataatatcc gagttggtat + 11281 caatttaatg ttatccaaca tcgcaagtag tttgattatc ggtattgttc gtctaggaat + 11341 ccaatggaac tggaatatcg aaacattcgg gaaagtatct ctgaccttga gtgtttccaa + 11401 tctattgatg actttcatta atgccattgg actagtcgtc tttccgctat taagacgaac + 11461 aaaagcagaa 
aacttaccta agatttattc taatttaaga aacgttttga tgcttatcat + 11521 gttcgcgatt ttgctcattt actatccttt aaaaattgta ttagacctct ggttgccagc + 11581 ctatcaagat gccttgattt tcatgaccct tattttccct atgtcagtct atgaagggaa + 11641 aatggcattg gtcattaata cttacttaaa ggcattaaga atggaaagag atatccttag + 11701 agtcaatgcc ttagtaatgt tgatcagtat gggagtgacc ctggttacaa catacctgtt + 11761 aaatagtttg gagctgactg ttgtatcgat agttgttttg ctagctttga gaagtatcat + 11821 agccgaatta attctgtcta aaaaactgga tgtttcggtt aagaaggata ttgtattaga + 11881 atttcttttg acgcttgtct ttatttcttc aagttggtat ttgccgattg ggctggcagt + 11941 aattgtctac acaatagcct acggtttata tctctatttg aaacacgaag atatcaaaac + 12001 ctatttagct tactttaaag ctagtaaaaa aacatcaaat taaaaaatta tataatgatt + 12061 aagtggtaga ttctatttct accgttttag atattcggga ggtaatgatg aaaaaaatta + 12121 tgttagtatt cggtacacgt ccggaagcca tcaaaatgtg tccattagtc aatgagttga + 12181 aaaaacacga agatatggaa acaattgtgt gtgttactgg acaacacaaa gagatggtta + 12241 gtcctgtttt agatttattt ggtgttgtac cagattatga tttagaaatt atgaaggcta + 12301 accaaacctt gttctctatc acaactagta tcttggaaaa gataaaacca gttttagaga + 12361 aggaacaacc agatattgtc ctagttcacg gtgacactac gacaacttat gcagcagcct + 12421 tggcagcatt ctatttggga attaaagtag gacatgttga agctggtttg cgaacgtaca + 12481 atttacaaag tccatttcct gaagaattta acaggcaatc gacatcaatc attgcaactt + 12541 accattttgc tccaactgag ttggctaaag aaaatctctt aaaagaaggt agagagaatg + 12601 tttatgtgac tggaaatact gtcattgatg ctcttacaac tactgttcaa gaggattata + 12661 cacacactca tttagattta aacgctaaca atcgtctcat cttattgact gctcatagac + 12721 gcgaaaatct cggcgaaccg atgagacata tgtttagagc agttaaacga gtattgaatg + 12781 aatacgaaga tgttaaagtc atttatccaa ttcataagaa tcctttggta cgtgaaacag + 12841 ctgcagagat ctttggagat acagaacgga ttcaaattat tgaacctttg gatgttcttg + 12901 atttccacaa cttcatgaac caaagttata tgattttaac agattctggc ggagttcagg + 12961 aagaagcacc ttctttagga aaacctgtat tggttatgcg cgatactact gaaagacctg + 13021 aaggagtagc ggcaggaacc ttgaaattag taggaactga cgaagaaaca atttatcaaa + 13081 acttcaaact 
acttctagat gattctggag aatacaaaaa aatgagtcag gctagcaatc + 13141 catacggtaa tggtgatgct agtcaacaga ttgttcagat tttgcgtggg atttaagaag + 13201 attctctaaa agagtctaag aggaatccac tccacaaaca taaaactctt atgctatcat + 13261 ttatgattga gatagactca taacttaata tttttatcct aagaaaattc gttcatattc + 13321 aatatgaatg aaaaacaacg aagaaaggtt atttcattat gaaaggtatt attcttgcag + 13381 gcggctcagg tacccgcctg tacccactta ctcgggctgc gtcaaaacag ctgatgccgg + 13441 tttatgataa acctatgatt tattatccgt tgtcgacatt aatgttggct ggaattaaag + 13501 atattttgat tatctcaact cctcaagatt tgccccgttt taaggacttg ctcttggatg + 13561 gttccgaatt tgggatcaag ctttcctatg cggaacaacc tagtcccgat ggacttgctc + 13621 aggcttttct tatcggtgaa gaatttatcg gtgacgatag cgttgccttg attttaggcg + 13681 acaatatcta ccatggtcct ggtctgagca caatgcttca aaaagcagcc aagaaagaga + 13741 aaggtgcgac tgtttttggc taccaagtga aggatccaga gcgttttggt gtggttgagt + 13801 ttgatacaga catgaatgct atttctatag aagaaaaacc ggagtatcct cgctccaact + 13861 atgcagtgac aggactgtat ttctatgata atgatgttgt ggagattgct aaacagatca + 13921 aacctagtgc tcgtggcgag ttagaaatta cagacgttaa caaggcttac ctaaatcgtg + 13981 gtgacctttc tgttgagctg atggggcgtg gttttgcctg gttggatacg ggaacccatg + 14041 aaagcttgct agaagcttct cagtatattg aaacggttca gcgtatgcag aacgttcaag + 14101 tggcaaatct agaagaaatt tcctatcgta tgggctacat tagtcgtgaa gacgtgctgg + 14161 aattggctca gcctcttaag aaaaatgaat acggacaata tttgctccgt ttgattggag + 14221 aagcatagat gtcagataat ttttttggaa agacacttgt ggtacgcaag attgatgcta + 14281 taccaggact gctagagttt gatattcccg ttcatggaga caatcgtggt tggtttaagg + 14341 aaaatttcca gaaggaaaag atgctaccgc ttggttttcc tgaaagcttc tttgctgcag + 14401 ggaaactgca aaataacgtc agcttttctc gcaaaaatgt tcttcgagga ctccatgctg + 14461 aaccttggga caagtatatc tctgttgcag acgatgggaa ggttttagga tcttgggtag + 14521 atttgcgtga aggcgagacc tttggaaatg tttaccagac agagattgat gcaagcaagg + 14581 gaatctttgt tcctcgaggc gtagctaatg gcttccaagt tctatcagat acagtgtcat + 14641 atagctatct ggtcaatgat tactgggcgc ttgaactcaa acccaagtat gcctttgtga + 14701 actacgctga 
tccaagcctt ggtattgaat gggaaaatat tgcagaagca gaggtttcag + 14761 aagcagataa aaatcatcca ctacttaagg atgtaaaacc tttgaaaaaa gaagatttgg + 14821 aataaggaaa gaatatgact gaatacaaaa atattatcgt gacaggtgga gctggcttta + 14881 tcggttctaa ctttgtccat tatgtttacg agaactttcc agatgttcat gtgacagtcc + 14941 tagataagtt gacttatgct ggaaaccgcg cgaatattga ggaaatttta ggtaatcgtg + 15001 ttgagttagt tgttggtgac attgctgatg cggagttggt agacaagttg gctgctcaag + 15061 cagatgctat cgttcattat gcagcggaaa gccacaatga taattcgctc aatgatccat + 15121 cgccatttat tcatactaac ttcattggaa cctatactct tttagaagct gctcgtaagt + 15181 atgatattcg cttccaccat gtatcgacag atgaagttta tggggatctc cctttacgcg + 15241 aagatttgcc aggtcatgga gaagggccgg gtgagaaatt tacggctgaa accaagtaca + 15301 atccaagctc gccttactca tcaaccaagg cagcctcaga tttgattgtc aaagcctggg + 15361 tgcgttcttt tggagtcaag gcaacgattt ccaactgttc aaataactac ggtccttatc + 15421 aacatatcga aaaattcatc ccacgtcaga ttactaacat cctaagtgga attaagccaa + 15481 aactttacgg tgaaggtaag aatgttcgtg actggattca taccaatgac cattcttcag + 15541 gagtttggac aatcttgaca aaagggcaaa tcggtgaaac ctacttgatt ggggctgatg + 15601 gtgagaagaa caataaggaa gttttggaac ttatccttaa ggaaatggga caagctacgg + 15661 atgcctatga tcatgtgact gaccgtgcag gacatgacct tcgctatgcg attgatgcca + 15721 gcaagctccg tgaggagttg gggtggaaac ctgaatttac caactttgaa gctgggctca + 15781 aggcaacaat caagtggtat acagataacc aagaatggtg gaaagcagaa aaagaagctg + 15841 ttgaagccaa ttatgctaag actcaggaga ttattacagt ataaaaagca ggaaatagct + 15901 gctttttatt gctatattgg gaagagttac atattagaaa ggtctagaga tgattttaat + 15961 tacaggggca aatggccaat taggaacgga acttcgctat ttattggatg aacgtaatga + 16021 agaatacgtg gcagtagatg tggctgagat ggacattacc gatgcagaaa tggttgagaa + 16081 agtttttgaa gaggtgaaac cgactttagt ctaccactgt gcagcctaca ccgctgttga + 16141 tgcagcagag gatgaaggaa gagagttgga cttcgccatc aatgtgacgg ggacaaaaaa + 16201 tgtcgcaaaa gcatctgaaa agcatggtgc aactctagtt tatatttcta cggactatgt + 16261 ctttgatggt aagaaaccag ttggacaaga gtgggaagtt gatgaccgac cagatccaca + 16321 gacagaatat 
ggccgtacta agcgtatggg ggaagagtta gttgagaagc atgtgtctaa + 16381 tttctatatt atccgtactg cctgggtatt tggaaattat ggcaaaaact tcgtttttac + 16441 catgcaaaat cttgcgaaaa ctcataagac tttaacagtt gtaaatgacc agtacggtcg + 16501 tccgacttgg actcgtacct tggctgagtt catgacctac ctagctgaaa atcgtaagga + 16561 atttggttat tatcatttgt caaatgatgc gacagaagac acaacatggt atgattttgc + 16621 agttgaaatt ttgaaagata cagatgtcga agtcaagcca gtagattcca gtcaatttcc + 16681 agccaaagct aaacgtccgc taaactcaac gatgagcctg gccaaagcca aagctactgg + 16741 atttgttatt ccaacttggc aagatgcatt gcaagaattt tacaaacaag aagtgagata + 16801 agtagtagaa tgattttcta gtctaataaa agaggcagat aatgaactcc aaaggagctt + 16861 aagatgtacg attatcttgt tgttggtgct ggtctctttg gcgcatagct ttggctcagc + 16921 ttctattatc gctcacacca tccatcagaa gtttaatctg aaggtaccca attatcgcca + 16981 agaagaagat tgggctagga tgggtttacc aatcacacgt aaggaaatct ctaattggca + 17041 tatcaaggca agtcaatact atttagagtc cctttataac cttttacgag aaaagttgtt + 17101 agaacaacct cttcttcatg cggatgaaac ctcttatcgg gtgctagaga gtgatagcca + 17161 tctgacctac tattggacct ttttgtctgg gaaagctgag aatcaagcaa tcacgctgta + 17221 ccatcatgat cagcgtcgga gtggtttagt agtacaagaa ttcctaggag attattctgg + 17281 ctatgtgcat tgtgatatgt tgcggcagta acttaggact ttagtcctct agttctgcct + 17341 atgcgatagc agtccaaggt ttaggagcaa ggcgacgcta agcttggtaa actacgaacc + 17401 gctagaagct tatcgtcaac tggaagaagc tgaacttgtt ggatgttggg cgcatgtgag + 17461 aaggaagttt tttgaagcgc cccccaagca agcggataaa tcatcgttag gagctaaagg + 17521 tttagcttat tgtgatcagt tatttgcctt ggaaagagac tgggaggctt tgctagctga + 17581 tgaacgacta cagaaacgtc aagaagagct ccaaccccta atggaagatt tctttgcttg + 17641 gtgccggcgt cagtcagttt tatcgggttc aaaactagga agggcaattg aatacagcct + 17701 caagtataaa gaaacctttc agaccatttt aaaagacgga catctggtcc tttccaataa + 17761 tctagctgaa cgcgccatta aatcattggt tatgggacgg agtaaaagag tccagtggac + 17821 tcttttagcc taagctcagt ttaaaaaagt gagggtggtt attttctcaa aattttgaag + 17881 gagctaaagc aagagctatt attatgagct tattggaaac agctaaacgt catcaactaa + 17941 atagcgagaa 
atatctatcc tatcttctag aatgtcttcc aaacgaggaa actctcgtaa + 18001 acaaagaggt tttagaggct tatttaccat gtactaaagt tgtacaagaa aagtgcaaat + 18061 aagaaatctc cagattagga actatatatg agttctctag tctggagatt tttcaatata + 18121 cttcgttatt ggacggttac gatattcata ttttttgcaa agatgttgtt tgaaaaataa + 18181 ttttcaaaaa ttctgaaaat tctgttgaca actttctgaa aagagtctat aatggagaga + 18241 aagttttaaa ggagaaaatg atgaaaagtt caagactatt tgcccttgcg ggcgtgacat + 18301 tattggcggc gactacttta gctgcatgct ctggatcagg ttcaagcact aaaggtgaga + 18361 aaacattctc atacatttat gagacagacc ctgataacct caactatttg acaactgcta + 18421 aggctgcgac agcaaatatt accagtaacg tggttgatgg tttgctagaa aatgatcgct + 18481 acgggaactt tgtgccgtct atggctgagg attggtctgt atccaaggat ggattgactt + 18541 acacttatac tatccgtaag gatgcaaaat ggtatacttc tgaaggtgaa gaatacgcgg + 18601 cagtcaaagc tcaagac +// + diff --git a/public/res/serotype_genbank/serotype_19B.gb b/public/res/serotype_genbank/serotype_19B.gb new file mode 100644 index 0000000..3eed017 --- /dev/null +++ b/public/res/serotype_genbank/serotype_19B.gb @@ -0,0 +1,971 @@ +LOCUS CR931676 21567 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain nr. 4594 (serotype 19b). +ACCESSION CR931676 +VERSION CR931676.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 21567) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 21567) + AUTHORS Bentley,S.D. 
+ TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..21567 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="nr. 4594" + /db_xref="taxon:1313" + gene <1..133 + /gene="dexB" + /locus_tag="SPC19B_0001" + CDS <1..133 + /gene="dexB" + /locus_tag="SPC19B_0001" + /codon_start=2 + /transl_table=11 + /protein_id="CAI33640.1" + /db_xref="GOA:Q4K100" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K100" + /translation="VNEEQDLTVEGKVKSVLIENTAAKEVLEKQVLAPWDAFCVELL" + gene 293..461 + /gene="aliB" + /locus_tag="SPC19B_0002" + /pseudo + CDS 293..461 + /gene="aliB" + /locus_tag="SPC19B_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(462..979) + /gene="tnp" + /locus_tag="SPC19B_0003" + /pseudo + CDS complement(join(462..521,482..979)) + /gene="tnp" + /locus_tag="SPC19B_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase (fragment)" + gene 1201..2646 + /gene="wzg" + /locus_tag="SPC19B_0004" + CDS 1201..2646 + /gene="wzg" + /locus_tag="SPC19B_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33643.1" + /db_xref="GOA:Q4K0Z9" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K0Z9" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + 
RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VDQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIIDSLQDSIQTNMPLETMIDLVNAQLESGGTYKVNSQDLKGTGRMDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1201..1317 + /gene="wzg" + /locus_tag="SPC19B_0004" + /note="Signal peptide predicted for SPC0983 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 39 and 40" + misc_feature 1405..1752 + /gene="wzg" + /locus_tag="SPC19B_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 6.7e-65" + misc_feature 1930..2373 + /gene="wzg" + /locus_tag="SPC19B_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 5.7e-70" + gene 2648..3379 + /gene="wzh" + /locus_tag="SPC19B_0005" + CDS 2648..3379 + /gene="wzh" + /locus_tag="SPC19B_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33644.1" + /db_xref="GOA:Q4K0Z8" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K0Z8" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTLDALEKLEKKEIPTLNDS + RYALIEFSMHTSYRQIHTGLSNILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLERDLVHVVASDMHNLDSRPPYMQQAYDIIA + KKYGAKKAKELFVDNPRKIIMDQLI" + misc_feature 2651..3259 + /gene="wzh" + /locus_tag="SPC19B_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 1.3e-37" + gene 3388..4080 + /gene="wzd" + /locus_tag="SPC19B_0006" + CDS 3388..4080 + /gene="wzd" + /locus_tag="SPC19B_0006" + /note="member of homology group 2" + /codon_start=1 + 
/transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33645.1" + /db_xref="GOA:Q4K0Z7" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K0Z7" + /translation="MKEQNTLEIDVLQLFRSLWKRKLVILLVAIITSSVAFAYSTFVI + KPEFTSTTRIYVVNRNQEEKSGLTNQDLQAGTYLVKDYREIILSQDVLEEVISDLKLD + LTPKGLANKIKVTVPVDTRIVSVSVNDRVPEEASRIANSLREVAAQKIISITRVSDVT + TLEEARPATSPSSPNIKRNTLIGFLAGGIGTSVIVLLLELLDTHVKRPEDIEDTLQMT + LLGVVPNLSKLK" + misc_feature 3406..3822 + /gene="wzd" + /locus_tag="SPC19B_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 5.3e-53" + misc_feature 3928..4005 + /gene="wzd" + /locus_tag="SPC19B_0006" + /note="PS00217 Sugar transport proteins signature 2." + gene 4090..4773 + /gene="wze" + /locus_tag="SPC19B_0007" + CDS 4090..4773 + /gene="wze" + /locus_tag="SPC19B_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33646.1" + /db_xref="GOA:Q4K0Z6" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K0Z6" + /translation="MPTLEIAQKKLEFIKKAEEYYNALCTNIQLSGDKLKVISVTSVN + PGEGKTTTSVNIARSFARAGYKTLLIDGDTRNSVISGVFKSREKITGLTEFLSGTADL + SHGLCDTNIENLFVIQSGSVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTAPIGIVI + DAAIITQKCDASILVTATGEVNKRDVQKAKQQLEQTGKLFLGVVLNKLDISVDKYGVY + GFYGNYGKK" + gene 4789..6156 + /gene="wchA" + /locus_tag="SPC19B_0008" + CDS 4789..6156 + /gene="wchA" + /locus_tag="SPC19B_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI33647.1" + /db_xref="GOA:Q4K0X4" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K0X4" + /translation="MDEKGLKIFLAVLQSIIVILSVYFLSFVRETELERSSMVILYLL + HFFVFYFSSYGNNFFKRGYLVEFNSTIRYIFFFAIAISVLNFFIAERFSISRRGMVYF + 
LTLEGISLYLLNFLVKKYWKHVFFNLKNSKKILLLTVTKNMEKVLDKLLESDELSWKL + VAVSVLDKSDFQHDKIPVIEKEKIIEFATHEVVDEVFVNLPGENYDIGEIISRFETMG + IDVTVNLKAFDKNLGRNKQIHEMVGLNVVTFSTNFYKTSHVISKRILDICGATIGLIL + FAIASLVLVPLIRKDGGPAIFAQTRIGKNGRYFTFYKFRSMRIDAEAIKEQLMDQNTM + QGGMFKMDNDPRVTKIGRFIRKTSLDELPQFWNVFIGDMSLVGTRPPTVDEYDQYTPE + QKRRLSFKPGITGLWQISGRSKITDFDDVVKLDVAYIDNWTIWKDIEILLKTVKVVFM + RDGAK" + misc_feature 5572..6153 + /gene="wchA" + /locus_tag="SPC19B_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 7e-146" + gene 6160..6903 + /gene="wchO" + /locus_tag="SPC19B_0009" + CDS 6160..6903 + /gene="wchO" + /locus_tag="SPC19B_0009" + /note="member of homology group 33" + /codon_start=1 + /transl_table=11 + /product="putative WecB-family glycosyl transferase" + /protein_id="CAI33648.1" + /db_xref="GOA:Q4K0X3" + /db_xref="InterPro:IPR004629" + /db_xref="UniProtKB/TrEMBL:Q4K0X3" + /translation="MRDRIQLLGLTIDLLTMNETIDIVEQYVLEKRPLHLMGVNADKI + NQCHTDEKIKKIVNESGIINADGASVVLASKFLGTPVPERVAGIDLMQCLLELSNKKG + YSVYFFGAKEEVLQDMLKVFKRDYPNLIVIGHRNGYFSEEDEQAIQEDIREKNPDFVF + IGITSPKKEYIIQKFMDSGVNSVFMGVGGSFDVLSGHIQRAPLWMQKSNLEWLFRVAN + EPKRLFKRYFVGNISFIGKVLKAKRGVKY" + misc_feature 6322..6837 + /gene="wchO" + /locus_tag="SPC19B_0009" + /note="HMMPfam hit to PF03808, Glycosyl transferase + WecB/TagA/CpsF f, score 1.6e-95" + gene 6915..7721 + /gene="wchP" + /locus_tag="SPC19B_0010" + CDS 6915..7721 + /gene="wchP" + /locus_tag="SPC19B_0010" + /note="member of homology group 95" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="CAI33649.1" + /db_xref="GOA:Q4K0X2" + /db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4K0X2" + /translation="MIRLIQKVELDAIKEFKKICEENDIDFFLRGGSVLGAVKYDGFI + PWDDDMDIAVPREAYDKLPSVFKDRIIAGKYQVLTYQYCDTLHCYFPRLFLLEDERKR + LGLPRNTNLGLHLIDIIPLDGAPNHSVLRKIYFGKVYWYRFLASLGTTYVGDHVDMHS + TKQKLIIGFFKKLGFAKLFPQNSVYRRLDNLYKKYDWKKQKYAGTINASLFAKEVMPV + EIWGEGVEKPFEDTFFKVPTEYDRYLKRLYGENYLHEEPSDDEKKSHLGG" + misc_feature 
6972..7661 + /gene="wchP" + /locus_tag="SPC19B_0010" + /note="HMMPfam hit to PF04991, LICD Protein Family, score + 9.7e-110" + gene 7726..8598 + /gene="wchQ" + /locus_tag="SPC19B_0011" + CDS 7726..8598 + /gene="wchQ" + /locus_tag="SPC19B_0011" + /note="member of homology group 43" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33650.1" + /db_xref="GOA:Q4K0X1" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K0X1" + /translation="MFCYIILHYKVLDETISCVKSIKEGNSNEKQIVIIDNFSNNGTG + EKLQELYESDLEIDVLINHENAGFARGNNVAYQFAKEKYNPDFMVIMNNDIEIETEDF + EKIVTDIYHKEKFHLLGPDIFSTTYQLHQNPKRLTHYTYEEVVALNEKFKRGSQLSLT + LKIKCWLKASKVLRTAIYQNRRKKGSVDHRKQVENPILHGSFIVYSRDFIEKEEYAFN + PNTFFYYETEILDYEAELKGYKRIYTPKIKVLHHQNVATNQVYTNLVEKTLFSNKCNF + ESTSYFLTLMEKNE" + misc_feature 7732..8367 + /gene="wchQ" + /locus_tag="SPC19B_0011" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 8.2e-10" + gene 8602..9687 + /gene="wchR" + /locus_tag="SPC19B_0012" + CDS 8602..9687 + /gene="wchR" + /locus_tag="SPC19B_0012" + /note="member of homology group 162" + /codon_start=1 + /transl_table=11 + /product="hypothetical protein" + /protein_id="CAI33651.1" + /db_xref="UniProtKB/TrEMBL:Q4K0X0" + /translation="MMKKILYVTNVDWNWIKQRPQFIAENLSNFYEMLVLYRYWYNRK + GLTEDRNTNITNISRIYALPFVNRSPKLKQLNDKIVAWNIRRKVKAFKPEYVYLTNPM + QFASLVDNSEQKIIYDCMDYHVAFIENREERQRLKDLEEKLVNRANLILVSSEKLREN + IISDYNLEEQVNKIVVVRNGYNGKILSIPTRHKKNNQKLVLAYVGTISHWFDFDIILR + SLKDFDNIEYNLIGPISKADIPEHDRIHYLGSVPHEKIYQYIENADVLIMPFQINDIV + EAVDPVKLYEYINFKKNILTVCYKEILRFEPFVYMYSNYLDYQMNLLQLIENNNLKYD + SIAREDFLKSNTWEKRAELIHQLINQL" + gene 9706..10950 + /gene="wzy" + /locus_tag="SPC19B_0013" + CDS 9706..10950 + /gene="wzy" + /locus_tag="SPC19B_0013" + /note="member of homology group 163" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33652.1" + /db_xref="UniProtKB/TrEMBL:Q4K0W9" + 
/translation="MKRQKFEFIEILYYFTVMLSVGMFLMFTLNLYWHRNLLTILSIA + LSFLMLPILIVNAKRISKSAFIYGTFLSICIIYEILRAKTLYNYSVSNIFLASRQYIW + IFLFFVLIYLFKNKQENMRKILDNTLNIFMFSLGIRAFTWFLYTLFQVELFPSILREF + GDLWYRNEFSVRIDGTPLIIIGLLISTFFYFKFGNRKYFYYLFLILMYITFVNQTRVL + LVSVLISIFLMFVFSRRTSRLLTSLSFVTIIIAFVYGGGLDYIKAYLNIDAGTFDLGL + GFRYWELKYYLGLLANDVWKLGVGILTSSNINSNFILAGPSAVKMYLDDLGFLELFVQ + FGVAAIFMYGYIFYKLINLILRMSNDKYRVDRAFFIALLTNLIITSISLNIFGAQRSF + SLAIVLALIFYYDYRLKNDIEN" + gene 10958..11860 + /gene="wchS" + /locus_tag="SPC19B_0014" + CDS 10958..11860 + /gene="wchS" + /locus_tag="SPC19B_0014" + /note="member of homology group 164" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33653.1" + /db_xref="GOA:Q4K0Y9" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K0Y9" + /translation="MDKVCIVILNYNNYEETIECVQSLRSTIKSNEYDIVIVDNNSVN + DSVKELSKALSPIKIITSLENRGYANGNNIGIKYAEDNGYDYICILNNDTLIEVDFLE + SCKRELENNSFVAFVSPVLVEYKDNNLVQSTGGDIFINRGIVTLKNHGAQRDKLPSKI + ESDYIGGACLMFKTSILKIIGYIPESYFLFYEETEWCYRAKKLGYKNICLTQSYVYHK + GSVSIKAVNGLQEYLMARNRVVFVRRNINSKLKYSAFLFYLFMQQLYHCFLRRDCSKR + KYKYYLDGVFNRIDPSYPFIFISE" + misc_feature 10970..11497 + /gene="wchS" + /locus_tag="SPC19B_0014" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 2.4e-23" + gene 12064..13998 + /gene="rbsF" + /locus_tag="SPC19B_0015" + CDS 12064..13998 + /gene="rbsF" + /locus_tag="SPC19B_0015" + /note="member of homology group 49" + /codon_start=1 + /transl_table=11 + /product="putative phosphotransferase" + /protein_id="CAI33654.1" + /db_xref="GOA:Q4K0Y8" + /db_xref="InterPro:IPR005834" + /db_xref="InterPro:IPR006439" + /db_xref="UniProtKB/TrEMBL:Q4K0Y8" + /translation="MKMFDISQIKTKTVAFDFFDTVVHRNCHPEQILYQWAKEMALEV + NFNISPSILYQIRKSVENNKKLGTEEMCYLDLLSGIYNEIKDKIKNTSKEEFIHRAKI + LELKIELQHIYLDSEIKEVLKKLKSDSKQIILVSDFYTDKELIETVLKKFEIFDYFSS + IYISSEKGCRKSTGNLYKLILKELGLNPIEITMIGDNCKSDYEVPRSLGLNAIYRRYI + DKNSTVSEKELVRLYDQILFSNSKKAPFNIFLADIVFFISELHKKMIQDDVQIALFCS + 
REGQLLKRLFDIYQDTFLRENQKICTEYFYVSRRSTLYSSFTSLENEEFEMIFRQYKK + ITLQNFLLNLNFSNNEITLICQDLNVKPTYVLTVDDHLLENLRKHPQFIKKFNQEKKD + SQLLREYIKHLTKNRNEAYLVDVGWKGTIQDSIKKALPDKRIVGYYLGLMLNVYSVEN + KTDKTGLLFSDYPSKSKFYDIVSRNFGFYEDIFVADHGPVLKYKKESDIIPIIDDDKK + HVSIYQAVKDYQEELVLGFSEILEAYKKMKFLPFEQKNLWLTMSLKKECIYIPKLQSF + SESLKEKVVENFGEIVTLKTTKKSIKTLLREKSDLLWVDFVYRLFGGVNFLFIPELYT + RVIFLLKYLDLKLRLKNYGE" + misc_feature 12094..12717 + /gene="rbsF" + /locus_tag="SPC19B_0015" + /note="HMMPfam hit to PF00702, haloacid dehalogenase-like + hydrolase, score 4.9e-15" + gene 13988..15433 + /gene="wzx" + /locus_tag="SPC19B_0016" + CDS 13988..15433 + /gene="wzx" + /locus_tag="SPC19B_0016" + /note="member of homology group 47" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33655.1" + /db_xref="GOA:Q4K0Y7" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K0Y7" + /translation="MGNKSIKLNALLNIVLTLSNIIFPLITFPYISRILNPNGIGLTS + FFSSIGNYGILLASLGISTYGIKAVASVRDDRDKLSKVVQELMIINVAMSIITTAILL + FMTILITQLNREFSLLLITCGTILSSPFALNWLYSGMEEYTYITTRSVVFKILSLILI + FLLVKRPEDYIVFASISLFSSLSSNILNLWHSRHFINIKLYKNLQFKYHFKPMWYLFA + SLLAVNIYTNLDTVMLGFINGNEAVGYYSVASKVKWILLSLITSISAVLLPRLSFYIS + KNDTSNFIKMLKESSAVIFFIAIPLMVFFIVEAKDSILLLGGSQYLPATLAMQILMPI + LLISGFSNITGNQILIPMNREKYFMVAVTIGAVINLILNLLLMPKFGIIGASVATLFA + ELSQMTVQLHFSKEYLVSNISIKSLVNVIIATVVSIIPLIILNQLITITIPFYSLMLA + GFAFFSLYLVILLLLKEEVTIQLFSLLAKKK" + misc_feature 14003..14812 + /gene="wzx" + /locus_tag="SPC19B_0016" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 3.8e-80" + gene 15497..16582 + /gene="mnaA" + /locus_tag="SPC19B_0017" + CDS 15497..16582 + /gene="mnaA" + /locus_tag="SPC19B_0017" + /EC_number="5.1.3.14" + /note="member of homology group 23" + /codon_start=1 + /transl_table=11 + /product="UDP-N-acetylglucosamine-2-epimerase MnaA" + /protein_id="CAI33656.1" + /db_xref="GOA:O07871" + /db_xref="HSSP:1O6C" + /db_xref="InterPro:IPR003331" + /db_xref="UniProtKB/TrEMBL:O07871" + 
/translation="MKIMLVFGTRPEAIKMCPLVNELKKQADMETVVCVTGQHKEMVS + PVLELFGVQPDYDLEIMKANQTLFSITTSILEKIKPVLEEEQPDIVLVHGDTTTTYAA + ALAAFYLGIKVGHVEAGLRTYNLQSPFPEEFNRQSTSIIANYHFAPTELAKENLTKEG + RNNVYVTGNTVIDALKTTVQKDYTHPDLDLNADNRLILLTAHRRENLGEPMKHMFRAV + KRILNEYDDVKVIYPIHKNPLVRETAAEIFGDIERIQIIEPLDVLDFHNFMNNSYMIL + TDSGGVQEEAPSLGKPVLVMRDTTERPEGVAAGTLKLVGTDEETIYQNFKMLLDDSEE + YKKMSQASNPYGNGDASKQIVRILRGI" + misc_feature 15557..16573 + /gene="mnaA" + /locus_tag="SPC19B_0017" + /note="HMMPfam hit to PF02350, UDP-N-acetylglucosamine + 2-epimerase, score 5.6e-202" + gene 16621..17490 + /gene="rmlA" + /locus_tag="SPC19B_0018" + CDS 16621..17490 + /gene="rmlA" + /locus_tag="SPC19B_0018" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI33657.1" + /db_xref="GOA:Q4K0Y5" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q4K0Y5" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLHRFQELLQDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFISDDSV + ALILGDNIYHGSGLSKMLQKAASKESGATVFGYHVKDPERFGVVEFDQDMKAISIEEK + PEQPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLALAQPLKKN + EYGQYLLRLIGEA" + misc_feature 16624..17340 + /gene="rmlA" + /locus_tag="SPC19B_0018" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 4.9e-120" + gene 17491..18087 + /gene="rmlC" + /locus_tag="SPC19B_0019" + CDS 17491..18087 + /gene="rmlC" + /locus_tag="SPC19B_0019" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI33658.1" + /db_xref="GOA:Q4K0Y4" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:Q4K0Y4" + /translation="MTDKFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + 
MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKHHPLLKDVKPLKKEDLE" + misc_feature 17527..18057 + /gene="rmlC" + /locus_tag="SPC19B_0019" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 8.8e-16" + gene 18097..19146 + /gene="rmlB" + /locus_tag="SPC19B_0020" + CDS 18097..19146 + /gene="rmlB" + /locus_tag="SPC19B_0020" + /EC_number="4.2.1.46" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI33659.1" + /db_xref="GOA:O54546" + /db_xref="HSSP:1KEP" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:O54546" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPDVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAAD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 18112..19068 + /gene="rmlB" + /locus_tag="SPC19B_0020" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.00012" + misc_feature 18115..18855 + /gene="rmlB" + /locus_tag="SPC19B_0020" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 5.4e-77" + misc_feature 18118..18930 + /gene="rmlB" + /locus_tag="SPC19B_0020" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/iso, score 1.4e-05" + gene 19212..20063 + /gene="rmlD" + /locus_tag="SPC19B_0021" + CDS 19212..20063 + /gene="rmlD" + /locus_tag="SPC19B_0021" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI33660.1" + /db_xref="GOA:Q9AH81" + /db_xref="HSSP:1N2S" 
+ /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q9AH81" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAKMDITNEEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 19212..20060 + /gene="rmlD" + /locus_tag="SPC19B_0021" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 4.3e-146" + misc_feature 19215..19856 + /gene="rmlD" + /locus_tag="SPC19B_0021" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.00011" + misc_feature 19215..19844 + /gene="rmlD" + /locus_tag="SPC19B_0021" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 2e-18" + misc_feature 19218..19946 + /gene="rmlD" + /locus_tag="SPC19B_0021" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 3.6e-08" + gene order(20139..21092,21109..21324) + /gene="tnp" + /locus_tag="SPC19B_0022" + /pseudo + CDS join(20139..21092,21109..21324) + /gene="tnp" + /locus_tag="SPC19B_0022" + /note="member of homology group 12" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1670 transposase" + misc_feature 20145..20588 + /gene="tnp" + /locus_tag="SPC19B_0022" + /note="HMMPfam hit to PF03050, Transposase IS66 family, + score 7.7e-05" + /pseudo + gene 21520..>21567 + /gene="aliA" + /locus_tag="SPC19B_0023" + CDS 21520..>21567 + /gene="aliA" + /locus_tag="SPC19B_0023" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33662.1" + /db_xref="UniProtKB/TrEMBL:Q4K1C2" + /translation="MMKSSKLFALAGVTLL" +ORIGIN + 1 tgtcaatgaa gagcaagact tgacagtaga aggaaaagtc aaatctgtct tgattgaaaa + 61 cactgcggct aaagaagtac ttgaaaaaca ggtcttggct ccatgggatg ctttctgtgt + 121 ggaattacta taaatatttt ttgcagaaaa atttaaaatt gaaatcatat aaaaacaagg + 181 gaggactgta taaaagacag 
aaatcctttg ttttttataa ccaaggttta taaactttca + 241 ttctcgaaat tcaattaact ttacaaattc ccactattta aggagaaaga agatgaacat + 301 aaagaagcga gtccttagtg caggcctgac ttttgcatct gctttgcttt tagctgcttg + 361 cggccaatca ggttcagata caaaaactta ctcatcaacc tttggtggaa atccaactac + 421 atttaactat ctattagact attacgctga taacatagtc aattgaaaca agaacaagac + 481 aaaagagcct cataaaaggt atggcaactt ggtaatacct tttacgaggc tttttgatat + 541 gagcccatgt tttctcaata ggattgtact caggtgagta gggaggaaga ggtaaaagtt + 601 tatacccaaa ctcttcacac aagagttcta acttacccat tctatggaat cttgcattat + 661 ccataataat aaccgatggt gtggttaatg ttggtaagag aaacttctga aaccaagctt + 721 caaaaaagtc gctcgtcatc gtctcttcgt aagtcattgg agcgattaac tcaccatttg + 781 ttagacctgc aaccaaagaa atcctctgat atcttcttcc agatacttta cctcttatta + 841 actgaccttt taatgagcga ccatattctc gataaaaata agtatcgaat cctgtttcgt + 901 caatctaaac aggtgctagg tgctttaaac tattaaaatt cttaagaaat aaggctactt + 961 tttctgggtc ttgttcataa ttagattgaa actagaatag tacacctctg cttctaaaac + 1021 attgttagaa atcgatttga ctgtcctgat cgatttgtca tgttcttatt tcattttact + 1081 atatttttgt ttcgcgggaa gtctactaag atacttaaag atgcagatag taaaaaaaat + 1141 gcggacatta ccgtaaaaaa gtgatataat cgtatgatgt tcaaggtata ggtgttaatc + 1201 atgagtagac gttttaaaaa atcacgttca cagaaagtga agcgaagtgt taatatcgtt + 1261 ttgctgacta tttatttatt gttagtttgt tttttattgt tcttaatctt taagtacaat + 1321 atccttgctt ttagatatct taacctagtg gtaactgcgt tagtcctact agttgccttg + 1381 gtagggctac tcttgattat ctataaaaaa gctgaaaagt ttactatttt tctgttggtg + 1441 ttctctatcc ttgtcagctc tgtgtcgctc tttgcagtac agcagtttgt tggactgacc + 1501 aatcgtttaa atgcgacttc taattactca gaatattcaa tcagtgtcgc tgttttagca + 1561 gatagtgata tcgaaaatgt tacgcaactg acgagtgtga cagcaccgac tgggactgat + 1621 aatgaaaata ttcaaaaact actagctgat attaagtcaa gtcagaatac cgatttgacg + 1681 gtcgaccaga gttcgtctta cttggcagct tacaagagtt tgattgcagg ggagactaag + 1741 gccattgtct taaatagtgt ctttgaaaat atcatcgagt cagagtatcc agactacgca + 1801 tcgaagataa aaaagattta taccaaggga ttcactaaaa aagtagaagc 
tcctaagacg + 1861 tctaagaatc agtctttcaa tatctatgtt agtggaattg acacctatgg tcctattagt + 1921 tcggtgtcgc gatcagatgt caatatcctg atgactgtca atcgagatac caagaaaatc + 1981 ctcttgacca caacaccacg tgatgcctat gtaccaatcg cagatggtgg aaataatcaa + 2041 aaagataaat taacccatgc gggcatttat ggagttgatt cgtccattca caccttagaa + 2101 aatctctatg gagtggatat caattactat gtgcgattga acttcacttc tttcttgaaa + 2161 atgattgact tattgggagg ggtagatgtt cataatgacc aagagttttc agctctacat + 2221 gggaagttcc atttcccagt agggaatgtc catctagact ctgagcaagc tctaggtttt + 2281 gtacgtgaac gctactcact agccgatgga gaccgtgacc gtggtcgcaa ccaacaaaag + 2341 gtgattgtgg ctatccttca aaaattaacg tcaaccgaag cacttaaaaa ttatagcacg + 2401 atcattgata gcttgcaaga ttctatccaa acaaatatgc cacttgagac catgatagat + 2461 ttggtcaatg ctcagttaga aagtggtgga acttacaaag tgaattcgca agacttgaaa + 2521 ggtacaggtc ggatggatct tccttcttat gcaatgccag acagtaacct ctatgtgatg + 2581 gaaatagatg atagtagttt agctgtagtt aaagcagcta tacaggatgt gatggagggt + 2641 agatgaaatg atagacatcc attcgcatat cgtttttgat gtagatgacg gccccaagtc + 2701 aagagaggaa agcaaggctc tcttggcaga atcctacagg cagggggtgc gaaccattgt + 2761 ctctacctct caccgtcgca agggcatgtt tgaaactccg gaagagaaga tagcagaaaa + 2821 ctttcttcag gttcgggaaa ttgcaaaaga agtagcagat gatttagtca ttgcttatgg + 2881 cgcagagata tactatactc tggatgctct agaaaagcta gaaaaaaaag aaattcctac + 2941 ccttaatgat agtcgttatg ctttgattga gtttagcatg catacttcct atcgtcagat + 3001 tcatacggga ttgagcaata ttttgatgtt gggaatcaca ccagtaattg ctcatattga + 3061 acggtatgat gctttagaga ataacgaaaa acgtgttcgt gaactgattg atatgggctg + 3121 ttacacgcaa gtaaatagtt cacatgtcct caaacccaaa ctttttggcg aacgttataa + 3181 attcatgaaa aaaagagctc agtatttttt ggaacgtgat ttagttcatg tagttgcaag + 3241 tgacatgcac aatttagaca gtagacctcc atatatgcaa caggcatatg atatcattgc + 3301 taagaaatat ggagcgaaaa aagcgaaaga actttttgta gataatccca gaaaaattat + 3361 aatggatcaa ttaatttagg agaaaatatg aaggaacaaa acactttgga aatcgatgta + 3421 ttgcaactat tcagatcttt atggaaaaga aagttggtca ttttattagt ggcaattata + 3481 acttcttcag 
ttgcttttgc ctacagtact tttgttatca aacctgagtt tactagtacg + 3541 actcggattt atgtagttaa ccgtaatcag gaagagaagt ctggtttaac caatcaagac + 3601 ttgcaggcag gaacttatct ggtaaaagac taccgtgaga ttatcctttc gcaggatgtt + 3661 ttggaggaag ttatttctga tttgaaacta gatttgacgc caaaaggttt ggctaataaa + 3721 attaaagtaa cagtaccagt tgatacccgt attgtctctg tttcagttaa tgatcgagtt + 3781 cctgaagagg caagccgtat cgctaactct ttgagagaag tagctgctca aaaaattatc + 3841 agtattactc gtgtttctga tgtgacaaca ctggaggagg caagaccggc gacatcaccg + 3901 tcttcgccaa atattaaacg caatacacta attggttttt tggcaggggg gattggaact + 3961 agtgttatag ttcttcttct tgaacttttg gacactcatg tgaaacgtcc ggaagatatc + 4021 gaagatacac tgcagatgac acttttggga gttgtaccaa acttgagtaa gttgaaatag + 4081 gagagaggaa tgccgacatt agaaatagca caaaaaaaac tggagttcat taagaaggca + 4141 gaagaatatt acaatgcctt gtgtacaaat atacagttga gcggagataa actaaaagta + 4201 atttccgtta cttctgttaa ccctggggaa ggaaaaacaa ctacttccgt aaatatagca + 4261 aggtcgtttg cgcgtgcagg ctataaaact cttttgatcg atggcgatac tcgaaattca + 4321 gttatatcag gagtttttaa atcgcgtgaa aaaattacag ggctaacaga atttttatct + 4381 gggacagctg atttatctca cggtttatgt gatacaaata ttgaaaattt atttgtaatt + 4441 caatcgggat ctgtatcacc aaaccctaca gccttgttac aaagtaaaaa ttttaatgat + 4501 atgattgaaa cattgcgtaa atattttgat tatatcattg ttgatacagc acctattgga + 4561 attgttattg atgcggcaat tatcactcaa aagtgtgatg cgtccatctt ggtaacagca + 4621 acaggtgagg tgaataaacg tgatgtccaa aaagcgaaac aacaattaga acaaacaggg + 4681 aaactgttcc taggagttgt tttaaataaa ttggatatct cggttgataa gtatggagtt + 4741 tacggtttct atggaaatta tggtaaaaaa taacttagga aagattttat ggatgaaaaa + 4801 ggattgaaaa tttttctggc agtattacag agtattattg tcattttatc ggtttatttt + 4861 cttagctttg ttagagagac agaacttgaa cgttcttcga tggttatact ataccttctc + 4921 cacttttttg tattctattt tagttcctat ggtaacaatt tttttaaaag agggtaccta + 4981 gttgagttta atagtactat aagatatatt tttttctttg caatagctat aagtgtatta + 5041 aactttttta tagcggaacg gtttagtatc tctagaagag gaatggtata cttcttaact + 5101 ttagaaggga tatccttata cttgttaaat 
ttcttagtaa agaaatattg gaagcatgtg + 5161 ttttttaatc taaaaaatag caagaaaatt ttactgttaa cagtaacgaa aaatatggaa + 5221 aaagttcttg ataaattgct agaatctgat gaactttcat ggaaattggt agcagtaagt + 5281 gttttggata aatctgattt tcaacatgat aaaatacctg taattgaaaa ggaaaaaatt + 5341 attgaatttg caacgcatga agttgtggat gaggtgtttg tcaatcttcc aggagagaac + 5401 tacgatattg gagaaattat ctctaggttt gagacaatgg ggatagatgt aactgtaaat + 5461 cttaaagcat ttgataagaa tttgggtcgc aataaacaaa ttcatgagat ggtaggattg + 5521 aatgtagtca ctttctctac aaatttttat aaaactagtc atgtgatttc aaagagaatt + 5581 ctcgatattt gtggtgccac tattggcctt attctttttg ctatagctag tctagtttta + 5641 gttccattga ttcgtaaaga tggcggacca gctatttttg ctcagacgcg tatagggaaa + 5701 aatggtcgat attttacctt ttataaattc cgttcgatgc ggatcgatgc tgaagctata + 5761 aaagaacaat tgatggatca aaatacgatg caaggtggta tgtttaagat ggacaatgat + 5821 cctcgtgtta caaaaattgg tcgctttatt cgtaaaacca gtttagatga gttaccccag + 5881 ttttggaatg tctttatagg agatatgagt ttggtgggaa cacgtccacc tacagtagat + 5941 gagtatgatc agtatactcc agaacagaaa cgtcgactca gctttaaacc tggtattaca + 6001 ggcttatggc agattagtgg ccgaagtaaa ataaccgatt ttgacgatgt tgtaaaatta + 6061 gatgtggctt atattgataa ttggacaatt tggaaagata ttgaaatttt gcttaaaact + 6121 gttaaagttg tatttatgag agatggagcg aagtgaggaa tgagggatag aatccaactt + 6181 ttaggtttaa caattgatct gcttacgatg aatgaaacga tagatattgt agaacaatat + 6241 gtattagaaa aaagaccact acacttgatg ggcgtgaatg ctgataaaat taatcagtgc + 6301 catacagatg agaaaatcaa aaaaatcgtt aatgagtcag gaatcattaa tgcggatgga + 6361 gcatcagttg ttcttgcaag taagttttta ggaacgcctg ttcctgaacg agtagcgggt + 6421 attgatttga tgcaatgtct tttagagttg tcaaataaaa aaggatattc agtttacttt + 6481 tttggagcaa aagaagaagt tttgcaagat atgctcaaag tatttaagag agattatcca + 6541 aatttgatag ttattggaca cagaaatggc tatttttctg aagaggatga acaagctatt + 6601 caagaagata ttcgtgaaaa gaaccctgat tttgtgttta ttggaattac gtctcctaaa + 6661 aaagaatata ttattcaaaa atttatggat agtggcgtca attcggtatt tatgggagtt + 6721 ggcggtagtt ttgatgtctt gtctggtcat atccaacgag cacctctatg 
gatgcaaaag + 6781 tcaaatttag agtggttatt ccgtgtagct aatgagccta aacgtctctt taaacgttat + 6841 tttgtaggga atatttcatt cataggaaaa gttttaaaag caaaaagagg tgtaaaatat + 6901 tgaaccagac agagatgatt cgcttaattc aaaaagttga attagatgct ataaaagagt + 6961 ttaaaaaaat ctgtgaagag aatgatatag attttttcct ccgcggtggt agtgtacttg + 7021 gtgcagtcaa atacgacggc tttattccat gggatgatga tatggatatc gctgtccctc + 7081 gtgaagcata cgacaaactt ccaagtgttt tcaaagatag aattatcgct gggaaatatc + 7141 aggttcttac ttatcaatac tgtgatacgt tgcattgcta ctttcctcga ctatttcttt + 7201 tagaagatga aagaaaacgt ttgggcttgc cacgaaatac caatctggga ttgcatttga + 7261 ttgatatcat tcctttagat ggagcaccaa atcattcggt tttaagaaag atttactttg + 7321 gtaaagtata ctggtatcgt tttttagcaa gtttaggaac aacttatgtt ggcgaccatg + 7381 tggatatgca ttccactaag caaaaactaa ttattggttt ctttaaaaaa ctaggatttg + 7441 caaaactatt tcctcaaaat tctgtataca gacgcttgga taatctctat aaaaagtatg + 7501 attggaaaaa gcagaagtat gctgggacta tcaatgcttc tttatttgcc aaagaagtta + 7561 tgccagtaga gatttgggga gaaggagtag agaagccttt tgaggatacc ttctttaaag + 7621 ttccaacgga gtatgatcgc tacctgaaaa gactttacgg agaaaactat cttcacgaag + 7681 agccgagtga tgatgaaaag aaatcgcatt tagggggata aaaatttgtt ttgttatatt + 7741 attttacatt acaaagtctt agatgaaact atttcttgtg ttaaatctat aaaagaaggc + 7801 aattccaatg aaaagcaaat cgttattatt gataattttt ctaataatgg tacaggtgaa + 7861 aaactacaag agctttatga atcagattta gagattgatg tattgattaa ccacgaaaat + 7921 gctggatttg ctcgaggaaa taatgtagct tatcaatttg ctaaggaaaa gtataacccc + 7981 gatttcatgg ttatcatgaa taacgatatt gagatagaaa cagaagattt tgaaaaaatc + 8041 gtgacagata tctatcacaa agaaaaattt catttgctag ggccagacat tttttcgaca + 8101 acatatcagc tacatcaaaa tcctaaacgc ctgacacatt atacttatga agaggtagtg + 8161 gctctcaatg aaaaatttaa aagagggagc caacttagtc taactttaaa aatcaaatgt + 8221 tggttgaaag ctagcaaagt tcttcgaaca gcaatctatc aaaatagacg taaaaaagga + 8281 tcagtagacc atagaaaaca ggtagaaaac ccgattcttc atggttcctt tattgtatat + 8341 tcgagagatt ttattgaaaa agaggagtat gcttttaacc ctaatacctt cttttactat + 8401 gaaacagaga 
tattagatta tgaagctgag ttaaaaggat acaagagaat ttatacaccg + 8461 aagattaagg ttttacacca tcaaaatgtg gcaacaaatc aggtttatac aaacttagta + 8521 gaaaaaactt tgttttcaaa caaatgcaac tttgaatcca ctagttattt tttaacttta + 8581 atggagaaaa atgaataaaa aatgatgaaa aaaattttat atgtgacaaa tgttgattgg + 8641 aattggataa aacaacgtcc acaatttatt gcagaaaact tatctaattt ttatgagatg + 8701 ctagttctgt atcgctattg gtacaataga aaaggattga ctgaggatag aaatactaac + 8761 attacaaata tatcacgtat ttatgcccta ccttttgtta ataggtcacc gaaactaaag + 8821 caactgaatg ataaaattgt tgcttggaat attcgaagaa aagttaaggc ttttaaaccg + 8881 gaatatgtat atttgacaaa tccaatgcag tttgcatctc ttgtagacaa ttcagaacaa + 8941 aaaataatat atgattgtat ggattatcat gtggctttta tagaaaatag agaagaacgt + 9001 cagcgattaa aggatttaga agagaaactg gtcaatagag ctaatttaat cttggtttcg + 9061 agtgagaaac taagagaaaa tattatttct gattataact tggaagagca ggttaataaa + 9121 atagtggttg ttagaaatgg ttataatggt aaaatcttaa gcattcctac tcggcataaa + 9181 aagaataacc aaaagcttgt acttgcatat gttggaacta tcagtcattg gtttgacttt + 9241 gatatcattt tacgaagttt aaaagatttt gataatattg aatataattt gattggtccg + 9301 attagcaaag ctgatattcc tgaacatgat agaattcatt atttaggaag tgtaccacac + 9361 gagaagattt atcagtatat tgagaatgca gatgttctga ttatgccgtt tcaaattaat + 9421 gatattgttg aagcagtgga tccagtcaag ttgtatgaat atattaattt taaaaaaaat + 9481 atacttacgg tatgttataa ggaaattctg agatttgaac catttgtata catgtattca + 9541 aattatttag attaccaaat gaatttgttg caattgattg aaaataataa tttgaaatat + 9601 gacagtatag ctagagaaga ttttttgaaa agtaatactt gggaaaaaag agcggagctg + 9661 attcatcagc tgattaacca attgtaattt tttatggaga gatgaatgaa gagacagaag + 9721 tttgaattta tagagattct atactatttt acagtgatgt tatcagtggg aatgtttctt + 9781 atgtttaccc tcaacttata ttggcacaga aacttattaa ctattttatc tattgctctc + 9841 tcatttttaa tgcttcctat actgattgtt aatgctaaaa gaatttctaa atctgctttt + 9901 atctatggta cttttttatc tatatgtatt atatatgaga tattaagagc taaaacactg + 9961 tataattaca gtgtgagtaa tatttttttg gcctctagac aatatatatg gatttttcta + 10021 ttttttgtat tgatttacct ttttaaaaac 
aaacaagaaa atatgagaaa aattttagat + 10081 aatacactca atatttttat gttttctctc ggaattagag catttacttg gtttttatat + 10141 acgttatttc aagttgaatt atttccatct attttaagag aattcggaga tttgtggtat + 10201 cgaaatgaat tttcagtacg aatagatgga acaccattaa ttataatagg tttgttaatt + 10261 tccacttttt tctattttaa atttggaaat aggaaatact tttattattt gttcttgata + 10321 ttaatgtata taacatttgt aaatcagaca agagtgctac tggtttctgt tttgatttca + 10381 atttttctta tgtttgtatt ttctagaaga acttctagat tgctcacctc tttaagtttt + 10441 gtaactataa ttatagcatt cgtttatgga ggtggattgg attatattaa agcatattta + 10501 aatatagatg ctggaacatt tgatctggga ttaggattta gatactggga gttgaaatac + 10561 tatctgggtt tattagctaa tgatgtatgg aaacttgggg ttggaattct aacatcaagt + 10621 aatataaata gtaattttat tttggctggg ccaagtgctg ttaagatgta tctagatgat + 10681 ttaggttttt tagagttatt cgttcaattt ggtgtagccg caatttttat gtatggttat + 10741 atattttata aattaatcaa tttaattcta agaatgtcaa atgataaata tagagttgac + 10801 cgcgcctttt ttattgcact cttaactaat ttaataatta cttcaatttc tttaaatatc + 10861 tttggagcgc agagaagttt ctcattggca attgttcttg cattaatatt ctactatgac + 10921 tataggctga aaaatgacat agaaaattag gtgtataatg gataaagtat gtatagttat + 10981 tctcaattat aataattatg aagaaacgat tgagtgtgta caaagtttga gaagtactat + 11041 aaaatcaaat gagtatgaca tcgtgattgt agataataat tcggtgaatg atagtgtcaa + 11101 agagttatcc aaggcgttat cccctattaa gattattact agtttagaaa atagaggata + 11161 tgcgaatgga aacaatattg gaataaagta tgctgaggat aatggatatg attacatttg + 11221 tatattaaac aacgatacat taattgaggt tgattttttg gaatcgtgta aacgagaact + 11281 agaaaataat tccttcgttg cctttgttag tccagtgtta gttgaatata aagataataa + 11341 cttggtacaa tctacaggtg gtgatatttt tattaatagg ggaattgtaa ctttaaaaaa + 11401 tcatggtgct cagagagaca aacttccttc taaaatcgaa agtgactata ttgggggagc + 11461 atgtttgatg ttcaaaacct ctatcttgaa aattattgga tatatacctg aaagttactt + 11521 tctattttat gaagaaactg aatggtgtta tagggctaaa aaattaggct ataagaatat + 11581 atgccttact caaagttatg tgtatcataa aggttcggtc tctataaaag cggtcaatgg + 11641 acttcaagaa tatttaatgg caagaaatag 
agttgtattt gttcgtagaa atataaatag + 11701 caaactaaag tattctgctt ttttgttcta tttattcatg caacaacttt atcattgctt + 11761 cttgcgaagg gattgttcta aaagaaagta taaatattat ttagatggtg tatttaatag + 11821 aattgatcca tcctatccat ttattttcat aagcgaataa gttactactt ataactgtag + 11881 atgcactaag ataattatag tagactgaat ctaaaatagt acgaaataat tgctaaaaca + 11941 tttatagaaa ttaattttac tttcctaatc gatttgttct tatcttattt caatctgcta + 12001 tagattaaat aagtgaagaa agtggtcatt ataggaacat aatttaacat agttaggtga + 12061 aacatgaaaa tgtttgatat atctcaaata aaaacaaaaa cagttgcatt tgattttttt + 12121 gatactgttg tgcataggaa ttgtcatcct gagcaaattt tgtatcagtg ggctaaggaa + 12181 atggctttgg aggtgaattt caatatatct ccttcaatat tatatcaaat cagaaaaagt + 12241 gtcgaaaaca ataaaaagtt aggcactgaa gaaatgtgtt atctagacct tttgtctgga + 12301 atatataatg aaattaaaga taagataaaa aatacatcga aagaagagtt tattcataga + 12361 gctaaaattc tagagttgaa aattgaatta caacatattt atttggattc ggaaattaaa + 12421 gaagttttaa aaaaattgaa aagtgattca aaacagatta tcttagtttc tgatttttat + 12481 actgataaag aattaataga aactgtatta aaaaagtttg aaatttttga ttatttctct + 12541 tctatctata tttcgagtga gaaaggttgc cgtaaatcca caggaaattt atataagtta + 12601 attttaaaag aattaggctt aaatcctata gaaattacca tgataggaga taattgtaaa + 12661 tctgattatg aagtgccgcg ttctctagga ttaaatgcta tttatagacg atatatagat + 12721 aaaaattcaa cagtgtcaga gaaagagttg gtaagactct atgatcaaat tttattttct + 12781 aacagtaaaa aagcaccgtt taatattttt ttagctgaca tcgtattttt tatttcggaa + 12841 ttgcataaaa agatgattca ggatgatgtt caaatagcac tcttttgctc aagagaagga + 12901 cagttattga aaagactttt tgatatatat caagatactt ttttgagaga aaatcaaaag + 12961 atttgtacag aatattttta tgtttctaga cgatcgacat tatattcttc ttttacttct + 13021 ttagagaatg aagaatttga gatgatcttt cgtcaatata aaaaaattac gttacaaaat + 13081 ttcttattaa acttgaactt ttctaataat gaaatcacat tgatttgtca agatttaaat + 13141 gtgaaaccta catatgtatt aacagtagac gatcatttat tagagaacct aagaaaacac + 13201 cctcagttta ttaagaagtt caatcaagag aaaaaagata gccaattact acgtgagtat + 13261 attaagcatt taacaaaaaa ccgaaatgag 
gcatatttag ttgatgtagg ttggaaagga + 13321 acgatacaag atagtatcaa aaaggctctt ccagacaaga gaatagtagg atattatcta + 13381 ggattgatgc tcaatgttta ttcagtagaa aataaaacgg ataaaactgg tttattattt + 13441 tctgattatc caagtaaatc gaaattttat gatattgtga gtagaaattt tggtttttat + 13501 gaagatattt ttgtagcaga tcatggtcca gttttgaaat ataaaaaaga gagtgatatt + 13561 atccccatta ttgacgatga taagaaacat gtgagtattt atcaggcagt taaagattat + 13621 caagaagagt tagtattagg attttcagaa attttggaag cttataagaa aatgaagttt + 13681 ctcccttttg aacaaaaaaa tctgtggcta acgatgtcgc taaaaaaaga atgtatttat + 13741 atacctaagt tacaatcatt ttctgaatct ttaaaagaaa aagttgttga aaattttggt + 13801 gagatagtaa ctcttaagac tacgaaaaaa tctataaaaa cgttattaag agagaaaagc + 13861 gatttacttt gggttgattt cgtttataga ttgtttggtg gtgtcaattt cctatttatt + 13921 ccagaattat atacaagagt tatattttta ttgaaatatt tagatttgaa attgaggttg + 13981 aaaaattatg gggaataaat ccataaagtt gaatgcatta ttaaatattg tcctgacgct + 14041 atcaaatatc attttcccat taatcacttt tccttatata tctagaatat tgaatccaaa + 14101 tggtataggt ttaacttcat tttttagttc aatagggaat tatggtattt tacttgcttc + 14161 tctgggaatt tcaacttatg gtatcaaagc agtagcaagt gttagagatg atagagataa + 14221 gttgtcaaaa gtagtacagg agttaatgat tataaacgtt gctatgtcta taataacaac + 14281 tgcaatacta ttatttatga ctatacttat aacacaattg aatagagaat tttcactcct + 14341 attgatcaca tgtgggacta ttttatcttc tcctttcgcc ttaaattggt tgtatagtgg + 14401 aatggaagaa tatacgtata ttactactag gtcagtagtg tttaaaattc tatcattaat + 14461 attgattttt ctacttgtga aaaggccaga ggattatatt gtttttgcta gtatttcatt + 14521 gttttcttct ctaagttcaa atatcttaaa tctatggcat agccgacatt tcattaatat + 14581 taaattatat aaaaatttac aatttaaata tcattttaaa ccaatgtggt atttatttgc + 14641 ctcattactt gcagtaaata tttatactaa tttagataca gtgatgctcg gttttattaa + 14701 tggtaatgag gctgtgggat actattctgt ggcatcaaag gttaagtgga ttttgctttc + 14761 tcttattaca tctattagtg cagttttgct accgagactt tcattttata ttagtaaaaa + 14821 tgacacctcg aattttataa aaatgttaaa ggagtcatct gcggttatat tttttattgc + 14881 gattccattg atggtattct ttattgtaga 
ggcgaaagat agtatcttat tactaggagg + 14941 aagtcagtat cttcctgcga ctttagcgat gcaaatactt atgccaattt tacttatttc + 15001 tggtttctcg aatattacag gaaatcaaat attgattcca atgaatagag aaaaatattt + 15061 tatggttgca gtaacgattg gtgctgtgat taatcttatt ttgaatctac tgttaatgcc + 15121 taagtttgga attattggtg cttctgtcgc aactcttttt gcggaattgt cgcagatgac + 15181 ggtacaatta catttttcaa aagaatattt agtatcaaat atatcgataa agagtttggt + 15241 taatgtgata attgcaacag ttgtttctat aataccacta atcattttga atcagctgat + 15301 aacgataact ataccatttt attctctaat gctagcaggt tttgctttct tttcattata + 15361 tttagtaatt ctgcttttat taaaggagga agtgacgatt caattatttt ctcttcttgc + 15421 aaagaagaag taaattggtc agaaattgaa atgtataaac aaataaataa tttaattatt + 15481 aattgaggag gaaatcatga agataatgct agtttttggt acacgtccag aagcgataaa + 15541 aatgtgtcca ttagtgaatg agttgaaaaa acaggcagat atggaaacag ttgtttgtgt + 15601 aactggtcaa cacaaggaga tggttagccc tgttttggaa ttgtttggag ttcaaccaga + 15661 ttatgattta gaaattatga aagctaatca aaccttgttt tctataacaa caagtatttt + 15721 agaaaaaatt aaacctgttt tagaagaaga acaaccagat attgttctag ttcacggtga + 15781 cactactacg acatatgcag cagctttggc agcattttat ctaggaatta aggttggtca + 15841 tgttgaagct gggttacgaa cttacaacct gcaaagtccc ttcccagaag aatttaatag + 15901 acaatcgact tctattattg caaattatca ttttgcccct acagaattag ctaaagaaaa + 15961 tctaacaaaa gagggtagaa acaatgttta tgtgacaggt aatacggtaa ttgatgcact + 16021 taaaactaca gtacaaaagg attatacaca ccctgattta gatttaaacg ctgataatcg + 16081 tctcattcta ttgactgctc atagacgtga aaatctcgga gaacctatga aacacatgtt + 16141 tagagctgtt aaacgaattt taaatgaata tgacgatgtt aaggtaattt atccaattca + 16201 taagaatcct ttggttcgtg aaacagctgc ggaaattttt ggagacatag aacgaattca + 16261 gattattgaa cctttagatg ttctggattt tcataacttt atgaataata gttacatgat + 16321 tttaactgac tcaggaggag ttcaggaaga agcgccttcg ttaggaaagc ctgtattggt + 16381 catgcgagat acgacagaaa gacctgaagg agtagctgct ggaacgttga aattggttgg + 16441 gactgatgag gagactattt atcaaaattt taagatgctt ttagacgatt ccgaagaata + 16501 taaaaaaatg agtcaagcta gtaatcctta 
tggaaatggt gatgctagta aacagattgt + 16561 tcgaatttta cgtggaattt gagtgtgttt agataaagta atacagaaag gtaccctact + 16621 atgaaaggta ttattctagc aggtggttcg gggactcgct tgtatccttt gactcgcgct + 16681 gcatcaaaac aactgatgcc ggtttatgat aaacccatga tttactaccc actttcaaca + 16741 ttgatgttgg ctggaattag ggatattttg attatttcca ctccacagga tttacatcga + 16801 tttcaagagc ttcttcaaga cggatctgag tttgggatca aactttctta tgcagagcaa + 16861 ccaagtccag atggtttggc acaagccttt atcattgggg aagagtttat ttctgatgat + 16921 agcgttgcgc taatcttagg tgataatatc tatcacggtt ctgggctttc caagatgcta + 16981 caaaaggcag cgagtaagga gtcgggagca actgtttttg gctaccacgt caaggatcca + 17041 gagcgctttg gtgtggttga gtttgatcag gatatgaagg ctatttctat tgaagaaaag + 17101 ccagagcaac ctcgttcaaa ctatgcagtg acaggactct atttctatga taatgatgta + 17161 gtagagattg ccaaaagtat taaaccaagt cctcgtggtg aattggaaat tacagatgtc + 17221 aacaaggctt acttggatcg tggtgatttg tctgttgagc tcatgggacg tggttttgct + 17281 tggttggata ctggcactca tgaaagttta ctagaggctt cgcagtacat cgaaacagtc + 17341 caacggatgc aaaatgttca ggtagcaaac ttagaagaaa ttgcttaccg tatgggctat + 17401 atcagtcgag aagatgtatt ggccttagcc caaccactta agaaaaatga atacggacag + 17461 tatctgctcc gtttgattgg agaagcatag atgacagata agtttttcgg taagacgctt + 17521 gcggcacgca aggttgaagc tattccaggc atgttggagt ttgatatccc cgttcatgga + 17581 gataatcgtg gctggtttaa agaaaatttc caaaaggaaa aaatgcttcc acttggattt + 17641 ccagagtctt tctttgcaga aggaaaattg caaaacaatg tatccttctc acgtaaaaat + 17701 gtccttcgag gcctccacgc agagccttgg gataagtaca tctctgtagc agatggaggg + 17761 aaagttctgg gttcttgggt tgatctacgc gagggtgaaa cctttgggaa tacctatcag + 17821 acagtgattg atgcgagtaa gggaatcttt gttcctcgag gcgtagctaa tggcttccaa + 17881 gttttatcag atacagtgtc atatagctat ctggtcaatg attactgggc gcttgaactc + 17941 aaacccaagt atgcctttgt gaactacgct gatccaagcc ttggtattga atgggaaaat + 18001 attgcagaag cagaggtttc agaagcagat aaacatcatc ccctacttaa ggacgtgaag + 18061 cctttgaaaa aagaagattt ggaataagga aagaatatga ctgaatacaa aaatattatc + 18121 gtgacaggtg gagctggctt tatcggttct 
aactttgtcc attatgttta cgagaacttt + 18181 ccagatgttc acgtgacagt cctagataag ttgacttatg ctggaaaccg cgcgaatatt + 18241 gaggaaattt taggtaatcg tgttgagtta gttgttggtg acattgctga tgcggagttg + 18301 gtagacaagt tggctgctca agcagatgct atcgttcatt atgcagcgga aagccacaat + 18361 gataattcgc tcaatgatcc atcgccattt attcatacta acttcattgg aacctatact + 18421 cttttagaag ctgctcgtaa gtatgatatt cgcttccacc atgtatcgac agatgaagtt + 18481 tatggggatc tccctttacg cgaagatttg ccaggtcatg gagaagggcc gggtgagaaa + 18541 tttacggctg aaaccaagta caatccaagc tcgccttact catcaaccaa ggcagcctca + 18601 gatttgattg tcaaagcctg ggtgcgttct tttggagtta aggcaacgat ttccaactgt + 18661 tcaaataact acggtcctta tcaacatatc gaaaaattca tcccacgtca gattactaac + 18721 atcctaagtg gtatcaagcc aaaactttac ggtgaaggta aaaacgttcg tgactggatt + 18781 cataccaatg accattcttc aggagtttgg acaatcttga caaaagggca aatcggtgaa + 18841 acctacttga ttggggctga tggtgagaag aacaataagg aagttttgga acttatcctt + 18901 aaggaaatgg gacaagctgc ggatgcctat gatcatgtga ctgaccgtgc aggacatgac + 18961 cttcgctatg cgattgatgc tagcaagctc cgtgatgagt tggggtggaa acctgaattt + 19021 accaactttg aagctgggct caaggcaaca atcaagtggt atacagataa ccaagaatgg + 19081 tggaaagcag aaaaagaagc tgttgaagcc aattatgcta agactcagga gattattaca + 19141 gtataaaaag caggaaatag ctgcttttta ttgctatatt gggaagagtt acatattaga + 19201 aaggtctaga gatgatttta attacagggg caaatggcca attaggaacg gaacttcgct + 19261 atttattgga tgaacgtaat gaagaatacg tggcagtaga tgtggctaag atggacatta + 19321 ccaatgaaga aatggttgag aaagtttttg aagaggtgaa accgacttta gtctaccatt + 19381 gtgcagccta caccgctgtt gatgcagcag aggatgaagg aaaagagttg gacttcgcca + 19441 tcaatgtgac ggggacaaaa aatgtcgcaa aagcatctga aaagcatggt gcaactctag + 19501 tttatatttc tacggactat gtctttgacg gtaagaaacc agttggacaa gagtgggaag + 19561 ttgatgaccg accagatcca cagacagaat atggacgcac taagcgtatg ggggaagagt + 19621 tagttgagaa gcatgtgtct aatttctata ttatccgtac tgcctgggta tttggaaatt + 19681 atggcaaaaa cttcgttttt accatgcaaa atcttgcgaa aactcataag actttaacag + 19741 ttgtaaatga tcagtacggt cgtccgactt 
ggactcgtac cttggctgag ttcatgacct + 19801 acctagctga aaatcgtaag gaatttggtt attatcattt gtcaaatgat gcgacagaag + 19861 atacaacatg gtatgatttt gcagttgaaa ttttgaaaga tacagatgtc gaagtcaagc + 19921 cagtagattc cagtcaattt ccagccaaag ctaaacgtcc gctaaactca acgatgagcc + 19981 tggccaaagc caaagctact ggatttgtta ttccaacttg gcaagatgca ttgcaagaat + 20041 tttacaaaca agaagtgaga taagtagtag aatgattttc tagtctaata aaagaggcag + 20101 ataatgaact ccaaaggagc ttaagatata caattatctt gttgttggtg ctgatctctt + 20161 tggcgcatag ctttggctca gtttctatta tcgctcacac catccatcag aagtttaatc + 20221 tgaaggtacc caattatcgc caagaagaag attgggctag gatgggttta ccaatcacac + 20281 gtaaggaaat ctctaattgg catatcaagg caagtcaata ctatttagag tccctttata + 20341 accttttacg agaaaagttg ttagaacaac ctcttcttca tgcggatgaa acctcttatc + 20401 gggtgctaga gagtgatagc catctgacct actattggac ctttttgtct gggaaagctg + 20461 agaatcaagc aatcacgctg taccatcatg atcagcgtcg gagtggttta gtagtacaag + 20521 aattcctagg agattattct ggctatgtgc attgtgatat gttgcggcag taacttagga + 20581 ctttagtcct ctagttctgc ctatgcgata gcagtccaag gtttaggagc aaggcgacgc + 20641 taagcttggt aaactgcgaa ccgctagaag cttatcgtca actggaagaa gctgaacttg + 20701 ttggatgttg ggcacatgtg agaaggaagt tttttgaagc gacccccaag caagcagata + 20761 aatcatcctt aggagctaaa ggtttagctt attgtgatca gttattttcc ctggaaagag + 20821 actgggaggc tttgccagct gatgaacgac tacagaaacg tcaagaacat ctccagccct + 20881 taatggaaga cttctttgct tagtgccggc gtcagtcagt tttagcaggt tcaaaactag + 20941 gaagggcaat tgaatacagc ctcaagtatg aagaaacctt taagactatt ttgaaagacg + 21001 gacatctggt cctttccaat aatctagctg aacgcgccat taaatcattg gttatgggac + 21061 ggagtaaaag aattcagtgg actcttttag cctaagctaa attttaaaaa gcgagggtgg + 21121 ttattttctc aaagttttga aggagctaaa gcaacagcta ttattatgag tttgttggaa + 21181 acagctaaac gtcatcaatt aaatagcgag aaatatctat tctatcttct agaatgtctt + 21241 ccaaacgagg aaactctcgt aaacaaagag gttttagagg cttatttacc atggactaaa + 21301 gttgtacaag aaaagtgcaa ataagaaatc tccagattag gaactatccg tgagttctct + 21361 agtctggaga tttttcaata tacttcgtta 
ttggacggtt acgatattca tattttttgc + 21421 aaagatgttg tttgaaaaat aattttcaaa aattctgaaa attctgttga caactttctg + 21481 aaaagagtct ataatggaga gaaagtttta aaggagaaaa tgatgaaaag ttcaaaacta + 21541 tttgcccttg cgggcgtgac attattg +// + diff --git a/public/res/serotype_genbank/serotype_19C.gb b/public/res/serotype_genbank/serotype_19C.gb new file mode 100644 index 0000000..00f7ab3 --- /dev/null +++ b/public/res/serotype_genbank/serotype_19C.gb @@ -0,0 +1,1127 @@ +LOCUS CR931677 25632 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 7588/39 (serotype 19c). +ACCESSION CR931677 +VERSION CR931677.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 25632) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 25632) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..25632 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="7588/39" + /db_xref="taxon:1313" + gene <1..137 + /gene="dexB" + /locus_tag="SPC19C_0001" + CDS <1..137 + /gene="dexB" + /locus_tag="SPC19C_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI33663.1" + /db_xref="GOA:Q4K0Y0" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K0Y0" + /translation="SNEEQDLTVEGKVKSVLIENTAAKEVLEKQVLAPWDAFCVEMTD + " + gene complement(287..1678) + /gene="tnp" + /locus_tag="SPC19C_0002" + /pseudo + CDS complement(join(287..418,418..1548,1547..1678)) + /gene="tnp" + /locus_tag="SPC19C_0002" + /note="member of homology group 17" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1202 transposase" + misc_feature complement(694..1194) + /gene="tnp" + /locus_tag="SPC19C_0002" + /note="HMMPfam hit to PF00665, Integrase core domain, + score 1.1e-21" + /pseudo + gene complement(1783..2736) + /gene="tnp" + /locus_tag="SPC19C_0003" + CDS complement(1783..2736) + /gene="tnp" + /locus_tag="SPC19C_0003" + /note="member of homology group 39" + /codon_start=1 + /transl_table=11 + /product="putative IS1239 transposase" + /protein_id="CAI33665.1" + /db_xref="GOA:Q4K0X9" + /db_xref="InterPro:IPR001584" + /db_xref="InterPro:IPR012337" + /db_xref="UniProtKB/TrEMBL:Q4K0X9" + /translation="MQEHYTPKGKHLTIDNRRLIERWKNENKSNREIAGLLGKAPQTI + HNEVKRGTTLQQVRKGLYKKVYSADYAQTVYQFNRKRSVKKLILTKEIREKILHYHKQ + KFSPEMMVNKKQVKVGISTIYYWFHNGHLGLTKADMLYPRKRKGVKKQASPNFKPAGK + SIEERPDVINLRLENGHYEIDTVLLTKIKNYCLLVLTDRRSRHQIIRLIPNKTAESVN + QALTLLLGEHRILSITADNGSEFKRLSEVFPEEHIYYAHAYSSWERGSNENHNRLIRR + WLPKGTKKTTPKEVAFIENWINNYPKKCLDYKSPSEFLLGG" + misc_feature complement(1792..2229) + /gene="tnp" + /locus_tag="SPC19C_0003" + /note="HMMPfam hit to PF00665, Integrase core domain, + score 6.6e-23" + misc_feature complement(2590..2655) + /gene="tnp" + /locus_tag="SPC19C_0003" + /note="Predicted helix-turn-helix motif with score + 
1087.000, SD 2.89 at aa 28-49, sequence + KSNREIAGLLGKAPQTIHNEVK" + gene 3099..4544 + /gene="wzg" + /locus_tag="SPC19C_0004" + CDS 3099..4544 + /gene="wzg" + /locus_tag="SPC19C_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33666.1" + /db_xref="GOA:Q4K0X8" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K0X8" + /translation="MSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVLSILVSSVSLFAVQQFVGLTNR + LNATSSYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLM + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIIDSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRMDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 3099..3215 + /gene="wzg" + /locus_tag="SPC19C_0004" + /note="Signal peptide predicted for SPC1006 by SignalP 2.0 + HMM (Signal peptide probability 0.993) with cleavage site + probability 0.538 between residues 39 and 40" + misc_feature 3303..3650 + /gene="wzg" + /locus_tag="SPC19C_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 8.8e-63" + misc_feature 3828..4271 + /gene="wzg" + /locus_tag="SPC19C_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 5.7e-70" + gene 4546..5277 + /gene="wzh" + /locus_tag="SPC19C_0005" + CDS 4546..5277 + /gene="wzh" + /locus_tag="SPC19C_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33667.1" + /db_xref="GOA:Q4K0X7" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K0X7" + 
/translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLGKKRIPTLNDS + RYALIEFSMNTLYRDIHNALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEKDLVHIIASDMHNLDGRPPYMQQAYDIIA + KKYGAKKAKELFVDNPRKIIMDQLI" + misc_feature 4549..5157 + /gene="wzh" + /locus_tag="SPC19C_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 2.4e-36" + gene 5286..5978 + /gene="wzd" + /locus_tag="SPC19C_0006" + CDS 5286..5978 + /gene="wzd" + /locus_tag="SPC19C_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33668.1" + /db_xref="GOA:Q4K0X6" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K0X6" + /translation="MKEQNTLEIDVLQLFRALWKRKLVILLVAIITSSVAFAYSTFVI + KPEFTSTTRIYVVNRNQEEKSGLTNQDLQAGSYLVKDYREIILSQDVLEEVISDLKLD + LTPKGLANKIKVTVPVDTRIVSVSVNDRVPEEASRIANSLREVAAQKIISITRVSDVT + TLEEARPAISPSSPNIKRNTLIGFLAGGIGTSVIVLLLELLDTRVKRPEDIEDTLQMT + LLGVVPNLSKLK" + misc_feature 5304..5720 + /gene="wzd" + /locus_tag="SPC19C_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 1.1e-53" + misc_feature 5826..5903 + /gene="wzd" + /locus_tag="SPC19C_0006" + /note="PS00217 Sugar transport proteins signature 2." 
+ gene 5988..6671 + /gene="wze" + /locus_tag="SPC19C_0007" + CDS 5988..6671 + /gene="wze" + /locus_tag="SPC19C_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33669.1" + /db_xref="GOA:Q4K0X5" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K0X5" + /translation="MPTLEIAQKKLEFIKKAEEYYNALCTNIQLSGDKLKVISVTSVN + PGEGKTTTSVNIARSFARAGYKTLLIDGDTRNSVISGVFKSREKITGLTEFLSGTADL + SRGLCDTNIENLFVIQSGSVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTAPIGIVI + DAAIITQKCDASILVTATGEVNKRDVQKAKQQLEQTGKLFLGVVLNKLDISVDKYGVY + GSYGNYGKK" + gene 6687..8054 + /gene="wchA" + /locus_tag="SPC19C_0008" + CDS 6687..8054 + /gene="wchA" + /locus_tag="SPC19C_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI33670.1" + /db_xref="GOA:Q4K0X4" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K0X4" + /translation="MDEKGLKIFLAVLQSIIVILSVYFLSFVRETELERSSMVILYLL + HFFVFYFSSYGNNFFKRGYLVEFNSTIRYIFFFAIAISVLNFFIAERFSISRRGMVYF + LTLEGISLYLLNFLVKKYWKHVFFNLKNSKKILLLTVTKNMEKVLDKLLESDELSWKL + VAVSVLDKSDFQHDKIPVIEKEKIIEFATHEVVDEVFVNLPGENYDIGEIISRFETMG + IDVTVNLKAFDKNLGRNKQIHEMVGLNVVTFSTNFYKTSHVISKRILDICGATIGLIL + FAIASLVLVPLIRKDGGPAIFAQTRIGKNGRYFTFYKFRSMRIDAEAIKEQLMDQNTM + QGGMFKMDNDPRVTKIGRFIRKTSLDELPQFWNVFIGDMSLVGTRPPTVDEYDQYTPE + QKRRLSFKPGITGLWQISGRSKITDFDDVVKLDVAYIDNWTIWKDIEILLKTVKVVFM + RDGAK" + misc_feature 7470..8051 + /gene="wchA" + /locus_tag="SPC19C_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 7e-146" + gene 8058..8801 + /gene="wchO" + /locus_tag="SPC19C_0009" + CDS 8058..8801 + /gene="wchO" + /locus_tag="SPC19C_0009" + /note="member of homology group 33" + /codon_start=1 + /transl_table=11 + /product="putative WecB-family glycosyl transferase" + 
/protein_id="CAI33671.1" + /db_xref="GOA:Q4K0X3" + /db_xref="InterPro:IPR004629" + /db_xref="UniProtKB/TrEMBL:Q4K0X3" + /translation="MRDRIQLLGLTIDLLTMNETIDIVEQYVLEKRPLHLMGVNADKI + NQCHTDEKIKKIVNESGIINADGASVVLASKFLGTPVPERVAGIDLMQCLLELSNKKG + YSVYFFGAKEEVLQDMLKVFKRDYPNLIVIGHRNGYFSEEDEQAIQEDIREKNPDFVF + IGITSPKKEYIIQKFMDSGVNSVFMGVGGSFDVLSGHIQRAPLWMQKSNLEWLFRVAN + EPKRLFKRYFVGNISFIGKVLKAKRGVKY" + misc_feature 8220..8735 + /gene="wchO" + /locus_tag="SPC19C_0009" + /note="HMMPfam hit to PF03808, Glycosyl transferase + WecB/TagA/CpsF f, score 1.6e-95" + gene 8813..9619 + /gene="wchP" + /locus_tag="SPC19C_0010" + CDS 8813..9619 + /gene="wchP" + /locus_tag="SPC19C_0010" + /note="member of homology group 95" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="CAI33672.1" + /db_xref="GOA:Q4K0X2" + /db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4K0X2" + /translation="MIRLIQKVELDAIKEFKKICEENDIDFFLRGGSVLGAVKYDGFI + PWDDDMDIAVPREAYDKLPSVFKDRIIAGKYQVLTYQYCDTLHCYFPRLFLLEDERKR + LGLPRNTNLGLHLIDIIPLDGAPNHSVLRKIYFGKVYWYRFLASLGTTYVGDHVDMHS + TKQKLIIGFFKKLGFAKLFPQNSVYRRLDNLYKKYDWKKQKYAGTINASLFAKEVMPV + EIWGEGVEKPFEDTFFKVPTEYDRYLKRLYGENYLHEEPSDDEKKSHLGG" + misc_feature 8870..9559 + /gene="wchP" + /locus_tag="SPC19C_0010" + /note="HMMPfam hit to PF04991, LICD Protein Family, score + 9.7e-110" + gene 9624..10496 + /gene="wchQ" + /locus_tag="SPC19C_0011" + CDS 9624..10496 + /gene="wchQ" + /locus_tag="SPC19C_0011" + /note="member of homology group 43" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33673.1" + /db_xref="GOA:Q4K0X1" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K0X1" + /translation="MFCYIILHYKVLDETISCVKSIKEGNSNEKQIVIIDNFSNNGTG + EKLQELYESDLEIDVLINHENAGFARGNNVAYQFAKEKYNPDFMVIMNNDIEIETEDF + EKIVTDIYHKEKFHLLGPDIFSTTYQLHQNPKRLTHYTYEEVVALNEKFKRGSQLSLT + LKIKCWLKASKVLRTAIYQNRRKKGSVDHRKQVENPILHGSFIVYSRDFIEKEEYAFN + 
PNTFFYYETEILDYEAELKGYKRIYTPKIKVLHHQNVATNQVYTNLVEKTLFSNKCNF + ESTSYFLTLMEKNE" + misc_feature 9630..10265 + /gene="wchQ" + /locus_tag="SPC19C_0011" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 8.2e-10" + gene 10500..11585 + /gene="wchR" + /locus_tag="SPC19C_0012" + CDS 10500..11585 + /gene="wchR" + /locus_tag="SPC19C_0012" + /note="member of homology group 162" + /codon_start=1 + /transl_table=11 + /product="hypothetical protein" + /protein_id="CAI33674.1" + /db_xref="UniProtKB/TrEMBL:Q4K0X0" + /translation="MMKKILYVTNVDWNWIKQRPQFIAENLSNFYEMLVLYRYWYNRK + GLTEDRNTNITNISRIYALPFVNRSPKLKQLNDKIVAWNIRRKVKAFKPEYVYLTNPM + QFASLVDNSEQKIIYDCMDYHVAFIENREERQRLKDLEEKLVNRANLILVSSEKLREN + IISDYNLEEQVNKIVVVRNGYNGKILSIPTRHKKNNQKLVLAYVGTISHWFDFDIILR + SLKDFDNIEYNLIGPISKADIPEHDRIHYLGSVPHEKIYQYIENADVLIMPFQINDIV + EAVDPVKLYEYINFKKNILTVCYKEILRFEPFVYMYSNYLDYQMNLLQLIENNNLKYD + SIAREDFLKSNTWEKRAELIHQLINQL" + gene 11604..12848 + /gene="wzy" + /locus_tag="SPC19C_0013" + CDS 11604..12848 + /gene="wzy" + /locus_tag="SPC19C_0013" + /note="member of homology group 163" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33675.1" + /db_xref="UniProtKB/TrEMBL:Q4K0W9" + /translation="MKRQKFEFIEILYYFTVMLSVGMFLMFTLNLYWHRNLLTILSIA + LSFLMLPILIVNAKRISKSAFIYGTFLSICIIYEILRAKTLYNYSVSNIFLASRQYIW + IFLFFVLIYLFKNKQENMRKILDNTLNIFMFSLGIRAFTWFLYTLFQVELFPSILREF + GDLWYRNEFSVRIDGTPLIIIGLLISTFFYFKFGNRKYFYYLFLILMYITFVNQTRVL + LVSVLISIFLMFVFSRRTSRLLTSLSFVTIIIAFVYGGGLDYIKAYLNIDAGTFDLGL + GFRYWELKYYLGLLANDVWKLGVGILTSSNINSNFILAGPSAVKMYLDDLGFLELFVQ + FGVAAIFMYGYIFYKLINLILRMSNDKYRVDRAFFIALLTNLIITSISLNIFGAQRSF + SLAIVLALIFYYDYRLKNDIEN" + gene 12856..13758 + /gene="wchS" + /locus_tag="SPC19C_0014" + CDS 12856..13758 + /gene="wchS" + /locus_tag="SPC19C_0014" + /note="member of homology group 164" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33676.1" + /db_xref="GOA:Q4K0W8" + 
/db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K0W8" + /translation="MDKVCIVILNYNNYEETIECVQSLRSTIKSNEYDIVIVDNNSVN + DSVKELSKALSPIKIITSLENRGYANGNNIGIKYAEDNGYDYICILNNDTLIEVDFLE + SCKRELENNSFVAFVSPVLVEYKDNNLVQSTGGDIFINRGIVTLKNHGAQRDKLPSKI + ESDYIGGACLMFKTSILKIIGYIPESYFLFYEETEWCYRAKKLGYKNICLTQSYVYHK + GSVSIKAVNGLQEYLMARNRVVFVRRNVNSKLKYSAFLFYLFMQQLYHCFLRRDCFKR + KYKYYLDGVFNRIDPSYPFIFISE" + misc_feature 12868..13395 + /gene="wchS" + /locus_tag="SPC19C_0014" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 2.4e-23" + gene 13962..15896 + /gene="rbsF" + /locus_tag="SPC19C_0015" + CDS 13962..15896 + /gene="rbsF" + /locus_tag="SPC19C_0015" + /note="member of homology group 49" + /codon_start=1 + /transl_table=11 + /product="putative phosphotransferase" + /protein_id="CAI33677.1" + /db_xref="GOA:Q4K0W7" + /db_xref="InterPro:IPR005834" + /db_xref="InterPro:IPR006439" + /db_xref="UniProtKB/TrEMBL:Q4K0W7" + /translation="MKVFDISQIKTKTVAFDFFDTIVHRNCHPEQILYQWAKEMALEV + NFNISPSILYQIRKSVENNKKLGTEEMCYLDLLSGIYNEIKDKIKNTSKEEFIHRAKI + LELKIELQHIYLDSEIKEVLKKLKSDSKQIILVSDFYTDKELIETVLKKFEVFDYFSS + IYISSEKGCRKSTGNLYKLILKELGLNPKEITMIGDNYKSDYEVPRSLGLNAIYRQYI + DKNTIVAEKELVRLYNQILFSNSKKAPFNIFLADIVFFISKLHKKMIQDDVQIALFCS + REGQLLKILFDIYQNTFFGKNQKICTEYFYVSRRSTLYSSFTSLDNEEFETIFRQYKK + ITLQNFLLNLNFSDNEIILICQDLKEKPTYVLTVDDHLLEKLKKHPQFITKFNKEKKD + SQLLRDYIEYLTKNQNEVYLVDVGWKGTIQDNIKKALPDKRIVGYYLGLILNAYSVEN + KMDKTGLLFSDYPSKSKFYDIVSRNFGFYEDIFVADHGPVLKYKKESDIIPIIDDDKK + HVSIYQAVKDYQEELVLGFSEILEAYKKMKFLPFEQKNLWLMMSLKKECIYIPKLQSF + SESLKEKVVENFGEIVTLKTTKKSIKTLLRKKSDLLWVDFVYRLFGGVNFLFIPELYT + RVIFLLKYLDLKLRLKNYGE" + misc_feature 13992..14615 + /gene="rbsF" + /locus_tag="SPC19C_0015" + /note="HMMPfam hit to PF00702, haloacid dehalogenase-like + hydrolase, score 7.9e-16" + gene 15886..17331 + /gene="wzx" + /locus_tag="SPC19C_0016" + CDS 15886..17331 + /gene="wzx" + /locus_tag="SPC19C_0016" + /note="member of homology group 47" + /codon_start=1 + /transl_table=11 + 
/product="flippase Wzx" + /protein_id="CAI33678.1" + /db_xref="GOA:Q4K0W6" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K0W6" + /translation="MGNKSIKLNALLNIVLTLSNIIFPLITFPYISRILNPNGIGLTS + FFSSIGNYGILLASLGISTYGIKAVASVRDDRDKLSKVVQELMIINVAMSIITTAILL + FMTIFITQLNREFSLLLITCGTILSSPFALNWLYSGMEEYTYITTRSVVFKILSLILI + FLLVKRPEDYIVFASISLFSSLSSNILNLWHSRHFINIKLYKNLQFKYHFKPMWYLFA + SLLAVNIYTNLDTVMLGFINGNEAVGYYSVASKVKWILLSLITSISAVLLPRLSFYIS + KNDTSNFIKMLKESSAVIFFIAIPLMVFFIVEAKDSILLLGGSQYLPATLAMQILMPI + LLISGFSNITGNQILIPMNREKYFMVAVTIGAVINLILNLLLMPKFGIIGASVATLFA + ELSQMTVQLHFSKEYLVSNISIKSLVNVIIATVVSTIPLIILNQLITITIPFYSLMLA + GFAFFSLYLVILLLLKEEVTIQLFSLLAKKK" + misc_feature 15901..16710 + /gene="wzx" + /locus_tag="SPC19C_0016" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 3.1e-80" + gene 17395..18480 + /gene="mnaA" + /locus_tag="SPC19C_0017" + CDS 17395..18480 + /gene="mnaA" + /locus_tag="SPC19C_0017" + /EC_number="5.1.3.14" + /note="member of homology group 23" + /codon_start=1 + /transl_table=11 + /product="UDP-N-acetylglucosamine-2-epimerase MnaA" + /protein_id="CAI33679.1" + /db_xref="GOA:Q9Z636" + /db_xref="HSSP:1O6C" + /db_xref="InterPro:IPR003331" + /db_xref="UniProtKB/TrEMBL:Q9Z636" + /translation="MKIMLVFGTRPEAIKMCPLVNELKKQADMETVVCVTGQHKEMVS + PVLELFGVQPDYDLEIMKANQTLFSITTSILEKIKPVLEEEQPDIVLVHGDTTTTYAA + ALAAFYLGIKVGHVEAGLRTYNLQSPFPEEFNRQSTSIIANYHFAPTELAKENLLKEG + RENVYVTGNTVIDALTTTVQKDYTHPDLDLNVNTRLILLTAHRRENLGEPMKHMFRAV + KRVLNEYDDVKVIYPIHKNPLVRETATEIFGDTERIQIIEPLDVLDFHNFMNHSYMIL + TDSGGVQEEAPSLGKPVLVMRDTTERPEGVAAGTLKLVGTDEETIYQNFKMLLDDSEE + YKKMSQASNPYGKGDASKQIVHILSGI" + misc_feature 17455..18471 + /gene="mnaA" + /locus_tag="SPC19C_0017" + /note="HMMPfam hit to PF02350, UDP-N-acetylglucosamine + 2-epimerase, score 9.9e-198" + gene 18831..19940 + /gene="wchU" + /locus_tag="SPC19C_0018" + CDS 18831..19940 + /gene="wchU" + /locus_tag="SPC19C_0018" + /note="member of homology group 237" + /codon_start=1 + /transl_table=11 + 
/product="putative glycosyl transferase" + /protein_id="CAI33680.1" + /db_xref="GOA:Q9Z635" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q9Z635" + /translation="MKIVIPRIIHNKEQLTWDWSGTITNIKKFLGKYEIVEEQNIFYT + FRMNVHKVLVRLGIKKSDMSMTYIKYAENQVHLSPEDVCLTFDEFPLSFPDNPVYIYQ + DLNLHYLIESSQNNSQSFKYSGFQNVPADILDRRMRKQEIFYNQATGIFTMSKWFSDY + LIAQQGLPVEKVHYVGAGTNMNNLFLDHSHKERNKFLFIGKDFFRKGGDLVYNAFVYL + QNNLMPEAELYIIGPSDVPMEFNNPNVYFLGNLSADKVQYFYNLCDVFVLPSRFEAFG + IVFVEALCYGLPCIGRDLMEMPNLIQNNETGLLLPTEEENPQVLADVMYNLIKDESFF + KNVQTKQDYYKAEYSWDTVAKRMISIMKQDMNNNL" + misc_feature 19371..19850 + /gene="wchU" + /locus_tag="SPC19C_0018" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 2.8e-22" + gene 20399..20506 + /gene="HG264" + /locus_tag="SPC19C_0019" + /pseudo + CDS 20399..20506 + /gene="HG264" + /locus_tag="SPC19C_0019" + /note="member of homology group 264" + /pseudo + /codon_start=1 + /transl_table=11 + /product="hypothetical protein (fragment)" + /db_xref="PSEUDO:CAI33681.1" + gene 20574..21443 + /gene="rmlA" + /locus_tag="SPC19C_0020" + CDS 20574..21443 + /gene="rmlA" + /locus_tag="SPC19C_0020" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI33682.1" + /db_xref="GOA:Q4K0W3" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q4K0W3" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLPRFKELLQDGSEFGIQLSYAEQPSPDGLAQAFIIGEEFIGDDSV + ALILGDNIYHGSGLSKMLQKAASKESGATVFGYHVKDPERFGVVEFDQDMKAISIEEK + PEQPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLALAQPLKKN + EYGQYLLRLIGEA" + misc_feature 20577..21293 + /gene="rmlA" + /locus_tag="SPC19C_0020" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 8e-121" + gene 21444..22037 + /gene="rmlC" + /locus_tag="SPC19C_0021" + CDS 21444..22037 + 
/gene="rmlC" + /locus_tag="SPC19C_0021" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI33683.1" + /db_xref="GOA:Q4K0W2" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:Q4K0W2" + /translation="MTDKFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKHHPLLKDVKPLKKEDL" + misc_feature 21480..22010 + /gene="rmlC" + /locus_tag="SPC19C_0021" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 8.8e-16" + gene 22050..23099 + /gene="rmlB" + /locus_tag="SPC19C_0022" + CDS 22050..23099 + /gene="rmlB" + /locus_tag="SPC19C_0022" + /EC_number="4.2.1.46" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI33684.1" + /db_xref="GOA:Q4K0W1" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K0W1" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPGVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLATQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAAD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 22065..23021 + /gene="rmlB" + /locus_tag="SPC19C_0022" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.00013" + misc_feature 22068..22865 + /gene="rmlB" + /locus_tag="SPC19C_0022" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.0053" + misc_feature 22068..22808 + /gene="rmlB" + /locus_tag="SPC19C_0022" + /note="HMMPfam 
hit to PF01370, NAD dependent + epimerase/dehydratase f, score 7.8e-76" + misc_feature 22071..22883 + /gene="rmlB" + /locus_tag="SPC19C_0022" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 2.1e-05" + gene 23165..24016 + /gene="rmlD" + /locus_tag="SPC19C_0023" + CDS 23165..24016 + /gene="rmlD" + /locus_tag="SPC19C_0023" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI33685.1" + /db_xref="GOA:Q9AH81" + /db_xref="HSSP:1N2S" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q9AH81" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAKMDITNEEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 23165..24013 + /gene="rmlD" + /locus_tag="SPC19C_0023" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 4.3e-146" + misc_feature 23168..23809 + /gene="rmlD" + /locus_tag="SPC19C_0023" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.00011" + misc_feature 23168..23797 + /gene="rmlD" + /locus_tag="SPC19C_0023" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 2e-18" + misc_feature 23171..23899 + /gene="rmlD" + /locus_tag="SPC19C_0023" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 3.6e-08" + gene order(24079..24159,24163..25162) + /gene="glf" + /locus_tag="SPC19C_0024" + CDS join(24079..24159,24163..24582,24549..24683,24659..25162) + /gene="glf" + /locus_tag="SPC19C_0024" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI33686.1" + /db_xref="GOA:Q4K0V9" + 
/db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K0V9" + /translation="MYDYLVVGAVFAHEAVLKGKKVKVIEKNHIAGNIYTREEEGIQV + HQYGAHIFHTSDKEIWDYVNQFAEFNRYINSPVANYKGEIYNLPFNMNTFNKLWGVVT + PAEAQAKIDEQRAILNGKTPENLEEQAISLVATDIYEKLIKDYTEKQWGKPTTELPSF + IIVCQYATSILYYCLPVRLTYDNNYFNDTYQGIPIGRYTQIVEKCWIMKILMMLDHEN + IDVETNVDFFVNKEQYLKDFPKIVFTGMIDEFFDYKLGELEYRSLRFENETLDMENYQ + GNAVVNYTDAETPYTRIIEHKHFEFGSQAKTIITKEHSKTWEKGDEPYYPVNNDRNNH + LYKSYKKLADEQGNVIFGGRLGHYRYYDIHQVIGAALQCVRNELN" + misc_feature join(24499..24549,24582..24659,24683..25102) + /gene="glf" + /locus_tag="SPC19C_0024" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 1.5e-95" + gene 25480..>25632 + /gene="aliA" + /locus_tag="SPC19C_0025" + CDS 25480..>25632 + /gene="aliA" + /locus_tag="SPC19C_0025" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33687.1" + /db_xref="UniProtKB/TrEMBL:Q4K0V8" + /translation="MMKSSRLFALAGVTLLAATTLAACSGSGSSTKGEKTFSYIYETD + PDNLNYL" + misc_feature 25480..25566 + /gene="aliA" + /locus_tag="SPC19C_0025" + /note="Signal peptide predicted for SPC1027 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.277 between residues 29 and 30" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acactgcggc taaagaagta cttgaaaaac aggtcttggc cccatgggat gctttctgtg + 121 tggaaatgac tgactagaat gagcaaacct caagcttttg aagcttgagg ttttttacta + 181 tagtagattg aaactggaat agtacacctc tacttctaaa acattgttag aaatcgattt + 241 gattgtcctg atcgttttgt cctattctta tttcatttta ctatgcttgt agttgaggag + 301 aattaagctc ctcactagta aactcttcat aatccttttt atttttatga agatattgtt + 361 tgaaagatgt gagtttccac ggataggttt gtggagggat atacttgcgt ctttcttttt + 421 ttgttctggt tcttgttcaa agtttttcga atagagttca tgatctagta gctcctttgt + 481 gcgatagatt ttgtcagcga tattgaggta gatatctccg tcaaatgctt ttataactaa + 541 tgctttcgtc tttctgatga aatagacttc tttttcttgt tcggtaggga tatagtaacg + 601 
attttggaat cggatatggt gtccactatc ggcgactctc tccgccagtc tagccagaat + 661 gagattcctt tcagaggggt taggaacctc ctcgaagaca gagagttttg tcttgtttcc + 721 aaactgttca ttaaaggttt gaatgtagga aagcaggaag gtattggctt cttccaaggt + 781 atgaatattg ttttgttcca gttcgatagg taggcgagat tgtagtgtct gattgagtct + 841 ttcgactctc cctttagctt gagggataga ggttgtctca aggagaatcc ctagttggtg + 901 acaggcgcat ccaaactgtg tatgggtatc gtcctccatt ttcttagagt tggaggcttg + 961 ataggtaaag accgttctct tatctgtttt aatttgaagg ggaatgccgt gattggctaa + 1021 gatttgttcg aggacatgat agtaagcatt caagttctct tgtttatcaa aataagcgcc + 1081 taggatattg ccagaagcat catcaatggc taagtgtaag ttagatgttt gggctccaaa + 1141 ctaggcatga ggactggcat ccatttgaat gagttcacca gcaaatttct ttctgggtct + 1201 actaggatgt acttttttag ggtcttcaag gaagttttca gccgtcggta agattggatt + 1261 gtctaggggt tgattcaggt tcagtttagc ttgttttctt actctcttct ttgtctttct + 1321 atgggactta ggcgacagga tatttttctt atagagtatt tttctaacag tagtatcaga + 1381 gagctgaatt ccttcttctt cagctagcaa ttcacagaaa tgaaggacat ttggtttata + 1441 tgtttcatag gagaggtatt tttttaggag acgttctttg atttcatcag ggattgcatg + 1501 ttttggtttt cgatttctgt ttccgtgtct gaaggcttct ttgtcctttc agttgatagg + 1561 ctagtagcag acgattgatt tgtctttcag aaagattgag ctcgacacag gctcgtttct + 1621 ttgttttctt tccttgggct atagctttta tcacaagata ttttttcgtt tcattcatat + 1681 tcagttggat ccttttcata tgactattct accaaatggg acattttcac gttcgattta + 1741 ctaaagacat tatcacattc gaacccaaat ttcaagttga agttagccac ccaaaagaaa + 1801 ttcacttggc gacttgtagt ccaagcattt tttagggtag ttgttaatcc aattttcgat + 1861 aaaagctact tctttcggag tcgttttctt ggttccttta ggtaaccatc tccgaattaa + 1921 tcgattatga ttttcatttg aacctctctc ccatgaagag taagcatgtg cgtagtagat + 1981 atgttcctca ggaaatacct cagacaatcg tttgaactcc gaaccattat ctgcagtaat + 2041 ggacagaata cgatgctccc ctaatagtaa cgtaagcgcc tgattgacag attcagcagt + 2101 tttatttgga attaacctta taatttggtg tctgctccgc cggtcggtta agactaacag + 2161 gcaataattt tttatcttag tcagtaggac ggtatcaatt tcataatgac cattttccaa + 2221 gcgaagatta ataacgtcag gacgttcttc 
gatagattta cctgccggct taaagttcgg + 2281 actagcttgc ttcttgacac ctttcctttt tctgggataa agcatgtcgg ccttcgttaa + 2341 tcctaaatga ccattatgaa accagtagta gatggttgaa ataccaactt tcacttgctt + 2401 cttgttaacc atcatttcag gcgaaaattt ttgcttatga tagtgtaaga tcttctctct + 2461 gatttccttt gttaaaatta actttttcac cgaccgtttt cgattgaatt ggtaaacagt + 2521 ttgtgcgtaa tcggcagaat agaccttttt gtatagccct tttctcactt gttgtaaagt + 2581 tgtacctctt ttgacttcat tatgaatcgt ttgaggcgcc tttcctaaca agcctgcaat + 2641 ttcacgattg gacttatttt cattcttcca ccgctcaatc aagcgacggt tatctattgt + 2701 caaatgtttc ccttttgggg tataatgttc ttgcatctct gtgcctttcc ttgtgtttgt + 2761 ggtgaacaac aagtatagca cagaggtgtt ttcttatacc ttaaatcaca tttcatttga + 2821 caacaggaac ccttgaacct gttttttcag ctaaaccaag gctatgatta gccttggcca + 2881 cctagcctaa cagtttcaaa cctgttatca aatgaaatca tcaacttact caaacatagt + 2941 gaaacatcta attcttgact aaggtaaggt ggctaacttc attatagaac tttcatatca + 3001 cattcgaatt acacaagatg cagatagtga aaaaagatgt agacattacc gtaaaaaagt + 3061 gatataatcg tatgatgttc aatgtatagg tgttaatcat gagtagacgt tttaaaaaat + 3121 caggttcaca gaaagtgaag cgaagtgtta atatcgtttt gctgactatt tatttattgt + 3181 tagtttgttt tttattgttc ttaatcttta agtacaatat ccttgctttt agatatctta + 3241 atctcgtggt aactgcgtta gtcctactag ttgccttggt agggctactc ttgattatct + 3301 ataaaaaagc tgaaaagttt actatttttc tgttggtgct ctctatcctt gtcagctctg + 3361 tgtcgctctt tgcagtacag cagtttgttg gactgaccaa tcgtttaaat gcgacttcta + 3421 gttactcaga atattcaatc agtgtcgctg ttttagcaga tagtgagatc gaaaatgtta + 3481 cgcaactgac gagtgtgaca gcaccgactg ggactgataa tgaaaatatt caaaaactac + 3541 tagctgatat caagtcaagt cagaataccg atttgatggt caaccagagt tcgtcttact + 3601 tggcagctta caagagtttg attgcagggg agactaaggc cattgtccta aatagtgtct + 3661 ttgaaaatat catcgagtca gagtatccag actacgcatc gaagataaaa aagatttata + 3721 ccaagggatt cactaaaaaa gtagaagctc ctaagacgtc taagaatcag tctttcaata + 3781 tctatgttag tggaattgac acctatggtc ctattagttc ggtgtcgcga tcagatgtca + 3841 atatcctgat gactgtcaat cgagatacca agaaaatcct cttgaccaca 
acaccacgtg + 3901 atgcctatgt accaatcgca gatggtggaa ataatcaaaa agataaatta acccatgcgg + 3961 gcatttatgg agttgattcg tccattcaca ccttagaaaa tctctatgga gtggatatca + 4021 attactatgt gcgattgaac ttcacttctt tcttgaaaat gattgactta ttgggagggg + 4081 tagatgttca taatgaccaa gagttttcag ctctacatgg gaagttccat ttcccagtag + 4141 ggaatgtcca tctagactct gagcaagctc taggttttgt acgtgaacgc tactcactag + 4201 ccgatggaga ccgtgaccgt ggtcgcaacc aacaaaaggt gattgtggct atccttcaaa + 4261 aattaacgtc aaccgaagca ctgaaaaatt atagtacgat cattgatagc ttgcaagatt + 4321 ctatccaaac aaatatgcca cttgagacca tgataaattt ggtcaatgct cagttagaaa + 4381 gtggagggaa ttataaagta aattctcaag atttaaaagg tacaggtcgg atggatcttc + 4441 cttcttatgc aatgccagac agtaacctct atgtgatgga aatagatgat agtagtttag + 4501 ctgtagttaa agcagctata caggatgtga tggagggtag atgaaatgat agacatccat + 4561 tcgcatatcg tttttgatgt agatgacggt cccaagtcaa gagaggaaag caaggctctc + 4621 ttggcagaat cctacaggca gggggtgcga accattgtct ctacctctca ccgtcgcaag + 4681 ggcatgtttg aaactccgga agagaagata gcagaaaact ttcttcaggt tcgggaaata + 4741 gctaaggaag tggcgagtga cttagtcatt gcttacggag ctgaaattta ctacacacca + 4801 gatgttctgg ataagctggg aaaaaagcgg attccgaccc tcaatgatag tcgttatgcc + 4861 ttgatagagt ttagtatgaa cactctttat cgcgatattc ataacgcctt gagcaagatc + 4921 ttgatgttgg gaattactcc agtcattgcc cacatcgaac gctatgatgc tcttgaaaat + 4981 aatgaaaaac gcgttcggga actgatcgat atgggctgtt acacgcaagt aaatagttca + 5041 catgtcctca aacccaaact ttttggcgaa cgttataaat tcatgaaaaa aagagctcag + 5101 tattttttag agaaggattt ggttcatatc attgcaagtg atatgcacaa tctagacggt + 5161 agacctccat atatgcaaca ggcatatgat atcattgcta agaaatatgg agcgaaaaaa + 5221 gcgaaagaac tttttgtaga taatcccaga aaaattataa tggatcaatt aatttaggag + 5281 aaaatatgaa ggaacaaaac actttggaaa tcgatgtatt gcaactattc agagctttat + 5341 ggaaaagaaa gttggtcatt ttattagtgg caattataac ttcttcagtt gcttttgcct + 5401 acagtacttt tgttatcaaa cctgagttta ctagtacgac tcggatttat gtagttaacc + 5461 gtaatcagga agagaagtct ggtttaacca atcaagactt gcaggcagga tcatacttgg + 5521 ttaaagacta 
tcgtgaaatt atcctatcgc aggatgtttt ggaggaagtt atttctgatt + 5581 tgaaactaga tttgacgcca aaaggtttgg ctaataaaat taaagtaaca gtaccagttg + 5641 atacccgtat tgtctctgtt tcagttaatg atcgagttcc tgaagaggca agccgtatcg + 5701 ctaactcttt gagagaagta gctgctcaaa aaattatcag tattactcgt gtttctgatg + 5761 tgacaacact ggaggaggca agaccggcga tatcaccgtc ttcgccaaat attaaacgca + 5821 atacactaat tggttttttg gcagggggga ttggaactag tgttatagtt cttcttcttg + 5881 aacttttgga cactcgtgtg aaacgtccgg aagatatcga agatacactg cagatgacac + 5941 ttttgggagt tgtaccaaac ttgagtaagt tgaaatagga gagaggaatg ccgacattag + 6001 aaatagcaca aaaaaaactg gagttcatta agaaggcaga agaatattac aatgccttgt + 6061 gtacaaatat acagttgagc ggagataaac taaaagtaat ttccgttact tctgttaacc + 6121 ctggggaagg aaaaacaact acttccgtaa atatagcaag gtcgtttgcg cgtgcaggtt + 6181 ataaaactct tttgatcgat ggcgatactc gaaattcagt tatatcagga gtttttaaat + 6241 cgcgtgaaaa aattacaggg ctaacagaat ttttatctgg gacagctgat ttatctcgcg + 6301 gtttatgtga tacaaatatt gaaaatttat ttgtaattca atcgggatct gtatcaccaa + 6361 accctacagc cttgttacaa agtaaaaatt ttaatgatat gattgaaaca ttgcgtaaat + 6421 attttgatta tatcattgtt gatacagcac ctattggaat tgttattgat gcggcaatta + 6481 tcactcaaaa gtgtgatgcg tccatcttgg taacagcaac aggtgaggtg aataaacgtg + 6541 atgtccaaaa agcgaaacaa caattagaac aaacagggaa actgttccta ggagttgttt + 6601 taaataaatt ggatatctcg gttgataagt atggagttta cggttcctat ggaaattatg + 6661 gtaaaaaata acttaggaaa gattttatgg atgaaaaagg attgaaaatt tttctggcag + 6721 tattacagag tattattgtc attttatcgg tttattttct tagctttgtt agagagacag + 6781 aacttgaacg ttcttcgatg gttatactat accttctcca cttttttgta ttctatttta + 6841 gttcctatgg taacaatttt tttaaaagag ggtacctagt tgagtttaat agtactataa + 6901 gatatatttt tttctttgca atagctataa gtgtattaaa cttttttata gcggaacggt + 6961 ttagtatctc tagaagagga atggtatact tcttaacttt agaagggata tccttatact + 7021 tgttaaattt cttagtaaag aaatattgga agcatgtgtt ttttaatcta aaaaatagca + 7081 agaaaatttt actgttaaca gtaacgaaaa atatggaaaa agttcttgat aaattgctag + 7141 aatctgatga actttcatgg aaattggtag 
cagtaagtgt tttggataaa tctgattttc + 7201 aacatgataa aatacctgta attgaaaagg aaaaaattat tgaatttgca acgcatgaag + 7261 ttgtggatga ggtgtttgtc aatcttccag gagagaacta cgatattgga gaaattatct + 7321 ctaggtttga gacaatgggg atagatgtaa ctgtaaatct taaagcattt gataagaatt + 7381 tgggtcgcaa taaacaaatt catgagatgg taggattgaa tgtagtcact ttctctacaa + 7441 atttttataa aactagtcat gtgatttcaa agagaattct cgatatttgt ggtgccacta + 7501 ttggccttat tctttttgct atagctagtc tagttttagt tccattgatt cgtaaagatg + 7561 gcggaccagc tatttttgct cagacgcgta tagggaaaaa tggtcgatat tttacctttt + 7621 ataaattccg ttcgatgcgg atcgatgctg aagctataaa agaacaattg atggatcaaa + 7681 atacgatgca aggtggtatg tttaagatgg acaatgatcc tcgtgttaca aaaattggtc + 7741 gctttattcg taaaaccagt ttagatgagt taccccagtt ttggaatgtc tttataggag + 7801 atatgagttt ggtgggaaca cgtccaccta cagtagatga gtatgatcag tatactccag + 7861 aacagaaacg tcgactcagc tttaaacctg gtattacagg cttatggcag attagtggcc + 7921 gaagtaaaat aaccgatttt gacgatgttg taaaattaga tgtggcttat attgataatt + 7981 ggacaatttg gaaagatatt gaaattttgc ttaaaactgt taaagttgta tttatgagag + 8041 atggagcgaa gtgaggaatg agggatagaa tccaactttt aggtttaaca attgatctgc + 8101 ttacgatgaa tgaaacgata gatattgtag aacaatatgt attagaaaaa agaccactac + 8161 acttgatggg cgtgaatgct gataaaatta atcagtgcca tacagatgag aaaatcaaaa + 8221 aaatcgttaa tgagtcagga atcattaatg cggatggagc atcagttgtt cttgcaagta + 8281 agtttttagg aacgcctgtt cctgaacgag tagcgggtat tgatttgatg caatgtcttt + 8341 tagagttgtc aaataaaaaa ggatattcag tttacttttt tggagcaaaa gaagaagttt + 8401 tgcaagatat gctcaaagta tttaagagag attatccaaa tttgatagtt attggacaca + 8461 gaaatggcta tttttctgaa gaggatgaac aagctattca agaagatatt cgtgaaaaga + 8521 accctgattt tgtgtttatt ggaattacgt ctcctaaaaa agaatatatt attcaaaaat + 8581 ttatggatag tggcgtcaat tcggtattta tgggagttgg cggtagtttt gatgtcttgt + 8641 ctggtcatat ccaacgagca cctctatgga tgcaaaagtc aaatttagag tggttattcc + 8701 gtgtagctaa tgagcctaaa cgtctcttta aacgttattt tgtagggaat atttcattca + 8761 taggaaaagt tttaaaagca aaaagaggtg taaaatattg aaccagacag 
agatgattcg + 8821 cttaattcaa aaagttgaat tagatgctat aaaagagttt aaaaaaatct gtgaagagaa + 8881 tgatatagat tttttcctcc gcggtggtag tgtacttggt gcagtcaaat acgacggctt + 8941 tattccatgg gatgatgata tggatatcgc tgtccctcgt gaagcatacg acaaacttcc + 9001 aagtgttttc aaagatagaa ttatcgctgg gaaatatcag gttcttactt atcaatactg + 9061 tgatacgttg cattgctact ttcctcgact atttctttta gaagatgaaa gaaaacgttt + 9121 gggcttgcca cgaaatacca atctgggatt gcatttgatt gatatcattc ctttagatgg + 9181 agcaccaaat cattcggttt taagaaagat ttactttggt aaagtatact ggtatcgttt + 9241 tttagcaagt ttaggaacaa cttatgttgg cgaccatgtg gatatgcatt ccactaagca + 9301 aaaactaatt attggtttct ttaaaaaact aggatttgca aaactatttc ctcaaaattc + 9361 tgtatacaga cgcttggata atctctataa aaagtatgat tggaaaaagc agaagtatgc + 9421 tgggactatc aatgcttctt tatttgccaa agaagttatg ccagtagaga tttggggaga + 9481 aggagtagag aagccttttg aggatacctt ctttaaagtt ccaacggagt atgatcgcta + 9541 cctgaaaaga ctttacggag aaaactatct tcacgaagag ccgagtgatg atgaaaagaa + 9601 atcgcattta gggggataaa aatttgtttt gttatattat tttacattac aaagtcttag + 9661 atgaaactat ttcttgtgtt aaatctataa aagaaggcaa ttccaatgaa aagcaaatcg + 9721 ttattattga taatttttct aataatggta caggtgaaaa actacaagag ctttatgaat + 9781 cagatttaga gattgatgta ttgattaacc acgaaaatgc tggatttgct cgaggaaata + 9841 atgtagctta tcaatttgct aaggaaaagt ataaccccga tttcatggtt atcatgaata + 9901 acgatattga gatagaaaca gaagattttg aaaaaatcgt gacagatatc tatcacaaag + 9961 aaaaatttca tttgctaggg ccagacattt tttcgacaac atatcagcta catcaaaatc + 10021 ctaaacgcct gacacattat acttatgaag aggtagtggc tctcaatgaa aaatttaaaa + 10081 gagggagcca acttagtcta actttaaaaa tcaaatgttg gttgaaagct agcaaagttc + 10141 ttcgaacagc aatctatcaa aatagacgta aaaaaggatc agtagaccat agaaaacagg + 10201 tagaaaaccc gattcttcat ggttccttta ttgtatattc gagagatttt attgaaaaag + 10261 aggagtatgc ttttaaccct aataccttct tttactatga aacagagata ttagattatg + 10321 aagctgagtt aaaaggatac aagagaattt atacaccgaa gattaaggtt ttacaccatc + 10381 aaaatgtggc aacaaatcag gtttatacaa acttagtaga aaaaactttg ttttcaaaca + 10441 
aatgcaactt tgaatccact agttattttt taactttaat ggagaaaaat gaataaaaaa + 10501 tgatgaaaaa aattttatat gtgacaaatg ttgattggaa ttggataaaa caacgtccac + 10561 aatttattgc agaaaactta tctaattttt atgagatgct agttctgtat cgctattggt + 10621 acaatagaaa aggattgact gaggatagaa atactaacat tacaaatata tcacgtattt + 10681 atgccctacc ttttgttaat aggtcaccga aactaaagca actgaatgat aaaattgttg + 10741 cttggaatat tcgaagaaaa gttaaggctt ttaaaccgga atatgtatat ttgacaaatc + 10801 caatgcagtt tgcatctctt gtagacaatt cagaacaaaa aataatatat gattgtatgg + 10861 attatcatgt ggcttttata gaaaatagag aagaacgcca gcgattaaag gatttagaag + 10921 agaaactggt caatagagct aatttaatct tggtttcgag tgagaaacta agagaaaata + 10981 ttatttctga ttataacttg gaagagcagg ttaataaaat agtggttgtt agaaatggtt + 11041 ataatggtaa aatcttaagc attcctactc ggcataaaaa gaataaccaa aagcttgtac + 11101 ttgcatatgt tggaactatc agtcattggt ttgactttga tatcatttta cgaagtttaa + 11161 aagattttga taatattgaa tataatttga ttggtccgat tagcaaagct gatattcctg + 11221 aacatgatag aattcattat ttaggaagtg taccacacga gaagatttat cagtatattg + 11281 agaatgcaga tgttctgatt atgccgtttc aaattaatga tattgttgaa gcagtggatc + 11341 cagtcaagtt gtatgaatat attaatttta aaaaaaatat acttacggta tgttataagg + 11401 aaattctgag atttgaacca tttgtataca tgtattcaaa ttatttagat taccaaatga + 11461 atttattgca attgattgaa aataataatt tgaaatatga cagtatagct agagaagatt + 11521 ttttgaaaag taatacttgg gaaaaaagag cggagctgat tcatcagctg attaaccaat + 11581 tgtaattttt tatggagaga tgaatgaaga gacagaagtt tgaatttata gagattctat + 11641 actattttac agtgatgtta tcagtgggaa tgtttcttat gtttaccctc aacttatatt + 11701 ggcacagaaa cttattaact attttatcta ttgctctctc atttttaatg cttcctatac + 11761 tgattgttaa tgctaaaaga atttctaaat ctgcttttat ctatggtact tttttatcta + 11821 tatgtattat atatgagata ttaagagcta aaacactgta taattacagt gtgagtaata + 11881 tttttttggc ctctagacaa tatatatgga tttttctatt ttttgtattg atttaccttt + 11941 ttaaaaacaa acaagaaaat atgagaaaaa ttttagataa tacactcaat atttttatgt + 12001 tttctcttgg aattagagca tttacttggt ttttatatac gttatttcaa gttgaattat + 12061 
ttccatctat tttaagagaa ttcggagatt tgtggtatcg aaatgaattt tcagtacgaa + 12121 tagatggaac accattaatt ataataggtt tgttaatttc cacttttttc tattttaaat + 12181 ttggaaatag gaaatacttt tattatttgt tcttgatatt aatgtatata acatttgtaa + 12241 atcagacaag agtgctactg gtttctgttt tgatttcaat ttttcttatg tttgtatttt + 12301 ctagaagaac ttctagattg ctcacctctt taagttttgt aactataatt atagcattcg + 12361 tttatggagg tggattggat tatattaaag catatttaaa tatagatgct ggaacatttg + 12421 atctgggatt aggatttaga tactgggagt tgaaatacta tctgggttta ttagctaatg + 12481 atgtatggaa acttggggtt ggaattctaa catcaagtaa tataaatagt aattttattt + 12541 tggctgggcc aagtgctgtt aagatgtatc tagatgattt aggtttttta gagttattcg + 12601 ttcaatttgg tgtagccgca atttttatgt atggttatat attttataaa ttaatcaatt + 12661 taattctaag aatgtcaaat gataaatata gagttgaccg cgcctttttt attgcactct + 12721 taactaattt aataattact tcaatttctt taaatatctt tggagcgcag agaagtttct + 12781 cattggcaat tgttcttgca ttaatattct actatgacta taggctgaaa aatgacatag + 12841 aaaattaggt gtataatgga taaagtatgt atagttattc tcaattataa taattatgaa + 12901 gaaacgattg agtgtgtaca aagtttgaga agtactataa aatcaaatga gtatgacatc + 12961 gtgattgtag ataataattc ggtgaatgat agtgtcaaag agttatccaa ggcgttatcc + 13021 cctattaaga ttattactag tttagaaaat agaggatatg cgaatggaaa caatattgga + 13081 ataaagtatg ctgaggataa tggatatgat tacatttgta tattaaacaa cgatacatta + 13141 attgaggttg attttttgga atcgtgtaaa cgagaactag aaaataattc cttcgttgcc + 13201 tttgttagtc cagtgttagt tgaatataaa gataataact tggtacaatc tacaggtggt + 13261 gatattttta ttaatagggg aattgtaact ttaaaaaatc atggtgctca gagagacaaa + 13321 cttccttcta aaatcgaaag tgactatatt gggggagcat gtttgatgtt caaaacctct + 13381 atcttgaaaa ttattggata tatacctgaa agttactttc tattttatga agaaactgaa + 13441 tggtgttata gggctaaaaa attaggctat aagaatatat gccttactca aagttatgtt + 13501 tatcataaag gttcggtctc tataaaagcg gtcaatggac ttcaagaata tttaatggca + 13561 agaaatagag ttgtatttgt tcgtagaaat gtaaatagta aactaaagta ttctgctttt + 13621 ttgttctatt tattcatgca acaactttat cattgctttt tgcgaaggga ttgttttaaa + 13681 
agaaagtata aatattattt agatggtgta tttaatagaa ttgatccatc ctatccattt + 13741 attttcataa gcgaataagt tactacttat aactgtagat gcactaagat aattatagta + 13801 gactgaatct aaaatagtac gaaataattg ctaaaacatt tatagaaatt aattttattt + 13861 tcccaatcga tttgttctta tcttatttca atctgctata gattaaataa gtaaagaaag + 13921 tggtcattat aggaacataa tttaacatag ttaggtgaaa tatgaaagtg tttgatatat + 13981 ctcaaataaa aacaaaaaca gttgcatttg atttttttga tactattgtg cataggaatt + 14041 gtcatcctga gcaaattttg tatcagtggg ctaaggaaat ggctttggag gtgaatttca + 14101 atatatctcc ttcaatatta taccaaatca gaaaaagtgt cgaaaacaat aaaaagttag + 14161 gcactgaaga aatgtgttat ctagaccttt tgtctggaat atataatgaa attaaagata + 14221 agataaaaaa tacatcgaaa gaagagttta ttcatagagc taaaattcta gagttgaaaa + 14281 ttgaattaca acatatttat ttggattcgg aaattaaaga agttttaaaa aaattgaaaa + 14341 gtgattcaaa acagattatc ttagtttctg atttttatac tgataaagaa ttaatagaaa + 14401 ctgtattaaa aaagtttgaa gtttttgatt atttctcttc tatctatatt tcgagtgaga + 14461 aaggctgccg taaatccaca ggaaatttat ataagttaat tttaaaagaa ttaggcttaa + 14521 atcctaaaga aattaccatg ataggagata attataaatc tgattatgaa gtgccacgtt + 14581 ctctaggatt aaatgctatt tatagacaat acatagataa aaatacaata gtagcagaaa + 14641 aagagttggt aagactatat aatcaaattt tattttctaa cagtaaaaaa gcaccgttta + 14701 atattttttt agctgacatc gtattcttta tttcgaaatt gcataaaaag atgattcaag + 14761 atgatgttca aatagcactc ttttgctcaa gagaaggaca gttattgaaa atactttttg + 14821 atatatatca aaatactttt tttgggaaaa atcaaaagat ttgtacagaa tatttttatg + 14881 tttctagacg atcgacatta tattcttctt ttacttcttt agataatgaa gagtttgaga + 14941 cgatttttcg tcaatataaa aaaattacat tacaaaattt cttgttaaat ttaaactttt + 15001 ctgataatga aatcatattg atttgtcaag atttaaaaga gaaaccaaca tatgtattaa + 15061 cagtagacga tcatttatta gagaaactca aaaaacatcc tcagttcatt acgaagttca + 15121 ataaagagaa aaaagacagt caattactac gtgattatat agagtattta actaaaaacc + 15181 aaaatgaagt atatttagtc gatgtgggtt ggaaaggaac gatacaagat aatatcaaaa + 15241 aggctcttcc agacaagaga atagtaggtt attatctggg attgatactc aatgcttact + 15301 
cagtagaaaa taaaatggat aaaactggtt tattgttttc tgattatcca agtaaatcga + 15361 aattttatga tattgtgagt agaaattttg gtttttatga agatattttt gtagcagatc + 15421 atggtccagt tttgaaatat aaaaaagaga gtgatattat ccccattatt gacgatgata + 15481 agaaacatgt gagtatttat caggcagtta aagattatca agaagagtta gtattaggat + 15541 tttcagaaat tttggaagct tataagaaaa tgaagtttct cccttttgaa caaaaaaatc + 15601 tgtggctaat gatgtcgcta aaaaaagaat gtatttatat acctaagtta caatcatttt + 15661 ctgaatcttt aaaagaaaaa gttgttgaaa attttggtga gatagtaact cttaagacta + 15721 cgaaaaaatc tataaaaacg ttattaagaa agaaaagcga tttactttgg gttgatttcg + 15781 tttatagatt gtttggtggt gtcaatttcc tatttattcc agaattatat acaagagtta + 15841 tatttttatt gaaatattta gatttgaaat tgaggttgaa aaattatggg gaataaatcc + 15901 ataaagttga atgcattatt aaatattgtc ctgacgctat caaatatcat tttcccatta + 15961 atcacttttc cttatatatc tagaatattg aatccaaatg gtataggttt aacttcattt + 16021 tttagttcaa tagggaatta tggtatttta cttgcttctc tgggaatttc aacttatggt + 16081 atcaaagcag tagcaagtgt tagagatgat agagataagt tgtcaaaagt agtacaggag + 16141 ttaatgatta taaacgttgc tatgtctata ataacaactg caatactatt atttatgact + 16201 atatttataa cacaattgaa tagagaattt tcactcctat tgatcacatg tgggactatt + 16261 ttatcttctc ctttcgcctt aaattggttg tatagtggaa tggaagaata tacgtatatt + 16321 actactaggt cagtagtgtt taaaattcta tcattaatat tgatttttct acttgtgaaa + 16381 aggccagagg attatattgt ttttgctagt atttcattgt tttcttctct aagttcaaat + 16441 atcttaaatc tatggcatag ccgacatttc attaatatta aattatataa aaatttacaa + 16501 tttaaatatc attttaaacc aatgtggtat ttatttgcct cattacttgc agtaaatatt + 16561 tatactaatt tagatacagt gatgctcggt tttattaatg gtaatgaggc tgtgggatac + 16621 tattctgtgg catcaaaggt taagtggatt ttgctttctc ttattacatc tattagtgca + 16681 gttttgctac cgagactttc attttatatt agtaaaaatg acacctcgaa ttttataaaa + 16741 atgttaaagg agtcatctgc ggttatattt tttattgcga ttccattgat ggtattcttt + 16801 attgtagagg cgaaagatag tatcttatta ctaggaggaa gtcagtatct tcctgcgact + 16861 ttagcgatgc aaatacttat gccaatttta cttatttctg gtttctcgaa tattacagga + 16921 
aatcaaatat tgattccaat gaatagagaa aaatatttta tggttgcagt aacgattggt + 16981 gctgtgatta atcttatttt gaatctactg ttaatgccta agtttggaat tattggtgct + 17041 tctgtcgcaa ctctttttgc ggaattgtcg cagatgacgg tacaattaca tttttcaaaa + 17101 gaatatttag tatcaaatat atcgataaag agtttggtta atgtgataat tgcaacagtt + 17161 gtttctacaa taccactaat cattttgaat cagctgataa cgataactat accattttat + 17221 tctctaatgc tagcaggttt tgctttcttt tcattatatt tagtaattct gcttttatta + 17281 aaggaggaag tgacgattca attattttct cttcttgcaa agaagaagta aattggttag + 17341 aaattgaaat gtataaacaa ataaagaatt taattattga tttaggagga aatcatgaag + 17401 ataatgctag tttttggtac acgtccagaa gcgataaaaa tgtgtccatt agtgaatgag + 17461 ttgaaaaaac aggcagatat ggaaacagtt gtttgtgtaa ctggtcaaca caaggagatg + 17521 gttagccctg ttttggaatt gtttggagtt caaccagact atgatttaga aataatgaaa + 17581 gctaatcaaa ccttgttctc tataacaaca agtattttag aaaaaattaa acctgtttta + 17641 gaagaagaac aaccagatat tgttctagtt catggtgaca ctactacaac atatgcagca + 17701 gctttggcag cattttatct tggaattaag gttggccatg ttgaagctgg gttacgaact + 17761 tacaacctgc aaagtccctt cccagaagaa tttaatagac aatcgacttc tattattgca + 17821 aattatcatt ttgctccaac tgaattggct aaagaaaatc tcttaaaaga gggtagagag + 17881 aatgtttatg taactggaaa tacagttatt gatgcactta caactacagt acaaaaggat + 17941 tatacacacc ctgatttaga tttaaacgtt aacactcgtc ttattctact gactgctcat + 18001 agacgtgaaa atctcggaga acctatgaaa cacatgttta gagctgttaa acgagtctta + 18061 aatgaatatg acgatgttaa ggtaatttat ccaattcata agaatccctt ggtgcgtgaa + 18121 acagctacag aaatttttgg agacacagaa cgtattcaga ttattgaacc tttggatgtt + 18181 cttgattttc ataatttcat gaatcatagt tacatgattt taactgattc aggaggagtt + 18241 caggaagagg ctccttcttt aggaaaacct gtattggtca tgcgagatac gacagaaaga + 18301 cctgaaggag tagctgccgg aacgttgaaa ttggttggaa ctgatgagga gactatttat + 18361 caaaacttta agatgctttt agacgattcc gaagaatata aaaaaatgag tcaagctagt + 18421 aatccttatg gaaaaggtga tgctagtaaa cagattgttc atattttaag cggaatttaa + 18481 gcgaggccaa ataaagtaat aaaaaacact atcttataaa aggtattgat cttgtagttg + 18541 
attcgggaac atgttcatat cctttgactc gagctacata aaaataactt gtgctgattt + 18601 atgatagatc gataatttac tactactttg gacattgatg ttagcagtta ttagggatgt + 18661 tttgattaac tcaacttttc aggattcgcc ttgctttcta gattttcttc tgatttttat + 18721 cattacttca gtaagttaaa tcgtctattt actagaatta aaacttttaa aaaatccatt + 18781 gttagctcat gttttagata taggtaaaca taaatttagg aggtgttagt ttgaagattg + 18841 taattccaag aattattcat aacaaagaac aactgacctg ggattggtcc gggacaataa + 18901 ctaatataaa aaaattttta gggaaatacg agattgttga ggaacagaat attttctata + 18961 cttttagaat gaatgtgcac aaagtgcttg ttcgtttagg tattaaaaaa tctgatatga + 19021 gcatgacgta tataaaatat gctgaaaatc aagttcatct atcgccagag gatgtttgtc + 19081 tcacgtttga tgaatttcct ttatcttttc ctgataatcc agtttatatc tatcaagact + 19141 taaatcttca ttatttgata gagagttctc aaaacaatag tcaatcgttc aaatatagtg + 19201 gttttcaaaa cgtcccggct gatattctag atagacgaat gagaaaacag gaaatatttt + 19261 ataatcaagc tactggaata tttactatga gtaaatggtt ttcagattac ttgatagctc + 19321 aacaaggact tccagttgaa aaagttcatt atgtgggggc aggaacaaat atgaataatc + 19381 tatttcttga ccactctcat aaggaacgta ataagttttt atttattggt aaagattttt + 19441 ttcgtaaagg aggagatctt gtttataatg cttttgtcta tttgcaaaat aatctcatgc + 19501 cggaggcaga gttgtacatt ataggtcctt cagatgttcc gatggaattt aacaatccga + 19561 atgtttattt tttaggtaat ctatcagctg ataaggtgca atatttttat aatctttgtg + 19621 atgtatttgt tttaccttcc cgatttgagg catttggaat tgtatttgtt gaagctcttt + 19681 gctatggttt accatgtatc ggtcgtgatt taatggaaat gccaaaccta attcaaaata + 19741 atgaaactgg attattatta cctactgaag aggaaaatcc acaggtttta gctgacgtaa + 19801 tgtataattt gataaaagat gaaagctttt ttaaaaatgt tcagactaaa caagattatt + 19861 ataaagcaga atattcgtgg gacacagttg ccaaaagaat gatttcaatt atgaagcaag + 19921 atatgaacaa caatctataa gtgaaaaatt aaaagatatt ctagtctaac ggtctattcc + 19981 tactaacagt aatactgaaa gaaattttaa aatacaagtt atacgtatag tgacttctcc + 20041 taattctgac atggtgaaaa gattatttaa aacctaattt aaaagattaa aggaagttaa + 20101 attcagctta ttgaataaaa ttaatttagt ctagttattt tcttgtcagt cttattcatt + 20161 
tttttccgaa ccttgtgagt tgtttgcaac taccagaata cacaaagaac agaatctctt + 20221 agcatcattg aatagaacaa tatctgcata aatttcagat ataactagtg gtgcagaaag + 20281 tggatctttg aaaataagaa ttctttgtag agctatttca ctagctggtg aagaattgtt + 20341 tttcaatttt tcgtacagat tacaataatg ttatggtggg tttaaatttc tttgttggtt + 20401 gtgtttgatg aatagagatg cacgtatcga aattcaagat agtggtgata tcgcttgctt + 20461 aatctcttct ccagtatttg tagtagaatt aagtgttctt gattaaaata aagaacacaa + 20521 cactttttat tcagtgttgt gtattgggtg aaacgaaagg aacgattgta cttatgaaag + 20581 gtattattct cgcgggtggt tcggggacac gtttatatcc tttgactcga gctgcatcaa + 20641 agcaactgat gccggtttat gataaaccga tgatttacta cccactttca actttgatgt + 20701 tggctgggat tagggatatt ttgattatct caactcctca agatttgcct cgttttaaag + 20761 agctccttca agatggctct gagtttggga ttcaattgtc ttatgcagag caaccgagtc + 20821 cagatggttt ggcacaagcc tttattattg gtgaagaatt tattggtgat gatagcgttg + 20881 cgctaatctt aggtgataat atctaccatg gttctgggct ttccaagatg ctacaaaagg + 20941 cagcgagtaa ggagtcggga gcaactgttt ttggctacca tgtcaaggat ccagagcgct + 21001 ttggtgtggt tgagtttgat caggatatga aggctatttc tattgaagaa aagccagagc + 21061 aacctcgttc aaactatgca gttacaggtc tctatttcta tgataatgat gtagtagaga + 21121 ttgccaagag tattaaacca agtcctcgtg gtgaactgga aattacagat gtaaacaagg + 21181 cttacctaga tcgtggtgat ttgtctgttg agcttatggg acgtggcttt gcttggctgg + 21241 atactggaac tcatgaaagt ttactagagg cttcacagta catcgaaaca gtgcaacgga + 21301 tgcaaaatgt tcaggtagca aacttagaag aaattgctta ccgtatgggc tatatcagtc + 21361 gagaagatgt attggcctta gcccaaccac ttaagaaaaa tgaatacgga cagtatctgc + 21421 tccgtttgat tggagaagca tagatgacag ataagttttt cggtaagacg cttgcggcac + 21481 gcaaggttga agctattcca ggcatgttgg agtttgatat ccccgttcat ggagataatc + 21541 gtggctggtt taaagaaaat ttccaaaagg aaaaaatgct tccacttgga tttccagagt + 21601 ctttctttgc agaaggaaaa ttgcaaaaca atgtatcctt ctcacgtaaa aatgtccttc + 21661 gagggctcca cgcagagcct tgggataagt acatctctgt agcagatgga gggaaagttc + 21721 tgggttcttg ggttgatcta cgcgagggtg aaacctttgg gaatacctat cagacagtaa + 21781 
ttgatgcaag caagggaatc tttgttcctc gaggcgtagc taatggcttc caagttctat + 21841 cagatacagt gtcatatagc tatctggtca atgattactg ggctctcgag ctcaaaccca + 21901 agtatgcctt tgtgaactac gctgatccaa gccttggtat tgaatgggaa aatattgcag + 21961 aagcagaggt ttcagaagca gataaacatc atcccctact taaggatgta aaacctttga + 22021 aaaaagaaga tttgtaaaaa ggaaagaata tgactgaata caaaaatatt atcgtgacag + 22081 gtggagctgg ctttatcggt tctaactttg tccattatgt ttacgagaac tttccaggtg + 22141 ttcacgtgac agtcctagat aagttgactt atgctggaaa tcgcgcgaat attgaggaaa + 22201 ttttaggtaa tcgtgttgag ttagttgttg gtgacattgc tgatgcggag ttggtagaca + 22261 agttggctac tcaagcagat gctatcgttc attatgcagc ggaaagccac aatgataatt + 22321 cgctcaatga tccatcgcca tttattcata ctaacttcat cggaacctat actcttttag + 22381 aagctgctcg taagtatgat attcgcttcc accatgtatc gacagatgaa gtttatgggg + 22441 atctcccttt acgcgaagat ttgccaggtc atggagaagg gccgggtgag aaatttacgg + 22501 ctgaaaccaa gtacaatcca agctcgcctt actcatcaac caaggcagcc tcagatttga + 22561 ttgtcaaagc ctgggtgcgt tcttttggag tcaaggcaac gatttccaac tgttcaaata + 22621 actacggtcc ttaccagcat attgagaagt ttattccacg acaaatcacc aatatcttga + 22681 gcggtatcaa gccaaaactt tacggtgaag gtaagaacgt tcgtgactgg attcatacca + 22741 atgaccattc ttcaggagtt tggacaatct tgacaaaagg gcaaatcggt gaaacctact + 22801 tgattggggc tgatggtgag aagaacaata aggaagtttt ggaacttatc cttaaggaaa + 22861 tgggacaagc tgcggatgcc tatgatcatg tgactgaccg tgcaggacat gaccttcgct + 22921 atgcgattga tgctagcaag ctccgtgatg agttggggtg gaaacctgaa tttaccaact + 22981 ttgaagctgg gctcaaggca acaatcaagt ggtatacaga taaccaagaa tggtggaaag + 23041 cagaaaaaga agctgttgaa gccaattatg ctaagactca ggagattatt acagtataaa + 23101 aagcaggaaa tagctgcttt ttattgctat attgggaaga gttacatatt agaaaggtct + 23161 agagatgatt ttaattacag gggcaaatgg ccaattagga acggaacttc gctatttatt + 23221 ggatgaacgt aatgaagaat acgtggcagt agatgtggct aagatggaca ttaccaatga + 23281 agaaatggtt gagaaagttt ttgaagaggt gaaaccgact ttagtctacc attgtgcagc + 23341 ctacaccgct gttgatgcag cagaggatga aggaaaagag ttggacttcg ccatcaatgt + 23401 
gacggggaca aaaaatgtcg caaaagcatc tgaaaagcat ggtgcaactc tagtttatat + 23461 ttctacggac tatgtctttg atggtaagaa accagttgga caagagtggg aagttgatga + 23521 ccgaccagat ccacagacag aatatggacg cactaagcgt atgggggaag agttagttga + 23581 gaagcatgtg tctaatttct atattatccg tactgcctgg gtatttggaa attatggcaa + 23641 aaacttcgtt tttaccatgc aaaatcttgc gaaaactcat aagactttaa cagttgtaaa + 23701 tgaccagtac ggtcgtccga cttggactcg taccttggct gagttcatga cctacctagc + 23761 tgaaaatcgt aaggaatttg gttattatca tttgtcaaat gatgcgacag aagatacaac + 23821 atggtatgat tttgcagttg aaattttgaa agatacagat gtcgaagtca agccagtaga + 23881 ttccagtcaa tttccagcca aagctaaacg tccgctaaac tcaacgatga gcctggccaa + 23941 agccaaagct actggatttg ttattccaac ttggcaagat gcattgcaag aattttacaa + 24001 acaagaagtg agataagtag tagaatgatt ttctagtcta ataaaagagg cagagaatga + 24061 actccaaagg agcttaagat gtacgattat cttgttgttg gtgcagtctt tgcccatgaa + 24121 gcagtcttaa aaggaaaaaa agtaaaagtt attgaaaaat gaaatcatat cgcgggtaat + 24181 atctatactc gtgaagagga aggaattcaa gttcatcaat atggtgctca tatcttccat + 24241 acttctgata aggagatctg ggattatgta aatcagtttg cagagtttaa ccgttacata + 24301 aattctcctg ttgcaaacta taagggtgag atttataacc ttccttttaa tatgaatact + 24361 ttcaataaac tctggggagt tgtaacgcca gcagaagcac aagctaagat tgatgaacaa + 24421 cgtgctattt taaatggtaa aactcctgaa aatttggaag aacaggcgat ttctcttgta + 24481 gctacagaca tctacgaaaa attaatcaaa gactatacag agaaacagtg gggcaaacca + 24541 actactgaac ttccatcctt tattattgtt tgccagtacg cctgacctat gataacaact + 24601 attttaacga tacctatcaa gggattccaa ttggtagata cactcaaata gttgaaaaat + 24661 gttggatcat gaaaatattg atgtagaaac aaacgttgat ttctttgtga ataaagagca + 24721 atatctgaaa gattttccta agattgtctt tactggtatg attgatgaat tctttgacta + 24781 taagttgggc gaactagagt accgtagtct tcgttttgaa aatgagacct tggatatgga + 24841 aaattaccaa ggaaatgcag ttgtgaacta tacggatgca gaaaccccat atactcgcat + 24901 tattgaacac aaacattttg agtttgggag tcaagcaaag actatcatta ctaaagaaca + 24961 ttctaaaaca tgggaaaaag gtgatgagcc ttattatcca gttaataatg atcgtaataa + 25021 
tcatttgtat aaatcatata aaaaacttgc tgatgagcaa gggaatgtta tctttggtgg + 25081 ccgcttagga cactatcgtt attacgatat tcaccaagta attggagcag ctttgcagtg + 25141 cgtgagaaat gagttaaatt aatactcaat gaaaatcaaa gagcaaacta ggaagctagc + 25201 cacaggttgc tcaaaacact gttttgaggt tgcagatgga cgctgacgcg gtttgaagag + 25261 attttcgaag agtataaaca agtaaaactg actaccagtt attatttaga aatagtatta + 25321 aaaattcctt gactatgtga tatagttgag ggatttttaa atgatattca tattttttgc + 25381 aaagatgttg tttgaaaaat aattttcaaa aattctgaaa attctgttga caactttctg + 25441 aaaagagtct ataatggaga gaaagtttta aaggagaaaa tgatgaaaag ttcaagacta + 25501 tttgcccttg cgggcgtgac attattggcg gcgactactt tagctgcatg ctctggatca + 25561 ggttcaagca ctaaaggtga gaagacattc tcatacattt atgagacaga ccctgataac + 25621 ctcaactatt tg +// + diff --git a/public/res/serotype_genbank/serotype_19F.gb b/public/res/serotype_genbank/serotype_19F.gb new file mode 100644 index 0000000..fff2e2f --- /dev/null +++ b/public/res/serotype_genbank/serotype_19F.gb @@ -0,0 +1,904 @@ +LOCUS CR931678 19798 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 485/61 (serotype 19f). +ACCESSION CR931678 +VERSION CR931678.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 19798) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 19798) + AUTHORS Bentley,S.D. 
+ TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..19798 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="485/61" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC19F_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC19F_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI33688.1" + /db_xref="UniProtKB/TrEMBL:Q4JZI8" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVELL" + gene 293..461 + /gene="aliB" + /locus_tag="SPC19F_0002" + /pseudo + CDS 293..461 + /gene="aliB" + /locus_tag="SPC19F_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene 1107..2384 + /gene="intron" + /locus_tag="SPC19F_0003" + CDS 1107..2384 + /gene="intron" + /locus_tag="SPC19F_0003" + /note="member of homology group 108" + /codon_start=1 + /transl_table=11 + /product="putative group II intron protein" + /protein_id="CAI33690.1" + /db_xref="GOA:Q4K0V6" + /db_xref="InterPro:IPR000477" + /db_xref="InterPro:IPR013597" + /db_xref="InterPro:IPR015706" + /db_xref="UniProtKB/TrEMBL:Q4K0V6" + /translation="MSKLLDKILSRENMLEAYNQVKSNKGSAGIDGMTIEEMDNYLRQ + NWRLTKELIKQRKYKPQPVLKVEIPKPDGGIRQLGIPTVMDRMIQQAIVQVMSPICEP + HFSDTSYGFRPNRSCEKAIMKLLEYLNDGYEWIVDIDLEKFFDTVPQDRLMSLVHNII + EDGDTESLIRKYLHSGVIINGQRYKTLVGTPQGGNLSPLLSNIMLNELDKELEKRGLR + FVRYADDCVITVGSEAAAKRVMYSVSRFIEKRLGLKVNMTKTKITRPRELKYLGFGFW + KSSDGWKSRPHQDSVRRFKLKLKKLTQRKWSIDLTRRIEQLNLSIRGWINYFSLGNMK + 
SIVASIDERLRTRLRVIIWKQWKKKSRRLWGLLKLGVPKWIADKVSGWGDHYQLVAQK + SVLKRAISKPVLEKRGLVSCLDYYLERHALKVS" + misc_feature 1281..1931 + /gene="intron" + /locus_tag="SPC19F_0003" + /note="HMMPfam hit to PF00078, Reverse transcriptase + (RNA-dependent DNA pol, score 1.3e-65" + misc_feature 1977..2228 + /gene="intron" + /locus_tag="SPC19F_0003" + /note="HMMPfam hit to PF08388, Group II intron, + maturase-specific domain, score 5.5e-30" + gene complement(2441..3226) + /gene="tnp" + /locus_tag="SPC19F_0004" + /pseudo + CDS complement(2441..3226) + /gene="tnp" + /locus_tag="SPC19F_0004" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(2855..3226) + /gene="tnp" + /locus_tag="SPC19F_0004" + /note="HMMPfam hit to PF01710, Transposase, score 1.1e-14" + /pseudo + gene 3475..4920 + /gene="wzg" + /locus_tag="SPC19F_0005" + CDS 3475..4920 + /gene="wzg" + /locus_tag="SPC19F_0005" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33692.1" + /db_xref="GOA:Q4K0V5" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K0V5" + /translation="MSRRFKKSRSQRVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAIIQKLTST + EVLKNYSSILQGLQDSLQTNMPIETMIDLVNTQLESGGNYKVNSQDLKGTGRMDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 3475..3591 + /gene="wzg" + /locus_tag="SPC19F_0005" + /note="Signal peptide predicted for SPC1032 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 
39 and 40" + misc_feature 3679..4026 + /gene="wzg" + /locus_tag="SPC19F_0005" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 1.6e-64" + misc_feature 4204..4647 + /gene="wzg" + /locus_tag="SPC19F_0005" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 3.5e-70" + gene 4922..5653 + /gene="wzh" + /locus_tag="SPC19F_0006" + CDS 4922..5653 + /gene="wzh" + /locus_tag="SPC19F_0006" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33693.1" + /db_xref="GOA:Q4K0V4" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K0V4" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTLDALEKLEKKEIPTLNDS + RYALIEFSMHTSYRQIHTGLSNILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QINSYHVSKPKFFGEKYKFMKKRARYFLERDLVHVVASDMHNLDSRPPYMQQAYDIIA + KKYGAKKVKELFVDNPRKIIMDQLI" + misc_feature 4925..5533 + /gene="wzh" + /locus_tag="SPC19F_0006" + /note="HMMPfam hit to PF02811, PHP domain, score 1.3e-37" + gene 5662..6354 + /gene="wzd" + /locus_tag="SPC19F_0007" + CDS 5662..6354 + /gene="wzd" + /locus_tag="SPC19F_0007" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33694.1" + /db_xref="GOA:Q4K0V3" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K0V3" + /translation="MKEQNTLEIDVLQLFRALWKRKLVILLVAIITSSVAFAYSTFVI + KPEFTSMTRIYVVNRNQGEKSGLTNQDLQAGSSLVKDYREIILSQDVLEEVVSDLKLD + LTPKDLANKIKVTVPVDTRIVSVSVSDRVPEEASRIANSLREVAAQKIISITRVSDVT + TLEEARPATSPSSPNIKRSTLIVFLAGVIGTSVIVLILELLDTRVKRPKDIEDTLHMT + LLGIVPNLNKLK" + misc_feature 5680..6096 + /gene="wzd" + /locus_tag="SPC19F_0007" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 3.4e-52" + gene 6364..7053 + /gene="wze" + 
/locus_tag="SPC19F_0008" + CDS 6364..7053 + /gene="wze" + /locus_tag="SPC19F_0008" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33695.1" + /db_xref="GOA:Q4K0V2" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K0V2" + /translation="MPTLEIAQKKLEFVKKAEEYYNALCTNIQLSGDKLKVISVTSVN + PEEGKTTTSVNIARSFARAGYKTLLIDGDTRNSVMSGFFKSREKITGLTEFLSGTADL + SHGLCDTNIENLFVVQSGTVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTAPIGIVI + DAAIITQKCDASILVTATGEVNKRDVQKAKQQLEQTGKLFLGVVLNKLDISVDKYGVY + GFYGNYGKKII" + gene 7064..8431 + /gene="wchA" + /locus_tag="SPC19F_0009" + CDS 7064..8431 + /gene="wchA" + /locus_tag="SPC19F_0009" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI33696.1" + /db_xref="GOA:Q4K0V1" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K0V1" + /translation="MDEKGLKIFLAVLQSIIVILLVYFLSFVRETELERSSMVILYLL + HFFVFYFSSYGNNFFKRGYLVEFNSTIRYIFFFAIAISVLNFFIAERFSISRRGMVYF + LTLEGISLYLLNFLVKKYWKHVFFNLKNSKKILLLTVTKNMEKVLDKLLESDELSWKL + VAVSVLDKSDFQHDKIPVIEKEKIIEFATHEVVDEVFVNLPGESYDIGEIISRFETMG + IDVTVNLKAFDKNLGRNKQIHEMVGLNVVTFSTNFYKTSHVIAKRIIDIMGALVGLIL + CGLVSIVLVPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYVQYTSE + QKRRLSFKPGITGLWQVSGRSKITDFDDVVKLDVAYIDNWTIWKDIEILLKTVKVVFM + RDGAK" + misc_feature 7847..8428 + /gene="wchA" + /locus_tag="SPC19F_0009" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 4.7e-155" + gene 8435..9178 + /gene="wchO" + /locus_tag="SPC19F_0010" + CDS 8435..9178 + /gene="wchO" + /locus_tag="SPC19F_0010" + /note="member of homology group 33" + /codon_start=1 + /transl_table=11 + /product="putative WecB-family glycosyl transferase" + /protein_id="CAI33697.1" + 
/db_xref="GOA:Q54522" + /db_xref="InterPro:IPR004629" + /db_xref="UniProtKB/TrEMBL:Q54522" + /translation="MRDRIQLLGVTIDLLTMNETIDSVEQYVLEKRPLHLMGVNADKI + NQCHTDEKIKKIVNESGIINADGASVVLASKFLGTPVPERVAGIDLMQCLLELSNKKG + YSVYFFGAKEEVLQDMLKVFKRDYPNLIVIGHRNGYFSEEDEQAIQEDIREKNPDFVF + IGITSPKKEYIIQKFMDSGVNSVFMGVGGSFDVLSGHIQRAPLWMQKSNLEWLFRVAN + EPKRLFKRYFVGNISFIGKVLKAKRGVKY" + misc_feature 8597..9112 + /gene="wchO" + /locus_tag="SPC19F_0010" + /note="HMMPfam hit to PF03808, Glycosyl transferase + WecB/TagA/CpsF f, score 1.6e-95" + gene 9175..9999 + /gene="wchP" + /locus_tag="SPC19F_0011" + CDS 9175..9999 + /gene="wchP" + /locus_tag="SPC19F_0011" + /note="member of homology group 95" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="CAI33698.1" + /db_xref="GOA:Q4K0U9" + /db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4K0U9" + /translation="MNQTEMIRLIQKVELDAIKEFKKICEENDIDFFLRGGSVLGAVK + YDGFIPWDDDMDIAVPREAYDKLPSVFKDRIIAGKYQVLTYQYCDTLHCYFPRLFLLE + DERKRLGLPRNTNLGLHLIDIIPLDGAPNHSVLRKIYFGKVYWYRFLASLGTTYVGDH + VDMHSTKQKLIIGFFKKLGFAKLFPQNSVYRRLDNLYRKYDWKKQKYAGTINASLFAK + EVMPVEIWGEGVEKPFEDTFFKVPTEYDRYLKRLYGENYLYEEPSDDEKKSHLGGH" + misc_feature 9247..9936 + /gene="wchP" + /locus_tag="SPC19F_0011" + /note="HMMPfam hit to PF04991, LICD Protein Family, score + 5.5e-109" + gene 10001..10879 + /gene="wchQ" + /locus_tag="SPC19F_0012" + CDS 10001..10879 + /gene="wchQ" + /locus_tag="SPC19F_0012" + /note="member of homology group 43" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33699.1" + /db_xref="GOA:P97000" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:P97000" + /translation="MFCYIILHYKVLEETISCVKSIKEGNYNAKQIVIIDNFSNNGTG + EKLQELYESDLEIDVLINHENAGFARGNNVAYQFAKEKYNPDFMVIMNNDIEIETENF + EKIVTDIYREEKFHLLGPDIFSTTYQLHQNPKRLTHYTYGEVKALNEKFKKGSQVSLA + LKIKCWLKASKVLRTAIYQNRRKKGSVDYRKQVENPILHGSFIVYSRDFIEKEEYAFN + PNTFFYYETEILDYEAELKGYKRIYTPKIRVLHHQNVATNQVYTNLLEKTLFSNKCNF 
+ KSTSYFLKLMKENEDV" + misc_feature 10007..10546 + /gene="wchQ" + /locus_tag="SPC19F_0012" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 5.1e-11" + gene 10880..12217 + /gene="wzy" + /locus_tag="SPC19F_0013" + CDS 10880..12217 + /gene="wzy" + /locus_tag="SPC19F_0013" + /note="member of homology group 161" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33700.1" + /db_xref="UniProtKB/TrEMBL:P97001" + /translation="MSYLFLLCLTLFLLTIFYFFAFIQDLIAPPVVMSVMFLISSVFA + LVNSKNWNIEYSGIAYILIISGIIIFSIPLMALKSPNFNTEVKIADRLIDIQFWKIAL + TIIIDLFILYLYRKEIYNLVLSNGYTGSNIQWFFRNATSYEGELTVRTFIRVLIRVID + VSAYIFGYTFINNFLIYRHKRPKDILLLVPLLIFISKTLISGGRQDIIKILIAYVIMM + YIQQKRKVGWNRVISHKYIHLGFVGLIAGIPAFYYSLFLAGRSTTRTLFESVSTYLGG + SIQHFNQYIENPLDPGEVFGSETLVPILNILGEMGLVNYRSTIHLEFRTLGVTVGNVY + TFFRRPLHDFGLVGMYVFVFAVGAFFAIYYLVLRKKQVGFNLDIHTIIYSYVFYWIFL + SSIEQYSFTMISLYTLVFIVLVYFMAIFYWCTDFKRGKLIFKISDSSIKLKEE" + misc_feature 10880..11011 + /gene="wzy" + /locus_tag="SPC19F_0013" + /note="Signal peptide predicted for SPC1040 by SignalP 2.0 + HMM (Signal peptide probability 0.993) with cleavage site + probability 0.610 between residues 44 and 45" + gene 12240..13661 + /gene="wzx" + /locus_tag="SPC19F_0014" + CDS 12240..13661 + /gene="wzx" + /locus_tag="SPC19F_0014" + /note="member of homology group 82" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33701.1" + /db_xref="UniProtKB/TrEMBL:Q4K0U6" + /translation="MNTKIKNIITSFSYVISSNLLIVLTSSLVVLIFPKIMGVTEYSY + WQLYIFYLTYIGFFHLGWIDGIYLKYGGLEYTNLDRKQFYSQMILFSSFLMLISLVLF + TLNLITVRDENARYIYNMAIISMIVTNLRTLYVYILQMTNRLKDSSVILISDRVLYVL + LLFMFIVFGWHEYKVMIWADILGRTFSLMLSFWICKDIVFQPLSKFILDFKESLDNIR + VGINLMLSNIASSMIIGIVRMGIQWNWNIETFGKVSLTLSISNLLMTFINAIGLVIFP + LIKRTKTENLPKIYSNLRNALMLVMFAILLFYYPLKFILDIWLPAYKDALVFMALIFP + MSVYEGKMALVINTYLKAMRMEKDILKINALVMLTSIVVTLVTTILLNNLGLTVVSIV + ILLALRSIIAELILSKKLKISVKQDIALELLMTIIFISSSWYLSIWIAVIIYLLAYTL + 
YLYLKHKDIRMYIEYFKNHKKIS" + misc_feature 12240..12359 + /gene="wzx" + /locus_tag="SPC19F_0014" + /note="Signal peptide predicted for SPC1041 by SignalP 2.0 + HMM (Signal peptide probability 0.685) with cleavage site + probability 0.363 between residues 40 and 41" + gene 13725..14813 + /gene="mnaA" + /locus_tag="SPC19F_0015" + CDS 13725..14813 + /gene="mnaA" + /locus_tag="SPC19F_0015" + /EC_number="5.1.3.14" + /note="member of homology group 23" + /codon_start=1 + /transl_table=11 + /product="UDP-N-acetylglucosamine-2-epimerase MnaA" + /protein_id="CAI33702.1" + /db_xref="GOA:Q4K0U5" + /db_xref="InterPro:IPR003331" + /db_xref="UniProtKB/TrEMBL:Q4K0U5" + /translation="MKKIMLVFGTRPEAIKMCSLVNELRKQEDMKTVVCVTGQHKEMV + SPVLDLFGVQPDYDLEIMKANQNLFSITISILEKIKPVLEKEQPDIVLVHGDTTTTYA + AALAAFYLGIKVGHVEAGLRTYNLQSPFPEEFNRQSTSIIANYHFAPTELAKENLIKE + GRNNIYVTGNTVIDALTTTVQKDYTHPDLDLNDGNRLILLTAHRRENLGEPMRHMFRA + VKRVLNEYDDVKVIYPIHKNPLVRETATEIFGDTERIQIIEPLDVLDFHNFMNHSYMI + LTDSGGVQEEAPSLGKPVLVMRDTTERPEGVAAGTLKLVGTDEETIYQNFKMLLDDPE + EYKKMSQASNPYGNGDASKQIVRILRGI" + misc_feature 13788..14804 + /gene="mnaA" + /locus_tag="SPC19F_0015" + /note="HMMPfam hit to PF02350, UDP-N-acetylglucosamine + 2-epimerase, score 1.3e-195" + gene 14852..15721 + /gene="rmlA" + /locus_tag="SPC19F_0016" + CDS 14852..15721 + /gene="rmlA" + /locus_tag="SPC19F_0016" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI33703.1" + /db_xref="GOA:P97004" + /db_xref="HSSP:1FXO" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:P97004" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLHRFQELLQDGSEFGLKLSYAEQPSPDGLAQAFIIGEEFISDDSV + ALILGDNIYHGSGLSKMLQKAASKESGATVFGYHVKDPERFGVVEFDQDMKAISIEEK + PEQPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLALAQPLKKN + EYGQYLLRLIGEA" + 
misc_feature 14855..15571 + /gene="rmlA" + /locus_tag="SPC19F_0016" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 1.1e-119" + gene 15722..16318 + /gene="rmlC" + /locus_tag="SPC19F_0017" + CDS 15722..16318 + /gene="rmlC" + /locus_tag="SPC19F_0017" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI33704.1" + /db_xref="GOA:P97005" + /db_xref="HSSP:1NZC" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:P97005" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKHHPLLKDVKPLKKEDLE" + misc_feature 15758..16288 + /gene="rmlC" + /locus_tag="SPC19F_0017" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 8.8e-16" + gene 16328..17377 + /gene="rmlB" + /locus_tag="SPC19F_0018" + CDS 16328..17377 + /gene="rmlB" + /locus_tag="SPC19F_0018" + /EC_number="4.2.1.46" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI33705.1" + /db_xref="GOA:O54546" + /db_xref="HSSP:1KEP" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:O54546" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPDVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAAD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 16343..17299 + /gene="rmlB" + /locus_tag="SPC19F_0018" + /note="HMMPfam hit to PF04321, RmlD substrate 
binding + domain, score 0.00012" + misc_feature 16346..17086 + /gene="rmlB" + /locus_tag="SPC19F_0018" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 5.4e-77" + misc_feature 16349..17161 + /gene="rmlB" + /locus_tag="SPC19F_0018" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/iso, score 1.4e-05" + gene 17443..18294 + /gene="rmlD" + /locus_tag="SPC19F_0019" + CDS 17443..18294 + /gene="rmlD" + /locus_tag="SPC19F_0019" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI33706.1" + /db_xref="GOA:P97007" + /db_xref="HSSP:1N2S" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:P97007" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITDAEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVARASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 17443..18291 + /gene="rmlD" + /locus_tag="SPC19F_0019" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 1.9e-148" + misc_feature 17446..18087 + /gene="rmlD" + /locus_tag="SPC19F_0019" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 9.7e-05" + misc_feature 17446..18075 + /gene="rmlD" + /locus_tag="SPC19F_0019" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 3.5e-19" + misc_feature 17449..18177 + /gene="rmlD" + /locus_tag="SPC19F_0019" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 1.9e-08" + gene order(18370..19323,19340..19555) + /gene="tnp" + /locus_tag="SPC19F_0020" + /pseudo + CDS join(18370..19323,19340..19555) + /gene="tnp" + /locus_tag="SPC19F_0020" + /note="member of homology group 12" + /pseudo + /codon_start=1 + /transl_table=11 
+ /product="putative IS1670 transposase" + misc_feature 18376..18819 + /gene="tnp" + /locus_tag="SPC19F_0020" + /note="HMMPfam hit to PF03050, Transposase IS66 family, + score 8e-05" + /pseudo + gene 19751..>19798 + /gene="aliA" + /locus_tag="SPC19F_0021" + CDS 19751..>19798 + /gene="aliA" + /locus_tag="SPC19F_0021" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33708.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ89" + /translation="MMKSSKLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcgta taaaaataag + 181 ggaggactgt ataaaagaca gaaatccttt gttttttata accaaggttt ataaactttc + 241 attctcgaaa ttcaattaac tttacaaatt ctcactatta aggagaaaga agatgaacat + 301 aaagaagcgt gtccttagtg caggtctgac ttttgcatct gctttgcttt tagctgcttg + 361 cggccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaattac ctgttagact attacgctga taatatagtc aattgaaaca agaacaagac + 481 aaaagagcct tgtaaaaggt attgcaactt ggtaatacct ttttgatgta cgacgggcat + 541 gtcgtatatc tgaggtgtaa gtcctcggtg ggcacctgct accagtgaac ccaatagcga + 601 ttcccaagcc tgactatcgt gaggtagcag ggagaggaag ggatagcgaa atcgtggctc + 661 tacgaacagg aacgtgatag taaggcgtat atagcggata agggggcctc aaactctaaa + 721 gtccaaaaag gtagtcgtaa cctgtatgcg taaatcacga gagtaattga attcggacta + 781 agatttccta ttttcactgt aaccttttaa cgtcctcata tcttgtataa acgaggaaag + 841 atgtacgatt tatcccgtga ggtctcatga gcgctgaaag cgtagtaaca acgaatcatg + 901 agaagtcagc cgaacccata gtagtgagga aacttctgta gtggaagtgg agcgaagggg + 961 tgagcaacta attgaagtaa tcctacttca cttgtgtctg taaaacgaga ggtctgatag + 1021 aactggagtc tgtcacgtat tgactagatg aaggttcacc aatataagat gtccctcagg + 1081 caccaaaaca agaaaggaat acgcacatgt caaaactgct agataagata ttatcacgcg + 1141 aaaatatgct ggaagcctac aatcaagtaa aatccaataa aggctcagct gggattgatg + 1201 gaatgactat cgaagagatg gataattatc tcagacaaaa ctggcgcttg actaaggaac + 1261 tgataaaaca 
gagaaaatat aagcctcaac cagttcttaa agttgagata cctaaaccag + 1321 acggaggcat ccgtcaacta ggaattccaa cagttatgga tagaatgatt caacaggcca + 1381 ttgtccaagt catgagcccc atttgtgaac cccatttctc agatacgagt tatggtttca + 1441 gaccaaatag gtcatgtgaa aaagccatca tgaagctctt agaatactta aatgacggct + 1501 atgagtggat agtggatata gacctagaga aatttttcga tacagttcct caagatagat + 1561 tgatgtcctt agtacataac attatcgaag acggagatac ggaatccttg attcgtaagt + 1621 atcttcattc aggtgttatc attaatggtc aacgttataa aacactagtt ggtacaccac + 1681 agggaggaaa tttatctcct ctcttatcca atatcatgct taatgaattg gacaaggaat + 1741 tagaaaagag gggacttcga tttgtgcgct acgcagatga ttgtgtgatt acggtcggaa + 1801 gcgaggcagc cgctaagcgt gtgatgtatt cagtcagtcg ttttattgag aaacggctag + 1861 gtttgaaagt aaacatgacc aagactaaga ttaccagacc aagagagttg aaatatctag + 1921 gttttgggtt ctggaaatca tcagatggtt ggaaaagccg tccacatcaa gatagtgttc + 1981 ggagatttaa gcttaaattg aagaaactaa cacagaggaa atggagtata gacctaacaa + 2041 gacgtattga gcaactgaat ttgtctattc gaggatggat aaactatttc tcattgggaa + 2101 atatgaaaag tatagtcgcc agcatagatg agcgcttgcg tactcgccta cgagtgatta + 2161 tctggaagca atggaagaag aaatcgagac gattatgggg attgcttaag ttaggagttc + 2221 ctaaatggat agcagataag gtatctggct ggggcgacca ttatcaatta gtagctcaga + 2281 agtcggtact taaacgtgct atatcaaaac cagtcctgga aaaacgtgga ctggtttcgt + 2341 gtttggatta ttaccttgaa cgacatgcgt taaaagttag ttgaaccgcc gtatgccgaa + 2401 cggcacgtac ggtggtgtga gaggggctag agattatccc ctactcgatg tgctttttga + 2461 tatgagccca tgttttctca ataggattgt actcaggtga gtagggagga agaggtaaaa + 2521 gtttacgccc aaactcttca cataagagtt ctagcttccc cattctatgg aatcttgcat + 2581 tatccataat aataaccgat ggtgtggtta atgttggtaa gagaaacttc tgaaaccaag + 2641 cttcaaaaaa gtcgctcgtc atcgtctctt cgtaagtcat tggagcgatt aactcaccat + 2701 ttgttagacc tgaaaccaaa gaaatcctct gatatcttct tccagatact ttgcctcttc + 2761 ttaactgacc ttttaatgag cgaccatatt ctcgataaaa ataagtatcg aatcctgttt + 2821 cgtcaatcta aacaggtgct aggtgcttta aactattaaa attcttaaga aataaggcta + 2881 cttttctggg tcttgttcat agtaggtgtg 
gttctttttt tagagtgtag cccatagctt + 2941 tgagcgcata gtggatggta gttggatgac agccaaattc agaagctatt tcagtcaaat + 3001 aagcgtctgg attgtcagta agatagtttt taagtctatc tctatcaact tttcttggtt + 3061 ttattccttt tacttggtgg tttagctctc ctgttttctc ttttagcttt aaccagccat + 3121 aaatggtatt acgtgagatt tggaaaacgt gtgatacttc tgttatacta cctgttcgct + 3181 cacaataaga gagaactttt ttacgaaaat ctattgaata ttccataaaa gattatacca + 3241 cattgtgtac tatagtagat tgaaactaga atagtacacc tctgcttcta aaacattgtt + 3301 agaaatcgat ttgactgtcc tgatcgattt gtcatgttct tatttcattt tactatattt + 3361 ttgtttcgcg ggaagtctac taagatactt aaagatgcag atagtaaaaa aaatgtagac + 3421 attaccgtaa aaaagtgata taatcgtatg atgttcaagg tataggtgtt aatcatgagt + 3481 agacgtttta aaaaatcacg ttcacagaga gtgaagcgaa gtgttaatat cgttttgctg + 3541 actatttatt tattgttagt ttgtttttta ttgttcttaa tctttaagta caatatcctt + 3601 gcttttagat atcttaacct agtggtaact gcgttagtcc tactagttgc cttggtaggg + 3661 ctactcttga ttatctataa aaaagctgaa aagtttacta tttttctgtt ggtgttctct + 3721 atccttgtca gctctgtgtc gctctttgca gtacagcagt ttgttggact gaccaatcgt + 3781 ttaaatgcga cttctaatta ctcagaatat tcaatcagtg tcgctgtttt agcagatagt + 3841 gatatcgaaa atgttacgca actgacgagt gtgacagcac cgactgggac tgataatgaa + 3901 aatattcaaa aactactagc tgatattaag tcaagtcaga ataccgattt gacggtcaac + 3961 cagagttcgt cttacttggc agcttacaag agtttgattg caggggagac taaggccatt + 4021 gtcctaaata gtgtctttga aaacatcatc gagtcagagt atccagacta cgcatcgaag + 4081 ataaaaaaga tttataccaa gggattcact aaaaaagtag aagctcctaa gacgtctaag + 4141 aatcagtctt tcaatatcta tgttagtgga attgacacct atggtcctat tagttcggtg + 4201 tcgcgatcag atgtcaatat cctgatgact gtcaatcgag ataccaagaa aatcctcttg + 4261 accacaacgc cacgtgatgc ctatgtacca atcgcagatg gtggaaataa tcaaaaagat + 4321 aaattaaccc atgcaggcat ttatggagtt gattcgtcca ttcacacctt agaaaatctc + 4381 tatggagtgg atatcaatta ctatgtgcga ttgaacttca cttctttctt gaaaatgatt + 4441 gacttattgg gaggggtaga tgttcataat gatcaagagt tttcagctct acatgggaag + 4501 ttccatttcc cagtagggaa tgtccatcta gactctgagc aggctctagg 
ttttgtacgt + 4561 gaacgctact cactagccga tggagaccgt gaccgtggtc gcaaccaaca aaaggtcatt + 4621 gtagcaatta ttcagaagtt aacttctaca gaggttttga aaaactatag tagtattctt + 4681 caaggattgc aggattctct tcaaacaaat atgccgattg agactatgat agatttagtg + 4741 aatactcagt tggaaagtgg ggggaattat aaagtaaatt ctcaagattt aaaagggaca + 4801 ggtcggatgg atcttccttc ttatgcaatg ccagacagta acctctatgt gatggaaata + 4861 gatgatagta gtttagctgt agttaaagca gctatacagg atgtgatgga gggtagatga + 4921 aatgatagac atccattcgc atatcgtttt tgatgtagat gacggtccca agtcaagaga + 4981 ggaaagcaag gctctcttgg cagaatccta caggcagggg gtgcgaacca ttgtctctac + 5041 ctctcaccgt cgcaagggca tgtttgaaac tccggaagag aagatagcag aaaactttct + 5101 tcaggttcgg gaaattgcaa aagaagtggc agatgattta gtcattgctt atggcgcaga + 5161 gatatactat actctggatg ctctagaaaa gctagaaaaa aaagaaattc ctacccttaa + 5221 tgatagtcgt tatgccttga ttgagtttag catgcatact tcctatcgtc agattcatac + 5281 gggattgagc aatattttga tgttgggaat cacgccagta attgctcata ttgaacgtta + 5341 tgatgcttta gagaataacg aaaaacgtgt tcgtgaactg attgatatgg ggtgctatac + 5401 tcagataaat agttatcatg tttcaaaacc taagttcttt ggtgaaaaat ataaattcat + 5461 gaaaaagaga gctcggtatt ttttggaacg tgatttagtt catgtagttg caagtgacat + 5521 gcacaattta gacagtagac ctccatatat gcaacaggca tatgatatca ttgctaagaa + 5581 atatggagcg aaaaaagtaa aagaactttt tgtagataat cccagaaaaa ttataatgga + 5641 tcaattaatt taggagaaaa tatgaaggaa caaaacactt tggaaatcga tgtattgcaa + 5701 ctattcagag ctttatggaa aagaaagttg gtcattttat tagtggcaat tataacttct + 5761 tcagttgctt ttgcctacag tacttttgtt atcaaacctg agtttactag tatgactcgg + 5821 atttatgtag ttaaccgtaa tcagggagag aagtctggtt taaccaatca agacttgcag + 5881 gcaggatcat ccttggttaa agactatcgt gaaattatcc tatcgcagga tgttttggag + 5941 gaagttgttt ctgatttgaa actagatttg acgccaaaag atttggctaa taaaattaaa + 6001 gtaacagtac cagttgatac ccgtattgtc tctgtttcag ttagtgatcg agttcctgaa + 6061 gaggcaagcc gtatcgctaa ctctttgaga gaagtagctg ctcaaaaaat tatcagtatt + 6121 actcgtgttt ctgatgtgac aacactggag gaggcaagac cggcgacatc accgtcttcg + 6181 ccaaatatta 
aacgcagtac actaattgtt tttttggcag gagtgattgg aactagtgtt + 6241 atagttctta ttcttgaact tttggacact cgtgtgaaac gtccgaaaga tatcgaagat + 6301 acactgcata tgacactttt gggaattgta ccaaacttga ataagttgaa ataggagaga + 6361 ggaatgccga cattagaaat agcacaaaaa aaactggagt tcgttaagaa ggcagaagaa + 6421 tattacaatg ccttgtgtac aaatatacag ttgagcggag ataaactaaa agtaatttcc + 6481 gttacttctg ttaaccctga ggaaggaaaa acaactactt ccgtaaatat agcaaggtcg + 6541 tttgcgcgtg caggctataa aactcttttg atcgatggcg atactcgaaa ttcagttatg + 6601 tcaggatttt ttaaatctcg tgaaaaaatt acagggctaa cggaattttt atctgggaca + 6661 gctgatttat ctcacggttt atgtgataca aatattgaaa atttatttgt agttcaatcg + 6721 ggcactgtat caccaaaccc tacagccttg ttacaaagta aaaattttaa tgatatgatt + 6781 gaaacattgc gtaaatattt tgattatatc attgttgata cagcacctat tggaattgtt + 6841 attgatgcgg caattatcac tcaaaagtgt gatgcgtcca tcttggtaac agcaacaggt + 6901 gaggtgaata aacgtgatgt ccaaaaagcg aaacaacaat tagaacaaac agggaaactg + 6961 ttcctaggag ttgttttgaa taaattagat atctcggttg ataagtatgg agtttacggt + 7021 ttctatggaa attatggtaa aaaaataatt taggaaagat tctatggatg aaaaaggatt + 7081 gaaaattttt ttggcagtat tacagagtat tattgtcatt ttattggttt attttcttag + 7141 ctttgttaga gagacagaac ttgaacgttc ttcgatggtt atactatacc ttctccactt + 7201 ttttgtattc tattttagtt cctatggtaa caattttttt aaaagagggt acctagttga + 7261 gtttaatagt accataagat atattttttt ctttgcaata gctataagtg tattaaactt + 7321 ttttatagcg gaacggttta gtatctctag aagaggaatg gtatacttct taactttaga + 7381 aggaatatcc ttatacttgt taaatttctt agtaaagaaa tattggaagc atgtgttttt + 7441 taatctaaaa aatagcaaga aaattttact gttaacagta acgaaaaata tggaaaaagt + 7501 tcttgataaa ttgctagaat ctgatgaact ttcatggaaa ttggtagcag taagtgtttt + 7561 ggataaatct gattttcaac atgataaaat acctgtaatt gaaaaggaaa aaattattga + 7621 atttgcaacg catgaagttg tggatgaggt gtttgtcaat cttccaggag agagctacga + 7681 tattggagaa attatctcta ggtttgagac aatggggata gatgtaactg taaatcttaa + 7741 agcatttgat aagaatttgg gtcgcaataa acaaattcat gagatggtag gattgaatgt + 7801 agtcactttc tctacaaatt tttataaaac 
tagtcatgta attgctaagc ggattattga + 7861 tatcatgggt gcattggtag ggctgatact atgtggttta gtcagtattg tattggttcc + 7921 tttgattcga aaggatgggg gctctgctat ttttgctcag acgcgtatag gaaaaaatgg + 7981 tcgtcagttc actttttata agtttcgctc tatgtgtgta gatgccgagg cgaaaaaaag + 8041 agaactcatg gaacaaaata ccatgcaggg tggaatgttt aaggtggacg atgatcctcg + 8101 tatcacgaaa attggtcgtt ttatacggaa gactagcttg gacgagttac cacagtttta + 8161 taatgttcta aagggagata tgagtttggt tggcacacgg ccacctacag tggacgagta + 8221 tgttcagtat acttcagaac agaaacgtcg actcagcttt aaacctggta ttacaggttt + 8281 atggcaggtt agcggccgta gtaaaataac cgattttgac gatgttgtaa aattagatgt + 8341 ggcttatatt gataattgga caatctggaa agatattgaa attttgctta aaactgttaa + 8401 agttgtattt atgagagatg gagcgaagtg aggaatgagg gatagaatcc aacttttagg + 8461 tgtaacaatt gatttgctta cgatgaatga aacgatagat agtgtagaac aatatgtatt + 8521 agaaaaaaga ccactacact tgatgggggt gaatgctgat aaaattaatc agtgtcatac + 8581 agatgagaaa atcaaaaaaa tcgttaatga gtcaggaatc attaatgcgg atggagcatc + 8641 agttgttctt gcaagtaagt ttttaggaac gcctgttcct gaacgagtag cgggtattga + 8701 tttgatgcaa tgtcttttag agttgtcaaa taaaaaagga tattcagttt acttttttgg + 8761 agcaaaagaa gaagttttgc aagatatgct caaagtattt aagagagatt atccaaattt + 8821 gatagttatt ggacacagaa atggctattt ttctgaagag gatgaacaag ctattcaaga + 8881 agatattcgt gaaaagaacc ctgattttgt gtttattgga attacgtctc ctaaaaaaga + 8941 atatattatt caaaaattta tggatagtgg cgtcaattcg gtatttatgg gagttggcgg + 9001 tagttttgat gtcttgtctg gtcatatcca acgagcacct ctatggatgc aaaagtcaaa + 9061 tttagagtgg ttattccgtg tagctaatga gcctaaacgt ctctttaaac gttattttgt + 9121 agggaatatt tcattcatag gaaaagtttt aaaagcaaaa agaggtgtaa aatattgaac + 9181 cagacagaga tgattcgctt aattcaaaaa gttgaattag atgctataaa agagtttaaa + 9241 aaaatctgtg aagagaatga tatagatttt ttcctccgcg gtggtagtgt acttggtgcg + 9301 gtcaaatacg acggctttat tccatgggat gatgatatgg atatcgctgt ccctcgtgaa + 9361 gcatacgaca aacttccaag tgttttcaaa gatagaatta tcgctgggaa atatcaggtt + 9421 cttacttatc aatactgtga tacgttgcat tgctactttc ctcgactatt 
ccttttagaa + 9481 gatgaaagaa aacgtttggg cttgccacga aataccaatc taggattgca tttgattgat + 9541 atcattcctt tagatggagc accaaatcat tcggttttaa gaaagattta ctttggcaaa + 9601 gtatactggt atcgtttttt agcaagttta ggaacaactt atgttggcga ccatgtggat + 9661 atgcattcca ctaagcaaaa actaattatt ggtttcttta aaaaactagg atttgcaaaa + 9721 ctatttcctc aaaattctgt atacagacgc ttggataatc tctatagaaa gtatgattgg + 9781 aaaaagcaga agtatgcggg gactatcaat gcttctttat ttgctaaaga agttatgcca + 9841 gtagagattt ggggagaagg agtagagaag ccttttgagg ataccttctt taaagttcca + 9901 acggagtatg atcgctacct gaaaagactt tacggagaaa actatcttta cgaagagcct + 9961 agtgatgatg aaaagaaatc gcatttagga ggacactaat ttgttttgtt atattatttt + 10021 gcattacaaa gtcttagaag aaactatttc ttgtgttaaa tctataaaag aaggcaatta + 10081 taatgcaaag caaatcgtta ttattgataa tttctctaat aatggtactg gtgaaaaact + 10141 acaagagctt tatgaatcag atttagaaat tgatgttttg attaaccatg aaaatgctgg + 10201 ttttgctcgt ggaaataatg tggcttatca atttgctaag gaaaagtata accccgattt + 10261 catggttatc atgaataacg atattgagat agaaacagaa aattttgaaa aaattgtgac + 10321 agatatctat cgtgaggaaa aattccattt gctcgggcca gatatcttct cgactactta + 10381 ccaacttcac caaaacccaa aacggttgac acattatact tatggagaag ttaaagctct + 10441 aaatgaaaaa tttaaaaaag ggagccaagt tagtctagct ttaaaaatca aatgttggtt + 10501 gaaagctagt aaagttcttc gaacagcaat ctatcaaaat agacgtaaaa aaggatcagt + 10561 agactataga aaacaggtag aaaacccaat tcttcatggt tcttttattg tatattcgag + 10621 agattttatc gaaaaagagg agtatgcttt taaccctaac accttctttt actatgaaac + 10681 agagatatta gattatgaag ctgaattaaa aggatacaag agaatttata cacctaaaat + 10741 tagagttttg caccatcaaa atgttgcaac taatcaagtt tacacgaact tgttagaaaa + 10801 aaccttgttt tcaaataaat gcaactttaa atccaccagt tattttttga agttgatgaa + 10861 agaaaacgag gatgtttaaa tgagttattt atttttactt tgccttacat tattcttatt + 10921 gactatattc tatttctttg cttttattca agatttaatt gctcctccag tagttatgtc + 10981 tgtaatgttt ctaattagtt cagtatttgc actggttaat tcaaaaaact ggaatattga + 11041 atatagtgga atagcctata ttctcataat tagtggtatt attatatttt cgattccttt 
+ 11101 aatggcatta aaatcaccta attttaatac tgaggttaag attgctgatc gattaattga + 11161 tatccaattt tggaaaattg ctctaactat tataattgat ctctttattt tgtatcttta + 11221 caggaaggaa atatacaacc ttgttcttag taatggatat acggggtcaa atattcagtg + 11281 gttttttaga aatgcaacga gttatgaagg tgaattgaca gtgcgaactt ttattcgagt + 11341 tctcattcgt gttattgacg tatctgctta tatttttgga tatactttta ttaataattt + 11401 tcttatctat cgccataaac gccctaaaga catattactt ttagtacctt tattaatatt + 11461 tatttcaaaa actttaatat caggaggccg gcaagatatt attaaaattc tgattgccta + 11521 tgtaatcatg atgtatatcc aacaaaaacg gaaagttgga tggaatagag tcatatctca + 11581 taaatatatt caccttggat ttgttggttt aatagcaggt attccagcat tttactactc + 11641 tttgttttta gccggtcgtt caacgactag gacgctattt gagagtgttt cgacctatct + 11701 aggaggctca attcagcatt ttaatcagta tattgaaaat ccattagatc ctggtgaagt + 11761 ttttggcagt gaaacattgg tgcctatatt aaatatatta ggggaaatgg gcctagttaa + 11821 ttatcgtagt acaattcatt tagaatttcg gacactagga gttactgtag gaaatgttta + 11881 tacttttttt agaagaccct tgcatgattt tggtctagtt ggtatgtatg tatttgtctt + 11941 tgctgtaggt gctttttttg ctatttatta tttagttctg agaaagaaac aggttggttt + 12001 taatttggat attcatacca ttatttattc ttatgtcttt tattggattt ttttatcatc + 12061 aatcgagcaa tactcgttca caatgattag tctatataca cttgtattta ttgtgttggt + 12121 ttactttatg gctatctttt actggtgtac agattttaaa agaggaaaac tgatttttaa + 12181 aatttctgac tcaagtatca aattaaaaga agaataacag aatgtatagg agagggtaga + 12241 tgaatactaa aattaaaaat ataataacta gtttttctta tgttatttct tcaaatctgc + 12301 tcatagtttt aacctcatca ctagttgttt tgatttttcc taaaataatg ggggtaactg + 12361 agtacagtta ctggcaactt tatatttttt atctgaccta tatcggtttt ttccacttgg + 12421 gttggattga tgggatttat ctcaaatatg gtggcttaga atatacaaat ttagatagaa + 12481 aacagtttta ttctcagatg attctatttt ctagtttctt aatgctaatc tcgctggtat + 12541 tatttacttt gaacctaata actgtaaggg atgaaaacgc aagatatatt tataatatgg + 12601 ctatcattag catgatagtc acaaacttaa gaacactcta tgtttatatc ttgcagatga + 12661 caaatcgctt gaaggatagt tcagtcattc taattagtga tcgcgtttta tatgtactcc + 
12721 ttttattcat gtttattgta tttggatggc atgagtacaa ggtcatgatt tgggctgata + 12781 ttctaggtcg aacattttct ctcatgcttt ccttctggat ttgtaaagat attgtgtttc + 12841 agcctttgtc aaaatttatc ttagatttca aggagtccct tgataatatc cgtgttggaa + 12901 tcaatttaat gctatctaac attgcgagta gcatgattat aggcattgtt cgtatgggaa + 12961 ttcaatggaa ttggaatatt gaaacattcg ggaaagtgtc attaactttg agtatatcta + 13021 atttattaat gacttttatt aatgccattg gattagttat ctttcctttg ataaagcgaa + 13081 caaagactga gaatttacct aaaatttatt ctaatttaag aaatgctttg atgttggtta + 13141 tgttcgcaat cttgctcttc tactatcctt taaaatttat tcttgatatt tggcttcctg + 13201 cttataagga tgccttagtt ttcatggccc taatttttcc tatgtcagtt tatgaaggga + 13261 aaatggcttt ggtgataaat acatatttaa aagcaatgag aatggaaaaa gacattctca + 13321 aaattaatgc tttggttatg ttaactagta tagtagtgac attagtgact actatactac + 13381 taaataattt ggggctgaca gttgtatcta tagttatttt acttgcttta agaagtataa + 13441 tagctgaatt aattttatcc aaaaaactga agatatcagt caagcaagac attgctttag + 13501 agttacttat gacgattata tttatttctt caagttggta tctctctatt tggattgcag + 13561 taataattta tttattggcg tatactttat atttgtattt aaagcacaaa gatatcagaa + 13621 tgtatataga atactttaaa aatcataaaa aaatatcata aaaattatat atcaatgaaa + 13681 tggtagatta catttctacc tttttatcca tttaggagga aacgatgaaa aagataatgc + 13741 tagttttcgg tacacgtcca gaagcaataa aaatgtgttc attagtcaat gagttgagaa + 13801 aacaggaaga tatgaaaaca gttgtttgtg taactggtca acacaaggag atggttagcc + 13861 ctgttttaga tttatttgga gttcaaccag actatgattt agaaattatg aaggctaatc + 13921 aaaacttgtt ctctataaca ataagtattt tagaaaaaat aaaacctgtg ttagaaaaag + 13981 aacaaccaga tattgttttg gttcacggtg atactactac gacatatgca gcagctttag + 14041 cggcatttta tctaggaatt aaagttggtc atgttgaagc tggattacga acttacaacc + 14101 tgcaaagtcc tttcccagaa gagttcaaca gacaatcgac ttctattatt gcaaattatc + 14161 attttgctcc tacagaatta gctaaagaaa atctaataaa agagggtaga aataatatct + 14221 atgttactgg aaatacagtg attgatgcac ttacaactac agtacaaaag gattatacac + 14281 accccgatct agatttaaac gatggaaatc gcctcatctt attgactgct catagacgcg + 
14341 aaaatctcgg agaacctatg agacatatgt ttagagctgt taaacgagtt ttaaatgaat + 14401 atgacgatgt taaagtaatt tatccaattc ataaaaatcc attggtacgg gaaacagcta + 14461 cagaaatttt tggagataca gaacgtattc agatcattga acctttagat gttcttgatt + 14521 ttcacaactt tatgaatcat agttatatga ttctaactga ctcaggaggg gttcaagaag + 14581 aggcaccttc gttaggaaag cctgtattgg tcatgcgaga tacgacagaa agacctgaag + 14641 gagtagctgc tggaacgttg aaattggttg ggactgatga ggagactatt tatcaaaact + 14701 ttaagatgct tttagacgat cccgaagaat ataaaaaaat gagtcaagct agtaatcctt + 14761 atggaaatgg tgatgctagt aaacagattg ttcgaatttt acgtggaatt tgagtgtgtt + 14821 cagataaagt aatatagaaa ggtaccctac tatgaaaggt attattctag caggtggttc + 14881 ggggacacgt ttatatcctt tgactcgcgc tgcatcaaaa caacttatgc cggtttatga + 14941 taaaccgatg atttactacc cactttcaac attgatgttg gctgggatta gggatatttt + 15001 gattatttcc actccacagg atttacatcg attccaagag cttcttcaag acggatctga + 15061 gtttgggctc aaactttctt atgcagagca accaagtcca gatggtttgg cacaagcctt + 15121 tatcattggg gaagagttta tttctgatga tagcgttgcg ctgatcttag gtgacaatat + 15181 ctatcacggt tctgggcttt ccaagatgct acaaaaggca gcgagtaagg agtcgggagc + 15241 aactgttttt ggctaccatg tcaaggatcc agagcgcttt ggtgtggttg agtttgatca + 15301 ggatatgaag gctatttcta ttgaagaaaa gccagagcaa cctcgttcaa actatgcagt + 15361 tacaggtctc tatttctatg ataatgatgt agtagagatt gccaagagta ttaaaccaag + 15421 tcctcgtggt gaactggaaa ttacagatgt aaacaaggct tacctagatc gtggtgattt + 15481 gtctgttgag cttatgggac gtggctttgc ttggctggat actggaactc atgaaagttt + 15541 actagaggct tcacagtaca tcgaaacagt gcaacggatg caaaatgttc aggtagcaaa + 15601 cttagaagaa attgcttacc gtatgggcta tatcagtcga gaagatgtat tggccttagc + 15661 ccaaccactt aagaaaaatg aatacggaca gtatctgctc cgtttgattg gagaagcata + 15721 gatgacagat aattttttcg gtaagacgct tgcggcacgc aaggttgaag ctattccagg + 15781 catgttggag tttgatatcc ccgttcatgg agataatcgt ggctggttta aagaaaattt + 15841 ccaaaaggaa aaaatgcttc cacttggatt tccagagtct ttctttgcag aaggaaaatt + 15901 gcaaaacaat gtatccttct cacgtaaaaa tgtccttcga ggtctccacg cagagccttg + 
15961 ggataagtac atctctgtag cagatggagg gaaagttctg ggttcttggg ttgatctacg + 16021 cgagggtgaa acctttggga atacctatca gacagtgatt gatgcgagta agggaatctt + 16081 tgttcctcga ggcgtagcta atggctttca agttttatca gatacagtgt catatagcta + 16141 tctggtcaat gattactggg ctcttgaact caaacccaag tatgcctttg tgaactacgc + 16201 tgatccaagc cttggtattg aatgggaaaa tattgcagaa gcagaggttt cagaagcaga + 16261 caaacatcat ccactactta aggatgtaaa acctttgaaa aaagaagatt tggaataagg + 16321 aaagaatatg actgaataca aaaatattat cgtgacaggt ggagctggct ttatcggttc + 16381 taactttgtc cattatgttt acgagaactt tccagatgtt catgtgacag tcctagataa + 16441 gttgacttat gctggaaacc gcgcgaatat tgaggaaatt ttaggtaatc gtgttgagtt + 16501 agttgttggt gacattgctg atgcggagtt ggtagacaag ttggctgctc aagcagatgc + 16561 tatcgttcat tatgcagcgg aaagccacaa tgataattcg ctcaatgatc catcgccatt + 16621 tattcatact aacttcatcg gaacctatac tcttttagaa gctgctcgta agtatgatat + 16681 tcgcttccac catgtatcga cagatgaagt ttatggggat ctccctttac gcgaagattt + 16741 gccaggtcat ggtgaaggac caggtgagaa atttactgct gaaacaaaat acaacccaag + 16801 ctctccgtac tcatcaacca aggcagcctc agatttgatt gtcaaagcct gggtgcgttc + 16861 ttttggagtc aaggcaacga tttccaactg ttcaaataac tacggtcctt atcaacatat + 16921 cgaaaaattc atcccacgtc agattactaa catcctaagt ggtatcaagc caaaacttta + 16981 cggtgaaggt aagaacgttc gtgattggat tcataccaat gaccattctt caggagtttg + 17041 gacaatcttg acaaaagggc aaatcggtga aacctacttg attggggctg atggtgagaa + 17101 gaacaataag gaagttttgg aacttatcct taaggaaatg ggacaagctg cggatgccta + 17161 tgatcatgtg actgaccgtg caggacatga ccttcgctat gcgattgatg ctagcaagct + 17221 ccgtgatgag ttggggtgga aacctgaatt taccaacttt gaagctgggc tcaaggcaac + 17281 aatcaagtgg tatacagata accaagaatg gtggaaagca gagaaagaag ctgttgaagc + 17341 caattatgct aagactcagg agattattac agtataaaaa gcaggaaata gctgcttttt + 17401 attgctatat tgggaagagt tacatattag aaaggtctag agatgatttt aattacaggg + 17461 gcaaatggcc aattaggaac ggaacttcgc tatttattgg atgaacgtaa tgaagaatac + 17521 gtggcagtag atgtggctga gatggacatt accgatgcag aaatggttga gaaagttttt + 
17581 gaagaggtga aaccgacttt agtctaccac tgtgcagcct acaccgctgt tgatgcagca + 17641 gaggatgaag gaaaagagtt ggacttcgcc atcaatgtga cggggacaaa aaatgtcgca + 17701 agagcatctg aaaagcatgg tgcaactcta gtttatattt ctacggacta tgtctttgac + 17761 ggtaagaaac cagttggaca agagtgggaa gttgatgacc gaccagatcc acagacagaa + 17821 tatggacgca ctaagcgtat gggggaagag ttagttgaga agcatgtgtc taatttctat + 17881 attatccgta ctgcctgggt atttggaaat tatggcaaaa acttcgtttt taccatgcaa + 17941 aatcttgcga aaactcataa gactttaaca gttgtaaatg accagtacgg tcgtccgact + 18001 tggactcgta ccttggctga gttcatgacc tacctagctg aaaatcgtaa ggaatttggt + 18061 tattatcatt tgtcaaatga tgcgacagaa gacacaacat ggtatgattt tgcagttgaa + 18121 attttgaaag atacagatgt cgaagtcaag ccagtagatt ccagtcaatt tccagccaaa + 18181 gctaaacgtc cgctaaactc aacgatgagc ctggccaaag ccaaagctac tggatttgtt + 18241 attccaactt ggcaagatgc attgcaagaa ttttacaaac aagaagtgag ataagtagta + 18301 gaatgatttt ctagtctaat aaaagaggca gataatgaac tccaaaggag cttaagatgt + 18361 acgattatct tgttgttggt gctggtctct ttggcgcata gctttggctc agtttctatt + 18421 atcgctcaca ccatccatca gaagtttaat ctgaaggtac ccaattatcg ccaagaagaa + 18481 gattgggcta ggatgggttt accaatcaca cgtaaggaaa tctctaattg gcatatcaag + 18541 gcaagtcaat actatttaga gtccctttat aaccttttac gagaaaagtt gttagaacaa + 18601 cctcttcttc atgcggatga aacctcttat cgggtcttag aaagtgatag tcagctgacc + 18661 tactattgga cctttttgtc tgggaaagct gagaatcaag taatcacgct ttaccaccat + 18721 gatcagtgtc ggagtggttc ggtagtgcaa gaattcctag gagattattc tggctatgtg + 18781 cattgtgata tgttgcggca gtaacttagg actttagtcc tctagttctg tctatgcgat + 18841 agcagtccaa ggtttaggag caaggcgacg ctaagcttgg taaactgcga accgctagaa + 18901 gcttatcgtc aactggaaga agctgaactt gttggatgtt gggcgcatgt gagaaggaaa + 18961 ttttttgaag tgccccccaa gcaagcagat aaatcatcct taggagctaa aggtttagct + 19021 tattgtgatc agttattttc cttggaaaga gactgggagg ctttgccagc tgatgaacga + 19081 ctacagaaac gtcaagaaca tctccaaccc ctaatggaag acttctttgc ttagtgccgt + 19141 cgtcagtcag ttttatcggg ttcaaaacta ggaagggcaa ttgaatacag cctcaagtat + 
19201 gaagaaacct ttaagaccat tttaaaagac ggacatctgg tcctttccaa taatctagct + 19261 gaacgcgcca ttaaatcatt ggttatggga cggagtaaaa gagtccagtg gactctttta + 19321 gcctaagcta aattttaaaa agcgagggtg gttattttct caaagttttg aaggagctaa + 19381 agcaagagct attattatga gcttattgga aacagctaaa cgtcatcaac taaatagtga + 19441 gaaatatcta tcctatcttc tagaatgtct tccaaacgag gaaactctcg taaacaaaga + 19501 ggttttagag gcctatttac catggactaa agttgtacaa gaaaagtgca aataagaaat + 19561 ctccagatta ggaactatcc gtgagttcac taatctggag atttttcaat agacctcgtt + 19621 attgggcggt tacgatattc atattttttg caaagatgtt gtttgaaaaa taattttcaa + 19681 aaattctgaa aattctgttg acatctttct gaaaagagtc tataatggag agaaagtttt + 19741 aaaggagaaa atgatgaaaa gttcaaaact acttgccctt gcgggcgtga cattattg +// + diff --git a/public/res/serotype_genbank/serotype_2.gb b/public/res/serotype_genbank/serotype_2.gb new file mode 100644 index 0000000..6de5f23 --- /dev/null +++ b/public/res/serotype_genbank/serotype_2.gb @@ -0,0 +1,971 @@ +LOCUS CR931633 20602 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain pn2L (serotype 2). +ACCESSION CR931633 +VERSION CR931633.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 20602) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 20602) + AUTHORS Bentley,S.D. 
+ TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..20602 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="pn2L" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC02_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC02_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI32716.1" + /db_xref="UniProtKB/TrEMBL:Q4JZI8" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVELL" + gene 294..459 + /gene="aliB" + /locus_tag="SPC02_0002" + /pseudo + CDS 294..459 + /gene="aliB" + /locus_tag="SPC02_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(order(460..1101,1103..1429)) + /gene="tnp" + /locus_tag="SPC02_0003" + /pseudo + CDS complement(join(460..1101,1103..1429)) + /gene="tnp" + /locus_tag="SPC02_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(join(1039..1101,1103..1411)) + /gene="tnp" + /locus_tag="SPC02_0003" + /note="HMMPfam hit to PF01710, Transposase, score 7.7e-24" + /pseudo + gene 1653..3107 + /gene="wzg" + /locus_tag="SPC02_0004" + CDS 1653..3107 + /gene="wzg" + /locus_tag="SPC02_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI32719.1" + /db_xref="GOA:Q4K376" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + 
/db_xref="UniProtKB/TrEMBL:Q4K376" + /translation="MLIMSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNI + LAFRYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGL + TNRLNATSNYSEYSLSVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNT + DLTVNQSSSYLAAYKSLIAGETKAIVLNSVFENIIELEYPDYASKIKKIYTKGFTKKV + EAPKTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPI + ADGGNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVH + NDQEFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKL + TSTEALKNYSTIINSLQDSIQTNVPLETMINLVNAQLESGGNYKVNSQDLKGTGRMDL + PSYAMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1653..1778 + /gene="wzg" + /locus_tag="SPC02_0004" + /note="Signal peptide predicted for SPC0032 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 42 and 43" + misc_feature 1866..2213 + /gene="wzg" + /locus_tag="SPC02_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 1.6e-63" + misc_feature 2391..2834 + /gene="wzg" + /locus_tag="SPC02_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 5.7e-70" + gene 3109..3840 + /gene="wzh" + /locus_tag="SPC02_0005" + CDS 3109..3840 + /gene="wzh" + /locus_tag="SPC02_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI32720.1" + /db_xref="GOA:Q4JZ01" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4JZ01" + /translation="MIDVHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTPDVLDKLGKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMSGITPVIAHIERYDALGNNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEQDLVHVIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 3112..3720 + /gene="wzh" + /locus_tag="SPC02_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 1.5e-36" + gene 3846..4541 + /gene="wzd" + /locus_tag="SPC02_0006" + CDS 3846..4541 + 
/gene="wzd" + /locus_tag="SPC02_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI32721.1" + /db_xref="GOA:Q4JZ00" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4JZ00" + /translation="MMKEQNTIEIDVFQLFKTLWKRKLMILLVALVTGAGAFAYSTFI + VKPEYTSTTRIYVVNRNQGDKSGLTNQDLQAGSYLVKDYREIILSQDALEKVATNLKL + DMPAKTLASKVQVTVPTDTRIVSISVKDKQPEEASRIANSLREVAVEKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIELFDTRVKRPEDIEDVLQI + PLLGLVPDLDKMK" + misc_feature 3846..3962 + /gene="wzd" + /locus_tag="SPC02_0006" + /note="Signal peptide predicted for SPC0034 by SignalP 2.0 + HMM (Signal peptide probability 0.721) with cleavage site + probability 0.467 between residues 39 and 40" + misc_feature 3867..4283 + /gene="wzd" + /locus_tag="SPC02_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 1e-55" + misc_feature 4389..4466 + /gene="wzd" + /locus_tag="SPC02_0006" + /note="PS00217 Sugar transport proteins signature 2." 
+ gene 4551..5231 + /gene="wze" + /locus_tag="SPC02_0007" + CDS 4551..5231 + /gene="wze" + /locus_tag="SPC02_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI32722.1" + /db_xref="GOA:Q4K373" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K373" + /translation="MPTLEISQAKLDFVKKAEEYYNSLCTNLQLSGDGLKVFSITSVK + LGEGKSTTSTNIAWAFARAGYKTLLIDGDIRNSVMLGVFKARDKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRKCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGVVLNKFDTSVDKYGSY + GDYGKNKK" + gene 5246..6613 + /gene="wchA" + /locus_tag="SPC02_0008" + CDS 5246..6613 + /gene="wchA" + /locus_tag="SPC02_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI32723.1" + /db_xref="GOA:Q4K372" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K372" + /translation="MNGKTVKSSLAIIQSFLIILLTYLLSAVREAEIVSTTAIALYIL + HYFVFYISDYGQDFFKRGYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYF + LTLHALLVYVLNLFIKWYCKRAYLNFKGSKKILLLTATSRVEKVLDRLIESNEVVGEL + VAVSVLDKSDFQHDCLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + IDVTVNLNAFGCSLARNKQIREMAGLNVVTFSTTFYKTSHVIAKRIIDIMGALVGLIL + CGLVSIVLVPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKIGRFIRKTSLDELPQVYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVFM + RDGAK" + misc_feature 5246..5338 + /gene="wchA" + /locus_tag="SPC02_0008" + /note="Signal peptide predicted for SPC0036 by SignalP 2.0 + HMM (Signal peptide probability 0.861) with cleavage site + probability 0.343 between residues 31 and 32" + misc_feature 6029..6610 + /gene="wchA" + /locus_tag="SPC02_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 9.5e-158" + gene 6645..7829 + 
/gene="wchF" + /locus_tag="SPC02_0009" + CDS 6645..7829 + /gene="wchF" + /locus_tag="SPC02_0009" + /note="member of homology group 15" + /codon_start=1 + /transl_table=11 + /product="putative rhamnosyl transferase WchF" + /protein_id="CAI32724.1" + /db_xref="GOA:Q4K371" + /db_xref="InterPro:IPR001296" + /db_xref="InterPro:IPR015393" + /db_xref="UniProtKB/TrEMBL:Q4K371" + /translation="MKKSVYIIGSKGIPAKYGGFETFVEKLTEYQKDGNIQYYVACIR + ENSAKSGFTADTFEYNGAICYNIDVPNIGPARAIAYDIAAVNKAIELAKGNKDEAPIF + YILACRIGPFISGLKKKIRSIGGRLLVNPDGHEWLRAKWSLPVRKYWKFSEQLMVKHA + DLLVCDSKNIEKYVREDYKQYQPKTTYIAYGTDTTPSSLKSEDAKVRNWYREKGVSEN + GYYLVVGRFVPENNYETMIREFMKSNSKKDFVLITNVEQNKFYDQLLKDTGFDKDPRV + KFVGTVYDQELLKYIRENAFAYFHGHEVGGTNPSLLEALASTRLNLLLDVGFNREVGE + NGAIYWRKDELARVIEAVEQFDENAISELDKKSSQRIAEAFTWEEIVVDYEEEFEGGK + SE" + misc_feature 7263..7766 + /gene="wchF" + /locus_tag="SPC02_0009" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 0.0027" + gene 7846..8766 + /gene="wchG" + /locus_tag="SPC02_0010" + CDS 7846..8766 + /gene="wchG" + /locus_tag="SPC02_0010" + /note="member of homology group 133" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI32725.1" + /db_xref="GOA:Q4K370" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K370" + /translation="MMATYNGAKYIGEQIDSILRQTYQDWKLFIHDDCSNDATFQILQ + QYQEKYPKKIKVITDSSVIGGSSEKNFAAIQKWVTNNHDFSYFMFADQDDFWFPNKIE + RSLYKMKESEKDDLPILVHTDLEVVDDNLNIINDSFFEYRALDVDVTELNRILIQNNI + TGCTMLWNRSLNNLLDLNSNAVAMHDWWISLVAASFGKIVCLKEPTIKYRQHGGNVVG + ATQVNTLGFIIKRLLGNSHVKETLKLSFEQAESFLKVYQNSLSNEETDIIREFISIPH + KHKLARISTVIKGGYLKQSVVQVIGELMFI" + misc_feature 7846..8370 + /gene="wchG" + /locus_tag="SPC02_0010" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 3.3e-12" + gene 8815..9828 + /gene="wchH" + /locus_tag="SPC02_0011" + CDS 8815..9828 + /gene="wchH" + /locus_tag="SPC02_0011" + /note="member of homology group 134" + /codon_start=1 + /transl_table=11 + 
/product="putative glycosyl transferase" + /protein_id="CAI32726.1" + /db_xref="GOA:Q4K369" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K369" + /translation="MTGGIRVIYTYANYLIDQGHDVVCYVPMISYRGRNQTIFYRIKA + SLGNTLKNDNWFDKKFDLKRIPVVSEKYIRDADVVIATAWQTAYDVANFSSSKGHKFY + FIQDYEIFNGGKEEVEASYRLPLTLITVTRSLKKAIQKFTDKTIYVVYNGLSDNEYLH + TEKISHKDLTLMMMYHESEHKKSQEGLQIIAKLKKRYPDMKINIFGRRIPEKLPDTYN + VLINPEREKILKMYQESDVYLFTSEIEAWGLPIVEAMANKCAVVGRSRGALLELSNGQ + NTIVVEELSEIYNKVVHLQEDRLLLAQVQNEGYKTVIPLNWSNSCLEFEKIISGVYIE + NGK" + misc_feature 9280..9747 + /gene="wchH" + /locus_tag="SPC02_0011" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 0.00011" + gene 9869..11032 + /gene="wzy" + /locus_tag="SPC02_0012" + CDS 9869..11032 + /gene="wzy" + /locus_tag="SPC02_0012" + /note="member of homology group 135" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI32727.1" + /db_xref="UniProtKB/TrEMBL:Q4K368" + /translation="MLSLYTGNGVTPVIVILFFLSALYSLYRKSKLSINLNFLFIYIF + LAYYLLLTVIFTQDLLVMTSKFILFPIFVYYIIPKNINGVIRILSIFKSFIGFTAIFG + LYEYMQHFNLMVNFVKIDAVKWIQTMNLNSVYYPSSIFLHYTYFAYVLLLAFILVIVI + PYKNRVLNLVYKTLIAISIFLPQSRIVWIAFGVILILSFILNRQGILTYRKLSVIVLI + LIIVVSLCLYFDVFAFISNYISLRFSSLYRYGLADGSLGQRIGTLRNWENYLDSDTIK + AIIGSGFGGVNSYLSTYSFFNGYTTADSTVTSFLIDTGVIGLFIFLLSMFQILVIVVK + GKGIFRELALYTIVASSIVSLTIDFWANYVILHIFYVVIICAFIGMRLTKQEK" + gene 11162..12319 + /gene="wchI" + /locus_tag="SPC02_0013" + CDS 11162..12319 + /gene="wchI" + /locus_tag="SPC02_0013" + /note="member of homology group 136" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI32728.1" + /db_xref="GOA:Q4K367" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K367" + /translation="MTKSILYFLSTSDISSGATRSLLRLVSIVEDSDFRVIIILPEHG + NVEDELVNKGIKYYVVKQYIWNYWIKYLSHTKNIFYYLKLPLKYLLNRISFHKINRII + KKEKVDIIHMNTLTSFLGAQAAIKQRKILIWHIREFMEEDLGIEFCNRKKAIDLINKS + 
TCVISISDSISKNFSNEVLAYKKVIHNGLSIDDYFIDKVAFQNQKINILSSGRITPGK + GQVDLVRAIANLPERYKQMFKVDIIGIVESEEYFKEIKEVISNYKLDGIEFHGFQSDP + TDFFRKCDIVCVCSKKEAFGRITVEGMLSGALVIGTNSGGTKEIISTGETGYLYEPGD + YMQLSEILKTIINNRSSILEIALRGQEKATLRFSDKNNAMQIMQLYKELEN" + misc_feature 11735..12247 + /gene="wchI" + /locus_tag="SPC02_0013" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 1.5e-34" + gene 12316..13725 + /gene="wzx" + /locus_tag="SPC02_0014" + CDS 12316..13725 + /gene="wzx" + /locus_tag="SPC02_0014" + /note="member of homology group 111" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI32729.1" + /db_xref="GOA:Q4K366" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K366" + /translation="MSRRYNYLLKNIGLLTLSNFGSKILVFLMVPLYTSVLSTSDYGT + YDLFNTTISLLIPIISINISEGVLRFALDEKNDSSIVYSIGWNIIIKGFLVVVLGIIF + NNIFNIFPLLKENSITFLLLYLSTIVYQFLSSFIRGIDKVSILSIAAILNTISILGFN + ILFLIIIPLGLVGYFWSNILGLVLPSLYLIYKISQYNIKYTSLQNKKLQQRLVSYSIP + LILNSLGWWINNAIDRYVVIAFCGVAVNGIYSVGYKIPSILNIFANIFNQAWILSSVK + SYRDEDSEYFFSQVYNKYNMIMVLISGLLISCSKILAKFLYMNEFYDAWKFVPFLLIA + NVFGAISGFAGGIFSAVKDSKIYSQSTLVGAIVNIIFTFVFVYYYGAIGAAIATMISY + FVVWIIRVHTMRKYIKLKIFIRRDVFSYVLLIFQSIVLWLENSYILYPIQVVLFLLLV + MLFYKEIKSIIGELKKFLT" + misc_feature 12337..13149 + /gene="wzx" + /locus_tag="SPC02_0014" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 2e-24" + gene 13761..14999 + /gene="ugd" + /locus_tag="SPC02_0015" + CDS 13761..14999 + /gene="ugd" + /locus_tag="SPC02_0015" + /note="member of homology group 20" + /codon_start=1 + /transl_table=11 + /product="UDP-glucose 6-dehydrogenase Ugd" + /protein_id="CAI32730.1" + /db_xref="GOA:Q4K365" + /db_xref="InterPro:IPR001732" + /db_xref="InterPro:IPR008927" + /db_xref="InterPro:IPR013328" + /db_xref="InterPro:IPR014026" + /db_xref="InterPro:IPR014027" + /db_xref="InterPro:IPR014028" + /db_xref="InterPro:IPR016040" + /db_xref="InterPro:IPR017476" + /db_xref="UniProtKB/TrEMBL:Q4K365" + 
/translation="MKIAVAGTGYVGLSIAVLLSQQHQVMAVDIIPEKVELINQRKSP + IQDDYIEKYLAKKDLNLVATLDAKEAYQDADFVVIAAPTNYDPKKNFFDTSAVESVIE + TALKYNPDAIMVIKSTVPVGYTESARKKFQTENILFSPEFLRESKALYDNLYPSRIIL + GTDKNNERLVSAAETFARLLQEGALKENIDTLYMGFTEAEAVKLFANTYLALRVSYFN + ELDTYSEMKGLDTQAIIDGVGLDPRIGSHYNNPSFGYGGYCLPKDTKQLLANYEDIPE + ELIGAIVRSNSTRKDFIADQVLKMVDYYDYSAHNIFDERVEKDIIIGIYRLTMKSNSD + NFRQSSIQGIMKRIKAKGVRVVIYEPTLESGSTFFGSSVINDLEEFKRLSNAIVANRY + DNSLEDVKEKVYTRDIFERD" + misc_feature 13761..14315 + /gene="ugd" + /locus_tag="SPC02_0015" + /note="HMMPfam hit to PF03721, UDP-glucose/GDP-mannose + dehydrogenase, score 5.4e-51" + misc_feature 13761..14273 + /gene="ugd" + /locus_tag="SPC02_0015" + /note="HMMPfam hit to PF01210, NAD-dependent + glycerol-3-phosphate deh, score 0.00015" + misc_feature 14346..14627 + /gene="ugd" + /locus_tag="SPC02_0015" + /note="HMMPfam hit to PF00984, UDP-glucose/GDP-mannose + dehydrogenase, score 2.8e-38" + misc_feature 14727..14978 + /gene="ugd" + /locus_tag="SPC02_0015" + /note="HMMPfam hit to PF03720, UDP-glucose/GDP-mannose + dehydrogenase, score 3.7e-06" + gene 15028..15633 + /gene="glf" + /locus_tag="SPC02_0016" + CDS 15028..15633 + /gene="glf" + /locus_tag="SPC02_0016" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI32731.1" + /db_xref="GOA:Q4K364" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K364" + /translation="MLEAVHTEKQWERSATELPPFIIKRLPVRLTFDNNYFNDRYQVI + PIGGYNVIIENILKDVEVGLGVDCFDYREELEASANKVAFTGMIDQYFDYKHGELEYR + SLRFKHEVLDEENHQGNAVVNYTDREIPYTRIIEHKKFEYGLQPKTVITHEYPADWKR + GDEPYYPINDEKNNAIFSKYHEEASQNDKVIFCGRLADYKY" + misc_feature 15028..15630 + /gene="glf" + /locus_tag="SPC02_0016" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 3.2e-138" + gene 15711..16580 + /gene="rmlA" + /locus_tag="SPC02_0017" + CDS 15711..16580 + /gene="rmlA" + /locus_tag="SPC02_0017" + 
/EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI32732.1" + /db_xref="GOA:Q4K363" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q4K363" + /translation="MKGIILAGGSGTRLYPLTRATSKQLMPVYDKPMIYYPLSTLMLA + GIKDILIISTPQDLPRFKDLLLDGSEFGIRLSYAEQPSPDGLAQAFLIGEDFIGDDSV + ALILGDNIYHGPGLSKMLQKTVSKEKGATVFGYQVKDPERFGVVEFDENMNAISIEEK + PECPRSNYAVTGLYFYDNDVVEIAKSIKPSARGELEITDVNKAYLDRGNLSVEVMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLELAQPLKKN + EYGQYLLRLIGEV" + misc_feature 15714..16430 + /gene="rmlA" + /locus_tag="SPC02_0017" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 6.3e-118" + gene 16581..17174 + /gene="rmlC" + /locus_tag="SPC02_0018" + CDS 16581..17174 + /gene="rmlC" + /locus_tag="SPC02_0018" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI32733.1" + /db_xref="GOA:Q4K362" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:Q4K362" + /translation="MTDNFFGKILAVRKIDAIPGMLEFDIPVHGDNRGWFKENFQKEK + MEPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTIIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKHHPLLKDVKPLKKEDL" + misc_feature 16614..17147 + /gene="rmlC" + /locus_tag="SPC02_0018" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 6.3e-16" + gene 17187..18236 + /gene="rmlB" + /locus_tag="SPC02_0019" + CDS 17187..18236 + /gene="rmlB" + /locus_tag="SPC02_0019" + /EC_number="4.2.1.46" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI32734.1" + /db_xref="GOA:O54546" + /db_xref="HSSP:1KEP" + /db_xref="InterPro:IPR001509" + 
/db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:O54546" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPDVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAAD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 17202..18158 + /gene="rmlB" + /locus_tag="SPC02_0019" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.00012" + misc_feature 17205..17945 + /gene="rmlB" + /locus_tag="SPC02_0019" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 5.4e-77" + misc_feature 17208..18020 + /gene="rmlB" + /locus_tag="SPC02_0019" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/iso, score 1.4e-05" + gene 18302..19153 + /gene="rmlD" + /locus_tag="SPC02_0020" + CDS 18302..19153 + /gene="rmlD" + /locus_tag="SPC02_0020" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI32735.1" + /db_xref="GOA:O54665" + /db_xref="HSSP:1N2S" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:O54665" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITDAEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 18302..19150 + /gene="rmlD" + /locus_tag="SPC02_0020" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 3.4e-148" + misc_feature 18305..18946 + /gene="rmlD" + /locus_tag="SPC02_0020" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + 
protein, score 0.0001" + misc_feature 18305..18934 + /gene="rmlD" + /locus_tag="SPC02_0020" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 5.6e-19" + misc_feature 18308..19036 + /gene="rmlD" + /locus_tag="SPC02_0020" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 1.8e-08" + gene order(19229..20139,20141..20356) + /gene="tnp" + /locus_tag="SPC02_0021" + /pseudo + CDS join(19229..19636,19636..20139,20141..20356) + /gene="tnp" + /locus_tag="SPC02_0021" + /note="member of homology group 12" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1670 transposase" + misc_feature join(19235..19636,19636..19674) + /gene="tnp" + /locus_tag="SPC02_0021" + /note="HMMPfam hit to PF03050, Transposase IS66 family, + score 0.00033" + /pseudo + gene 20555..>20602 + /gene="aliA" + /locus_tag="SPC02_0022" + CDS 20555..>20602 + /gene="aliA" + /locus_tag="SPC02_0022" + /codon_start=1 + /transl_table=11 + /protein_id="CAI32737.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ89" + /translation="MMKSSKLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcgta taaaaacaag + 181 ggaggactgt ataaaagaca gaaatccttt gttttttata accaaggttt ataaactttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactattt aaggagaaag aagatgaaca + 301 taaagaagcg tgtccttagt gcaggcctga cttttgcatc tgctttgctt ttagctgctt + 361 gcggccaatc aggttcagat acaaaaactt actcatcaac ctttggtgga aatccaacta + 421 catttaacta tctattagac tattacgctg ataacatagt caattgaaac aagaacagga + 481 caaaagagcc tcgtaaaagg tatggcaact tggtaatacc tttttgaggt gctttttgat + 541 ataagcccat gttttctcaa taggattgta ctcaggtgag tagggaggaa gaggtaaaag + 601 tttatgccca gacccttcgc ataaaagttc tagcttcccc attctatgga atcttgcatt + 661 atccataata tagtagattg aaactagaat agtacacctc tacttctaaa acattgttag + 721 aattcgattt tactgtcctg atcgatttat cttattctta 
tttcatttta ctataataac + 781 cgatggtgtg gttaatgttg gtaagagaaa cttctgaaac catacttcaa aaaagtcgct + 841 cgtcatcgtc tcttcgtaag tcattggaac gattaattca ccatttatta gacctgcaac + 901 caaagaaatc ctctgatatc ttcttccaga tactttgcct cttcttaact gaccttttaa + 961 tgagcgacca tattctcgat aaaaataagt atcgaatcct gtttcgtcaa tctaaacagg + 1021 tgctaggtgc tttaaactat taaaattctt aagaaataag gctacttttt ctgggtcttg + 1081 ttcatagtag gtgtggttct ttttttcgag tgtagcccat agctttgagc gcatagtgga + 1141 tggtagttgg atgacagcca aattcagaag ctatttcagt caaataagcg tctggattat + 1201 tagtaagata gtttttaagt ctatctctat caacttttct tggttttgtt ccttttactt + 1261 ggtggtttag ctctcctgtt ttctctttta gctttaacca gccataaatg gtattacgtg + 1321 agatttggaa aacgtgtgat gcttctgtta tactacctgt tcgctcacaa taagagagaa + 1381 cttttttacg aaaatctatt gaatatgcca taaaaagatt ataccacatt gtgtactata + 1441 ttatattgaa actagaatag tacacatctg cttctaaaat attgttagaa aacgatttga + 1501 ctgtcctgat caatttgtca tgttcttatt tcattttact atatttttgg ttcgcgggaa + 1561 gtctactaag atacttaaag atgcagatag tgaaaaaagg tgtagacatt accgtaaaaa + 1621 agtgatataa tcgtaagatg ttcaatgtat aggtgttaat catgagtaga cgttttaaaa + 1681 aatcacgttc acagaaagtg aagcgaagtg ttaatatagt tttgttgact atttatttat + 1741 tgttagtttg ttttttattg ttcttaatct ttaagtacaa tatccttgct tttagatatc + 1801 ttaatctagt ggtaactgcg ttagtcctac tagttgcctt ggtagggcta ctcttgatta + 1861 tctataaaaa agctgaaaaa tttactattt ttctgttggt gttctctatc cttgtcagct + 1921 ctgtgtcgct ctttgcagtc cagcagtttg ttggactgac caatcgttta aatgcgactt + 1981 ctaattactc agaatattcg ctcagtgtcg ctgttttagc agatagtgag atcgaaaatg + 2041 ttacgcaact gacgagtgtg acagcaccga ctgggactga taatgaaaat attcaaaaac + 2101 tactagctga tatcaagtca agtcagaata ccgatttgac ggttaaccag agttcgtctt + 2161 acttggcagc ttacaagagt ttgattgcag gggagactaa ggccattgtc ctaaatagtg + 2221 tctttgaaaa tatcatcgag ttagagtatc cagactacgc atcgaagata aagaagattt + 2281 ataccaaggg attcactaaa aaagtagaag ctcctaagac gtctaagaat cagtctttca + 2341 atatctatgt tagtggaatt gacacctatg gtcctattag ttcggtgtcg cgatcagatg + 2401 
tcaatatcct gatgactgtc aatcgtgata ccaagaaaat cctcttgacc acaacgccac + 2461 gtgatgccta tgtaccaatc gcagatggtg gaaataatca aaaagataaa ttaacccatg + 2521 cgggcattta tggagttgat tcgtccattc acaccttaga aaacctctat ggagtggata + 2581 tcaattacta tgtgcgattg aacttcactt ctttcttgaa aatgattgac ttattgggag + 2641 gggtagatgt tcataatgat caagagtttt cagctctaca tgggaagttc catttcccag + 2701 tagggaatgt ccatctagac tctgagcaag ctctaggttt tgtacgtgaa cgctactcac + 2761 tagccgatgg agaccgtgac cgcgggcgca atcaacaaaa ggtgattgtg gctatccttc + 2821 aaaaattaac gtcaaccgaa gcactgaaaa attatagtac gatcattaat agcttgcaag + 2881 attctatcca aacaaatgtg ccacttgaga ctatgataaa tttggtcaat gctcagttag + 2941 aaagtggagg aaattataaa gtaaattctc aagatttaaa agggacaggt cggatggatc + 3001 ttccttctta tgcaatgcca gacagtaacc tctatgtgat ggaaatagat gatagtagtt + 3061 tagctgtagt taaagcagct atacaggatg tgatggaggg tagatgaaat gatagacgtc + 3121 cattcgcata tcgtttttga tgtagatgac ggtcccaagt caagagagga aagcaaggct + 3181 ctcttggcag aatcctacag gcagggggtg cgaaccattg tctctacctc tcaccgtcgc + 3241 aagggtatgt ttgaaactcc ggaagagaag atagcagaaa actttcttca ggttcgggaa + 3301 attgcaaaag aagtagcaga tgatttagtc attgcttacg gggctgaaat ttactacaca + 3361 ccagatgttc tggataagct gggaaaaaag cggattccga ccctcaatga tagtcgttat + 3421 gccttgatag aatttagtat gaacactcct tatcgcgata ttcatagcgc cttgagcaag + 3481 atcttgatgt cgggaattac tccagtcatt gcccacattg agcgctatga tgctcttgga + 3541 aataatgaaa aacgcgttcg agaactgatt gatatgggct gttacacgca agtaaatagt + 3601 tcacatgtcc tcaaaccaaa actttttgga gaacgttata aattcatgaa aaaaagagct + 3661 cagtattttt tagagcagga tttggttcat gtcattgcaa gtgatatgca caatctagac + 3721 ggtagacctc ctcatatggc agaagcatat gaccttgtta cccaaaaata cggagaagcg + 3781 aaggctcagg aactttttat agacaatcct cgaaaaattg taatggatca actaatttag + 3841 gagaaatgat gaaagaacaa aacacgatag aaatcgatgt atttcaatta tttaaaacct + 3901 tgtggaaacg caagctaatg attttattag tggcacttgt gacaggtgcg ggggcttttg + 3961 catatagcac ttttattgtt aagccagaat atacgagtac cacgcgaatt tacgtagtga + 4021 atcgcaatca aggagacaag 
tcggggctga caaatcagga tttgcaggca ggatcttatc + 4081 tggtaaaaga ctaccgtgag attatccttt cgcaggatgc attggaaaaa gtagcgacaa + 4141 atttgaagtt ggacatgcca gcaaaaacgt tagctagcaa agttcaagtg actgtaccaa + 4201 ctgacactcg tatcgtctca atctctgtca aggataaaca gccagaggaa gccagtcgta + 4261 tcgctaattc tctacgagaa gttgctgtag aaaagatcgt cgctgtaacg cgagtatctg + 4321 atgtaacgac acttgaagaa gcgcgaccag ctacgactcc ttcttctcca aatgttcgac + 4381 gcaattcctt gtttggtttt cttggaggag cagtcgtaac agtaattgct gttcttttga + 4441 ttgagttgtt cgacacccgt gtgaaacgtc ctgaagatat tgaagatgta ctgcaaattc + 4501 cacttttagg gctcgttcca gatttggaca aaatgaaata ggaggaagtt atgccaacgt + 4561 tagaaatctc acaggcaaaa ttggattttg taaaaaaggc agaggaatat tataactctt + 4621 tgtgcacgaa cctacagtta agtggagatg gtttgaaagt attttctatc acttctgtga + 4681 aactaggaga aggaaaatca acgacttcca ccaatatcgc ttgggctttt gcgcgtgcag + 4741 gttacaaaac gctgctgatt gatggagata ttcgcaattc tgttatgtta ggtgtcttta + 4801 aagcaaggga taagattaca ggcctgacag aatttttatc aggaactaca gacctatcac + 4861 aagggctttg tgataccaat atcgaaaatc tctttgtaat tcaggctggc tctgtgtcac + 4921 cgaatccgac agctcttctt caaagtaaga atttcagtac aatgcttgaa accttgcgta + 4981 aatattttga ctacatcatt gtagatacag ctcctgtcgg tgtcgtgatt gatgcggcta + 5041 ttattacgcg aaaatgcgat gcttctattt tagtgacgga ggcaggtgaa ataaatcgac + 5101 gggatattca aaaagcaaaa gaacagttgg aacacacagg gaagccgttt ttgggagttg + 5161 tgttgaataa attcgatact tcagtagaca aatacggttc ttatggagat tacgggaaaa + 5221 ataaaaaata ggtcggggga tagagatgaa tggaaaaaca gtaaagtctt cattggccat + 5281 aatccagagt tttcttatta ttttattgac ttatctactt agtgctgtga gagaagcgga + 5341 gattgtttca acaacagcta ttgcacttta tatcctccat tattttgtct tttatatcag + 5401 tgattatgga caagatttct ttaaaagggg atatttgatt gaacttgtcc agacattgaa + 5461 atatatccta ttctttgcac tagcgattag tatttctaat tttttcttag aggatcgatt + 5521 tagtatttcc agacgaggca tgatttactt cctcacatta catgctctct tagtctatgt + 5581 gctaaaccta tttatcaagt ggtattgtaa gcgggcttat ctcaacttta aaggaagtaa + 5641 gaagattctc ctacttacag caacttctcg tgtcgaaaag 
gtactggata gattaataga + 5701 atcaaatgag gttgttgggg agttggtagc cgtcagtgtc ttagataaat cagattttca + 5761 gcatgattgt ttaaaggtag tagcagaggg ggagatagta aactttgcga ctcatgaggt + 5821 ggtcgatgaa gtctttatca atcttccgag tgaaaaatac aatattggag agcttgtctc + 5881 tcagtttgaa acgatgggaa ttgatgtaac agttaatcta aatgcttttg gttgtagttt + 5941 ggcacgtaac aagcaaattc gtgagatggc aggattaaac gttgtgactt tttctacaac + 6001 attttataag actagtcatg taattgctaa gcggattatt gatatcatgg gtgcattggt + 6061 agggctgata ctatgtggtt tagtcagtat tgtactggtt cctttgattc gaaaggatgg + 6121 gggctctgct atttttgctc agacgcgtat aggaaaaaat ggtcgtcagt tcacttttta + 6181 taagtttcgc tctatgtgtg tagatgccga ggcgaaaaaa agagaactca tggaacaaaa + 6241 taccatgcag ggtggaatgt ttaaggtgga cgatgatcct cgtatcacga aaattggtcg + 6301 ttttatacgg aagactagct tggacgagct accacaggtt tataatgttc taaagggaga + 6361 tatgagtttg gttggcacac ggccaccaac agtggacgag tatgaacact ataccccaga + 6421 acaaaaacgt cgtctgagtt ttaaacctgg cataacaggc ttatggcagg tcagcggacg + 6481 aagtgaaatc aaaaatttcg atgaagttgt caaattagat gtagcctata tagacgattg + 6541 gacaatttgg aaagacattg aaattttatt gaagacagtt aaagtagtat ttatgagaga + 6601 tggagcgaag tagtttactt ttgttttaga ctactaggag aaaaatgaag aagtcagttt + 6661 atatcattgg ttcaaagggg attcctgcca agtatggagg atttgaaacc tttgttgaga + 6721 aattaacaga atatcaaaaa gatgggaaca tccaatacta tgttgcctgc atacgcgaaa + 6781 attctgcaaa atcaggattt acagcagata catttgagta caatggtgct atttgttaca + 6841 acattgatgt gcctaatatt ggtcctgcta gagccattgc ttacgatatt gcagcggtca + 6901 ataaggctat tgaattggct aagggaaaca aggacgaggc tcccattttt tacattctag + 6961 cttgtcgtat cggacctttt atttctggac ttaagaaaaa aattcgttcg atcggaggcc + 7021 gtttgctggt aaatccagat ggtcatgagt ggcttcgggc taaatggagc ctgccagttc + 7081 ggaagtattg gaaattttcg gaacagttga tggtcaaaca tgcagattta ttagtctgtg + 7141 atagcaaaaa tatcgaaaaa tatgtccgag aggactataa acagtatcag cccaagacga + 7201 cctatatcgc ttatggtaca gatactaccc cttcaagtct gaaatcagaa gatgccaaag + 7261 ttcgaaactg gtatcgtgaa aagggagtaa gcgaaaatgg ctattatcta gtggtgggac + 7321 
gatttgttcc cgaaaacaac tatgagacca tgattcgtga atttatgaag tctaattcta + 7381 aaaaagactt tgttctcatt acaaatgtgg aacagaataa gttttacgat cagttgctca + 7441 aagatacagg cttcgacaaa gacccgagag tcaaatttgt tgggactgtc tatgaccaag + 7501 aattgctcaa atacatccga gagaatgctt ttgcctattt tcacggtcat gaagtgggag + 7561 ggaccaatcc atccttgctt gaagcattgg catccactag gcttaatcta ttactagatg + 7621 taggttttaa ccgtgaagtc ggagagaatg gtgccatcta ttggagaaaa gatgagctag + 7681 cgcgcgttat tgaagcagtg gagcaatttg atgagaacgc catttctgaa ctagataaaa + 7741 aatctagcca acgaattgca gaagctttta cgtgggaaga gatagtggtg gattatgagg + 7801 aagagtttga agggggaaaa agtgagtaac aagcaaattg cgattatgat ggcaacttat + 7861 aatggagcta aatacattgg agaacagata gactctattc ttaggcaaac ttatcaagat + 7921 tggaaattat ttatccatga cgattgttca aatgatgcta cttttcaaat ccttcagcaa + 7981 taccaagaaa aataccctaa aaaaattaag gttatcacag attcctctgt tatagggggg + 8041 agctcagaga aaaattttgc agctattcaa aaatgggtga cgaataatca tgatttttct + 8101 tattttatgt ttgcagatca agatgatttt tggtttccaa ataagattga gcgctcactt + 8161 tataaaatga aagaatcaga aaaggatgat ttacctattt tagttcatac tgatttagaa + 8221 gttgttgatg ataatttaaa tataattaac gattctttct tcgaatatcg tgccttagat + 8281 gtagatgtga cagaattgaa tcgtatactt atacaaaata acattacggg ttgtacaatg + 8341 ttatggaata gaagtttaaa caatctgtta gatttgaata gtaatgcagt agctatgcat + 8401 gattggtgga taagtttagt tgctgctagc tttgggaaaa ttgtttgcct taaagaacca + 8461 acaattaaat atcgtcaaca cggtgggaat gttgtggggg cgacacaagt caatacttta + 8521 ggttttatta tcaagaggtt gttaggaaat tctcatgtca aggaaacttt gaagctatca + 8581 tttgaacaag cagaatcatt tttaaaagtt tatcagaatt ctctaagtaa tgaggagaca + 8641 gatattattc gtgaatttat cagcattcca cataagcata aattggcgag aataagcact + 8701 gttataaaag gaggctatct aaagcaaagt gtggtgcaag taatcggtga gttaatgttt + 8761 atttagattt ttggagaaaa aatgaaaatt aattttatcc ttccatttaa gagaatgaca + 8821 ggtggaataa gagttatcta tacctatgca aattacctta ttgatcaagg acatgatgtg + 8881 gtttgttatg ttcctatgat tagttataga ggtagaaacc agacaatttt ttatcggata + 8941 aaagcttctt tggggaatac 
tctaaaaaac gataattggt ttgataagaa gtttgattta + 9001 aaacggatac cagtggtatc agaaaaatat atacgtgatg cagatgtagt aattgcgaca + 9061 gcttggcaaa cagcctatga tgtcgcaaat ttctcatcaa gcaaaggtca caaattttat + 9121 tttattcaag attatgaaat cttcaatgga ggaaaggaag aggtggaggc atcgtatcgc + 9181 ttgccactta cattaattac tgttacgagg agtttaaaaa aagctattca aaagtttaca + 9241 gataaaacta tttatgttgt atataatggt ctttctgaca acgagtatct tcatacagaa + 9301 aaaattagtc ataaggacct cactttgatg atgatgtatc atgaaagtga gcataagaaa + 9361 agtcaagagg ggttacaaat tatcgcaaaa ttaaagaagc gatatcctga tatgaagatt + 9421 aatatatttg gacgccgtat tccagaaaag ttacctgata cctataatgt gttgattaat + 9481 cctgaaagag aaaaaatttt aaagatgtat caggaatcgg atgtctatct ttttacaagt + 9541 gaaattgaag catggggact acctattgta gaagccatgg caaataaatg tgcagttgtt + 9601 ggtagaagtc gaggagcttt gttggaactc tcaaatggtc agaatactat agttgtagaa + 9661 gagttatcag aaatatataa taaggtagta catttacaag aggatcgatt attgttggca + 9721 caagttcaaa atgaagggta taaaactgtt ataccactaa attggagtaa ctcttgttta + 9781 gaatttgaga agattatatc aggggtatat attgaaaacg gtaaatagta taacaaatta + 9841 tattttatta ttagtatgga tagttataat gctctctcta tatacaggaa atggtgttac + 9901 tcctgttatt gttattttat tttttttgtc ggcattgtat tctttatatc gaaaaagcaa + 9961 attaagtata aatttaaatt ttttgtttat atatattttt ttagcctact atttgttatt + 10021 aacagttata ttcacacaag atttattggt gatgacttct aaatttatat tatttccaat + 10081 atttgtttat tatataatac ctaaaaatat aaatggcgtt ataagaatac tatctatttt + 10141 taaatctttc attggtttta ctgctatttt tggattatat gaatatatgc aacatttcaa + 10201 tcttatggtg aattttgtaa aaatagatgc agttaaatgg atacaaacga tgaatttgaa + 10261 tagtgtgtat tatcccagtt caatatttct ccactacacc tattttgcat atgttttgtt + 10321 actagctttt attttggtaa ttgttatccc atataagaac cgagtgttaa atttagttta + 10381 taaaacactt attgcaattt caattttttt gccccaatct cgtatagttt ggatagcttt + 10441 tggggtaatt ttaattcttt cgtttatact aaatagacag gggatattaa cctatagaaa + 10501 gttgagtgtt atagtactta ttttaattat agtagtctct ctctgcctat attttgatgt + 10561 gtttgcgttt atttctaatt atataagttt 
aagattttct tcactttatc gttatggact + 10621 ggctgatggt tctctaggtc aacgtattgg aactcttaga aattgggaaa attatttaga + 10681 ctctgatact ataaaggcta ttattgggtc aggatttggt ggtgtcaata gttacttgag + 10741 tacttattca ttttttaatg gctatactac agctgattca acagtgacaa gtttccttat + 10801 tgatactggg gttattggct tatttatctt tttattatct atgtttcaga tattagtaat + 10861 agtggtaaaa ggaaaaggaa tttttagaga attagcgtta tatactattg tagcttcttc + 10921 tatagttagt ttaacaattg atttttgggc aaattatgtt attcttcata tattttacgt + 10981 ggttattatc tgtgcattta taggaatgag attgactaag caagaaaaat aaaaatggat + 11041 ggggaaattc aaggttgtat gataatgtgc agaaggcata tggaatagtt gttttttaga + 11101 tttttaattt attttttaat acataatttt ctgtttttat ctaaaattaa ggaaggataa + 11161 tatgacaaaa agtatcttat attttttatc tacatctgat atatcatcgg gagctacccg + 11221 gtcattgtta cgattagttt cgatagttga ggattcagac tttagggtta ttatcatttt + 11281 accagaacat ggaaatgtgg aagatgagct tgtaaacaaa ggaattaaat actatgttgt + 11341 aaaacaatat atttggaatt attggataaa atatctcagt catactaaaa atatttttta + 11401 ctatttgaaa ttgccgttaa agtatttatt aaacagaata tcgtttcaca aaatcaacag + 11461 aattataaaa aaagaaaaag ttgatattat tcatatgaat acgttgactt cttttttagg + 11521 agctcaggca gcaatcaaac agagaaaaat attaatatgg catataaggg agtttatgga + 11581 agaggactta ggaattgaat tttgtaatag aaaaaaagca attgatttaa taaataaatc + 11641 aacatgtgta atttctatat ctgattcaat ttctaaaaat ttttccaacg aagttttggc + 11701 ttataaaaaa gtcattcata atggtttatc aattgatgac tattttatag ataaagtcgc + 11761 atttcagaac caaaagatta acattttatc ttcaggtaga attacgcctg gaaaagggca + 11821 ggttgattta gttagagcga tagctaatct tcctgagaga tataaacaga tgtttaaagt + 11881 tgatattata ggaatagttg aaagcgaaga atattttaaa gaaataaaag aagttatttc + 11941 aaattataaa cttgacggta ttgagtttca tggttttcaa tctgatccaa ctgatttttt + 12001 cagaaaatgt gatatcgtat gtgtgtgttc caaaaaagaa gctttcggtc gtattacagt + 12061 tgagggaatg ttgtctggag cgttagttat tgggacaaat tcaggtggta caaaagagat + 12121 aatttctaca ggagaaacag gatatctgta tgaaccagga gattatatgc agcttagtga + 12181 aattttaaaa actataataa acaataggag 
ttccatcttg gaaattgctt tgagaggaca + 12241 agagaaggct acattacgtt tttcagataa aaataatgcc atgcagatca tgcaactata + 12301 taaggaacta gaaaattgag tagaagatat aattacttac taaaaaatat tggattacta + 12361 actttaagca actttggttc taaaatttta gtctttttaa tggttccgtt atatacaagc + 12421 gtactatcta catctgatta tggaacatat gatttattta atacgacaat ctcattgcta + 12481 attccaatta tttcaattaa tatttctgaa ggggttcttc gatttgcatt agatgaaaaa + 12541 aatgacagta gtatagtata ttcaattggc tggaatatta taataaaagg tttcttagtt + 12601 gtagtattag gaattatttt caataatatc tttaatatat tcccattact taaagaaaat + 12661 tccataactt ttttattact ttatttatca actattgttt atcaatttct ttcttcattt + 12721 attagaggta tagataaagt ttctatatta tcaattgctg ctattctcaa tacaatttct + 12781 atattggggt ttaacattct atttcttata attatacctc taggtttggt tggatatttt + 12841 tggtctaata tattgggttt ggtgctacct agtttatact tgatatataa gatatctcaa + 12901 tataacatta agtacactag ccttcagaat aaaaagttac agcaaagact tgttagttac + 12961 agtattccct taatcttaaa ttcattaggt tggtggatta ataatgcaat agatagatac + 13021 gtagttattg cattttgtgg tgtagcggtg aatggcatct attcagttgg ttataaaatc + 13081 ccatcaattt taaatatttt tgcaaatata tttaaccaag cgtggatatt atcatctgta + 13141 aagtcttatc gtgatgaaga tagtgaatat ttcttttctc aagtttataa taagtataac + 13201 atgattatgg tattaatttc cgggctacta atttcttgta gtaaaatact tgctaagttt + 13261 ctatatatga atgaatttta tgatgcttgg aagtttgttc cgtttttact aattgcaaat + 13321 gtttttggag ctatttcagg atttgctggt ggaatttttt ccgcggttaa agattcaaaa + 13381 atatatagtc agtcaacctt agtaggagcg atagtgaata ttattttcac atttgttttt + 13441 gtatattatt atggagctat aggtgctgct attgccacta tgatatctta ctttgttgtt + 13501 tggataatac gtgttcatac aatgagaaaa tatataaagt taaaaatttt tattagaaga + 13561 gatgtatttt cctatgtatt gcttattttt cagtcaatag tcttatggtt ggaaaatagt + 13621 tatattcttt atcctataca agttgtgtta ttcttattat tagttatgtt attttataaa + 13681 gaaataaaga gtattattgg tgaattaaaa aagtttctaa cataagaacc aataagtacg + 13741 agtattgaaa ggagaaaaat gtgaaaatag cagtagcagg tacgggatat gttggtctat + 13801 ccattgcagt tttattgtct caacaacatc 
aagtaatggc ggtggacatt attcctgaga + 13861 aggtcgaatt aattaatcaa agaaagtcac ctattcaaga tgactatata gagaaatatc + 13921 tggcaaaaaa ggatttaaat ttagtggcta cattggatgc aaaagaagca tatcaagatg + 13981 cggattttgt tgtgattgca gctccaacta actatgatcc aaagaagaac ttttttgaca + 14041 cttctgctgt agagtctgtc attgaaacgg cgcttaaata taatccagat gccatcatgg + 14101 tcattaaaag tacagttcca gttggttata cagagtcagc tcgaaagaaa tttcagactg + 14161 aaaatatctt atttagtcct gaatttttgc gtgagtcaaa ggcgctttac gataacttat + 14221 atcccagccg tattatttta gggacagata aaaataatga acgcttggta agtgctgctg + 14281 agacatttgc gagattgctc caagaaggcg ctttaaaaga aaacattgat acattataca + 14341 tgggctttac tgaagctgag gcggtcaagc tttttgcaaa tacttacctt gctttgcgtg + 14401 tttcttattt taatgagctg gatacttatt ctgagatgaa ggggctagac actcaagcta + 14461 ttattgatgg agttggtttg gatccccgta ttggttcgca ctacaacaat ccttccttcg + 14521 gctatggtgg ctattgtctt cctaaagata ccaagcaact tcttgccaac tatgaagata + 14581 taccagaaga acttatagga gccatagtac ggagcaattc gacacgtaaa gactttattg + 14641 ctgatcaggt tcttaagatg gtagattatt atgattattc agcccataat attttcgatg + 14701 agagagtaga aaaagatatt attattggca tctatagatt gaccatgaag agtaatagcg + 14761 ataattttcg tcaaagctct attcaaggta ttatgaaacg tataaaagct aagggagtaa + 14821 gagtagttat ttatgaaccc actttagaaa gcgggagtac attttttgga agttccgtta + 14881 tcaatgattt agaggaattc aaacgactga gtaatgccat tgttgctaat cgctatgata + 14941 actcattaga agatgtcaag gaaaaagtct atacacgtga tatttttgaa agagattaat + 15001 ttagtataat aaaaatgaaa aaaataattg ttagaagcgg tccatactga gaagcaatgg + 15061 gaacgctcag cgacagaact tcctccattt atcattaaac gccttccagt tcgtttaacc + 15121 tttgataata actattttaa cgaccgttat caagtgattc ctattggtgg atacaatgtg + 15181 attattgaaa atatacttaa agacgtagaa gttgggctag gagtggattg ctttgactat + 15241 cgtgaagagc tggaagcatc tgctaacaaa gttgctttta caggaatgat tgaccagtat + 15301 tttgattata agcatggtga gctagagtat cgcagtttac gttttaagca cgaagtgctt + 15361 gatgaggaaa atcaccaagg aaatgctgta gtgaactata cagatcgtga gattccttat + 15421 actcgtatca ttgagcataa aaaatttgag 
tatggtctgc agcctaagac agtcataacg + 15481 catgaatatc cagctgactg gaaacgtgga gatgaaccat attatccaat taatgatgag + 15541 aaaaataatg ctatcttttc taaataccac gaagaagctt cacagaatga taaggttatc + 15601 ttctgtggac gtttagcaga ttataaatat tagtggtgat tgaacggata cttagtgtag + 15661 tagaggaaga atttagtaat taaaaaacaa cgaagaaagg ttatttcatt atgaaaggta + 15721 ttattcttgc gggtggctca ggtacccgtc tgtatccact tactcgagct acatcgaaac + 15781 agctgatgcc ggtttatgat aaacccatga tttactatcc tctgtcaact ttgatgttgg + 15841 cgggtattaa ggatattttg attatttcaa cgccacagga tttgccgcgc tttaaggact + 15901 tgctcttgga tggttccgaa tttgggatca gactttccta tgcggaacag cctagtccag + 15961 atggccttgc tcaggccttt cttatcggtg aggattttat tggtgacgat agcgttgctt + 16021 taatcttggg tgacaatatt tatcacggtc caggtttgag caagatgctc caaaaaactg + 16081 tttcgaaaga aaagggtgcg actgtttttg gttaccaagt gaaggatcca gaacgctttg + 16141 gtgttgtaga atttgatgaa aatatgaatg ctatttccat agaagaaaaa ccagagtgtc + 16201 ctcgctccaa ctatgcagtg acaggactgt atttctatga taacgatgtt gtcgaaattg + 16261 ccaagagtat caaaccaagt gctcgtggtg agttagaaat cacagatgtc aacaaggctt + 16321 acttggatcg tggtaattta tctgtcgaag tcatgggacg tggctttgct tggcttgata + 16381 caggaaccca tgaaagcttg ttggaagcct ctcaatatat tgaaacggtt caacgcatgc + 16441 aaaatgttca agttgccaat ttggaagaaa tcgcctatcg catgggttat attagtcgtg + 16501 aagatgtgct ggagttggcg caacctctta agaagaatga atacggacag tatctgctcc + 16561 gtttgattgg agaagtctag atgacagata attttttcgg aaaaatactt gcggtgcgta + 16621 aaattgatgc cattccaggt atgttagagt ttgatatccc agttcatggt gacaatcgtg + 16681 gctggtttaa ggaaaatttc cagaaggaaa agatggagcc acttggcttt cctgaaagct + 16741 tctttgctga agggaaacta caaaataacg tcagcttttc tcgcaaaaat gtccttcgag + 16801 gcctccacgc agagccttgg gataagtaca tctctgtagc agatggaggg aaagttctgg + 16861 gttcttgggt tgatctacgc gagggtgaaa cctttgggaa tacctatcag acaataattg + 16921 atgcaagcaa gggaatcttt gttcctcgag gcgtagctaa tggcttccaa gttttatcag + 16981 atacagtgtc atatagctat ctggtcaatg attattgggc tcttgaactc aaacccaagt + 17041 atgcctttgt gaactacgct gatccaagcc 
ttggtattga atgggaaaat attgcagaag + 17101 cagaggtttc agaagcagat aaacatcatc ccctacttaa ggatgtaaaa cctttgaaaa + 17161 aagaagattt gtaaaaagga aagaatatga ctgaatacaa aaatattatc gtgacaggtg + 17221 gagctggctt tatcggttct aactttgtcc attatgttta cgagaacttt ccagatgttc + 17281 acgtgacagt cctagataag ttgacttatg ctggaaaccg cgcgaatatt gaggaaattt + 17341 taggtaatcg tgttgagtta gttgttggtg acattgctga tgcggagttg gtagacaagt + 17401 tggctgctca agcagatgct atcgttcatt atgcagcgga aagccacaat gataattcgc + 17461 tcaatgatcc atcgccattt attcatacta acttcatcgg aacctatact cttttagaag + 17521 ctgctcgtaa gtatgatatt cgcttccacc atgtatcgac agatgaagtt tatggggatc + 17581 tccctttacg cgaagatttg ccaggtcatg gtgaaggacc aggtgagaaa tttactgctg + 17641 aaacaaaata caacccaagc tcgccttact catcaaccaa ggccgcatca gacttgattg + 17701 tcaaagcctg ggtgcgttct tttggagtca aggcaacgat ttccaactgt tcaaataact + 17761 acggtcctta tcaacatatc gaaaaattca tcccacgtca gattactaac atcctaagtg + 17821 gaattaagcc aaaactttac ggtgaaggta agaatgttcg tgactggatt cataccaatg + 17881 accattcttc aggagtttgg acaatcttga caaaagggca aatcggtgaa acctacttga + 17941 ttggggctga tggtgagaag aacaataagg aagttttgga gcttatcctt aaggaaatgg + 18001 gacaagctgc ggatgcctat gatcatgtga ctgaccgtgc aggacatgac cttcgctatg + 18061 cgattgatgc tagcaagctc cgtgatgagt tggggtggaa acctgaattt accaactttg + 18121 aagctgggct caaggcaaca atcaagtggt atacagataa ccaagaatgg tggaaagcag + 18181 aaaaagaagc tgttgaagcc aattatgcta agactcagga gattattaca gtataaaaag + 18241 caggaaatag ctgcttttta ttgctatatt gggaagagtt acatattaga aaggtctaga + 18301 gatgatttta attacagggg caaatggcca attaggaacg gaacttcgct atttattgga + 18361 tgaacgtaat gaagaatacg tggcagtaga tgtggctgag atggacatta ccgatgcaga + 18421 aatggttgag aaagtttttg aagaggtgaa accgacttta gtctaccact gtgcagccta + 18481 caccgctgtt gatgcagcag aggatgaagg aaaagagttg gacttcgcca tcaatgtgac + 18541 ggggacaaaa aatgtcgcaa aagcatctga aaagcatggt gcaactctag tttatatttc + 18601 tacggactat gtctttgacg gtaagaaacc agttggacaa gagtgggaag ttgatgaccg + 18661 accagatcca cagacagaat atggacgcac 
taagcgtatg ggggaagagt tagttgagaa + 18721 gcatgtgtct aatttctata ttatccgtac tgcctgggta tttggaaatt atggcaaaaa + 18781 cttcgttttt accatgcaaa atcttgcgaa aactcataag actttaacag ttgtaaatga + 18841 ccagtacggt cgtccgactt ggactcgtac cttggctgag ttcatgacct acctagctga + 18901 aaatcgtaag gaatttggtt attatcattt gtcaaatgat gcgacagaag acacaacatg + 18961 gtatgatttt gcagttgaaa ttttgaaaga tacagatgtc gaagtcaagc cagtagattc + 19021 cagtcaattt ccagccaaag ctaaacgtcc gctaaactca acgatgagcc tggccaaagc + 19081 caaagctact ggatttgtta ttccaacttg gcaagatgca ttgcaagaat tttacaaaca + 19141 agaagtgaga taagtagtag aatgattttc tagtctaata aaagaggcag ataatgaact + 19201 ccaaaggagc ttaagatgta cgattatctt gttgttggtg ctggtctctt tggcgcatag + 19261 ctttggctca gtttctatta tcgctcacac catccatcag aagtttaatc tgaaggtacc + 19321 caattatcgc caagaagaag attgggctag gatgggttta ccaatcacac gtaaggaaat + 19381 ctctaattgg catatcaagg caagtcaata ctatttagag tccctttata accttttacg + 19441 agaaaagttg ttagaacaac ctcttcttca tgcggatgaa acctcttatc gggttctaga + 19501 gagtgatagc catctgacct actattggac ctttttgtct gggaaatcag agaaacaagg + 19561 gattacgctt taccatcatg atcagcgtcg gagtggttcg gtagtgcaag aattcctagg + 19621 aaattattct gcctatgcga tagcagtcca aagtttagga gcaaggcgac gctaagcttg + 19681 gtaaactacg aaccgctaga agcttatcgt caactggaag aagctgaact tgttggatgt + 19741 tgggcgcatg tgagaaggaa gttttttgaa gcgcccccca agcaagcgga taaatcatcg + 19801 ttaggagcta aaggtttagc ttattgtgat cagttatttg ccttggaaag agactgggag + 19861 gctttgctag ctgatgaacg actacagaaa cgtcaagaag agctccaacc cctaatggaa + 19921 gatttctttg cttggtgccg gcgtcagtca gttttatcgg gttcaaaact aggaagggca + 19981 attgaataca gcctcaagta taaagaaacc tttaagacca ttttaaaaga cggacatctg + 20041 gtcctttcca ataatctagc tgaacgcgcc attaaatcat tggttatggg acggagtaaa + 20101 agagtccagt ggactctttt agcctaagct cagtttaaaa aagtgagggt ggttattttc + 20161 tcaaagtttt gaaggagcta aagcaagagc tattattatg agcttattgg aaacagctaa + 20221 acgtcatcaa ctaaatagcg agaaatatct atcctatctt ctagaatgtc ttccaaacga + 20281 ggaaactctc gtaaacaaag aggttttaga 
ggcctattta ccatggacta aagttgtaca + 20341 agaaaagtgc aaataagaaa tctccagatt aggaactatc cgtgagttct ctagtctgga + 20401 gatttttcaa tatacttcgt tattgggcgc ttacaatgat attcatattt tttgcaaaga + 20461 tgttgtttga aaaataattt tcaaaaattc tgaaaattct gttgacaact ttctgaaaag + 20521 agtctataat ggagagaaag ttttaaagga gaaaatgatg aaaagttcaa aactacttgc + 20581 ccttgcgggc gtgacattat tg +// + diff --git a/public/res/serotype_genbank/serotype_20A.gb b/public/res/serotype_genbank/serotype_20A.gb new file mode 100644 index 0000000..d091165 --- /dev/null +++ b/public/res/serotype_genbank/serotype_20A.gb @@ -0,0 +1,538 @@ +LOCUS JQ653094 18024 bp DNA linear BCT 15-NOV-2023 +DEFINITION Streptococcus pneumoniae strain 6320 CPS gene locus, complete + sequence. +ACCESSION JQ653094 +VERSION JQ653094.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 18024) + AUTHORS Calix,J.J., Porambo,R.J., Brady,A.M., Larson,T.R., Yother,J., + Abeygunwardana,C. and Nahm,M.H. + TITLE Biochemical, Genetic, and Serological Characterization of Two + Capsule Subtypes among Streptococcus pneumoniae Serotype 20 + Strains: DISCOVERY OF A NEW PNEUMOCOCCAL SEROTYPE + JOURNAL J. Biol. Chem. 287 (33), 27885-27894 (2012) + PUBMED 22736767 +REFERENCE 2 (bases 1 to 18024) + AUTHORS Calix,J.J. and Brady,A.M. 
+ TITLE Direct Submission + JOURNAL Submitted (09-FEB-2012) Department of Microbiology, University of + Alabama at Birmingham, 845 19th Street South, Birmingham, AL 35294, + USA +FEATURES Location/Qualifiers + source 1..18024 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="6320" + /serotype="20 alpha" + /db_xref="taxon:1313" + misc_feature 1..18024 + /note="CPS gene locus" + misc_feature <1..544 + /note="similar to transposase" + mobile_element <1..544 + /mobile_element_type="insertion sequence:IS630" + CDS 757..2202 + /note="Wzg" + /codon_start=1 + /transl_table=11 + /product="CpsA" + /protein_id="AFN40474.1" + /translation="MSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLLFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVVVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIELEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSALHGKFYFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + CDS 2204..2935 + /note="wzh" + /codon_start=1 + /transl_table=11 + /product="CpsB" + /protein_id="AFN40475.1" + /translation="MIDIHSHIVFDVDDGPKSIEESKALLREAYNQGVRMIVSTSHRR + KGMFETPEEKIATNFIKVREIAKEVADDLVIAYGAEIYYTLDALEKLEKKEIPTLNDS + RYALIEFSMHTSYREIHAGLSNILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QINSYHVLKPKFFGEKYKFMKKRARYFLERDLVHVVASDMHNLDSRPPYMQQAYDIIA + KKYGAKKAKEFFVDNPRKIIMDQLI" + CDS 2944..3636 + /note="wzd" + /codon_start=1 + /transl_table=11 + /product="CpsC" + /protein_id="AFN40476.1" + /translation="MKEQNTLEIDVLQLFRTLWKRKLVILLVAIITSSVAFAYSTFVI + KPEFTSTTRIYVVNRNQEEKSGLTNQDLQAGSYLVKDYREIILSQDVLEEVISDLKLD + LTPKGLANKIKVTVPVDTRIGSVSVNDRVPEEASRIANSLREVAAQKIISITRVSDVT + TLEEARPAISPSSPNIKRNTLIGFLAGGIGTSVIVFLLELLDTHVKRPEDIEDTLQMT + LLGVVPNLSKLK" + CDS 3646..4329 + /note="wze" + /codon_start=1 + /transl_table=11 + 
/product="CpsD" + /protein_id="AFN40477.1" + /translation="MPTLEIAQKKLEFIKKAEEYYNALCTNIQLSGDKLKVISVTSVN + PGEGKTTTSVNIARSFARAGYKTLLIDGDTRNSVISGVFKSREKITGLTEFLSGTADL + SHGLCDTNIENLFVIQSGSVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTAPIGIVI + DAAIITQKCDASILVTATGEVNKRDVQKAKQQLEQTEKLFLGVILNKFDVQHEKYGSY + GGYGNYGKK" + CDS 4351..5721 + /note="CpsE; glycosyl transferase" + /codon_start=1 + /transl_table=11 + /product="WchA" + /protein_id="AFN40478.1" + /translation="MEGRGFYNITLAFLQSILVSLLAYILIAISETDIALNTVFVLFF + LHFVAFYISGYGKDFFKRGQYIELVETIKYIIFYSLLISFSSLFLKEKFVISRRGMLY + LLFLYGVLNYLLNFFLKSYWRKFTYNLKRSRKILLVTATSRVERVMDCLLLANDVQGK + LVAVSVLDKPEFTHEKLLVVPKEELISYATHEVVDEVFVNLPSEDYDIGAIISQFETM + GGDVTVNLNAFDKNLSRNKRIHEMAGLNVVTFSTNFYKPSHVITKRILDICGAIVGLF + ICGIASIFIVPQIRKDGGSAIFSQTRVGKNGRHFTFYKFRSMRVDAEAIKEQLMDQNT + MQGGMFKIDNDPRVTKIGKFIRKTSLDELPQFWNVLIGDMSLVGTRPPTVDEYEKYTP + EQKRRLSFKPGITGLWQISGRSEITNFDEVVKLDVAYIDDWTIWKDFEILLKTVKVVL + MRDGAK" + CDS 5729..6520 + /note="glycosyl transferase" + /codon_start=1 + /transl_table=11 + /product="WciB" + /protein_id="AFN40479.1" + /translation="MTNIKIIVATHKSFEMPQNKELYFPVHVGCEGKDDLGYQGDNTG + ENISQLNPYYCELTGLYWAWKNLDCDYLGLVHYRRYFTKKTQFYKENLKIDEVILNQE + EIELLLRKGDIIVPKKRKYYIETLCSHYAHTLDASHLDLARKVIEKQQPEYLDSFDKV + MKQRSGYMFNMFIMKKELANNYFEWLFPILDCMFDQINLSELTAFEARLFGRVSELLF + NVWLEKNLYSLVEVPFMYLEKVNLVEKGKSFLMAKFFGKKYGQSF" + CDS 6532..7599 + /note="polymerase" + /codon_start=1 + /transl_table=11 + /product="Wzy" + /protein_id="AFN40480.1" + /translation="MIYIGTMLLSMLIITFIKYFRISKKWKEAVYFWGFIPLILIGAL + RAYVGIDYTTYSLDQIPAVLAGSQTVKFELLDKLVVYIGYYLANQQHYFYIFAIFHII + LMWFLYKYIVQQSSNVMLSVFFLLTTVFFTFSLSGIRQSIATAIVFYALKYIKQKKSL + HYIIYLGIACLFHSSAVIYILFLVLGKININRFVGFALPMIASLFSFSGSEFVSRIIL + HLNFYSEYVGSRYYTGAYDKQHQLFTIVMCLSVFLLYYIVPKKEWVNLKLYLNINFVL + LLVAIIMPILPTPSRTIYMFVLVHVILIPKLISVIKDYRSKVIITMFFVLGYFIFFSI + TVLQRNAYETLPYHTIFEYLW" + CDS 7600..8628 + /note="putative glycosyl transferase" + /codon_start=1 + /transl_table=11 + /product="WhaJ" + 
/protein_id="AFN40481.1" + /translation="MIMKQILISIIIPLHNGEDTIIRAVKSVINSRLYGDLIEIIIVE + NGSTDQSFKISQKLATENSNIRVLKSDKGTSFARNVGIEKSKGKWLIFLDADDYLFES + DLDVIVENLITNNTDLCVYNYEKGLKKIELFSEEVELIDDLDSFIVQSLSEPTKYMTV + WGKAFNKNLIDEYGLKFNTNLRVSEDSDFYLRFLLLIHSLTLTSQTLYHYSIDSPSTM + RTFSSDKLEGYIVSLNESSKVLGNVDNTIQEAFELYKLAHFNLIMVREVFYFDNSKSF + REKIKEMIRLYKMPMFFEPIQNLSVSSVSNLSLVPLFFLKIHLYHLAALVYIIRVGQN + KFKEGRKS" + CDS 8628..9743 + /note="putative glycosyl transferase" + /codon_start=1 + /transl_table=11 + /product="WciL" + /protein_id="AFN40482.1" + /translation="MKRILVFGMNENPGGVESFIMNYFREFNREKLALDFLCNSNDKI + AYEDELISKGARVFHLTARSKNPIRYYWEMYRFFKEYASDYQAIWVNINSLANIDYLK + FARYFGIPVRIVHSHNSQNMDTKLREKLHNHNRDKIEKWATDFWACSHEAAKWFYNEE + TIGKVKIIPNAINMNASIFSSEARDKIRIDYTLDNKFVLGHVGRLHFQKNQEFMIRVL + AKLQEFRDDVCLVLVGQGEDLNKLKILAEELSIQDKVYFVGVQSNISEWLSTFDLFFF + PSNFEGLGIAALEAQVNGLPTLLSEEGVPKEVKINDNTFFYPLKESEESWANFLDEMI + HTTTRLNYEYIQENFEKSGYDIKIAAQNLEKQLLELV" + CDS 9754..10743 + /note="glycosyl transferase" + /codon_start=1 + /transl_table=11 + /product="WcwK" + /protein_id="AFN40483.1" + /translation="MVNNIDFVVTWVNGNDPVWREEKKKYEVLDGRPTLNDETRYRDM + DLFQYWFRAVEKHAPWVNNIYFITYGHLPEWLDANHPKLKIVKHEDYIPKEYLPTFSS + NVIELNLFRIKELSEQFVLFSDDVFINTFLKEEDLFKNNLPRLLSIYRPLIPTKEFDY + INFNHLLIMNRYFHDKKTLSQHKGKFFNVGYGKFNLYNLFSIFYSGIIGYHDAHVAMP + HLKSTFAEIWNKEGVLLDRVCKNKFRSTKDVNHWLMSYWNIETNSFMPQTLRVGEYVP + LAYSGKIESIIHKQKNKFLCINDDEHTENFINEVNFVRKIFEKKFPEKSKFEK" + CDS 10756..11760 + /note="putative glycosyl transferase" + /codon_start=1 + /transl_table=11 + /product="WciD" + /protein_id="AFN40484.1" + /translation="MKKQKILSVVIPSYNAAPFLMETIPTLVSISSRNDIEVLIVNDG + SKDETLQVAQKLEKEYSGIVSIIDKENGGHGSTINAGIREAKGKYFKVVDADDWVDSE + NFEKLVQFLHKTDADEIISPYTDVFEDDGTKVENNYFKDCSLKPYQDYDYVNFLERIQ + ILPRMHSITIKTSILRDNNIKIDENMFYVDMEYIVFPTPFIKTITYTPDSVYQYRRGY + EGQSTSIQNYIKNRKMVNHVTFALLDFYNKHTLSNILEKLVKETIARCVTIMTNVCLS + MEDTKQGKKELLDFDQKLKSINSEFYYHKQGKKAKVLRYSNYFLFDLLSSYSKKSKKV + " + misc_feature 11780..12743 + 
/note="nonfunctional WhaF due to mutation" + CDS 12750..14165 + /note="flippase" + /codon_start=1 + /transl_table=11 + /product="Wzx" + /protein_id="AFN40485.1" + /translation="MKVIKNYAYNLSYQLLVIILPIITTPYVTRVFSSNDLGTYGYFS + SIVTYFILLASLGVANYGTKVISGNRKEIEKNFWGIYSLQMGATLLSLFLYLVLCLTL + PFMQNLVAYILGLSLVSKGLDISWLFQGLEDFRKITVRNITVKLVGVISIFLFVKSAN + DLYLYVFLLTIFELFGQLSMWLPARDFIGKFHVDIEYARQHLKPIILLFLPQVAISLY + VTLDRTMLGALASTKDVGIYDQALKLVNILLTFVTSLGSVMLPRVSHLLATGERKAVN + KMHEMSFLIYNLLIFPIMAGILIVNDDFVQLFLGQDFQDARYAIAIMVLRMFFIGWTN + IMGTQMLIPHNQNKEFMISTTAPAIISVGLNLLFLPKLGYIGAAIVSVLTEALVWVIQ + LFYTRRYLKEVPIIGSMSKIILASAIMYGLLLSSKTVIHFSSTLNVLAFAALGGIIYI + FAILSLKVVDVKELKQIIRKN" + CDS 14167..15165 + /note="putative O-acetyl transferase" + /codon_start=1 + /transl_table=11 + /product="WciG" + /protein_id="AFN40486.1" + /translation="MRKNRNINLDLLKVLACVGVVLLHTTMGGFKETGSWNLLAYLYY + LGTYSIPLFFMVNGYLLLGKREITYLYILQKVKWILITVSSWSFIVWLFKRDFTTNPI + KKIVGSLIQRGYFFQFWFFGALILIYLCLPILRQFLNSKRSYLYSLSLLMTIGLIFEL + SNILLQMPIQTYVIQTFRLWTWFFYYLLGGYIAQFTIEEIESRFKNWMKIVSILLLLI + SPIILFFIAKTIYHNLFAEYFYDTLFVKVSTLGIFLTILMLTLNESRRESIVSLSNQT + MGVFIIHTYIMKVWEKVLGFNFVGAYLLFALFTLSVSFIIVGMLMKIPYFNRIVKL" + CDS 15179..16288 + /note="galactofuranose mutase" + /codon_start=1 + /transl_table=11 + /product="Glf" + /protein_id="AFN40487.1" + /translation="MYDYLIVGAGLSGAIFAYEATKRGKKVKVIDKRDHIGGNIYCEN + LEGVNVHKYGAHIFHTSNKKVWDYVNQFAEFNNYVNSPVANYKGSLYNLPFNMNTFYA + MWGTKTPQEVKDKIAEQTADMKDVEPKNLEEQAIKLIGPDIYEKLIKGYTEKQWGRSA + TELPPFIIKRLPVRLTFDNNYFNDRYQGIPIGGYNVIIENMLKDVEVELEVDFFAHRE + GLEASAEKVVFTGMIDQYFDYKHGELEYRSLRFEHEILDEENYQGNAVVNYTEREIPY + TRIIEHKHFEYGTQAKTVITREYPADWKRGDEPYYPINDEKNNAMFAKYQEEASKNDK + VIFCGRLADYKYYDMHVVIERALEVVEKEFGYDKK" + CDS 16275..17327 + /note="putative O-acetyl transferase" + /codon_start=1 + /transl_table=11 + /product="WcjE" + /protein_id="AFN40488.1" + /translation="MTKSRINWIDFGKGFSIFLVLAGHVLLGLYQSEKFPTANNILSL + LIAQVYIFHIPVFFALSGYFFKPVSDLKEFWQYAKKKTIVFGLPYIFYSIIHFGLQKV + 
AGASVRVPTTISDLLNIYKDPLGVSWYLYILWSILIIYGLLSILVKNRRMLFLISVFA + YCLTLFVQTDIYIIQRTLVWGLCFFLGSVLNEIHFDKINLKKFLFLFVLFDFIYMFAW + FLFYEVGSKKDYVSYSNSGLWGIAFVVCVLVAFAIFPKMEKNFPKTFLYFTKYGKDSL + GIYILHAPICSMIRILMLKVGINSVFLHVVVGIVLGWYLSILATYILKKIPFLNIVLL + PQKYIKLKGSLSTVVG" + mobile_element 17343..>18024 + /mobile_element_type="insertion sequence:IS1761" + misc_feature 17343..17874 + /note="similar to transposase" +ORIGIN + 1 tgttagacct gcaaccaaag aaatcctctg atatcttctt ccagatactt tgcctcttat + 61 taactgacct tttaatgagc gaccatattc tcgataaaaa taagtatcga atcctgtttc + 121 gtcaatctaa acaggtgcta ggtgctttaa tctattaaaa ttcttaagaa ataaggctac + 181 tttttctggc tcttgttcat agtaggtgtg gttctttttt tcgagtgtag cccatagctt + 241 tgagcgcata gtggatggta gttggatgac agccaaattc agaagctatt tcagtcaaat + 301 aagcgtctgg attgtcagta agatagtttt taagtctatc tctatcaact tttcttggtt + 361 ttattccttt tacttggtgg tttagctctc ctgttttctc ttttagcttt aaccagccat + 421 aaatggtatt acgtgagatt tggaaaacgt gtgatgcttc tgttatacta cctgttcgct + 481 cacaataaga gagaactttt ttacgaaaat ctattgaata tgccataaaa agattatacc + 541 acattgtgta ctatattaga ttgaaactag aatagtacac atctgcttct aaaacattgt + 601 tagaaatcga tttgactgtc cttatttcat tttattatat ttttggttcg cgggaagtct + 661 actaagatac ttaaagatgc agatagtaaa aaaaatgtag acattaccgt aaaaaagtga + 721 tataatcgta tgatgttcaa ggtataggtg ttaatcatga gtagacgttt taaaaaatca + 781 ggttcacaga aagtgaagcg aagtgttaat atcgttttgc tgactattta tttattgtta + 841 gtttgttttt tattgttctt aatctttaag tacaatatcc ttgcttttag atatcttaac + 901 ctagtggtaa ctgcgttagt cctactagtt gccttggtag ggctactctt gattatctat + 961 aaaaaagctg aaaagtttac tatttttctg ttgctgttct ctatccttgt cagctctgtg + 1021 tcgctctttg cagtacagca gtttgttgga ctgaccaatc gtttaaatgc gacttctaat + 1081 tactcagaat attcaatcag tgtcgttgtt ttagcagata gtgatatcga aaatgttacg + 1141 caactgacga gtgtgacagc accgactggg actgataatg aaaatattca aaaactacta + 1201 gctgatatta agtcaagtca gaataccgat ttgacggtca accagagttc gtcttacttg + 1261 gcagcttaca agagtttgat tgcaggggag actaaggcca ttgtcctaaa tagtgtcttt 
+ 1321 gaaaacatca tcgagttaga gtatccagac tacgcatcga agataaaaaa gatttatacc + 1381 aagggattca ctaaaaaagt agaagctcct aagacgtcta agaatcagtc tttcaatatc + 1441 tatgttagtg gaattgacac ctatggtcct attagttcgg tgtcgcgatc agatgtcaat + 1501 atcctgatga ctgtcaatcg agataccaag aaaatcctct tgaccacaac gccacgtgat + 1561 gcctatgtac caatcgcaga tggtggaaat aatcaaaaag ataaattaac ccatgcaggc + 1621 atttatggag ttgattcgtc cattcacacc ttagaaaatc tctatggagt ggatatcaat + 1681 tactatgtgc gattgaactt cacttctttc ttgaaaatga ttgacttatt gggaggggta + 1741 gatgttcata atgatcaaga gttttcagct ctacatggga agttctattt cccagtaggg + 1801 aatgtccatc tagactctga gcaggctcta ggttttgtac gtgaacgcta ctcactagcc + 1861 gatggagacc gtgaccgtgg tcgcaaccaa caaaaggtga ttgtggctat ccttcaaaaa + 1921 ttaacgtcaa ccgaagcact gaaaaattat agtacgatca ttaatagctt gcaagattct + 1981 atccaaacaa atatgccact tgagactatg ataaatttgg tcaatgctca gttagaaagt + 2041 ggagggaatt ataaagtaaa ttctcaagat ttaaaaggta caggtcggac ggatcttcct + 2101 tcttatgcaa tgccagacag taacctctat gtgatggaaa tagatgatag tagtttagct + 2161 gtagttaaag cagctataca ggatgtgatg gagggtagat gaaatgatag acatccattc + 2221 gcatatcgtt tttgatgtag atgacggtcc caagtcaata gaggaaagca aggcactttt + 2281 aagagaagct tataatcaag gagttcgaat gattgtgtct acttcgcatc gtcgaaaagg + 2341 gatgtttgaa actccagaag aaaaaattgc aacaaatttt attaaggttc gtgaaattgc + 2401 aaaagaagta gcagatgatt tagtcatagc ttatggcgca gagatatact atactctgga + 2461 tgctctagaa aagctagaaa aaaaagaaat tcctaccctt aatgatagtc gttatgcttt + 2521 gattgagttt agcatgcata cttcctatcg tgagattcat gcgggattga gcaatatttt + 2581 gatgttggga atcacgccag taattgctca tattgaacgt tatgatgcct tagagaataa + 2641 cgaaaaacgt gttcgtgaac tgattgatat ggggtgctat actcagataa atagttatca + 2701 tgttttaaaa cctaagttct ttggtgaaaa atataaattc atgaaaaaga gagctcggta + 2761 ttttttggaa cgtgatttag ttcatgtagt tgcaagtgac atgcacaatt tagacagtag + 2821 acctccatat atgcaacagg catatgatat cattgctaag aaatatggag cgaaaaaagc + 2881 gaaagaattt tttgtagata atcccagaaa aattataatg gatcaattaa tttaggagaa + 2941 aatatgaagg aacaaaacac 
tttggaaatc gatgtattgc aactattcag aactttatgg + 3001 aaaagaaagt tggtcatttt attagtggca attataactt cttcagttgc ttttgcctac + 3061 agtacttttg ttatcaaacc tgagtttact agtacgactc ggatttatgt agttaaccgt + 3121 aatcaggaag agaagtctgg tttaaccaat caagacttgc aggcaggatc atacttggtc + 3181 aaagactatc gtgaaattat cctatcgcag gatgttttgg aggaagttat ttctgatttg + 3241 aaactagatt tgacgccaaa aggtttggct aataaaatta aagtaacagt accagttgat + 3301 acccgtattg gctctgtttc agttaatgat cgagttcctg aagaggcaag ccgtatcgct + 3361 aactctttga gagaagtagc tgctcaaaaa attatcagta ttactcgtgt ttctgatgtg + 3421 acaacactgg aggaagcaag accggcgata tcaccatctt cgccaaatat taaacgcaat + 3481 acactaattg gttttttggc aggggggatt ggaactagtg ttatagtttt tcttcttgaa + 3541 cttttggaca ctcatgtgaa acgtccggaa gatatcgaag atacactgca gatgacactt + 3601 ttgggagttg taccaaactt gagtaagttg aaataggaga gaggaatgcc gacattagaa + 3661 atagcacaaa aaaaactgga gttcattaag aaggcagaag aatattacaa tgccttgtgt + 3721 acaaatatac agttgagcgg agataaacta aaagtaattt ccgttacttc tgttaaccct + 3781 ggggaaggaa aaacaactac ttccgtaaat atagcaaggt cgtttgcgcg tgcaggctat + 3841 aaaactcttt tgatcgatgg cgatactcga aattcagtta tatcaggagt ttttaaatcg + 3901 cgtgaaaaaa ttacagggct aacagaattt ttatctggga cagctgattt atctcacggt + 3961 ttatgtgata caaatattga aaatttattt gtaattcaat cgggatctgt atcaccaaac + 4021 cctacagcct tgttacaaag taaaaatttt aatgatatga ttgaaacatt gcgtaaatat + 4081 tttgattata tcattgttga tacagcacct attggaattg ttattgatgc ggcaattatc + 4141 actcaaaagt gtgatgcgtc catcttggta acagcaacag gtgaggtgaa taaacgtgat + 4201 gtccaaaaag cgaaacaaca attagaacaa acagagaaac tgtttttagg tgtcattctc + 4261 aataaatttg atgttcaaca tgaaaaatat ggttcttacg gtggctatgg taattacgga + 4321 aaaaaataga atgaagttag ggagtccagt atggaaggaa ggggtttcta caatataact + 4381 ctggcattct tacagagtat acttgttagt ctattagctt atatactgat tgcaatttca + 4441 gaaaccgaca ttgctttaaa tacagtattc gtcctgtttt ttcttcactt tgtagccttt + 4501 tatattagtg gttatggtaa agattttttc aaaagaggtc agtatattga gttggtagaa + 4561 acgataaaat acataatatt ttattccttg ttgatcagct 
tttcaagttt gttcttaaaa + 4621 gaaaaatttg ttatttctag acgaggaatg ctctacttgc ttttcctata tggtgttttg + 4681 aattatctac tcaatttctt tttgaaaagt tattggagaa aattcaccta taatttaaag + 4741 cgcagtcgca agattttatt ggttacggca acatcacgcg tcgaaagagt aatggattgc + 4801 ctgttacttg cgaacgatgt tcaagggaaa ttggttgctg ttagtgtttt agataagcca + 4861 gaatttactc atgaaaagct ccttgttgta ccaaaagaag agttgatttc ctacgctacc + 4921 catgaagtag tagatgaagt ttttgtcaat cttccaagtg aggactatga tattggagcc + 4981 attatttctc agtttgaaac aatggggggt gatgtaacag tcaatctcaa tgcttttgat + 5041 aaaaacttaa gccgaaataa acgaatccat gaaatggcag gattgaatgt agtgaccttc + 5101 tctacgaatt tttacaagcc tagtcatgtc attactaaga ggattcttga tatttgtgga + 5161 gctatcgttg gtctttttat ctgtggaatt gctagtatat tcatagttcc tcagattcga + 5221 aaagatggtg ggtctgcaat cttttcacaa actcgtgtag gaaaaaatgg tcgtcacttt + 5281 accttttata aattccgctc gatgcgagtc gatgcagaag cgatcaagga acagttgatg + 5341 gatcaaaata cgatgcaagg tggtatgttt aagatcgata acgatcctcg agtgacaaag + 5401 attggaaaat ttatccgaaa aactagcttg gatgaattgc cacaattttg gaatgtttta + 5461 attggagaca tgagtctagt aggtacgcgc ccaccaactg tagatgagta cgaaaaatac + 5521 acacctgaac aaaaacgtcg cctaagcttt aaacctggta ttacaggttt gtggcaaatt + 5581 agtggtcgaa gtgaaattac aaacttcgat gaggttgtta agttggatgt ggcttatatc + 5641 gatgattgga ccatttggaa agattttgaa atattgttaa aaactgtaaa agttgtgttg + 5701 atgagagatg gagcgaagta ggaggggtat gacaaatatt aaaattatag ttgcaactca + 5761 taagagtttt gagatgccgc aaaataaaga attgtatttc ccagtccatg tggggtgtga + 5821 aggaaaagat gatttgggat atcaaggaga taatactggg gaaaacattt cccagttaaa + 5881 cccttattac tgtgaattaa caggtttata ttgggcatgg aagaatctag attgcgatta + 5941 tcttggacta gttcattacc gccgatattt cacgaagaaa actcaatttt ataaagaaaa + 6001 tctaaaaatt gatgaagtaa ttttaaatca ggaagaaatt gaattgcttt tgagaaaagg + 6061 agatataata gttcctaaaa aaaggaaata ttatattgaa actctatgtt ctcattatgc + 6121 acacacgcta gatgctagcc atctagattt ggctagaaaa gtcattgaga agcaacaacc + 6181 tgaatacctt gattcatttg ataaagttat gaaacaacgt agtggctata tgtttaatat + 6241 
gtttataatg aaaaaggaat tagcaaataa ttattttgaa tggctgtttc cgattttaga + 6301 ttgtatgttt gatcagatta atctttcaga gttaactgca tttgaggcac gtctttttgg + 6361 tcgtgtaagt gaactattat tcaacgtatg gctagagaag aatttgtatt ctctagtaga + 6421 agttccattt atgtatttgg aaaaggttaa tctagtagaa aaagggaaat cgtttttaat + 6481 ggctaaattt tttggtaaga agtatggaca gagtttttag ggaggaacta attgatttac + 6541 attggtacga tgcttctctc aatgttgata attactttta tcaagtattt tagaatatca + 6601 aaaaaatgga aagaggcagt ttatttttgg ggttttattc ctcttatctt gataggagca + 6661 cttagagctt atgtaggaat agattatacc acatatagtt tggatcagat accggctgta + 6721 ttagctggta gtcagacagt caaatttgaa ttgttagata aattagtagt gtacataggt + 6781 tactatctag ctaatcagca gcattatttc tatatttttg caatatttca cattatcctg + 6841 atgtggtttc tgtataaata tattgttcaa cagtcgtcta atgtaatgtt gagtgtgttt + 6901 tttcttctaa ccactgtttt ttttactttt tctttatcag gaatacgcca atcaatagct + 6961 acagcgattg ttttttatgc gttgaagtat attaaacaaa aaaaaagttt acattatata + 7021 atttatttag ggattgcttg tttatttcat tctagtgcag taatctatat acttttttta + 7081 gttttaggga aaattaatat taataggttc gttggctttg cattaccgat gattgcatca + 7141 ttattttctt tttctgggtc tgaatttgta tctcgaataa tactacattt aaatttttat + 7201 tcagaatacg ttggttctcg ttattataca ggagcatatg ataaacaaca ccaactattc + 7261 acaatcgtta tgtgtttatc ggtatttcta ttatattata ttgttccgaa aaaagagtgg + 7321 gttaatttaa aattatatct gaatattaat tttgtgctat tactagttgc aataatcatg + 7381 ccaatacttc ctactccatc aagaactatt tatatgtttg ttcttgtaca tgttattcta + 7441 attcctaagt tgatttcagt tattaaagat tataggtcta aggtaatcat aacaatgttc + 7501 tttgttttag gttattttat attcttttct ataacggttc tacagaggaa tgcatatgaa + 7561 acactaccgt accacacaat ctttgagtat ttatggtaat tgattatgaa acaaatatta + 7621 atttctatta ttattccatt acataatgga gaagatacga ttattagagc agtaaaaagt + 7681 gttataaata gcagattata tggagatttg attgaaatta ttattgttga aaatggttca + 7741 acagatcaat catttaaaat ttctcaaaaa ttagcgaccg aaaactcaaa tatacgagtc + 7801 ttgaaatcag ataaaggaac cagttttgcc agaaacgtag gaatcgaaaa atctaaagga + 7861 aagtggctta tttttttaga 
tgcagatgat tatttatttg aatcggattt agacgttatt + 7921 gttgaaaatt taataaccaa taatacagat ttatgcgttt ataactacga aaaagggctt + 7981 aagaaaatag aacttttttc agaagaggta gagttgatag atgaccttga ttcttttata + 8041 gttcaatctc tttctgaacc cactaaatat atgacagtat ggggaaaagc gtttaataaa + 8101 aatttgattg atgagtacgg tttgaagttt aatacgaatt tgagagtttc agaagatagt + 8161 gatttttatc tcagatttct tttgctgatt cacagtttaa ctttaacttc tcaaacgcta + 8221 taccattatt caattgattc accttcaacg atgaggacat tttcttcaga taaattagaa + 8281 ggttatattg tttccttgaa tgaaagctca aaagtattag gaaatgttga taatactatt + 8341 caagaagcct ttgagttata taagttggcg cattttaatt taataatggt tagagaagtg + 8401 ttctattttg ataattcaaa aagtttcaga gaaaagataa aggaaatgat tagactttat + 8461 aagatgccta tgttttttga gcctatacaa aatctatctg tatctagtgt tagcaattta + 8521 tcgctagtac ctctattttt tttgaaaata catttgtatc atttagcggc attggtttac + 8581 attattcgag tagggcaaaa caaattcaaa gaaggaagaa aaagttgatg aaaagaattc + 8641 tagtattcgg aatgaatgaa aaccctggtg gagttgaatc ctttataatg aattattttc + 8701 gtgaatttaa tcgcgaaaaa ttagccttag attttttgtg taattcaaat gataaaatag + 8761 cttatgagga tgaacttatt tctaaaggag caagagtttt tcacctgaca gcgagaagta + 8821 aaaatccgat acgttattat tgggaaatgt atagattctt caaagaatat gcatctgatt + 8881 atcaggcaat ttgggttaat attaatagct tagcaaatat tgactattta aaatttgcaa + 8941 gatattttgg tattccggtt cgaattgtac acagccataa tagtcaaaat atggatacca + 9001 aacttcgtga aaaattacat aatcataata gagacaaaat tgaaaagtgg gcaaccgatt + 9061 tctgggcttg ttcgcacgaa gctgcaaaat ggttttataa cgaagaaact attggaaaag + 9121 ttaagattat accaaatgct attaatatga atgcttctat tttttcttct gaggcacgag + 9181 ataaaattcg aattgattat acattagaca ataaatttgt gctaggtcat gtaggacgtt + 9241 tgcattttca gaagaatcaa gaatttatga taagagtttt agctaaatta caggaattta + 9301 gagacgatgt ctgcttagtt ttagttggtc aaggtgaaga tcttaacaaa ttaaagatac + 9361 tggctgagga gctatctatt caggataagg tctactttgt gggagttcag tcgaatatat + 9421 cagaatggtt gagtactttt gacttattct tttttccgtc taattttgaa ggtttaggaa + 9481 tagctgcatt agaggctcaa gtaaatggtc taccgacact 
actctcagaa gaaggtgtac + 9541 caaaggaagt aaaaatcaat gataatactt ttttttatcc attgaaggaa agtgaagaaa + 9601 gctgggcaaa cttccttgat gaaatgattc atacaacaac tcgtttaaat tatgaatata + 9661 tacaagaaaa ttttgagaaa tctggctacg atattaagat agctgctcag aatcttgaaa + 9721 aacaattgct agaattagtt tagggaagat aacatggtta ataatattga ttttgtagtt + 9781 acatgggtta atggaaatga tccagtgtgg cgtgaggaaa aaaagaaata cgaagttcta + 9841 gatggtaggc cgactttaaa tgatgaaaca agatatagag atatggattt gtttcaatat + 9901 tggtttcgag cggtagaaaa acatgcgccc tgggttaata atatttattt cattacatat + 9961 gggcatttac ctgaatggct ggatgcaaat caccctaaat tgaagatagt aaaacatgaa + 10021 gattatattc caaaagaata cttaccgact tttagttcaa atgtaattga actaaatctt + 10081 tttaggatta aggaattgag tgagcagttc gttctgttta gtgatgatgt ttttattaac + 10141 acatttttaa aagaagaaga tttgtttaaa aataacttac ctcgattgtt gagtatatat + 10201 agaccattaa ttccaactaa agaatttgat tatattaatt tcaatcattt attaataatg + 10261 aatagatact ttcatgataa aaaaacatta tcacaacata agggtaaatt ttttaatgta + 10321 ggttatggaa agtttaatct gtataatcta tttagcattt tttattcagg gattattggt + 10381 tatcatgatg ctcatgtcgc tatgcctcat ttgaaaagta cttttgcaga gatttggaat + 10441 aaggaagggg tacttctaga tcgagtttgt aaaaacaaat ttcgttcaac taaagatgtt + 10501 aaccattggt tgatgagcta ttggaatatt gaaacaaatt catttatgcc acagactctt + 10561 cgtgtgggtg aatatgtgcc tctggcttat tcaggtaaaa ttgaatctat tattcacaaa + 10621 caaaagaata agtttttgtg tataaacgac gatgaacata ccgaaaactt cattaacgaa + 10681 gttaactttg ttcgtaaaat atttgagaaa aaatttcctg aaaagtctaa atttgaaaag + 10741 taaaggggaa ctaaattgaa aaaacaaaaa atacttagcg tggtaattcc atcctacaat + 10801 gcggctccat ttttgatgga aactattccg actctagttt ctattagcag cagaaatgat + 10861 attgaggttt tgattgtaaa tgatgggtct aaagatgaga cacttcaagt ggctcagaaa + 10921 ctggaaaaag agtattctgg catagttagt ataattgata aagaaaatgg cggtcatgga + 10981 tctacaatta atgctgggat aagggaagct aaagggaagt actttaaagt tgttgatgct + 11041 gatgattggg tagatagtga aaactttgaa aagcttgtac aatttcttca taaaacagat + 11101 gccgatgaaa ttatctctcc atatacagac gtttttgaag 
atgatggtac aaaggtagaa + 11161 aataactatt ttaaagattg ttcattaaaa ccataccagg attatgatta tgtgaatttt + 11221 ttagaacgga ttcaaatttt acctagaatg cattctataa caataaaaac ctctatttta + 11281 agagataata acataaaaat tgatgagaat atgttctacg ttgacatgga gtatattgtt + 11341 tttccaactc catttatcaa aacaataact tatacgcctg actctgttta tcagtatcgt + 11401 agaggttacg agggacagag tacgagtatt cagaactata taaaaaatag aaaaatggta + 11461 aatcatgtca cattcgcttt gcttgacttt tataataaac acactttatc taatattctg + 11521 gaaaaactag ttaaagagac aattgctaga tgtgttacta ttatgacaaa tgtttgtcta + 11581 tcaatggaag atactaaaca aggtaaaaag gaacttcttg attttgatca gaaattaaaa + 11641 tcaataaatt ctgagttcta ttatcataaa caagggaaaa aagctaaagt tctaagatat + 11701 tcaaattact tcttgtttga cttgttgtct agctactcta agaagtctaa aaaagtatag + 11761 ttgttgtagg agtatatata tgatacataa aattattaat cgattatcac ttacgattca + 11821 acaatgtagt ggcgataaac catttactat caaattagtt aatgcatatg tagaactatt + 11881 aagaaataca aaatctagag aattaagaaa ttatgtaata aagaaacaca ttaaaaaaac + 11941 cacgaatatt tctcaaatta aggaagtttt tctagagaat agtaatactt taatacaaaa + 12001 aactgaattt cctaaattta tctggactat gtggtggcaa ggagaagaga atgcacctga + 12061 gttagtccaa agtacactct attatattag aaaatttgct gaaactaatg gttatacgac + 12121 agtagttatt gataaaaata atatagataa gtatctagta gttcctgaat tcgtatatgc + 12181 aaagttggag aagggtagta taggtgttgc aaatttttca gatttaatcc gatttatgct + 12241 aatggaacaa tatggaggaa tttggttaga ttcaacgatg tatgtccatc cagatttccc + 12301 tattgaaata ttagaaagag aattttcttc gataaatcat agggataatt ccagccaatc + 12361 aatggatgac aatataacaa ataaacgctg ggtttcattt tgtttgagtg gagagaaagg + 12421 gaacattgtt tctcgagcaa tgcgagcttt tttattagat caaattgaaa ataataaagt + 12481 attacctgat tattttataa ttgactttgg tttagattat ctatatgatg aatttgaaga + 12541 gataagggaa ataataaaaa gtatccctag atattctagt caagaagaca tcttttggtt + 12601 gagaatacat agtaaagata gttttaacaa agaagaatgg tataatgaaa cgaaaaaaaa + 12661 atcaactttt caaaagtcgc tataaagaag atgaaacagt gaaagatagt tatttcgact + 12721 atcttgttaa aagaaagtta taaagtaaaa tgaaagtaat 
aaaaaactat gcttacaatc + 12781 tttcatatca attattggta attatactcc ctattattac aacaccttat gtaacacggg + 12841 tttttagttc taatgattta gggacatacg gatactttag ttcgatagtt acttacttta + 12901 ttttgctggc tagtcttggc gttgctaact atggtactaa ggtaatctct ggaaatcgca + 12961 aggagattga aaaaaacttt tgggggattt actcattgca aatgggtgca acgcttcttt + 13021 ctctattctt gtaccttgtt ctttgtttga cccttccttt tatgcaaaat ctagtagcct + 13081 acattcttgg attgagtttg gtttctaaag gtttagatat ttcctggctc tttcaaggtt + 13141 tagaggattt tcgaaagatt actgttcgaa atatcacagt caaactcgtt ggtgtcatct + 13201 ccatctttct ctttgtcaaa tctgcaaacg atctttatct ctatgtcttt ttgttaacca + 13261 tatttgaact ctttggacaa ctcagtatgt ggttgccggc tcgagacttt atcggcaagt + 13321 ttcatgttga tatagaatac gccagacagc atttgaagcc aattatttta ttgttcctac + 13381 cacaagtcgc gatttctttg tatgttacct tagatcgtac catgcttgga gcgcttgctt + 13441 ctacaaaaga cgttggcatc tacgatcaag ccctaaaatt ggtaaatatt cttctaacct + 13501 ttgtaacttc attgggaagt gttatgctgc cacgagtatc tcatctgctt gcgacaggtg + 13561 aacgtaaggc agtaaacaag atgcatgaga tgtctttttt gatttataat ttgcttattt + 13621 ttccgattat ggcggggatt ctgatcgtga atgatgattt cgttcagtta tttctaggac + 13681 aagattttca agatgcacgc tatgcaattg cgattatggt tctcaggatg ttctttattg + 13741 gttggactaa tataatggga actcagatgt tgatccccca taaccaaaat aaagaattta + 13801 tgatttcaac aacagctcca gccattatta gcgttggatt gaatctatta ttcctaccca + 13861 agttaggtta tataggagca gccattgtct ctgttttgac agaggcgcta gtttgggtaa + 13921 ttcaattatt ctatactcgc agatatttaa aagaagttcc tataatcgga tcaatgtcaa + 13981 aaattatact agcatctgcc attatgtatg gccttttact aagttcaaaa acagttatac + 14041 atttttcatc gaccttaaat gttctagcat ttgcagcgct tggtggaatc atttatattt + 14101 ttgcaattct atctctgaaa gtggtagatg tgaaagaatt aaaacaaatt attaggaaaa + 14161 actagaatga gaaaaaatcg aaatattaac ctagatttac taaaagtgct tgcatgtgtt + 14221 ggagttgttt tacttcatac aacaatgggc ggatttaaag agacaggctc atggaatctt + 14281 ttggcatatt tatattattt aggtacttac tctattcccc tgttttttat ggtcaatggt + 14341 tatttattgt taggcaagag ggagataact tatctttaca 
tactccagaa agtaaaatgg + 14401 attttaataa cagtgtcatc atggtcgttt atcgtatggc tttttaagcg tgattttaca + 14461 actaatccta ttaaaaaaat tgtaggttct ttgatacaaa gaggttattt ctttcagttt + 14521 tggtttttcg gtgcactaat acttatctat ttatgtttgc caattttgag acaatttcta + 14581 aattcaaaaa gaagctattt atacagttta tctttattga tgactattgg tttgattttt + 14641 gagttatcaa atatcctact tcaaatgcca atacaaacat atgtaataca aacttttaga + 14701 ttatggacgt ggttttttta ctatctttta ggtggttata tagcgcaatt cactatagaa + 14761 gaaatcgaat caaggtttaa gaattggatg aaaatagtta gcatactttt gttattgatt + 14821 tcaccaataa tattattttt catagcgaag actatatacc ataatctatt tgctgaatac + 14881 ttttatgata ctttatttgt aaaagtcagt actttaggaa tttttctaac tatcctcatg + 14941 cttactttga atgaaagccg aagagaatcg attgtttccc tttctaatca aacaatgggg + 15001 gttttcataa tacatactta tattatgaaa gtgtgggaaa aagtgcttgg ttttaatttt + 15061 gtaggagcat atttactttt tgctctattt actttaagtg ttagttttat tattgttggg + 15121 atgttaatga agattcctta cttcaatcga atcgtcaaat tataaaaagg agaacaagat + 15181 gtacgattat cttattgtcg gtgctggttt gtcaggagca atttttgctt atgaggcgac + 15241 taagcgtgga aaaaaagtaa aagtgattga taaacgtgac cacattggtg ggaatatcta + 15301 ctgtgagaat ctagaaggag ttaatgttca taaatatggt gcccatatct ttcatacttc + 15361 taataagaaa gtttgggatt atgttaatca atttgctgaa tttaacaact acgtcaactc + 15421 gcctgtagct aattacaagg gtagcctcta taatctacct ttcaatatga ataccttcta + 15481 tgctatgtgg gggacaaaaa ctcctcaaga agtcaaagat aagattgctg agcagacagc + 15541 tgatatgaag gatgttgagc cgaaaaatct ggaagaacaa gctatcaagc tgattggtcc + 15601 agatatctac gaaaaattga tcaagggtta tactgaaaag cagtgggggc gctcagcaac + 15661 agaacttcct ccatttatca ttaaacgact tccagttcgt ctaacatttg ataataacta + 15721 ttttaatgac cgttaccaag gaattcctat tggtggttat aatgtgatta ttgaaaatat + 15781 gcttaaagac gtagaagttg aacttgaagt agatttcttt gctcaccgtg aagggttgga + 15841 agcatctgct gaaaaagttg tcttcacagg aatgatcgac caatattttg actacaaaca + 15901 cggagagtta gaataccgta gccttcgttt tgagcatgag attttagacg aggaaaatta + 15961 tcaaggaaat gctgtagtga actatacgga gcgtgagatt 
ccttatactc gtattatcga + 16021 acacaagcat tttgaatatg gaacgcaggc aaagacagtt atcacgcgtg aatatccagc + 16081 tgactggaag cgtggggacg agccttacta tccgatcaac gatgagaaaa ataatgctat + 16141 gtttgctaag taccaagagg aagcttcaaa gaatgataag gttattttct gtggacgttt + 16201 agcagattat aaatattatg atatgcatgt ggtgattgaa cgggcgcttg aggttgtgga + 16261 gaaagagttt ggatatgaca aaaagtagaa tcaattggat agattttgga aaaggctttt + 16321 ccatattttt agtcttagca gggcatgtgt tgcttggact gtatcaatcg gaaaaatttc + 16381 ccacagcaaa taacatacta tcgttgttga tagcacaagt ctacatattt catataccag + 16441 tattttttgc cttatcagga tactttttca aacctgtgtc ggatttgaag gagttctggc + 16501 aatatgctaa aaagaagaca attgtttttg gtctgccata tattttctat tcgatcattc + 16561 actttggtct tcaaaaagtt gcaggggcat ctgttcgtgt tcctacaacc atatctgatt + 16621 tgctaaatat ctataaagat cctcttggag tttcgtggta tttatatata ctctggtcga + 16681 ttttgataat ctatggatta ttgtctattt tagtcaaaaa tcgtagaatg ttatttttga + 16741 taagtgtttt cgcttattgt ttaaccctat ttgttcaaac agatatttat attattcaaa + 16801 gaacgctagt ttgggggctt tgtttctttc ttggcagtgt attgaatgaa attcactttg + 16861 ataaaattaa tttgaaaaaa tttctttttt tatttgtgct atttgatttt atttatatgt + 16921 tcgcttggtt cttgttttat gaagtagggt ctaagaagga ttatgtaagc tatagtaact + 16981 caggtttgtg ggggattgct tttgttgtct gtgtattagt tgcttttgcg atttttccga + 17041 aaatggagaa aaattttcct aaaactttcc tatatttcac taaatacggg aaagatagtt + 17101 tagggattta tattcttcat gcaccaattt gtagcatgat tcggattcta atgttgaaag + 17161 tgggaataaa ctcagttttt cttcacgttg ttgttgggat tgtgctaggc tggtatttat + 17221 ccatactagc aacttatata ttgaaaaaaa ttccattttt gaatattgtt ttattaccac + 17281 aaaagtatat taaattaaaa ggctctttgt caactgtagt gggttgaagt cagctaagct + 17341 cgagaaagga caaattttgt cctttctttt ttgatattca gggcgataaa aatccgtttt + 17401 ttgaagtttt caaaggtaag cgcgtcataa caaggtattt atcattcatg gaagacctcc + 17461 tgtatactat tagtaaagta aaactattgg aggatattgt aatgccacaa cctattgttc + 17521 ctgtagagat tccacaatct cgtcgttttg attctaaaaa gagaaatgat attctgctta + 17581 aaattcgtat tggcaagctt gaagtaagtt tttttcaatc 
tctcaatctc gaaatgatag + 17641 aacagctttt ggataaggtg ttgctctatg acaattcatc tatctagcct agggcaggtc + 17701 tatctcgtat gtgggaaaac ggatatgagg caaggcattg attcactggc ttatctggtt + 17761 aaaacccact ttgaattaga tcctttctca ggtcaagttt ttctcttttg tggtggacgt + 17821 aaagaccgct ttaaagccct ttactgggat ggtcaaggat tttggctatt atagtggatt + 17881 taaactagaa tagtacacct ctgcttctaa aacattgtta gaaatcgatt tgactgtcct + 17941 gttcttattt cattttacta taaattcatc agaaagtcgt gatttctatt gaaatgagga + 18001 ctttcttttt atactcatct gctt +// + diff --git a/public/res/serotype_genbank/serotype_20B.gb b/public/res/serotype_genbank/serotype_20B.gb new file mode 100644 index 0000000..a94a74c --- /dev/null +++ b/public/res/serotype_genbank/serotype_20B.gb @@ -0,0 +1,542 @@ +LOCUS JQ653093 17586 bp DNA linear BCT 15-NOV-2023 +DEFINITION Streptococcus pneumoniae strain 5931-06 CPS gene locus, complete + sequence. +ACCESSION JQ653093 +VERSION JQ653093.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 17586) + AUTHORS Calix,J.J., Porambo,R.J., Brady,A.M., Larson,T.R., Yother,J., + Abeygunwardana,C. and Nahm,M.H. + TITLE Biochemical, Genetic, and Serological Characterization of Two + Capsule Subtypes among Streptococcus pneumoniae Serotype 20 + Strains: DISCOVERY OF A NEW PNEUMOCOCCAL SEROTYPE + JOURNAL J. Biol. Chem. 287 (33), 27885-27894 (2012) + PUBMED 22736767 +REFERENCE 2 (bases 1 to 17586) + AUTHORS Calix,J.J. and Brady,A.M. 
+ TITLE Direct Submission + JOURNAL Submitted (09-FEB-2012) Department of Microbiology, University of + Alabama at Birmingham, 845 19th Street South, Birmingham, AL 35294, + USA +FEATURES Location/Qualifiers + source 1..17586 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="5931-06" + /serotype="20 beta" + /isolation_source="clinical isolate" + /db_xref="taxon:1313" + misc_feature 1..17586 + /note="CPS gene locus" + misc_feature <1..125 + /note="similar to transposase" + mobile_element <1..125 + /mobile_element_type="insertion sequence:IS630" + CDS 338..1783 + /note="Wzg" + /codon_start=1 + /transl_table=11 + /product="CpsA" + /protein_id="AFN40458.1" + /translation="MSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLLFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVVVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIELEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSALHGKFYFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + CDS 1785..2516 + /note="Wzh" + /codon_start=1 + /transl_table=11 + /product="CpsB" + /protein_id="AFN40459.1" + /translation="MIDIHSHIVFDVDDGPKSIEESKALLREAYNQGVRMIVSTSHRR + KGMFETPEEKIATNFIKVREIAKEVADDLVIAYGAEIYYTLDALEKLEKKEIPTLNDS + RYALIEFSMHTSYREIHAGLSNILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QINSYHVLKPKFFGEKYKFMKKRARYFLERDLVHVVASDMHNLDSRPPYMQQAYDIIA + KKYGAKKAKEFFVDNPRKIIMDQLI" + CDS 2525..3217 + /note="Wzd" + /codon_start=1 + /transl_table=11 + /product="CpsC" + /protein_id="AFN40460.1" + /translation="MKEQNTLEIDVLQLFRTLWKRKLVILLVAIITSSVAFAYSTFVI + KPEFTSTTRIYVVNRNQEEKSGLTNQDLQAGSYLVKDYREIILSQDVLEEVISDLKLD + LTPKGLANKIKVTVPVDTRIVSVSVNDRVPEEASRIANSLREVAAQKIISITRVSDVT + TLEEARPAISPSSPNIKRNTLIGFLAGGIGTSVIVFLLELLDTHVKRPEDIEDTLQMT + LLGVVPNLSKLK" + CDS 3227..3910 + /note="Wze" + 
/codon_start=1 + /transl_table=11 + /product="CpsD" + /protein_id="AFN40461.1" + /translation="MPTLEIAQKKLEFIKKAEEYYNALCTNIQLSGDKLKVISVTSVN + PGEGKTTTSVNIARSFARAGYKTLLIDGDTRNSVISGVFKSREKITGLTEFLSGTADL + SHGLCDTNIENLFVIQSGSVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTAPIGIVI + DAAIITQKCDASILVTATGEVNKRDVQKAKQQLEQTEKLFLGVILNKFDVQHEKYGSY + GGYGNYGKK" + CDS 3932..5302 + /note="CpsE; glycosyl transferase" + /codon_start=1 + /transl_table=11 + /product="WchA" + /protein_id="AFN40462.1" + /translation="MEGRGFYNITLAFLQSILVSLLAYILIAISETDIALNTVFVLFF + LHFVAFYISGYGKDFFKRGQYIELVETIKYIIFYSLLISFSSLFLKEKFVISRRGMLY + LLFLYGVLNYLLNFFLKSYWRKFTYNLKRSRKILLVTATSRVERVMDCLLLANDVQGK + LVAVSVLDKPEFTHEKLLVVPKEELISYATHEVVDEVFVNLPSEDYDIGAIISQFETM + GVDVTVNLNAFDKNLSRNKRIHEMAGLNVVTFSTNFYKPSHVITKRILDICGAIVGLF + ICGIASIFIVPQIRKDGGSAIFSQTRVGKNGRHFTFYKFRSMRVDAEAIKEQLMDQNT + MQGGMFKIDNDPRVTKIGKFIRKTSLDELPQFWNVLIGDMSLVGTRPPTVDEYEKYTP + EQKRRLSFKPGITGLWQISGRSEITNFDEVVKLDVAYIDDWTIWKDFEILLKTVKVVL + MRDGAK" + CDS 5310..6101 + /note="glycosyl transferase" + /codon_start=1 + /transl_table=11 + /product="WciB" + /protein_id="AFN40463.1" + /translation="MTNIKIIVATHKSFEMPQNKELYFPVHVGCEGKDDLGYQGDNTG + ENISQLNPYYCELTGLYWAWKNLDCDYLGLVHYRRYFTKKTQFYKENLKIDEVILNQE + EIELLLRKGDIIVPKKRKYYIETLCSHYAHTLDASHLDLARKVIEKQQPEYLDSFDKV + MKQRSGYMFNMFIMKKELANNYFEWLFPILDCMFDQINLSELTAFEARLFGRVSELLF + NVWLEKNLYSLVEVPFMYLEKVNLVEKGKSFLMAKFFGKKYGQSF" + CDS 6113..7180 + /note="polymerase" + /codon_start=1 + /transl_table=11 + /product="Wzy" + /protein_id="AFN40464.1" + /translation="MIYIGTMLLSMLIITFIKYFRISKKWKEAVYFWGFIPLILIGAL + RAYVGIDYTTYSLDQIPAVLAGSQTVKFELLDKLVVYIGYYLANQQHYFYIFAIFHII + LMWFLYKYIVQQSSNVMLSVFFLLTTVFFTFSLSGIRQSIATAIVFYALKYIKQKKSL + HYIIYLGIACLFHSSAVIYILFLVLGKININRFVGFALPMIASLFSFSGSEFVSRIIL + HLNFYSEYVGSRYYTGAYDKQHQLFTIVMCLSVFLLYYIVPKKEWVNLKLYLNINFVL + LLVAIIMPILPTPSRTIYMFVLVHVILIPKLISVIKDYRSKVIITMFFVLGYFIFFSI + TVLQRNAYETLPYHTIFEYLW" + CDS 7181..8209 + /note="putative glycosyl transferase" + /codon_start=1 + /transl_table=11 + 
/product="WhaJ" + /protein_id="AFN40465.1" + /translation="MIMKQILISIIIPLHNGEDTIIRAVKSVINSRLYGDLIEIIIVE + NGSTDQSFKISQKLATENSNIRVLKSDKGTSFARNVGIEKSKGKWLIFLDADDYLFES + DLDVIVENLITNNTDLCVYNYEKGLKKIELFSEEVELIDDLDSFIVQSLSEPTKYMTV + WGKAFNKNLIDEYGLKFNTNLRVSEDSDFYLRFLLLIHSLTLTSQTLYHYSIDSPSTM + RTFSSDKLEGYIVSLNESSKVLGNVDNTIQEAFELYKLAHFNLIMVREVFYFDNSKSF + REKIKEMIRLYKMPMFFEPIQNLSVSSVSNLSLVPLFFLKIHLYHLAALVYIIRVGQN + KFKEGRKS" + CDS 8209..9324 + /note="putative glycosyl transferase" + /codon_start=1 + /transl_table=11 + /product="WciL" + /protein_id="AFN40466.1" + /translation="MKRILVFGMNENPGGVESFIMNYFREFNREKLALDFLCNSNDKI + AYEDELISKGARVFHLTARSKNPIRYYWEMYRFFKEYASDYQAIWVNINSLANIDYLK + FARYFGIPVRIVHSHNSQNMDTKLREKLHNHNRDKIEKWATDFWACSHEAAKWFYNEE + TIGKVKIIPNAINMNASIFSSEARDKIRIDYTLDNKFVLGHVGRLHFQKNQEFMIRVL + AKLQEFRDDVCLVLVGQGEDLNKLKILAEELSIQDKVYFVGVQSNISEWLSTFDLFFF + PSNFEGLGIAALEAQVNGLPTLLSEEGVPKEVKINDNTFFYPLKESEESWANFLDEMI + HTTTRLNYEYIQENFEKSGYDIKIAAQNLEKQLLELV" + CDS 9335..10324 + /note="glycosyl transferase" + /codon_start=1 + /transl_table=11 + /product="WcwK" + /protein_id="AFN40467.1" + /translation="MVNNIDFVVTWVNGNDPVWREEKKKYEVLDGRPTLNDETRYRDM + DLFQYWFRAVEKHAPWVNNIYFITYGHLPEWLDANHPKLKIVKHEDYIPKEYLPTFSS + NVIELNLFRIKELSEQFVLFSDDVFINTFLKEEDLFKNNLPRLLSIYRPLIPTKEFDY + INFNHLLIMNRYFHDKKTLSQHKGKFFNVGYGKFNLYNLFSIFYSGIIGYHDAHVAMP + HLKSTFAEIWNKEGVLLDRVCKNKFRSTKDVNHWLMSYWNIETNSFMPQTLRVGEYVP + LAYSGKIESIIHKQKNKFLCINDDEHTENFINEVNFVRKIFEKKFPEKSKFEK" + CDS 10337..11341 + /note="putative glycosyl transferase" + /codon_start=1 + /transl_table=11 + /product="WciD" + /protein_id="AFN40468.1" + /translation="MKKQKILSVVIPSYNAAPFLMETIPTLVSISSRNDIEVLIVNDG + SKDETLQVAQKLEKEYSGIVSIIDKENGGHGSTINAGIREAKGKYFKVVDADDWVDSE + NFEKLVQFLHKTDADEIISPYTDVFEDDGTKVENNYFKDCSLKPYQDYDYVNFLERIQ + ILPRMHSITIKTSILRDNNIKIDENMFYVDMEYIVFPTPFIKTITYTPDSVYQYRRGY + EGQSTSIQNYIKNRKMVNHVTFALLDFYNKHTLSNILEKLVKETIARCVTIMTNVCLS + MEDTKQGKKELLDFDQKLKSINSEFYYHKQGKKAKVLRYSNYFLFDLLSSYSKKSKKV + " + CDS 11361..12323 + 
/note="putative glycosyl transferase" + /codon_start=1 + /transl_table=11 + /product="WhaF" + /protein_id="AFN40469.1" + /translation="MIHKIINRLSLTIQQCSGDKPFTIKLVNAYVELLRNTKSRELRN + YVIKKHIKKTTNISQIKEVFLENSNTLIQKTEFPKFIWTMWWQGEENAPELVQSTLYY + IRKFAETNGYTTVVIDKNNIDKYLVVPEFVYAKLEKGSIGVANFSDLIRFMLMEQYGG + IWLDSTMYVHPDFPIEILEREFSSINHRDNSSQSMDDNITNKRWVSFCLSGEKGNIVS + RAMRAFLLDQIENNKVLPDYFIIDFGLDYLYDEFEEIREIIKSIPRYSSQEDIFWLRI + HSKDSFNKEEWYNETKKNQLFKSSYKEDETVKDSYFDYLVKRKL" + CDS 12330..13745 + /note="flippase" + /codon_start=1 + /transl_table=11 + /product="Wzx" + /protein_id="AFN40470.1" + /translation="MKVIKNYAYNLSYQLLVIILPIITTPYVTRVFSSNDLGTYGYFS + SIVTYFILLASLGVANYGTKVISGNRKEIEKNFWGIYSLQMGATLLSLFLYLVLCLTL + PFMQNLVAYILGLSLVSKGLDISWLFQGLEDFRKITVRNITVKLVGVISIFLFVKSAN + DLYLYVFLLTIFELFGQLSMWLPARDFIGKFHVDIEYARQHLKPIILLFLPQVAISLY + VTLDRTMLGALASTKDVGIYDQALKLVNILLTFVTSLGSVMLPRVSHLLATGERKAVN + KMHEMSFLIYNLLIFPIMAGILIVNDDFVQLFLGQDFQDARYAIAIMVLRMFFIGWTN + IMGTQMLIPHNQNKEFMISTTAPAIISVGLNLLFLPKLGYIGAAIVSVLTEALVWVIQ + LFYTRRYLKEVPIIGSMSKIILASAIMYGLLLSSKTVIHFSSTLNVLAFAALGGIIYI + FAILSLKVVDVKELKQIIRKN" + CDS 13747..14745 + /note="putative O-acetyl transferase" + /codon_start=1 + /transl_table=11 + /product="WciG" + /protein_id="AFN40471.1" + /translation="MRKNRNINLDLLKVLACVGVVLLHTTMGGFKETGSWNLLAYLYY + LGTYSIPLFFMVNGYLLLGKREITYLYILQKVKWILITVSSWSFIVWLFKRDFTTNPI + KKIVGSLIQRGYFFQFWFFGALILIYLCLPILRQFLNSKRSYLYSLSLLMTIGLIFEL + SNILLQMPIQTYVIQTFRLWTWFFYYLLGGYIAQFTIEEIESRFKNWMKIVSILLLLI + SPIILFFIAKTIYHNLFAEYFYDTLFVKVSTLGIFLTILMLTLNESRRESIVSLSNQT + MGVFIIHTYIMKVWEKVLGFNFVGAYLLFALFTLSVSFIIVGMLMKIPYFNRIVKL" + CDS 14759..15868 + /note="galactofuranose mutase" + /codon_start=1 + /transl_table=11 + /product="Glf" + /protein_id="AFN40472.1" + /translation="MYDYLIVGAGLSGAIFAYEATKRGKKVKVIDKRDHIGGNIYCEN + LEGVNVHKYGAHIFHTSNKKVWDYVNQFAEFNNYVNSPVANYKGSLYNLPFNMNTFYA + MWGTKTPQEVKDKIAEQTADMKDVEPKNLEEQAIKLIGPDIYEKLIKGYTEKQWGRSA + TELPPFIIKRLPVRLTFDNNYFNDRYQGIPIGGYNVIIENMLKDVEVELEVDFFAHRE + 
GLEASAEKVVFTGMIDQYFDYKHGELEYRSLRFEHEILDEENYQGNAVVNYTEREIPY + TRIIEHKHFEYGTQAKTVITREYPADWKRGDEPYYPINDEKNNAMFAKYQEEASKNDK + VIFCGRLADYKYYDMHVVIERALEVVEKEFGYDKK" + CDS 15855..16907 + /note="putative O-acetyl transferase" + /codon_start=1 + /transl_table=11 + /product="WcjE" + /protein_id="AFN40473.1" + /translation="MTKSRINWIDFGKGFSIFLVLAGHVLLGLYQSEKFPTANNILSL + LIAQVYIFHIPVFFALSGYFFKPVSDLKEFWQYAKKKTIVFGLPYIFYSIIHFGLQKV + AGASVRVPTTISDLLNIYKDPLGVSWYLYILWSILIIYGLLSILVKNRRMLFLISVFA + YCLTLFVQTDIYIIQRTLVWGLCFFLGSVLNEIHFDKINLKKFLFLFVLFDFIYMFAW + FLFYEVGSKKDYVSYSNSGLWGIAFVVCVLVAFAIFPKMEKNFPKTFLYFTKYGKDSL + GIYILHAPICSMIRILMLKVGINSVFLHVVVGIVLGWYLSILATYILKKIPFLNIVLL + PQKYIKLKGSLSTVVG" + mobile_element 16923..>17586 + /mobile_element_type="insertion sequence:IS1761" + misc_feature 16923..17454 + /note="similar to transposase" +ORIGIN + 1 taaatggtat tacgtgagat ttggaaaacg tgtgatgctt ctgttatact acctgttcgc + 61 tcacaataag agagaacttt tttacgaaaa tctattgaat atgccataaa aagattatac + 121 cacattgtgt actatattag attgaaacta gaatagtaca catctgcttc taaaacattg + 181 ttagaaatcg atttgactgt ccttatttca ttttattata tttttggttc gcgggaagtc + 241 tactaagata cttaaagatg cagatagtaa aaaaaatgta gacattaccg taaaaaagtg + 301 atataatcgt atgatgttca aggtataggt gttaatcatg agtagacgtt ttaaaaaatc + 361 aggttcacag aaagtgaagc gaagtgttaa tatcgttttg ctgactattt atttattgtt + 421 agtttgtttt ttattgttct taatctttaa gtacaatatc cttgctttta gatatcttaa + 481 cctagtggta actgcgttag tcctactagt tgccttggta gggctactct tgattatcta + 541 taaaaaagct gaaaagttta ctatttttct gttgctgttc tctatccttg tcagctctgt + 601 gtcgctcttt gcagtacagc agtttgttgg actgaccaat cgtttaaatg cgacttctaa + 661 ttactcagaa tattcaatca gtgtcgttgt tttagcagat agtgatatcg aaaatgttac + 721 gcaactgacg agtgtgacag caccgactgg gactgataat gaaaatattc aaaaactact + 781 agctgatatt aagtcaagtc agaataccga tttgacggtc aaccagagtt cgtcttactt + 841 ggcagcttac aagagtttga ttgcagggga gactaaggcc attgtcctaa atagtgtctt + 901 tgaaaacatc atcgagttag agtatccaga ctacgcatcg aagataaaaa agatttatac + 961 
caagggattc actaaaaaag tagaagctcc taagacgtct aagaatcagt ctttcaatat + 1021 ctatgttagt ggaattgaca cctatggtcc tattagttcg gtgtcgcgat cagatgtcaa + 1081 tatcctgatg actgtcaatc gagataccaa gaaaatcctc ttgaccacaa cgccacgtga + 1141 tgcctatgta ccaatcgcag atggtggaaa taatcaaaaa gataaattaa cccatgcagg + 1201 catttatgga gttgattcgt ccattcacac cttagaaaat ctctatggag tggatatcaa + 1261 ttactatgtg cgattgaact tcacttcttt cttgaaaatg attgacttat tgggaggggt + 1321 agatgttcat aatgatcaag agttttcagc tctacatggg aagttctatt tcccagtagg + 1381 gaatgtccat ctagactctg agcaggctct aggttttgta cgtgaacgct actcactagc + 1441 cgatggagac cgtgaccgtg gtcgcaacca acaaaaggtg attgtggcta tccttcaaaa + 1501 attaacgtca accgaagcac tgaaaaatta tagtacgatc attaatagct tgcaagattc + 1561 tatccaaaca aatatgccac ttgagactat gataaatttg gtcaatgctc agttagaaag + 1621 tggagggaat tataaagtaa attctcaaga tttaaaaggt acaggtcgga cggatcttcc + 1681 ttcttatgca atgccagaca gtaacctcta tgtgatggaa atagatgata gtagtttagc + 1741 tgtagttaaa gcagctatac aggatgtgat ggagggtaga tgaaatgata gacatccatt + 1801 cgcatatcgt ttttgatgta gatgacggtc ccaagtcaat agaggaaagc aaggcacttt + 1861 taagagaagc ttataatcaa ggagttcgaa tgattgtgtc tacttcgcat cgtcgaaaag + 1921 ggatgtttga aactccagaa gaaaaaattg caacaaattt tattaaggtt cgtgaaattg + 1981 caaaagaagt agcagatgat ttagtcatag cttatggcgc agagatatac tatactctgg + 2041 atgctctaga aaagctagaa aaaaaagaaa ttcctaccct taatgatagt cgttatgctt + 2101 tgattgagtt tagcatgcat acttcctatc gtgagattca tgcgggattg agcaatattt + 2161 tgatgttggg aatcacgcca gtaattgctc atattgaacg ttatgatgcc ttagagaata + 2221 acgaaaaacg tgttcgtgaa ctgattgata tggggtgcta tactcagata aatagttatc + 2281 atgttttaaa acctaagttc tttggtgaaa aatataaatt catgaaaaag agagctcggt + 2341 attttttgga acgtgattta gttcatgtag ttgcaagtga catgcacaat ttagacagta + 2401 gacctccata tatgcaacag gcatatgata tcattgctaa gaaatatgga gcgaaaaaag + 2461 cgaaagaatt ttttgtagat aatcccagaa aaattataat ggatcaatta atttaggaga + 2521 aaatatgaag gaacaaaaca ctttggaaat cgatgtattg caactattca gaactttatg + 2581 gaaaagaaag ttggtcattt 
tattagtggc aattataact tcttcagttg cttttgccta + 2641 cagtactttt gttatcaaac ctgagtttac tagtacgact cggatttatg tagttaaccg + 2701 taatcaggaa gagaagtctg gtttaaccaa tcaagacttg caggcaggat catacttggt + 2761 caaagactat cgtgaaatta tcctatcgca ggatgttttg gaggaagtta tttctgattt + 2821 gaaactagat ttgacgccaa aaggtttggc taataaaatt aaagtaacag taccagttga + 2881 tacccgtatt gtctctgttt cagttaatga tcgagttcct gaagaggcaa gccgtatcgc + 2941 taactctttg agagaagtag ctgctcaaaa aattatcagt attactcgtg tttctgatgt + 3001 gacaacactg gaggaagcaa gaccggcgat atcaccatct tcgccaaata ttaaacgcaa + 3061 tacactaatt ggttttttgg caggggggat tggaactagt gttatagttt ttcttcttga + 3121 acttttggac actcatgtga aacgtccgga agatatcgaa gatacactgc agatgacact + 3181 tttgggagtt gtaccaaact tgagtaagtt gaaataggag agaggaatgc cgacattaga + 3241 aatagcacaa aaaaaactgg agttcattaa gaaggcagaa gaatattaca atgccttgtg + 3301 tacaaatata cagttgagcg gagataaact aaaagtaatt tccgttactt ctgttaaccc + 3361 tggggaagga aaaacaacta cttccgtaaa tatagcaagg tcgtttgcgc gtgcaggcta + 3421 taaaactctt ttgatcgatg gcgatactcg aaattcagtt atatcaggag tttttaaatc + 3481 gcgtgaaaaa attacagggc taacagaatt tttatctggg acagctgatt tatctcacgg + 3541 tttatgtgat acaaatattg aaaatttatt tgtaattcaa tcgggatctg tatcaccaaa + 3601 ccctacagcc ttgttacaaa gtaaaaattt taatgatatg attgaaacat tgcgtaaata + 3661 ttttgattat atcattgttg atacagcacc tattggaatt gttattgatg cggcaattat + 3721 cactcaaaag tgtgatgcgt ccatcttggt aacagcaaca ggtgaggtga ataaacgtga + 3781 tgtccaaaaa gcgaaacaac aattagaaca aacagagaaa ctgtttttag gtgtcattct + 3841 caataaattt gatgttcaac atgaaaaata tggttcttac ggtggctatg gtaattacgg + 3901 aaaaaaatag aatgaagtta gggagtccag tatggaagga aggggtttct acaatataac + 3961 tctggcattc ttacagagta tacttgttag tctattagct tatatactga ttgcaatttc + 4021 agaaaccgac attgctttaa atacagtatt cgtcctgttt tttcttcact ttgtagcctt + 4081 ttatattagt ggttatggta aagatttttt caaaagaggt cagtatattg agttggtaga + 4141 aacgataaaa tacataatat tttattcctt gttgatcagc ttttcaagtt tgttcttaaa + 4201 agaaaaattt gttatttcta gacgaggaat gctctacttg 
cttttcctat atggtgtttt + 4261 gaattatcta ctcaatttct ttttgaaaag ttattggaga aaattcacct ataatttaaa + 4321 gcgcagtcgc aagattttat tggttacggc aacatcacgc gtcgaaagag taatggattg + 4381 cctgttactt gcgaacgatg ttcaagggaa attggttgct gttagtgttt tagataagcc + 4441 agaatttact catgaaaagc tccttgttgt accaaaagaa gagttgattt cctacgctac + 4501 ccatgaagta gtagatgaag tttttgtcaa tcttccaagt gaggactatg atattggagc + 4561 cattatttct cagtttgaaa caatgggggt tgatgtaaca gtcaatctca atgcttttga + 4621 taaaaactta agccgaaata aacgaatcca tgaaatggca ggattgaatg tagtgacctt + 4681 ctctacgaat ttttacaagc ctagtcatgt cattactaag aggattcttg atatttgtgg + 4741 agctatcgtt ggtcttttta tctgtggaat tgctagtata ttcatagttc ctcagattcg + 4801 aaaagatggt gggtctgcaa tcttttcaca aactcgtgta ggaaaaaatg gtcgtcactt + 4861 taccttttat aaattccgct cgatgcgagt cgatgcagaa gcgatcaagg aacagttgat + 4921 ggatcaaaat acgatgcaag gtggtatgtt taagatcgat aacgatcctc gagtgacaaa + 4981 gattggaaaa tttatccgaa aaactagctt ggatgaattg ccacaatttt ggaatgtttt + 5041 aattggagac atgagtctag taggtacgcg cccaccaact gtagatgagt acgaaaaata + 5101 cacacctgaa caaaaacgtc gcctaagctt taaacctggt attacaggtt tgtggcaaat + 5161 tagtggtcga agtgaaatta caaacttcga tgaggttgtt aagttggatg tggcttatat + 5221 cgatgattgg accatttgga aagattttga aatattgtta aaaactgtaa aagttgtgtt + 5281 gatgagagat ggagcgaagt aggaggggta tgacaaatat taaaattata gttgcaactc + 5341 ataagagttt tgagatgccg caaaataaag aattgtattt cccagtccat gtggggtgtg + 5401 aaggaaaaga tgatttggga tatcaaggag ataatactgg ggaaaacatt tcccagttaa + 5461 acccttatta ctgtgaatta acaggtttat attgggcatg gaagaatcta gattgcgatt + 5521 atcttggact agttcattac cgccgatatt tcacgaagaa aactcaattt tataaagaaa + 5581 atctaaaaat tgatgaagta attttaaatc aggaagaaat tgaattgctt ttgagaaaag + 5641 gagatataat agttcctaaa aaaaggaaat attatattga aactctatgt tctcattatg + 5701 cacacacgct agatgctagc catctagatt tggctagaaa agtcattgag aagcaacaac + 5761 ctgaatacct tgattcattt gataaagtta tgaaacaacg tagtggctat atgtttaata + 5821 tgtttataat gaaaaaggaa ttagcaaata attattttga atggctgttt ccgattttag + 5881 
attgtatgtt tgatcagatt aatctttcag agttaactgc atttgaggca cgtctttttg + 5941 gtcgtgtaag tgaactatta ttcaacgtat ggctagagaa gaatttgtat tctctagtag + 6001 aagttccatt tatgtatttg gaaaaggtta atctagtaga aaaagggaaa tcgtttttaa + 6061 tggctaaatt ttttggtaag aagtatggac agagttttta gggaggaact aattgattta + 6121 cattggtacg atgcttctct caatgttgat aattactttt atcaagtatt ttagaatatc + 6181 aaaaaaatgg aaagaggcag tttatttttg gggttttatt cctcttatct tgataggagc + 6241 acttagagct tatgtaggaa tagattatac cacatatagt ttggatcaga taccggctgt + 6301 attagctggt agtcagacag tcaaatttga attgttagat aaattagtag tgtacatagg + 6361 ttactatcta gctaatcagc agcattattt ctatattttt gcaatatttc acattatcct + 6421 gatgtggttt ctgtataaat atattgttca acagtcgtct aatgtaatgt tgagtgtgtt + 6481 ttttcttcta accactgttt tttttacttt ttctttatca ggaatacgcc aatcaatagc + 6541 tacagcgatt gttttttatg cgttgaagta tattaaacaa aaaaaaagtt tacattatat + 6601 aatttattta gggattgctt gtttatttca ttctagtgca gtaatctata tacttttttt + 6661 agttttaggg aaaattaata ttaataggtt cgttggcttt gcattaccga tgattgcatc + 6721 attattttct ttttctgggt ctgaatttgt atctcgaata atactacatt taaattttta + 6781 ttcagaatac gttggttctc gttattatac aggagcatat gataaacaac accaactatt + 6841 cacaatcgtt atgtgtttat cggtatttct attatattat attgttccga aaaaagagtg + 6901 ggttaattta aaattatatc tgaatattaa ttttgtgcta ttactagttg caataatcat + 6961 gccaatactt cctactccat caagaactat ttatatgttt gttcttgtac atgttattct + 7021 aattcctaag ttgatttcag ttattaaaga ttataggtct aaggtaatca taacaatgtt + 7081 ctttgtttta ggttatttta tattcttttc tataacggtt ctacagagga atgcatatga + 7141 aacactaccg taccacacaa tctttgagta tttatggtaa ttgattatga aacaaatatt + 7201 aatttctatt attattccat tacataatgg agaagatacg attattagag cagtaaaaag + 7261 tgttataaat agcagattat atggagattt gattgaaatt attattgttg aaaatggttc + 7321 aacagatcaa tcatttaaaa tttctcaaaa attagcgacc gaaaactcaa atatacgagt + 7381 cttgaaatca gataaaggaa ccagttttgc cagaaacgta ggaatcgaaa aatctaaagg + 7441 aaagtggctt atttttttag atgcagatga ttatttattt gaatcggatt tagacgttat + 7501 tgttgaaaat ttaataacca 
ataatacaga tttatgcgtt tataactacg aaaaagggct + 7561 taagaaaata gaactttttt cagaagaggt agagttgata gatgaccttg attcttttat + 7621 agttcaatct ctttctgaac ccactaaata tatgacagta tggggaaaag cgtttaataa + 7681 aaatttgatt gatgagtacg gtttgaagtt taatacgaat ttgagagttt cagaagatag + 7741 tgatttttat ctcagatttc ttttgctgat tcacagttta actttaactt ctcaaacgct + 7801 ataccattat tcaattgatt caccttcaac gatgaggaca ttttcttcag ataaattaga + 7861 aggttatatt gtttccttga atgaaagctc aaaagtatta ggaaatgttg ataatactat + 7921 tcaagaagcc tttgagttat ataagttggc gcattttaat ttaataatgg ttagagaagt + 7981 gttctatttt gataattcaa aaagtttcag agaaaagata aaggaaatga ttagacttta + 8041 taagatgcct atgttttttg agcctataca aaatctatct gtatctagtg ttagcaattt + 8101 atcgctagta cctctatttt ttttgaaaat acatttgtat catttagcgg cattggttta + 8161 cattattcga gtagggcaaa acaaattcaa agaaggaaga aaaagttgat gaaaagaatt + 8221 ctagtattcg gaatgaatga aaaccctggt ggagttgaat cctttataat gaattatttt + 8281 cgtgaattta atcgcgaaaa attagcctta gattttttgt gtaattcaaa tgataaaata + 8341 gcttatgagg atgaacttat ttctaaagga gcaagagttt ttcacctgac agcgagaagt + 8401 aaaaatccga tacgttatta ttgggaaatg tatagattct tcaaagaata tgcatctgat + 8461 tatcaggcaa tttgggttaa tattaatagc ttagcaaata ttgactattt aaaatttgca + 8521 agatattttg gtattccggt tcgaattgta cacagccata atagtcaaaa tatggatacc + 8581 aaacttcgtg aaaaattaca taatcataat agagacaaaa ttgaaaagtg ggcaaccgat + 8641 ttctgggctt gttcgcacga agctgcaaaa tggttttata acgaagaaac tattggaaaa + 8701 gttaagatta taccaaatgc tattaatatg aatgcttcta ttttttcttc tgaggcacga + 8761 gataaaattc gaattgatta tacattagac aataaatttg tgctaggtca tgtaggacgt + 8821 ttgcattttc agaagaatca agaatttatg ataagagttt tagctaaatt acaggaattt + 8881 agagacgatg tctgcttagt tttagttggt caaggtgaag atcttaacaa attaaagata + 8941 ctggctgagg agctatctat tcaggataag gtctactttg tgggagttca gtcgaatata + 9001 tcagaatggt tgagtacttt tgacttattc ttttttccgt ctaattttga aggtttagga + 9061 atagctgcat tagaggctca agtaaatggt ctaccgacac tactctcaga agaaggtgta + 9121 ccaaaggaag taaaaatcaa tgataatact tttttttatc 
cattgaagga aagtgaagaa + 9181 agctgggcaa acttccttga tgaaatgatt catacaacaa ctcgtttaaa ttatgaatat + 9241 atacaagaaa attttgagaa atctggctac gatattaaga tagctgctca gaatcttgaa + 9301 aaacaattgc tagaattagt ttagggaaga taacatggtt aataatattg attttgtagt + 9361 tacatgggtt aatggaaatg atccagtgtg gcgtgaggaa aaaaagaaat acgaagttct + 9421 agatggtagg ccgactttaa atgatgaaac aagatataga gatatggatt tgtttcaata + 9481 ttggtttcga gcggtagaaa aacatgcgcc ctgggttaat aatatttatt tcattacata + 9541 tgggcattta cctgaatggc tggatgcaaa tcaccctaaa ttgaagatag taaaacatga + 9601 agattatatt ccaaaagaat acttaccgac ttttagttca aatgtaattg aactaaatct + 9661 ttttaggatt aaggaattga gtgagcagtt cgttctgttt agtgatgatg tttttattaa + 9721 cacattttta aaagaagaag atttgtttaa aaataactta cctcgattgt tgagtatata + 9781 tagaccatta attccaacta aagaatttga ttatattaat ttcaatcatt tattaataat + 9841 gaatagatac tttcatgata aaaaaacatt atcacaacat aagggtaaat tttttaatgt + 9901 aggttatgga aagtttaatc tgtataatct atttagcatt ttttattcag ggattattgg + 9961 ttatcatgat gctcatgtcg ctatgcctca tttgaaaagt acttttgcag agatttggaa + 10021 taaggaaggg gtacttctag atcgagtttg taaaaacaaa tttcgttcaa ctaaagatgt + 10081 taaccattgg ttgatgagct attggaatat tgaaacaaat tcatttatgc cacagactct + 10141 tcgtgtgggt gaatatgtgc ctctggctta ttcaggtaaa attgaatcta ttattcacaa + 10201 acaaaagaat aagtttttgt gtataaacga cgatgaacat accgaaaact tcattaacga + 10261 agttaacttt gttcgtaaaa tatttgagaa aaaatttcct gaaaagtcta aatttgaaaa + 10321 gtaaagggga actaaattga aaaaacaaaa aatacttagc gtggtaattc catcctacaa + 10381 tgcggctcca tttttgatgg aaactattcc gactctagtt tctattagca gcagaaatga + 10441 tattgaggtt ttgattgtaa atgatgggtc taaagatgag acacttcaag tggctcagaa + 10501 actggaaaaa gagtattctg gcatagttag tataattgat aaagaaaatg gcggtcatgg + 10561 atctacaatt aatgctggga taagggaagc taaagggaag tactttaaag ttgttgatgc + 10621 tgatgattgg gtagatagtg aaaactttga aaagcttgta caatttcttc ataaaacaga + 10681 tgccgatgaa attatctctc catatacaga cgtttttgaa gatgatggta caaaggtaga + 10741 aaataactat tttaaagatt gttcattaaa accataccag gattatgatt 
atgtgaattt + 10801 tttagaacgg attcaaattt tacctagaat gcattctata acaataaaaa cctctatttt + 10861 aagagataat aacataaaaa ttgatgagaa tatgttctac gttgacatgg agtatattgt + 10921 ttttccaact ccatttatca aaacaataac ttatacgcct gactctgttt atcagtatcg + 10981 tagaggttac gagggacaga gtacgagtat tcagaactat ataaaaaata gaaaaatggt + 11041 aaatcatgtc acattcgctt tgcttgactt ttataataaa cacactttat ctaatattct + 11101 ggaaaaacta gttaaagaga caattgctag atgtgttact attatgacaa atgtttgtct + 11161 atcaatggaa gatactaaac aaggtaaaaa ggaacttctt gattttgatc agaaattaaa + 11221 atcaataaat tctgagttct attatcataa acaagggaaa aaagctaaag ttctaagata + 11281 ttcaaattac ttcttgtttg acttgttgtc tagctactct aagaagtcta aaaaagtata + 11341 gttgttgtag gagtatatat atgatacata aaattattaa tcgattatca cttacgattc + 11401 aacaatgtag tggcgataaa ccatttacta tcaaattagt taatgcatat gtagaactat + 11461 taagaaatac aaaatctaga gaattaagaa attatgtaat aaagaaacac attaaaaaaa + 11521 ccacgaatat ttctcaaatt aaggaagttt ttctagagaa tagtaatact ttaatacaaa + 11581 aaactgaatt tcctaaattt atctggacta tgtggtggca aggagaagag aatgcacctg + 11641 agttagtcca aagtacactc tattatatta gaaaatttgc tgaaactaat ggttatacga + 11701 cagtagttat tgataaaaat aatatagata agtatctagt agttcctgaa ttcgtatatg + 11761 caaagttgga gaagggtagt ataggtgttg caaatttttc agatttaatc cgatttatgc + 11821 taatggaaca atatggagga atttggttag attcaacgat gtatgtccat ccagatttcc + 11881 ctattgaaat attagaaaga gaattttctt cgataaatca tagggataat tccagccaat + 11941 caatggatga caatataaca aataaacgct gggtttcatt ttgtttgagt ggagagaaag + 12001 ggaacattgt ttctcgagca atgcgagctt ttttattaga tcaaattgaa aataataaag + 12061 tattacctga ttattttata attgactttg gtttagatta tctatatgat gaatttgaag + 12121 agataaggga aataataaaa agtatcccta gatattctag tcaagaagac atcttttggt + 12181 tgagaataca tagtaaagat agttttaaca aagaagaatg gtataatgaa acgaaaaaaa + 12241 atcaactttt caaaagtagc tataaagaag atgaaacagt gaaagatagt tatttcgact + 12301 atcttgttaa aagaaagtta taaagtaaaa tgaaagtaat aaaaaactat gcttacaatc + 12361 tttcatatca attattggta attatactcc ctattattac aacaccttat 
gtaacacggg + 12421 tttttagttc taatgattta gggacatacg gatactttag ttcgatagtt acttacttta + 12481 ttttgctggc tagtcttggc gttgctaact atggtactaa ggtaatctct ggaaatcgca + 12541 aggagattga aaaaaacttt tgggggattt actcattgca aatgggtgca acgcttcttt + 12601 ctctattctt gtaccttgtt ctttgtttga cccttccttt tatgcaaaat ctagtagcct + 12661 acattcttgg attgagtttg gtttctaaag gtttagatat ttcctggctc tttcaaggtt + 12721 tagaggattt tcgaaagatt actgttcgaa atatcacagt caaactcgtt ggtgtcatct + 12781 ccatctttct ctttgtcaaa tctgcaaacg atctttatct ctatgtcttt ttgttaacca + 12841 tatttgaact ctttggacaa ctcagtatgt ggttgccggc tcgagacttt atcggcaagt + 12901 ttcatgttga tatagaatac gccagacagc atttgaagcc aattatttta ttgttcctac + 12961 cacaagtcgc gatttctttg tatgttacct tagatcgtac catgcttgga gcgcttgctt + 13021 ctacaaaaga cgttggcatc tacgatcaag ccctaaaatt ggtaaatatt cttctaacct + 13081 ttgtaacttc attgggaagt gttatgctgc cacgagtatc tcatctgctt gcgacaggtg + 13141 aacgtaaggc agtaaacaag atgcatgaga tgtctttttt gatttataat ttgcttattt + 13201 ttccgattat ggcggggatt ctgatcgtga atgatgattt cgttcagtta tttctaggac + 13261 aagattttca agatgcacgc tatgcaattg cgattatggt tctcaggatg ttctttattg + 13321 gttggactaa tataatggga actcagatgt tgatccccca taaccaaaat aaagaattta + 13381 tgatttcaac aacagctcca gccattatta gcgttggatt gaatctatta ttcctaccca + 13441 agttaggtta tataggagca gccattgtct ctgttttgac agaggcgcta gtttgggtaa + 13501 ttcaattatt ctatactcgc agatatttaa aagaagttcc tataatcgga tcaatgtcaa + 13561 aaattatact agcatctgcc attatgtatg gccttttact aagttcaaaa acagttatac + 13621 atttttcatc gaccttaaat gttctagcat ttgcagcgct tggtggaatc atttatattt + 13681 ttgcaattct atctctgaaa gtggtagatg tgaaagaatt aaaacaaatt attaggaaaa + 13741 actagaatga gaaaaaatcg aaatattaac ctagatttac taaaagtgct tgcatgtgtt + 13801 ggagttgttt tacttcatac aacaatgggc ggatttaaag agacaggctc atggaatctt + 13861 ttggcatatt tatattattt aggtacttac tctattcccc tgttttttat ggtcaatggt + 13921 tatttattgt taggcaagag ggagataact tatctttaca tactccagaa agtaaaatgg + 13981 attttaataa cagtgtcatc atggtcgttt atcgtatggc tttttaagcg 
tgattttaca + 14041 actaatccta ttaaaaaaat tgtaggttct ttgatacaaa gaggttattt ctttcagttt + 14101 tggtttttcg gtgcactaat acttatctat ttatgtttgc caattttgag acaatttcta + 14161 aattcaaaaa gaagctattt atacagttta tctttattga tgactattgg tttgattttt + 14221 gagttatcaa atatcctact tcaaatgcca atacaaacat atgtaataca aacttttaga + 14281 ttatggacgt ggttttttta ctatctttta ggtggttata tagcgcaatt cactatagaa + 14341 gaaatcgaat caaggtttaa gaattggatg aaaatagtta gcatactttt gttattgatt + 14401 tcaccaataa tattattttt catagcgaag actatatacc ataatctatt tgctgaatac + 14461 ttttatgata ctttatttgt aaaagtcagt actttaggaa tttttctaac tatcctcatg + 14521 cttactttga atgaaagccg aagagaatcg attgtttccc tttctaatca aacaatgggg + 14581 gttttcataa tacatactta tattatgaaa gtgtgggaaa aagtgcttgg ttttaatttt + 14641 gtaggagcat atttactttt tgctctattt actttaagtg ttagttttat tattgttggg + 14701 atgttaatga agattcctta cttcaatcga atcgtcaaat tataaaaagg agaacaagat + 14761 gtacgattat cttattgtcg gtgctggttt gtcaggagca atttttgctt atgaggcgac + 14821 taagcgtgga aaaaaagtaa aagtgattga taaacgtgac cacattggtg ggaatatcta + 14881 ctgtgagaat ctagaaggag ttaatgttca taaatatggt gcccatatct ttcatacttc + 14941 taataagaaa gtttgggatt atgttaatca atttgctgaa tttaacaact acgtcaactc + 15001 gcctgtagct aattacaagg gtagcctcta taatctacct ttcaatatga ataccttcta + 15061 tgctatgtgg gggacaaaaa ctcctcaaga agtcaaagat aagattgctg agcagacagc + 15121 tgatatgaag gatgttgagc cgaaaaatct ggaagaacaa gctatcaagc tgattggtcc + 15181 agatatctac gaaaaattga tcaagggtta tactgaaaag cagtgggggc gctcagcaac + 15241 agaacttcct ccatttatca ttaaacgact tccagttcgt ctaacatttg ataataacta + 15301 ttttaatgac cgttaccaag gaattcctat tggtggttat aatgtgatta ttgaaaatat + 15361 gcttaaagac gtagaagttg aacttgaagt agatttcttt gctcaccgtg aagggttgga + 15421 agcatctgct gaaaaagttg tcttcacagg aatgatcgac caatattttg actacaaaca + 15481 cggagagtta gaataccgta gccttcgttt tgagcatgag attttagacg aggaaaatta + 15541 tcaaggaaat gctgtagtga actatacgga gcgtgagatt ccttatactc gtattatcga + 15601 acacaagcat tttgaatatg gaacgcaggc aaagacagtt atcacgcgtg 
aatatccagc + 15661 tgactggaag cgtggggacg agccttacta tccgatcaac gatgagaaaa ataatgctat + 15721 gtttgctaag taccaagagg aagcttcaaa gaatgataag gttattttct gtggacgttt + 15781 agcagattat aaatattatg atatgcatgt ggtgattgaa cgggcgcttg aggttgtgga + 15841 gaaagagttt ggatatgaca aaaagtagaa tcaattggat agattttgga aaaggctttt + 15901 ccatattttt agtcttagca gggcatgtgt tgcttggact gtatcaatcg gaaaaatttc + 15961 ccacagcaaa taacatacta tcgttgttga tagcacaagt ctacatattt catataccag + 16021 tattttttgc cttatcagga tactttttca aacctgtgtc ggatttgaag gagttctggc + 16081 aatatgctaa aaagaagaca attgtttttg gtctgccata tattttctat tcgatcattc + 16141 actttggtct tcaaaaagtt gcaggggcat ctgttcgtgt tcctacaacc atatctgatt + 16201 tgctaaatat ctataaagat cctcttggag tttcgtggta tttatatata ctctggtcga + 16261 ttttgataat ctatggatta ttgtctattt tagtcaaaaa tcgtagaatg ttatttttga + 16321 taagtgtttt cgcttattgt ttaaccctat ttgttcaaac agatatttat attattcaaa + 16381 gaacgctagt ttgggggctt tgtttctttc ttggcagtgt attgaatgaa attcactttg + 16441 ataaaattaa tttgaaaaaa tttctttttt tatttgtgct atttgatttt atttatatgt + 16501 tcgcttggtt cttgttttat gaagtagggt ctaagaagga ttatgtaagc tatagtaact + 16561 caggtttgtg ggggattgct tttgttgtct gtgtattagt tgcttttgcg atttttccga + 16621 aaatggagaa aaattttcct aaaactttcc tatatttcac taaatacggg aaagatagtt + 16681 tagggattta tattcttcat gcaccaattt gtagcatgat tcggattcta atgttgaaag + 16741 tgggaataaa ctcagttttt cttcacgttg ttgttgggat tgtgctaggt tggtatttat + 16801 ccatactagc aacttatata ttgaaaaaaa ttccattttt gaatattgtt ttattaccac + 16861 aaaagtatat taaattaaaa ggctctttgt caactgtagt gggttgaagt cagctaagct + 16921 cgagaaagga caaattttgt cctttctttt ttgatattca gggcgataaa aatccgtttt + 16981 ttgaagtttt caaaggtaag cgcgtcataa caaggtattt atcattcatg gaagacctcc + 17041 tgtatactat tagtaaagta aaactattgg aggatattgt aatgccacaa cctattgttc + 17101 ctgtagagat tccacaatct cgtcgttttg attctaaaaa gagaaatgat attctgctta + 17161 aaattcgtat tggcaagctt gaagtaagtt tttttcaatc tctcaatctc gaaatgatag + 17221 aacagctttt ggataaggtg ttgctctatg acaattcatc tatctagcct 
agggcaggtc + 17281 tatctcgtat gtgggaaaac ggatatgagg caaggcattg attcactggc ttatctggtt + 17341 aaaacccact ttgaattaga tcctttctca ggtcaagttt ttctcttttg tggtggacgt + 17401 aaagaccgct ttaaagccct ttactgggat ggtcaaggat tttggctatt atagtggatt + 17461 taaactagaa tagtacacct ctgcttctaa aacattgtta gaaatcgatt tgactgtcct + 17521 gttcttattt cattttacta taaattcatc agaaagtcgt gatttctatt gaaatgagga + 17581 ctttct +// + diff --git a/public/res/serotype_genbank/serotype_20C.gb b/public/res/serotype_genbank/serotype_20C.gb new file mode 100644 index 0000000..96203f6 --- /dev/null +++ b/public/res/serotype_genbank/serotype_20C.gb @@ -0,0 +1,711 @@ +LOCUS 16288_6#60 16761 bp DNA linear UNK 04-OCT-2024 +DEFINITION 16288_6#60, cps sequence. +ACCESSION 16288_6#60 +VERSION 16288_6#60 +KEYWORDS . +SOURCE None + ORGANISM . + . +COMMENT Annotated with Bakta + Software: v1.9.3 + Database: v5.1, full + DOI: 10.1099/mgen.0.000685 + URL: github.com/oschwengers/bakta + + ##Genome Annotation Summary:## + Annotation Date :: 10/04/2024, 14:28:15 + CDSs :: 17 + tRNAs :: 0 + tmRNAs :: 0 + rRNAs :: 0 + ncRNAs :: 0 + regulatory ncRNAs :: 0 + CRISPR Arrays :: 0 + oriCs/oriVs :: 0 + oriTs :: 0 + gaps :: 0 + pseudogenes :: 1 +FEATURES Location/Qualifiers + source 1..16761 + /mol_type="genomic DNA" + gene 221..1666 + /locus_tag="ONOPKJ_00005" + /gene="wzg" + CDS 221..1666 + /db_xref="BlastRules:WP_000091082" + /db_xref="RefSeq:WP_061762739.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000768ED20" + /db_xref="UniRef:UniRef100_UPI000768ED20" + /db_xref="UniRef:UniRef50_G3G7D5" + /db_xref="UniRef:UniRef90_Q9R928" + /db_xref="UniprotKB:AFN40458.1" + /db_xref="UserProtein:Wzg" + /product="""CpsA""" + /locus_tag="ONOPKJ_00005" + /protein_id="gnl|Bakta|ONOPKJ_00005" + /translation="MSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAFR + YLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLLFSILVSSVSLFAVQQFVGLTNRLN + ATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLTVNQ + SSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAPKTSK + 
NQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADGGNNQK + DKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQEFSALH + GKFYFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTSTEALKNYS + TIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDLPSYAMPDSNLY + VMEIDDSSLAVVKAAIQDVMEGR" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_061762739.1" + /gene="wzg" + gene 1668..2399 + /locus_tag="ONOPKJ_00010" + /gene="wzh" + CDS 1668..2399 + /db_xref="EC:3.1.3.48" + /db_xref="GO:0004725" + /db_xref="GO:0030145" + /db_xref="GO:0045227" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI001CE679B7" + /db_xref="UniRef:UniRef100_A0A8G1EJV1" + /db_xref="UniRef:UniRef50_Q54518" + /db_xref="UniRef:UniRef90_Q54518" + /db_xref="UniprotKB:AFN40459.1" + /db_xref="UserProtein:Wzh" + /product="""CpsB""" + /locus_tag="ONOPKJ_00010" + /protein_id="gnl|Bakta|ONOPKJ_00010" + /translation="MIDIHSHIVFDVDDGPKSIEESKALLREAYNQGVRMIVSTSHRRK + GMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTLDALEKLEKKEIPTLNDSRY + ALIEFSMHTSYRQIHAGLSNILMLGITPVIAHIERYDALENNEKRVRELIDMGCYTQIN + SYHVLKPKFFGEKYKFMKKRARYFLERDLVHVVASDMHNLDSRPPYMQQAYDIIAKKYG + AKKAKEFFVDNPRKIIMDQLI" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA + sequence:UniRef:UniRef100_A0A8G1EJV1" + /gene="wzh" + gene 2408..3100 + /locus_tag="ONOPKJ_00015" + /gene="wzd" + CDS 2408..3100 + /db_xref="BlastRules:WP_000664160" + /db_xref="GO:0005351" + /db_xref="GO:0005886" + /db_xref="GO:0009103" + /db_xref="GO:0015774" + /db_xref="GO:0045227" + /db_xref="SO:0001217" + /db_xref="UniRef:UniRef50_Q54519" + /db_xref="UniRef:UniRef90_Q54519" + /db_xref="UniprotKB:AFN40460.1" + /db_xref="UserProtein:Wzd" + /product="""CpsC""" + /locus_tag="ONOPKJ_00015" + /protein_id="gnl|Bakta|ONOPKJ_00015" + /translation="MKEQNTLEIDVLQLFRTLWKRKLVILLVAIITSSVAFACSTFVIK + PEFTSTTRIYVVNRNQEEKSGLTNQDLQAGSYLVKDYREIILSQDVLEEVISDLKLDLT + 
PKGLANKIKVTVPVDTRIVSVSVNDRVPEEASRIANSLREVAAQKIISITRVSDVTTLE + EARPAISPSSPNIKRNTLIGFLAGGIGTSVIVFLLELLDTHVKRPEDIEDTLQMTLLGV + VPNLSKLK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef90_Q54519" + /gene="wzd" + gene 3110..3793 + /locus_tag="ONOPKJ_00020" + /gene="wze" + CDS 3110..3793 + /db_xref="COG:COG0489" + /db_xref="COG:D" + /db_xref="EC:2.7.10.2" + /db_xref="GO:0004715" + /db_xref="GO:0005524" + /db_xref="GO:0016310" + /db_xref="GO:0045227" + /db_xref="RefSeq:WP_001142505.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FFE3" + /db_xref="UniRef:UniRef100_Q4K0T5" + /db_xref="UniRef:UniRef50_Q54520" + /db_xref="UniRef:UniRef90_Q54520" + /db_xref="UniprotKB:AFN40461.1" + /db_xref="UserProtein:Wze" + /product="""CpsD""" + /locus_tag="ONOPKJ_00020" + /protein_id="gnl|Bakta|ONOPKJ_00020" + /translation="MPTLEIAQKKLEFIKKAEEYYNALCTNIQLSGDKLKVISVTSVNP + GEGKTTTSVNIARSFARAGYKTLLIDGDTRNSVISGVFKSREKITGLTEFLSGTADLSH + GLCDTNIENLFVIQSGSVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTAPIGIVIDAA + IITQKCDASILVTATGEVNKRDVQKAKQQLEQTEKLFLGVILNKFDVQHEKYGSYGGYG + NYGKK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_001142505.1" + /gene="wze" + gene 3815..5185 + /locus_tag="ONOPKJ_00025" + /gene="wchA" + CDS 3815..5185 + /db_xref="KEGG:K16566" + /db_xref="SO:0001217" + /db_xref="UniRef:UniRef50_Q8VU30" + /db_xref="UniRef:UniRef90_Q4K0T4" + /db_xref="UniprotKB:AFN40462.1" + /db_xref="UserProtein:WchA" + /product="""CpsE; glycosyl transferase""" + /locus_tag="ONOPKJ_00025" + /protein_id="gnl|Bakta|ONOPKJ_00025" + /translation="MEGRGFYNITLAFLQSILVSLLAYILIAISETDIALNTVFVLFFL + HFVAFYISGYGKDFFKRGQYIELVETIKYIIFYSLLISFSSLFLKEKFVISRRGMLYLL + FLYGVLNYLLNFFLKSYWRKFTYNLKRSRKILLVTATSRVERVMDCLLLANDVQGKLVA + VSVLDKPEFTHEKLLVVPKEELISYATHEVVDEVFVNLPSEDYDIGAIISQFETMGVDI + TVNLNTFDKNLSRNKRIHEMAGLNVVTFSTNFYKPSHVITKRILDICGAIVGLFICGIA + 
SIFIVPQIRKDGGSAIFSQTRVGKNGRHFTFYKFRSMRVDAEAIKEQLMDQNTMQGGMF + KIDNDPRVTKIGKFIRKTSLDELPQFWNVLIGDMSLVGTRPPTVDEYEKYTPEQKRRLS + FKPGITGLWQISGRSEITNFDEVVKLDVAYIDDWTIWKDFEILLKTVKVVLMRDGAK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef90_Q4K0T4" + /gene="wchA" + gene 5193..5984 + /locus_tag="ONOPKJ_00030" + /gene="wciB" + CDS 5193..5984 + /db_xref="RefSeq:WP_000181796.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FFE5" + /db_xref="UniRef:UniRef100_Q4K0T3" + /db_xref="UniRef:UniRef50_A0A081QSA9" + /db_xref="UniRef:UniRef90_Q4K0T3" + /db_xref="UniprotKB:AFN40463.1" + /db_xref="UserProtein:WciB" + /product="""glycosyl transferase""" + /locus_tag="ONOPKJ_00030" + /protein_id="gnl|Bakta|ONOPKJ_00030" + /translation="MTNIKIIVATHKSFEMPQNKELYFPVHVGCEGKDDLGYQGDNTGE + NISQLNPYYCELTGLYWAWKNLDCDYLGLVHYRRYFTKKTQFYKENLKIDEVILNQEEI + ELLLRKGDIIVPKKRKYYIETLCSHYAHTLDASHLDLARKVIEKQQPEYLDSFDKVMKQ + RSGYMFNMFIMKKELANNYFEWLFPILDCMFDQINLSELTAFEARLFGRVSELLFNVWL + EKNLYSLVEVPFMYLEKVNLVEKGKSFLMAKFFGKKYGQSF" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000181796.1" + /gene="wciB" + gene 6026..7063 + /locus_tag="ONOPKJ_00035" + /gene="wzy" + CDS 6026..7063 + /db_xref="SO:0001217" + /db_xref="UniRef:UniRef50_A0A4H1DS39" + /db_xref="UniRef:UniRef90_A0A4H1DS39" + /db_xref="UniprotKB:AFN40464.1" + /db_xref="UserProtein:Wzy" + /product="""polymerase""" + /locus_tag="ONOPKJ_00035" + /protein_id="gnl|Bakta|ONOPKJ_00035" + /translation="MLIITFIKYFRISKKWKEAVYFWGFIPLILIGALRAYVGIDYTTY + SLDQIPAVLAGSQTVKFELLDKLVVYIGYYLANQQHYFYIFAIFHIILMWFLYKYIVQQ + SSNVMLSVFFLLTTVFFTFSLSGIRQSIATAIVFYALKYIKQKKSLHYIIYLGIACLFH + SSAVIYILFLVLGKININRFVGFALPMIASLFSFSGSEFVSRIILHLNFYSEYVGSRFY + TGAYDKQHQLFTIVMCLSVFLLYYIVPKKEWVNLKLYLNINFVLLLVAIIMPILPTPSR + TIYMFVLVHVILIPKLISVIKDYRSKVIITMFFVLGYFIFFSITVLQRNAYETLPYHTI + FEYLW" + /codon_start=1 + 
/transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA + sequence:UniRef:UniRef90_A0A4H1DS39" + /gene="wzy" + gene 7070..8092 + /locus_tag="ONOPKJ_00040" + /gene="whaJ" + CDS 7070..8092 + /db_xref="RefSeq:WP_000809622.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0002731E73" + /db_xref="UniRef:UniRef100_A0A4H1DX73" + /db_xref="UniRef:UniRef50_A0A4H1DX73" + /db_xref="UniRef:UniRef90_A0A4H1DX73" + /db_xref="UniprotKB:AFN40465.1" + /db_xref="UserProtein:WhaJ" + /product="""putative glycosyl transferase""" + /locus_tag="ONOPKJ_00040" + /protein_id="gnl|Bakta|ONOPKJ_00040" + /translation="MKQILISIIIPLHNGEDTIIRAVKSVINSRLYGDLIEIIIVENGS + TDQSFKISQKLATENSNIRVLKSDKGTSFARNVGIEKSKGKWLIFLDADDYLFESDLDV + IVENLITNNTDLCVYNYEKGLKKIELFSEEVELIDDLDSFIVQSLSEPTKYMTVWGKAF + NKNLIDEYGLKFNTNLRVSEDSDFYLRFLLLIHSLTLTSQTLYHYSIDSPSTMRTFSSD + KLEGYIVSLNESSKVLGNVDNTIQEAFELYKLAHFNLIMVREVFYFDNSKSFREKIKEM + IRLYKMPMFFEPIQNLSVSSVSNLSLVPLFFLKIHLYHLAALVYIIRVGQNKFKEGRKS + " + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000809622.1" + /gene="whaJ" + gene 8092..9207 + /locus_tag="ONOPKJ_00045" + /gene="wciL" + CDS 8092..9207 + /db_xref="EC:2.4.-.-" + /db_xref="KEGG:K19424" + /db_xref="RefSeq:WP_000821947.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FFE8" + /db_xref="UniRef:UniRef100_Q4K0T0" + /db_xref="UniRef:UniRef50_Q4K0T0" + /db_xref="UniRef:UniRef90_Q4K0T0" + /db_xref="UniprotKB:AFN40466.1" + /db_xref="UserProtein:WciL" + /product="""putative glycosyl transferase""" + /locus_tag="ONOPKJ_00045" + /protein_id="gnl|Bakta|ONOPKJ_00045" + /translation="MKRILVFGMNENPGGVESFIMNYFREFNREKLALDFLCNSNDKIA + YEDELISKGARVFHLTARSKNPIRYYWEMYRFFKEYASDYQAIWVNINSLANIDYLKFA + RYFGIPVRIVHSHNSQNMDTKLREKLHNHNRDKIEKWATDFWACSHEAAKWFYNEETIG + KVKIIPNAINMNASIFSSEARDKIRIDYTLDNKFVLGHVGRLHFQKNQEFMIRVLAKLQ + EFRDDVCLVLVGQGEDLNKLKILAEELSIQDKVYFVGVQSNISEWLSTFDLFFFPSNFE + 
GLGIAALEAQVNGLPTLLSEEGVPKEVKINDNTFFYPLKESEESWANFLDEMIHTTTRL + NYEYIQENFEKSGYDIKIAAQNLEKQLLELV" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000821947.1" + /gene="wciL" + gene 9218..10207 + /locus_tag="ONOPKJ_00050" + /gene="wcwK" + CDS 9218..10207 + /db_xref="EC:2.7.-.-" + /db_xref="GO:0000271" + /db_xref="GO:0016772" + /db_xref="RefSeq:WP_000247840.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FFE9" + /db_xref="UniRef:UniRef100_Q4K0S9" + /db_xref="UniRef:UniRef50_Q4K0S9" + /db_xref="UniRef:UniRef90_Q4K0S9" + /db_xref="UniprotKB:AFN40467.1" + /db_xref="UserProtein:WcwK" + /product="""glycosyl transferase""" + /locus_tag="ONOPKJ_00050" + /protein_id="gnl|Bakta|ONOPKJ_00050" + /translation="MVNNIDFVVTWVNGNDPVWREEKKKYEVLDGRPTLNDETRYRDMD + LFQYWFRAVEKHAPWVNNIYFITYGHLPEWLDANHPKLKIVKHEDYIPKEYLPTFSSNV + IELNLFRIKELSEQFVLFSDDVFINTFLKEEDLFKNNLPRLLSIYRPLIPTKEFDYINF + NHLLIMNRYFHDKKTLSQHKGKFFNVGYGKFNLYNLFSIFYSGIIGYHDAHVAMPHLKS + TFAEIWNKEGVLLDRVCKNKFRSTKDVNHWLMSYWNIETNSFMPQTLRVGEYVPLAYSG + KIESIIHKQKNKFLCINDDEHTENFINEVNFVRKIFEKKFPEKSKFEK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000247840.1" + /gene="wcwK" + gene 10220..11224 + /locus_tag="ONOPKJ_00055" + /gene="wciD" + CDS 10220..11224 + /db_xref="RefSeq:WP_050204382.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0005E79A7F" + /db_xref="UniRef:UniRef100_UPI0005E79A7F" + /db_xref="UniRef:UniRef50_A0A448K3M3" + /db_xref="UniRef:UniRef90_A0A4H1DXM5" + /db_xref="UniprotKB:AFN40468.1" + /db_xref="UserProtein:WciD" + /product="""putative glycosyl transferase""" + /locus_tag="ONOPKJ_00055" + /protein_id="gnl|Bakta|ONOPKJ_00055" + /translation="MKKQKILSVVIPSYNAAPFLMETIPTLVSISSRNDIEVLIVNDGS + KDETLQVAQKLEKEYSGIVSIIDKENGGHGSTINAGIREAKGKYFKVVDADDWVDSENF + EKLVQFLHKTDADEIISPYTDVFEDDGTKVENNYFKDCSLKPYQDYDYVNFLERIQILP + 
RMHSITIKTSILRDNNIKIDENMFYVDMEYIVFPTPFIKTITYTPDSVYQYRRGYEGQS + TSIQNYIKNRKMVNHVTFALLGFYNKHTLSNILEKLVKETIARCVTIMTNVCLSMEDTK + QGKKELLDFDQKLKSINSEFYYHKQGKKAKVLRYSNYFLFDLLSSYSKKSKKV" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050204382.1" + /gene="wciD" + gene 11242..11487 + /locus_tag="ONOPKJ_00060" + CDS 11242..11487 + /product="hypothetical protein" + /locus_tag="ONOPKJ_00060" + /protein_id="gnl|Bakta|ONOPKJ_00060" + /translation="MIHKIINRLSLTIQQLSGDKPFTIKLVNAYVELLRNTKSRESIKK + IVGSLIQRGYFFQFWFFGALILIYLCLPILRQFLNS" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + gene 11451..12323 + /locus_tag="ONOPKJ_00065" + /gene="whaF" + CDS 11451..12323 + /db_xref="SO:0001217" + /db_xref="UniRef:UniRef50_Q4K0S7" + /db_xref="UniRef:UniRef90_Q4K0S7" + /db_xref="UniprotKB:AFN40469.1" + /db_xref="UserProtein:WhaF" + /product="""putative glycosyl transferase""" + /locus_tag="ONOPKJ_00065" + /protein_id="gnl|Bakta|ONOPKJ_00065" + /translation="MFANFETISKFIRNYVIKKHIKKTTNISQIKEVFLENSNTLIQKT + EFPKFIWTMWWQGEENAPELVQSTLYYIRKFAETNGYTTVVIDKNNIDKYLVVPEFVYA + KLEKGSIGVANFSDLIRFMLMEQYGGIWLDSTMYVHPDFPIEILEREFSSINHRDNSSQ + SMDDNITNKRWVSFCLSGEKGNIVSRAMRAFLLDQIENNKVLPDYFIIDFGLDYLYDEF + EEIREIIKSIPRYSSQEDIFWLRIHSKDSYNKDEWNNETKKNQIFKSSYKEDETVKDSY + FDYLVKRKL" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef90_Q4K0S7" + /gene="whaF" + gene 12330..13745 + /locus_tag="ONOPKJ_00070" + /gene="wzx" + CDS 12330..13745 + /db_xref="SO:0001217" + /db_xref="UniRef:UniRef50_K8MPI1" + /db_xref="UniRef:UniRef90_Q4K0S6" + /db_xref="UniprotKB:AFN40470.1" + /db_xref="UserProtein:Wzx" + /product="""flippase""" + /locus_tag="ONOPKJ_00070" + /protein_id="gnl|Bakta|ONOPKJ_00070" + /translation="MKVIKNYAYNLSYQLLVFILPIITTPYVTRIFSSNDLGIYGYFSS + IVTYFILLATLGVANYGTKVISGNRKEIEKNFWGIYSLQMGATLLSLFLYLVLCLTLPF + 
MKNPVAYILGLSLVSKGLDISWLFQGVEDFQKITVRNITVKLVGVISIFLFVKSSNDLY + LYVFLLTIFELLGQFSMWMPARDFIGKFHVDIEYARQHLKPIILLFLPQVAISLYVTLD + RTMLGALASTKDVGIYDQALKLVNILLTFVTSLGSVMLPRVSHLLATGERKAVNKMHEM + SFLIYNLLIFPIMAGILIVNDDFVQLFLGQDFQDARYAIAIMVLRMFFIGWTNIMGIQM + LIPHNQNKEFMISTTAPAIISVGLNLLFLPKLGYIGAAIVSVLTEALVWAIQLFYTRRY + LKEVPIIGSMSKIILASAIMYGLLLSSKTVIHFSSTLNVLAFAALGGIIYLFAILSLKV + VDVKELKQIIRKN" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef90_Q4K0S6" + /gene="wzx" + gene 13747..14626 + /gene="wciG" + /note="O-acetyltrasnferase" + /pseudo + gene 14640..15749 + /locus_tag="ONOPKJ_00085" + /gene="glf" + CDS 14640..15749 + /db_xref="COG:COG0562" + /db_xref="COG:M" + /db_xref="EC:5.4.99.9" + /db_xref="GO:0008767" + /db_xref="GO:0009273" + /db_xref="SO:0001217" + /db_xref="UniRef:UniRef50_A0A4S2G265" + /db_xref="UniRef:UniRef90_F8WRM7" + /db_xref="UniprotKB:AFN40472.1" + /db_xref="UserProtein:Glf" + /product="""galactofuranose mutase""" + /locus_tag="ONOPKJ_00085" + /protein_id="gnl|Bakta|ONOPKJ_00085" + /translation="MYDYLIVGAGLSGAIFAYEATKRGKKVKVIDKRNHIGGNIYCENV + EGVNVHKYGAHIFHTSNKKVWDYVNQFAEFNNYVNSPVANYKGSLYNLPFNMNTFYAMW + GTKTPQEVKDKITEQTADMKDVEPKNLEEQAIKLIGPDVYEKLIKGYTEKQWGRSATEL + PPFIIKRLPVRLTFDNNYFNDRYQGIPIGGYNVIIENMLKDVEVELGVDFFAHREELEA + SANKVVFTGMIDQYFDYKHGELEYRSLRFEHEILDEENYQGNAVVNYTEREIPYTRIIE + HKHFEYGTQAKTVITREYPADWKRGDEPYYPINDEKNNAMFAKYQEEASKNDKVIFCGR + LADYKYYDMHVVIERALEVVEKEFGYDKK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef90_F8WRM7" + /gene="glf" +ORIGIN + 1 attagattga aactagaata gtacacctct gcttctaaaa cattgttaga aatcgatttg + 61 actgtcctga tcgttttgtt atgttcttat ttcattttac tatatttttg gttcgcggga + 121 agtctactaa gatacttaaa gatgcagata gtaaaaaaat gtagacatta ccgtaaaaaa + 181 gtgatataat cgtatgatgt tcaaggtata ggtgttaatc atgagtagac gttttaaaaa + 241 atcaggttca cagaaagtga agcgaagtgt taatatcgtt 
ttgctgacta tttatttatt + 301 gttagtttgt tttttattgt tcttaatctt taagtacaat atccttgctt ttagatatct + 361 taacctagtg gtaactgcgt tagtcctact agttgccttg gtagggctac tcttgattat + 421 ctataaaaaa gctgaaaagt ttactatttt tctgttgctg ttctctatcc ttgtcagctc + 481 tgtgtcgctc tttgcagtac agcagtttgt tggactgacc aatcgtttaa atgcgacttc + 541 taattactca gaatattcaa tcagtgtcgc tgttttagca gatagtgata tcgaaaatgt + 601 tacgcaactg acgagtgtga cagcaccgac tgggactgat aatgaaaata ttcaaaaact + 661 actagctgat attaagtcaa gtcagaatac cgatttgacg gtcaaccaga gttcgtctta + 721 cttggcagct tacaagagtt tgattgcagg ggagactaag gccattgtcc taaatagtgt + 781 ctttgaaaac atcatcgagt cagagtatcc agactacgca tcgaagataa aaaagattta + 841 taccaaggga ttcactaaaa aagtagaagc tcctaagacg tctaagaatc agtctttcaa + 901 tatctatgtt agtggaattg acacctatgg tcctattagt tcggtgtcgc gatcagatgt + 961 caatatcctg atgactgtca atcgagatac caagaaaatc ctcttgacca caacgccacg + 1021 tgatgcctat gtaccaatcg cagatggtgg aaataatcaa aaagataaat taacccatgc + 1081 aggcatttat ggagttgatt cgtccattca caccttagaa aatctctatg gagtggatat + 1141 caattactat gtgcgattga acttcacttc tttcttgaaa atgattgact tattgggagg + 1201 ggtagatgtt cataatgatc aagagttttc agctctacat gggaagttct atttcccagt + 1261 agggaatgtc catctagact ctgagcaggc tctaggtttt gtacgtgaac gctactcact + 1321 agccgatgga gaccgtgacc gtggtcgcaa ccaacaaaag gtgattgtgg ctatccttca + 1381 aaaattaacg tcaaccgaag cactgaaaaa ttatagtacg atcattaata gcttgcaaga + 1441 ttctatccaa acaaatatgc cacttgagac tatgataaat ttggtcaatg ctcagttaga + 1501 aagtggaggg aattataaag taaattctca agatttaaaa ggtacaggtc ggacggatct + 1561 tccttcttat gcaatgccag acagtaacct ctatgtgatg gaaatagatg atagtagttt + 1621 agctgtagtt aaagcagcta tacaggatgt gatggagggt agatgaaatg atagacatcc + 1681 attcgcatat cgtttttgat gtagatgacg gtcccaagtc aatagaggaa agcaaggcac + 1741 ttttaagaga agcttataat caaggagttc gaatgattgt gtctacttcg catcgtcgaa + 1801 aagggatgtt tgaaactccg gaagagaaga tagcagaaaa ctttcttcag gttcgggaaa + 1861 ttgcaaaaga agtagcagat gatttagtca tagcttatgg cgcagagata tactatactc + 1921 tggatgctct 
agaaaagcta gaaaaaaaag aaattcctac ccttaatgat agtcgttatg + 1981 ctttgattga gtttagcatg catacttcct atcgtcagat tcatgcggga ttgagcaata + 2041 ttttgatgtt gggaatcacg ccagtaattg ctcatattga acgttatgat gccttagaga + 2101 ataacgaaaa acgtgttcgt gaactgattg atatggggtg ctatactcag ataaatagtt + 2161 atcatgtttt aaaacctaag ttctttggtg aaaaatataa attcatgaaa aagagagctc + 2221 ggtatttttt ggaacgtgat ttagttcatg tagttgcaag tgacatgcac aatttagaca + 2281 gtagacctcc atatatgcaa caggcatatg atatcattgc taagaaatat ggagcgaaaa + 2341 aagcgaaaga attttttgta gataatccca gaaaaattat aatggatcaa ttaatttagg + 2401 agaaaatatg aaggaacaaa acactttgga aatcgatgta ttgcaactat tcagaacttt + 2461 atggaaaaga aagttggtca ttttattagt ggcaattata acttcttcag ttgcttttgc + 2521 ctgcagtact tttgttatca aacctgagtt tactagtacg actcggattt atgtagttaa + 2581 ccgtaatcag gaagagaagt ctggtttaac caatcaagac ttgcaggcag gatcatactt + 2641 ggtcaaagac tatcgtgaaa ttatcctatc gcaggatgtt ttggaggaag ttatttctga + 2701 tttgaaacta gatttgacgc caaaaggttt ggctaataaa attaaagtaa cagtaccagt + 2761 tgatacccgt attgtctctg tttcagttaa tgatcgagtt cctgaagagg caagccgtat + 2821 cgctaactct ttgagagaag tagctgctca aaaaattatc agtattactc gtgtttctga + 2881 tgtgacaaca ctggaggaag caagaccggc gatatcacca tcttcgccaa atattaaacg + 2941 caatacacta attggttttt tggcaggggg gattggaact agtgttatag tttttcttct + 3001 tgaacttttg gacactcatg tgaaacgtcc ggaagatatc gaagatacac tgcagatgac + 3061 acttttggga gttgtaccaa acttgagtaa gttgaaatag gagagaggaa tgccgacatt + 3121 agaaatagca caaaaaaaac tggagttcat taagaaggca gaagaatatt acaatgcctt + 3181 gtgtacaaat atacagttga gcggagataa actaaaagta atttccgtta cttctgttaa + 3241 ccctggggaa ggaaaaacaa ctacttccgt aaatatagca aggtcgtttg cgcgtgcagg + 3301 ctataaaact cttttgatcg atggcgatac tcgaaattca gttatatcag gagtttttaa + 3361 atcgcgtgaa aaaattacag ggctaacaga atttttatct gggacagctg atttatctca + 3421 cggtttatgt gatacaaata ttgaaaattt atttgtaatt caatcgggat ctgtatcacc + 3481 aaaccctaca gccttgttac aaagtaaaaa ttttaatgat atgattgaaa cattgcgtaa + 3541 atattttgat tatatcattg ttgatacagc 
acctattgga attgttattg atgcggcaat + 3601 tatcactcaa aagtgtgatg cgtccatctt ggtaacagca acaggtgagg tgaataaacg + 3661 tgatgtccaa aaagcgaaac aacaattaga acaaacagag aaactgtttt taggtgtcat + 3721 tctcaataaa tttgatgttc aacatgaaaa atatggttct tacggtggct atggtaatta + 3781 cggaaaaaaa tagaatgaag ttagggagtc cagtatggaa ggaaggggtt tctacaatat + 3841 aactctggca ttcttacaga gtatacttgt tagtctatta gcttatatac tgattgcaat + 3901 ttcagaaacc gacattgctt taaatacagt attcgtcctg ttttttcttc actttgtagc + 3961 cttttatatt agtggttatg gtaaagattt tttcaaaaga ggtcagtata ttgagttggt + 4021 agaaacgata aaatacataa tattttattc cttgttgatc agcttttcaa gtttgttctt + 4081 aaaagaaaaa tttgttattt ctagacgagg aatgctctac ttgcttttcc tatatggtgt + 4141 tttgaattat ctactcaatt tctttttgaa aagttattgg agaaaattca cctataattt + 4201 aaagcgcagt cgcaagattt tattggttac ggcaacatca cgcgtcgaaa gagtaatgga + 4261 ttgcctgtta cttgcgaacg atgttcaagg gaaattggtt gctgttagtg ttttagataa + 4321 gccagaattt actcatgaaa agctccttgt tgtaccaaaa gaagagttga tttcctacgc + 4381 tacccatgaa gtagtagatg aagtttttgt caatcttcca agtgaggact atgatattgg + 4441 agccattatt tctcagtttg aaacaatggg ggttgatata acagtcaatc tcaatacttt + 4501 tgataaaaac ttaagccgaa ataaacgaat ccatgaaatg gcaggattga atgtagtgac + 4561 cttctctacg aatttttaca agcctagtca tgtcattact aagaggattc ttgatatttg + 4621 tggagctatc gttggtcttt ttatctgtgg aattgctagt atattcatag ttcctcagat + 4681 tcgaaaagat ggtgggtctg caatcttttc acaaactcgt gtaggaaaaa atggtcgtca + 4741 ctttaccttt tataaattcc gctcgatgcg agtcgatgca gaagcgatca aggaacagtt + 4801 gatggatcaa aatacgatgc aaggtggtat gtttaagatc gataacgatc ctcgagtgac + 4861 aaagattgga aaatttatcc gaaaaactag cttggatgaa ttgccacaat tttggaatgt + 4921 tttaattgga gacatgagtc tagtaggtac gcgcccacca actgtagatg agtacgaaaa + 4981 atacacacct gaacaaaaac gtcgcctaag ctttaaacct ggtattacag gtttgtggca + 5041 aattagtggt cgaagtgaaa ttacaaactt cgatgaggtt gttaagttgg atgtggctta + 5101 tatcgatgat tggaccattt ggaaagattt tgaaatattg ttaaaaactg taaaagttgt + 5161 gttgatgaga gatggagcga agtaggaggg gtatgacaaa tattaaaatt 
atagttgcaa + 5221 ctcataagag ttttgagatg ccgcaaaata aagaattgta tttcccagtc catgtggggt + 5281 gtgaaggaaa agatgatttg ggatatcaag gagataatac tggggaaaac atttcccagt + 5341 taaaccctta ttactgtgaa ttaacaggtt tatattgggc atggaagaat ctagattgcg + 5401 attatcttgg actagttcat taccgccgat atttcacgaa gaaaactcaa ttttataaag + 5461 aaaatctaaa aattgatgaa gtaattttaa atcaggaaga aattgaattg cttttgagaa + 5521 aaggagatat aatagttcct aaaaaaagga aatattatat tgaaactcta tgttctcatt + 5581 atgcacacac gctagatgct agccatctag atttggctag aaaagtcatt gagaagcaac + 5641 aacctgaata ccttgattca tttgataaag ttatgaaaca acgtagtggc tatatgttta + 5701 atatgtttat aatgaaaaag gaattagcaa ataattattt tgaatggctg tttccgattt + 5761 tagattgtat gtttgatcag attaatcttt cagagttaac tgcatttgag gcacgtcttt + 5821 ttggtcgtgt aagtgaacta ttattcaacg tatggctaga gaagaatttg tattctctag + 5881 tagaagttcc atttatgtat ttggaaaagg ttaatctagt agaaaaaggg aaatcgtttt + 5941 taatggctaa attttttggt aagaagtatg gacagagttt ttagggagga actaattgat + 6001 ttacattggt acgatgcttc tctcaatgtt gataattact tttatcaagt attttagaat + 6061 atcaaaaaaa tggaaagagg cagtttattt ttggggtttt attcctctta tcttgatagg + 6121 agcacttaga gcttatgtag gaatagatta taccacatat agtttggatc agataccggc + 6181 tgtattagct ggtagtcaga cagtcaaatt tgaattgtta gataaattag tagtgtacat + 6241 aggttactat ctagctaatc agcagcatta tttctatatt tttgcaatat ttcacattat + 6301 cctgatgtgg tttctgtata aatatattgt tcaacagtcg tctaatgtaa tgttgagtgt + 6361 gttttttctt ctaaccactg ttttttttac tttttcttta tcaggaatac gccaatcaat + 6421 agctacagcg attgtttttt atgcgttgaa gtatattaaa caaaaaaaaa gtttacatta + 6481 tataatttat ttagggattg cttgtttatt tcattctagt gcagtaatct atatactttt + 6541 tttagtttta gggaaaatta atattaatag gttcgttggc tttgcattac cgatgattgc + 6601 atcattattt tctttttctg ggtctgaatt tgtatctcga ataatactac atttaaattt + 6661 ttattcagaa tacgttggtt ctcgttttta tacaggagca tatgataagc aacaccaact + 6721 attcacaatc gttatgtgtt tatcggtatt tctattatat tatattgttc cgaaaaaaga + 6781 gtgggttaat ttaaaattat atctgaatat taattttgtg ctattactag ttgcaataat + 6841 catgccaata 
cttcctactc catcaagaac tatttatatg tttgttcttg tacatgttat + 6901 tctaattcct aagttgattt cagttattaa agattatagg tctaaggtaa tcataacaat + 6961 gttctttgtt ttaggttatt ttatattctt ttctataacg gttctacaga ggaatgcata + 7021 tgaaacacta ccgtaccaca caatctttga gtatttatgg taattgatta tgaaacaaat + 7081 attaatttct attattattc cattacataa tggagaagat acgattatta gagcagtaaa + 7141 aagtgttata aatagcagat tatatggaga tttgattgaa attattattg ttgaaaatgg + 7201 ttcaacagat caatcattta aaatttctca aaaattagcg accgaaaact caaatatacg + 7261 agtcttgaaa tcagataaag gaaccagttt tgccagaaac gtaggaatcg aaaaatctaa + 7321 aggaaagtgg cttatttttt tagatgcaga tgattattta tttgaatcgg atttagacgt + 7381 tattgttgaa aatttaataa ccaataatac agatttatgc gtttataact acgaaaaagg + 7441 gcttaagaaa atagaacttt tttcagaaga ggtagagttg atagatgacc ttgattcttt + 7501 tatagttcaa tctctttctg aacccactaa atatatgaca gtatggggaa aagcgtttaa + 7561 taaaaatttg attgatgagt acggtttgaa gtttaatacg aatttgagag tttcagaaga + 7621 tagtgatttt tatctcagat ttcttttgct gattcatagt ttaactttaa cttctcaaac + 7681 gctataccat tattcaattg attcaccttc aacgatgagg acattttctt cagataaatt + 7741 agaaggttat attgtttcct tgaatgaaag ctcaaaagta ttaggaaatg ttgataatac + 7801 tattcaagaa gcctttgagt tatataagtt ggcgcatttt aatttaataa tggttagaga + 7861 agtgttctat tttgataatt caaaaagttt cagagaaaag ataaaggaaa tgattagact + 7921 ttataagatg cctatgtttt ttgagcctat acaaaatcta tctgtatcta gtgttagcaa + 7981 tttatcgcta gtacctctat tttttttgaa aatacatttg tatcatttag cggcattggt + 8041 ttacattatt cgagtagggc aaaacaaatt caaagaagga agaaaaagtt gatgaaaaga + 8101 attctagtat tcggaatgaa tgaaaaccct ggtggagttg aatcctttat aatgaattat + 8161 tttcgtgaat ttaatcgcga aaaattagcc ttagattttt tgtgtaattc aaatgataaa + 8221 atagcttatg aggatgaact tatttctaaa ggagcaagag tttttcacct gacagcgaga + 8281 agtaaaaatc cgatacgtta ttattgggaa atgtatagat tcttcaaaga atatgcatct + 8341 gattatcagg caatttgggt taatattaat agcttagcaa atattgacta tttaaaattt + 8401 gcaagatatt ttggtattcc ggttcgaatt gtacacagcc ataatagtca aaatatggat + 8461 accaaacttc gtgaaaaatt acataatcat 
aatagagaca aaattgaaaa gtgggcaacc + 8521 gatttctggg cttgttcgca cgaagctgca aaatggtttt ataacgaaga aactattgga + 8581 aaagttaaga ttataccaaa tgctattaat atgaatgctt ctattttttc ttctgaggca + 8641 cgagataaaa ttcgaattga ttatacatta gacaataaat ttgtgctagg tcatgtagga + 8701 cgtttgcatt ttcagaagaa tcaagaattt atgataagag ttttagctaa attacaggaa + 8761 tttagagacg atgtctgctt agttttagtt ggtcaaggtg aagatcttaa caaattaaag + 8821 atactggctg aggagctatc tattcaggat aaggtctact ttgtgggagt tcagtcgaat + 8881 atatcagaat ggttgagtac ttttgactta ttcttttttc cgtctaattt tgaaggttta + 8941 ggaatagctg cattagaggc tcaagtaaat ggtctaccga cactactctc agaagaaggt + 9001 gtaccaaagg aagtaaaaat caatgataat actttttttt atccattgaa ggaaagtgaa + 9061 gaaagctggg caaacttcct tgatgaaatg attcatacaa caactcgttt aaattatgaa + 9121 tatatacaag aaaattttga gaaatctggc tacgatatta agatagctgc tcagaatctt + 9181 gaaaaacaat tgctagaatt agtttaggga agataacatg gttaataata ttgattttgt + 9241 agttacatgg gttaatggaa atgatccagt gtggcgtgag gaaaaaaaga aatacgaagt + 9301 tctagatggt aggccgactt taaatgatga aacaagatat agagatatgg atttgtttca + 9361 atattggttt cgagcggtag aaaaacatgc gccctgggtt aataatattt atttcattac + 9421 atatgggcat ttacctgaat ggctggatgc aaatcaccct aaattgaaga tagtaaaaca + 9481 tgaagattat attccaaaag aatacttacc gacttttagt tcaaatgtaa ttgaactaaa + 9541 tctttttagg attaaggaat tgagtgagca gttcgttctg tttagtgatg atgtttttat + 9601 taacacattt ttaaaagaag aagatttgtt taaaaataac ttacctcgat tgttgagtat + 9661 atatagacca ttaattccaa ctaaagaatt tgattatatt aatttcaatc atttattaat + 9721 aatgaataga tactttcatg ataaaaaaac attatcacaa cataagggta aattttttaa + 9781 tgtaggttat ggaaagttta atctgtataa tctatttagc attttttatt cagggattat + 9841 tggttatcat gatgctcatg tcgctatgcc tcatttgaaa agtacttttg cagagatttg + 9901 gaataaggaa ggggtacttc tagatcgagt ttgtaaaaac aaatttcgtt caactaaaga + 9961 tgttaaccat tggttgatga gctattggaa tattgaaaca aattcattta tgccacagac + 10021 tcttcgtgtg ggtgaatatg tgcctctggc ttattcaggt aaaattgaat ctattattca + 10081 caaacaaaag aataagtttt tgtgtataaa cgacgatgaa cataccgaaa 
acttcattaa + 10141 cgaagttaac tttgttcgta aaatatttga gaaaaaattt cctgaaaagt ctaaatttga + 10201 aaagtaaagg ggaactaaat tgaaaaaaca aaaaatactt agcgtggtaa ttccatccta + 10261 caatgcggct ccatttttga tggaaactat tccgactcta gtttctatta gcagcagaaa + 10321 tgatattgag gttttgattg taaatgatgg gtctaaagat gagacacttc aagtggctca + 10381 gaaactggaa aaagagtatt ctggcatagt tagtataatt gataaagaaa atggcggtca + 10441 tggatctaca attaatgctg ggataaggga agctaaaggg aagtacttta aagttgttga + 10501 tgctgatgat tgggtagata gtgaaaactt tgaaaagctt gtacaatttc ttcataaaac + 10561 agatgccgat gaaattatct ctccatatac agacgttttt gaagatgatg gtacaaaggt + 10621 agaaaataac tattttaaag attgttcatt aaaaccatac caggattatg attatgtgaa + 10681 ttttttagaa cggattcaaa ttttacctag aatgcattct ataacaataa aaacctctat + 10741 tttaagagat aataacataa aaattgatga gaatatgttc tacgttgaca tggagtatat + 10801 tgtttttcca actccattta tcaaaacaat aacttatacg cctgactctg tttatcagta + 10861 tcgtagaggt tacgaaggac agagtacgag tattcagaac tatataaaaa atagaaaaat + 10921 ggtaaatcat gtcacattcg ctttgcttgg cttttataat aaacacactt tatctaatat + 10981 tctggaaaaa ctagttaaag agacaattgc tagatgtgtt actattatga caaatgtttg + 11041 tctatcaatg gaagatacta aacaaggtaa aaaggaactt cttgattttg atcagaaatt + 11101 aaaatcaata aattctgagt tctattatca taaacaaggg aaaaaagcta aagttttaag + 11161 atattcaaat tacttcttgt ttgacttatt atctagctac tctaagaagt ctaaaaaagt + 11221 atagttgctg taggagtata tatgatacat aaaattatta atcgattatc acttacgatt + 11281 caacaactta gtggcgataa accatttact atcaaattag ttaatgcata tgtagaacta + 11341 ttaagaaata caaaatctag agaatctatt aaaaaaattg taggttcttt gatacaaaga + 11401 ggttatttct ttcagttttg gtttttcggt gcactcatac ttatctattt atgtttgcca + 11461 attttgagac aatttctaaa ttcataagaa attatgtaat aaagaaacac attaaaaaaa + 11521 ccacgaatat ttctcaaatt aaggaagttt ttctagagaa tagtaatact ttaatacaaa + 11581 aaactgaatt tcctaaattt atctggacta tgtggtggca aggagaagag aatgcacctg + 11641 agttagtcca aagtacactc tattatatta gaaaatttgc tgaaactaat ggttatacga + 11701 cagtagttat tgataaaaat aatatagata agtatctagt agttcctgaa 
ttcgtatatg + 11761 caaagttgga gaagggtagt ataggtgttg caaatttttc agatttaatc cgatttatgc + 11821 taatggaaca atatggagga atttggttag attcaacgat gtatgtccat ccagatttcc + 11881 ctattgaaat attagaaaga gaattttctt cgataaatca tagggataat tccagccaat + 11941 caatggatga caatataaca aataaacgct gggtttcatt ttgtttgagt ggagagaaag + 12001 ggaacattgt ttctcgagca atgcgagctt ttttattaga tcaaattgaa aataataaag + 12061 tattacctga ttattttata attgactttg gtttagatta tctatatgat gaatttgaag + 12121 agataaggga aataataaaa agtatcccta gatattctag tcaagaagac atcttttggt + 12181 tgagaataca tagtaaagat agttataaca aagatgaatg gaataatgaa acgaaaaaaa + 12241 atcaaatttt caagagtagt tataaagaag atgaaacagt gaaagatagt tatttcgact + 12301 accttgttaa aagaaagtta taaagtaata tgaaagttat aaaaaactat gcttacaatc + 12361 tttcatatca attgttggtg ttcatactcc ctattatcac aactccttat gtgactcgga + 12421 tttttagttc taatgattta gggatatacg gatactttag ttcgatagtt acttatttta + 12481 ttttgctggc tactcttgga gttgctaact atgggaccaa ggtaatctct gggaatcgaa + 12541 aggaaattga aaaaaacttt tgggggattt actcattgca aatgggtgca acgcttcttt + 12601 ctctattctt gtaccttgtt ctttgtctga ctcttccctt tatgaaaaat ccggtagcct + 12661 atattctagg cttgagttta gtttctaaag gtttagacat ctcctggctc tttcaagggg + 12721 tggaggattt tcaaaagatt actgtccgaa atatcacagt caaactcgtt ggtgtcatct + 12781 ccatctttct ctttgttaaa tcatcaaatg acctttacct ctatgtcttt ttgctaacca + 12841 tttttgaact cttgggccaa ttcagtatgt ggatgccggc tcgagacttt atcggcaagt + 12901 ttcatgttga tatagaatac gccagacagc atttgaagcc aattatttta ttgttccttc + 12961 cgcaagtggc gatttccttg tatgttacgc tagatcgtac catgcttgga gcgttagctt + 13021 ctacaaaaga cgttggcatc tacgatcaag ccctaaaatt ggtaaatatt cttctaacct + 13081 ttgtaacttc attgggaagt gttatgctgc cacgagtatc tcatctgctt gcgacaggtg + 13141 aacgtaaggc agtaaacaag atgcatgaga tgtctttttt gatttataat ttgcttattt + 13201 ttccgattat ggcggggatt ctgatcgtga atgatgattt cgttcagtta tttctaggac + 13261 aagattttca agatgcacgc tatgcaattg cgattatggt tctcaggatg ttctttatcg + 13321 gttggaccaa tatcatggga attcagatgt tgatacctca taatcaaaat 
aaagaattca + 13381 tgatttcaac aacagctcca gccattatta gcgttggatt gaatctatta ttcctaccca + 13441 agttaggtta tataggagca gccattgtct ctgttttaac agaggcactt gtatgggcaa + 13501 tccaattatt ctatactcgc agatatttaa aagaagttcc tataatcgga tcaatgtcaa + 13561 aaattatact agcatctgcc attatgtatg gccttttact aagttcaaaa acagttatac + 13621 atttttcatc gaccttaaat gttctagcat ttgcagcgct tggtggaatc atttatcttt + 13681 ttgcaattct atctctgaaa gtggtagatg tgaaagaatt aaaacaaatt attaggaaaa + 13741 actagaatga gaaaaaatcg aaatattaac ctagatttac taaaagtgct tgcatgtgtt + 13801 ggagttgttt tacttcatac aacaatgggc ggatttaaag agacagactc atggaatctt + 13861 ttggcatatt tatattattt aggtacttac tctattcccc tgttttttat ggtcaatggt + 13921 tatttattgt taggcaagag ggagataact tatctttaca tactccagaa agtaaaatgg + 13981 attttaataa cagtgtcatc atggtcattt atcgtatggc tttttaagcg tgattttaca + 14041 actaatcaaa agaagctatt tatacagttt atctttattg atgactattg gtttgatttt + 14101 tgagttatca aatatcctac ttcaaatgcc aatacaaaca tatgtaatac aaacttttag + 14161 attatggacg tggttttttt actatctttt aggtggttat atagcgcaat tcactataga + 14221 agaaatcgaa tcaaggttta agaattggat gaaaatagtt agcatacttt tgttattgat + 14281 ttcaccaata atattatttt tcatagcgaa gactatatac cataatctat ttgctgaata + 14341 cttttatgat actttatttg taaaagtcag tactttagga atttttctaa ctatcctcat + 14401 gcttactttg aatgaaaacc gaagagaatc gattgtttcc ctttctaatc aaacaatggg + 14461 ggttttcata atacatactt atattatgaa agtgtgggaa aaagtgcttg gttttaattt + 14521 tgtaggagca tatttacttt ttgctctatt tactttaagt gttagtttta ttattgttgg + 14581 gatgttaatg aagattcctt acttcaatcg aatcgtcaaa ttataaaaag gagaacaaga + 14641 tgtacgatta tcttattgtc ggtgctggtt tgtcaggagc aatttttgct tatgaggcga + 14701 ccaagcgtgg aaaaaaagta aaagtgattg ataaacgtaa ccacattggt gggaatatct + 14761 actgtgagaa tgtagaagga gttaatgttc ataaatatgg tgcccatatc tttcatactt + 14821 ctaataagaa agtttgggat tatgttaatc aatttgctga atttaacaac tacgtcaact + 14881 cgcctgtagc taattacaag ggtagcctct ataatctacc tttcaatatg aataccttct + 14941 atgctatgtg ggggacaaaa actcctcaag aagtcaaaga taagattact 
gagcagacag + 15001 ctgatatgaa ggatgttgag ccgaaaaatc tggaagaaca ggctatcaag ttgattggtc + 15061 cagatgtcta tgaaaagtta atcaagggtt atactgaaaa gcagtgggga cgctcagcaa + 15121 cagaacttcc tccatttatc attaaacgac ttccagttcg tttaaccttt gataataact + 15181 attttaatga ccgttaccaa gggattccta ttggtggtta caatgtcatc atcgaaaata + 15241 tgctgaaaga tgtagaagtt gaacttggag tagacttttt tgctcatcgt gaagagttgg + 15301 aagcatctgc taacaaagtt gtcttcacag gaatgatcga ccaatatttt gattacaagc + 15361 acggagagtt agaataccgt agccttcgtt ttgagcatga gattttagac gaggaaaatt + 15421 atcaaggaaa tgctgtagtg aactatacgg agcgtgagat tccttatact cgtattatcg + 15481 aacacaagca ttttgaatat ggaacacagg caaagacagt tatcacgcgt gaatatccag + 15541 ctgactggaa gcgtggggac gagccttact atccgatcaa cgatgagaaa aataatgcta + 15601 tgtttgctaa gtaccaagag gaagcttcaa agaatgataa ggttattttc tgtggacgtt + 15661 tagcagatta taaatattat gatatgcatg tggtgattga acgggcgctt gaggttgtgg + 15721 agaaagagtt tggatatgac aaaaagtaga atcaattgga tagattttgg aaaaggcttt + 15781 tccatatttt tagtcttagc agggcatgtg ttgcttggac tgtatcaatc ggaaaaattt + 15841 cccacagcaa ataacatact atcgttgttg atagcacaag tctacatatt tcatatacca + 15901 gtattttttg ccttatcagg atactttttc aaacctgtgt cggatttgaa ggagttctgg + 15961 caatatgcta aaaagaagac aattgttttt ggtctgccat atattttcta ttcgatcatt + 16021 cactttggtc ttcaaaaagt tgcaggggca tctgttcgtg ttcctacaac catatctgat + 16081 ttgctaaata tctataaaga tcctcttgga gtttcgtggt atttatatat actctggtcg + 16141 attttgataa tctatggatt attgtctatt ttagtcaaaa atcgtagaat gttatttttg + 16201 ataagtgttt tcgcttattg tttaacccta tttgttcaaa cagatattta tattattcaa + 16261 agaacgctag tttgggggct ttgtttcttt cttggcagtg tattgaatga aattcacttt + 16321 gataaaatta atttgaaaaa atttcttttt ttctttgtgc tatttgattt tatttatatg + 16381 ttcgcttggt tcttgtttta tgaagtaggg tctaagaagg attatgtaag ctatagtaac + 16441 ccaggtttgt gggggattgc ttttgttgtc tgtgtattag ttgcttttgc gatttttccg + 16501 aaaatggaga aaaattttcc taaaactttc ctatatttca ctaaatacgg gaaagatagt + 16561 ttagggattt atattcttca tgcaccaatt tgtagcatga ttcggattct 
aatgttgaaa + 16621 gtgggaataa actcagtttt tcttcacgtt gttgttggga ttgtgctagg ctggtattta + 16681 tccatactag caacttatat attgaaaaaa attccatttt tgaatattgt tttattacca + 16741 caaaagtata ttaaattaaa a +// diff --git a/public/res/serotype_genbank/serotype_21.gb b/public/res/serotype_genbank/serotype_21.gb new file mode 100644 index 0000000..60d222d --- /dev/null +++ b/public/res/serotype_genbank/serotype_21.gb @@ -0,0 +1,1153 @@ +LOCUS CR931680 25559 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 546/62 (serotype 21). +ACCESSION CR931680 +VERSION CR931680.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 25559) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 25559) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..25559 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="546/62" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC21_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC21_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI33732.1" + /db_xref="UniProtKB/TrEMBL:Q4JZI8" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVELL" + gene 293..463 + /gene="aliB" + /locus_tag="SPC21_0002" + /pseudo + CDS 293..463 + /gene="aliB" + /locus_tag="SPC21_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(order(462..995,997..1323)) + /gene="tnp" + /locus_tag="SPC21_0003" + /pseudo + CDS complement(join(462..995,997..1323)) + /gene="tnp" + /locus_tag="SPC21_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(join(933..995,997..1305)) + /gene="tnp" + /locus_tag="SPC21_0003" + /note="HMMPfam hit to PF01710, Transposase, score 1.2e-23" + /pseudo + gene 1547..3001 + /gene="wzg" + /locus_tag="SPC21_0004" + CDS 1547..3001 + /gene="wzg" + /locus_tag="SPC21_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33735.1" + /db_xref="GOA:Q4K0S0" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K0S0" + /translation="MLIMSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNI + LAFRYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILASSVSLFAVQQFVGL + TNRLNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNT + DLTVNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKV + EAPKTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPI + ADGGNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGVDVH + NDQEFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKL + 
TSTEALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDL + PSYAMPDSNLYVLEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1547..1672 + /gene="wzg" + /locus_tag="SPC21_0004" + /note="Signal peptide predicted for SPC1079 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 42 and 43" + misc_feature 1760..2107 + /gene="wzg" + /locus_tag="SPC21_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 1.5e-63" + misc_feature 2285..2728 + /gene="wzg" + /locus_tag="SPC21_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 8.4e-70" + gene 3003..3734 + /gene="wzh" + /locus_tag="SPC21_0005" + CDS 3003..3734 + /gene="wzh" + /locus_tag="SPC21_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33736.1" + /db_xref="GOA:Q4K0R9" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K0R9" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLIIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDKGCYT + QVNSSHILKSKLFGERYKFMKKRAQYFLEQDLVHVIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 3006..3614 + /gene="wzh" + /locus_tag="SPC21_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 4.3e-37" + gene 3740..4435 + /gene="wzd" + /locus_tag="SPC21_0006" + CDS 3740..4435 + /gene="wzd" + /locus_tag="SPC21_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33737.1" + /db_xref="GOA:Q4K0R8" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K0R8" + /translation="MMKEQNTIEIDVFQLLKTLWKRRLMILLVALVTGAGAFAYSTFV + VKPEYTSTTRIYVVNRNQEDKPGLTNQDLQAGTYLVKDYREIILSHDVLEKVATNLKL + 
DMPARALASKVQVTVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFSFLGGAVVTVIAVLLIELLDTRVKRPEDVEDVLRI + PLLGLVPDLDKMK" + misc_feature 3740..3856 + /gene="wzd" + /locus_tag="SPC21_0006" + /note="Signal peptide predicted for SPC1081 by SignalP 2.0 + HMM (Signal peptide probability 0.725) with cleavage site + probability 0.447 between residues 39 and 40" + misc_feature 3761..4177 + /gene="wzd" + /locus_tag="SPC21_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 9.7e-55" + gene 4445..5134 + /gene="wze" + /locus_tag="SPC21_0007" + CDS 4445..5134 + /gene="wze" + /locus_tag="SPC21_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33738.1" + /db_xref="GOA:Q4K0R7" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K0R7" + /translation="MPTLEISQAKLDFVKKAEEYYNALCTNLQLSGDNLKVFSITSVK + LGEGKSTTSTNIAWAFARAGYKTLLIDGDIRNSVMSGVFKARDKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRKCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGVVLNKFDTSVDKYGSY + GNYGDYGKNKK" + gene 5150..6517 + /gene="wchA" + /locus_tag="SPC21_0008" + CDS 5150..6517 + /gene="wchA" + /locus_tag="SPC21_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI33739.1" + /db_xref="GOA:Q4K0R6" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K0R6" + /translation="MNGKIVKSSLVIIQSFLVILLTYLLSAVREAEIVSTTAIALYIL + HYFVFYISDYGQAFFKRGYLIELVQTLKYILFFALAIGISNFFLEDRFSISRRGMIYF + LTLHALLVYVLNLFIKWYWKRAYPNFKGSKKILLLTATSRVEKVLDRLIESNEVVGEL + VAVSVLDKPDFQHDCLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + IDATVNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHVIAKRIIDIVGALVGLIL + CGLVSVVLVPLIRKDGGSAIFAQTRIGKNGRYFTFYKFRSMCVDAEAKKRELMEQNTM + 
QGGMFKVDDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVFM + RDGAK" + misc_feature 5150..5242 + /gene="wchA" + /locus_tag="SPC21_0008" + /note="Signal peptide predicted for SPC1083 by SignalP 2.0 + HMM (Signal peptide probability 0.894) with cleavage site + probability 0.356 between residues 31 and 32" + misc_feature 5933..6514 + /gene="wchA" + /locus_tag="SPC21_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 6.1e-159" + gene 6504..7721 + /gene="wchF" + /locus_tag="SPC21_0009" + CDS 6504..7721 + /gene="wchF" + /locus_tag="SPC21_0009" + /note="member of homology group 15" + /codon_start=1 + /transl_table=11 + /product="putative rhamnosyl transferase WchF" + /protein_id="CAI33740.1" + /db_xref="GOA:Q4K0R5" + /db_xref="InterPro:IPR001296" + /db_xref="InterPro:IPR015393" + /db_xref="UniProtKB/TrEMBL:Q4K0R5" + /translation="MERNSLLLFQTTRRKMKKSVYIIGSKGIPAKYGGFETFVEKLTE + YQKDGNIQYYVTCMRENSAKSGFTADTFEYNGAICYNIDVPNIGPARAIAYDIAAVNK + AIELAKENKDEAPIFYILACRIGPFISGLKKKIRSIGGRLLVNPDGHEWLRAKWSLPV + RKYWKFSEQLMVKHADLLVCDSKNIEKYIREDYKQYQPKTTYIAYGTDTTPSSLKSED + AKVRNWYREKGVSENGYYLVVGRFVPENNYETMIREFIKSKSNKDFVLITNVEQNKFY + DQLLKETGFDKDLRVKFVGTVYDQELLKYIRENAFAYFHGHEVGGTNPSLLEALASTK + LNLLLDVGFNREVGEDGAIYWKKDELAHVIEEVERFDEGDISELDEKSSQRIADAFTW + EKIVSDYEEVFKG" + misc_feature 7167..7658 + /gene="wchF" + /locus_tag="SPC21_0009" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 0.0022" + gene 7725..8882 + /gene="wcwA" + /locus_tag="SPC21_0010" + CDS 7725..8882 + /gene="wcwA" + /locus_tag="SPC21_0010" + /note="member of homology group 63" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33741.1" + /db_xref="GOA:Q4K0R4" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K0R4" + /translation="MKRILYLHAGAEMYGADKVLLELIKGLDSKEFETHVILPNDGVL + VEALRQVGAQVSVLDYPILRRKYFNPKGIFEYLKSYHRYSQKIAQYVRENGIVLVHNN + 
TTAVLEGIYLKRKVKLPLIWHVHEIIVKPKAISDFINFLMGRYANKIVTVSQAVASHV + NQSPFIKEGQVQVIYNGVDNAVYHPMPASTVREQFSIPEEALVIGMVGRVNAWKGQGD + FLEAVTPILEQNPNAIAFLAGSAFAGEEWRVEELESKIAKSSVVSQIKRIDYYEHTTE + LYNMFDIFVLPSTNPDPLPTVVLEAMACGKPVVGYRHGGVCEMVDEGTNGLLATPNQP + AELSKVIQELVENPEKRNQFGQASVERQRELFSLDSYIKNFSELYKTDRKD" + misc_feature 8286..8807 + /gene="wcwA" + /locus_tag="SPC21_0010" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 3.7e-31" + gene 8885..9883 + /gene="wcwK" + /locus_tag="SPC21_0011" + CDS 8885..9883 + /gene="wcwK" + /locus_tag="SPC21_0011" + /note="member of homology group 64" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33742.1" + /db_xref="GOA:Q4K0R3" + /db_xref="UniProtKB/Swiss-Prot:Q4K0R3" + /translation="MNKIDFVVTWVDGNDPVWKEKKSRYDGSVSTSKQSMNSVKAYRE + WGTFKYWFRGVERFAPWVNKVYLVTDQQRPSWLDINSEKLVLVDHTEIICNDCLPVFS + ANPIESNIHRIPGLSEHFVFFNDDMYLTAPVEPTDFFSEDGLPKYNTALSPIIPERYG + TGNFQINDMEIVTSYFSRNEILKNGQFFDPKQGLKSIVKSLLYRNSQFICGFWESHLP + YPLLKSTMDLIWEKEKAVLGRTSASRFRNPSDTNVWLFKYWQIASGQYAVGNPKLGRL + FSLDNAGPDFWNLLNSGKYKIMCINDVYDIKDEEKVMQEFIAAMKNLLPDKSTFEL" + gene 9899..10876 + /gene="wcyT" + /locus_tag="SPC21_0012" + CDS 9899..10876 + /gene="wcyT" + /locus_tag="SPC21_0012" + /note="member of homology group 194" + /codon_start=1 + /transl_table=11 + /product="glycosyl transferase" + /protein_id="CAI33743.1" + /db_xref="GOA:Q4K0R2" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K0R2" + /translation="MPSVCALVVTYNRSKYLQKALEGILNQQQEISGILIYNNNATDN + TEEILMKFGYVDSKGDKIKENYLYSTEKDGKHFYYYHNDENLGGAGGFANGIRLISEL + DYDYVWIMDDDVYPEPNCLSEIMKQMSVQNVQVGIPNRTDENFDDRAIIGFDFDDYHK + FWTEMRKTVTYGPFDEEAIKVVDMPFEGPVVEMALLRKVGIPDSGFFIEYDDSDFAQR + LQQYSDIIFATKAQLHRQLAVKVDPSEVKKVEPYNWRNYYKIRNNIIFDKRYGKNWKV + RQLSPLILIAHHIVIAIRHQHLKHNLPIIWKGFWDGVFQRMGKRVDPNY" + misc_feature 9911..10498 + /gene="wcyT" + /locus_tag="SPC21_0012" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 9.5e-22" + gene 
10889..11917 + /gene="wcyU" + /locus_tag="SPC21_0013" + CDS 10889..11917 + /gene="wcyU" + /locus_tag="SPC21_0013" + /note="member of homology group 195" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33744.1" + /db_xref="GOA:Q4K0R1" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K0R1" + /translation="MSDLLLSFIMPTYNSAEYLADTMDSLVASIGDYNHLVEIICVDD + GSWDNTVTILEGYKSIYDNLIIIRNEHGGVSQARNTALDIVSGKYISFVDSDDLYEKD + FLNTFISLDKNFDFLFTDVGGLKDEISFQEINEKEKLKIFKNNFNLGEYTIHPGIAGK + FFRTSLINDIQLRFNTQLSFAEDILFNFTLLTASRHVILSPVNFYHVNGTHSLMYYNE + KNLKGQIVFVDRIRQILKGYSESSEIVLIENFIILKAMTVYIDRYFGPLWLNGTYSLN + EASKLMKSTIEDNDFSKAFNSNRLDYSIGNRYVVFRKLLRFRQYKLCLLYNRIMDKIK + GYERFRKQ" + misc_feature 10907..11401 + /gene="wcyU" + /locus_tag="SPC21_0013" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 1.5e-29" + gene 11914..13134 + /gene="wzy" + /locus_tag="SPC21_0014" + CDS 11914..13134 + /gene="wzy" + /locus_tag="SPC21_0014" + /note="member of homology group 240" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33745.1" + /db_xref="UniProtKB/TrEMBL:Q4K0R0" + /translation="MIKLSIHDIYRYFLYLIFFMNLLFFNIVSDLTYTIQNFSVYLTF + LLMGMYLLQRRISKLTIFTSITVLLFFLLIMFNLYRQGLPVNGFLSFNSKIYLLRNFS + FILLVFPISEILKPKYSLNFLKVVFVFGILAILFRTFIWMSYNYAGLNIAPGIIEERG + VNWTRYGAVRLQALFLDGYVLAYLLCKLLISDSKNKVSYSLLLLITLFYEGVIYASRS + QLIGFSIMFIAIYLLKNKNLLNKLLSFLSLSLASFAILLSPYYEKFIDSFSVSNSDYG + AGTMVRIVGRRYYQEIWNQNKLLGFGPISDGNIFAGWKYYLSDLGIIRMLYQFGIIGF + IICLLPILYGCLVGFKNRLHFKGMLLFCLSLFVLVTSFASQNLYDYNRIMLLPLLLGL + ANAVSSTQADKDMV" + gene 13131..14555 + /gene="wzx" + /locus_tag="SPC21_0015" + CDS 13131..14555 + /gene="wzx" + /locus_tag="SPC21_0015" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33746.1" + /db_xref="GOA:Q4K0Q9" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K0Q9" + 
/translation="MKVLKNYAYNLSYQLLLIILPVITTPYITRVFSSDDLGTYGYFN + SIVTYFILLATLGVANYGTKEISGHRKEIRRNFWGIYTLQLGATILSGTLYAILCLSL + PSMQDSVAYILGFSLLSKGLDISWLFQGLEDFRKIIVRNITVKLVGVISIFLFVKSAK + DLYLYVFLLTIFELLGQLSMWVPAREFIGKPHIDINHAKKHLKPVILLFLPQIAISLY + VTLDRTMLGALASKTDVGIYDQALKLVNILLTLVTSLGSVMLPRVSSLLSQSDYKSVK + KMYQMSFLIYNSVIFPIIAGMLIVNDDFVQFFLGRDFQDARYAIAIMMFRMFFIGWTN + IMGIQILIPHNKNKEFMISTTVPAIVSVGLNLIFLPNLGFIGAAIVSVLTEALVWGIQ + LHFTWSYLKEVPIIGSMIKIVIASGIMYAFLVSMKSVVHVSPAINVALYALLGGVIYV + ALILLFKVVNLKELKQELLKNREI" + misc_feature 13137..13931 + /gene="wzx" + /locus_tag="SPC21_0015" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 1.9e-68" + gene 14557..15657 + /gene="glf" + /locus_tag="SPC21_0016" + CDS 14557..15657 + /gene="glf" + /locus_tag="SPC21_0016" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI33747.1" + /db_xref="GOA:Q4K0Q8" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR006076" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K0Q8" + /translation="MYDYLIVGAGLSGAIFAHEATKRGKKVKVIDKRDHIGGNIYCEN + VEGINVHKYGAHIFHTSNKKVWDYVNQFAEFNNYINSPVANYKGSLYNLPFNMNTFYA + MWGTKTPQEVKDKIAEQTADTKDVEPKNLEEQAIKLIGPDIYEKLIKGYTEKQWGRSA + TELPPFIIKRLPVRLTFDNNYFNDRYQGIPIGGYNVIIENMLKDVEVELGVDFFAHRE + ELEVSAEKVVFTGMIDQYFDYKHGELEYRSLRFEHEILDEENYQGNAVVNYTEREIPY + TRIIEHKHFEYGTQPKTVITREYPADWKRGDEPYYPINDEKNNAMFAKYQEEASKNDK + VIFCGRLADYKYYDMHVVIERALSVVEEEFSN" + misc_feature 14992..15594 + /gene="glf" + /locus_tag="SPC21_0016" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 1.2e-138" + gene 15685..16554 + /gene="rmlA" + /locus_tag="SPC21_0017" + CDS 15685..16554 + /gene="rmlA" + /locus_tag="SPC21_0017" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI33748.1" 
+ /db_xref="GOA:Q4K0Q7" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q4K0Q7" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIKDILIISTPQDLPRFKDLLLDGSEFGIKLSYAEQPSPDGLAQAFIIGEKFIGDDSV + ALILGDNIYHGPGLSKMLQKAAQKEKGATVFGYQVKDPERFGVVEFDTDMNAISIEEK + PKDPRSNYAVTGLYFYDNDVVEIAKGIKPSARGELEITDINKAYLDRGDLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLELAQPLKKN + EYGRYLLRLIGEV" + misc_feature 15688..16404 + /gene="rmlA" + /locus_tag="SPC21_0017" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 2.7e-118" + gene 16555..17151 + /gene="rmlC" + /locus_tag="SPC21_0018" + CDS 16555..17151 + /gene="rmlC" + /locus_tag="SPC21_0018" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI33749.1" + /db_xref="GOA:Q4K0Q6" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:Q4K0Q6" + /translation="MTDNFFGKTLAVRKIDAISGMLEFDIPVHGDNRGWFKENFQKEK + MVPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADNGKVLGTWVDLREG + ETFGNIYQTEIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYS + DPELGIEWENLEEAEVSEADKHHPLLKDVKPLKKEDLE" + misc_feature 16588..17121 + /gene="rmlC" + /locus_tag="SPC21_0018" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 4.4e-16" + gene 17161..18210 + /gene="rmlB" + /locus_tag="SPC21_0019" + CDS 17161..18210 + /gene="rmlB" + /locus_tag="SPC21_0019" + /EC_number="4.2.1.46" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI33750.1" + /db_xref="GOA:Q4K0Q5" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K0Q5" + /translation="MTKYKNIIVTGGAGFIGSNFVHYVYNNFPDVYVTVLDKLTYAGN + 
RANIEEILGDRVELVVGDIADAALVDKLAAEADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDLRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQTAD + AYDHVTDRAGHDLRYAIDASKLCDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 17176..18132 + /gene="rmlB" + /locus_tag="SPC21_0019" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.00028" + misc_feature 17179..17919 + /gene="rmlB" + /locus_tag="SPC21_0019" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 3.1e-76" + misc_feature 17182..17994 + /gene="rmlB" + /locus_tag="SPC21_0019" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/iso, score 4.1e-05" + gene 18276..19127 + /gene="rmlD" + /locus_tag="SPC21_0020" + CDS 18276..19127 + /gene="rmlD" + /locus_tag="SPC21_0020" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI33751.1" + /db_xref="GOA:Q4K0Q4" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K0Q4" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITDAEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATKDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 18276..19124 + /gene="rmlD" + /locus_tag="SPC21_0020" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 1.3e-147" + misc_feature 18279..18920 + /gene="rmlD" + /locus_tag="SPC21_0020" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.0001" + misc_feature 18279..18908 + /gene="rmlD" + /locus_tag="SPC21_0020" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 5.6e-19" + 
misc_feature 18282..19010 + /gene="rmlD" + /locus_tag="SPC21_0020" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 2.4e-08" + gene 19477..20139 + /gene="glf" + /locus_tag="SPC21_0021" + CDS 19477..20139 + /gene="glf" + /locus_tag="SPC21_0021" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI33752.1" + /db_xref="GOA:Q4K0Q3" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K0Q3" + /translation="MNTFNKLWGVVTPAGAQAKIEEQRAILNGKTPENLEEQEISLVG + TDIYEKLIKDYTEKQWGKPTTELPSFIIRRLPVHLTYDNNYFNDTYQGIPIGDYNVII + ENMLKDVEVELGVNFFANRQELEASAEKVVFTGMIDQYFDYKHGELEYRSLRFDHEVL + DEENYQGNAVVNYTEREIPYTRIIEHKHFEYGTQEKTVITREYPADFFLHNRKHYKRN + SK" + misc_feature 19624..20136 + /gene="glf" + /locus_tag="SPC21_0021" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 2.7e-76" + gene 20136..21209 + /gene="wcyO" + /locus_tag="SPC21_0022" + CDS 20136..21209 + /gene="wcyO" + /locus_tag="SPC21_0022" + /note="member of homology group 80" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI33753.1" + /db_xref="GOA:Q4K0Q2" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q4K0Q2" + /translation="MTRISMKKIKEYEILKVIAIILVVVGHSTYYNIYTGYGGIDYQQ + YINNHLSLAVYKLLSKLTEIIYYFHMPLFMAISGAFFSIQVKNNRWHGIGSLLTNKFR + RLMIPFLVFTLVYTIPIKYISNYFDGISFWKAVSGQLFLFGNSHLWYLYALFIVFIVG + FYILKKRTLFYVYLLLYILHILSYSVHLTLVSAPLQYLFWFSMGFLFEFKREQYNHYL + KNNKWLSFLLVLLFIACVALKFVLKDNHEVLNRIIMDLAAVLGSLICYNISYYLSDKR + ELTENRLFNVILINGLGIYIFSDTLNYLILNISYSISNRFMFTSFGILALFLIRIFFT + LFIGLGLTLLFKKIFKKHSWLVN" + misc_feature 20160..21167 + /gene="wcyO" + /locus_tag="SPC21_0022" + /note="HMMPfam hit to PF01757, Acyltransferase family, + score 1.2e-05" + gene complement(order(21403..21984,22038..22706)) + /gene="tnp" + /locus_tag="SPC21_0023" + /pseudo + CDS 
complement(join(21403..21984,22038..22706)) + /gene="tnp" + /locus_tag="SPC21_0023" + /note="member of homology group 13" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1167 transposase" + misc_feature complement(join(21904..21984,22038..22250)) + /gene="tnp" + /locus_tag="SPC21_0023" + /note="HMMPfam hit to PF01610, Transposase, score 1.8e-40" + /pseudo + gene complement(22824..23333) + /gene="tnp" + /locus_tag="SPC21_0024" + /pseudo + CDS complement(22824..23333) + /gene="tnp" + /locus_tag="SPC21_0024" + /note="member of homology group 12" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1670 transposase (fragment)" + misc_feature complement(22830..23333) + /gene="tnp" + /locus_tag="SPC21_0024" + /note="HMMPfam hit to PF03050, Transposase IS66 family, + score 4.7e-06" + /pseudo + gene complement(23500..23691) + /gene="tnp" + /locus_tag="SPC21_0025" + /pseudo + CDS complement(23500..23691) + /gene="tnp" + /locus_tag="SPC21_0025" + /note="Lone member of homology group 0242" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative ISPSy5-like transposase (fragment)" + gene complement(23864..24461) + /gene="tnp" + /locus_tag="SPC21_0026" + /pseudo + CDS complement(join(23864..24211,24195..24461)) + /gene="tnp" + /locus_tag="SPC21_0026" + /note="member of homology group 31" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1671 transposase" + misc_feature complement(23870..24193) + /gene="tnp" + /locus_tag="SPC21_0026" + /note="HMMPfam hit to PF05717, IS66 Orf2 like protein, + score 3.7e-53" + /pseudo + gene order(24528..24833,24862..25251) + /gene="tnp" + /locus_tag="SPC21_0027" + CDS join(24528..24833,24862..25251) + /gene="tnp" + /locus_tag="SPC21_0027" + /note="member of homology group 19; + member of homology group 19" + /codon_start=1 + /transl_table=11 + /product="putative IS1381 transposase" + /protein_id="CAI33758.1" + /db_xref="GOA:Q4K0Q1" + /db_xref="InterPro:IPR002559" + 
/db_xref="UniProtKB/TrEMBL:Q4K0Q1" + /translation="MLAVLKTAYQLKHAKGGRKPKLSLEDLLMATLQYVREYRTYEEI + AADFGIHESNLLRRSQWVEVTLVQSGVTISRTPLSSEDTVMIDATEVKINRPKKRISE + MKAQAIVTSQGRIVSLDIAVNYCHDMKLFKMSRRNIGQAGKILADSGYQGLMKIYSQA + QTPRKSSKLKPLTVEDKTYNHALSKERSKVENIFAKVKTFKMISTTYRNHRKRFGLRM + NLIAGIINHELGF" + misc_feature 24642..24707 + /gene="tnp" + /locus_tag="SPC21_0027" + /note="Predicted helix-turn-helix motif with score + 1106.000, SD 2.95 at aa 39-60, sequence + RTYEEIAADFGIHESNLLRRSQ" + misc_feature join(24774..24833,24862..25242) + /gene="tnp" + /locus_tag="SPC21_0027" + /note="HMMPfam hit to PF01609, Transposase DDE domain, + score 4.2e-14" + gene 25512..>25559 + /gene="aliA" + /locus_tag="SPC21_0028" + CDS 25512..>25559 + /gene="aliA" + /locus_tag="SPC21_0028" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33759.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ89" + /translation="MMKSSKLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcgta taaaaacaag + 181 ggaggactgt ataaaagaca gaaatccttt gttttttata accaaggttt ataaactttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga aaatgaacat + 301 aaagaagcgt gtccttagtg caggcctgac ttttgcatct gctttgcttt tagctgcttg + 361 cggccaatca ggttcagata caaaaactta ctcatcaacc tttggtggaa atccaactac + 421 atttaactat ctattagact attacgctga taacatagtc aattgaaaca agaacaggac + 481 aaaagagcct cgtaaaaggt attgcaactg ggtaatacct ttttgaggtg ctttttgata + 541 tgagcccatg ttttctcaat aggattgtac tcaggtgagt agggaggaag aggtaaaagt + 601 ttacgcccaa actcctcgca taaaagttct aacttaccca ttctatggaa tcttacatta + 661 tccataataa taaccgatgg tgtgtttaat gttggtaaga gaaaattctg aaaccaagct + 721 tcaaaaaagt cgctcgtcat cgtctcttcg taagtcattg gagcgattaa ttcaccattt + 781 gttagacctg caaccaaaga aatcctctga tatcttcttc cagatacttt gcctcttctt + 841 aactgacctt ttaatgagcg accatattct cgataaaaat aagtatcgaa tcctgtttcg + 901 
tcaatctaaa caggtactag gtgctttaaa ctattaaaat tcttaagaaa taaggctact + 961 ttttctgggt cttgttcata gtaggtgtgg ttcttttttt cgagtgtagc ccatagcttt + 1021 gagcgcatag tggatggtag ttggatgaca gccaaattca gaagctattt cagtcaaata + 1081 agcgtctgga ttgtcagtaa gatagttttt aagtctatct ctatcaactt ttcttggttt + 1141 tgttcctttt acttggtggc ttagctctcc tgttttctct tttagcttta accagccata + 1201 aatagtatta cgtgagattt ggaaaacgtg tgatgcttct gttatactac ctgttcgctc + 1261 acaataagag agaacttttt tacgaaaatc tattgaatat gccataaaaa gattatgcca + 1321 cattgtgtac tatagtagat tgaaactaga atagtacacc tctgcttcta aaacattgtt + 1381 agaaatcgat ttgactgtcc tgatcgattt gtcctgttct tatttcattt tactatattt + 1441 ttgtttcgcg ggaagtctac taagatattt aaagatgcag atagtaaaaa aagatgtaga + 1501 cattaccgta aaaaagtgat ataatcgtat gatgttcaat gtataggtgt taatcatgag + 1561 tagacgtttt aaaaaatcac gttcacagaa agtgaagcga agtgttaata tcgttttgct + 1621 gactatttat ttattgttag tttgtttttt attgttctta atctttaagt acaatatcct + 1681 tgcttttaga tatcttaatc tagtggtaac tgcgttagtc ctactagttg ccttggtagg + 1741 gctactcttg attatctata aaaaagctga aaagtttact atttttctgt tggtgttctc + 1801 tatccttgcc agctctgtgt cgctctttgc agtacagcag tttgttggac tgaccaatcg + 1861 tttaaatgcg acttcgaatt actcagaata ttcaatcagt gtcgctgttt tagcagatag + 1921 tgagatcgaa aatgttacgc aactgacgag tgtgacagca ccgactggga ctgataacga + 1981 aaatattcaa aaactactag ctgatatcaa gtcaagtcag aataccgatt tgacggtcaa + 2041 ccagagttcg tcttacttgg cagcttacaa gagtttgatt gcaggggaga ctaaggccat + 2101 tgtcctaaat agtgtctttg aaaatatcat cgagtcagag tatccagact acgcatcgaa + 2161 gataaagaag atttatacca agggattcac taaaaaagta gaagctccta agacgtctaa + 2221 gaatcagtct ttcaatatct atgttagtgg aattgacacc tatggtccta ttagttcggt + 2281 gtcgcgatca gatgtcaata tcctgatgac tgtcaatcga gataccaaga aaatcctctt + 2341 gaccacaacg ccacgtgatg cctatgtacc aatcgcagat ggtggaaata atcaaaaaga + 2401 taaattaact catgcgggca tttatggagt tgattcgtcc attcataccc tagagaacct + 2461 ttatggtgta gatattaatt attatgttcg tttgaatttt acctcatttt tgaaattgat + 2521 tgacttattg ggaggggtag 
atgttcataa tgatcaagag ttttcagctc tacatgggaa + 2581 gttccatttc ccagtaggga atgtccatct agactctgag caggctctag gttttgtacg + 2641 tgaacgctac tcactagccg atggagaccg tgaccgtggt cgcaaccaac aaaaggtgat + 2701 tgtggctatc cttcaaaaat taacgtcaac cgaagcactg aaaaattata gtacgatcat + 2761 taatagcttg caagattcta tccaaacaaa tatgccactt gagactatga taaatttggt + 2821 caatgctcag ttagaaagtg gagggaatta taaagtaaat tctcaagatt taaaaggtac + 2881 aggtcggacg gatcttcctt cttatgcaat gccagacagt aacctctatg tgctggaaat + 2941 agatgatagt agtttagctg tagttaaagc agctatacag gatgtgatgg agggtagatg + 3001 aaatgataga catccattcg catatcgttt ttgatgtaga tgacggtccc aaatcaagag + 3061 aggaaagcaa ggctctcttg gcagaatcct acagacaggg ggtgcgaacc attgtctcta + 3121 cctctcaccg tcgtaagggc atgtttgaaa ctccggaaga gaagatagca gaaaactttc + 3181 ttcaggttcg ggaaatagct aaggaagtgg cgagtgactt gatcattgct tacggggctg + 3241 aaatttacta cacaccagat gttctggata agctggaaaa aaagcggatt ccgaccctca + 3301 atgatagtcg ttatgccttg atagagttta gtatgaacac tccttatcgc gatattcata + 3361 gcgctttgag caagatcttg atgttgggaa ttactccagt cattgcccac attgagcgct + 3421 atgatgctct tgaaaataat gaaaaacgcg ttcgagaact gatcgataag ggctgttaca + 3481 cgcaagtaaa tagttcacat atcctcaaat ctaaactttt tggcgaacgt tataaattca + 3541 tgaaaaaaag agctcagtat tttttagagc aggatttggt ccatgtcatt gcaagtgata + 3601 tgcacaatct agatggtaga cctcctcata tggcagaagc atatgacctt gttacccaaa + 3661 aatacggaga agcgaaggct caggaacttt ttatagacaa tcctcgaaaa attgtaatgg + 3721 atcaactaat ttaggagaaa tgatgaaaga acaaaacacg atagaaatcg atgtatttca + 3781 attattaaaa accttgtgga aacgcaggct aatgatttta ttagtggcac ttgtgacagg + 3841 tgcgggggct tttgcatata gcacttttgt tgttaagcca gaatatacga gtaccacgcg + 3901 aatttacgta gtgaatcgca atcaagaaga caagccgggg ctgacaaatc aggatttgca + 3961 ggcaggaact tacctggtaa aagactaccg tgagattatc ctttcgcatg atgtattgga + 4021 aaaagtagcg acaaatttga agttggatat gccagcaaga gcgttagcca gcaaagttca + 4081 agtgactgta ccagctgaca ctcgtatcgt ctcaatctct gtcaaggata aacagccaga + 4141 ggaagccagt cgcatcgcta attctctacg agaagttgct 
gcagaaaaga tcgtcgctgt + 4201 aacgcgagta tctgatgtaa cgacacttga agaagcgcga ccagctacga ctccctcttc + 4261 tccaaatgtt cgacgcaatt ccttgtttag ttttcttgga ggagcagtcg taacagtaat + 4321 tgctgttctt ttgattgagt tgctcgacac tcgtgtgaaa cgtcctgaag atgtcgaaga + 4381 tgtactgcga attccacttt tagggctcgt tccagatttg gacaaaatga aataggagga + 4441 agttatgcca acgttagaaa tctcacaggc aaaattggat tttgtaaaaa aggcagagga + 4501 atattataat gctttgtgca cgaacctaca gttaagtgga gataatttaa aagtattttc + 4561 tatcacttct gtgaaactag gagaaggaaa atcaacgact tccaccaata tcgcttgggc + 4621 ttttgcgcgt gcaggttaca aaacgctgct gattgatgga gatattcgca attctgttat + 4681 gtcaggtgtc tttaaagcaa gggataagat tacaggcctg acagaatttt tatcaggaac + 4741 tacagaccta tcacaagggc tttgtgatac caatatcgaa aatctctttg taattcaggc + 4801 tggttctgtg tcaccgaatc cgacagctct tcttcaaagt aagaatttca gtacaatgct + 4861 tgaaaccttg cgtaaatatt ttgactacat cattgtagat actgctcctg tcggtgtcgt + 4921 gattgatgca gctattatta cgcgaaaatg cgatgcttct attttagtga cggaggcagg + 4981 tgaaataaat cgacgggata ttcaaaaagc aaaagaacag ttggaacaca cagggaagcc + 5041 gtttttggga gttgtgttga ataaattcga tacttcagta gacaaatatg gttcttatgg + 5101 aaattatgga gattacggga aaaataaaaa ataggtcggg gggatagaga tgaatggaaa + 5161 aatagtaaag tcttcattgg tcataatcca gagttttctt gttattttat tgacttatct + 5221 acttagtgct gtgagagaag cggagattgt ttcaacaaca gctattgcac tttatatcct + 5281 ccattatttt gtcttttata tcagtgatta tggacaggct ttctttaaaa ggggatattt + 5341 gattgaactt gtccagacat tgaaatatat cctattcttt gcactagcga ttggtatttc + 5401 taattttttc ttagaggatc gatttagtat ttccagacga ggcatgattt acttcctcac + 5461 attacatgct ctcttagtct atgtgctaaa cctatttatc aagtggtatt ggaagcgggc + 5521 ttatcccaac tttaaaggaa gtaagaagat tctcctactt acagcaactt ctcgtgtcga + 5581 aaaggtactg gatagattaa tagaatcaaa tgaggttgtt ggggagttgg tagccgtcag + 5641 tgtcttagat aaaccagatt ttcagcatga ttgtttaaag gtagtagcag agggggagat + 5701 agtaaacttt gcgactcatg aggtggtcga tgaagtcttt atcaatcttc caagtgaaaa + 5761 atacaatatt ggagagcttg tctctcagtt tgaaacgatg ggaattgatg caacagttaa + 5821 
tctaaatgcc tttgatcgta gtttggcacg taacaagcaa attcgtgaga tggcaggatt + 5881 aaacgttgtg actttttcta caacatttta taagactagt catgtaattg ctaagcggat + 5941 tattgatatc gtgggtgcat tggtagggct gatactatgt ggtctagtca gtgttgtact + 6001 ggttcctttg attcgaaagg atgggggctc tgctattttt gctcagacgc gtattggaaa + 6061 aaatggtcgc tacttcactt tttacaagtt ccgctccatg tgtgtagatg ccgaggcgaa + 6121 aaaaagagaa ctcatggaac aaaataccat gcagggtgga atgtttaagg tggacgatga + 6181 tccgcgtatc acgaaaattg gtcgttttat aaggaagact agcttggacg agttgccaca + 6241 gttttataat gttttaaagg gagatatgag tttggttggc acacggccac caacagtgga + 6301 cgaatatgag cactataccc cagaacaaaa acgtcgtcta agttttaaac ctggtataac + 6361 aggcttatgg caggtcagtg gacgaagtga aatcaaaaat ttcgatgaag ttgtcaaatt + 6421 agatgtggct tatatagatg attggacaat ttggaaagac attgaaattt tattgaagac + 6481 agttaaagta gtatttatga gagatggagc gaaatagttt acttttgttt cagactacta + 6541 ggagaaaaat gaagaagtca gtttatatca taggttcaaa gggaattcct gccaagtatg + 6601 gaggatttga aacctttgtt gagaaattaa cagaatatca aaaagatggt aacatccaat + 6661 actatgttac ctgcatgcgc gaaaattcgg caaagtcagg atttacagca gatacatttg + 6721 agtacaacgg tgctatttgt tacaacattg atgtgcctaa tattggtcct gctagagcca + 6781 ttgcctacga cattgcagcg gtcaataagg ctattgaatt ggctaaagaa aacaaggacg + 6841 aggctcccat tttttacatt ttagcttgtc gtatcgggcc ttttatttct ggacttaaga + 6901 aaaaaattcg ttcgatcgga ggccgtttgc tggtaaatcc agatggtcat gagtggcttc + 6961 gagctaaatg gagcttgcca gttcggaagt attggaaatt ttcggaacag ttgatggtta + 7021 aacatgcaga tttattagtc tgcgatagca aaaatatcga aaaatatatt cgagaggact + 7081 ataaacagta tcagcccaag acgacctata tcgcttatgg tacagatact accccttcaa + 7141 gtctgaaatc agaagatgcc aaagttcgaa actggtatcg tgaaaaggga gtaagcgaaa + 7201 atggctatta tctagtggtg ggacgattcg ttcccgaaaa caactatgaa accatgattc + 7261 gtgaatttat caagtctaag tccaataagg actttgtcct tattacaaat gtggaacaga + 7321 ataaatttta cgatcagttg ctcaaggaaa caggtttcga caaggatcta agagtcaaat + 7381 ttgtgggaac agtctatgac caagaattgc tcaagtatat ccgtgaaaat gctttcgcct + 7441 atttccatgg acatgaagtt 
gggggtacca atccatcgct tcttgaagct ttagcatcca + 7501 ctaaactcaa cttgttgttg gatgtcggct ttaaccgtga agttggtgaa gacggagcca + 7561 tttattggaa aaaagatgag ctagcgcatg taatcgaaga agtggaacga tttgatgaag + 7621 gtgatatttc ggaattagac gaaaagtcta gccaacgaat tgcggatgca tttacgtggg + 7681 aaaagattgt gtcagattat gaagaagtgt ttaaaggata aggaatgaaa cggattttat + 7741 acttgcatgc tggtgcagaa atgtatggag cagataaggt tttattggag ttgatcaaag + 7801 gattggattc caaagaattt gagacgcacg ttatcttgcc aaatgacggt gttttagtcg + 7861 aggctttgcg ccaggttgga gctcaggtca gcgtgttgga ttatccgatt ttacgtagaa + 7921 aatactttaa tcctaagggg atttttgaat atctgaaatc ctatcatcgc tactctcaaa + 7981 aaatcgctca atatgtgcgt gagaatggga tagttcttgt tcataacaat acaacagccg + 8041 ttctggaagg gatttatcta aagagaaaag taaaacttcc cttgatctgg catgttcatg + 8101 agattattgt taagcctaag gccatttcag attttatcaa cttcttgatg ggacgttatg + 8161 caaataaaat cgtaacagta tctcaagcag tggccagtca tgtcaatcag tctcccttca + 8221 tcaaagaagg gcaggtccag gttatctata atggagtgga caatgcggtc tatcatccga + 8281 tgccagcaag cacagtgcgt gaacaatttt ctatcccgga agaggctctt gtcattggta + 8341 tggttggtcg cgtcaacgct tggaaggggc aaggagattt tctagaagcg gtgacgccga + 8401 ttttggagca gaatcccaat gccatcgctt ttctggctgg aagtgccttt gctggtgaag + 8461 agtggcgagt tgaagaactc gagtctaaga ttgccaaatc aagtgtagtc tcacaaatca + 8521 aacgaattga ctattatgag catacgactg agctttataa tatgtttgat atctttgttt + 8581 taccaagtac caatcctgat cccctaccaa cagtggtact agaggcgatg gcatgcggca + 8641 aaccagtagt cggctatcgt catggtggtg tttgcgaaat ggttgatgaa gggacaaatg + 8701 gcttactggc cactccaaat cagcctgctg aactatcgaa agtcattcaa gaattggtgg + 8761 agaatccaga gaaaagaaac caatttggcc aagcatcagt agaaagacaa agagagttgt + 8821 tttctttaga tagttacatt aagaacttct cggagttgta taaaacagat agaaaagatt + 8881 agttatgaat aaaatagatt ttgttgttac ttgggttgat gggaatgacc ctgtatggaa + 8941 agaaaaaaaa tcaaggtatg atggctcggt cagtacttct aaacagagta tgaactcggt + 9001 caaagcttac cgagaatggg gaacctttaa atactggttt agaggagttg aaagatttgc + 9061 cccttgggtc aataaggtct acctcgtgac cgaccagcaa 
agaccaagct ggttagatat + 9121 aaacagtgaa aaattggtct tggtagatca tacagagatt atctgtaatg actgcctacc + 9181 agttttttct gccaatccga tcgaaagtaa tatccatcga attcctggtc tctctgagca + 9241 ctttgtcttt tttaatgacg atatgtattt gacggctcca gttgaaccga cagatttttt + 9301 ctcagaggat ggtttaccca aatataatac ggctctttct ccgattattc ctgaaagata + 9361 tggaacagga aattttcaga taaatgacat ggaaattgtc actagctatt tcagtcgaaa + 9421 tgaaattttg aagaatgggc aattctttga tccaaagcag ggattaaaaa gtattgttaa + 9481 gtcgctacta tacagaaata gtcagtttat ctgtggtttc tgggagagtc atctgcccta + 9541 tcctctacta aaatcaacga tggatttgat atgggaaaag gaaaaagctg tcttggggag + 9601 aacctcagcg agtcgcttta gaaatccgtc tgataccaat gtttggctct ttaagtattg + 9661 gcagattgct agtggtcaat acgctgtcgg aaatcctaag ttggggagac tcttttcttt + 9721 ggataatgcc ggaccagatt tttggaactt actaaattct ggcaaataca aaattatgtg + 9781 tatcaatgat gtgtatgata ttaaggatga agaaaaagta atgcaagaat ttattgctgc + 9841 aatgaaaaat cttttgcctg ataaaagtac atttgaatta taaaaaagga gtgggaatat + 9901 gccatcagtt tgtgctttag ttgtgacata taatcgttca aaatatctgc aaaaggcttt + 9961 ggaaggtatt ttgaatcaac aacaagaaat ttcgggaatt ttaatttata acaataatgc + 10021 tacagataat actgaagaaa ttcttatgaa attcggttat gttgattcaa aaggcgataa + 10081 gataaaagaa aattatcttt attcgaccga aaaagatgga aaacacttct actattacca + 10141 taatgacgaa aacctaggag gagctggagg ctttgcaaat ggaattcgat taatttcaga + 10201 gcttgattat gattatgttt ggattatgga cgatgatgtc tatccggaac ctaattgttt + 10261 atccgaaatt atgaaacaaa tgagtgtcca aaatgtacag gtaggtatcc cgaatcgtac + 10321 agatgaaaat tttgatgacc gtgccattat cggttttgat tttgatgact atcataaatt + 10381 ttggacggaa atgagaaaaa cagtaacata cggtcccttt gatgaagaag cgataaaagt + 10441 ggttgatatg ccatttgaag gaccagttgt tgaaatggca ttgcttcgta aagttggtat + 10501 tcctgatagt ggctttttta ttgagtacga tgattcggac tttgcacaac gcctacaaca + 10561 gtattcagat ataatttttg caacaaaagc acaattgcat cgtcaacttg ctgtaaaagt + 10621 ggatccaagc gaggtaaaaa aagtggaacc ttataattgg agaaattact ataaaattcg + 10681 aaataatatt attttcgata agcgatatgg aaaaaattgg aaagtacgtc 
aattgagtcc + 10741 tttaattcta attgctcacc atattgtgat tgctattcgc catcagcatt taaaacataa + 10801 cttgccaatt atttggaagg gtttttggga tggagttttt caacgaatgg ggaaacgagt + 10861 agaccccaat tattaaaagg agaaaaaaat gtctgattta ctgttgagtt tcattatgcc + 10921 gacctataac tctgcagaat acttagcaga tacaatggat agtttagtag cctctatagg + 10981 tgattataat catttagtgg aaattatttg tgttgacgat ggctcatggg ataatacagt + 11041 tactatttta gaaggataca agtctattta tgataatttg attattataa gaaatgagca + 11101 tggtggggtt agtcaggcta gaaatacagc tttagatata gtttctggga aatatatcag + 11161 ttttgttgat agtgatgatt tgtatgagaa agatttttta aatactttta tttcattgga + 11221 caagaatttt gatttccttt tcactgatgt gggtggactt aaggatgaaa ttagtttcca + 11281 agaaattaat gaaaaggaaa aattaaaaat ttttaaaaat aattttaatt taggtgagta + 11341 tacaattcat cctggaatag ctgggaaatt ttttagaaca agtttaatta atgatattca + 11401 attgagattt aacacgcaac tgtcatttgc tgaggatatt ttatttaatt ttacattgct + 11461 gacagcctca agacatgtga ttctatcccc tgtaaatttt tatcatgtca atgggactca + 11521 tagtttaatg tactacaatg aaaaaaattt aaaagggcag attgtatttg tagatagaat + 11581 acgtcaaatt ttaaaaggat actctgaatc atcggaaata gtcttaatag agaattttat + 11641 tatcttgaag gctatgactg tttatattga tcgttatttt ggaccattgt ggttgaatgg + 11701 aacttattca ttgaatgaag catcaaaatt aatgaaatct acaattgagg ataatgactt + 11761 ttcaaaagct tttaatagta atcgcttaga ttattctatt ggaaatcgtt atgttgtttt + 11821 cagaaaattg ttgaggttta gacagtacaa actatgtttg ttatacaatc gtataatgga + 11881 taaaattaag ggatatgaga ggtttaggaa acaatgatta aactttcaat tcacgatata + 11941 tatcgttatt ttctctacct catttttttt atgaacttat tattctttaa tattgtttca + 12001 gacctaacct atacaatcca aaatttttcg gtttatttga catttttatt gatgggaatg + 12061 tatttactac aaagacgaat atcaaagtta acaattttca cgtcaattac agttctatta + 12121 tttttcttat tgataatgtt caatttatat agacaaggac tacctgttaa tggctttttg + 12181 tcttttaata gtaaaatata tttgttgaga aatttcagtt ttattctact agtctttcca + 12241 atatcagaga tattaaagcc aaagtatagt ttaaattttt taaaagtagt ttttgtattt + 12301 ggaattcttg caattttatt tcgtactttt atttggatga gttataatta 
tgctggttta + 12361 aatatcgctc cgggtataat tgaagaaaga ggtgtgaatt ggacacgtta tggagcggtt + 12421 cgtctacaag cccttttttt ggatggctac gttttggcat atttgttatg taagttatta + 12481 ataagtgatt caaagaataa agtatcttat agtctacttt tgttgattac tttgttctat + 12541 gagggagtga tttatgcttc taggtcacaa cttattggtt tcagtataat gtttattgca + 12601 atttatttat taaaaaataa gaacttacta aataaattac tcagtttttt atcactcagt + 12661 ttagcttctt ttgcaattct actgagtcca tattatgaaa aatttattga tagtttctct + 12721 gtatcaaata gcgattatgg tgcaggtacg atggttcgta ttgttggaag gagatactat + 12781 caagaaatat ggaatcaaaa taaactttta ggttttgggc caatctcaga tggcaatatt + 12841 tttgctggtt ggaagtatta tttatctgat ttaggtatta ttagaatgct ctatcaattc + 12901 ggaattatag gttttatcat ttgtttatta cctattttgt atggatgttt agttggtttc + 12961 aagaatagat tacactttaa aggtatgctg ttattttgtc tttctctatt tgtattagta + 13021 actagctttg cttcgcaaaa tttatatgat tataatagaa ttatgcttct tccgttgtta + 13081 ttagggttag caaatgctgt ttcatcaact caagcagata aggatatggt atgaaagttc + 13141 ttaaaaatta cgcctataat ctctcttatc aactgttgct gattattttg ccggttatta + 13201 ctactcctta cattactcgg gtgtttagct cggatgactt gggtacctat ggttatttca + 13261 actcaatcgt cacctatttt atcttattgg caactttagg agtagctaat tatggtacca + 13321 aggaaatttc agggcatcga aaagaaattc gaaggaattt ctgggggatt tataccctac + 13381 agctaggagc gactatttta tccggtaccc tctatgctat actatgtctg agtttgccat + 13441 ctatgcaaga ttcagttgcc tatatcttag ggtttagttt gctttcaaag ggattagata + 13501 tttcttggtt atttcaaggt ttggaagact tccggaagat tattgtgcga aatattacag + 13561 tcaaacttgt cggtgtaatc tcaatcttct tgtttgtaaa atctgctaaa gacctttatc + 13621 tctatgtttt tttactaacc atatttgaac tgttaggcca gttgagtatg tgggtgcctg + 13681 ctcgagaatt tattggaaag ccacatatag atattaacca cgcaaagaag catctaaagc + 13741 ctgtcattct tctctttctt cctcaaatcg ccatttcctt gtatgtgacc ttggatagaa + 13801 ctatgcttgg agctttagct tcaaaaacag atgtagggat ttatgatcag gctttaaagc + 13861 tagtaaacat cttgttgact ctagtaacct cactagggag tgttatgttg ccacgagtgt + 13921 ctagtcttct atcacaaagt gattataagt ctgtgaagaa aatgtaccaa 
atgtcctttt + 13981 taatttataa ttcagtcatt tttccaatta ttgctgggat gttgatcgtg aatgacgact + 14041 ttgttcaatt ctttttagga agggatttcc aagatgcccg ctatgcaatt gcaattatga + 14101 tgtttagaat gttctttatt ggatggacca atatcatggg aattcaaatc ctcatccccc + 14161 ataataaaaa taaagaattt atgatttcga ccactgttcc cgctattgtc agtgtcggat + 14221 tgaacctcat cttcttaccg aatctaggtt ttatcggggc agcgattgtg tctgtgttga + 14281 cagaagcttt ggtatggggg attcaacttc acttcacatg gtcttatctt aaagaggtac + 14341 caattattgg ctcaatgatc aagattgtta ttgcttcggg gatcatgtat gctttcttgg + 14401 tatctatgaa gtccgttgtt catgtttcac ctgctattaa tgttgctctg tatgctttgc + 14461 taggtggagt gatttatgta gccttgattt tgcttttcaa ggtggtgaat ttgaaagagt + 14521 tgaaacagga actattaaaa aatagggaga tttaatatgt acgactattt aatcgttgga + 14581 gctggtttgt ctggagctat ttttgctcac gaagctacaa aacgtggaaa aaaagtaaaa + 14641 gtgattgata aacgcgatca cattggaggg aacatatact gtgagaatgt agaaggtatc + 14701 aatgttcata aatatggtgc ccatatcttc catacttcta ataaaaaagt ttgggactat + 14761 gtcaatcaat tcgctgaatt taacaactat atcaattcac ctgtcgcgaa ctacaaagga + 14821 agtctttata atcttccttt caatatgaat actttctatg ctatgtgggg gacaaaaact + 14881 ccacaggaag tgaaagataa gattgctgag cagacggctg atacgaagga tgttgagcca + 14941 aaaaatctgg aagaacaagc tatcaagttg attggtccgg atatctatga aaagttgatc + 15001 aagggctata ctgaaaagca atggggacgc tcagcaacgg aacttcctcc atttatcatt + 15061 aaacgtcttc cagttcgtct aacatttgat aataactatt ttaacgaccg ttaccaagga + 15121 attcctattg gtggttataa tgtaattatc gaaaacatgc ttaaagacgt tgaagttgag + 15181 cttggtgttg atttctttgc tcaccgtgaa gagttagaag tatcagctga aaaagttgtc + 15241 ttcacaggaa tgatcgacca gtattttgac tacaaacacg gggagttaga ataccgtagc + 15301 cttcgctttg agcatgaaat tttggacgag gaaaattatc aagggaatgc tgtagtgaac + 15361 tatacagagc gtgagatccc ttatactcgt atcatcgaac acaaacattt tgaatatgga + 15421 acgcagccaa agacagttat cacgcgtgaa tatccggctg actggaagcg tggagacgag + 15481 ccctactatc cgatcaacga tgagaaaaat aatgctatgt ttgctaagta ccaagaggaa + 15541 gcttcaaaga atgataaagt tatcttctgt ggacggttag cagattataa 
atattatgat + 15601 atgcatgtag ttattgagcg agcgcttagc gtagtagaag aagaatttag taattgaaaa + 15661 acaacggaga aaggttattc cattatgaaa ggtattattc ttgcaggcgg ctcaggtacc + 15721 cgactgtacc cccttacacg agctgcatca aaacaactga tgccggttta tgataaacct + 15781 atgatttatt atcctttgtc gacattaatg ttggctggaa ttaaagatat tttgattatc + 15841 tcaactcctc aagatctacc tcgttttaag gatttacttt tagatggttc cgagtttggt + 15901 atcaagcttt cttatgccga gcagcctagt ccagatggac tagcgcaagc ctttatcatc + 15961 ggtgaaaaat ttatcggtga cgatagtgtt gctttaattt taggcgataa tatctatcat + 16021 ggacctggtt tgagcaaaat gcttcaaaag gcagcccaga aagagaaagg tgcgactgtt + 16081 tttggctacc aagtgaagga tccagagcgt tttggtgtag tcgagtttga tacagacatg + 16141 aatgccattt ccatagaaga aaaaccgaag gatcctcgct ctaactatgc tgtgactggt + 16201 ctgtatttct atgataatga tgttgtagaa attgctaaag gcattaaacc aagtgcacgt + 16261 ggcgaattag aaattacaga tatcaacaag gcttacttgg atcgtggtga tttgtctgtt + 16321 gaactcatgg gacgtggttt tgcttggttg gatactggca ctcatgaaag tttactagaa + 16381 gcttctcagt atatcgaaac agttcaacgg atgcagaatg ttcaagttgc aaacttggaa + 16441 gaaattgcct atcgtatggg ctatatcagt cgtgaagatg tactagagtt ggcacaacct + 16501 ctgaagaaga atgaatacgg acgatatttg ctccgtttga ttggagaagt ctagatgaca + 16561 gataattttt ttggaaaaac acttgcagtt cgtaaaattg atgccatttc aggtatgtta + 16621 gagtttgata ttcccgttca tggagacaat cgtggttggt ttaaggaaaa tttccagaag + 16681 gaaaagatgg tgccacttgg ctttcctgaa agcttctttg ctgaagggaa actgcaaaat + 16741 aacgtcagct tttctcgcaa aaatgttctt cgaggcctcc atgctgagcc ttgggacaag + 16801 tacatctctg ttgcagataa tgggaaggtt ctaggaacat gggttgattt gcgtgagggt + 16861 gaaacttttg ggaatattta ccagacagag attgacgcta gtaagggaat ctttgtccct + 16921 cgtggcgtag ccaatggatt tcaagtccta tctgatacag tttcttatag ttatctggtt + 16981 aatgactatt gggcgcttga actcaaacct aagtatgcat ttgttaacta ctctgaccca + 17041 gaattaggaa ttgagtggga aaatctggaa gaagcagagg tatctgaagc agacaaacat + 17101 catcccctac ttaaggacgt gaaacctttg aaaaaagaag atttggaata aggaaataat + 17161 atgactaaat ataaaaacat catcgtgaca ggtggggctg gttttatcgg 
ttctaacttt + 17221 gtccactatg tttacaataa ctttccagat gtgtatgtga cagtgctgga caagctgact + 17281 tatgcaggta atcgtgccaa tattgaagaa attttaggcg accgtgttga gttagtcgtt + 17341 ggagatattg ctgatgcagc cttggtagat aagttagcag ctgaagcgga tgccattgta + 17401 cactatgcgg cagaaagcca caatgacaat tcgcttaatg acccctcgcc atttatccat + 17461 accaacttca tcggaactta tacactcttg gaagcggctc gtaaatacga ccttcgtttc + 17521 caccatgtgt cgactgacga agtctatggg gatctgccgc tgcgtgaaga tttaccaggt + 17581 catggggaag gaccaggtga gaaatttacg gctgaaacca agtacaatcc aagctcgcct + 17641 tactcatcga ctaaggcggc ttcagacttg attgtcaaag cttgggtacg ctcatttggc + 17701 gtcaaagcga ctatttccaa ctgttccaac aactatggtc cttaccagca tattgagaag + 17761 tttattccac gacaaatcac caatatcttg agcggtatca agccaaaact ctatggtgaa + 17821 ggtaaaaacg ttcgtgactg gatccatacc aatgaccatt cttcaggagt ttggacaatc + 17881 ttgacaaaag ggcaaatcgg tgaaacctac ttgattgggg ctgatggtga gaagaacaat + 17941 aaggaagttt tggaacttat ccttaaggaa atgggacaaa ctgcggatgc ctatgatcat + 18001 gtgactgatc gtgcaggaca tgaccttcgc tatgcgattg atgcaagcaa gctctgtgat + 18061 gagttggggt ggaaacctga atttaccaac tttgaagctg ggctcaaggc aacaatcaag + 18121 tggtatacag ataaccaaga atggtggaaa gcagaaaaag aagctgttga agccaattat + 18181 gctaagactc aggagattat tacagtataa aaagcaggaa atagctactt tttattgcta + 18241 tattgggaag agttacatat tagaaaggcc tagagatgat tttaattaca ggggcaaatg + 18301 gccaattagg aacggaactt cgctatttat tggatgaacg taatgaagaa tacgtggcag + 18361 tagatgtggc tgagatggac attaccgatg cagaaatggt tgagaaagtt tttgaagagg + 18421 tgaaaccgac tttagtctac cactgtgcag cctacaccgc tgttgatgca gcagaggatg + 18481 aaggaaaaga gttggacttc gccatcaatg tgacggggac aaaaaatgtc gcaaaagcat + 18541 ctgaaaagca tggtgcaact ctagtttata tttctacgga ctatgtcttt gacggtaaga + 18601 aaccagttgg acaagagtgg gaagttgatg accgaccaga tccacagaca gaatatggcc + 18661 gtactaagcg tatgggggaa gagttagttg agaagcatgt gtctaatttc tatattatcc + 18721 gtactgcctg ggtatttgga aattatggca aaaacttcgt ttttaccatg caaaatcttg + 18781 cgaaaactca taagacttta acagttgtaa atgaccagta cggtcgtccg 
acttggactc + 18841 gtaccttggc tgaattcatg acctacctag ctgaaaaccg caaggaattt ggttattatc + 18901 atttgtcaaa tgatgcgaca aaagacacaa catggtatga ttttgcagtt gaaattttga + 18961 aagatacaga tgtcgaagtc aagccagtag attccagtca atttccagcc aaagctaaac + 19021 gtccgctaaa ctcaacgatg agcctggcca aagccaaagc tactggattt gttattccaa + 19081 cttggcaaga tgcattgcaa gaattttaca aacaagaagt gagataagta gtagaatgat + 19141 tttctagtct aataaaagag gcagataatg aactccaaag gagcttaaga tgtacgatta + 19201 tcttgttgtt ggtgctggtc tctttggtgc agtctttgcc catgaagcag ccttaaaagg + 19261 aaaaaagtaa aagttattga aaaacgaaat catatcgcgg gtaatatcta tactcgtgaa + 19321 gaggaaggaa ttcaagttta tcaatatggt gctcatatct tccatacttc tgataaggag + 19381 atctgtgatt atgtaaatca gcttgcagag tttaaccgtt acacaaattc tcctgttgca + 19441 aactataagg gtgagattta taaccttcct tttaatatga atactttcaa taaactctgg + 19501 ggagttgtaa cgccagcagg agcacaagct aagattgagg aacaacgtgc tattttaaat + 19561 ggtaaaactc ctgaaaattt ggaagaacag gagatttctc ttgtaggtac agatatctac + 19621 gaaaaattaa tcaaagacta tacagagaaa cagtggggca aaccaactac tgaacttcca + 19681 tcctttatta ttcgccgttt accagtacac ctgacctatg ataacaacta ttttaacgat + 19741 acctatcaag ggattccaat tggtgattat aatgttatca tcgaaaatat gctgaaggat + 19801 gtagaagtag aacttggagt gaactttttt gccaatcgtc aagaattaga ggcttctgct + 19861 gaaaaggttg tctttacagg aatgattgac caatactttg attataaaca tggtgagtta + 19921 gaataccgta gtcttcgttt tgatcatgaa gttctagatg aggaaaacta tcaaggaaac + 19981 gcagttgtaa actatacaga acgagaaatt ccttatactc gtattattga gcataaacac + 20041 tttgagtatg gtactcagga gaaaacggtt attactcgtg aatacccagc tgatttcttt + 20101 ttgcataata gaaaacatta taagaggaac tctaaatgac aaggattagt atgaaaaaaa + 20161 taaaagaata cgaaatttta aaagtaatag ccattatctt agttgtggta ggacacagca + 20221 cctactataa tatttatact ggttatggtg ggatagatta tcaacaatac ataaacaacc + 20281 atttatcctt agctgtatat aagctgttaa gtaaattgac agagattatt tattattttc + 20341 atatgccttt attcatggct atatctggtg cgtttttctc tattcaggtt aaaaataatc + 20401 gatggcatgg cattggctca ttattaacaa ataagtttag aagactaatg 
ataccatttt + 20461 tagtctttac tctagtatat acaataccaa taaaatacat atcaaattac tttgatggta + 20521 tctctttctg gaaagcggtc tctggacaat tatttctatt tggaaattct cacttgtggt + 20581 atttgtatgc attgtttatt gtctttatag ttggctttta tattctgaaa aaacgtacgt + 20641 tattttatgt ttatctactg ctatatattc tacacatctt gagttactca gttcatttaa + 20701 cattagtaag tgcaccatta caatatctct tttggttttc tatgggcttc ttatttgaat + 20761 ttaagaggga gcagtataat cattatttaa agaataataa gtggctaagc tttttattgg + 20821 tgctactatt tatagcatgt gtagccctaa aatttgtgct taaagataac catgaagttt + 20881 tgaataggat aattatggat ctagcagctg tgctaggctc acttatttgt tataatatat + 20941 cgtattatct cagtgataaa agagaattaa cagagaatag actatttaat gttattttga + 21001 ttaacggatt aggaatttac atcttttctg atactttaaa ttatttaata ttaaatatct + 21061 catattctat cagtaatcga ttcatgttta catcatttgg tattttagca ttatttttga + 21121 ttagaatttt ctttacttta tttatagggt taggtttaac actgttattt aaaaaaatat + 21181 tcaaaaaaca ttcttggtta gtaaactaac caactttagt taatttatta ttgtcttgag + 21241 gaaatattca aagagaagtt tttgaaattt ttctattact ctagaaatag atactggaag + 21301 attgtggtca tgtatttctt atctattttg taaccgccca ataacgaagt atattgaaaa + 21361 atctcggctc tttgtcaact gtagtgggtt gaaaaaaagc taagctcgag aaaggacaaa + 21421 ttttgtcctt tcttttttga tattcagagc gataaaaatc cgttttttga agttttcaaa + 21481 gtttcgaaaa ccaaaggcat tgcgtttgat aagtttgatg agattattgg tcgcttccaa + 21541 tttggcgtta gaatagtgta gttgaagggc gttgacgatt ttctctttgt cctttagaaa + 21601 ggctttaaag acagtctgaa aaagaggatg aacctgcttt agattgtcct caatgagtcc + 21661 gaaaaatttc tccggtttct tattctgaaa gtgaaacagc aagagttgat agagctgata + 21721 gtggtgtttc aagtcttctg aatagcttaa aatcttgtct aaaatctctt tattggttaa + 21781 gtgcatacga aaagtaggac gataaaatcg cttatcactc agtttacggc tatcctgttg + 21841 tatgagcttc cagtagcgct tgatagcctt gtattcatgg gattttcgat gaaactgatt + 21901 catgatttga acacgcacac gactcatagc acggctaaga tgttgtacaa tatgaaagcg + 21961 ttcaagaacg attttagcat tcgggagtga aacagtctgg gagactgttt cagcctgagt + 22021 ctagaaattt gaaagcgaag ctgtttagcc aagtcatagt aaggactaaa 
catatccata + 22081 gtaatgattt tgacgcgaca tcggacaact ctatcatatt taagaaagtg atctcggatg + 22141 acagcttgtg ttctaccctc aagaacagtg atgatattga gattgttaaa atcttgcgca + 22201 atgaagctca tctttccctt tgtaaaagca tactcatccc aagatataat ctcaggaaga + 22261 caagaaaaat catgtttaaa gtgaaaatca ttgagcttac gaataacagt tgaagttgag + 22321 atggaaagct gatgggcaat atcggtcata gaaatctttt caatcaactt ttgagcagtc + 22381 ttttggttga tgatacgagg gatttggtga tttttcttga cgagggaagt ctcagcgacc + 22441 gctatttttg aacagtgata gcacttaaag cgacgctttc taaggagaat tctagtaggc + 22501 ataccagtcg tttcaagata aggaatttta gaaggttttt gaaagtcata tttcttcaat + 22561 tggtttccgc actcagggca agatggggcg tcgtagtcca gtttggcgat gatttctttg + 22621 tgtgaatccc tattgacgac atctataatt tggatatttg tgtctttgat atcgagtagt + 22681 tttgtgataa aatgtaattg ttccatatga atctttctaa tgagttgttt ggtcgctttt + 22741 cattatagat cttatgggac tttttttcta caataaaata ggctccataa tatctatagt + 22801 ggatttaccc actacaaata ttatagagcc gaataatctc ctaggaattc ttgtactact + 22861 gaaccacttc gacactgatc atggtggtaa agcgtaatcc cttgtttctc tgatttacct + 22921 gacaaaaaag tccaatagta agtcagctga ctatcacttt ctaagacccg ataagaggtt + 22981 tcatctgcat gaagaagagc ttgttctaac aacttttctc ataaaaggtt ataaagagac + 23041 tctaaatagt attgactcgt cttgatatgc caattagaaa tttccttacg tgtgattggt + 23101 aaacccatct tagcccaatc ttcttcttag cgataattgg gtaccttcag attaaacttc + 23161 tgatggatgg tgtgagcgat aatagaggct gaaccaaggc tatgcgccaa aggggcttta + 23221 gggacaggag cttttacaat tttatcactt ggatttttat cactgcatgc ttggcatttg + 23281 taagcgtgtt ggatatgatc cactcttttt aattgcgcag gaataaagac caattcttgt + 23341 cgttgaaggc tcgctccaat ctcttttaaa tcgtcctgac aatcagggca aatgctctct + 23401 tctacttgat gatgaacttc ttctgaatca aattgggcaa gaatagcttg acgtttccct + 23461 ttagctttct tacgtttata ggtgatttct tctctttcaa ctgggtaagt cagagtcttc + 23521 ttccatattt tgttcctctt caaaaagact gagttgtcca aaagggcaaa cacttttctc + 23581 agaggatttt ccatagagct tttgcgttag ataagccact tgttcacgca gaagggaaag + 23641 ttcattagtg agactatcaa ttatagcact ctgttgttga atgattttca 
atcttctccc + 23701 atagactttc ctccttattt cctaacttta ttatatagtg tattgaatct ataacagtac + 23761 accttgactg ctaaaatatt tctataaatt aatttgactt ttctgataga gatgttcata + 23821 tcttatttca attcactata ctaaaaagaa agtcctcatt tcaatagaaa tcacgacttt + 23881 ctgataaatt tattttggga gtgatagaaa agcccttcat aagccagtct atttgttcag + 23941 gtgtgagagc tttgacatcc ttttatgtac tggaccaagt cagtctgccg ttctcaaagc + 24001 gtttatatag tagccaaaat ccttgaccat cccagtaaag ggctttaaag cggtctttac + 24061 gtccaccaca aaagagaaaa acttgaccgg agaaaggatc taattcaaaa tgggttttaa + 24121 ccagataagc cagtgaatca atgccttgcc tcatatccgt tttcccacat acgagataga + 24181 cctgccctag gctagataga tgaattgtca tagagcaaca ccttatccaa aagctgttct + 24241 atcatttcga gattgagaga ttgaaaaaaa cttacttcaa gcttgccaat acgaatttta + 24301 agcagaatat catttctctt tttagaatca aaacgacgag attgtggaat ctctacagga + 24361 acaataggtt gtggcattaa aatatcctcc aatagtttta ctttactaat agtatacagg + 24421 aggagctcca tgaatgatag ataccttgtt atgacgcgct tactaaacaa ctaactgatg + 24481 cacgatttaa gcgccttgtt ggtgttcagc gcacgacttt tgaagagatg ttagctgtat + 24541 taaaaacagc ttatcaactt aaacacgcaa aaggtggacg aaaacctaaa ttaagcctag + 24601 aagaccttct tatggccact cttcaatatg tgcgagaata tcgaacttat gaagaaattg + 24661 cggctgattt tggtatccac gaaagcaact tactccgtcg gagccaatgg gttgaagtaa + 24721 ctcttgttca aagtggtgtt acgatttcaa gaactcctct cagttctgag gacacggtaa + 24781 tgattgatgc gacggaagta aaaatcaatc gccctaaaaa aagaattagc gaatgattct + 24841 ggtaaaaaga aatgccacgc tatgaaggct caagcgattg tcacaagtca agggagaatt + 24901 gtttctttgg atatcgctgt gaactattgt catgatatga agttgttcaa aatgagtcgc + 24961 agaaatatcg gacaagctgg aaaaatcttg gctgacagtg gttatcaagg gctcatgaag + 25021 atatattctc aagcacaaac tccacgtaaa tccagcaaac tcaagccgct aacagttgaa + 25081 gataaaacct ataaccatgc gctatctaag gagagaagca aggttgagaa catctttgcc + 25141 aaagtaaaaa cgtttaaaat gatttcaaca acctatcgaa atcatcgtaa acgcttcgga + 25201 ttacgaatga atttgattgc tggtattatc aatcatgaac taggattcta gttttgcagg + 25261 aagtctattg aaggatcttt tgctttagtt ccttggtcaa ggttgattat 
tttcacggag + 25321 cgcttccgat tgttttcata aaccatttgc gcatagtcag cagaataaat ctttttgaaa + 25381 cgtccctttc ctagacatta tagaactttc agattcatct gaatttacca aattaacaca + 25441 aaaattctga aaattctgtt gacatctttc tgaaaagagt ttataatgga gagaaagttt + 25501 taaaggagaa aatgatgaaa agttcaaaac tacttgccct tgcgggcgtg acattattg +// + diff --git a/public/res/serotype_genbank/serotype_22A.gb b/public/res/serotype_genbank/serotype_22A.gb new file mode 100644 index 0000000..044cdb7 --- /dev/null +++ b/public/res/serotype_genbank/serotype_22A.gb @@ -0,0 +1,1062 @@ +LOCUS CR931681 22591 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 3405/39 (serotype 22a). +ACCESSION CR931681 +VERSION CR931681.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 22591) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 22591) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..22591 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="3405/39" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC22A_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC22A_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI33760.1" + /db_xref="UniProtKB/TrEMBL:Q4JZI8" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVELL" + gene 293..461 + /gene="aliB" + /locus_tag="SPC22A_0002" + /pseudo + CDS 293..461 + /gene="aliB" + /locus_tag="SPC22A_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(order(462..974,976..1305)) + /gene="tnp" + /locus_tag="SPC22A_0003" + /pseudo + CDS complement(join(462..974,976..1305)) + /gene="tnp" + /locus_tag="SPC22A_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(join(915..974,976..1287)) + /gene="tnp" + /locus_tag="SPC22A_0003" + /note="HMMPfam hit to PF01710, Transposase, score 6e-23" + /pseudo + gene 1536..2981 + /gene="wzg" + /locus_tag="SPC22A_0004" + CDS 1536..2981 + /gene="wzg" + /locus_tag="SPC22A_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33763.1" + /db_xref="GOA:Q4K0M6" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K0M6" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VDQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + 
EALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDLPSY + AMPDSNLYVLEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1536..1652 + /gene="wzg" + /locus_tag="SPC22A_0004" + /note="Signal peptide predicted for SPC1114 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 39 and 40" + misc_feature 1740..2087 + /gene="wzg" + /locus_tag="SPC22A_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 6.7e-65" + misc_feature 2265..2708 + /gene="wzg" + /locus_tag="SPC22A_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 5.7e-70" + gene 2983..3714 + /gene="wzh" + /locus_tag="SPC22A_0005" + CDS 2983..3714 + /gene="wzh" + /locus_tag="SPC22A_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33764.1" + /db_xref="GOA:Q4K0M5" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K0M5" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRIIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEQDLVHVIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 2986..3594 + /gene="wzh" + /locus_tag="SPC22A_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 6.1e-37" + gene 3720..4415 + /gene="wzd" + /locus_tag="SPC22A_0006" + CDS 3720..4415 + /gene="wzd" + /locus_tag="SPC22A_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33765.1" + /db_xref="GOA:Q4K0M4" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K0M4" + /translation="MMKEQNTIEIDVFQLFKTLWKRKLMILIVALVTGAGAFAYSTFI + VKPEYTSTTRIYVVNRDQGDKPGLTNQDLQAGSYLVKDYREIILSQNVLEKVATNLKL + 
DMPTKTLASKVKVTVPTDTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIELLDTRVKRPEDVEDVLQI + PLLGVVPDLNKMK" + misc_feature 3720..3836 + /gene="wzd" + /locus_tag="SPC22A_0006" + /note="Signal peptide predicted for SPC1116 by SignalP 2.0 + HMM (Signal peptide probability 0.625) with cleavage site + probability 0.411 between residues 39 and 40" + misc_feature 3741..4157 + /gene="wzd" + /locus_tag="SPC22A_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 5.8e-56" + misc_feature 4263..4340 + /gene="wzd" + /locus_tag="SPC22A_0006" + /note="PS00217 Sugar transport proteins signature 2." + gene 4425..5114 + /gene="wze" + /locus_tag="SPC22A_0007" + CDS 4425..5114 + /gene="wze" + /locus_tag="SPC22A_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33766.1" + /db_xref="GOA:Q4K0M3" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K0M3" + /translation="MPTLEISQAKLDFVKKAEEYYNALCTNLQLSGDDLKVFSITSVK + LGEGKSTTSTNIAWAFAHAGYKTLLIDGDIRNSVMLGVFKARDKITGLTEFLSGTTDL + SQGLCDTNVENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRKCDASILVTEVDEVNRRDIQKAKEQLEHTGKPFLGVVLNKFDTSVDKYGSY + GNYGDYGKNKK" + gene 5130..6497 + /gene="wchA" + /locus_tag="SPC22A_0008" + CDS 5130..6497 + /gene="wchA" + /locus_tag="SPC22A_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI33767.1" + /db_xref="GOA:Q4K0M2" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K0M2" + /translation="MNGKIVKSSLAIIQSFLVILLTYLLSAVREAEIVSTTAIALYIL + HYFVFYISDYGQDFFKRGYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYF + LTLHALLVYVLNLFIKWYWKRAYPNFKGSKKILLLTATSRVEKVLDRLIESNEVVGEL + VAVSVLDKPDFQHDCLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + 
IDVTVNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHVIAKRIIDIMGALVGLIL + CGLVSIVLVPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYIDGWTIWKDIEILLKTVKVVFM + RDGAK" + misc_feature 5130..5222 + /gene="wchA" + /locus_tag="SPC22A_0008" + /note="Signal peptide predicted for SPC1118 by SignalP 2.0 + HMM (Signal peptide probability 0.902) with cleavage site + probability 0.355 between residues 31 and 32" + misc_feature 5913..6494 + /gene="wchA" + /locus_tag="SPC22A_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 2.8e-159" + gene 6528..7700 + /gene="wchF" + /locus_tag="SPC22A_0009" + CDS 6528..7700 + /gene="wchF" + /locus_tag="SPC22A_0009" + /note="member of homology group 15" + /codon_start=1 + /transl_table=11 + /product="putative rhamnosyl transferase WchF" + /protein_id="CAI33768.1" + /db_xref="GOA:Q4K0M1" + /db_xref="InterPro:IPR001296" + /db_xref="InterPro:IPR015393" + /db_xref="UniProtKB/TrEMBL:Q4K0M1" + /translation="MKQSVYIIGSKGIPAKYGGFETFVEKLTEYQKDGNIQYYVACMR + ENSAKSGFTADTFEYNGAICYNIDVPNIGPARAIAYDIAAVNKAIELSKGNKDEAPIF + YILACRIGPFISGLKKKIRSIGGRLLVNPDGHEWLRAKWSLPVRKYWKFSEQLMVKHA + DLLVCDSKNIEKYIREDYKQYQPKTTYIAYGTDTSKSILKPDDEKVRNWYQEKGVAEN + GYYLVVGRFVPENNYETMIREFIKSKSNKDFVLITNVEQNKFYDQLLKDTGFDKDPRV + KFVGTVYDQELLKYIRENAFTYFHGHEVGGTNPSLLEALASTKLNLLLDVGFNREVGE + DGAIYWKKDELAHVIEEVERFDEGAISELDERSSQRIADAFTWEKIVSDYEEVFKG" + gene 7704..8861 + /gene="wcwA" + /locus_tag="SPC22A_0010" + CDS 7704..8861 + /gene="wcwA" + /locus_tag="SPC22A_0010" + /note="member of homology group 63" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33769.1" + /db_xref="GOA:Q4K0P2" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K0P2" + /translation="MKRILYLHAGAEMYGADKVLLELIKGLNPQEFEAHIILPNDGVL + VEALRQVGAQVSVLDYPILRRKYFNPKGILEYLKFYRRYSQKIAQYVRENGIDLVHNN + TTAVLEGIYLKRKVKLPLIWHVHEIIVKPKAISDFINFLMGRYADKIVTVSQAVASHV + 
KQSPFIKEGQVQVIYNGVDNAIYHPMQSSAVREKFGIPEDALVIGMVGRVNAWKGQGD + FLEAVTPILEHNPNSVAFLAGSAFAGEEWRVEELESKISKSSVASQIKRIEYYEHTAE + LYNMFDIFVLPSTNPDPLPTVVLEAMACGKPVVGYRHGGVSEMVVEGTNGLLAIPGQS + QELSDAILELVSDPEKRLQFGQASVRRQGESFSLESYIRSFSELYKSYKNE" + misc_feature 8265..8786 + /gene="wcwA" + /locus_tag="SPC22A_0010" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 2.7e-33" + gene 8854..9492 + /gene="wcwC" + /locus_tag="SPC22A_0011" + CDS 8854..9492 + /gene="wcwC" + /locus_tag="SPC22A_0011" + /note="member of homology group 48" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI33770.1" + /db_xref="GOA:Q4K0L9" + /db_xref="InterPro:IPR015037" + /db_xref="UniProtKB/TrEMBL:Q4K0L9" + /translation="MNKEIIKNKLKLIVYPIINFISRRRLKNKKFTIICDNCWAGKVY + QELGLPYQTPFIGMFVFSPDYIKMLKNLKYYLSGNISLKFVKESKHIENFDNAYPIAL + LDDIELHFLHYADEKEATQKWQRRLERIHWDNLYFKFNDNDACTYDLMREFDQLPYKS + KVIFSSKNYSDLHSLTYFKEKEKDCSVGIDLKIYHRYFDVVRWLNEGGVDLS" + gene 9524..10768 + /gene="ugd" + /locus_tag="SPC22A_0012" + CDS 9524..10768 + /gene="ugd" + /locus_tag="SPC22A_0012" + /note="member of homology group 20" + /codon_start=1 + /transl_table=11 + /product="UDP-glucose 6-dehydrogenase Ugd" + /protein_id="CAI33771.1" + /db_xref="GOA:Q4K0L8" + /db_xref="InterPro:IPR001732" + /db_xref="InterPro:IPR008927" + /db_xref="InterPro:IPR013328" + /db_xref="InterPro:IPR014026" + /db_xref="InterPro:IPR014027" + /db_xref="InterPro:IPR014028" + /db_xref="InterPro:IPR016040" + /db_xref="InterPro:IPR017476" + /db_xref="UniProtKB/TrEMBL:Q4K0L8" + /translation="MSKMKIAVVGTGYVGLSISVLLAQHHHVVAVDIVKEKVELINNK + ISPIQDDFIERYLSESNLDLVATIDAETAYKDASFIVVATPTNYDSERNFFDTSAVES + VIQQVQNVNSTATIVIKSTVPVGFTDSIRKKLGISNLLFSPEFLRESRALYDNLYPSR + IIVGTDLNDQKLIEKAQVFSNLLVQGAIKKDIPILIMGFTEAEAVKLFANTYLALRVS + YFNELDTYAETKGLDTQKIIEGVSLDPRIGTHYNNPSFGYGGYCLPKDTKQLLANYEN + IPEELIGAIVRSNATRKDFIAKQVLKMVNYNNPEDDISVRQMDKEVVIGIYRLTMKSN + SDNFRQSSIQGVMKRIKDRGAKVIIFEPTLKDNGTFFGNAVINDLEEFKAKCDAIIAN + 
RYDEMLNDVKDKVYTRDIFRRD" + misc_feature 9524..9613 + /gene="ugd" + /locus_tag="SPC22A_0012" + /note="Signal peptide predicted for SPC1122 by SignalP 2.0 + HMM (Signal peptide probability 0.931) with cleavage site + probability 0.611 between residues 30 and 31" + misc_feature 9533..10090 + /gene="ugd" + /locus_tag="SPC22A_0012" + /note="HMMPfam hit to PF03721, UDP-glucose/GDP-mannose + dehydrogenase, score 1.2e-45" + misc_feature 9533..10045 + /gene="ugd" + /locus_tag="SPC22A_0012" + /note="HMMPfam hit to PF01210, NAD-dependent + glycerol-3-phosphate deh, score 0.00017" + misc_feature 10118..10399 + /gene="ugd" + /locus_tag="SPC22A_0012" + /note="HMMPfam hit to PF00984, UDP-glucose/GDP-mannose + dehydrogenase, score 5e-38" + misc_feature 10496..10747 + /gene="ugd" + /locus_tag="SPC22A_0012" + /note="HMMPfam hit to PF03720, UDP-glucose/GDP-mannose + dehydrogenase, score 1.1e-06" + gene 10776..11900 + /gene="wcwV" + /locus_tag="SPC22A_0013" + CDS 10776..11900 + /gene="wcwV" + /locus_tag="SPC22A_0013" + /note="member of homology group 165" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33772.1" + /db_xref="GOA:Q4K0L7" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K0L7" + /translation="MKKVLIVRSGPYQVTPNEYNLQELGLASALSQQGYQCDVMYYHK + TKNYDQLFEKNGEKIKVFWRRGIRLFRSGIYPQILKKKFLSQYDKIIISEYSQIMAVL + LSRIHSNVYIYNGPYYNLFKIPIIESMYDFLFVRMLNKRTKTVFCKTEKAKHYLKNKG + FNDCKVVGVGLDVEKFEQEEEPTENTIELLKRMENKQNILYVGSLSKRKNTAHLIRIF + NILKSKSGKKNELQLVLIGKDEGNIVEKINYSRFKDDIIYQPYLKNSQLQFIYPSSQL + FVLPSIQEIFGMVLLEAMYFKLSVVSSASAGGETLIQDGINGKIMNDFNDEHWVDCIE + NLLNNPLELKRLGECAHKRITEQFMWSSIARKIIETFDER" + misc_feature 11322..11834 + /gene="wcwV" + /locus_tag="SPC22A_0013" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 5.1e-24" + gene 11909..12751 + /gene="whaB" + /locus_tag="SPC22A_0014" + CDS 11909..12751 + /gene="whaB" + /locus_tag="SPC22A_0014" + /note="member of homology group 120" + /codon_start=1 + 
/transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33773.1" + /db_xref="GOA:Q4K0L6" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K0L6" + /translation="MNFCFVILHYRTSNDTIECIKSIQKLEGNYKIVIVDNASQNGSI + ERVEALFANNDEIVIIKNTKNLGFAAGNNIGYAYARTQIKANMIAVLNNDIVIKQKDF + INRIFELYRNSQFHIAGPDIVSLVDGHHQSPVVEKINSISKANKELFKYRILRIINKI + GLYELMTRQPKKKLNRVSAADPIGYQENVILHGSCVIFSPLYVSEEEFAFRPDTFMYM + EEPILYEYCMLKNYKTVFDPSIVIYHKEDSSTNSLYNAAYAKREFVFKNMIRSLKIYR + SLLK" + misc_feature 11918..12460 + /gene="whaB" + /locus_tag="SPC22A_0014" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 3.7e-13" + gene 12781..14061 + /gene="wzy" + /locus_tag="SPC22A_0015" + CDS 12781..14061 + /gene="wzy" + /locus_tag="SPC22A_0015" + /note="member of homology group 166" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33774.1" + /db_xref="UniProtKB/TrEMBL:Q4K0L5" + /translation="MNLSMLALTIGSVVFVKKTYRTFLNPIILFAILWFIITTLSNLK + LFQLFEISTHTQQIILLGTSLFVIGGGIAIWFRDKFYFKVGGNSYFTTDFEINYNLFF + LLGIICLFYYLPDFFSSLVSLIRGGNLNLVRQSAQDAVDTSGLKNFIGTFIVIPSAMV + LEILGILDFWSNKKGRKLFYLNLAVIFVRVVADAGRTPLFNVVIYLLLTVLANRFSEK + TEKKRKVSKIKIVNYGMLGSIILWLSTLSRTTTSVYRILYFYFAMSPILLEKWSSILD + SEKLVTKGLVSLNGFFFSISYVLKNLFRIGYSQRVLEAYTMIANTDAIWYNIAPGLTK + ANAYVSLFWFFYADGRLLGVLIGSLLYGAFCGYIFCRYIQQQNKKNLAMLLFIYQGVF + FSFIRFPFSKSNYAIAFVLLLFFAFKKKGIEKSV" + gene 14054..15061 + /gene="wcwX" + /locus_tag="SPC22A_0016" + CDS 14054..15061 + /gene="wcwX" + /locus_tag="SPC22A_0016" + /note="member of homology group 167" + /codon_start=1 + /transl_table=11 + /product="conserved hypothetical protein" + /protein_id="CAI33775.1" + /db_xref="UniProtKB/TrEMBL:Q4K0L4" + /translation="MFNINDQSIIYVACPYFNKTGGTELVHQLVYSINHFGGKAIVAY + YGSESAPNEVNPAFREYVSTFVDIKDVIDSLDNIIILPEINPDLAANLESIQKAVWWM + SVDNYLKRNGILGSLEHFGLLRTIKLFVKGNIKIGGYRIDKEIPHLYQSEYAKQFLLA + KGVKKYYRLSDYLNESYIQRSISTDTKKDVILYNPKKGIEFTRELIKQAPELTFSPIE + 
NMSTEQVKKLLSKSKVYIDFGNHPGKDRFPREAAISGCCVITGKRGSAKYYKDIPIPD + SYKFEDTVENIPNIIETLKSCLKNYDKHTVDFEKYQQYIKSEHDLFERDVKELFTRNR + G" + gene 15066..16508 + /gene="wzx" + /locus_tag="SPC22A_0017" + CDS 15066..16508 + /gene="wzx" + /locus_tag="SPC22A_0017" + /note="member of homology group 47" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33776.1" + /db_xref="GOA:Q4K0L3" + /db_xref="InterPro:IPR002528" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K0L3" + /translation="MSTRNSLIKNSLYNVAYRMLNIIFPLVSATYTARIILASGVGEV + SFAQNVVSYFTTIAAMGIPNYGIREIAKTRNKEEATNKVFSELFLINGLSTLLCSIVY + LILILTFNSIFDNTSMYLAVGLTLVFNFLNIDWFYQGKEDYAYITKRSFSIKLISLFS + LFIFVRDTDDAVNYALISSLAIGGNNIFNLVNLRKYNIRFSFNNIKIRRHLKPIFVLL + GSVIAIEIYTMLDTTMIGAMVGTTEVGYYTNSMKLVKLLITVITAIGGVLLPRLSDYY + SKGEFEKLNHIVDKVFRIMLFLFLPAQVALILVAPVIMPILFGDSFIPAVLTLQLTSL + LICTLGFSNLFGTQILLTFGDERKLLISTILGALSNIALNLILIPVMAQNGAALASVI + SETIVTLTAYYYAKKRVTIRFDLGFYLPTVVSTIIMGGAIYVVMQLYIGDIEKMLFST + LLGGVVFLLINVFMKNPIIYEFTGIIKRKR" + misc_feature 15084..15893 + /gene="wzx" + /locus_tag="SPC22A_0017" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 5e-47" + gene 16511..17611 + /gene="glf" + /locus_tag="SPC22A_0018" + CDS 16511..17611 + /gene="glf" + /locus_tag="SPC22A_0018" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI33777.1" + /db_xref="GOA:Q4K0L2" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR006076" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K0L2" + /translation="MYDYLIVGAGLSGAIFAHEATKRGKKVKVIDKRDHIGGNIYCEN + VEGINVHKYGAHIFHTSNKKVWDYVNQFAEFNNYINSPVANYKGSLYNLPFNMNTFYA + MWGTKTPQEVKDKIAEQTAGMKDVEPKNLEEQAIKLIGPDIYEKLIKGYTEKQWGRSA + IELPPFIIKRLPVRLTFDNNYFNDRYQGIPIGGYNVIIENMLKDVEVELGVDFFAHRE + ELEASANKVVFTGMIDQYFDYKHGELEYRSLRFEHEILDEENYQGNAVVNYTEREIPY + 
TRIIEHKHFEYGMQPKTVITHEYPADWKRGDEPYYPINDEKNNAMFAKYQEEAAQNDK + VIFCGRLADYKYYDMHVVIERALEVVEKEFSN" + misc_feature 16946..17548 + /gene="glf" + /locus_tag="SPC22A_0018" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 4.4e-138" + gene 17638..18507 + /gene="rmlA" + /locus_tag="SPC22A_0019" + CDS 17638..18507 + /gene="rmlA" + /locus_tag="SPC22A_0019" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI33778.1" + /db_xref="GOA:Q4K0L1" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q4K0L1" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLPRFKELLQDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFISDDSV + ALILGDNIYHGSGLSKMLQKAASKESGATVFGYHVKDPERFGVVEFDQDMKAISIEEK + PEQPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLTLAQPLKKN + EYGQYLLRLIGEA" + misc_feature 17641..18357 + /gene="rmlA" + /locus_tag="SPC22A_0019" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 1.4e-119" + gene 18508..19101 + /gene="rmlC" + /locus_tag="SPC22A_0020" + CDS 18508..19101 + /gene="rmlC" + /locus_tag="SPC22A_0020" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI33779.1" + /db_xref="GOA:Q7BTQ6" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:Q7BTQ6" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKHHPLLKDVKPLKKEDL" + misc_feature 18544..19074 + /gene="rmlC" + /locus_tag="SPC22A_0020" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 8.8e-16" + 
gene 19114..20163 + /gene="rmlB" + /locus_tag="SPC22A_0021" + CDS 19114..20163 + /gene="rmlB" + /locus_tag="SPC22A_0021" + /EC_number="4.2.1.46" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI33780.1" + /db_xref="GOA:Q4K121" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K121" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPGVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQATD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 19129..20085 + /gene="rmlB" + /locus_tag="SPC22A_0021" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 7.1e-05" + misc_feature 19132..19968 + /gene="rmlB" + /locus_tag="SPC22A_0021" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.0039" + misc_feature 19132..19872 + /gene="rmlB" + /locus_tag="SPC22A_0021" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 2.7e-76" + misc_feature 19135..19947 + /gene="rmlB" + /locus_tag="SPC22A_0021" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 1.6e-05" + gene 20229..21080 + /gene="rmlD" + /locus_tag="SPC22A_0022" + CDS 20229..21080 + /gene="rmlD" + /locus_tag="SPC22A_0022" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI33781.1" + /db_xref="GOA:Q4K1G6" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K1G6" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITNEEMVEK + 
VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 20229..21077 + /gene="rmlD" + /locus_tag="SPC22A_0022" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 4e-147" + misc_feature 20232..20873 + /gene="rmlD" + /locus_tag="SPC22A_0022" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.00013" + misc_feature 20232..20861 + /gene="rmlD" + /locus_tag="SPC22A_0022" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 9.9e-19" + misc_feature 20235..20963 + /gene="rmlD" + /locus_tag="SPC22A_0022" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 2.9e-08" + gene order(21143..21223,21227..22310) + /gene="glf" + /locus_tag="SPC22A_0023" + CDS join(21143..21223,21227..22027,22020..22310) + /gene="glf" + /locus_tag="SPC22A_0023" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI33782.1" + /db_xref="GOA:Q4K0M9" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K0M9" + /translation="MYDYLVVGAVFAHEAVLKGKKVKVIEKNHIAGNIYTREEEGIQV + HQYGAHIFHTSDKEIWDYVNQFAEFNRYTNSPVANYKGEIYNLPFNMNTFNKLWGVVT + PAEAQAKIDEQRAILNGKTPENLEEQAISLVGTDIYEKLIKDYTEKQWGKPTTELPSF + IIRRLPVHLTYDNNYFNDTYQGIPIGGYNVIIENMLKDVEVELGVNFFANRQELEASA + EKVVFTGMIDQYFDYKHGELEYCSLRFDHEVLDEENYQGNAVVNYTDAETPYTRIIEH + KHFEFGSQAKTIITNRTFEHSKTWEKGDEPYYPVNNDRNNHLYKSYKKLADEQGNVIF + GGRLGHYRYYDMHQVIGAALQCVRNELDSYSMKIKEQTRKLAVGCSKHCFEVADGS" + misc_feature join(21563..22020,22027..22166) + /gene="glf" + /locus_tag="SPC22A_0023" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 4.2e-112" + gene 22544..>22591 + 
/gene="aliA" + /locus_tag="SPC22A_0024" + CDS 22544..>22591 + /gene="aliA" + /locus_tag="SPC22A_0024" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33783.1" + /db_xref="UniProtKB/TrEMBL:Q4K1C2" + /translation="MMKSSKLFALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcgta taaaaacaag + 181 ggaggactgt ataaaagaca gaaatccttt gttttttata accaaggttt ataaactttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga aaatgaacat + 301 aaagaagcgt gtccttagtg caggtctgac ttttgcatct gctttgcttt tagctgcttg + 361 cgaccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaattac ctgttagact attacgctga taatatagtc aattgaaaca agagcaggac + 481 aaaagagcct cgtaaaaggt attgcaactt ggtaatacct tttacgaggc tttttgatat + 541 gagcccatgt tttctcaata ggattgtact caggtgagta gggaggaaga aggtaaaagt + 601 ttatgcccaa actcttcgca taaaagttct agcttcccca ttctatggaa tcttgcatta + 661 tccataataa taaccgatgg tgtggttaat gttggtaaga gaaacttctg aaaccaagct + 721 tcaaaaaagt cgctcgtaat cgtctcttcg taagtcattg gagcgattaa ctcaccattt + 781 gttagacctg caaccaaaga aatcctctga tatcttcttc ttaactgacc ttttaaagag + 841 cgaccatatt ctcgataaaa ataagtatca aatcctgttt cgtcaatcta aacagctgct + 901 aggtgcttta aactattaaa attcttaaga aataaggcta ctttttctgg gtcttgttca + 961 tagtaggtgt ggttcttttt ttcgagtgta gcccatagct ttgagcgcat agtggatggt + 1021 agttggatga cagccaaatt cagaagctat ttcagtcaaa taagcgtctg gattatcagt + 1081 aagatagttt ttaagtctat ctctatcaac ttttcttggt tttattcctt ttacttggtg + 1141 gtttagctct cctgttttct cttttagctt taaccagcca taaatggtat tacgtgagat + 1201 ttggaaaacg tgtgatgctt ctgttatact acctgttcgc tcacaataag agagaacttt + 1261 tttacgaaaa tctattgaat atgccataaa aagattatac cacattgtgt actatattag + 1321 attgaaacta gagtagtaca cctctgcttc taaaaaattt ttagaaatcg atttaactgt + 1381 cctgatcgat ttgtcatgtt cttatttcat tttactatat ttttgtttcg cgggaagtct + 1441 actaagatac 
ttaaagatgc agatagtaaa aaaatgtaga cattaccgta aaaaagtgat + 1501 ataattgtac gatgttcaag gtataggtgt taatcatgag tagacgtttt aaaaaatcac + 1561 gttcacagaa agtgaagcga agtgttaata tcgttttgct gactatttat ttattgttag + 1621 tttgtttttt attgttctta atctttaagt acaatatcct tgcttttaga tatcttaacc + 1681 tagtggtaac tgcgttagtc ctactagttg ccttggtagg gctactcttg attatctata + 1741 aaaaagctga aaagtttact atttttctgt tggtgttctc tatccttgtc agctctgtgt + 1801 cgctctttgc agtacagcag tttgttggac tgaccaatcg tttaaatgcg acttctaatt + 1861 actcagaata ttcaatcagt gtcgctgttt tagcagatag tgatatcgaa aatgttacgc + 1921 aactgacgag tgtgacagca ccgactggga ctgataatga aaatattcaa aaactactag + 1981 ctgatattaa gtcaagtcag aataccgatt tgacggtcga ccagagttcg tcttacttgg + 2041 cagcttacaa gagtttgatt gcaggggaga ctaaggccat tgtcttaaat agtgtctttg + 2101 aaaatatcat cgagtcagag tatccagact acgcatcgaa gataaaaaag atttatacca + 2161 agggattcac taaaaaagta gaagctccta agacgtctaa gaatcagtct ttcaatatct + 2221 atgttagtgg aattgacacc tatggcccta ttagttcggt gtcgcgatca gatgtcaata + 2281 tcctgatgac tgtcaatcga gataccaaga aaatcctctt gaccacaacg ccacgtgatg + 2341 cctatgtacc aatcgcagat ggtggaaata atcaaaaaga taaattaacc catgcgggca + 2401 tttatggagt tgattcgtcc attcacacct tagaaaatct ctatggagtg gatatcaatt + 2461 actatgtgcg attgaacttc acttctttct tgaaaatgat tgacttattg ggaggggtag + 2521 atgttcataa tgatcaagag ttttcagctc tacatgggaa gttccatttc ccagtaggga + 2581 atgtccatct agactctgag caggctctag gttttgtacg tgaacgctac tcactagccg + 2641 atggagaccg tgaccgtggt cgcaaccaac aaaaggtgat tgtggctatc cttcaaaaat + 2701 taacgtcaac cgaagcactg aaaaattata gtacgatcat taatagcttg caagattcta + 2761 tccaaacaaa tatgccactt gagactatga taaatttggt caatgctcag ttagaaagtg + 2821 gagggaatta taaagtaaat tctcaagatt taaaagggac aggtcggacg gatcttcctt + 2881 cttatgcaat gccagacagt aacctctatg tgttggaaat agatgatagt agtttagctg + 2941 tagttaaagc agctatacag gatgtgatgg agggtagatg aaatgataga catccattcg + 3001 catatcgttt ttgatgtaga tgacggtccc aagtcaagag aggaaagcaa ggctctcttg + 3061 gcagaatcct acaggcaagg ggtacgaatc 
attgtctcta cctctcaccg tcgcaagggc + 3121 atgtttgaaa ctccggaaga gaagatagca gaaaactttc ttcaggttcg ggaaatagct + 3181 aaggaagtgg cgagtgactt ggtcattgct tacggagctg aaatttacta cacaccagat + 3241 gttctggata agctggaaaa aaagcggatt ccgaccctca atgatagtcg ttatgccttg + 3301 atagagttta gtatgaacac tccttatcgc gatattcata gcgccttgag caagatcttg + 3361 atgttgggaa ttactccagt cattgcccac attgagcgct atgatgctct tgaaaataat + 3421 gaaaaacgcg ttcgagaact gatcgatatg ggctgttaca cgcaagtaaa tagttcacat + 3481 gtcctcaaac ccaaactttt tggcgaacgt tataaattca tgaaaaaaag agctcagtat + 3541 tttttagagc aggatttggt tcatgtcatt gcaagtgata tgcacaatct agacggtaga + 3601 cctcctcata tggcagaagc atatgacctt gttacccaaa aatacggaga agcgaaggct + 3661 caggaacttt ttatagacaa tcctcgaaaa attgtaatgg atcaactaat ttaggagaaa + 3721 tgatgaaaga acaaaacacg atagaaatcg atgtatttca attatttaaa accttgtgga + 3781 aacgcaagct aatgatttta atagtggcac ttgtgacagg tgcgggggct tttgcatata + 3841 gcacttttat tgttaagcca gaatatacga gtaccacgcg aatttacgta gtgaatcgcg + 3901 atcaaggaga caagccgggg ctgacaaatc aggatttgca ggcaggatct tatctggtaa + 3961 aagactaccg tgagattatc ctttcgcaga atgtattgga aaaagtagcg acaaatttga + 4021 agttggatat gccaacaaaa acgttagcca gcaaagttaa agtgactgta ccaactgaca + 4081 ctcgtatcgt ctcaatctct gtcaaagata aacaaccaga agaagccagt cgtatcgcta + 4141 attctctacg agaagttgct gcagaaaaga tcgtcgctgt aacgcgagta tctgatgtaa + 4201 cgacacttga agaagcgcga ccagctacga ctccctcttc tccaaatgtt cgacgcaatt + 4261 ccttgtttgg ttttcttgga ggagcagtcg taacagtaat tgctgttctt ttgattgagt + 4321 tgctcgacac ccgtgtgaaa cgtcctgaag atgtcgaaga tgtactgcaa attccacttt + 4381 taggggtcgt tccagatttg aacaaaatga aataggagga agttatgcca acattagaaa + 4441 tctcacaggc aaaattggat tttgtaaaaa aggcagagga atattataac gctttgtgca + 4501 cgaacctaca gttaagtgga gatgatttga aagtattttc tatcacttct gtgaaactag + 4561 gagaaggaaa atcaacgact tccaccaata tcgcttgggc ttttgcgcat gcaggttaca + 4621 aaacgctgct gattgatgga gatattcgca attctgttat gttaggtgtc tttaaagcaa + 4681 gggataagat tacaggcctg acagaatttt tatcaggaac tacagaccta 
tcacaagggc + 4741 tttgtgatac caatgtcgaa aatctctttg taattcaggc tggctctgtg tcaccgaatc + 4801 cgacagctct tcttcaaagt aagaatttca gtacaatgct tgaaaccttg cgtaaatatt + 4861 ttgactacat cattgtagat actgctcctg tcggtgtcgt gattgatgcg gctattatta + 4921 cgcgaaaatg cgatgcttct attttagtga cggaggtaga tgaagtaaat cgacgggata + 4981 ttcaaaaagc aaaagaacag ttggaacaca caggaaagcc gtttttggga gttgtgttga + 5041 ataaattcga tacttcagta gacaaatacg gttcttatgg aaattatgga gattacggga + 5101 aaaataaaaa ataggtcggg ggattagaga tgaatggaaa aatagtaaag tcttcattgg + 5161 ccataatcca gagttttctt gttattttat tgacttatct acttagtgct gtgagagaag + 5221 cggagattgt ttcaacaaca gctattgcac tttatatcct ccattatttt gtcttttata + 5281 tcagtgatta tggacaggat ttctttaaaa gaggatattt gattgaactt gtccagacat + 5341 tgaaatatat cctattcttt gcactagcga ttagtatttc taattttttc ttagaggatc + 5401 gatttagtat ttccagacga ggcatgattt acttcctcac attacatgct ctcttagtct + 5461 atgtgctaaa cctatttatc aagtggtatt ggaagcgggc ttatcccaac tttaaaggaa + 5521 gtaagaagat tctcctactt acagcaactt ctcgtgtcga aaaggtactg gatagattaa + 5581 tagaatcaaa tgaggttgtt ggggagttgg tagccgtcag tgtcttagat aaaccagatt + 5641 ttcagcatga ttgtttaaag gtagtagcag agggggagat agtaaacttt gcgactcatg + 5701 aggtggtcga tgaagtcttt atcaatcttc caagtgaaaa atacaatatt ggagagcttg + 5761 tctctcagtt tgaaacgatg ggaattgatg taacagttaa tctaaatgct tttgatcgta + 5821 gtttggcacg taacaagcaa attcgtgaga tggcaggatt aaacgttgtg actttttcta + 5881 caacatttta taagactagt catgtaattg ctaagcggat tattgatatc atgggtgcat + 5941 tggtagggct gatactatgt ggtttagtca gtattgtact ggttcctttg attcgaaagg + 6001 atgggggctc tgctattttt gctcagacgc gtataggaaa aaatggtcgt cagttcactt + 6061 tttataagtt tcgctctatg tgtgtagatg ccgaggcgaa aaaaagagaa ctcatggaac + 6121 aaaataccat gcagggtgga atgtttaagg tggacgatga tcctcgtatc acgaaaattg + 6181 gtcgttttat acggaagact agcttggacg agctaccaca gttttataat gttctaaagg + 6241 gagatatgag tttggttggc acacggccac caacagtgga cgagtatgaa cactataccc + 6301 cagaacaaaa acgtcggcta agttttaaac ctggtataac aggcttatgg caggtcagtg + 6361 gacgaagtga 
gattaagaat tttgatgaag ttgtcaaatt agatgtggcc tatatagatg + 6421 gttggacaat ttggaaagac attgaaattt tattgaagac agttaaagtt gtatttatga + 6481 gagatggagc gaagtgattt ttgcccttca gtcttgttag gagagatatg aaacagtcag + 6541 tttatatcat tggttcaaag gggattcctg ccaagtatgg aggatttgaa acctttgttg + 6601 agaaattaac agaatatcaa aaagatggta acatccaata ctatgttgcc tgcatgcgcg + 6661 aaaattctgc aaagtcagga tttacagcag acacatttga gtacaacggt gctatttgtt + 6721 acaacattga tgtgcctaat attggtcctg ctagagccat tgcttacgat attgcagcgg + 6781 tcaataaggc tattgaattg tctaagggaa acaaggacga ggctcccatt ttttacattc + 6841 tagcttgtcg tatcggacct tttatttctg gacttaagaa aaaaattcgt tcgatcggag + 6901 gccgtttgct ggtaaatcca gatggtcatg agtggcttcg agctaaatgg agcttgccag + 6961 ttcggaagta ttggaaattt tcggaacagt tgatggtcaa acatgcagat ttattagtct + 7021 gtgatagcaa aaatatcgaa aaatatattc gagaggacta taaacagtat cagcccaaga + 7081 cgacttatat cgcctatgga acagatacaa gcaagtctat tttaaaacct gatgacgaaa + 7141 aagttcgtaa ttggtatcag gaaaaaggcg ttgctgaaaa cggatattat ctagttgtgg + 7201 gacgatttgt tcccgaaaac aactatgaaa ccatgattcg tgaatttatc aagtctaagt + 7261 ccaataagga ctttgtcctt attacaaatg tagaacaaaa taaattttac gatcagttgc + 7321 tcaaggatac aggctttgac aaagacccga gagtcaaatt tgttgggact gtctatgatc + 7381 aagaattgct caaatatatc cgagagaatg cttttaccta cttccatggc catgaagttg + 7441 gtgggacaaa cccatcgctt ttagaagctc ttgcttcaac aaagcttaat ttactgctag + 7501 atgttggctt taaccgtgaa gttggtgagg atggagccat ttactggaaa aaagatgagc + 7561 tagcgcatgt aatcgaagaa gtggaacgat ttgatgaagg tgctatttcg gaattagacg + 7621 aaaggtctag ccaacgaatt gcggatgcat ttacgtggga aaagattgtg tcagattatg + 7681 aggaagtgtt taaaggatag agaatgaaac ggattttata tttacatgct ggtgcagaaa + 7741 tgtatggagc agataaggtt ttattggaat tgatcaaagg attaaatcct caagaatttg + 7801 aagctcatat tatcctgcct aatgacggtg ttttagtcga agccctacgc caagttggcg + 7861 ctcaggttag cgtgttggat tatccgattt tacgtagaaa atactttaat cctaaaggga + 7921 ttttggaata tctgaaattt tatcgtcgtt actcccaaaa aattgcccaa tatgtgcgtg + 7981 aaaatggaat agatcttgta cataacaata 
caacagctgt cttggaagga atctatctca + 8041 aaagaaaggt gaaacttccc ttgatctggc acgttcatga gattattgtt aagcccaagg + 8101 ctatttcaga ttttattaac ttcttgatgg ggcgttatgc agataagatt gtaacagtct + 8161 ctcaagctgt ggccagtcat gtcaaacagt ctccctttat caaagagggt caggttcagg + 8221 ttatctataa cggagtggac aatgcgatct atcatccgat gcagtcaagt gcagtgcgtg + 8281 aaaaatttgg gatcccagag gatgctctcg tcattggtat ggttggacgt gtcaacgcgt + 8341 ggaaggggca aggagatttt ctagaagctg tgacaccgat tttggagcat aatccgaatt + 8401 ccgtagcttt tctagcgggg agtgcctttg ctggtgaaga gtggcgagtt gaagaattag + 8461 agtctaagat ttccaaatca agtgtagcct cacaaatcaa acgaattgaa tattatgagc + 8521 atacggctga actttataat atgtttgata tctttgtctt accaagtacc aatcccgatc + 8581 cactaccaac agtggtacta gaggctatgg cttgtggtaa gccagtagtc ggctaccgtc + 8641 atggtggtgt ctctgaaatg gttgttgaag gaaccaatgg cttactggca atcccaggac + 8701 aatcacaaga actatcggat gcgattttgg agttggtttc tgatccagaa aaacggctcc + 8761 aatttggcca agcatcagta agaagacaag gagaatcgtt ttctttggaa tcttatatcc + 8821 gtagtttctc agaattatat aagagttata aaaatgaata aagaaataat aaagaataaa + 8881 ttaaaactaa ttgtttatcc tatcattaat tttatttcta ggagaagatt aaaaaataaa + 8941 aaattcacca ttatttgtga taattgttgg gctggaaaag tgtaccaaga gttaggtttg + 9001 ccctaccaaa caccctttat cgggatgttt gttttttcgc ctgattatat caagatgctc + 9061 aagaatttga aatactattt gagcggaaat atctcgttga aatttgttaa ggaatcaaag + 9121 cacattgaaa actttgataa tgcttatcca attgcactcc ttgacgatat cgagcttcat + 9181 ttcttgcact atgcagatga aaaagaggct actcagaaat ggcaacgtcg tttagaaaga + 9241 attcattggg ataatttgta ttttaagttc aatgacaatg atgcttgtac ctatgacctt + 9301 atgagagaat ttgatcaatt accgtacaaa agtaaagtca ttttttcatc taagaattat + 9361 tctgatttac attcattaac ttattttaaa gagaaggaaa aagattgtag tgttggaatt + 9421 gatcttaaaa tctatcatcg ttatttcgat gttgtaaggt ggctgaatga aggcggagtg + 9481 gacttgagtt aatcagatta aaactaaaaa aggagttgtt aatatgtcta aaatgaaaat + 9541 tgcagtagtt gggactggtt atgttggttt atccatttct gtgttacttg cacaacacca + 9601 tcatgtagta gcagtagata ttgtaaaaga gaaagtagaa ttaattaata 
ataaaatttc + 9661 acctattcag gatgatttta ttgaaagata tctttcagaa agtaatttag atttagttgc + 9721 aacaatagac gctgaaacag cttataaaga tgcctctttt atcgtagtag cgacgccaac + 9781 aaattatgac tcagaaagaa atttttttga tacatcagca gttgaatcgg ttattcaaca + 9841 ggttcagaat gtgaattcta cagcaactat agtaataaaa tcaacagtcc ccgtgggttt + 9901 tactgattca attcgtaaaa aattaggaat ttcaaatctt ctattcagcc ctgaattttt + 9961 gcgcgaatca agagcacttt atgataactt atatccaagt cggatcatag ttggaacaga + 10021 tttaaatgat caaaaattaa ttgaaaaggc ccaagttttc tctaatcttt tagtgcaagg + 10081 tgctatcaaa aaagatatcc ctattttaat tatgggattt actgaagctg aagcagttaa + 10141 attatttgct aatacctact tagcattgcg ggtatcatat tttaatgaat tagatactta + 10201 tgcagagacc aaaggactag atactcaaaa aataattgag ggtgttagtt tagatccccg + 10261 tatcggaacc cattataata atccgagctt tgggtacggt ggatattgct taccaaagga + 10321 cactaagcaa cttttagcta attatgagaa tatcccagaa gaacttattg gggctatagt + 10381 acgtagcaat gcaacacgta aggattttat tgctaaacaa gttcttaaaa tggtgaatta + 10441 taataatcca gaagacgata tttctgtcag acagatggat aaagaagttg ttattgggat + 10501 ataccgatta actatgaaaa gtaacagtga taactttcgt cagagttcaa tacagggagt + 10561 tatgaaacgt attaaggata gaggagctaa agtaattatt tttgagccta ctctaaaaga + 10621 taatggtacg ttctttggga acgctgttat aaatgattta gaagagttca aagcaaagtg + 10681 cgatgcgatt attgcaaatc gttatgatga aatgttgaac gacgttaagg ataaagtata + 10741 tacacgagat atcttcagaa gagattaata aaaatatgaa aaaagtatta attgtccgaa + 10801 gtggacctta ccaagttact ccaaatgaat acaaccttca ggagcttgga ttagcttctg + 10861 ctctcagtca gcagggatac caatgtgacg tgatgtatta tcacaaaaca aaaaactatg + 10921 atcaattatt tgagaaaaac ggggaaaaaa ttaaagtatt ttggagaagg ggaataagat + 10981 tatttagaag tggaatttat ccccagattt taaaaaagaa atttttgagt cagtatgata + 11041 aaataattat ttccgagtat agccagatta tggcagtttt attgtctaga attcattcca + 11101 atgtatatat ttataatggt ccatactata atctatttaa gatccccatt attgaatcta + 11161 tgtacgattt tctttttgta agaatgctca ataagagaac caagacagtt ttctgcaaga + 11221 cagaaaaggc aaagcattat cttaaaaata agggattcaa tgattgtaaa 
gtagtgggcg + 11281 taggtctaga tgttgaaaag tttgaacaag aagaggaacc tacggagaat actatagaac + 11341 ttttaaaaag aatggagaat aagcaaaata ttctttatgt aggctcacta tcaaaaagaa + 11401 aaaacacagc tcatttaatt agaattttta atattttaaa atctaaaagt ggtaagaaaa + 11461 acgaacttca attggtattg attggtaagg atgagggtaa tattgttgaa aaaattaact + 11521 attcacggtt taaagatgat attatttatc aaccttattt aaagaactct cagcttcaat + 11581 ttatttaccc atcatcacaa ctatttgtgc tcccgtcgat tcaagagatt tttggtatgg + 11641 tattacttga ggcaatgtat tttaagttgt ctgttgtttc cagcgcaagt gctggaggag + 11701 agacactgat tcaagatggt ataaacggta aaattatgaa tgattttaat gatgaacact + 11761 gggtggattg tatagaaaat ctattaaata acccattgga attgaaacgg cttggagaat + 11821 gtgcccataa gcgaattacg gaacagttta tgtggtcttc aattgcgaga aaaataattg + 11881 agacatttga tgaaaggtaa gacttactat gaatttttgt tttgtgattt tgcattatcg + 11941 taccagcaat gacactatag agtgtatcaa atcgattcaa aagcttgagg gaaattataa + 12001 aattgtaatt gttgataacg cttctcaaaa tggcagtata gaaagggtag aagccttatt + 12061 tgcaaataat gacgagatag ttataataaa aaacacgaaa aacttaggat ttgctgcagg + 12121 aaataatatt ggatacgcct atgctcggac tcaaataaaa gctaatatga ttgctgtact + 12181 taataatgat attgttatta agcaaaaaga tttcattaat cgtatatttg aactctatag + 12241 aaattctcag tttcatatcg ctggtccaga cattgtctct cttgtagatg gtcatcatca + 12301 aagtcctgtt gttgagaaga tcaattctat atctaaggca aataaagaac tttttaaata + 12361 tagaatcttg agaattatta ataaaatagg attatatgag ctgatgacta gacagccaaa + 12421 aaaaaaatta aatagagtaa gtgctgcaga ccctatagga tatcaggaaa atgttatttt + 12481 acatgggagt tgtgtaattt tttcaccatt atatgtttca gaggaggagt ttgcttttag + 12541 accagatacg ttcatgtata tggaagagcc tattctatat gaatattgca tgcttaaaaa + 12601 ttataagaca gtatttgatc cttctattgt aatttatcat aaagaggact catcaacaaa + 12661 ttcgttgtat aatgcggcat atgcaaaaag agagtttgtt tttaaaaata tgattagatc + 12721 tctaaagatt tatagaagtc tattgaagta gtaaactagg gaaaggatag taattaaaaa + 12781 ttgaatctta gtatgttagc cttgacaata ggatcagtgg tatttgttaa aaaaacgtat + 12841 aggacgtttc tcaatcccat aattttattt gcaattttgt ggtttattat 
aacaactttg + 12901 tcaaatttaa aactattcca acttttcgag attagtactc atacacaaca aattattttg + 12961 cttgggactt ctctatttgt tataggggga gggatagcaa tttggtttcg ggataaattt + 13021 tattttaaag ttggcggtaa ctcatatttt acaacagact ttgaaattaa ttataatttg + 13081 ttctttttgc taggtatcat ttgtcttttc tattatttgc cagatttctt ttcctcactg + 13141 gtatcattaa taagaggtgg gaatttaaac ttagttagac aatctgcgca ggatgcagta + 13201 gataccagtg gattaaagaa tttcattgga acatttattg ttattcctag tgccatggta + 13261 ttagaaatat taggaatatt agatttctgg agcaataaaa aaggcagaaa actattttat + 13321 cttaatttag ctgtcatttt tgtaagagtt gttgcagatg ctggtagaac gcctctattt + 13381 aatgttgtca tatatttatt acttactgtt ttagcaaata ggttctctga aaaaactgaa + 13441 aagaagagaa aagttagtaa aattaagata gtaaattatg gtatgctagg ttcaattatc + 13501 ttatggctat caactttatc taggacaaca acctccgttt ataggattct ttatttttat + 13561 ttcgcaatgt ccccaatact attagaaaag tggagtagta tacttgattc tgaaaaatta + 13621 gtaacaaagg gtttggtttc gttgaacggt ttcttttttt caatctcata tgtacttaaa + 13681 aatctgttta gaataggtta ttctcaaaga gtattagaag catacacaat gattgcgaat + 13741 actgatgcaa tctggtataa tattgcacct ggtttgacca aggcaaatgc atatgtctct + 13801 ctgttttggt ttttttatgc ggatggacgt ttattaggag ttttaatagg atcccttcta + 13861 tatggtgcct tttgtggcta tatcttttgc aggtatatcc agcaacaaaa taaaaagaat + 13921 ttggctatgt tactatttat ttatcaaggt gtttttttct cttttattag atttccgttt + 13981 tcaaaatcaa attatgcaat tgcattcgta ctcttattat tttttgcttt taagaagaaa + 14041 ggaatagaga aaagtgttta atatcaatga ccagtctatt atttatgttg catgtcctta + 14101 ttttaataaa acaggtggaa cggagctcgt ccatcaatta gtttattcta ttaatcattt + 14161 tggggggaaa gctatcgttg cttattatgg tagtgaaagt gctccaaatg aggtgaatcc + 14221 tgcgtttaga gaatatgttt ctacgtttgt tgatataaaa gatgttattg actctcttga + 14281 taatattatt attttaccgg aaattaatcc ggatttagcc gctaatctag agtctattca + 14341 aaaagcagta tggtggatga gcgttgacaa ttatttgaag cgtaatggta ttttaggttc + 14401 cttggaacat tttggacttt tacgaacaat taaattattt gtaaaaggaa atattaaaat + 14461 aggtggatat agaatagata aagagattcc ccatctttat caaagtgaat 
acgccaagca + 14521 atttcttcta gctaaaggtg tcaaaaagta ctatagattg tctgattatt taaacgagtc + 14581 ttatattcag cgatctattt caacagacac taaaaaagat gttattcttt acaatcctaa + 14641 aaaagggatt gaatttactc gtgagctaat taaacaggct ccagaattaa cgttctctcc + 14701 aattgagaat atgtcaactg aacaggtgaa aaaattactt tcaaaaagca aagtatatat + 14761 tgattttggc aaccatcctg ggaaagatag attcccacgg gaggcagcga tatcaggttg + 14821 ttgtgtgata actgggaaac gaggttctgc aaaatattat aaggatattc ctattccaga + 14881 ttcatacaaa tttgaagaca ctgttgaaaa tatccccaac attattgaga ccctgaaatc + 14941 atgcttaaaa aattatgaca aacatactgt tgactttgag aaatatcaac aatatattaa + 15001 atctgaacat gatttatttg aaagagatgt gaaagaatta ttcactagga ataggggtta + 15061 aggttatgtc aaccagaaat tcacttatta aaaattctct ttataatgtt gcttatagaa + 15121 tgttaaatat catatttcca ttagtatccg caacatatac tgcacggata attttagcta + 15181 gtggagttgg ggaggtctcg tttgcacaaa atgttgtttc ttactttaca acgatagctg + 15241 ctatgggtat tccaaattat ggtatacgag aaattgctaa aactagaaat aaagaagagg + 15301 ctacgaataa agttttttca gagctatttc tgattaatgg attgtctaca ttactgtgtt + 15361 ctatagtata tttaattctg attttgacat tcaatagcat ttttgataat acatcaatgt + 15421 atcttgctgt gggtttaaca ttagtgttta acttccttaa tatcgattgg ttctatcaag + 15481 gaaaagagga ctatgcatac atcacgaaac gtagtttcag tataaaactt atttctcttt + 15541 ttagtttatt tatttttgtt agagatactg acgatgcagt taactatgca ttgatttcta + 15601 gcttagcaat tggcgggaat aatattttta atcttgttaa tttaaggaaa tataatatta + 15661 gatttagttt taataatatt aagattagaa gacacttaaa acctattttt gttttgttgg + 15721 gttcagtgat tgctattgaa atctatacta tgctggatac cactatgatt ggtgctatgg + 15781 taggaacgac tgaggtaggt tattatacaa attctatgaa gctagttaaa ttgctgataa + 15841 ctgtgattac cgctattgga ggagtgcttt taccacgact aagtgattat tattctaagg + 15901 gagaatttga aaaattaaat cacatcgttg ataaagtttt tagaatcatg ttgtttcttt + 15961 ttttaccagc ccaagttgca ttaattctag ttgcaccagt aattatgccg attttatttg + 16021 gtgatagttt tataccagca gtgttaacac ttcaacttac ttctttgctt atatgtacat + 16081 tagggtttag taatttattt gggactcaaa tattactaac atttggagat 
gagcgaaagc + 16141 ttttgattag cacaatttta ggagcgctta gtaatatcgc tttgaaccta attctgattc + 16201 cagtaatggc tcaaaatgga gcagcgttgg catctgtgat tagtgaaaca attgttactt + 16261 taacagcata ctactatgcg aaaaaacgtg tgacaattag gtttgactta ggattttatt + 16321 tgccaactgt tgtttcaaca ataatcatgg gtggagctat atatgtagta atgcaattgt + 16381 atattgggga tatagaaaaa atgttatttt caactttgtt aggaggtgtt gtattccttt + 16441 taattaacgt ttttatgaag aatcctatta tatatgaatt tacaggtatt ataaagagaa + 16501 agagataatt atgtacgact atttaatcgt tggagcgggt ttgtctggag caatcttcgc + 16561 acacgaagct acaaagcgtg gaaaaaaagt aaaagtgatt gataaacgcg atcacattgg + 16621 agggaacata tactgtgaga atgtagaagg tatcaatgtt cataaatatg gtgcccatat + 16681 cttccatact tctaataaaa aagtctggga ctacgtcaat caatttgctg agtttaacaa + 16741 ctatatcaac tcacctgtcg caaactataa gggaagtctt tataaccttc ctttcaatat + 16801 gaataccttc tatgctatgt ggggcacaaa aactccacaa gaagtgaagg ataagattgc + 16861 tgagcagaca gctggtatga aggatgttga gccgaaaaat ctggaagaac aagctatcaa + 16921 gttgattggt ccggatatct atgaaaagtt gatcaagggt tatacagaaa agcaatgggg + 16981 acgctcagcg atagaacttc ctccatttat cataaaacgc cttccagttc gtttaacctt + 17041 tgataataac tattttaatg accgttacca agggattcct attggtggtt acaatgtcat + 17101 catcgaaaat atgctgaaag atgtagaagt tgaacttgga gtagactttt ttgctcatcg + 17161 tgaagagttg gaagcatctg ctaacaaagt tgtcttcaca ggaatgatcg accaatattt + 17221 tgactacaag cacggagagt tagaataccg tagccttcgt tttgagcatg agattttaga + 17281 cgaggaaaat tatcaaggga atgctgtagt gaactataca gagcgtgaga tcccttatac + 17341 tcgtatcatc gaacacaaac attttgaata tggaatgcag ccaaagacag ttatcacgca + 17401 tgaatatcca gctgactgga agcgtgggga cgagccctac tatcctatta acgatgagaa + 17461 aaataatgct atgtttgcta aataccaaga agaagcagcg cagaatgata aagttatctt + 17521 ttgtgggcgt ttagcagatt ataagtatta cgatatgcat gtggtgattg aacgggcgct + 17581 tgaggttgtg gagaaagaat ttagtaattg aaaaacaacg aagaaaggtt gcttattatg + 17641 aaaggtatta ttctagcagg tggttcggga actcgcttgt atcctttgac tcgagccgca + 17701 tcaaaacaac ttatgccggt ttatgataaa ccgatgattt actacccact 
ttcaacatta + 17761 atgttggctg ggattaggga tattttgatt atctcaactc ctcaagattt gcctcgtttt + 17821 aaagagcttc ttcaagatgg ttccgagttt ggtattaaac tttcttatgc tgagcaacca + 17881 agtccagatg gtttggcaca agcctttatc attggggaag agtttatttc tgatgatagc + 17941 gttgcgctaa tcttaggtga taatatctac catggttctg ggctttccaa gatgctacaa + 18001 aaggcagcga gtaaggagtc gggagcaact gtttttggct accatgtcaa ggatccagag + 18061 cgctttggtg tggttgagtt tgatcaggat atgaaggcta tttctattga agaaaagcca + 18121 gagcaacctc gttcaaacta tgcagttaca ggtctctatt tctatgataa tgatgtagta + 18181 gagattgcca agagtattaa accaagtcct cgtggtgaac tggaaattac agatgtaaac + 18241 aaagcttacc tagatcgtgg tgatttgtct gttgagctta tgggacgtgg ctttgcttgg + 18301 ctggatactg gaactcatga aagtttacta gaggcttcac agtacatcga aacagtccaa + 18361 cggatgcaaa atgttcaggt agcaaactta gaagaaattg cctatcgcat gggttatatc + 18421 agtcgtgaag atgtattgac cttagctcaa ccacttaaga aaaatgaata cggacagtat + 18481 ctgctccgtt tgattggaga agcatagatg acagataatt ttttcggtaa gacgcttgcg + 18541 gcacgcaagg ttgaagctat tccaggcatg ttggagtttg atatccccgt tcatggagat + 18601 aatcgtggct ggtttaaaga aaatttccaa aaggaaaaaa tgcttccact tggatttcca + 18661 gagtctttct ttgcagaagg aaaattgcaa aacaatgtat ccttctcacg taaaaatgtc + 18721 cttcgagggc tccacgcaga gccttgggat aagtacatct ctgtagcaga tggagggaaa + 18781 gttctgggtt cttgggttga tctacgcgag ggtgaaacct ttgggaatac ctatcagaca + 18841 gtaattgatg caagcaaggg aatctttgtt cctcgaggcg tagctaatgg cttccaagtt + 18901 ctatcagata cagtgtcata tagctatctg gtcaatgatt actgggctct cgagctcaaa + 18961 cccaagtatg cctttgtgaa ctacgctgat ccaagccttg gtattgaatg ggaaaatatt + 19021 gcagaagcag aggtttcaga agcagataaa catcatcccc tacttaagga tgtaaaacct + 19081 ttgaaaaaag aagatttgta aaaaggaaag aatatgactg aatacaaaaa tattatcgtg + 19141 acaggtggag ctggctttat cggttctaac tttgtccatt atgtttacga gaactttcca + 19201 ggtgttcacg tgacagtcct agataagttg acttatgctg gaaatcgcgc gaatattgag + 19261 gaaattttag gtaatcgtgt tgagttagtt gttggtgaca ttgctgatgc ggagttggta + 19321 gacaagttgg ctgctcaagc agatgctatc gttcattatg cagcggaaag 
ccacaatgat + 19381 aattcgctca atgatccatc gccatttatt catactaact tcatcggaac ctatactctt + 19441 ttagaagctg ctcgtaagta tgatattcgc ttccaccatg tatcgacaga tgaagtttat + 19501 ggggatctcc ctttacgcga agatttgcca ggtcatggtg aaggaccagg tgagaaattt + 19561 actgctgaaa caaaatacaa cccaagctct ccgtactcat caaccaaggc agcctcagat + 19621 ttgattgtca aagcctgggt gcgttctttt ggagtcaagg caacgatttc caactgttca + 19681 aataactacg gtccttatca acatatcgaa aaattcatcc cacgtcagat tactaacatc + 19741 ctaagtggaa ttaagccaaa actttacggt gaaggtaaga atgttcgtga ctggattcat + 19801 accaatgacc attcttcagg agtttggaca atcttgacaa aagggcaaat cggtgaaacc + 19861 tacttgattg gggctgatgg tgagaagaac aataaggaag ttttggaact tatccttaag + 19921 gaaatgggac aagctacgga tgcctatgat catgtgactg accgtgcagg acatgacctt + 19981 cgctatgcga ttgatgccag caagctccgt gatgagttgg ggtggaaacc tgaatttacc + 20041 aactttgaag ctgggctcaa ggcaacaatc aagtggtata cagataacca agaatggtgg + 20101 aaagcagaaa aagaagctgt tgaagccaat tatgctaaga ctcaggagat tattacagta + 20161 taaaaagcag gaaatagctg ctttttattg ctatattggg aagagttaca tattagaaag + 20221 gtctagagat gattttaatt acaggggcaa atggccaatt aggaacggaa cttcgctatt + 20281 tattggatga acgtaatgaa gaatacgtgg cagtagatgt ggctgagatg gacattacca + 20341 atgaagaaat ggttgagaaa gtttttgaag aggtgaaacc gactttagtc taccattgtg + 20401 cagcctacac cgctgttgat gcagcagagg atgaaggaaa agagttggac ttcgccatca + 20461 atgtgacggg gacaaaaaat gtcgcaaaag catctgaaaa gcatggtgca actctagttt + 20521 atatttctac ggactatgtc tttgacggta agaaaccagt tggacaagag tgggaagttg + 20581 atgaccgacc agatccacag acagaatatg gacgcactaa gcgtatgggg gaagagttag + 20641 ttgagaagca tgtgtctaat ttctatatta tccgtactgc ctgggtattt ggaaattatg + 20701 gcaaaaactt cgtttttacc atgcaaaatc ttgcgaaaac tcataagact ttaacagttg + 20761 taaatgacca gtacggtcgt ccgacttgga ctcgtacctt ggctgagttc atgacctacc + 20821 tagctgaaaa tcgtaaggaa tttggttatt atcatttgtc aaatgatgcg acagaagaca + 20881 caacatggta tgattttgca gttgaaattt tgaaagatac agatgtcgaa gtcaagccag + 20941 tagattccag tcaatttcca gccaaagcta aacgtccgct aaactcaacg 
atgagcctgg + 21001 ccaaagccaa agctactgga tttgttattc caacttggca agatgcattg caagaatttt + 21061 acaaacaaga agtgagataa gtagtagaat gattttctag tctaataaaa gaggcagaga + 21121 atgaactcca aaggagctta agatgtacga ttatcttgtt gttggtgcag tctttgccca + 21181 tgaagcagtc ttaaaaggaa aaaaagtaaa agttattgaa aaatgaaatc atatcgcggg + 21241 taatatctat actcgtgaag aggaaggaat tcaagttcat caatatggtg ctcatatctt + 21301 ccatacttct gataaggaga tctgggatta tgtaaatcag tttgcagagt ttaaccgtta + 21361 taccaattct cctgttgcaa actataaggg agagatttat aacttacctt ttaatatgaa + 21421 taccttcaat aaactctggg gagttgtgac gccagcagaa gcacaagcta agattgatga + 21481 acaacgtgct attttaaatg gtaaaactcc tgaaaatttg gaagaacagg cgatttctct + 21541 tgtaggtaca gacatctacg aaaaattaat caaagactat acagagaaac agtggggcaa + 21601 accaactact gaacttccat cctttattat tcgccgttta ccagtacacc tgacctatga + 21661 taacaactat tttaacgata cctatcaagg gattccaatt ggtggttata atgttatcat + 21721 cgaaaatatg ctgaaggatg tagaagtaga acttggagtg aacttttttg ccaatcgtca + 21781 agaattagag gcttctgctg aaaaggttgt ctttacaggg atgattgacc aatactttga + 21841 ttataaacat ggtgagttag aatactgtag tcttcgtttt gatcatgaag ttctagatga + 21901 ggaaaactat caaggaaacg cagttgtgaa ctatacggat gcagaaaccc catatactcg + 21961 cattattgaa cacaaacatt ttgagtttgg gagtcaagca aagactatca ttactaatag + 22021 aacattctaa aacatgggaa aaaggtgatg agccttatta tccagttaat aatgatcgta + 22081 ataatcattt gtataaatca tataaaaaac ttgctgatga gcaagggaat gttatctttg + 22141 gtggccgctt aggacactat cgttattacg atatgcacca agtaattgga gcagctttgc + 22201 agtgcgtgag aaatgagtta gattcatact caatgaaaat caaagagcaa actaggaagc + 22261 tagccgtagg ttgctcaaaa cactgttttg aggttgcaga tggaagctga cgcggtttga + 22321 agagattttc gaagagtata aacaagtaaa actgactacc agttattatt tagaaatagt + 22381 attaaaaatt ccttgactat gtgatatagt tgagggattt ttaaatgata ttcatatttt + 22441 ttgcaaagat gttgtttgaa aaataatttt caaaaattct gaaaattctg ttgacaactt + 22501 tctgaaaaga gtctataatg gagagaaagt tttaaaggag aaaatgatga aaagttcaaa + 22561 actatttgcc cttgcgggcg tgacattatt g +// + diff --git 
a/public/res/serotype_genbank/serotype_22F.gb b/public/res/serotype_genbank/serotype_22F.gb new file mode 100644 index 0000000..11d2ce6 --- /dev/null +++ b/public/res/serotype_genbank/serotype_22F.gb @@ -0,0 +1,1061 @@ +LOCUS CR931682 22696 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 1772/40 (serotype 22f). +ACCESSION CR931682 +VERSION CR931682.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 22696) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 22696) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..22696 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="1772/40" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC22F_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC22F_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI33784.1" + /db_xref="UniProtKB/TrEMBL:Q4JZI8" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVELL" + gene 293..461 + /gene="aliB" + /locus_tag="SPC22F_0002" + /pseudo + CDS 293..461 + /gene="aliB" + /locus_tag="SPC22F_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(order(462..974,976..1305)) + /gene="tnp" + /locus_tag="SPC22F_0003" + /pseudo + CDS complement(join(462..974,976..1305)) + /gene="tnp" + /locus_tag="SPC22F_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(join(915..974,976..1287)) + /gene="tnp" + /locus_tag="SPC22F_0003" + /note="HMMPfam hit to PF01710, Transposase, score 6e-23" + /pseudo + gene 1536..2981 + /gene="wzg" + /locus_tag="SPC22F_0004" + CDS 1536..2981 + /gene="wzg" + /locus_tag="SPC22F_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33787.1" + /db_xref="GOA:Q4K0M6" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K0M6" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VDQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + 
EALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDLPSY + AMPDSNLYVLEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1536..1652 + /gene="wzg" + /locus_tag="SPC22F_0004" + /note="Signal peptide predicted for SPC1138 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 39 and 40" + misc_feature 1740..2087 + /gene="wzg" + /locus_tag="SPC22F_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 6.7e-65" + misc_feature 2265..2708 + /gene="wzg" + /locus_tag="SPC22F_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 5.7e-70" + gene 2983..3714 + /gene="wzh" + /locus_tag="SPC22F_0005" + CDS 2983..3714 + /gene="wzh" + /locus_tag="SPC22F_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33788.1" + /db_xref="GOA:Q4K0M5" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K0M5" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRIIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEQDLVHVIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 2986..3594 + /gene="wzh" + /locus_tag="SPC22F_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 6.1e-37" + gene 3720..4415 + /gene="wzd" + /locus_tag="SPC22F_0006" + CDS 3720..4415 + /gene="wzd" + /locus_tag="SPC22F_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33789.1" + /db_xref="GOA:Q4K0M4" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K0M4" + /translation="MMKEQNTIEIDVFQLFKTLWKRKLMILIVALVTGAGAFAYSTFI + VKPEYTSTTRIYVVNRDQGDKPGLTNQDLQAGSYLVKDYREIILSQNVLEKVATNLKL + 
DMPTKTLASKVKVTVPTDTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIELLDTRVKRPEDVEDVLQI + PLLGVVPDLNKMK" + misc_feature 3720..3836 + /gene="wzd" + /locus_tag="SPC22F_0006" + /note="Signal peptide predicted for SPC1140 by SignalP 2.0 + HMM (Signal peptide probability 0.625) with cleavage site + probability 0.411 between residues 39 and 40" + misc_feature 3741..4157 + /gene="wzd" + /locus_tag="SPC22F_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 5.8e-56" + misc_feature 4263..4340 + /gene="wzd" + /locus_tag="SPC22F_0006" + /note="PS00217 Sugar transport proteins signature 2." + gene 4425..5114 + /gene="wze" + /locus_tag="SPC22F_0007" + CDS 4425..5114 + /gene="wze" + /locus_tag="SPC22F_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33790.1" + /db_xref="GOA:Q4K0M3" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K0M3" + /translation="MPTLEISQAKLDFVKKAEEYYNALCTNLQLSGDDLKVFSITSVK + LGEGKSTTSTNIAWAFAHAGYKTLLIDGDIRNSVMLGVFKARDKITGLTEFLSGTTDL + SQGLCDTNVENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRKCDASILVTEVDEVNRRDIQKAKEQLEHTGKPFLGVVLNKFDTSVDKYGSY + GNYGDYGKNKK" + gene 5130..6497 + /gene="wchA" + /locus_tag="SPC22F_0008" + CDS 5130..6497 + /gene="wchA" + /locus_tag="SPC22F_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI33791.1" + /db_xref="GOA:Q4K0M2" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K0M2" + /translation="MNGKIVKSSLAIIQSFLVILLTYLLSAVREAEIVSTTAIALYIL + HYFVFYISDYGQDFFKRGYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYF + LTLHALLVYVLNLFIKWYWKRAYPNFKGSKKILLLTATSRVEKVLDRLIESNEVVGEL + VAVSVLDKPDFQHDCLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + 
IDVTVNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHVIAKRIIDIMGALVGLIL + CGLVSIVLVPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYIDGWTIWKDIEILLKTVKVVFM + RDGAK" + misc_feature 5130..5222 + /gene="wchA" + /locus_tag="SPC22F_0008" + /note="Signal peptide predicted for SPC1142 by SignalP 2.0 + HMM (Signal peptide probability 0.902) with cleavage site + probability 0.355 between residues 31 and 32" + misc_feature 5913..6494 + /gene="wchA" + /locus_tag="SPC22F_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 2.8e-159" + gene 6528..7700 + /gene="wchF" + /locus_tag="SPC22F_0009" + CDS 6528..7700 + /gene="wchF" + /locus_tag="SPC22F_0009" + /note="member of homology group 15" + /codon_start=1 + /transl_table=11 + /product="putative rhamnosyl transferase WchF" + /protein_id="CAI33792.1" + /db_xref="GOA:Q4K0M1" + /db_xref="InterPro:IPR001296" + /db_xref="InterPro:IPR015393" + /db_xref="UniProtKB/TrEMBL:Q4K0M1" + /translation="MKQSVYIIGSKGIPAKYGGFETFVEKLTEYQKDGNIQYYVACMR + ENSAKSGFTADTFEYNGAICYNIDVPNIGPARAIAYDIAAVNKAIELSKGNKDEAPIF + YILACRIGPFISGLKKKIRSIGGRLLVNPDGHEWLRAKWSLPVRKYWKFSEQLMVKHA + DLLVCDSKNIEKYIREDYKQYQPKTTYIAYGTDTSKSILKPDDEKVRNWYQEKGVAEN + GYYLVVGRFVPENNYETMIREFIKSKSNKDFVLITNVEQNKFYDQLLKDTGFDKDPRV + KFVGTVYDQELLKYIRENAFTYFHGHEVGGTNPSLLEALASTKLNLLLDVGFNREVGE + DGAIYWKKDELAHVIEEVERFDEGAISELDERSSQRIADAFTWEKIVSDYEEVFKG" + gene 7704..8861 + /gene="wcwA" + /locus_tag="SPC22F_0010" + CDS 7704..8861 + /gene="wcwA" + /locus_tag="SPC22F_0010" + /note="member of homology group 63" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33793.1" + /db_xref="GOA:Q4K0M0" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K0M0" + /translation="MKRILYLHAGAEMYGADKVLLELIKGLNPQEFEAHIILPNDGVL + VEALRQVGAQVSVLDYPILRRKYFNPKGILEYLKFYRRYSQKIAQYVRENGIDLVHNN + TTAVLEGIYLKRKVKLPLIWHVHEIIVKPKAISDFINFLMGRYADKIVTVSQAVASHV + 
KQSPFIKEGQVQVIYNGVDNAIYHPMQSSAVREKFGIPEDALVIGMVGRVNAWKGQGD + FLEAVTPILEHNPNSVAFLAGSAFAGEEWRVEELESKISKSSVASQIKRIEYYEHTTE + LYNMFDIFVLPSTNPDPLPTVVLEAMACGKPVVGYRHGGVSEMVVEGTNGLLAIPGQS + QELSDAILELVSDPEKRLQFGQASVRRQGESFSLESYIRSFSELYKSYKNE" + misc_feature 8265..8786 + /gene="wcwA" + /locus_tag="SPC22F_0010" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 2.7e-32" + gene 8854..9492 + /gene="wcwC" + /locus_tag="SPC22F_0011" + CDS 8854..9492 + /gene="wcwC" + /locus_tag="SPC22F_0011" + /note="member of homology group 48" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI33794.1" + /db_xref="GOA:Q4K0L9" + /db_xref="InterPro:IPR015037" + /db_xref="UniProtKB/TrEMBL:Q4K0L9" + /translation="MNKEIIKNKLKLIVYPIINFISRRRLKNKKFTIICDNCWAGKVY + QELGLPYQTPFIGMFVFSPDYIKMLKNLKYYLSGNISLKFVKESKHIENFDNAYPIAL + LDDIELHFLHYADEKEATQKWQRRLERIHWDNLYFKFNDNDACTYDLMREFDQLPYKS + KVIFSSKNYSDLHSLTYFKEKEKDCSVGIDLKIYHRYFDVVRWLNEGGVDLS" + gene 9524..10768 + /gene="ugd" + /locus_tag="SPC22F_0012" + CDS 9524..10768 + /gene="ugd" + /locus_tag="SPC22F_0012" + /note="member of homology group 20" + /codon_start=1 + /transl_table=11 + /product="UDP-glucose 6-dehydrogenase Ugd" + /protein_id="CAI33795.1" + /db_xref="GOA:Q4K0L8" + /db_xref="InterPro:IPR001732" + /db_xref="InterPro:IPR008927" + /db_xref="InterPro:IPR013328" + /db_xref="InterPro:IPR014026" + /db_xref="InterPro:IPR014027" + /db_xref="InterPro:IPR014028" + /db_xref="InterPro:IPR016040" + /db_xref="InterPro:IPR017476" + /db_xref="UniProtKB/TrEMBL:Q4K0L8" + /translation="MSKMKIAVVGTGYVGLSISVLLAQHHHVVAVDIVKEKVELINNK + ISPIQDDFIERYLSESNLDLVATIDAETAYKDASFIVVATPTNYDSERNFFDTSAVES + VIQQVQNVNSTATIVIKSTVPVGFTDSIRKKLGISNLLFSPEFLRESRALYDNLYPSR + IIVGTDLNDQKLIEKAQVFSNLLVQGAIKKDIPILIMGFTEAEAVKLFANTYLALRVS + YFNELDTYAETKGLDTQKIIEGVSLDPRIGTHYNNPSFGYGGYCLPKDTKQLLANYEN + IPEELIGAIVRSNATRKDFIAKQVLKMVNYNNPEDDISVRQMDKEVVIGIYRLTMKSN + SDNFRQSSIQGVMKRIKDRGAKVIIFEPTLKDNGTFFGNAVINDLEEFKAKCDAIIAN + 
RYDEMLNDVKDKVYTRDIFRRD" + misc_feature 9524..9613 + /gene="ugd" + /locus_tag="SPC22F_0012" + /note="Signal peptide predicted for SPC1146 by SignalP 2.0 + HMM (Signal peptide probability 0.931) with cleavage site + probability 0.611 between residues 30 and 31" + misc_feature 9533..10090 + /gene="ugd" + /locus_tag="SPC22F_0012" + /note="HMMPfam hit to PF03721, UDP-glucose/GDP-mannose + dehydrogenase, score 1.2e-45" + misc_feature 9533..10045 + /gene="ugd" + /locus_tag="SPC22F_0012" + /note="HMMPfam hit to PF01210, NAD-dependent + glycerol-3-phosphate deh, score 0.00017" + misc_feature 10118..10399 + /gene="ugd" + /locus_tag="SPC22F_0012" + /note="HMMPfam hit to PF00984, UDP-glucose/GDP-mannose + dehydrogenase, score 5e-38" + misc_feature 10496..10747 + /gene="ugd" + /locus_tag="SPC22F_0012" + /note="HMMPfam hit to PF03720, UDP-glucose/GDP-mannose + dehydrogenase, score 1.1e-06" + gene 10776..11900 + /gene="wcwV" + /locus_tag="SPC22F_0013" + CDS 10776..11900 + /gene="wcwV" + /locus_tag="SPC22F_0013" + /note="member of homology group 165" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33796.1" + /db_xref="GOA:Q4K0L7" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K0L7" + /translation="MKKVLIVRSGPYQVTPNEYNLQELGLASALSQQGYQCDVMYYHK + TKNYDQLFEKNGEKIKVFWRRGIRLFRSGIYPQILKKKFLSQYDKIIISEYSQIMAVL + LSRIHSNVYIYNGPYYNLFKIPIIESMYDFLFVRMLNKRTKTVFCKTEKAKHYLKNKG + FNDCKVVGVGLDVEKFEQEEEPTENTIELLKRMENKQNILYVGSLSKRKNTAHLIRIF + NILKSKSGKKNELQLVLIGKDEGNIVEKINYSRFKDDIIYQPYLKNSQLQFIYPSSQL + FVLPSIQEIFGMVLLEAMYFKLSVVSSASAGGETLIQDGINGKIMNDFNDEHWVDCIE + NLLNNPLELKRLGECAHKRITEQFMWSSIARKIIETFDER" + misc_feature 11322..11834 + /gene="wcwV" + /locus_tag="SPC22F_0013" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 5.1e-24" + gene 11909..12751 + /gene="whaB" + /locus_tag="SPC22F_0014" + CDS 11909..12751 + /gene="whaB" + /locus_tag="SPC22F_0014" + /note="member of homology group 120" + /codon_start=1 + 
/transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33797.1" + /db_xref="GOA:Q4K0L6" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K0L6" + /translation="MNFCFVILHYRTSNDTIECIKSIQKLEGNYKIVIVDNASQNGSI + ERVEALFANNDEIVIIKNTKNLGFAAGNNIGYAYARTQIKANMIAVLNNDIVIKQKDF + INRIFELYRNSQFHIAGPDIVSLVDGHHQSPVVEKINSISKANKELFKYRILRIINKI + GLYELMTRQPKKKLNRVSAADPIGYQENVILHGSCVIFSPLYVSEEEFAFRPDTFMYM + EEPILYEYCMLKNYKTVFDPSIVIYHKEDSSTNSLYNAAYAKREFVFKNMIRSLKIYR + SLLK" + misc_feature 11918..12460 + /gene="whaB" + /locus_tag="SPC22F_0014" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 3.7e-13" + gene 12781..14061 + /gene="wzy" + /locus_tag="SPC22F_0015" + CDS 12781..14061 + /gene="wzy" + /locus_tag="SPC22F_0015" + /note="member of homology group 166" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33798.1" + /db_xref="UniProtKB/TrEMBL:Q4K0L5" + /translation="MNLSMLALTIGSVVFVKKTYRTFLNPIILFAILWFIITTLSNLK + LFQLFEISTHTQQIILLGTSLFVIGGGIAIWFRDKFYFKVGGNSYFTTDFEINYNLFF + LLGIICLFYYLPDFFSSLVSLIRGGNLNLVRQSAQDAVDTSGLKNFIGTFIVIPSAMV + LEILGILDFWSNKKGRKLFYLNLAVIFVRVVADAGRTPLFNVVIYLLLTVLANRFSEK + TEKKRKVSKIKIVNYGMLGSIILWLSTLSRTTTSVYRILYFYFAMSPILLEKWSSILD + SEKLVTKGLVSLNGFFFSISYVLKNLFRIGYSQRVLEAYTMIANTDAIWYNIAPGLTK + ANAYVSLFWFFYADGRLLGVLIGSLLYGAFCGYIFCRYIQQQNKKNLAMLLFIYQGVF + FSFIRFPFSKSNYAIAFVLLLFFAFKKKGIEKSV" + gene 14054..15061 + /gene="wcwX" + /locus_tag="SPC22F_0016" + CDS 14054..15061 + /gene="wcwX" + /locus_tag="SPC22F_0016" + /note="member of homology group 167" + /codon_start=1 + /transl_table=11 + /product="conserved hypothetical protein" + /protein_id="CAI33799.1" + /db_xref="UniProtKB/TrEMBL:Q4K0L4" + /translation="MFNINDQSIIYVACPYFNKTGGTELVHQLVYSINHFGGKAIVAY + YGSESAPNEVNPAFREYVSTFVDIKDVIDSLDNIIILPEINPDLAANLESIQKAVWWM + SVDNYLKRNGILGSLEHFGLLRTIKLFVKGNIKIGGYRIDKEIPHLYQSEYAKQFLLA + KGVKKYYRLSDYLNESYIQRSISTDTKKDVILYNPKKGIEFTRELIKQAPELTFSPIE + 
NMSTEQVKKLLSKSKVYIDFGNHPGKDRFPREAAISGCCVITGKRGSAKYYKDIPIPD + SYKFEDTVENIPNIIETLKSCLKNYDKHTVDFEKYQQYIKSEHDLFERDVKELFTRNR + G" + gene 15066..16508 + /gene="wzx" + /locus_tag="SPC22F_0017" + CDS 15066..16508 + /gene="wzx" + /locus_tag="SPC22F_0017" + /note="member of homology group 47" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33800.1" + /db_xref="GOA:Q4K0L3" + /db_xref="InterPro:IPR002528" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K0L3" + /translation="MSTRNSLIKNSLYNVAYRMLNIIFPLVSATYTARIILASGVGEV + SFAQNVVSYFTTIAAMGIPNYGIREIAKTRNKEEATNKVFSELFLINGLSTLLCSIVY + LILILTFNSIFDNTSMYLAVGLTLVFNFLNIDWFYQGKEDYAYITKRSFSIKLISLFS + LFIFVRDTDDAVNYALISSLAIGGNNIFNLVNLRKYNIRFSFNNIKIRRHLKPIFVLL + GSVIAIEIYTMLDTTMIGAMVGTTEVGYYTNSMKLVKLLITVITAIGGVLLPRLSDYY + SKGEFEKLNHIVDKVFRIMLFLFLPAQVALILVAPVIMPILFGDSFIPAVLTLQLTSL + LICTLGFSNLFGTQILLTFGDERKLLISTILGALSNIALNLILIPVMAQNGAALASVI + SETIVTLTAYYYAKKRVTIRFDLGFYLPTVVSTIIMGGAIYVVMQLYIGDIEKMLFST + LLGGVVFLLINVFMKNPIIYEFTGIIKRKR" + misc_feature 15084..15893 + /gene="wzx" + /locus_tag="SPC22F_0017" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 5e-47" + gene 16511..17611 + /gene="glf" + /locus_tag="SPC22F_0018" + CDS 16511..17611 + /gene="glf" + /locus_tag="SPC22F_0018" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI33801.1" + /db_xref="GOA:Q4K0L2" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR006076" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K0L2" + /translation="MYDYLIVGAGLSGAIFAHEATKRGKKVKVIDKRDHIGGNIYCEN + VEGINVHKYGAHIFHTSNKKVWDYVNQFAEFNNYINSPVANYKGSLYNLPFNMNTFYA + MWGTKTPQEVKDKIAEQTAGMKDVEPKNLEEQAIKLIGPDIYEKLIKGYTEKQWGRSA + IELPPFIIKRLPVRLTFDNNYFNDRYQGIPIGGYNVIIENMLKDVEVELGVDFFAHRE + ELEASANKVVFTGMIDQYFDYKHGELEYRSLRFEHEILDEENYQGNAVVNYTEREIPY + 
TRIIEHKHFEYGMQPKTVITHEYPADWKRGDEPYYPINDEKNNAMFAKYQEEAAQNDK + VIFCGRLADYKYYDMHVVIERALEVVEKEFSN" + misc_feature 16946..17548 + /gene="glf" + /locus_tag="SPC22F_0018" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 4.4e-138" + gene 17638..18507 + /gene="rmlA" + /locus_tag="SPC22F_0019" + CDS 17638..18507 + /gene="rmlA" + /locus_tag="SPC22F_0019" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI33802.1" + /db_xref="GOA:Q4K0L1" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q4K0L1" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLPRFKELLQDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFISDDSV + ALILGDNIYHGSGLSKMLQKAASKESGATVFGYHVKDPERFGVVEFDQDMKAISIEEK + PEQPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLTLAQPLKKN + EYGQYLLRLIGEA" + misc_feature 17641..18357 + /gene="rmlA" + /locus_tag="SPC22F_0019" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 1.4e-119" + gene 18508..19101 + /gene="rmlC" + /locus_tag="SPC22F_0020" + CDS 18508..19101 + /gene="rmlC" + /locus_tag="SPC22F_0020" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI33803.1" + /db_xref="GOA:Q7BTQ6" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:Q7BTQ6" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKHHPLLKDVKPLKKEDL" + misc_feature 18544..19074 + /gene="rmlC" + /locus_tag="SPC22F_0020" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 8.8e-16" + 
gene 19114..20163 + /gene="rmlB" + /locus_tag="SPC22F_0021" + CDS 19114..20163 + /gene="rmlB" + /locus_tag="SPC22F_0021" + /EC_number="4.2.1.46" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI33804.1" + /db_xref="GOA:Q4K121" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K121" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPGVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQATD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 19129..20085 + /gene="rmlB" + /locus_tag="SPC22F_0021" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 7.1e-05" + misc_feature 19132..19968 + /gene="rmlB" + /locus_tag="SPC22F_0021" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.0039" + misc_feature 19132..19872 + /gene="rmlB" + /locus_tag="SPC22F_0021" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 2.7e-76" + misc_feature 19135..19947 + /gene="rmlB" + /locus_tag="SPC22F_0021" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 1.6e-05" + gene 20229..21080 + /gene="rmlD" + /locus_tag="SPC22F_0022" + CDS 20229..21080 + /gene="rmlD" + /locus_tag="SPC22F_0022" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI33805.1" + /db_xref="GOA:Q4K1G6" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K1G6" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITNEEMVEK + 
VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 20229..21077 + /gene="rmlD" + /locus_tag="SPC22F_0022" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 4e-147" + misc_feature 20232..20873 + /gene="rmlD" + /locus_tag="SPC22F_0022" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.00013" + misc_feature 20232..20861 + /gene="rmlD" + /locus_tag="SPC22F_0022" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 9.9e-19" + misc_feature 20235..20963 + /gene="rmlD" + /locus_tag="SPC22F_0022" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 2.9e-08" + gene order(21125..21223,21227..22310) + /gene="glf" + /locus_tag="SPC22F_0023" + /pseudo + CDS join(21125..21223,21227..22027,22020..22310) + /gene="glf" + /locus_tag="SPC22F_0023" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /pseudo + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + misc_feature join(21563..22020,22027..22166) + /gene="glf" + /locus_tag="SPC22F_0023" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 4.2e-112" + /pseudo + gene 22544..>22696 + /gene="aliA" + /locus_tag="SPC22F_0024" + CDS 22544..>22696 + /gene="aliA" + /locus_tag="SPC22F_0024" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33807.1" + /db_xref="UniProtKB/TrEMBL:Q4K0S2" + /translation="MMKSSKLFALAGVTLLAATTLAACSGSGSSTKGEKTFSYIYETD + PDNLNYL" + misc_feature 22544..22630 + /gene="aliA" + /locus_tag="SPC22F_0024" + /note="Signal peptide predicted for SPC1158 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.277 between residues 29 and 30" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc 
ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcgta taaaaacaag + 181 ggaggactgt ataaaagaca gaaatccttt gttttttata accaaggttt ataaactttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga aaatgaacat + 301 aaagaagcgt gtccttagtg caggtctgac ttttgcatct gctttgcttt tagctgcttg + 361 cgaccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaattac ctgttagact attacgctga taatatagtc aattgaaaca agagcaggac + 481 aaaagagcct cgtaaaaggt attgcaactt ggtaatacct tttacgaggc tttttgatat + 541 gagcccatgt tttctcaata ggattgtact caggtgagta gggaggaaga aggtaaaagt + 601 ttatgcccaa actcttcgca taaaagttct agcttcccca ttctatggaa tcttgcatta + 661 tccataataa taaccgatgg tgtggttaat gttggtaaga gaaacttctg aaaccaagct + 721 tcaaaaaagt cgctcgtaat cgtctcttcg taagtcattg gagcgattaa ctcaccattt + 781 gttagacctg caaccaaaga aatcctctga tatcttcttc ttaactgacc ttttaaagag + 841 cgaccatatt ctcgataaaa ataagtatca aatcctgttt cgtcaatcta aacagctgct + 901 aggtgcttta aactattaaa attcttaaga aataaggcta ctttttctgg gtcttgttca + 961 tagtaggtgt ggttcttttt ttcgagtgta gcccatagct ttgagcgcat agtggatggt + 1021 agttggatga cagccaaatt cagaagctat ttcagtcaaa taagcgtctg gattatcagt + 1081 aagatagttt ttaagtctat ctctatcaac ttttcttggt tttattcctt ttacttggtg + 1141 gtttagctct cctgttttct cttttagctt taaccagcca taaatggtat tacgtgagat + 1201 ttggaaaacg tgtgatgctt ctgttatact acctgttcgc tcacaataag agagaacttt + 1261 tttacgaaaa tctattgaat atgccataaa aagattatac cacattgtgt actatattag + 1321 attgaaacta gagtagtaca cctctgcttc taaaaaattt ttagaaatcg atttaactgt + 1381 cctgatcgat ttgtcatgtt cttatttcat tttactatat ttttgtttcg cgggaagtct + 1441 actaagatac ttaaagatgc agatagtaaa aaaatgtaga cattaccgta aaaaagtgat + 1501 ataattgtac gatgttcaag gtataggtgt taatcatgag tagacgtttt aaaaaatcac + 1561 gttcacagaa agtgaagcga agtgttaata tcgttttgct gactatttat ttattgttag + 1621 tttgtttttt attgttctta atctttaagt acaatatcct tgcttttaga tatcttaacc + 1681 tagtggtaac tgcgttagtc 
ctactagttg ccttggtagg gctactcttg attatctata + 1741 aaaaagctga aaagtttact atttttctgt tggtgttctc tatccttgtc agctctgtgt + 1801 cgctctttgc agtacagcag tttgttggac tgaccaatcg tttaaatgcg acttctaatt + 1861 actcagaata ttcaatcagt gtcgctgttt tagcagatag tgatatcgaa aatgttacgc + 1921 aactgacgag tgtgacagca ccgactggga ctgataatga aaatattcaa aaactactag + 1981 ctgatattaa gtcaagtcag aataccgatt tgacggtcga ccagagttcg tcttacttgg + 2041 cagcttacaa gagtttgatt gcaggggaga ctaaggccat tgtcttaaat agtgtctttg + 2101 aaaatatcat cgagtcagag tatccagact acgcatcgaa gataaaaaag atttatacca + 2161 agggattcac taaaaaagta gaagctccta agacgtctaa gaatcagtct ttcaatatct + 2221 atgttagtgg aattgacacc tatggcccta ttagttcggt gtcgcgatca gatgtcaata + 2281 tcctgatgac tgtcaatcga gataccaaga aaatcctctt gaccacaacg ccacgtgatg + 2341 cctatgtacc aatcgcagat ggtggaaata atcaaaaaga taaattaacc catgcgggca + 2401 tttatggagt tgattcgtcc attcacacct tagaaaatct ctatggagtg gatatcaatt + 2461 actatgtgcg attgaacttc acttctttct tgaaaatgat tgacttattg ggaggggtag + 2521 atgttcataa tgatcaagag ttttcagctc tacatgggaa gttccatttc ccagtaggga + 2581 atgtccatct agactctgag caggctctag gttttgtacg tgaacgctac tcactagccg + 2641 atggagaccg tgaccgtggt cgcaaccaac aaaaggtgat tgtggctatc cttcaaaaat + 2701 taacgtcaac cgaagcactg aaaaattata gtacgatcat taatagcttg caagattcta + 2761 tccaaacaaa tatgccactt gagactatga taaatttggt caatgctcag ttagaaagtg + 2821 gagggaatta taaagtaaat tctcaagatt taaaagggac aggtcggacg gatcttcctt + 2881 cttatgcaat gccagacagt aacctctatg tgttggaaat agatgatagt agtttagctg + 2941 tagttaaagc agctatacag gatgtgatgg agggtagatg aaatgataga catccattcg + 3001 catatcgttt ttgatgtaga tgacggtccc aagtcaagag aggaaagcaa ggctctcttg + 3061 gcagaatcct acaggcaagg ggtacgaatc attgtctcta cctctcaccg tcgcaagggc + 3121 atgtttgaaa ctccggaaga gaagatagca gaaaactttc ttcaggttcg ggaaatagct + 3181 aaggaagtgg cgagtgactt ggtcattgct tacggagctg aaatttacta cacaccagat + 3241 gttctggata agctggaaaa aaagcggatt ccgaccctca atgatagtcg ttatgccttg + 3301 atagagttta gtatgaacac tccttatcgc gatattcata 
gcgccttgag caagatcttg + 3361 atgttgggaa ttactccagt cattgcccac attgagcgct atgatgctct tgaaaataat + 3421 gaaaaacgcg ttcgagaact gatcgatatg ggctgttaca cgcaagtaaa tagttcacat + 3481 gtcctcaaac ccaaactttt tggcgaacgt tataaattca tgaaaaaaag agctcagtat + 3541 tttttagagc aggatttggt tcatgtcatt gcaagtgata tgcacaatct agacggtaga + 3601 cctcctcata tggcagaagc atatgacctt gttacccaaa aatacggaga agcgaaggct + 3661 caggaacttt ttatagacaa tcctcgaaaa attgtaatgg atcaactaat ttaggagaaa + 3721 tgatgaaaga acaaaacacg atagaaatcg atgtatttca attatttaaa accttgtgga + 3781 aacgcaagct aatgatttta atagtggcac ttgtgacagg tgcgggggct tttgcatata + 3841 gcacttttat tgttaagcca gaatatacga gtaccacgcg aatttacgta gtgaatcgcg + 3901 atcaaggaga caagccgggg ctgacaaatc aggatttgca ggcaggatct tatctggtaa + 3961 aagactaccg tgagattatc ctttcgcaga atgtattgga aaaagtagcg acaaatttga + 4021 agttggatat gccaacaaaa acgttagcca gcaaagttaa agtgactgta ccaactgaca + 4081 ctcgtatcgt ctcaatctct gtcaaagata aacaaccaga agaagccagt cgtatcgcta + 4141 attctctacg agaagttgct gcagaaaaga tcgtcgctgt aacgcgagta tctgatgtaa + 4201 cgacacttga agaagcgcga ccagctacga ctccctcttc tccaaatgtt cgacgcaatt + 4261 ccttgtttgg ttttcttgga ggagcagtcg taacagtaat tgctgttctt ttgattgagt + 4321 tgctcgacac ccgtgtgaaa cgtcctgaag atgtcgaaga tgtactgcaa attccacttt + 4381 taggggtcgt tccagatttg aacaaaatga aataggagga agttatgcca acattagaaa + 4441 tctcacaggc aaaattggat tttgtaaaaa aggcagagga atattataac gctttgtgca + 4501 cgaacctaca gttaagtgga gatgatttga aagtattttc tatcacttct gtgaaactag + 4561 gagaaggaaa atcaacgact tccaccaata tcgcttgggc ttttgcgcat gcaggttaca + 4621 aaacgctgct gattgatgga gatattcgca attctgttat gttaggtgtc tttaaagcaa + 4681 gggataagat tacaggcctg acagaatttt tatcaggaac tacagaccta tcacaagggc + 4741 tttgtgatac caatgtcgaa aatctctttg taattcaggc tggctctgtg tcaccgaatc + 4801 cgacagctct tcttcaaagt aagaatttca gtacaatgct tgaaaccttg cgtaaatatt + 4861 ttgactacat cattgtagat actgctcctg tcggtgtcgt gattgatgcg gctattatta + 4921 cgcgaaaatg cgatgcttct attttagtga cggaggtaga tgaagtaaat cgacgggata + 4981 
ttcaaaaagc aaaagaacag ttggaacaca caggaaagcc gtttttggga gttgtgttga + 5041 ataaattcga tacttcagta gacaaatacg gttcttatgg aaattatgga gattacggga + 5101 aaaataaaaa ataggtcggg ggattagaga tgaatggaaa aatagtaaag tcttcattgg + 5161 ccataatcca gagttttctt gttattttat tgacttatct acttagtgct gtgagagaag + 5221 cggagattgt ttcaacaaca gctattgcac tttatatcct ccattatttt gtcttttata + 5281 tcagtgatta tggacaggat ttctttaaaa gaggatattt gattgaactt gtccagacat + 5341 tgaaatatat cctattcttt gcactagcga ttagtatttc taattttttc ttagaggatc + 5401 gatttagtat ttccagacga ggcatgattt acttcctcac attacatgct ctcttagtct + 5461 atgtgctaaa cctatttatc aagtggtatt ggaagcgggc ttatcccaac tttaaaggaa + 5521 gtaagaagat tctcctactt acagcaactt ctcgtgtcga aaaggtactg gatagattaa + 5581 tagaatcaaa tgaggttgtt ggggagttgg tagccgtcag tgtcttagat aaaccagatt + 5641 ttcagcatga ttgtttaaag gtagtagcag agggggagat agtaaacttt gcgactcatg + 5701 aggtggtcga tgaagtcttt atcaatcttc caagtgaaaa atacaatatt ggagagcttg + 5761 tctctcagtt tgaaacgatg ggaattgatg taacagttaa tctaaatgct tttgatcgta + 5821 gtttggcacg taacaagcaa attcgtgaga tggcaggatt aaacgttgtg actttttcta + 5881 caacatttta taagactagt catgtaattg ctaagcggat tattgatatc atgggtgcat + 5941 tggtagggct gatactatgt ggtttagtca gtattgtact ggttcctttg attcgaaagg + 6001 atgggggctc tgctattttt gctcagacgc gtataggaaa aaatggtcgt cagttcactt + 6061 tttataagtt tcgctctatg tgtgtagatg ccgaggcgaa aaaaagagaa ctcatggaac + 6121 aaaataccat gcagggtgga atgtttaagg tggacgatga tcctcgtatc acgaaaattg + 6181 gtcgttttat acggaagact agcttggacg agctaccaca gttttataat gttctaaagg + 6241 gagatatgag tttggttggc acacggccac caacagtgga cgagtatgaa cactataccc + 6301 cagaacaaaa acgtcggcta agttttaaac ctggtataac aggcttatgg caggtcagtg + 6361 gacgaagtga gattaagaat tttgatgaag ttgtcaaatt agatgtggcc tatatagatg + 6421 gttggacaat ttggaaagac attgaaattt tattgaagac agttaaagtt gtatttatga + 6481 gagatggagc gaagtgattt ttgcccttca gtcttgttag gagagatatg aaacagtcag + 6541 tttatatcat tggttcaaag gggattcctg ccaagtatgg aggatttgaa acctttgttg + 6601 agaaattaac agaatatcaa 
aaagatggta acatccaata ctatgttgcc tgcatgcgcg + 6661 aaaattctgc aaagtcagga tttacagcag acacatttga gtacaacggt gctatttgtt + 6721 acaacattga tgtgcctaat attggtcctg ctagagccat tgcttacgat attgcagcgg + 6781 tcaataaggc tattgaattg tctaagggaa acaaggacga ggctcccatt ttttacattc + 6841 tagcttgtcg tatcggacct tttatttctg gacttaagaa aaaaattcgt tcgatcggag + 6901 gccgtttgct ggtaaatcca gatggtcatg agtggcttcg agctaaatgg agcttgccag + 6961 ttcggaagta ttggaaattt tcggaacagt tgatggtcaa acatgcagat ttattagtct + 7021 gtgatagcaa aaatatcgaa aaatatattc gagaggacta taaacagtat cagcccaaga + 7081 cgacttatat cgcctatgga acagatacaa gcaagtctat tttaaaacct gatgacgaaa + 7141 aagttcgtaa ttggtatcag gaaaaaggcg ttgctgaaaa cggatattat ctagttgtgg + 7201 gacgatttgt tcccgaaaac aactatgaaa ccatgattcg tgaatttatc aagtctaagt + 7261 ccaataagga ctttgtcctt attacaaatg tagaacaaaa taaattttac gatcagttgc + 7321 tcaaggatac aggctttgac aaagacccga gagtcaaatt tgttgggact gtctatgatc + 7381 aagaattgct caaatatatc cgagagaatg cttttaccta cttccatggc catgaagttg + 7441 gtgggacaaa cccatcgctt ttagaagctc ttgcttcaac aaagcttaat ttactgctag + 7501 atgttggctt taaccgtgaa gttggtgagg atggagccat ttactggaaa aaagatgagc + 7561 tagcgcatgt aatcgaagaa gtggaacgat ttgatgaagg tgctatttcg gaattagacg + 7621 aaaggtctag ccaacgaatt gcggatgcat ttacgtggga aaagattgtg tcagattatg + 7681 aggaagtgtt taaaggatag agaatgaaac ggattttata tttacatgct ggtgcagaaa + 7741 tgtatggagc agataaggtt ttattggaat tgatcaaagg attaaatcct caagaatttg + 7801 aagctcatat tatcctgcct aatgacggtg ttttagtcga agccctacgc caagttggcg + 7861 ctcaggttag cgtgttggat tatccgattt tacgtagaaa atactttaat cctaaaggga + 7921 ttttggaata tctgaaattt tatcgtcgtt actcccaaaa aattgcccaa tatgtgcgtg + 7981 aaaatggaat agatcttgta cataacaata caacagctgt cttggaagga atctatctca + 8041 aaagaaaggt gaaacttccc ttgatctggc acgttcatga gattattgtt aagcccaagg + 8101 ctatttcaga ttttattaac ttcttgatgg ggcgttatgc agataagatt gtaacagtct + 8161 ctcaagctgt ggccagtcat gtcaaacagt ctccctttat caaagagggt caggttcagg + 8221 ttatctataa cggagtggac aatgcgatct atcatccgat 
gcagtcaagt gcagtgcgtg + 8281 aaaaatttgg gatcccagag gatgctctcg tcattggtat ggttggacgt gtcaacgcgt + 8341 ggaaggggca aggagatttt ctagaagctg tgacaccgat tttggagcat aatccgaatt + 8401 ccgtagcttt tctagcgggg agtgcctttg ctggtgaaga gtggcgagtt gaagaattag + 8461 agtctaagat ttccaaatca agtgtagcct cacaaatcaa acgaattgaa tattatgagc + 8521 atacgactga actttataat atgtttgata tctttgtctt accaagtacc aatcccgatc + 8581 cactaccaac agtggtacta gaggctatgg cttgtggtaa gccagtagtc ggctaccgtc + 8641 atggtggtgt ctctgaaatg gttgttgaag gaaccaatgg cttactggca atcccaggac + 8701 aatcacaaga actatcggat gcgattttgg agttggtttc tgatccagaa aaacggctcc + 8761 aatttggcca agcatcagta agaagacaag gagaatcgtt ttctttggaa tcttatatcc + 8821 gtagtttctc agaattatat aagagttata aaaatgaata aagaaataat aaagaataaa + 8881 ttaaaactaa ttgtttatcc tatcattaat tttatttcta ggagaagatt aaaaaataaa + 8941 aaattcacca ttatttgtga taattgttgg gctggaaaag tgtaccaaga gttaggtttg + 9001 ccctaccaaa caccctttat cgggatgttt gttttttcgc ctgattatat caagatgctc + 9061 aagaatttga aatactattt gagcggaaat atctcgttga aatttgttaa ggaatcaaag + 9121 cacattgaaa actttgataa tgcttatcca attgcactcc ttgacgatat cgagcttcat + 9181 ttcttgcact atgcagatga aaaagaggct actcagaaat ggcaacgtcg tttagaaaga + 9241 attcattggg ataatttgta ttttaagttc aatgacaatg atgcttgtac ctatgacctt + 9301 atgagagaat ttgatcaatt accgtacaaa agtaaagtca ttttttcatc taagaattat + 9361 tctgatttac attcattaac ttattttaaa gagaaggaaa aagattgtag tgttggaatt + 9421 gatcttaaaa tctatcatcg ttatttcgat gttgtaaggt ggctgaatga aggcggagtg + 9481 gacttgagtt aatcagatta aaactaaaaa aggagttgtt aatatgtcta aaatgaaaat + 9541 tgcagtagtt gggactggtt atgttggttt atccatttct gtgttacttg cacaacacca + 9601 tcatgtagta gcagtagata ttgtaaaaga gaaagtagaa ttaattaata ataaaatttc + 9661 acctattcag gatgatttta ttgaaagata tctttcagaa agtaatttag atttagttgc + 9721 aacaatagac gctgaaacag cttataaaga tgcctctttt atcgtagtag cgacgccaac + 9781 aaattatgac tcagaaagaa atttttttga tacatcagca gttgaatcgg ttattcaaca + 9841 ggttcagaat gtgaattcta cagcaactat agtaataaaa tcaacagtcc ccgtgggttt + 9901 
tactgattca attcgtaaaa aattaggaat ttcaaatctt ctattcagcc ctgaattttt + 9961 gcgcgaatca agagcacttt atgataactt atatccaagt cggatcatag ttggaacaga + 10021 tttaaatgat caaaaattaa ttgaaaaggc ccaagttttc tctaatcttt tagtgcaagg + 10081 tgctatcaaa aaagatatcc ctattttaat tatgggattt actgaagctg aagcagttaa + 10141 attatttgct aatacctact tagcattgcg ggtatcatat tttaatgaat tagatactta + 10201 tgcagagacc aaaggactag atactcaaaa aataattgag ggtgttagtt tagatccccg + 10261 tatcggaacc cattataata atccgagctt tgggtacggt ggatattgct taccaaagga + 10321 cactaagcaa cttttagcta attatgagaa tatcccagaa gaacttattg gggctatagt + 10381 acgtagcaat gcaacacgta aggattttat tgctaaacaa gttcttaaaa tggtgaatta + 10441 taataatcca gaagacgata tttctgtcag acagatggat aaagaagttg ttattgggat + 10501 ataccgatta actatgaaaa gtaacagtga taactttcgt cagagttcaa tacagggagt + 10561 tatgaaacgt attaaggata gaggagctaa agtaattatt tttgagccta ctctaaaaga + 10621 taatggtacg ttctttggga acgctgttat aaatgattta gaagagttca aagcaaagtg + 10681 cgatgcgatt attgcaaatc gttatgatga aatgttgaac gacgttaagg ataaagtata + 10741 tacacgagat atcttcagaa gagattaata aaaatatgaa aaaagtatta attgtccgaa + 10801 gtggacctta ccaagttact ccaaatgaat acaaccttca ggagcttgga ttagcttctg + 10861 ctctcagtca gcagggatac caatgtgacg tgatgtatta tcacaaaaca aaaaactatg + 10921 atcaattatt tgagaaaaac ggggaaaaaa ttaaagtatt ttggagaagg ggaataagat + 10981 tatttagaag tggaatttat ccccagattt taaaaaagaa atttttgagt cagtatgata + 11041 aaataattat ttccgagtat agccagatta tggcagtttt attgtctaga attcattcca + 11101 atgtatatat ttataatggt ccatactata atctatttaa gatccccatt attgaatcta + 11161 tgtacgattt tctttttgta agaatgctca ataagagaac caagacagtt ttctgcaaga + 11221 cagaaaaggc aaagcattat cttaaaaata agggattcaa tgattgtaaa gtagtgggcg + 11281 taggtctaga tgttgaaaag tttgaacaag aagaggaacc tacggagaat actatagaac + 11341 ttttaaaaag aatggagaat aagcaaaata ttctttatgt aggctcacta tcaaaaagaa + 11401 aaaacacagc tcatttaatt agaattttta atattttaaa atctaaaagt ggtaagaaaa + 11461 acgaacttca attggtattg attggtaagg atgagggtaa tattgttgaa aaaattaact + 11521 
attcacggtt taaagatgat attatttatc aaccttattt aaagaactct cagcttcaat + 11581 ttatttaccc atcatcacaa ctatttgtgc tcccgtcgat tcaagagatt tttggtatgg + 11641 tattacttga ggcaatgtat tttaagttgt ctgttgtttc cagcgcaagt gctggaggag + 11701 agacactgat tcaagatggt ataaacggta aaattatgaa tgattttaat gatgaacact + 11761 gggtggattg tatagaaaat ctattaaata acccattgga attgaaacgg cttggagaat + 11821 gtgcccataa gcgaattacg gaacagttta tgtggtcttc aattgcgaga aaaataattg + 11881 agacatttga tgaaaggtaa gacttactat gaatttttgt tttgtgattt tgcattatcg + 11941 taccagcaat gacactatag agtgtatcaa atcgattcaa aagcttgagg gaaattataa + 12001 aattgtaatt gttgataacg cttctcaaaa tggcagtata gaaagggtag aagccttatt + 12061 tgcaaataat gacgagatag ttataataaa aaacacgaaa aacttaggat ttgctgcagg + 12121 aaataatatt ggatacgcct atgctcggac tcaaataaaa gctaatatga ttgctgtact + 12181 taataatgat attgttatta agcaaaaaga tttcattaat cgtatatttg aactctatag + 12241 aaattctcag tttcatatcg ctggtccaga cattgtctct cttgtagatg gtcatcatca + 12301 aagtcctgtt gttgagaaga tcaattctat atctaaggca aataaagaac tttttaaata + 12361 tagaatcttg agaattatta ataaaatagg attatatgag ctgatgacta gacagccaaa + 12421 aaaaaaatta aatagagtaa gtgctgcaga ccctatagga tatcaggaaa atgttatttt + 12481 acatgggagt tgtgtaattt tttcaccatt atatgtttca gaggaggagt ttgcttttag + 12541 accagatacg ttcatgtata tggaagagcc tattctatat gaatattgca tgcttaaaaa + 12601 ttataagaca gtatttgatc cttctattgt aatttatcat aaagaggact catcaacaaa + 12661 ttcgttgtat aatgcggcat atgcaaaaag agagtttgtt tttaaaaata tgattagatc + 12721 tctaaagatt tatagaagtc tattgaagta gtaaactagg gaaaggatag taattaaaaa + 12781 ttgaatctta gtatgttagc cttgacaata ggatcagtgg tatttgttaa aaaaacgtat + 12841 aggacgtttc tcaatcccat aattttattt gcaattttgt ggtttattat aacaactttg + 12901 tcaaatttaa aactattcca acttttcgag attagtactc atacacaaca aattattttg + 12961 cttgggactt ctctatttgt tataggggga gggatagcaa tttggtttcg ggataaattt + 13021 tattttaaag ttggcggtaa ctcatatttt acaacagact ttgaaattaa ttataatttg + 13081 ttctttttgc taggtatcat ttgtcttttc tattatttgc cagatttctt ttcctcactg + 13141 
gtatcattaa taagaggtgg gaatttaaac ttagttagac aatctgcgca ggatgcagta + 13201 gataccagtg gattaaagaa tttcattgga acatttattg ttattcctag tgccatggta + 13261 ttagaaatat taggaatatt agatttctgg agcaataaaa aaggcagaaa actattttat + 13321 cttaatttag ctgtcatttt tgtaagagtt gttgcagatg ctggtagaac gcctctattt + 13381 aatgttgtca tatatttatt acttactgtt ttagcaaata ggttctctga aaaaactgaa + 13441 aagaagagaa aagttagtaa aattaagata gtaaattatg gtatgctagg ttcaattatc + 13501 ttatggctat caactttatc taggacaaca acctccgttt ataggattct ttatttttat + 13561 ttcgcaatgt ccccaatact attagaaaag tggagtagta tacttgattc tgaaaaatta + 13621 gtaacaaagg gtttggtttc gttgaacggt ttcttttttt caatctcata tgtacttaaa + 13681 aatctgttta gaataggtta ttctcaaaga gtattagaag catacacaat gattgcgaat + 13741 actgatgcaa tctggtataa tattgcacct ggtttgacca aggcaaatgc atatgtctct + 13801 ctgttttggt ttttttatgc ggatggacgt ttattaggag ttttaatagg atcccttcta + 13861 tatggtgcct tttgtggcta tatcttttgc aggtatatcc agcaacaaaa taaaaagaat + 13921 ttggctatgt tactatttat ttatcaaggt gtttttttct cttttattag atttccgttt + 13981 tcaaaatcaa attatgcaat tgcattcgta ctcttattat tttttgcttt taagaagaaa + 14041 ggaatagaga aaagtgttta atatcaatga ccagtctatt atttatgttg catgtcctta + 14101 ttttaataaa acaggtggaa cggagctcgt ccatcaatta gtttattcta ttaatcattt + 14161 tggggggaaa gctatcgttg cttattatgg tagtgaaagt gctccaaatg aggtgaatcc + 14221 tgcgtttaga gaatatgttt ctacgtttgt tgatataaaa gatgttattg actctcttga + 14281 taatattatt attttaccgg aaattaatcc ggatttagcc gctaatctag agtctattca + 14341 aaaagcagta tggtggatga gcgttgacaa ttatttgaag cgtaatggta ttttaggttc + 14401 cttggaacat tttggacttt tacgaacaat taaattattt gtaaaaggaa atattaaaat + 14461 aggtggatat agaatagata aagagattcc ccatctttat caaagtgaat acgccaagca + 14521 atttcttcta gctaaaggtg tcaaaaagta ctatagattg tctgattatt taaacgagtc + 14581 ttatattcag cgatctattt caacagacac taaaaaagat gttattcttt acaatcctaa + 14641 aaaagggatt gaatttactc gtgagctaat taaacaggct ccagaattaa cgttctctcc + 14701 aattgagaat atgtcaactg aacaggtgaa aaaattactt tcaaaaagca aagtatatat + 14761 
tgattttggc aaccatcctg ggaaagatag attcccacgg gaggcagcga tatcaggttg + 14821 ttgtgtgata actgggaaac gaggttctgc aaaatattat aaggatattc ctattccaga + 14881 ttcatacaaa tttgaagaca ctgttgaaaa tatccccaac attattgaga ccctgaaatc + 14941 atgcttaaaa aattatgaca aacatactgt tgactttgag aaatatcaac aatatattaa + 15001 atctgaacat gatttatttg aaagagatgt gaaagaatta ttcactagga ataggggtta + 15061 aggttatgtc aaccagaaat tcacttatta aaaattctct ttataatgtt gcttatagaa + 15121 tgttaaatat catatttcca ttagtatccg caacatatac tgcacggata attttagcta + 15181 gtggagttgg ggaggtctcg tttgcacaaa atgttgtttc ttactttaca acgatagctg + 15241 ctatgggtat tccaaattat ggtatacgag aaattgctaa aactagaaat aaagaagagg + 15301 ctacgaataa agttttttca gagctatttc tgattaatgg attgtctaca ttactgtgtt + 15361 ctatagtata tttaattctg attttgacat tcaatagcat ttttgataat acatcaatgt + 15421 atcttgctgt gggtttaaca ttagtgttta acttccttaa tatcgattgg ttctatcaag + 15481 gaaaagagga ctatgcatac atcacgaaac gtagtttcag tataaaactt atttctcttt + 15541 ttagtttatt tatttttgtt agagatactg acgatgcagt taactatgca ttgatttcta + 15601 gcttagcaat tggcgggaat aatattttta atcttgttaa tttaaggaaa tataatatta + 15661 gatttagttt taataatatt aagattagaa gacacttaaa acctattttt gttttgttgg + 15721 gttcagtgat tgctattgaa atctatacta tgctggatac cactatgatt ggtgctatgg + 15781 taggaacgac tgaggtaggt tattatacaa attctatgaa gctagttaaa ttgctgataa + 15841 ctgtgattac cgctattgga ggagtgcttt taccacgact aagtgattat tattctaagg + 15901 gagaatttga aaaattaaat cacatcgttg ataaagtttt tagaatcatg ttgtttcttt + 15961 ttttaccagc ccaagttgca ttaattctag ttgcaccagt aattatgccg attttatttg + 16021 gtgatagttt tataccagca gtgttaacac ttcaacttac ttctttgctt atatgtacat + 16081 tagggtttag taatttattt gggactcaaa tattactaac atttggagat gagcgaaagc + 16141 ttttgattag cacaatttta ggagcgctta gtaatatcgc tttgaaccta attctgattc + 16201 cagtaatggc tcaaaatgga gcagcgttgg catctgtgat tagtgaaaca attgttactt + 16261 taacagcata ctactatgcg aaaaaacgtg tgacaattag gtttgactta ggattttatt + 16321 tgccaactgt tgtttcaaca ataatcatgg gtggagctat atatgtagta atgcaattgt + 16381 
atattgggga tatagaaaaa atgttatttt caactttgtt aggaggtgtt gtattccttt + 16441 taattaacgt ttttatgaag aatcctatta tatatgaatt tacaggtatt ataaagagaa + 16501 agagataatt atgtacgact atttaatcgt tggagcgggt ttgtctggag caatcttcgc + 16561 acacgaagct acaaagcgtg gaaaaaaagt aaaagtgatt gataaacgcg atcacattgg + 16621 agggaacata tactgtgaga atgtagaagg tatcaatgtt cataaatatg gtgcccatat + 16681 cttccatact tctaataaaa aagtctggga ctacgtcaat caatttgctg agtttaacaa + 16741 ctatatcaac tcacctgtcg caaactataa gggaagtctt tataaccttc ctttcaatat + 16801 gaataccttc tatgctatgt ggggcacaaa aactccacaa gaagtgaagg ataagattgc + 16861 tgagcagaca gctggtatga aggatgttga gccgaaaaat ctggaagaac aagctatcaa + 16921 gttgattggt ccggatatct atgaaaagtt gatcaagggt tatacagaaa agcaatgggg + 16981 acgctcagcg atagaacttc ctccatttat cataaaacgc cttccagttc gtttaacctt + 17041 tgataataac tattttaatg accgttacca agggattcct attggtggtt acaatgtcat + 17101 catcgaaaat atgctgaaag atgtagaagt tgaacttgga gtagactttt ttgctcatcg + 17161 tgaagagttg gaagcatctg ctaacaaagt tgtcttcaca ggaatgatcg accaatattt + 17221 tgactacaag cacggagagt tagaataccg tagccttcgt tttgagcatg agattttaga + 17281 cgaggaaaat tatcaaggga atgctgtagt gaactataca gagcgtgaga tcccttatac + 17341 tcgtatcatc gaacacaaac attttgaata tggaatgcag ccaaagacag ttatcacgca + 17401 tgaatatcca gctgactgga agcgtgggga cgagccctac tatcctatta acgatgagaa + 17461 aaataatgct atgtttgcta aataccaaga agaagcagcg cagaatgata aagttatctt + 17521 ttgtgggcgt ttagcagatt ataagtatta cgatatgcat gtggtgattg aacgggcgct + 17581 tgaggttgtg gagaaagaat ttagtaattg aaaaacaacg aagaaaggtt gcttattatg + 17641 aaaggtatta ttctagcagg tggttcggga actcgcttgt atcctttgac tcgagccgca + 17701 tcaaaacaac ttatgccggt ttatgataaa ccgatgattt actacccact ttcaacatta + 17761 atgttggctg ggattaggga tattttgatt atctcaactc ctcaagattt gcctcgtttt + 17821 aaagagcttc ttcaagatgg ttccgagttt ggtattaaac tttcttatgc tgagcaacca + 17881 agtccagatg gtttggcaca agcctttatc attggggaag agtttatttc tgatgatagc + 17941 gttgcgctaa tcttaggtga taatatctac catggttctg ggctttccaa gatgctacaa + 18001 
aaggcagcga gtaaggagtc gggagcaact gtttttggct accatgtcaa ggatccagag + 18061 cgctttggtg tggttgagtt tgatcaggat atgaaggcta tttctattga agaaaagcca + 18121 gagcaacctc gttcaaacta tgcagttaca ggtctctatt tctatgataa tgatgtagta + 18181 gagattgcca agagtattaa accaagtcct cgtggtgaac tggaaattac agatgtaaac + 18241 aaagcttacc tagatcgtgg tgatttgtct gttgagctta tgggacgtgg ctttgcttgg + 18301 ctggatactg gaactcatga aagtttacta gaggcttcac agtacatcga aacagtccaa + 18361 cggatgcaaa atgttcaggt agcaaactta gaagaaattg cctatcgcat gggttatatc + 18421 agtcgtgaag atgtattgac cttagctcaa ccacttaaga aaaatgaata cggacagtat + 18481 ctgctccgtt tgattggaga agcatagatg acagataatt ttttcggtaa gacgcttgcg + 18541 gcacgcaagg ttgaagctat tccaggcatg ttggagtttg atatccccgt tcatggagat + 18601 aatcgtggct ggtttaaaga aaatttccaa aaggaaaaaa tgcttccact tggatttcca + 18661 gagtctttct ttgcagaagg aaaattgcaa aacaatgtat ccttctcacg taaaaatgtc + 18721 cttcgagggc tccacgcaga gccttgggat aagtacatct ctgtagcaga tggagggaaa + 18781 gttctgggtt cttgggttga tctacgcgag ggtgaaacct ttgggaatac ctatcagaca + 18841 gtaattgatg caagcaaggg aatctttgtt cctcgaggcg tagctaatgg cttccaagtt + 18901 ctatcagata cagtgtcata tagctatctg gtcaatgatt actgggctct cgagctcaaa + 18961 cccaagtatg cctttgtgaa ctacgctgat ccaagccttg gtattgaatg ggaaaatatt + 19021 gcagaagcag aggtttcaga agcagataaa catcatcccc tacttaagga tgtaaaacct + 19081 ttgaaaaaag aagatttgta aaaaggaaag aatatgactg aatacaaaaa tattatcgtg + 19141 acaggtggag ctggctttat cggttctaac tttgtccatt atgtttacga gaactttcca + 19201 ggtgttcacg tgacagtcct agataagttg acttatgctg gaaatcgcgc gaatattgag + 19261 gaaattttag gtaatcgtgt tgagttagtt gttggtgaca ttgctgatgc ggagttggta + 19321 gacaagttgg ctgctcaagc agatgctatc gttcattatg cagcggaaag ccacaatgat + 19381 aattcgctca atgatccatc gccatttatt catactaact tcatcggaac ctatactctt + 19441 ttagaagctg ctcgtaagta tgatattcgc ttccaccatg tatcgacaga tgaagtttat + 19501 ggggatctcc ctttacgcga agatttgcca ggtcatggtg aaggaccagg tgagaaattt + 19561 actgctgaaa caaaatacaa cccaagctct ccgtactcat caaccaaggc agcctcagat + 19621 
ttgattgtca aagcctgggt gcgttctttt ggagtcaagg caacgatttc caactgttca + 19681 aataactacg gtccttatca acatatcgaa aaattcatcc cacgtcagat tactaacatc + 19741 ctaagtggaa ttaagccaaa actttacggt gaaggtaaga atgttcgtga ctggattcat + 19801 accaatgacc attcttcagg agtttggaca atcttgacaa aagggcaaat cggtgaaacc + 19861 tacttgattg gggctgatgg tgagaagaac aataaggaag ttttggaact tatccttaag + 19921 gaaatgggac aagctacgga tgcctatgat catgtgactg accgtgcagg acatgacctt + 19981 cgctatgcga ttgatgccag caagctccgt gatgagttgg ggtggaaacc tgaatttacc + 20041 aactttgaag ctgggctcaa ggcaacaatc aagtggtata cagataacca agaatggtgg + 20101 aaagcagaaa aagaagctgt tgaagccaat tatgctaaga ctcaggagat tattacagta + 20161 taaaaagcag gaaatagctg ctttttattg ctatattggg aagagttaca tattagaaag + 20221 gtctagagat gattttaatt acaggggcaa atggccaatt aggaacggaa cttcgctatt + 20281 tattggatga acgtaatgaa gaatacgtgg cagtagatgt ggctgagatg gacattacca + 20341 atgaagaaat ggttgagaaa gtttttgaag aggtgaaacc gactttagtc taccattgtg + 20401 cagcctacac cgctgttgat gcagcagagg atgaaggaaa agagttggac ttcgccatca + 20461 atgtgacggg gacaaaaaat gtcgcaaaag catctgaaaa gcatggtgca actctagttt + 20521 atatttctac ggactatgtc tttgacggta agaaaccagt tggacaagag tgggaagttg + 20581 atgaccgacc agatccacag acagaatatg gacgcactaa gcgtatgggg gaagagttag + 20641 ttgagaagca tgtgtctaat ttctatatta tccgtactgc ctgggtattt ggaaattatg + 20701 gcaaaaactt cgtttttacc atgcaaaatc ttgcgaaaac tcataagact ttaacagttg + 20761 taaatgacca gtacggtcgt ccgacttgga ctcgtacctt ggctgagttc atgacctacc + 20821 tagctgaaaa tcgtaaggaa tttggttatt atcatttgtc aaatgatgcg acagaagaca + 20881 caacatggta tgattttgca gttgaaattt tgaaagatac agatgtcgaa gtcaagccag + 20941 tagattccag tcaatttcca gccaaagcta aacgtccgct aaactcaacg atgagcctgg + 21001 ccaaagccaa agctactgga tttgttattc caacttggca agatgcattg caagaatttt + 21061 acaaacaaga agtgagataa gtagtagaat gattttctag tctaataaaa gaggcagaga + 21121 atgaactcca aaggagctta agatgtacga ttatcttgtt gttggtgcag tctttgccca + 21181 tgaagcagtc ttaaaaggaa aaaaagtaaa agttattgaa aaatgaaatc atatcgcggg + 21241 
taatatctat actcgtgaag aggaaggaat tcaagttcat caatatggtg ctcatatctt + 21301 ccatacttct gataaggaga tctgggatta tgtaaatcag tttgcagagt ttaaccgtta + 21361 taccaattct cctgttgcaa actataaggg agagatttat aacttacctt ttaatatgaa + 21421 taccttcaat aaactctggg gagttgtgac gccagcagaa gcacaagcta agattgatga + 21481 acaacgtgct attttaaatg gtaaaactcc tgaaaatttg gaagaacagg cgatttctct + 21541 tgtaggtaca gacatctacg aaaaattaat caaagactat acagagaaac agtggggcaa + 21601 accaactact gaacttccat cctttattat tcgccgttta ccagtacacc tgacctatga + 21661 taacaactat tttaacgata cctatcaagg gattccaatt ggtggttata atgttatcat + 21721 cgaaaatatg ctgaaggatg tagaagtaga acttggagtg aacttttttg ccaatcgtca + 21781 agaattagag gcttctgctg aaaaggttgt ctttacaggg atgattgacc aatactttga + 21841 ttataaacat ggtgagttag aatactgtag tcttcgtttt gatcatgaag ttctagatga + 21901 ggaaaactat caaggaaacg cagttgtgaa ctatacggat gcagaaaccc catatactcg + 21961 cattattgaa cacaaacatt ttgagtttgg gagtcaagca aagactatca ttactaatag + 22021 aacattctaa aacatgggaa aaaggtgatg agccttatta tccagttaat aatgatcgta + 22081 ataatcattt gtataaatca tataaaaaac ttgctgatga gcaagggaat gttatctttg + 22141 gtggccgctt aggacactat cgttattacg atatgcacca agtaattgga gcagctttgc + 22201 agtgcgtgag aaatgagtta gattcatact caatgaaaat caaagagcaa actaggaagc + 22261 tagccgtagg ttgctcaaaa cactgttttg aggttgcaga tggaagctga cgcggtttga + 22321 agagattttc gaagagtata aacaagtaaa actgactacc agttattatt tagaaatagt + 22381 attaaaaatt ccttgactat gtgatatagt tgagggattt ttaaatgata ttcatatttt + 22441 ttgcaaagat gttgtttgaa aaataatttt caaaaattct gaaaattctg ttgacaactt + 22501 tctgaaaaga gtctataatg gagagaaagt tttaaaggag aaaatgatga aaagttcaaa + 22561 actatttgcc cttgcgggcg tgacattatt ggcggcgact actttagctg catgctctgg + 22621 atcaggttca agcactaaag gtgagaagac attctcatac atttatgaga cagaccctga + 22681 taacctcaac tatttg +// + diff --git a/public/res/serotype_genbank/serotype_23A.gb b/public/res/serotype_genbank/serotype_23A.gb new file mode 100644 index 0000000..aff67dc --- /dev/null +++ 
b/public/res/serotype_genbank/serotype_23A.gb @@ -0,0 +1,976 @@ +LOCUS CR931683 21475 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 1196/45 (serotype 23a). +ACCESSION CR931683 +VERSION CR931683.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 21475) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 21475) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..21475 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="1196/45" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC23A_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC23A_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI33808.1" + /db_xref="GOA:Q4K1T1" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K1T1" + /translation="SNEEQDLTVEGKVKSVLIENTAAKEVLEKQVLAPWDAFCVELL" + gene 293..461 + /gene="aliB" + /locus_tag="SPC23A_0002" + /pseudo + CDS 293..461 + /gene="aliB" + /locus_tag="SPC23A_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(459..980) + /gene="tnp" + /locus_tag="SPC23A_0003" + /pseudo + CDS complement(459..980) + /gene="tnp" + /locus_tag="SPC23A_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase (fragment)" + gene 1204..2649 + /gene="wzg" + /locus_tag="SPC23A_0004" + CDS 1204..2649 + /gene="wzg" + /locus_tag="SPC23A_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33811.1" + /db_xref="GOA:Q4K0K5" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K0K5" + /translation="MSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGIDVYNDQ + EFTAHTNGKYYPAGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1204..1320 + /gene="wzg" + 
/locus_tag="SPC23A_0004" + /note="Signal peptide predicted for SPC1162 by SignalP 2.0 + HMM (Signal peptide probability 0.993) with cleavage site + probability 0.538 between residues 39 and 40" + misc_feature 1408..1755 + /gene="wzg" + /locus_tag="SPC23A_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 1.6e-64" + misc_feature 1933..2376 + /gene="wzg" + /locus_tag="SPC23A_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 2.5e-69" + gene 2651..3382 + /gene="wzh" + /locus_tag="SPC23A_0005" + CDS 2651..3382 + /gene="wzh" + /locus_tag="SPC23A_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33812.1" + /db_xref="GOA:Q4K0K4" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K0K4" + /translation="MIDIHSHIVFDVDDGPKSREESKALLTESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTLDALEKLEKKEIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNGKRVRELIDMGCYT + QINSYHVSKPKFFGEKYKFMKKRARYFLERDLVHVVASDMHNLDSRPPYMQQAYDIIA + KKYGAKKAKELFVDNPRKIIMDQLI" + misc_feature 2654..3262 + /gene="wzh" + /locus_tag="SPC23A_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 4.9e-37" + gene 3391..4083 + /gene="wzd" + /locus_tag="SPC23A_0006" + CDS 3391..4083 + /gene="wzd" + /locus_tag="SPC23A_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33813.1" + /db_xref="GOA:Q4K0K3" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K0K3" + /translation="MKEQNTLEIDVLQLFRALWKRKLVILLVAIITSSVAFTYSTFVI + KPEFTSTTRIYVVNRNQGEKSGLTNQDLQAGTYLVKDYREIILSQDVLEEVVSDLKLD + LTPKGLANKIKVTVPVDTRIVSVSVNDRVPEEASRIANSLREVAAQKIISITRVSDVT + TLEEARPAISPSSPNIKRNILIGFLAGVIGTSVIVLLLELLDTRVKRPEDIEDTLQMT + LLGVVPNLNKLK" + misc_feature 
3409..3825 + /gene="wzd" + /locus_tag="SPC23A_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 1.9e-52" + misc_feature 3931..4008 + /gene="wzd" + /locus_tag="SPC23A_0006" + /note="PS00217 Sugar transport proteins signature 2." + gene 4093..4776 + /gene="wze" + /locus_tag="SPC23A_0007" + CDS 4093..4776 + /gene="wze" + /locus_tag="SPC23A_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33814.1" + /db_xref="GOA:Q4K0K2" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K0K2" + /translation="MPTLEIAQKKLEFIKKAEEYYNALCTNIQLSGDKLKVISVTSVS + PGEGKTTTSVNIAWSFARAGYKTLLIDGDTRNSVISGFFKSREKITGLTEFLSGTADL + SHGLCDTNIENLFVVQSGSVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTAPIGIVI + DAAIITQKCDASILVTATGEANKRDVQKAKQQLKQTGKLFLGVVLNKLDISVDKYGVY + GFYGNYGKK" + gene 4792..6159 + /gene="wchA" + /locus_tag="SPC23A_0008" + CDS 4792..6159 + /gene="wchA" + /locus_tag="SPC23A_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI33815.1" + /db_xref="GOA:Q4K0K1" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K0K1" + /translation="MDEKGLKIFMAVLQSIIVILLVYFLSFVRETELERSSMVILYLL + HFFVFYVSSYGNNFFKRGYLVEFNSTIRYIFFFAIAISVLNFFIAERFSISRRGMVYF + LTLEGISLYLLNFLVKKYWKHVFFNLKNSKKILLLTVTKNMEKVLDKLLESDELSWKL + VAVSVLNKSDFQHDKIPVIEKEKIIEFATHEVVDEVFVNLPGESYDIGEIISRFETMG + IDVTVNLKAFDKNLGRNKQIHEMVGLNVVTFSTNFYKTSHVISKRILDICGATIGLIL + FAIASLVLVPLIRKDGGPAIFAQTRIGKNGRHFTFYKFRSMRIDAEAIKEQLMDQNTM + QGGMFKIDNDPRVTKIGRFIRKTSLDELPQFWNVFIGDMSLVGTRPPTVDEYDQYTPE + QKRRLSFKPGITGLWQVSGRSKITDFDDVVKLDVSYIDNWTIWKDIEILLKTVKVVFM + RDGAK" + misc_feature 5575..6156 + /gene="wchA" + /locus_tag="SPC23A_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 
4.9e-146" + gene 6190..7368 + /gene="wchF" + /locus_tag="SPC23A_0009" + CDS 6190..7368 + /gene="wchF" + /locus_tag="SPC23A_0009" + /note="member of homology group 15" + /codon_start=1 + /transl_table=11 + /product="putative rhamnosyl transferase WchF" + /protein_id="CAI33816.1" + /db_xref="GOA:Q4K0K0" + /db_xref="InterPro:IPR001296" + /db_xref="InterPro:IPR015393" + /db_xref="UniProtKB/TrEMBL:Q4K0K0" + /translation="MKKSVYIIGSKGIPAKYGGFETFVEKLTAFQQDKAIQYYVACMR + ENSAKSGTTEDVFEHNGAICYNVDVPNIGPARAIVYDIAAINRAIEIAKENKDEDPIF + YILACRIGPFIHGIKKKIQAIGGTLLVNPDGHEWLRAKWSTPVRRYWKISEGLMVKHA + DLLVCDSKNIEQYIQEDYKQFQPKTTYIAYGTDTTRSILKSSDEKVRSWFKEKNVSEN + EYYLVVGRFVPENNYESMILGFLASNSKKDFVLITNVEQNKFYNQLLAKTGFDKDPRV + KFVGTVYNQELLKYIRENAFAYFHGHEVGGTNPSLLEALASTKLNLLLDVGFNREVAE + DGADYWEKDNLHKVIEASEQKTQEEINEKNILSTKQVTERFSWDLIVNEYEKLFTRKN + " + misc_feature 6805..7302 + /gene="wchF" + /locus_tag="SPC23A_0009" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 0.0028" + gene 7578..8984 + /gene="wzy" + /locus_tag="SPC23A_0010" + CDS 7578..8984 + /gene="wzy" + /locus_tag="SPC23A_0010" + /note="member of homology group 243" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33817.1" + /db_xref="UniProtKB/TrEMBL:Q4K0J9" + /translation="MRYGIMRISFSKKTMLCGLLYIGLILSVVTIPTIVTFLYSLLFI + GIVTVLNYNSILASDEDANSFFVALPIILSSFQNVYLGFGADRLNSVTLQVLLSISIA + IITITVFLGIILNRFKSKEFSWLVLSILVIIIQSVILLIFFPTTLPAYLSSMRNILAP + LLIFYFSIYGFKNINLQKFYKYMFIIILVVLIFGFIEYIYGNSLWTRLNIKKLWALKG + LAIENRVVPGNWHSSELIGGKQLRRMVSTFADPVNLGSYLFAAFMLAWYKNKKLLQVL + LLASFVLSVSKAAFLSMLVYIIIYTWVVDKNKILSIFGIIISTVLGLYFYNFSQVSSY + GSINAHIDGFFSALSTPLHYPFGMGVGSVGVLASKLGSQTALSSEVLETGIGMIIAQL + GFVGVIIYLIFFVKLSVIGKNINNKRDKILWFTLIYSFLANAFFNEVALSPNSCTLYF + LILGLLYNKNKIRSTEFS" + misc_feature 7578..7748 + /gene="wzy" + /locus_tag="SPC23A_0010" + /note="Signal peptide predicted for SPC1168 by SignalP 2.0 + HMM (Signal peptide probability 0.974) with cleavage site + 
probability 0.336 between residues 57 and 58" + gene 8984..9955 + /gene="wchV" + /locus_tag="SPC23A_0011" + CDS 8984..9955 + /gene="wchV" + /locus_tag="SPC23A_0011" + /note="member of homology group 109" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33818.1" + /db_xref="GOA:Q4K0J8" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K0J8" + /translation="MEKLVSIILPVYNVEQYIKNCLESIQQQTYPNLEVIIVNDGSTD + KSVEYCEQICKIDSRFSITHKENGGLSDARNVGIDKAKGDYLIFVDSDDFVSQDMVSY + LVSCMENNEADIAICDPVHYYSDRQNNDLNIFSPASSVKVYETTEALCEMFYQKSFLV + SAWAKIFKRELFDDIRFPVGKLFEDSAIMYLLLEKCETIAYSDAKLYAYVHRDNSITT + KKFSDRDLDILEITNTIINHYGDNLRVYTAAVSYKVSACFRILLNSPSEEKYKKVQKE + CLSYILQNWRNILFNNNVRLKNKLALISITIFNPFVKLIYSKVNRWE" + misc_feature 8999..9511 + /gene="wchV" + /locus_tag="SPC23A_0011" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 1e-49" + gene 9962..11194 + /gene="wchW" + /locus_tag="SPC23A_0012" + CDS 9962..11194 + /gene="wchW" + /locus_tag="SPC23A_0012" + /note="member of homology group 110" + /codon_start=1 + /transl_table=11 + /product="putative transferase" + /protein_id="CAI33819.1" + /db_xref="GOA:Q9R924" + /db_xref="UniProtKB/TrEMBL:Q9R924" + /translation="MNKYEERYQENLSKNDFYKLINKSYLSDKELQVQQVKAGIVLPP + KAFETKLSNKLGLQKSLHGKGGVVDSNGNYIELSAQKAVGMRNRVYGPYKINYDNLPI + RNEKVIYLNYFIKQWGHFLLDVVGRLWYPLLQDNDTKLVYTCYAGTETKIEGNYLEFL + KLLGIDQSRLIMINCPTQFSEVIIPESSILPGGYYTKEYKQLFSSVVENIKLDKYDVN + AKMIYCSRSKLGIAKSKEFGEDGIEGIFKQNGYTSVYMETMSLEEQIKTLLSAKTIVL + TSGSLAHNLLFVNKDIDVFILNKTYRVNLHQFLINEISDATVRFVDIYRSPLPILYGY + GPFLMDLTKPLANFLDDNEFVYEKGTVLSKKDYFKYYLKWLWSYRFFLFRLNGIKEGN + SEFEKSFKIIRRYYKTGR" + gene 11196..12581 + /gene="wzx" + /locus_tag="SPC23A_0013" + CDS 11196..12581 + /gene="wzx" + /locus_tag="SPC23A_0013" + /note="member of homology group 111" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33820.1" + /db_xref="GOA:Q4K0J6" + /db_xref="InterPro:IPR002797" + 
/db_xref="UniProtKB/TrEMBL:Q4K0J6" + /translation="MSKYKELAKNTGIFALANFSSKILIFLLVPIYTRVLTTTEYGFY + DLVYTTIQLFVPILTLNISEAVMRFLMKDGVSKKSVFSIAVLDIFIGSIAFALLLLVN + NLFSLSDLISQYSIYIFVIFVFYTLNNFLIQFSKGIDKIGVTAISGVISTAVMLAMNV + ILLVVFDWGLLGFFIANVCGYVIPCIYIVSRLRLWELFEIKIDKKLQWEMVYYALPLV + LNILSWWVNNTSDRYIVTAIVGIQASAIISVAYKIPQILSTISAIFIQSWQISAIKIQ + EDKSGTTFVSNMLLYYNALLLIIASGIILFVKPISNILFGISFYSAWELVPFLIISSL + FNAISGCIGAIMGAKMDTHNIAKSALVGMIANIILNIVLTFLMGPQGITISTLIASFL + IFYMRKDSVKEINSETYRAIYLSWILLVVEACLLIYMDFIIGALIAMVINLFLLKDVI + KPLYLKIFKRN" + misc_feature 11214..12023 + /gene="wzx" + /locus_tag="SPC23A_0013" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 6.3e-67" + gene 12589..13737 + /gene="wchX" + /locus_tag="SPC23A_0014" + CDS 12589..13737 + /gene="wchX" + /locus_tag="SPC23A_0014" + /note="member of homology group 53" + /codon_start=1 + /transl_table=11 + /product="putative glycerol phosphotransferase" + /protein_id="CAI33821.1" + /db_xref="GOA:Q9R922" + /db_xref="InterPro:IPR007554" + /db_xref="UniProtKB/TrEMBL:Q9R922" + /translation="MIVLQYFKILARFVFMFLISAVLLPFKIKPNKIVFINFNGKGYG + DNPKSICEYLRTTYPDLDLVWLARDNEGFPDGVRVVKYGTFQAFYEQASSKVWVYNVR + AFARILKKRGQIYIQTWHGASSFKLIEKQADLPINYVLEAKYDARVTDIMISDSRKQT + EEFQKYFWYSGEIFEVGMPRNDALFHYKEDYDKLNNIRKELSIHSDDYVILYAPTFRD + DGDASYLDINFERLLQCVEHGIKKKCKFLIRLHPNHSHLCNNISFNKNIINATFYSDM + QELTLLADVLVTDYSSSIFDFMLLNKPYVRYVNDLEKYAELRGVSDTYYELPDSIIKT + AEELYDLLPKKIENFDYDSIKKYRNEILCPIFNGTASENVGRRIIQEL" + misc_feature 13177..13728 + /gene="wchX" + /locus_tag="SPC23A_0014" + /note="HMMPfam hit to PF04464, + CDP-Glycerol:Poly(glycerophosphate) gl, score 4.3e-73" + gene 13773..14801 + /gene="gtp1" + /locus_tag="SPC23A_0015" + CDS 13773..14801 + /gene="gtp1" + /locus_tag="SPC23A_0015" + /note="member of homology group 40" + /codon_start=1 + /transl_table=11 + /product="putative glycerol-2-phosphate dehydrogenase" + /protein_id="CAI33822.1" + /db_xref="GOA:Q9R921" + /db_xref="InterPro:IPR002658" + 
/db_xref="InterPro:IPR016205" + /db_xref="UniProtKB/TrEMBL:Q9R921" + /translation="MKNNDLKIGSGAIHQISATLSQNSISGKILYCADPVVDDLYGSI + VRSQIEEIGRVKEESCNYNTIAYAMNIAERAIATDIDCIVGMGGGRVLDVCKYASFIS + KRPYLSIPTTAANDGIASPVAVLKRQDDRPKSLGAAIPSMTLIDIDVIASGPIQNIKA + GIGDTISNYTALKDWELAVERGKDEMHGFAYLMSQNSLDALMKTKYNSITPDFIEVLV + NSLVLSGIAMDFAGSSRPVSGSEHLFSHALDYYGSTRNLHGIQVALGTVAVLKLIENS + VDTVVDYLQRFEVHINPKLLGIDEELFIYCMQHATKMRSNRYTYLHEVDLSTDRLKQI + YKELISEL" + misc_feature 13794..14714 + /gene="gtp1" + /locus_tag="SPC23A_0015" + /note="HMMPfam hit to PF01761, 3-dehydroquinate synthase, + score 2.9e-70" + gene 14817..15521 + /gene="gtp2" + /locus_tag="SPC23A_0016" + CDS 14817..15521 + /gene="gtp2" + /locus_tag="SPC23A_0016" + /note="member of homology group 41" + /codon_start=1 + /transl_table=11 + /product="putative nucleotidyl transferase" + /protein_id="CAI33823.1" + /db_xref="GOA:O85005" + /db_xref="InterPro:IPR005835" + /db_xref="UniProtKB/TrEMBL:O85005" + /translation="MKALILAAGLGTRLAPITNEVPKSLVPVNGKPILMKQIENLYQN + NITDITIIAGYKSSVLTDAVTEKYPEINIIDNVDFKTTNNMYSAYLGKAAMGDSDFLM + MNADVFYDASVIKSLLLHKAPNAIVTDLGIYIEESMKVVEKNGRLVEISKQISPEETL + GASIDVYKFSYEAGARFFEKCKEFIEDKRELQMWSEVALNAILSEVEFVACPLEGRWL + EIDNHEDLVAAEKLFA" + misc_feature 14820..15518 + /gene="gtp2" + /locus_tag="SPC23A_0016" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 1e-07" + gene 15536..16369 + /gene="gtp3" + /locus_tag="SPC23A_0017" + CDS 15536..16369 + /gene="gtp3" + /locus_tag="SPC23A_0017" + /note="member of homology group 42" + /codon_start=1 + /transl_table=11 + /product="putative phosphotransferase" + /protein_id="CAI33824.1" + /db_xref="GOA:Q4K0F2" + /db_xref="InterPro:IPR005834" + /db_xref="InterPro:IPR006357" + /db_xref="UniProtKB/TrEMBL:Q4K0F2" + /translation="MKLTNRVDYFGADISELQNKKLFLFDMDGTIYEEDRLFEGTLEL + LDYIHNIGGEYIFITNNSSKSVVDYVEKVNRLGIKAERDNFFTSAQATIVYIKENYPK + SKVYCQGTKSLIKELSDAGIDVTEQVSADIDVVLVGFDTELTSDKIRNTCEILSTKDV + PFIATNPDIRCPVSFGFIPDCGSICDMISKSVDRKPVYIGKPEPTMVDIVRKKLNYSL + 
FETVVIGDRLYTDIMTGINAGVTSVCVLTGEATVNDIQQDSIKPTYTFKNVKEMWKGI + V" + misc_feature 15593..16279 + /gene="gtp3" + /locus_tag="SPC23A_0017" + /note="HMMPfam hit to PF00702, haloacid dehalogenase-like + hydrolase, score 5.9e-25" + gene 16529..17398 + /gene="rmlA" + /locus_tag="SPC23A_0018" + CDS 16529..17398 + /gene="rmlA" + /locus_tag="SPC23A_0018" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI33825.1" + /db_xref="GOA:Q4K0F1" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q4K0F1" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLPRFKELLQDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFIGDDSV + ALILGDNIYHGPGLSTMLQKAAKKEKGATVFGYHVKDPERFGVVEFDENMNAISIEEK + PEYPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRRGYISREDVLALAQSLKKN + EYGQYLLRLIGEA" + misc_feature 16532..17248 + /gene="rmlA" + /locus_tag="SPC23A_0018" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 3.7e-121" + gene 17399..17992 + /gene="rmlC" + /locus_tag="SPC23A_0019" + CDS 17399..17992 + /gene="rmlC" + /locus_tag="SPC23A_0019" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI33826.1" + /db_xref="GOA:Q9AHA9" + /db_xref="HSSP:1NXM" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:Q9AHA9" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKNHPLLKDVKPLKKEDL" + misc_feature 17435..17965 + /gene="rmlC" + /locus_tag="SPC23A_0019" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 4.5e-16" + 
gene 18005..19054 + /gene="rmlB" + /locus_tag="SPC23A_0020" + CDS 18005..19054 + /gene="rmlB" + /locus_tag="SPC23A_0020" + /EC_number="4.2.1.46" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI33827.1" + /db_xref="GOA:Q9AHA8" + /db_xref="HSSP:1KEP" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q9AHA8" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPDVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAVD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 18020..18976 + /gene="rmlB" + /locus_tag="SPC23A_0020" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 9.7e-05" + misc_feature 18023..18763 + /gene="rmlB" + /locus_tag="SPC23A_0020" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 5.4e-77" + misc_feature 18026..18838 + /gene="rmlB" + /locus_tag="SPC23A_0020" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/iso, score 1.6e-05" + gene 19120..19971 + /gene="rmlD" + /locus_tag="SPC23A_0021" + CDS 19120..19971 + /gene="rmlD" + /locus_tag="SPC23A_0021" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI33828.1" + /db_xref="GOA:Q4K0E8" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K0E8" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITDAEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGRELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT 
+ TWYDFAVEILKGTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 19120..19968 + /gene="rmlD" + /locus_tag="SPC23A_0021" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 1.6e-147" + misc_feature 19123..19764 + /gene="rmlD" + /locus_tag="SPC23A_0021" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 9.3e-05" + misc_feature 19123..19752 + /gene="rmlD" + /locus_tag="SPC23A_0021" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 1.4e-19" + misc_feature 19126..19854 + /gene="rmlD" + /locus_tag="SPC23A_0021" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 1.4e-08" + gene order(20047..21000,21011..21232) + /gene="tnp" + /locus_tag="SPC23A_0022" + /pseudo + CDS join(20047..21000,21011..21232) + /gene="tnp" + /locus_tag="SPC23A_0022" + /note="member of homology group 12" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1670 transposase" + misc_feature 20053..20496 + /gene="tnp" + /locus_tag="SPC23A_0022" + /note="HMMPfam hit to PF03050, Transposase IS66 family, + score 7.1e-05" + /pseudo + gene 21428..>21475 + /gene="aliA" + /locus_tag="SPC23A_0023" + CDS 21428..>21475 + /gene="aliA" + /locus_tag="SPC23A_0023" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33830.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ89" + /translation="MMKSSKLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acactgcggc taaagaagta cttgaaaaac aggtcttggc tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcgta taaaaacaag + 181 ggaagactgt ataaaaggca gaaatccttt gttttttata accaaggttt ataaaccttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactatta aggagaaata agacgaacat + 301 aaagaagcgt atccttagtg caggcctgac ttttacatct gatttgcttt tagctgcttg + 361 cggccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaactat ctattagact attacgctga taatatagtc aattgaaaca agaacaggac + 481 
aaaagagcct cataaaaggt attgcaactt ggtaatacct ttttgaggtg ctttttgata + 541 tgagcccatg ttttctcaat aggattgtac tcaggtgagt agggaggaag aggtaaaagt + 601 ttatgcccaa actcttcaca caagagttct aacttaccca ttctatggaa tcttgcatta + 661 tccataataa taaccgatgg tgtggttaat gttggtaaga aaaacttctg aaaccatact + 721 tcaaaaaagt cgctcgtcat cgtctcttcg taagtcattg gagcgattaa ttcaccattt + 781 gttagacctg caaccaaaga aatcctctga tatcttcttc cagatacttt gcctcttctt + 841 aactgacctt ttaatgagcg accatattct cgataaaaat aagtatcgaa tcctgtttca + 901 tcaatctaaa caggtgctag gtgctttaaa ctattaaaat tcttaagaaa taaggctact + 961 ttttctgggt cttgttcata attagattga aactagaata gtacacatct gcttctaaaa + 1021 cattgttaga aaacgatttg actgtcctga acaatttgtc atgttcttgt ttcattttac + 1081 tatatttttg gttcgcggga agtctactaa gatacttaaa gatgcagata gtgaaaaaaa + 1141 ggtgtagaca ttaccgtaaa aaagtgatat aatcgtatga tgttcaatgt ataggtgtta + 1201 atcatgagta gacgttttaa aaaatcaggt tcacagaaag tgaagcgaag tgttaatata + 1261 gttttgttga ctatttattt attgttagtt tgttttttat tgttcttaat ctttaagtac + 1321 aatatccttg cttttagata tcttaatcta gtggtaactg cgttagtcct actagttgcc + 1381 ttggtagggc tacttctgat tatctataaa aaagctgaaa aatttactat ttttctgttg + 1441 gtgttctcta tccttgtcag ctctgtgtcg ctctttgcag tacagcagtt tgttggactg + 1501 accaatcgtt taaatgcgac ttctaattac tcagaatatt caatcagtgt cgctgtttta + 1561 gcagatagtg atatcgaaaa tgttacgcaa ctgacgagtg tgacagcacc gactgggact + 1621 gataatgaaa atattcaaaa actactagct gatatcaagt caagtcagaa taccgatttg + 1681 acggtcaacc agagttcgtc ttacttggca gcttacaaga gtttgattgc aggggagact + 1741 aaggccattg tcctaaatag tgtctttgaa aatatcatcg agtcagagta tccagactat + 1801 gcatcgaaga taaaaaagat ttataccaag ggattcacta aaaaagtaga agctcctaag + 1861 acgtctaaga atcagtcttt caatatctat gttagtggaa ttgacaccta tggccctatt + 1921 agttcggtgt cgcgatcaga tgtcaatatc ctgatgactg tcaatcgaga taccaagaaa + 1981 atcctcttga ccacaacgcc acgtgatgcc tatgtaccaa tcgcagatgg tggaaataat + 2041 caaaaagata aattaaccca tgcgggcatt tatggagttg attcgtccat tcacacctta + 2101 gaaaatctct atggagtgga tatcaattac 
tatgtgcgat tgaacttcac ttcgtttttg + 2161 aaattgattg atttgttggg tggaattgat gtttataatg atcaagaatt tactgcccat + 2221 acgaatggaa agtattaccc tgcaggcaat gttcatcttg attcagaaca ggctctcggt + 2281 tttgttcgtg agcgctactc actagcagat ggcgatcgtg accgcgggcg caatcaacaa + 2341 aaggtgattg tggctatcct tcaaaaatta acgtcaaccg aagcactgaa aaattatagc + 2401 acgatcatta atagcttgca agattctatc caaacaaata tgccacttga gactatgata + 2461 aatttggtca atgctcagtt agaaagtgga gggaattata aagtaaattc tcaagattta + 2521 aaaggtacag gtcggacgga tcttccttct tatgcaatgc cagacagtaa cctctatgtg + 2581 atggaaatag atgatagtag tttagctgta gttaaagcag ctatacagga tgtgatggag + 2641 ggtagataaa atgatagaca tccattcgca tatcgttttt gatgtagatg acggtcccaa + 2701 gtcaagagag gaaagcaagg ctctcttgac agaatcctac aggcaggggg tgcgaaccat + 2761 tgtctctacc tctcaccgtc gcaagggcat gtttgaaact ccggaagaga agatagcaga + 2821 aaactttctt caggttcggg aaattgcaaa agaagtagca gatgatttag tcattgctta + 2881 tggcgcagag atatactata ctctggatgc tctagaaaag ctagaaaaaa aagaaattcc + 2941 taccctcaat gatagtcgtt atgccttgat agagtttagt atgaacactc cttatcgcga + 3001 tatccatagc gccttgagca agatcttgat gttgggaatt actccagtca ttgcccacat + 3061 tgagcgctat gatgctcttg aaaataacgg aaaacgtgtt cgtgaactga ttgatatggg + 3121 gtgctatact cagataaata gttatcatgt ttcaaaacct aagttctttg gtgaaaaata + 3181 taaattcatg aaaaagagag ctcggtattt tttggaacgt gatttagttc atgtagttgc + 3241 aagtgatatg cacaatttag acagtagacc tccatatatg caacaggcat atgatatcat + 3301 tgctaagaaa tatggagcga aaaaagcgaa agaacttttt gtagataatc ccagaaaaat + 3361 tataatggat caattaattt aggagaaaat atgaaggaac aaaacacttt ggaaatcgat + 3421 gtattgcaac tattcagagc tttatggaaa agaaagttgg tcattttatt agtggcaatt + 3481 ataacttctt cggttgcttt tacctacagt acttttgtta tcaaacctga gtttactagt + 3541 acgactcgga tttatgtagt taaccgtaat cagggagaga agtctggttt aaccaatcaa + 3601 gacttgcagg caggaacata cttggttaaa gactatcgtg aaattatcct atcgcaggat + 3661 gttttggagg aagttgtttc tgatttgaaa ctagatttga cgccaaaagg tttggctaat + 3721 aaaattaaag taacagtacc agttgatacc cgtattgtct ctgtttcagt 
taatgatcga + 3781 gttcctgaag aggcaagccg tatcgctaac tctttgagag aagtagctgc tcaaaaaatt + 3841 atcagtatta ctcgtgtttc tgatgtgaca acactggagg aggcaagacc ggcgatatcc + 3901 ccgtcttcgc caaatattaa acgcaatata ctaattggtt ttttggcagg ggtgattgga + 3961 actagtgtta tagttcttct tcttgaactt ttagacactc gtgtgaaacg tccggaagat + 4021 atcgaagata cactgcagat gacacttttg ggagttgtac caaacttgaa taagttgaaa + 4081 taggagagag agatgccgac attagaaata gcacaaaaaa aactggagtt cattaagaag + 4141 gcagaagaat attacaatgc cttgtgtaca aatatacagt tgagcggaga taaactaaaa + 4201 gtaatttccg ttacttctgt tagccctggg gaaggaaaaa caactacttc cgtaaatata + 4261 gcatggtcgt ttgcgcgtgc aggctataaa actcttttga tcgatggcga tactcgaaat + 4321 tcagttatat caggattttt taaatctcgt gaaaaaatta cagggctaac agaattttta + 4381 tctgggacag ctgatttatc tcacggttta tgtgatacaa atattgaaaa tttatttgta + 4441 gttcaatcgg gatctgtatc accaaaccct acagccttgt tacaaagtaa aaattttaat + 4501 gatatgattg aaacattgcg taaatatttt gattatatca ttgttgatac agcacctatt + 4561 ggaattgtta ttgatgcggc aattatcact caaaagtgtg atgcgtccat cttggtaaca + 4621 gcaacaggtg aggcgaataa acgtgatgtc caaaaagcga aacaacaatt aaaacaaaca + 4681 ggaaaactgt tcctaggggt tgttttaaat aaattagata tctcggttga taagtatgga + 4741 gtttacggtt tctatggaaa ttatggtaaa aaataattta ggaaagattc tatggatgaa + 4801 aaaggattga aaatttttat ggcagtatta cagagtatta ttgtcatttt attggtttat + 4861 tttcttagct ttgttagaga gacagaactt gaacgttctt cgatggttat actatacctt + 4921 ctccactttt ttgtattcta tgttagttcc tatggtaaca atttttttaa aagagggtac + 4981 ctagttgagt ttaatagtac tataagatat atttttttct ttgcaatagc tataagtgta + 5041 ttaaactttt ttatagcgga acggtttagt atctctagaa gaggaatggt atacttctta + 5101 actttagaag gaatatcctt atacttgtta aatttcttag taaagaaata ttggaaacat + 5161 gtgtttttta atctaaaaaa tagcaagaaa attttactgt taacagtaac gaaaaatatg + 5221 gaaaaagttc ttgataaatt gctagaatct gatgaacttt catggaagtt ggtagcagta + 5281 agtgttttga ataaatctga ttttcaacat gataaaatac ctgtaattga aaaggaaaaa + 5341 attattgaat ttgcaacgca tgaagttgtg gatgaggtgt ttgtcaatct tccaggagag + 5401 agctacgata 
ttggagaaat tatctctagg tttgagacaa tggggataga tgtaactgta + 5461 aatcttaaag catttgataa gaatttgggt cgcaataaac aaattcatga gatggtagga + 5521 ttgaatgtag tcactttctc tacaaatttt tataaaacta gtcatgtgat ttcaaagaga + 5581 attctcgata tttgtggtgc cactattggc cttattcttt ttgctatagc tagtctagtt + 5641 ttagttccat tgattcgtaa agatggcgga ccagctattt ttgctcaaac tcgtataggg + 5701 aaaaatggtc gacattttac cttttataaa ttccgttcga tgaggatcga tgctgaagct + 5761 atcaaagaac agttgatgga tcaaaatacg atgcaaggtg gtatgtttaa gatagacaat + 5821 gatcctcgtg ttacaaaaat tggtcgcttt attcgtaaaa ccagtttaga tgaattgccg + 5881 cagttttgga atgtctttat aggagatatg agtttggtgg gaacacgtcc acctacagta + 5941 gacgagtatg atcagtatac tccagaacaa aaacgtcgac tcagctttaa acctggtatt + 6001 acaggtttat ggcaggttag cggccgtagt aaaataaccg attttgacga tgttgtaaaa + 6061 ttagatgtgt cttatattga taattggaca atctggaaag atattgaaat tttgcttaaa + 6121 actgttaaag ttgtatttat gagagatgga gcgaagtaat ttctgtatat ccatcatatt + 6181 aggagagaaa tgaaaaagtc agtttatatc attggttcaa aaggaattcc tgctaagtat + 6241 ggaggatttg aaacttttgt tgaaaaatta acagccttcc aacaagataa ggctatccaa + 6301 tattatgtgg cttgtatgcg tgaaaactct gcaaaatcag ggactactga ggatgttttt + 6361 gaacataatg gtgctatctg ttataacgtc gatgttccta atattggtcc agcgcgagcc + 6421 atagtatatg atatcgcggc aattaacaga gctattgaaa ttgccaaaga aaataaggat + 6481 gaagatccaa tcttctatat tttagcttgt cgaatcggtc cgttcatcca tggaattaag + 6541 aaaaaaatcc aggcgatagg tgggactctt ctagttaatc cagatggtca cgagtggtta + 6601 cgagctaagt ggagcactcc agttcgtcgt tattggaaaa tttccgaagg tcttatggtc + 6661 aaacatgcag atttattggt ttgtgacagt aaaaatatcg aacagtatat ccaagaagat + 6721 tataaacagt tccaacctaa gaccacctat atcgcttatg ggaccgatac aacacgctcc + 6781 atattaaaga gtagtgatga aaaagtacgt tcttggttca aagagaagaa tgtttctgag + 6841 aacgagtatt atctagttgt aggacgattt gttccagaga ataactatga atctatgatt + 6901 cttggcttct tggcttctaa ctctaagaag gactttgttt taattacaaa tgtagaacag + 6961 aataaatttt ataatcagtt gttggcaaaa actggttttg ataaagatcc acgagtaaaa + 7021 tttgtaggga cagtctacaa ccaagagctt 
ctaaagtata ttcgagaaaa tgcttttgct + 7081 tacttccacg ggcatgaagt tggtggaaca aatccttcgt tacttgaagc attagcatcc + 7141 acaaagttaa acttactact cgatgttggc tttaaccgag aagtagctga ggatggtgct + 7201 gattactggg aaaaagataa tcttcataag gttattgaag cgagtgaaca aaaaacacaa + 7261 gaagagataa atgaaaaaaa tatactgtca acaaagcaag tgacggagcg cttctcttgg + 7321 gatttgatag ttaatgagta tgagaaactt tttacgagaa aaaactagaa actcataagg + 7381 gattatttga ataaataagt ttttgctttt tctcattgat agaacaataa gattgcttta + 7441 gtaaataata attagaaaac tgtatataaa atttcataat atggaaaatg agtttcgaag + 7501 agaagagtac atatgtcatg aatgtagtaa ttgataacag aaaattaggg gggataagtt + 7561 gaaagtagat atgatttttg aggtacggaa taatgagaat tagttttagt aaaaaaacta + 7621 tgctgtgtgg tttattgtat attggtttaa ttttatccgt agtaacaata cctacaattg + 7681 taacattttt atattctttg ctattcatcg ggattgtaac agtcttaaat tataattcta + 7741 ttctagcaag tgacgaagat gcgaactctt tttttgttgc attacctatt attttatctt + 7801 cttttcaaaa tgtatatttg ggatttggag cggatcgatt aaattctgtc acactacaag + 7861 ttctgctatc tattagcatt gctattatta caattacagt ttttctaggt attatcttaa + 7921 atagattcaa atcaaaagaa tttagttggt tagttttaag tattcttgta attataattc + 7981 aatcagtaat tcttttaata ttctttccca ctaccttgcc agcatattta tcatctatga + 8041 gaaatatact agccccacta ctgatttttt atttttctat ctatgggttt aaaaatatta + 8101 atttacaaaa attttataaa tatatgttca taattatatt agttgttcta atttttggat + 8161 ttattgagta tatatacgga aatagtttat ggacaagatt gaatattaaa aagctttggg + 8221 ctttgaaggg gctggcgatt gagaataggg ttgttcctgg gaattggcac tcttctgaat + 8281 taattggcgg taaacaatta aggcgtatgg tttcaacatt tgccgatccc gtaaatctag + 8341 gttcgtatct ctttgcggca tttatgttag cttggtacaa aaataagaaa ctacttcaag + 8401 ttttattgct cgcttctttt gtactcagtg taagtaaagc agcgttttta agcatgttgg + 8461 tatatataat aatttatacc tgggttgtgg ataaaaataa aattttatcg atttttggaa + 8521 taataatttc aactgtattg gggttgtatt tttataattt tagtcaagtt agcagttatg + 8581 gtagtataaa tgcacatatc gatggttttt ttagtgcgtt aagtactccc ctccattacc + 8641 catttggtat gggagtaggg agtgtgggag ttctagcttc aaaattaggt 
tcacaaacag + 8701 cactttcttc agaggtttta gaaacaggaa ttggaatgat aattgctcaa ttaggattcg + 8761 tgggtgtgat aatatatttg attttctttg taaaactctc cgtaatagga aagaatatta + 8821 ataataaaag agataaaatt ttatggttta ctttaattta tagctttttg gctaatgcct + 8881 tttttaacga ggttgcactt tctcctaact catgcacctt atatttttta attttaggac + 8941 tgctttataa taaaaataaa attagaagca cagagtttag ttaatggaaa aattagttag + 9001 tattattctg cccgtctaca atgtcgaaca gtatataaaa aattgtttag aatcaattca + 9061 acaacaaact tatccaaatt tggaagtaat cattgttaat gacggttcaa ccgataaaag + 9121 cgttgaatat tgtgagcaaa tttgtaagat agattctagg ttttctatca ctcacaaaga + 9181 aaatggtgga ctttccgatg caagaaatgt cggtatagat aaagccaagg gagattacct + 9241 catttttgtt gacagtgatg attttgtttc tcaagatatg gtatcttatt tagtatcttg + 9301 tatggagaac aatgaggcag acattgctat ttgcgatcct gttcattatt atagtgatcg + 9361 tcaaaacaat gatcttaata ttttttctcc agcatcaagc gttaaggttt acgaaacaac + 9421 ggaggctcta tgtgagatgt tttatcaaaa atcttttttg gtgtctgcct gggccaagat + 9481 atttaaaaga gagttgtttg atgatataag atttcctgta ggtaagctat ttgaagatag + 9541 tgcgattatg tatttgctcc tcgaaaagtg tgaaacaatt gcatactctg atgcgaaatt + 9601 atatgcttat gtacacaggg ataatagtat cacaacaaag aaattttcgg atagagactt + 9661 agatattttg gagattacga acacaattat taatcactat ggtgataatt tacgcgtgta + 9721 tactgcagcg gtgtcttata aggtatctgc atgtttcaga attctattaa actcaccttc + 9781 tgaagaaaag tataaaaaag tacaaaaaga atgtttgagt tatattttac aaaattggag + 9841 aaacatatta tttaataata atgttcgatt gaagaacaag cttgccttaa tttctataac + 9901 tattttcaat ccttttgtta aattgatcta tagtaaagta aacagatggg aatgatagca + 9961 aatgaacaaa tatgaagaaa gatatcaaga aaatttatct aagaatgatt tttataaatt + 10021 aattaataag agttacttat cagataaaga acttcaagta caacaagtaa aagctgggat + 10081 agtcttacca ccaaaggcat ttgaaacaaa attatcaaat aaacttggcc tacaaaaatc + 10141 tttgcatgga aagggtggag ttgtagactc aaatggaaat tacattgaac tatctgcaca + 10201 aaaagcagtc gggatgagaa atagagtcta tggtccgtat aaaattaatt acgataatct + 10261 gccaattaga aatgaaaaag taatctattt gaactatttc atcaaacaat ggggacattt + 10321 
tttactggat gttgttggaa ggttatggta tccattgctg caggataatg atactaagtt + 10381 agtctatacc tgctatgctg gaacagaaac aaagattgag ggaaactatt tagagttttt + 10441 gaagcttctc ggcatagatc aatcacgttt aatcatgata aactgtccca ctcagttctc + 10501 agaagtcatt attcctgaaa gctccatttt accgggggga tattatacaa aagagtataa + 10561 acaactattc agttcggtag tagaaaatat taaattggac aagtatgatg tgaatgctaa + 10621 aatgatttat tgttcgaggt ctaaattagg gattgctaaa agtaaagaat ttggcgaaga + 10681 cggtattgag gggattttta aacaaaatgg ctatacatct gtttacatgg aaacaatgtc + 10741 tttggaagag caaataaaaa ccttattatc ggctaagaca atagtattaa cgagtggttc + 10801 gttagcacat aatcttttat ttgtaaataa agatattgat gtttttattt tgaataaaac + 10861 ctatagagta aatctccatc aatttttaat aaacgagatc tcagatgcta cagtaagatt + 10921 tgtagatatc tatcgatcac ctttaccgat tttatacgga tatggaccat ttttaatgga + 10981 tcttacaaaa cctttggcta atttcttgga cgataatgaa tttgtatatg aaaaaggtac + 11041 tgttttaagt aaaaaagatt attttaaata ctatttgaaa tggttgtgga gttatagatt + 11101 ctttttattt aggttaaatg gtattaaaga aggaaatagt gaattcgaga agagttttaa + 11161 gataattagg agatactata aaacaggacg atagaatgag taaatataag gaattagcaa + 11221 aaaatacagg tatttttgct ttggctaact tttcatcaaa gattttaatt tttttgttag + 11281 tacctatata tacacgggta cttaccacta cggaatatgg tttttatgac ttagtctata + 11341 caactattca gctttttgta ccaatcttga cattaaatat atctgaagcc gttatgaggt + 11401 tcctaatgaa agatggtgtt tctaaaaaat cagtcttttc aattgctgtt ttagatatat + 11461 ttattggatc aattgctttt gctttattgt tgttagtaaa taacctgttt tctttatcag + 11521 atttaatttc tcaatacagt atttacatat ttgtaatctt tgttttctat accctaaata + 11581 attttttgat acaattttct aagggaattg ataaaattgg tgttacagct atctctgggg + 11641 tcataagtac agcagttatg cttgccatga atgtcattct tctagtagta tttgattggg + 11701 gattgttagg tttctttatt gctaatgttt gtggatatgt tataccttgt atttatatag + 11761 tttctagatt aagattgtgg gaattatttg aaattaagat tgataaaaaa ttacaatggg + 11821 aaatggttta ctatgctttg ccattagttt taaatatatt aagctggtgg gtaaataata + 11881 cttcagatag atatattgtg actgcaatag taggtataca agctagtgca attatttcag + 11941 
tcgcttataa aattccacag attttgtcta cgattagtgc aatttttatt caatcatggc + 12001 aaatctctgc aattaaaata caagaagata agagcggtac tacatttgta tcaaacatgc + 12061 tcctatacta taatgcactt ctattgatta tagcgagtgg tatcatatta tttgtcaaac + 12121 ctatttctaa tatattgttt ggtatttcct tctattctgc gtgggagctg gtaccatttt + 12181 taataattag cagtctattc aatgcaattt caggttgtat aggagcaatt atgggagcta + 12241 aaatggatac tcataacatt gcaaagtcgg ctttagttgg gatgattgca aatattattt + 12301 taaatatagt gttaacattc ttaatgggtc cacagggaat tacaatttct accctgatag + 12361 ctagttttct tattttttat atgcgaaaag atagtgtaaa agaaattaat tcagaaacat + 12421 atagagcaat ttatttatcg tggatactat tagttgtaga ggcctgtctg ctaatttata + 12481 tggattttat tattggtgct ttaatagcaa tggtaataaa cttattttta ctaaaagatg + 12541 ttatcaaacc tttatattta aaaattttca aaagaaatta ggtacaaaat gattgtttta + 12601 caatacttta agattttagc tagattcgtt tttatgtttt tgataagtgc ggtgttactg + 12661 cctttcaaaa taaaacctaa taagattgtt tttattaatt tcaatgggaa aggatatggt + 12721 gataatccga aaagtatttg tgagtatctt agaactactt acccagattt agatttggtt + 12781 tggcttgcaa gagataacga aggttttcca gatggggtta gggttgttaa atatgggact + 12841 ttccaagctt tttatgagca agcgagttcg aaggtttggg tatataatgt aagagctttt + 12901 gcaagaatac taaaaaaacg aggacagatt tatattcaaa cttggcatgg tgcttctagt + 12961 tttaagttga tagaaaaaca agctgattta ccaataaatt atgttttaga agctaagtat + 13021 gatgcaagag tcacagatat aatgatttca gatagcagaa aacaaactga agaatttcaa + 13081 aagtattttt ggtattcagg agaaattttt gaggtgggga tgccgagaaa tgatgccttg + 13141 tttcactata aggaagacta cgacaagtta aataatatca gaaaagaact aagcattcat + 13201 tcagatgatt atgttatttt atatgcccct actttcagag atgatgggga tgcatcttat + 13261 ttagatataa attttgaacg gcttttgcaa tgtgttgaac acggaattaa aaagaaatgt + 13321 aaattcttaa ttaggttaca ccctaatcac tcccatttgt gtaataatat ttcatttaat + 13381 aagaatataa tcaatgctac gttttattca gatatgcaag agcttacttt gttggcagat + 13441 gttttagtca cagattattc ttcctcgata tttgatttta tgcttttaaa caagccttat + 13501 gtcagatatg tgaatgattt agaaaaatat gctgagctta ggggggtatc agatacatat + 13561 
tacgaattgc cggattcgat tattaaaact gctgaagaat tgtatgactt actgcctaaa + 13621 aaaatagaaa attttgatta tgattctata aaaaaatata gaaatgaaat actgtgtcca + 13681 atctttaatg gaaccgctag tgaaaatgta ggaaggagaa taattcaaga gttgtgaagt + 13741 aaaacattgg gttattttta aggtaacgag atttgaaaaa taatgattta aagataggaa + 13801 gtggagctat tcatcaaatt tccgctacac tttctcaaaa tagtatttcg ggaaagattt + 13861 tatattgtgc tgatccagtt gtcgatgact tgtacggttc gatagtacgt tcacaaatag + 13921 aggaaattgg tcgggtaaag gaagaaagtt gcaattataa tactattgct tatgcgatga + 13981 atatagcaga acgggctatt gccacagata ttgactgtat tgtgggaatg ggaggaggtc + 14041 gtgttttaga tgtctgcaag tatgcatctt ttatttcgaa acgtccttac ctatcgattc + 14101 cgacaacagc agcaaatgat ggcattgctt ccccagttgc tgttttgaaa aggcaggatg + 14161 atagaccaaa aagcttaggg gcggctatcc cctcaatgac actaattgat attgatgtta + 14221 ttgcatcagg acctatacaa aatataaaag ctggtatcgg tgatacaata tccaattaca + 14281 ctgcattgaa agattgggag ttggcagttg agcgagggaa agatgagatg catggttttg + 14341 catatctaat gtcgcaaaat tctttagatg ctttaatgaa aacgaagtat aattctatta + 14401 cccctgattt tattgaagtt ttggtaaact ctttagtttt atcaggcatt gcaatggatt + 14461 ttgcgggaag tagtagacct gtcagtgggt cagagcactt atttagtcat gcattagatt + 14521 actatggttc tacaaggaat cttcatggaa ttcaggttgc attaggtaca gtcgcagttt + 14581 tgaaattaat tgaaaattct gttgatactg tagtggatta cttgcaaaga tttgaggttc + 14641 atattaaccc gaaacttttg gggatagatg aagagttgtt tatttattgt atgcaacatg + 14701 ctacaaaaat gagaagtaat cgctatacct atctgcatga agttgatctt agcacagata + 14761 gattgaaaca aatatataag gaactcataa gcgagttgta gagaagagag gaaaaaatga + 14821 aagcacttat tttagcagca gggttaggaa cacgtctagc tccaattacc aatgaggtac + 14881 caaaatcttt ggtaccagtc aatggtaagc caattttgat gaaacaaatt gaaaatttat + 14941 atcaaaataa tattacagat attacgatta ttgctggata taagtcatct gtattaacag + 15001 atgcagttac tgaaaagtat ccagaaatta atattattga taatgttgat tttaaaacga + 15061 ctaataatat gtattcagcc tatctaggaa aagctgcaat gggtgatagt gacttcttaa + 15121 tgatgaatgc agatgtattt tatgatgctt ctgttattaa aagtctgttg cttcataaag + 15181 
ctccaaatgc aattgtaact gatttaggta tttatattga agagtctatg aaagtcgtag + 15241 aaaaaaatgg tcgtttagta gaaatttcta aacagatttc acctgaggaa actttaggag + 15301 cttctattga tgtttataaa ttctcttatg aagcaggtgc tcgattcttt gaaaagtgta + 15361 aggaatttat tgaagataaa cgagaacttc aaatgtggag tgaggttgct cttaatgcaa + 15421 ttctttctga agttgaattt gtagcatgtc cattagaggg tcgttggtta gaaattgata + 15481 atcatgaaga cttagttgct gcagaaaaac tatttgcttg aaccgaatac ggagaatgaa + 15541 attgacaaat agagttgatt attttggtgc tgatattagt gaacttcaga ataaaaaatt + 15601 attcttattt gatatggatg gtaccattta tgaagaagat aggttgtttg agggtactct + 15661 cgaattatta gactatattc ataatattgg cggtgagtat atttttatta caaacaattc + 15721 atctaagtct gttgttgact atgttgaaaa agttaacaga ttaggtatta aagctgaacg + 15781 agataatttt tttacctctg ctcaagccac aattgtttat attaaagaaa attatcctaa + 15841 atctaaagtt tattgccaag gaacaaaatc tttgataaaa gaactatctg acgcaggaat + 15901 tgatgtaact gagcaagtta gtgctgatat agatgttgtt cttgttggtt ttgatacaga + 15961 attaaccagt gataaaattc gcaatacctg cgagattcta tcaacaaagg acgtaccttt + 16021 catagctact aaccctgata ttcgctgccc agtatcgttt ggattcatcc cggattgtgg + 16081 ttctatttgt gatatgatta gtaaatcagt cgataggaaa cctgtttaca taggtaaacc + 16141 tgaacctacg atggttgata ttgttcgaaa aaaattaaat tattctctat ttgaaacagt + 16201 tgtgattgga gatcgcttgt atacggatat catgactggt ataaatgcag gagtaacttc + 16261 agtttgtgtg ctgacaggag aagcaacggt gaatgatatt caacaagata gtataaaacc + 16321 gacttataca tttaaaaacg tgaaagaaat gtggaaagga attgtctgat tttttcattc + 16381 tgaatagtga attcatgaat actgtcaaaa tactcgtatg tatttaaatt gattttatta + 16441 ttttaataat ggacaaatta aaattatttt tctccccaaa tcgttcgtga acgtaaagta + 16501 ctcatcaaca aagaaaggta ccccttttat gaaaggtatt attctagcag gtggttcggg + 16561 aactcgcttg tatcctttga ctcgcgctgc atcaaaacaa cttatgccgg tttatgataa + 16621 accgatgatt tactacccac tttcaacatt aatgttggct gggattaggg atattttgat + 16681 tatctcaact cctcaagatt tgcctcgttt taaagagctt cttcaagatg gttctgagtt + 16741 tggtattaaa ctttcttatg ctgagcaacc aagtccagat ggtttggcac aagcctttat + 16801 
cattggggaa gagtttatcg gtgacgatag cgttgccttg attttaggtg acaatatcta + 16861 ccatggtcct ggtctgagca caatgcttca aaaagcagcc aagaaagaga aaggtgcgac + 16921 tgtttttggc taccatgtca aggatccaga acgctttggt gttgtagaat ttgatgaaaa + 16981 tatgaatgct atctccatcg aagaaaagcc agaataccct cgttcaaact atgcagtgac + 17041 aggactctat ttctatgata atgatgtagt agagattgcc aaaagtatta aaccaagtcc + 17101 tcgtggtgaa ttggaaatta cagatgtcaa caaggcttac ttggatcgtg gtgatttgtc + 17161 tgttgagctc atgggacgtg gttttgcttg gttggatact ggcactcatg aaagtttact + 17221 agaggcttcg cagtacatcg aaacagtcca acggatgcaa aatgttcagg tagcaaactt + 17281 agaagaaatt gcttaccgta ggggctatat cagtcgagaa gatgtattgg ccttagccca + 17341 atcacttaag aaaaatgaat acggacagta tctgctccgt ttgattggag aagcatagat + 17401 gacagataat tttttcggta agacgcttgc ggcacgcaag gttgaagcta ttccaggcat + 17461 gttggagttt gatatccccg ttcatggaga taatcgtggc tggtttaaag aaaatttcca + 17521 aaaggaaaaa atgcttccac ttggatttcc agagtctttc tttgcagaag gaaaattgca + 17581 aaacaatgta tccttctcac gtaaaaatgt ccttcgaggc ctccacgcag agccttggga + 17641 taagtacatc tctgtagcag atggagggaa agttctgggt tcttgggttg atctacgcga + 17701 gggtgaaacc tttgggaata cctatcagac agtgattgat gcgagtaagg gaatctttgt + 17761 tcctcgaggc gtagctaatg gcttccaagt tttatcagat acagtgtcat atagctatct + 17821 ggtcaatgat tactgggctc ttgaactcaa acccaagtat gcctttgtga actacgctga + 17881 tccaagcctt ggtattgaat gggaaaatat tgcagaagca gaggtttcag aagcagataa + 17941 aaatcatcca ctacttaagg atgtaaaacc tttgaaaaaa gaagatttgt aaaaaggaaa + 18001 gaatatgact gaatacaaaa atattatcgt gacaggtgga gctggcttta tcggttctaa + 18061 ctttgtccat tatgtttacg agaactttcc agatgttcat gtgacagtcc tagataagtt + 18121 gacttatgct ggaaaccgcg cgaatattga ggaaatttta ggtaatcgtg ttgagttagt + 18181 tgttggtgac attgctgatg cggagttggt agacaagttg gctgctcaag cagatgctat + 18241 cgttcattat gcagcggaaa gccacaatga taattcgctc aatgatccat cgccatttat + 18301 tcatactaac ttcatcggaa cctatactct tttagaagct gctcgtaagt atgatattcg + 18361 cttccaccat gtatcgacag atgaagttta tggggatctc cctttacgcg aagatttgcc + 18421 
aggtcatggt gaaggaccag gtgagaaatt tactgctgaa acaaaataca acccaagctc + 18481 tccgtactca tcaaccaagg cagcctcaga tttgattgtc aaagcctggg tgcgttcttt + 18541 tggagtcaag gcaacgattt ccaactgttc aaataactac ggtccttatc aacatatcga + 18601 aaaattcatc ccacgtcaga ttactaacat cctaagtgga attaagccaa aactttacgg + 18661 tgaaggtaag aatgttcgtg actggattca taccaatgac cattcttcag gagtttggac + 18721 aatcttgaca aaagggcaaa tcggtgaaac ctacttgatt ggggctgatg gtgagaagaa + 18781 caataaggaa gttttggaac ttatccttaa ggaaatggga caagctgtgg atgcctatga + 18841 tcatgtgact gaccgtgcag gacatgacct tcgctatgcg attgatgcta gcaagctccg + 18901 tgatgagttg gggtggaaac ctgaatttac caactttgaa gctgggctca aggcaacaat + 18961 caagtggtat acagataacc aagaatggtg gaaagcagaa aaagaagctg ttgaagccaa + 19021 ttatgctaag actcaggaga ttattacagt ataaaaagca ggaaatagct gctttttatt + 19081 gctatattgg gaagagttac atattagaaa ggtctagaga tgattttaat tacaggggca + 19141 aatggccaat taggaacgga acttcgctat ttattggatg aacgtaatga agaatacgtg + 19201 gcagtagatg tggctgagat ggacattacc gatgcagaaa tggttgagaa agtttttgaa + 19261 gaggtgaaac cgactttagt ctaccactgt gcagcctaca ccgctgttga tgcagcagag + 19321 gatgaaggaa gagagttgga cttcgccatc aatgtgacgg ggacaaaaaa tgtcgcaaaa + 19381 gcatctgaaa agcatggtgc aactctagtt tatatttcta cggactatgt ctttgatggt + 19441 aagaaaccag ttggacaaga gtgggaagtt gatgaccgac cagatccaca gacagaatat + 19501 ggccgtacta agcgtatggg ggaagagtta gttgagaagc atgtgtctaa tttctatatt + 19561 atccgtactg cctgggtatt tggaaattat ggcaaaaact tcgtttttac catgcaaaat + 19621 cttgcgaaaa ctcataagac tttaacagtt gtaaatgacc agtacggtcg tccgacttgg + 19681 actcgtacct tggctgagtt catgacctac ctagctgaaa atcgtaagga atttggttat + 19741 tatcatttgt caaatgatgc gacagaagac acaacatggt atgattttgc agttgaaatt + 19801 ttgaaaggta cagatgtcga agtcaagcca gtagattcca gtcaatttcc agccaaagct + 19861 aaacgtccgc taaactcaac gatgagcctg gccaaagcca aagctactgg atttgttatt + 19921 ccaacttggc aagatgcatt gcaagaattt tacaaacaag aagtgagata agtagtagaa + 19981 tgattttcta gtctaataaa agaggcagat aatgaactcc aaaggagctt aagatgtacg + 20041 
attatcttgt tgttggtgct gatctctttg gcgcatagct ttggctcagt ttctattatc + 20101 gctcacacca tccatcagaa gtttaatctg aaggtaccca attatcgcca agaagaagat + 20161 tgggctagga tgggtttacc aatcacacgt aaggaaatct ctaattggca tatcaaggca + 20221 agtcaatact atttagagtc cctttataac cttttacgag aaaagttgtt agaacaacct + 20281 cttcttcatg cggatgaaac ttcttatagg gtgctagaga gtgatagtca gctgacttac + 20341 tattggacct ttttgtctgg gaaagctgag aatcaagcaa tcacgctgta ccaccatgat + 20401 cagcgtcgga gtggtttagt agtacaagaa ttcctaggag attattctgg ctatgttcat + 20461 tgtgacatgt tgcggcagta acttaggact ttagtcctct agttctgcct atgcgatagc + 20521 agtccaaggt ttaggagcaa ggcgacgcta agcttggtaa actgcgaacc gctagaagct + 20581 tatcgtcaac tggaagaagc tgaacttgtt ggatgttggg cgcatgtgag aaggaagttt + 20641 tttgaagcga cccccaagca agcggataaa tcatcgttag gagctaaagg tttagcttat + 20701 tgtaatcagt tattttcctt ggaaagagac tgggaggctt tgccagctga tgaacgacta + 20761 cagaaacgtc aagaagagct ccaaccccta atggaagact tctttgcttg atgccggcgt + 20821 cagtcagttt tatcgggttc aaaactagga agggcaattg aatacagcct caagtataaa + 20881 gaaaccttta agactatttt gaaagacgga catctggtcc tttccaataa tctagctgaa + 20941 tgcgccatta aatcattggt tatgggacgg agtaaaagag tccagtggac tcttttagcc + 21001 taagctcagt ttaaaaaagc gagggtggtt attttctcaa aattttgaag gagctaaagc + 21061 aagagctatt attatgagtt tgttggaaac agctaaacgt catcaattaa atagcgagaa + 21121 atatctatcc tatcttctag aatgtcttcc aaacgaggaa actctcgtaa acaaagaggt + 21181 tttagaggcc tatttaccgt ggactaaagt tgtacaagaa aagtgtaaat aagaaatctc + 21241 cagattagga actatccgtg agttctctag tctggagatt tttcaatata cttcgttatt + 21301 ggacggttac gatattcata ttttttgcaa agatgttgtt tgaaaaataa ttttcaaaaa + 21361 ttctgaaaat tctgttgaca actttctgaa aagagtctat aatggagaga aagttttaaa + 21421 ggagaaaatg atgaaaagtt caaaactact tgcccttgcg ggcgtgacat tattg +// + diff --git a/public/res/serotype_genbank/serotype_23B.gb b/public/res/serotype_genbank/serotype_23B.gb new file mode 100755 index 0000000..203afea --- /dev/null +++ b/public/res/serotype_genbank/serotype_23B.gb @@ -0,0 +1,976 @@ 
+LOCUS contig_1 23047 bp DNA linear UNK 10-JUN-2024 +DEFINITION contig_1, whole genome shotgun sequence. +ACCESSION contig_1 +VERSION contig_1 +KEYWORDS . +SOURCE None + ORGANISM . + . +COMMENT Annotated with Bakta + Software: v1.9.3 + Database: v5.1, full + DOI: 10.1099/mgen.0.000685 + URL: github.com/oschwengers/bakta + + ##Genome Annotation Summary:## + Annotation Date :: 06/10/2024, 22:22:40 + CDSs :: 22 + tRNAs :: 0 + tmRNAs :: 0 + rRNAs :: 0 + ncRNAs :: 0 + regulatory ncRNAs :: 0 + CRISPR Arrays :: 0 + oriCs/oriVs :: 0 + oriTs :: 0 + gaps :: 0 + pseudogenes :: 1 +FEATURES Location/Qualifiers + source 1..23047 + /mol_type="genomic DNA" + gene complement(596..1063) + /locus_tag="ONJEBG_00005" + CDS complement(596..1063) + /db_xref="RefSeq:WP_150854890.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0005E733E7" + /db_xref="UniRef:UniRef100_UPI0005E733E7" + /db_xref="UniRef:UniRef50_UPI0005E733E7" + /db_xref="UniRef:UniRef90_UPI0005E733E7" + /product="transposase" + /locus_tag="ONJEBG_00005" + /protein_id="gnl|Bakta|ONJEBG_00005" + /translation="MKSLKEDFSVRAEKYENYQETFQGPNSFSKTDPDATFMRMKEEHM + KNSQPKAAYNLQIATENQFVLHYDVFSNPTDTKTLLPFLETYPHDLKTVVADAGYGSEE + NLLRLDEKEVNHLIKYAMFDKEQKRGYKQSAKNLANWHYNDKEDSYTHPDG" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_150854890.1" + gene complement(<1359..2144) + /locus_tag="ONJEBG_00010" + /pseudogene="unitary" + CDS complement(<1359..2144) + /note="Frameshift due to deletion around 2278." 
+ /db_xref="GO:0004803" + /db_xref="SO:0001217" + /db_xref="UniRef:UniRef50_A0A1A9BIJ2" + /db_xref="UniRef:UniRef90_T2BQK0" + /product="ISNCY family transposase" + /locus_tag="ONJEBG_00010" + /pseudogene="unitary" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + gene complement(2198..2410) + /locus_tag="ONJEBG_00015" + CDS complement(2198..2410) + /db_xref="PFAM:PF13384.10" + /db_xref="PFAM:PF13551.10" + /product="hypothetical protein" + /locus_tag="ONJEBG_00015" + /protein_id="gnl|Bakta|ONJEBG_00015" + /translation="MNETKKYLVIKAIAQGKKTKKRACVELNLSERQINRLLLAYQQKG + KKPSDTETEIENQNMQSLMKSKNVS" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + gene 2587..4032 + /locus_tag="ONJEBG_00020" + /gene="wzg" + CDS 2587..4032 + /db_xref="COG:COG1316" + /db_xref="COG:M" + /db_xref="RefSeq:WP_054362679.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0005E22D6B" + /db_xref="UniRef:UniRef100_Q4K0I5" + /db_xref="UniRef:UniRef50_G3G7D5" + /db_xref="UniRef:UniRef90_O54604" + /db_xref="UniprotKB:Q4K0I5" + /db_xref="UserProtein:wzg" + /product="""integral membrane regulatory protein Wzg""" + /locus_tag="ONJEBG_00020" + /protein_id="gnl|Bakta|ONJEBG_00020" + /translation="MSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAFR + YFNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNRLN + ATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNIDLTVNQ + SSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAPKTSK + NQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADGGNNQK + DKLTHAGIYGVDSSIHTLENLYGVDIHYYVRLNFTSFLKLIDLLGGVDVYNDQDFTSLH + GKFHFPVGNVHLDSEQALGFVRERYSLADGDHDRGRNQQKVIAAILQKLTSSEALKNYS + MIIDSLQDSIQTNMPLETMINLVNAQLESGGTYKVNSQDLKGRGRTDLPSYAMPDSNLY + MMEINDSSLASVKTAIQDVLEGR" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_054362679.1" + /gene="wzg" + gene 4034..4765 + /locus_tag="ONJEBG_00025" + /gene="wzh" + CDS 4034..4765 + 
/db_xref="RefSeq:WP_050224251.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI00024BF6A4" + /db_xref="UniRef:UniRef100_H6ULP6" + /db_xref="UniRef:UniRef90_Q9AHD4" + /db_xref="UniprotKB:Q4K0I4" + /db_xref="UserProtein:wzh" + /product="""protein-tyrosine phosphatase Wzh""" + /locus_tag="ONJEBG_00025" + /protein_id="gnl|Bakta|ONJEBG_00025" + /translation="MIDIHSHIVFDVDDGPKSREESKALLTEAYRQGVRTIVSTSHRRK + GMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLGKLEKNRIPTLNNSRY + ALIEFSMNTPYRDIHSALIKILMLGITPVIAHIERYDALENNEKRVRELINMGCYTQVN + SSHVLKSKLFGEPYKFMKKRAQYFLERDLVHVIASDMHNVDSRPPHMAEAYDLVSQKYG + ETKAQDLFIDNPRKIVMDQLI" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050224251.1" + /gene="wzh" + gene 4774..5466 + /locus_tag="ONJEBG_00030" + /gene="wzd" + CDS 4774..5466 + /db_xref="RefSeq:WP_050224252.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0000540025" + /db_xref="UniRef:UniRef100_Q4K0I3" + /db_xref="UniRef:UniRef50_Q54519" + /db_xref="UniRef:UniRef90_A0A139PG18" + /db_xref="UniprotKB:Q4K0I3" + /db_xref="UserProtein:wzd" + /product="""capsular polysaccharide biosynthesis protein + Wzd""" + /locus_tag="ONJEBG_00030" + /protein_id="gnl|Bakta|ONJEBG_00030" + /translation="MKEQNTIEIDVFQLLKTLWKHKLIILLVALVTGAGAFAYSIFIVK + PEYTSTTRIYVVNRNQENKPGLTNQDLQAGTYLVKDYHEIILSQDVLEKVATNLKLDIP + VKTLTSKVQVTVPADTRIVSISVKDKQPEEASRIANSIREVAAEKIIAVTRVSDVTTLE + EARPATTPSSPNVRRNTLVGFLGAAAVTVITVLLIELFDTRVKRPEEVEDVLQMPLLGV + VPDFNKMK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050224252.1" + /gene="wzd" + gene 5476..6165 + /locus_tag="ONJEBG_00035" + /gene="wze" + CDS 5476..6165 + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0000540026" + /db_xref="UniRef:UniRef100_Q4K0I2" + /db_xref="UniRef:UniRef50_Q54520" + /db_xref="UniRef:UniRef90_Q4K254" + /db_xref="UniprotKB:Q4K0I2" + /db_xref="UserProtein:wze" + 
/product="""tyrosine-protein kinase Wze""" + /locus_tag="ONJEBG_00035" + /protein_id="gnl|Bakta|ONJEBG_00035" + /translation="MPTLEISQAKLELAKKTEEYYNALCTNPQLSGDDLKVFSISSVKA + GEGKTTTSTNIAWAFAHAGYKTLLIDADMRNSVMSGVFKSRERITGLTEFLSGTTDLSQ + GLCDTNVENLFVIQAGSVSPNPIALLQSKNFSTMLGTLRKYFDYIVVDTAPIGIVIDAA + IIMQKCDASILVTKAGETKRRELQKAKEQLEQTGKSCLGVVLNKFDTSVDKYGFYGSYG + SYRKQKK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef100_Q4K0I2" + /gene="wze" + gene 6180..7541 + /locus_tag="ONJEBG_00040" + /gene="wchA" + CDS 6180..7541 + /db_xref="RefSeq:WP_050224254.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0000540027" + /db_xref="UniRef:UniRef100_Q4K0I1" + /db_xref="UniRef:UniRef50_Q8VU30" + /db_xref="UniRef:UniRef90_Q8VU30" + /db_xref="UniprotKB:Q4K0I1" + /db_xref="UserProtein:wchA" + /product="""undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)""" + /locus_tag="ONJEBG_00040" + /protein_id="gnl|Bakta|ONJEBG_00040" + /translation="MNEKLAKSSVAIVQSFLVILLTYLLSAVRETEIVSTTAIVLYILH + YFVFYISDYGRNFFKRRYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYFLL + LHVFLVYMLNLFIKWYWKRAYPNFKGSKKVFLLTATSHVEKVLDRLIESDDVVGELVAV + SVLDKPDFQHDDLKVVAEGEIVNFATREVVDEVFINLPSEKYNIGELVSQFETMGIDVT + VNLNAFDWARNKQICEMAGLNVVTFSTTFYKTSHVIAKRVIDIIGSLVGLILCGLVSIV + LVPLIRKDGGSAIFAQTRIGKNGRHFTFYKFRSMCVDAEDKKRELMEQNTMQGGMFKVD + DDPRITKIGHFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPEQKRRLSFKP + GITGLWQVSGRSEIKNFDEVVKLDVVYIDGWTIWKDIEILLKTVKVVLMKDGAK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050224254.1" + /gene="wchA" + gene 7573..8751 + /locus_tag="ONJEBG_00045" + /gene="wchF" + CDS 7573..8751 + /db_xref="RefSeq:WP_050224255.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0005E00146" + /db_xref="UniRef:UniRef100_A0A9P1W197" + /db_xref="UniRef:UniRef50_A0A4L8A7M3" + /db_xref="UniRef:UniRef90_A0A9P1W197" + 
/db_xref="UniprotKB:Q4K0I0" + /db_xref="UserProtein:wchF" + /product="""putative rhamnosyl transferase WchF""" + /locus_tag="ONJEBG_00045" + /protein_id="gnl|Bakta|ONJEBG_00045" + /translation="MKKSVYIIGSKGIPAKYGGFETFVEKLTEYQKDGNIQYYVACMRE + NSAKSGFTADTFEYNDAICYNIDVPNIGPARAIAYDIAAVNKAIEIAKKNKDEAPIFYI + LACRIGPFIARLKKKIQAIGGTLFVNPDGHEWLRAKWSLPVRKYWKFSEQLMVKYADLL + VCDSKNIEKYIQNDYKQYQPKTTYIAYGTDTSPSILKSEDLKIRSWYQEKGLSENGYYL + VVGRFVPENNYETMIREFIKSKSKKDFVLITNVEQNKFYDQLLQETGFDKDPRVKFVGT + VYDQELLKYIRENAFAYFHGHEVGGTNPSLLEALASTKLNLLLDVGFNREVGEDGAIYW + RKDNLHKVIEESEQKTIEEIKEIDILSTEQVEKRFTWDFIVNEYENLFLLGK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050224255.1" + /gene="wchF" + gene 9052..10239 + /locus_tag="ONJEBG_00050" + /gene="wzy" + CDS 9052..10239 + /db_xref="RefSeq:WP_050224256.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0000540029" + /db_xref="UniRef:UniRef100_Q4K0H9" + /db_xref="UniRef:UniRef50_A0A1N6LZ15" + /db_xref="UniRef:UniRef90_Q4K0H9" + /db_xref="UniprotKB:Q4K0H9" + /db_xref="UserProtein:wzy" + /product="""oligosaccharide repeat unit polymerase Wzy""" + /locus_tag="ONJEBG_00050" + /protein_id="gnl|Bakta|ONJEBG_00050" + /translation="MTIKINYMFFVCLSFFGIVLSSSQVIVNLGLSSIVQYIAYFLLLL + CIFFTLIKNSPDVIANRIAYFSIISFLFIIGINLQNLPFSTKIYLSFSMLIISSLSTLP + IKLINNINDFRRISYFLLNGILLSTFLGWLFNISLVTVAVEGIGFAYGFNGGLTHKNFY + AITILVSYILLFISRKHGTKYQVDSLVLWFDLFLLLVSNTRTIYIILVVFWIVVHSGFI + KYIKKNHRPVIITTWLVISLLSIIFFFKHIINNSESYTHRVLGIVNFFKYYESSKFHLF + FGDAELAFGDMTKGYTHNIRSVLGWDGTVEMPLLSVMIKNGYVGLIGYGVVLFKFISSV + LSMEDRRVKNIGLSILIPLLLSAMVENYIVNISFVFMPVCFCILCSIKNIEFKNN" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050224256.1" + /gene="wzy" + gene 10249..11217 + /locus_tag="ONJEBG_00055" + /gene="wchV" + CDS 10249..11217 + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000054002A" + 
/db_xref="UniRef:UniRef100_Q4K0H8" + /db_xref="UniRef:UniRef50_O85000" + /db_xref="UniRef:UniRef90_A0A1A9BJG7" + /db_xref="UniprotKB:Q4K0H8" + /db_xref="UserProtein:wchV" + /product="""putative glycosyl transferase""" + /locus_tag="ONJEBG_00055" + /protein_id="gnl|Bakta|ONJEBG_00055" + /translation="MKKVSIILPVYNVEQYIKKCLESIQQQTYPNLEVIIVNDGATDKS + VEYCEQICKIDSRFSVTHKENGGLSDARNVGIDKAKGDYLIFVDSDDFVSQDMVSYLVS + SMENNEADIAICDPAHYYSDRQNNDLNIFYPASSVKVYEKTEALCEMFYQKSFLVSAWA + KIYKKELFDDIRFPVGKLFEDSAVMYLLFEKCEKIVYSNAKLYAYVHRDNSITTKKFSD + KDLDILDISNTILDHYSGNFRVYKAAVSYKVSACFRILLNSSSEKKYNQIQKDCMTYIL + RNWRNMLFDKNVRLKNKLALISITLFNPFVKFIYSKVNRWE" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef100_Q4K0H8" + /gene="wchV" + gene 11224..12462 + /locus_tag="ONJEBG_00060" + /gene="wchW" + CDS 11224..12462 + /db_xref="RefSeq:WP_050224258.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000054002B" + /db_xref="UniRef:UniRef100_Q4K0H7" + /db_xref="UniRef:UniRef50_Q9R924" + /db_xref="UniRef:UniRef90_Q4K0H7" + /db_xref="UniprotKB:Q4K0H7" + /db_xref="UserProtein:wchW" + /product="""putative transferase""" + /locus_tag="ONJEBG_00060" + /protein_id="gnl|Bakta|ONJEBG_00060" + /translation="MNKYEERYQEDLSKNDFEKLINRRYLSDKELQVEYVKKGTVLPPK + VFEMKLSNKLGLQKALHGKGGVVDSKGNYVELSEQKAVGMRNRVYGSYKFNHKNLAIRN + EKVIYLNYFINQWGHFLLDVVGRLWYPLLKDTDTKLDYTCYAGTETKLEGNYLEFLELL + GIDKSRLILINRPTQFSEIIIPESSILPGEYYTKEYKMLFNSLVANVKLDNNLESKKIY + CSRARLDLAKGKEFGENGIEKVFLKNGYTPVYMETMSLKEQIRTLLSATTIVLTSGSLA + HNLLFINNKINVFILNKTYRVNLHQFLINKISEASVSFVDIYRSPLPILYGYGPFLMDI + TKPLVNFFEDSGFTYDSGTILDKTDYFKFYLKWLWSYKFFLFRLNHIKEGNSEFEKSFK + IIRRYYKMGRQYE" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050224258.1" + /gene="wchW" + gene 12455..13843 + /locus_tag="ONJEBG_00065" + /gene="wzx" + CDS 12455..13843 + /db_xref="RefSeq:WP_050224259.1" + 
/db_xref="SO:0001217" + /db_xref="UniParc:UPI000054002C" + /db_xref="UniRef:UniRef100_Q4K0H6" + /db_xref="UniRef:UniRef50_Q9R923" + /db_xref="UniRef:UniRef90_A0A1A9BIK6" + /db_xref="UniprotKB:Q4K0H6" + /db_xref="UserProtein:wzx" + /product="""flippase Wzx""" + /locus_tag="ONJEBG_00065" + /protein_id="gnl|Bakta|ONJEBG_00065" + /translation="MSKYKELAKNTGTFALANFSSKILIFLLVPIYTKVLTTTEYGFYD + LVYTTIQLLVPILTLNISEAVMRFLMKEDVSKKSVFSIAILDIFLGSIIFCLLLLVNQI + FSLSELISQYSIYIMAIFAFYTLNNFLIQYSKGIDKIGVTAISGVISAAVMLSMNILLL + VVLNWGLLGFFIANICGYVIPCVYIIVKLKLWDLFELKIDRSLQWEMIYYTLPLILNTL + SWWVNNTSDRYIITVIIGIQASAIISVAYKIPQIFSTISAIFIQSWQISAIKIQEEKEG + NTFISKMLLYYNALLLIIASGIILFVKPISNILFGASFYSAWTLVPFLIISSLFNAISG + YIGAIMGAKMDTKNIAKSALVGMIANVFLNIVLTFLMGLQGITISTMIASFLIFYMRKD + SVEEIAPETYRAIYLSWFLLVVEASLLVYIDFIIGATLVTLINLFLLKDTLKPLCLKLL + KGFK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050224259.1" + /gene="wzx" + gene 13840..14994 + /locus_tag="ONJEBG_00070" + /gene="wchX" + CDS 13840..14994 + /db_xref="RefSeq:WP_225345905.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000054002D" + /db_xref="UniRef:UniRef100_Q4K0H5" + /db_xref="UniRef:UniRef50_Q9R922" + /db_xref="UniRef:UniRef90_Q9R922" + /db_xref="UniprotKB:Q4K0H5" + /db_xref="UserProtein:wchX" + /product="""putative glycerol phosphotransferase""" + /locus_tag="ONJEBG_00070" + /protein_id="gnl|Bakta|ONJEBG_00070" + /translation="MKMNILQYIKILARTIFMLLISTVLLPVRLKNNKILFINFNGKGY + GDNPKSICEYLRTTYPDLDLVWLARDNEGFPDGVRVVKYGTFQAFYEQASSKVWVYNVR + AFARILKKRGQIYIQTWHGASSFKLIEKQADLPINYVLEAKYDARVTDIMISDSRKQTE + EFQKYFWYSGEIFEVGMPRNDALFHYKEDYDKLNNIRKELSIHSDDYVILYAPTFRDDG + DASYLDINFERLLQCVEHGIKKKCKFLIRLHPNHSHLCNNISFNKNIINATFYSDMQEL + TLLADVLVTDYSSSIFDFMLLNKPYVRYVNDLEKYAELRGVSDTYYELPDSIIKTAEEL + YDLLPKKIENFDYDSIKKYRNEILCPIFNGTASENVGRRIIQEL" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA 
sequence:RefSeq:WP_225345905.1" + /gene="wchX" + gene 15030..16058 + /locus_tag="ONJEBG_00075" + /gene="gtp1" + CDS 15030..16058 + /db_xref="RefSeq:WP_000794266.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI00000B58FF" + /db_xref="UniRef:UniRef100_Q9R921" + /db_xref="UniRef:UniRef50_Q9R921" + /db_xref="UniRef:UniRef90_Q9R921" + /db_xref="UniprotKB:Q9R921" + /db_xref="UserProtein:gtp1" + /product="""putative glycerol-2-phosphate dehydrogenase""" + /locus_tag="ONJEBG_00075" + /protein_id="gnl|Bakta|ONJEBG_00075" + /translation="MKNNDLKIGSGAIHQISATLSQNSISGKILYCADPVVDDLYGSIV + RSQIEEIGRVKEESCNYNTIAYAMNIAERAIATDIDCIVGMGGGRVLDVCKYASFISKR + PYLSIPTTAANDGIASPVAVLKRQDDRPKSLGAAIPSMTLIDIDVIASGPIQNIKAGIG + DTISNYTALKDWELAVERGKDEMHGFAYLMSQNSLDALMKTKYNSITPDFIEVLVNSLV + LSGIAMDFAGSSRPVSGSEHLFSHALDYYGSTRNLHGIQVALGTVAVLKLIENSVDTVV + DYLQRFEVHINPKLLGIDEELFIYCMQHATKMRSNRYTYLHEVDLSTDRLKQIYKELIS + EL" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000794266.1" + /gene="gtp1" + gene 16074..16778 + /locus_tag="ONJEBG_00080" + /gene="gtp2" + CDS 16074..16778 + /db_xref="RefSeq:WP_000645462.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI00000B4F25" + /db_xref="UniRef:UniRef100_O85005" + /db_xref="UniRef:UniRef50_O85005" + /db_xref="UniRef:UniRef90_O85005" + /db_xref="UniprotKB:O85005" + /db_xref="UserProtein:gtp2" + /product="""putative nucleotidyl transferase""" + /locus_tag="ONJEBG_00080" + /protein_id="gnl|Bakta|ONJEBG_00080" + /translation="MKALILAAGLGTRLAPITNEVPKSLVPVNGKPILMKQIENLYQNN + ITDITIIAGYKSSVLTDAVTEKYPEINIIDNVDFKTTNNMYSAYLGKAAMGDSDFLMMN + ADVFYDASVIKSLLLHKAPNAIVTDLGIYIEESMKVVEKNGRLVEISKQISPEETLGAS + IDVYKFSYEAGARFFEKCKEFIEDKRELQMWSEVALNAILSEVEFVACPLEGRWLEIDN + HEDLVAAEKLFA" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000645462.1" + /gene="gtp2" + gene 16799..17626 + /locus_tag="ONJEBG_00085" + 
/gene="gtp3" + CDS 16799..17626 + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000152F48C" + /db_xref="UniRef:UniRef100_A0A9P1PND2" + /db_xref="UniRef:UniRef50_Q4K1N0" + /db_xref="UniRef:UniRef90_Q4K1N0" + /db_xref="UniprotKB:Q4K015" + /db_xref="UserProtein:gtp3" + /product="""putative phosphotransferase""" + /locus_tag="ONJEBG_00085" + /protein_id="gnl|Bakta|ONJEBG_00085" + /translation="MTNRVDYFGADISELQNKKLFLFDMDGTIYEEDRLFEGTLELLDY + IHNIGGEYIFITNNSSKSVVDYVEKVNRLGIKAERDNFFTSAQATIVYIKENYPKSKVY + CQGTKSLIKELSDAGIDVTEQVSADIDVVLVGFDTELTSDKIRNTCEILSTKDVPFIAT + NPDIRCPVSFGFIPDCGSICDMISKSVDRKPVYIGKPEPTMVDIVRKKLNYSLFETVVI + GDRLYTDIMTGINAGVTSVCVLTGEATVNDIQQDSIKPTYTFKNVKEMWKGIV" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA + sequence:UniRef:UniRef100_A0A9P1PND2" + /gene="gtp3" + gene 17786..18655 + /locus_tag="ONJEBG_00090" + /gene="rmlA" + CDS 17786..18655 + /db_xref="EC:2.7.7.24" + /db_xref="GO:0008879" + /db_xref="GO:0009243" + /db_xref="GO:0019305" + /db_xref="RefSeq:WP_054362680.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000054002F" + /db_xref="UniRef:UniRef100_Q4K0H1" + /db_xref="UniRef:UniRef50_A0A366WAT5" + /db_xref="UniRef:UniRef90_Q4K105" + /db_xref="UniprotKB:Q4K0H1" + /db_xref="UserProtein:rmlA" + /product="""glucose-1-phosphate thymidylyltransferase + RmlA""" + /locus_tag="ONJEBG_00090" + /protein_id="gnl|Bakta|ONJEBG_00090" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLAG + IRDILIISTPQDLPRFKELLQDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFIGDDSVAL + ILGDNIYHGPGLSTMLQKAAKKEKGATVFGYHVKDPERFGVVEFDENMNAISIEEKPEY + PRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVELMGRGFAWL + DTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLALAQPLKKNEYGQY + LLRLIGEA" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_054362680.1" + /gene="rmlA" + gene 18656..19249 + /locus_tag="ONJEBG_00095" + /gene="rmlC" + CDS 18656..19249 + 
/db_xref="RefSeq:WP_000131458.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI00000B9010" + /db_xref="UniRef:UniRef100_Q8RSE9" + /db_xref="UniRef:UniRef50_Q5XCG7" + /db_xref="UniRef:UniRef90_A0A1S0ZBJ9" + /db_xref="UniprotKB:Q9AHA9" + /db_xref="UserProtein:rmlC" + /product="""dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC""" + /locus_tag="ONJEBG_00095" + /protein_id="gnl|Bakta|ONJEBG_00095" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEKM + LPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREGET + FGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYADPS + LGIEWENIAEAEVSEADKNHPLLKDVKPLKKEDL" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000131458.1" + /gene="rmlC" + gene 19262..20311 + /locus_tag="ONJEBG_00100" + /gene="rmlB" + CDS 19262..20311 + /db_xref="COG:COG1088" + /db_xref="COG:M" + /db_xref="EC:4.2.1.46" + /db_xref="GO:0008460" + /db_xref="GO:0009243" + /db_xref="GO:0019305" + /db_xref="RefSeq:WP_000141508.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FF5F" + /db_xref="UniRef:UniRef100_Q4K121" + /db_xref="UniRef:UniRef50_P95780" + /db_xref="UniRef:UniRef90_F3UAC1" + /db_xref="UniprotKB:Q4K121" + /db_xref="UserProtein:rmlB" + /product="""dTDP-D-glucose 4,6-dehydratase RmlB""" + /locus_tag="ONJEBG_00100" + /protein_id="gnl|Bakta|ONJEBG_00100" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPGVHVTVLDKLTYAGNR + ANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTNFI + GTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSPYSS + TKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLYGEGK + NVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQATDAYDHV + TDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKEAVEANY + AKTQEIITV" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000141508.1" + /gene="rmlB" + gene 20377..21228 + /locus_tag="ONJEBG_00105" + /gene="rmlD" + 
CDS 20377..21228 + /db_xref="COG:COG1091" + /db_xref="COG:M" + /db_xref="EC:1.1.1.133" + /db_xref="GO:0008831" + /db_xref="GO:0009243" + /db_xref="GO:0019305" + /db_xref="KEGG:K00067" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0000540030" + /db_xref="UniRef:UniRef100_Q4K0G8" + /db_xref="UniRef:UniRef50_Q9AH81" + /db_xref="UniRef:UniRef90_Q9AH81" + /db_xref="UniprotKB:Q4K0G8" + /db_xref="UserProtein:rmlD" + /product="""dTDP-4-keto-L-rhamnose reductase RmlD""" + /locus_tag="ONJEBG_00105" + /protein_id="gnl|Bakta|ONJEBG_00105" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITNEEMVEKV + FEEVKPTLVYHCAAYTAVDAAEDEGKELNFAINVTGTKNVAKASEKHGATLVYISTDYV + FDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKNFVF + TMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDTTWYD + FAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQEFYKQE + VR" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef100_Q4K0G8" + /gene="rmlD" + gene 21313..21738 + /locus_tag="ONJEBG_00110" + CDS 21313..21738 + /db_xref="SO:0001217" + /db_xref="UniRef:UniRef50_A0A0H2ZN29" + /db_xref="UniRef:UniRef90_A0A1A9BIN6" + /product="Transposase" + /locus_tag="ONJEBG_00110" + /protein_id="gnl|Bakta|ONJEBG_00110" + /translation="MLVSLAHSFGSVSIIAHIIHQKINLKVPNYRQEEDWARMGLPITR + KEISNWHIKASQYYLESLYNLLREKLLEQPLLHADETSYRVLESDSHLTYYWTFLSGKA + ENQAITLYHHDQRRSGLVVQEFLGDYSGYVHCDMLRQ" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA + sequence:UniRef:UniRef90_A0A1A9BIN6" +ORIGIN + 1 cgaccgtcgc ttcctagttg tggctaactt atccaatgat aaacaaaact tttcagtaga + 61 tggaaaagtt agatctgtct tgattgaaaa cactgcggct aaagaagtac ttgaaaaaca + 121 ggtcttgact ccatgggatg ctttctgtgt ggaaatgact gactagaatg agcaagagcc + 181 tgggacaaaa tagttctcga ccacaaaaaa gctagagatt tccaattgtg gaactctagc + 241 tttttaattt tgagtcattc tcttattgta ttttaggagg ttattggcca taagtaccaa + 301 tcccatgtca attctcactt gacgcttgcc 
cctcagatta catctcttgt aacccaaaca + 361 agcctttatc tgcccaaaga caggttccac atcaatcttg cgttgagcga aaatctgtct + 421 accttgggga gataaaagcg cctgacattc tttagctttc aagttttgat agccttcgtt + 481 catatacagt ccccttttga ggggctgatt caggttcgtc gacgtagtaa accttgattt + 541 cttgttgaaa gtctgtctgt gttttctgat gtttggtatg gtgaaaacga taatactagc + 601 catcaggatg tgtatagcta tcctccttgt cattatagtg ccaattcgct aagtttttag + 661 ctgactgttt atagcctctc ttctgttcct tatcaaacat ggcatattta atcagatggt + 721 ttacctcctt ttcatctaaa cgaaggaggt tctcttcact tccatatcca gcatctgcga + 781 caactgtctt caagtcatgc ggataggttt caaggaatgg cagaagagtc ttggtatctg + 841 tcggatttga aaagacatca tagtgaagaa caaattggtt ttccgtagcg atttgaagat + 901 tataagcagc cttgggttga ctatttttca tatgttcttc cttcatccgc ataaaagtgg + 961 catctggatc ggttttggaa aaactgttag gcccttgaaa tgtctcctga tagttctcat + 1021 atttttcagc acgtactgaa aaatcctcct ttaaactctt cataatcctt tttattttta + 1081 tgaagatatt gtttgaaaga tgtgagtttc cacggatggg tttgtggagg gatatacttg + 1141 cgtctttctt tttttgttct ggttcttgtt caaggttttt cgaatagagt tcatgattta + 1201 gtagctcctt tgtgtgatag attttgtcag cgatattgag gtagatgtca ccatcaaatg + 1261 cttttataac taatgctttt gtctttctga tgaaatagac ttcttttcct tgctcggtag + 1321 ggatatagca acgattttgg aatcggatat ggtgtccact atcgacgact ctctcccgcc + 1381 agtttagcta gaatgagatt tcgttcagag ggcttaggag cctcctcaaa gacagagagt + 1441 tttgtcttgt ttccaaactg ttcattaaag gtttggatat aggaaggcag aaaggtattg + 1501 gcttcttcca aggtatgaat cttgtttcgt tccagttcga taggcaggag agattgtagt + 1561 atctgattga gtctttcgac tctcccttta gcttgaggga tagaggttgt ctcaaggaga + 1621 attcccagtt ggtgacaggc gtatccaaat tgtgtatggg tgtcgtcctc cattttctta + 1681 gagttggagg cttgataggt aaaaacagtt ctcttatctg ttttgatttg aacaggaatg + 1741 ccgtggttgg ctaagatttg ttcgaggaca tgatagtaag cattcaaggt ctcttgtttg + 1801 tcaaaataag cgcctaggat attgccagaa gcatcatcaa tggctaggtg taagttagag + 1861 gtttctgctc caaaccaggc atgagggctg gcatccattt ggatgagttc tccagcaaat + 1921 ttctttctgg gtctactagg atgtaccttt ttagggtctt ccaggaagtt ttcagccgtc + 1981 
ggtaagattg gattgtctag gggttgcttg gggttcagtt tagcttgctt tcttactctc + 2041 ctctttgtct ttctatggga cttaggcgac aggatatttt tcttatagag tatttttcta + 2101 acagtagtat cagagagctg aattccttct tcttcagcta gcaattcaca gaaatgacgg + 2161 acatttggtt tatatgtttc ataggagagg tatttcttta ggatacgttc tttgatttca + 2221 tcagggattg catgttttgg ttttcgattt ctgtttccgt gtctgaaggc ttctttcctt + 2281 tctgttgata ggctagtagc agacgattga tttgcctttc agaaagattg agctcgacac + 2341 aggctcgttt ctttgttttc tttccttggg ctatagcttt tatcacaaga tattttttcg + 2401 tttcattcat attcagttgg atcctttaca tatgactatt ctaccaaatg ggacattttt + 2461 acgttcgatt tactaaagac attatcacat tcgaattaca caagatgcag atagtgaaaa + 2521 aaaggtgtag acattaccgt aaaaaagtga tataattgta agatgttcaa tgtataggtg + 2581 ttaatcatga gtagacgttt taaaaaatca ggttcacaga aagtgaagcg aagtgttaat + 2641 atagttttgt tgactattta tttattgtta gtttgttttt tattgttctt aatctttaag + 2701 tacaatatcc ttgcttttag atattttaat ctagtggtaa ctgcgttagt cctactagtt + 2761 gccttggtag ggctactctt gattatctat aaaaaagctg aaaagtttac tatttttctg + 2821 ttggtgttct ctatccttgt cagctctgtg tcgctctttg cagtacagca gtttgttgga + 2881 ctgaccaatc gtttaaatgc gacttctaat tactcagaat attcaatcag tgtcgctgtt + 2941 ttagcagata gtgatatcga aaatgttacg caactgacga gtgtgacagc accgactggg + 3001 actgataatg aaaatattca aaaactacta gctgatatca aatcaagtca gaatatcgat + 3061 ttgacggtca atcaaagttc gtcttacttg gcagcttaca agagtttgat tgcaggagag + 3121 actaaggcca ttgtcttaaa tagtgtcttt gaaaatatca tcgaatcgga gtatccagat + 3181 tacgcatcga agataaaaaa gatttatacc aagggattca ctaaaaaagt agaagctcct + 3241 aagacgtcta agaatcagtc tttcaatatc tatgttagtg gaattgatac ttatggtccg + 3301 attagttcgg tgtcgcgttc agatgtcaat atcctgatga ctgtcaatcg agataccaag + 3361 aaaattctct tgaccacaac gccacgtgat gcttatgtac caatcgcaga tggtgggaat + 3421 aatcaaaaag ataaattgac ccatgcgggc atctatggag ttgattcgtc cattcacacc + 3481 ttagaaaatc tctatggagt ggatatccat tactatgtcc gtttgaactt cacttctttc + 3541 ttgaaattga tcgatttgtt gggtggggta gatgtttata atgaccaaga tttcacatct + 3601 ctacacggga agttccattt 
cccagttgga aatgtccact tagattctga gcaggctctg + 3661 ggatttgttc gtgagcgcta ttccctagcg gatggtgatc atgaccgcgg gcgcaatcaa + 3721 caaaaggtga ttgcggctat ccttcaaaaa ttaacttcga gcgaagcgct gaaaaattat + 3781 agtatgatca ttgatagctt gcaagattct atccaaacaa acatgcccct tgagaccatg + 3841 ataaacttgg tcaatgctca gttagaaagt ggtggaacgt acaaagtaaa ttcgcaagac + 3901 ttgaagggta ggggacggac ggatcttcct tcctatgcga tgccagatag taacctctat + 3961 atgatggaaa ttaacgacag tagccttgca tctgtcaaaa ctgctattca ggatgtgttg + 4021 gagggcagat gaaatgattg atattcattc gcacattgtc tttgatgtag atgatggtcc + 4081 caagtcaaga gaggaaagta aggctctctt gacagaagcc tacaggcagg gggtgcgaac + 4141 cattgtctct acctctcacc gtcgcaaggg catgtttgaa actccagaag agaagatagc + 4201 agaaaacttt cttcaggttc gggaaatagc taaggaagtc gcgagtgact tggtcattgc + 4261 ttatggggcc gaaatttact acacaccaga tgttttgggt aagctggaaa aaaatcggat + 4321 tccgaccctc aataatagtc gttatgcctt gatagagttt agtatgaaca ccccttatcg + 4381 cgatattcat agtgccttga ttaaaatatt gatgttggga attactccag tcattgccca + 4441 catcgagcgc tatgatgctc ttgaaaataa tgaaaaacgc gttcgagagc tgattaatat + 4501 gggctgttac acgcaagtaa atagttcaca tgtcctcaaa tccaaacttt ttggagaacc + 4561 ttataaattc atgaaaaaaa gagctcagta tttcttggag cgtgatttgg ttcatgtgat + 4621 tgcaagtgat atgcataatg tggacagcag acctccccat atggcagaag catatgacct + 4681 tgtttcccaa aaatacggag aaacgaaggc tcaggacctt tttatagaca atcctcgaaa + 4741 aattgtaatg gatcaactaa tttaggagaa ataatgaaag aacaaaacac gatagaaatc + 4801 gatgtatttc aattacttaa aaccttgtgg aaacacaagc taatcatttt attagtggca + 4861 cttgtgacag gggcgggagc ttttgcatat agcattttta ttgttaagcc agaatataca + 4921 agcaccacgc gtatttacgt agtcaatcgt aatcaagaaa ataagccggg actgacgaat + 4981 caggacttgc aggcaggaac ttatctggta aaagactacc acgaaattat cctttcgcaa + 5041 gatgtattgg aaaaggtagc gacaaatttg aaattggata ttccagtaaa aacgttaact + 5101 agcaaagtgc aagtgactgt accagccgac actcgtatcg tctcaatctc tgtcaaggat + 5161 aaacaaccag aggaagccag tcgcattgct aattctatac gagaagttgc tgcagaaaag + 5221 atcatcgctg taacgcgagt atctgatgta acgacgcttg 
aagaagcgcg accagctacg + 5281 actccctctt ctccaaatgt tcgacgcaac accttagttg gttttcttgg agccgccgcc + 5341 gtaacagtaa ttactgttct tttgattgag ttgttcgata cccgtgtaaa acgtcctgaa + 5401 gaagttgaag atgtactgca aatgccactt ctaggagtcg ttccagattt taataaaatg + 5461 aaataggagg aagttatgcc aacgttagaa atctcacagg cgaaattaga acttgcgaaa + 5521 aagacagagg aatattataa tgctttgtgc acgaacccac agttaagtgg agatgatttg + 5581 aaagtatttt ctatcagttc tgtgaaagca ggagaaggaa aaacaacgac ttccaccaat + 5641 atcgcttggg cttttgcgca tgcaggttac aaaacgctgc tgattgatgc agacatgcgt + 5701 aactccgtta tgtcaggtgt ctttaaatca agggaaagga ttactgggct aacagaattt + 5761 ctatcaggga caacagacct gtcacagggg ctttgcgata ccaatgttga gaatctcttt + 5821 gtgattcagg ctggctctgt gtcaccaaat ccgatagccc ttcttcaaag taagaatttc + 5881 agtacaatgc ttggaacctt gcgtaaatat tttgactata tcgtcgtaga cactgctcct + 5941 atcggtatcg tgattgatgc ggctatcatt atgcagaaat gtgatgcttc tattttagtg + 6001 acgaaggcag gtgaaacaaa acgacgggaa cttcaaaaag cgaaagaaca gttggaacaa + 6061 actgggaagt cgtgtttagg agttgtgttg aataaattcg atacttcagt agacaaatac + 6121 ggtttttatg ggagttatgg gagttacagg aaacagaaaa aataggttga gggatagaga + 6181 tgaatgaaaa actagcaaag tcttcagtag ctatagtcca gagttttctt gttattttat + 6241 tgacttatct acttagcgct gtgagagaaa cagagattgt ttcaacaaca gctattgtac + 6301 tttatatcct ccactatttt gtcttttata tcagtgatta tggacggaat ttctttaaaa + 6361 ggagatattt gattgaactt gtccagacat tgaaatatat cctattcttt gcgctagcga + 6421 ttagtatttc taattttttc ttagaggatc gatttagtat ttccagacga ggcatgattt + 6481 acttcctcct attacatgtt ttcttagtct atatgctaaa cctatttatc aagtggtatt + 6541 ggaagcgggc ttatcccaac tttaaaggaa gtaagaaggt tttcctactt acagcaactt + 6601 ctcatgtcga aaaggtactg gatagactaa tagaatcaga tgatgttgtt ggggagttgg + 6661 tagccgtcag tgttttagat aaaccagatt ttcagcatga tgatttaaag gttgtagcag + 6721 agggggagat cgtaaacttt gcgactcgtg aggtggtcga tgaagtcttt atcaatcttc + 6781 caagtgaaaa atacaatatt ggagagcttg tctctcagtt tgaaacgatg ggaattgatg + 6841 taacagtcaa tctaaatgct ttcgattggg cacgtaacaa gcaaatttgt gagatggcag + 6901 
gactaaatgt tgtgactttt tctacaacat tttataagac tagccatgtg attgctaagc + 6961 gggttattga tattatcggt tccctggtag gtttgatact atgtggtcta gtcagtattg + 7021 tgctggttcc tttgattcga aaggatgggg gctctgctat ttttgctcag acgcgtatag + 7081 gaaaaaatgg ccgccatttc actttttaca agtttcgctc tatgtgtgta gatgctgagg + 7141 ataaaaagag agaactcatg gaacaaaata ccatgcaggg tggaatgttt aaggtggacg + 7201 atgatcctcg tatcacgaaa attggtcatt ttatacggaa gacgagcttg gacgagctac + 7261 cacagtttta taatgttcta aagggagata tgagtttggt aggtacacga ccaccaacag + 7321 tggacgagta tgaacactat accccagaac aaaaacgtcg gctaagtttt aaacctggta + 7381 taacaggctt atggcaggtc agtggacgaa gtgaaatcaa aaatttcgat gaagttgtca + 7441 aattagatgt ggtctatatt gatggttgga caatctggaa agatattgaa attttattga + 7501 agacagttaa agttgtattg atgaaggatg gagcgaaata gtttgctttt gtttcagact + 7561 attaggagaa aaatgaagaa gtcagtttat atcattggtt caaaagggat tcccgctaag + 7621 tatgggggct ttgaaacctt tgttgagaaa ttaacagaat atcaaaaaga tggtaacatc + 7681 caatactatg ttgcctgcat gcgcgaaaat tctgcaaaat caggatttac agcagataca + 7741 tttgagtaca atgatgctat ttgttacaac attgatgtgc ctaatattgg tcctgctaga + 7801 gccattgctt atgatattgc tgctgtgaat aaagcgattg aaatagctaa gaaaaacaaa + 7861 gatgaagctc ctatttttta cattctagct tgtcgtatcg ggccttttat agctagactt + 7921 aagaaaaaga ttcaagctat cggaggtact ctgtttgtca atccagatgg acatgagtgg + 7981 cttcgggcta aatggagcct gccggttcga aagtattgga aattttcgga acagttgatg + 8041 gtcaaatatg cagatttatt ggtctgtgat agcaaaaata ttgaaaaata tatccagaat + 8101 gactataagc aatatcaacc aaagacgact tatattgctt acgggacgga tacaagtccg + 8161 tctatcctga aatccgaaga tctaaaaatt cgtagttggt atcaggaaaa aggacttagc + 8221 gaaaatggct attatctagt ggtgggacga ttcgtccctg aaaacaacta cgaaaccatg + 8281 attcgtgaat ttatcaaatc taagtccaag aaggactttg tcctcatcac aaatgtggag + 8341 cagaataaat tttacgacca gttgttacag gagactggtt ttgacaaaga tcctagggtt + 8401 aaatttgtag gtactgtcta tgaccaagaa ttgcttaagt acattcgtga aaatgctttt + 8461 gcctatttcc atgggcatga ggttggaggg accaaccctt ctctactaga agctctagca + 8521 tccacaaaac tgaatttgtt 
gctagatgtt ggttttaacc gtgaggttgg tgaagacggg + 8581 gctatttatt ggagaaaaga taatcttcat aaggttattg aagagagtga acaaaaaaca + 8641 atagaagaaa taaaagaaat agatattcta tctacagagc aggtagaaaa aagatttact + 8701 tgggatttta ttgttaatga atatgaaaat ttatttttac tagggaaata attatctaag + 8761 ttacaaggat tttatttgag gaagctttga tggaagttca tcactttctt agacaattat + 8821 ctaaataact tatgttattc atgaagtttt taaaatgata gatattctcc ctttttgcaa + 8881 agatactaaa attatagaga ggaaatatgc ccagtagttg atagtgtttt tgggtagggt + 8941 taaacgacat agttttaaga caaactggtg gagatttaag aaataagtag ttcttattaa + 9001 atcaaaaacg tgttcttatt ctatattgtc atttagtcaa aggtatcaag tatgactatt + 9061 aaaattaatt atatgttttt tgtttgtctc tcttttttcg gtatagtttt aagtagttca + 9121 caggtaatag tgaatctggg tttgtccagt atagttcagt atatagctta ttttttattg + 9181 ttgctatgta tattttttac cttaattaaa aatagtccgg atgtaatcgc taatagaatt + 9241 gcttattttt ctattatttc atttttgttt atcataggga ttaatttaca aaatcttcct + 9301 ttctcaacaa agatttattt atcgttttcc atgcttatta tttctagtct atcgacttta + 9361 ccgattaaat taataaataa tataaatgat tttagaagaa tatcctattt tttattaaat + 9421 ggcatcctat tatcaacatt tttaggttgg ctatttaata tttcattagt aactgttgct + 9481 gttgagggga ttggttttgc atatggattt aatggtgggt tgacgcataa gaatttttat + 9541 gcaattacaa ttttagtttc ctatatccta ttgtttatta gtagaaaaca tggtacgaag + 9601 taccaagttg atagcttagt attatggttt gatctttttt tacttttagt atctaacaca + 9661 cggacaatat atataatatt agttgttttt tggatcgttg ttcatagcgg atttattaaa + 9721 tatataaaga aaaatcacag accagtaatt ataacgacat ggttagtaat ttctttatta + 9781 tctataatat tttttttcaa acacattata aataatagtg aatcctatac tcatcgtgtt + 9841 ttgggtattg ttaatttttt taaatactac gaatctagca aatttcattt attttttggt + 9901 gatgctgagt tagcctttgg tgatatgacg aaaggttata ctcacaatat aagaagtgtt + 9961 ttaggttggg atggaactgt ggaaatgccg ttgctaagtg ttatgataaa aaatggttat + 10021 gtcggcttaa tagggtatgg agtagtctta tttaaattta tatcctctgt attatctatg + 10081 gaagatagaa gagtaaaaaa tattggctta tccattctaa tacctctact tctatcagca + 10141 atggttgaaa attatatcgt taatattagc tttgtattca 
tgccggtctg tttttgtatt + 10201 ttatgctcaa taaaaaatat agaatttaaa aataattgaa agtgatttat gaaaaaagta + 10261 agtattattc tacctgtcta caatgttgaa cagtatataa aaaaatgctt agaatcaatt + 10321 caacaacaaa cttatccaaa tttggaagta atcattgtta atgacggagc aaccgataaa + 10381 agcgttgaat actgtgagca aatttgtaag atagattcta ggttttctgt cactcacaaa + 10441 gaaaatggtg gactttccga tgcaagaaat gtcggtatag ataaagccaa gggagattac + 10501 ctcatttttg ttgacagtga tgattttgtc tctcaagata tggtatctta tttagtatct + 10561 agtatggaga acaatgaggc agacattgct atttgcgatc ctgctcatta ttatagtgac + 10621 cgtcaaaaca atgatcttaa tattttttat ccggcatcaa gcgttaaggt ttacgaaaaa + 10681 acggaagctc tatgtgagat gttttatcaa aaatcttttt tggtatctgc ttgggctaag + 10741 atatataaaa aggaactatt tgatgatatc agattccctg ttgggaagtt atttgaagat + 10801 agtgctgtta tgtatctgct ttttgaaaaa tgtgaaaaga tagtatattc taatgcgaaa + 10861 ttatatgcct atgtgcatag agacaatagt attacaacaa agaagttttc agataaagat + 10921 ttagatattt tagacatttc aaatactatt cttgatcact atagtgggaa ctttagagtt + 10981 tataaagcgg cagtttccta taaagtttcg gcatgtttta gaattttgtt gaactcatct + 11041 tcagaaaaaa aatataatca aatacaaaaa gattgtatga catatatttt acgaaattgg + 11101 agaaatatgt tatttgataa aaatgtccga ttaaagaaca agcttgcctt gatttctata + 11161 actcttttca atccttttgt taaatttatc tatagcaaag taaacagatg ggaataatag + 11221 caaatgaaca aatatgaaga aagatatcag gaagatttat ctaagaatga ttttgagaaa + 11281 ctaatcaata gaagatacct atcggataaa gaactacaag ttgaatatgt aaaaaaagga + 11341 acagtgttac ctcccaaggt ctttgaaatg aaactatcaa ataaacttgg tctacaaaaa + 11401 gctttgcatg ggaaaggtgg tgttgtagat tcaaagggga attatgttga actttctgaa + 11461 caaaaagcag ttgggatgag aaatcgagtc tatggatctt acaaatttaa ccataaaaat + 11521 ttggctatca gaaatgaaaa agttatttac ctaaactatt tcataaatca gtggggacat + 11581 tttttactag atgttgtggg gagattatgg tatccattac taaaagatac tgatactaaa + 11641 ctggattaca catgttatgc tggtacagaa acgaaacttg aaggaaacta tttagagttt + 11701 ttagaactcc tcggtataga taaatcacgc ttaattttga taaatcgccc aactcaattc + 11761 tcagagataa ttatacctga aagttcaatt ctgccaggtg 
aatattatac aaaagaatat + 11821 aaaatgcttt ttaattcttt agtagcaaat gttaaattag ataacaattt agaatcaaaa + 11881 aaaatttatt gttcacgagc taggctagat ttagcaaaag gtaaagagtt cggtgagaat + 11941 ggtattgaaa aggtcttctt aaaaaacggt tatactccag tttatatgga aacaatgtct + 12001 ttgaaagaac aaataagaac gctattatca gctacaacaa tagtattaac tagcggttcg + 12061 ttggctcata atttattgtt tataaacaat aaaattaatg tttttatttt aaataaaact + 12121 tatagagtaa atcttcacca atttttaata aataaaatct cagaagctag tgtgagcttt + 12181 gtggatattt atcgttcccc gttacctatt ttatatggat atggtccatt tttaatggat + 12241 attactaaac ctttagtgaa tttttttgag gacagtggct tcacctatga ttcaggaacc + 12301 attttagata aaactgatta ttttaaattt tatttaaaat ggttatggag ttataaattc + 12361 tttctattta gactgaatca cattaaagaa ggaaacagtg aatttgagaa gagttttaaa + 12421 ataattagaa gatattataa aatgggacga cagtatgagt aaatataagg aattagcaaa + 12481 aaatacaggt acttttgctt tagctaattt ttcatcaaaa atattaattt ttttgttagt + 12541 acctatatat acaaaagttc taacaacgac agagtatggt ttttatgatt tggtttatac + 12601 aacaattcag ctccttgtac caatcctgac attgaatata tctgaagcag ttatgagatt + 12661 tttaatgaaa gaagatgttt caaaaaaatc agttttttcg attgcaatac ttgatatatt + 12721 tttagggtct attatttttt gtttgttact actggtcaat caaatatttt ctttatcgga + 12781 gttaatttct caatatagca tatatatcat ggcgattttt gctttttata cacttaataa + 12841 ttttttgata caatactcta aagggattga taaaataggt gtaacggcta tctctggagt + 12901 cataagtgca gcagttatgc tttcgatgaa tattttattg ttagtggtat taaattgggg + 12961 actactaggt ttttttatcg caaatatttg tgggtatgtc attccttgtg tatatataat + 13021 agtaaaacta aaattatggg atttatttga acttaaaatt gatagatcgt tacagtggga + 13081 aatgatatat tatactttac ctttgatttt aaatacttta agttggtggg ttaataacac + 13141 ttcagatagg tatattataa cagtaattat aggtatacaa gctagtgcga ttatttcagt + 13201 tgcttataag attccacaaa ttttttccac aattagcgct atattcattc aatcgtggca + 13261 aatatctgca ataaaaattc aggaagaaaa agaaggtaac acctttatat caaaaatgct + 13321 tttatattat aatgcactct tgctgattat agcgagcggt atcattctat ttgtaaaacc + 13381 aatctctaat atactcttcg gagcttcatt ttattcagcg 
tggacgcttg taccgttttt + 13441 aattattagc agtttgttta atgcgatttc gggttatata ggagcgataa tgggcgctaa + 13501 aatggatact aaaaatattg ctaaatctgc tttggttgga atgatagcta atgttttttt + 13561 aaatattgta ttaacatttt taatgggact acaggggatt acaatctcaa ctatgatagc + 13621 tagttttctt attttttata tgagaaaaga tagtgttgaa gaaattgctc cagaaacata + 13681 tagagctatt tatctttcgt ggtttttgtt agtggttgag gctagtcttt tggtttatat + 13741 agattttatt attggggcta cattagttac attaatcaat ttatttttat taaaggatac + 13801 tcttaaacca ttatgtttaa aattattaaa aggatttaaa tgaaaatgaa tattctacaa + 13861 tacattaaaa ttttggctag aactattttt atgctattga taagtacagt gttattacct + 13921 gtcaggttaa aaaataataa gattctattt attaatttca atgggaaggg ttatggtgat + 13981 aatcctaaaa gtatttgtga gtatcttaga actacttacc cagatttaga tttggtttgg + 14041 cttgcaagag ataacgaagg ttttccagat ggggttaggg ttgttaaata tgggactttc + 14101 caagcttttt atgagcaagc gagttcgaag gtttgggtat ataatgtaag agcttttgca + 14161 agaatactaa aaaaacgagg acagatttat attcaaactt ggcatggtgc ttctagtttt + 14221 aagttgatag aaaaacaagc tgatttacca ataaattatg ttttagaagc taagtatgat + 14281 gcaagagtca cagatataat gatttcagat agcagaaaac aaactgaaga atttcaaaag + 14341 tatttttggt attcaggaga aatttttgag gtggggatgc cgagaaatga tgccttgttt + 14401 cactataagg aagactacga caagttaaat aatatcagaa aagaactaag cattcattca + 14461 gatgattatg ttattttata tgcccctact ttcagagatg atggggatgc atcttattta + 14521 gatataaatt ttgaacggct tttgcaatgt gttgaacacg gaattaaaaa gaaatgtaaa + 14581 ttcttaatta ggttacaccc taatcactcc catttgtgta ataatatttc atttaataag + 14641 aatataatca atgctacgtt ttattcagat atgcaagagc ttactttgtt ggcagatgtt + 14701 ttagtcacag attattcttc ctcgatattt gattttatgc ttttaaacaa gccttatgtc + 14761 agatatgtga atgatttaga aaaatatgct gagcttaggg gggtatcaga tacatattac + 14821 gaattgccgg attcgattat taaaactgct gaagaattgt atgacttact gcctaaaaaa + 14881 atagaaaatt ttgattatga ttctataaaa aaatatagaa atgaaatact gtgtccaatc + 14941 tttaatggaa ccgctagtga aaatgtagga aggagaataa ttcaagagtt gtgaagtaaa + 15001 acattgggtt atttttaagg taacgagatt tgaaaaataa 
tgatttaaag ataggaagtg + 15061 gagctattca tcaaatttcc gctacacttt ctcaaaatag tatttcggga aagattttat + 15121 attgtgctga tccagttgtc gatgacttgt acggttcgat agtacgttca caaatagagg + 15181 aaattggtcg ggtaaaggaa gaaagttgca attataatac tattgcttat gcgatgaata + 15241 tagcagaacg ggctattgcc acagatattg actgtattgt gggaatggga ggaggtcgtg + 15301 ttttagatgt ctgcaagtat gcatctttta tttcgaaacg tccttaccta tcgattccga + 15361 caacagcagc aaatgatggc attgcttccc cagttgctgt tttgaaaagg caggatgata + 15421 gaccaaaaag cttaggggcg gctatcccct caatgacact aattgatatt gatgttattg + 15481 catcaggacc tatacaaaat ataaaagctg gtatcggtga tacaatatcc aattacactg + 15541 cattgaaaga ttgggagttg gcagttgagc gagggaaaga tgagatgcat ggttttgcat + 15601 atctaatgtc gcaaaattct ttagatgctt taatgaaaac gaagtataat tctattaccc + 15661 ctgattttat tgaagttttg gtaaactctt tagttttatc aggcattgca atggattttg + 15721 cgggaagtag tagacctgtc agtgggtcag agcacttatt tagtcatgca ttagattact + 15781 atggttctac aaggaatctt catggaattc aggttgcatt aggtacagtc gcagttttga + 15841 aattaattga aaattctgtt gatactgtag tggattactt gcaaagattt gaggttcata + 15901 ttaacccgaa acttttgggg atagatgaag agttgtttat ttattgtatg caacatgcta + 15961 caaaaatgag aagtaatcgc tatacctatc tgcatgaagt tgatcttagc acagatagat + 16021 tgaaacaaat atataaggaa ctcataagcg agttgtagag aagagaggaa aaaatgaaag + 16081 cacttatttt agcagcaggg ttaggaacac gtctagctcc aattaccaat gaggtaccaa + 16141 aatctttggt accagtcaat ggtaagccaa ttttgatgaa acaaattgaa aatttatatc + 16201 aaaataatat tacagatatt acgattattg ctggatataa gtcatctgta ttaacagatg + 16261 cagttactga aaagtatcca gaaattaata ttattgataa tgttgatttt aaaacgacta + 16321 ataatatgta ttcagcctat ctaggaaaag ctgcaatggg tgatagtgac ttcttaatga + 16381 tgaatgcaga tgtattttat gatgcttctg ttattaaaag tctgttgctt cataaagctc + 16441 caaatgcaat tgtaactgat ttaggtattt atattgaaga gtctatgaaa gtcgtagaaa + 16501 aaaatggtcg tttagtagaa atttctaaac agatttcacc tgaggaaact ttaggagctt + 16561 ctattgatgt ttataaattc tcttatgaag caggtgctcg attctttgaa aagtgtaagg + 16621 aatttattga agataaacga gaacttcaaa tgtggagtga 
ggttgctctt aatgcaattc + 16681 tttctgaagt tgaatttgta gcatgtccat tagagggtcg ttggttagaa attgataatc + 16741 atgaagactt agttgctgca gaaaaactat ttgcttgaac cgaatacgga gaatgaaatt + 16801 gacaaataga gttgattatt ttggtgctga tattagtgaa cttcagaata aaaaattatt + 16861 cttatttgat atggatggta ccatttatga agaagatagg ttgtttgagg gtactctcga + 16921 attattagac tatattcata atattggcgg tgagtatatt tttattacaa acaattcatc + 16981 taagtctgtt gttgactatg ttgaaaaagt taacagatta ggtattaaag ctgaacgaga + 17041 taattttttt acctctgctc aagccacaat tgtttatatt aaagaaaatt atcctaaatc + 17101 taaagtttat tgccaaggaa caaaatcttt gataaaagaa ctatctgacg caggaattga + 17161 tgtaactgag caagttagtg ctgatataga tgttgttctt gttggttttg atacagaatt + 17221 aaccagtgat aaaattcgca atacctgcga gattctatca acaaaggacg tacctttcat + 17281 agctactaac cctgatattc gctgcccagt atcgtttgga ttcatcccgg attgtggttc + 17341 tatttgtgat atgattagta aatcagtcga taggaaacct gtttacatag gtaaacctga + 17401 acctacgatg gttgatattg ttcgaaaaaa attaaattat tctctatttg aaacagttgt + 17461 gattggagat cgcttgtata cggatatcat gactggtata aatgcaggag taacttcagt + 17521 ttgtgtgctg acaggagaag caacggtgaa tgatattcaa caagatagta taaaaccgac + 17581 ttatacattt aaaaacgtga aagaaatgtg gaaaggaatt gtctgatttt ttcattctga + 17641 atagtgaatt catgaatact gtcaaaatac tcgtatgtat ttaaattgat tttattattt + 17701 taataatgga caaattaaaa ttatttttct ccccaaatcg ttcgtgaacg taaagtactc + 17761 atcaacaaag aaaggtaccc cttttatgaa aggtattatt ctagcaggtg gttcgggaac + 17821 tcgcttgtat cctttgactc gcgctgcatc aaaacaactt atgccggttt atgataaacc + 17881 gatgatttac tacccacttt caacattaat gttggctggg attagggata ttttgattat + 17941 ctcaactcct caagatttgc ctcgttttaa agagcttctt caagatggtt ctgagtttgg + 18001 tattaaactt tcttatgctg agcaaccaag tccagatggt ttggcacaag cctttatcat + 18061 tggggaagag tttatcggtg acgatagcgt tgccttgatt ttaggtgaca atatctacca + 18121 tggtcctggt ctgagcacaa tgcttcaaaa agcagccaag aaagagaaag gtgcgactgt + 18181 ttttggctac catgtcaagg atccagaacg ctttggtgtt gtagaatttg atgaaaatat + 18241 gaatgctatc tccatcgaag aaaagccaga ataccctcgt 
tcaaactatg cagtgacagg + 18301 actctatttc tatgataatg atgtagtaga gattgccaaa agtattaaac caagtcctcg + 18361 tggtgaattg gaaattacag atgtcaacaa ggcttacttg gatcgtggtg atttgtctgt + 18421 tgagctcatg ggacgtggtt ttgcttggtt ggatactggc actcatgaaa gtttactaga + 18481 ggcttcgcag tacatcgaaa cagtccaacg gatgcaaaat gttcaggtag caaacttgga + 18541 agaaattgct taccgtatgg gctatatcag tcgcgaagat gtgttggcct tagcccaacc + 18601 acttaagaaa aatgaatacg gacagtatct actccgtttg attggagaag catagatgac + 18661 agataatttt ttcggtaaga cgcttgcggc acgcaaggtt gaagctattc caggcatgtt + 18721 ggagtttgat atccccgttc atggagataa tcgtggctgg tttaaagaaa atttccaaaa + 18781 ggaaaaaatg cttccacttg gatttccaga gtctttcttt gcagaaggaa aattgcaaaa + 18841 caatgtatcc ttctcacgta aaaatgtcct tcgaggcctc cacgcagagc cttgggataa + 18901 gtacatctct gtagcagatg gagggaaagt tctgggttct tgggttgatc tacgcgaggg + 18961 tgaaaccttt gggaatacct atcagacagt gattgatgcg agtaagggaa tctttgttcc + 19021 tcgaggcgta gctaatggct tccaagtttt atcagataca gtgtcatata gctatctggt + 19081 caatgattac tgggctcttg aactcaaacc caagtatgcc tttgtgaact acgctgatcc + 19141 aagccttggt attgaatggg aaaatattgc agaagcagaa gtttcagaag cagataaaaa + 19201 tcatccacta cttaaggatg taaaaccttt gaaaaaagaa gatttgtaaa aaggaaagaa + 19261 tatgactgaa tacaaaaata ttatcgtgac aggtggagct ggctttatcg gttctaactt + 19321 tgtccattat gtttacgaga actttccagg tgttcacgtg acagtcctag ataagttgac + 19381 ttatgctgga aatcgcgcga atattgagga aattttaggt aatcgtgttg agttagttgt + 19441 tggtgacatt gctgatgcgg agttggtaga caagttggct gctcaagcag atgctatcgt + 19501 tcattatgca gcggaaagcc acaatgataa ttcgctcaat gatccatcgc catttattca + 19561 tactaacttc atcggaacct atactctttt agaagctgct cgtaagtatg atattcgctt + 19621 ccaccatgta tcgacagatg aagtttatgg ggatctccct ttacgcgaag atttgccagg + 19681 tcatggtgaa ggaccaggtg agaaatttac tgctgaaaca aaatacaacc caagctctcc + 19741 gtactcatca accaaggcag cctcagattt gattgtcaaa gcctgggtgc gttcttttgg + 19801 agtcaaggca acgatttcca actgttcaaa taactacggt ccttatcaac atatcgaaaa + 19861 attcatccca cgtcagatta ctaacatcct aagtggaatt 
aagccaaaac tttacggtga + 19921 aggtaagaat gttcgtgact ggattcatac caatgaccat tcttcaggag tttggacaat + 19981 cttgacaaaa gggcaaatcg gtgaaaccta cttgattggg gctgatggtg agaagaacaa + 20041 taaggaagtt ttggaactta tccttaagga aatgggacaa gctacggatg cctatgatca + 20101 tgtgactgac cgtgcaggac atgaccttcg ctatgcgatt gatgccagca agctccgtga + 20161 tgagttgggg tggaaacctg aatttaccaa ctttgaagct gggctcaagg caacaatcaa + 20221 gtggtataca gataaccaag aatggtggaa agcagaaaaa gaagctgttg aagccaatta + 20281 tgctaagact caggagatta ttacagtata aaaagcagga aatagctgct ttttattgct + 20341 atattgggaa gagttacata ttagaaaggt ctagagatga ttttaattac aggggcaaat + 20401 ggccaattag gaacggaact tcgctattta ttggatgaac gtaatgaaga atacgtggca + 20461 gtagatgtgg ctgagatgga cattaccaat gaagaaatgg ttgaaaaagt ttttgaagag + 20521 gtgaaaccga ctttagtcta ccactgtgca gcctacaccg ctgttgatgc agcagaggat + 20581 gaaggaaaag agttgaactt cgccatcaat gtgacgggga caaaaaatgt cgcaaaagca + 20641 tctgaaaagc atggtgcaac tctagtttat atttctacgg actatgtctt tgacggtaag + 20701 aaaccagttg gacaagagtg ggaagttgat gaccgaccag atccacagac agaatatgga + 20761 cgcactaagc gtatggggga agagttagtt gagaagcatg tgtctaattt ctatattatc + 20821 cgtactgcct gggtatttgg aaattatggc aaaaacttcg tttttaccat gcaaaatctt + 20881 gcgaaaactc ataagacttt aacagttgta aatgaccagt acggtcgtcc gacttggact + 20941 cgtaccttgg ctgagttcat gacctaccta gctgaaaatc gtaaggaatt tggttattat + 21001 catttgtcaa atgatgcgac agaagacaca acatggtatg attttgcagt tgaaattttg + 21061 aaagatacag atgtcgaagt caagccagta gattccagtc aatttccagc caaagctaaa + 21121 cgtccgctaa actcaacgat gagcctggcc aaagccaaag ctactggatt tgttattcca + 21181 acttggcaag atgcattgca agaattttac aaacaagaag tgagataagt agtagaatga + 21241 ttttctagtc taataaaaga ggcagataat gaactccaaa ggagcttaag atgtacgatt + 21301 atcttgttgt tggtgctggt ctctttggcg catagctttg gctcagtttc tattatcgct + 21361 cacatcatcc atcagaagat taatctgaag gtacccaatt atcgccaaga agaagattgg + 21421 gctaggatgg gtttaccaat cacacgtaag gaaatctcta attggcatat caaggcaagt + 21481 caatactatt tagagtccct ttataacctt ttacgagaaa 
agttgttaga acaacctctt + 21541 cttcatgcgg atgaaacctc ttatcgggtt ctagagagtg atagccatct gacctactat + 21601 tggacctttt tgtctgggaa agctgagaat caagcaatca cgctgtacca tcatgatcag + 21661 cgtcggagtg gtttagtagt acaagaattc ctaggagatt attctggcta tgtgcattgt + 21721 gatatgttgc ggcagtaact taggacttta gtcctctagt tctgcctatg cgatagcagt + 21781 ccaaggttta ggagcaaggc gacgctaagc ttggtaaact gcgaaccgct agaagcttat + 21841 cgtcaactgg aagaagctga acttgttgga tgttgggcac atgtgagaag gaagtttttt + 21901 gaagcgaccc ccaagcaagc agataaatca tccttagaag ctaaaggttt agcttattgt + 21961 gatcagttat tttccctgga aagagactgg gaggctttgc cagctgatga acgactacag + 22021 aaacgtcaag aagagctcca acccctaatg gaagacttct ttgcttagtg ccggcgtcag + 22081 tcagttttag caggttcaaa actaggaagg gcaattgaat acagcctcaa gtatgaagaa + 22141 acctttaaga ctattttgaa agacggacat ctggtccttt ccaataatct agctgaacgc + 22201 gccattaaat cattggttat gggacggagt aaaagagttc agtggactct tttagcctaa + 22261 gctaaatttt aaaaagcgag ggtggttatt ttctcaaagt tttgaaggag ctaaagcaac + 22321 agctattatt atgagtttgt tggaaacagc taaacgtcat caattaaata gcgagaaata + 22381 tctattctat cttctagaat gtcttccaaa cgaggaaact ctcgtaaaca aagaggtttt + 22441 agaggcttat ttaccatgga ctaaagttgt acaagaaaag tgcaaataag aaatctccag + 22501 attaggaact atccgtgagt tctctagtct ggagattttt caatatactt cgttattggg + 22561 cgcttacaat gatattcata ttttttgcaa agatgttgtt tgaaaaataa ttttcaaaaa + 22621 ttctgaaaat tctgttgaca actttctgaa aagagtctat aatggagaga aagttttaaa + 22681 ggagaaaatg atgaaaagtt caaaactatt tgcccttgcg ggcgtgacat tattggcggc + 22741 gactacttta gctgcatgct ctggatcagg ttcaagtact aaaggtgaga agacattctc + 22801 atacatttat gagacagacc ctgataacct caactatttg acaactgcta aggctgcgac + 22861 agcaaatatt accagtaacg tggttgatgg tttgctagaa aatgatcgct acgggaactt + 22921 tgtgccgtct atggctgagg attggtctgt atccaaggat ggattgactt acacttatac + 22981 tatccgtaag gatgcaaaat ggtatacttc tgaaggtgaa gaatacgcgg cagtcaaagc + 23041 tcaagac +// diff --git a/public/res/serotype_genbank/serotype_23F.gb b/public/res/serotype_genbank/serotype_23F.gb new 
file mode 100644 index 0000000..958bf59 --- /dev/null +++ b/public/res/serotype_genbank/serotype_23F.gb @@ -0,0 +1,1006 @@ +LOCUS CR931685 22330 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain Dr. Melchior (serotype 23f). +ACCESSION CR931685 +VERSION CR931685.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 22330) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 22330) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..22330 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="Dr. 
Melchior" + /db_xref="taxon:1313" + gene <1..166 + /gene="dexB" + /locus_tag="SPC23F_0001" + CDS <1..166 + /gene="dexB" + /locus_tag="SPC23F_0001" + /codon_start=2 + /transl_table=11 + /protein_id="CAI33854.1" + /db_xref="GOA:Q4K241" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K241" + /translation="DRRFLVVANLSNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVP + WDAFCVEMTD" + gene complement(order(313..432,441..1707)) + /gene="tnp" + /locus_tag="SPC23F_0002" + /pseudo + CDS complement(join(313..432,441..1520,1519..1707)) + /gene="tnp" + /locus_tag="SPC23F_0002" + /note="member of homology group 17" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1202 transposase" + misc_feature complement(723..1223) + /gene="tnp" + /locus_tag="SPC23F_0002" + /note="HMMPfam hit to PF00665, Integrase core domain, + score 1.8e-21" + /pseudo + gene 1882..3327 + /gene="wzg" + /locus_tag="SPC23F_0003" + CDS 1882..3327 + /gene="wzg" + /locus_tag="SPC23F_0003" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33856.1" + /db_xref="GOA:Q9R928" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q9R928" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VDQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIIDSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1882..1998 + /gene="wzg" + /locus_tag="SPC23F_0003" + /note="Signal peptide predicted for SPC1208 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 
39 and 40" + misc_feature 2086..2433 + /gene="wzg" + /locus_tag="SPC23F_0003" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 6.7e-65" + misc_feature 2611..3054 + /gene="wzg" + /locus_tag="SPC23F_0003" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 5.7e-70" + gene 3329..4060 + /gene="wzh" + /locus_tag="SPC23F_0004" + CDS 3329..4060 + /gene="wzh" + /locus_tag="SPC23F_0004" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33857.1" + /db_xref="GOA:O54645" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:O54645" + /translation="MIDIHSHIVFDVDDGPKSREESKALLTESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTLDALEKLEKKEIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEQDLVHVIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 3332..3940 + /gene="wzh" + /locus_tag="SPC23F_0004" + /note="HMMPfam hit to PF02811, PHP domain, score 6.7e-38" + gene 4066..4761 + /gene="wzd" + /locus_tag="SPC23F_0005" + CDS 4066..4761 + /gene="wzd" + /locus_tag="SPC23F_0005" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33858.1" + /db_xref="GOA:Q4K0G3" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K0G3" + /translation="MMKEQNTIEIDVFQLFKTLWKRKLMILIVALVTGTGAFAYSTFI + VKPEYTSTTRIYVVNRNQGDKPGLTNQDLQAGTYLVKDYREIILSQDALEKVATNLKL + DMPAKTLASKVQVAVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIELLDTRVKRPEDVEDVLKI + PLLGLVPDFDKIK" + misc_feature 4087..4503 + /gene="wzd" + /locus_tag="SPC23F_0005" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 6.4e-55" + misc_feature 4609..4686 + /gene="wzd" + 
/locus_tag="SPC23F_0005" + /note="PS00217 Sugar transport proteins signature 2." + gene 4771..5460 + /gene="wze" + /locus_tag="SPC23F_0006" + CDS 4771..5460 + /gene="wze" + /locus_tag="SPC23F_0006" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33859.1" + /db_xref="GOA:O84996" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:O84996" + /translation="MPTLEISQAKLDSVKKAEEYYNALCTNLQLSGDGLKVFSITSVK + IGEGKSTTSANIAWAFARAGYKTLLIDGDIRNSVMLGVFKARNKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFTTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRNCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGIVLNKFDTSVDKYGSY + GNYGNYGKNKK" + gene 5475..6842 + /gene="wchA" + /locus_tag="SPC23F_0007" + CDS 5475..6842 + /gene="wchA" + /locus_tag="SPC23F_0007" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI33860.1" + /db_xref="GOA:Q4K0G1" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K0G1" + /translation="MNEKILRSSLAIIQSFLVILLTYLLSAVRETEIVSTTAIALCIL + HYFVFYISDYGQDFFKRRYLIELVQTLKYILFFALAIGISNFFLEDRFSISRRGMIYF + LTLHALLVYVLNLFIKWYWKRAYPNFKGSKKILLLTATSRVEKVLDRLIESNEVVGKL + VAVSVLDKPDFQHDCLKVVAEGGIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + IDVIVNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHVIAKRIIDIVGALVGLIL + CGLVSIVLVPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKIGCFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYIDGWTIWKDIEILLKTVKVVFM + RDGAK" + misc_feature 5475..5561 + /gene="wchA" + /locus_tag="SPC23F_0007" + /note="Signal peptide predicted for SPC1212 by SignalP 2.0 + HMM (Signal peptide probability 0.670) with cleavage site + probability 0.344 between residues 29 and 30" + misc_feature 6258..6839 + /gene="wchA" + /locus_tag="SPC23F_0007" + 
/note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 1.7e-161" + gene 6873..8051 + /gene="wchF" + /locus_tag="SPC23F_0008" + CDS 6873..8051 + /gene="wchF" + /locus_tag="SPC23F_0008" + /note="member of homology group 15" + /codon_start=1 + /transl_table=11 + /product="putative rhamnosyl transferase WchF" + /protein_id="CAI33861.1" + /db_xref="GOA:Q4K0G0" + /db_xref="InterPro:IPR001296" + /db_xref="InterPro:IPR015393" + /db_xref="UniProtKB/TrEMBL:Q4K0G0" + /translation="MKKSVYIIGSKGIPAKYGGFETFVEKLTAFQQDKAIQYYVACMR + ENSAKSGTTEDVFEHNGAICYNVDVPNFGPARAIAYDIAAINRAIEIAKENKDEDPIF + YILACRIGPFIHGIKKKIQEIGGTLLVNPDGHEWLRAKWSAPVRRYWKISEGLMVKHA + DLLVCDSKNIEKYIQEDYKQYQPKTTYIAYGTDTTRSVLKSSDEKVRSWFKEKNVSEN + EYYLVVGRFVPENNYESMIRGFLASNSKKDFVLITNVEQNKFYNQLLAKTGFDKDPRV + KFVGTVYEQELLKYIRENAFAYFHGHEVGGTNPSLLEALASTKLNLLLDVGFNREVAE + DGAIYWKKDNLHEIIETSEQKTQKEIDEKDILSIKQVTERFSWELIVNEYEKLFLCEK + " + misc_feature 7488..7994 + /gene="wchF" + /locus_tag="SPC23F_0008" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 0.0029" + gene 8351..9544 + /gene="wzy" + /locus_tag="SPC23F_0009" + CDS 8351..9544 + /gene="wzy" + /locus_tag="SPC23F_0009" + /note="member of homology group 168" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33862.1" + /db_xref="UniProtKB/TrEMBL:Q9R925" + /translation="MTIKINNLFFVCLSFFGIVLSSSQVIVNLGLSSIIQYISYFMLM + LCVFLTLIKNTLNVFANRIIYFLIISFLFIIGINLQNLPLSRKIYLSFSMLIISSLST + LPIKLINNLSDLRRISYYLLHSIFLSVFLGLVFKISLVTVAVEGIGFSYGFNGGLTHK + NFYAITILVSYILLYVSRKYDAKHQIDSFVLWLDLFLLLISNTRTVYIILVVFWIIIN + RNFINNIKKEHRLVVTATTIVISLLALTFFFKHIINNSESYSHRVLGVVNFFKYYESD + RFHLFFGDAELAFGNTTKGYGHNIRSVLGWDGTVEMPLLSVMIKNGYVGLVGYIIVLF + KFISSIISVKNSTKKNIGLSIFIPLLLSATVENYIVNISFVFMPVCFCILCSIKNIKL + VNNRK" + misc_feature 8351..8461 + /gene="wzy" + /locus_tag="SPC23F_0009" + /note="Signal peptide predicted for SPC1214 by SignalP 2.0 + HMM (Signal peptide probability 0.975) with cleavage site + probability 
0.241 between residues 37 and 38" + gene 9548..10519 + /gene="wchV" + /locus_tag="SPC23F_0010" + CDS 9548..10519 + /gene="wchV" + /locus_tag="SPC23F_0010" + /note="member of homology group 109" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33863.1" + /db_xref="GOA:O85000" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:O85000" + /translation="MEKLVSIILPVYNVEQYIKNCLESIQQQTYSNLEVIIVNDGSTD + KSVEYCEQICKIDSRFSITHKENGGLSDARNVGIDKSKGDYLIFVDSDDFVSQDMVSY + LVSCMENNEADIAICDPVHYYSDRQNNDLNIFSPASNVKVYETTEALCEMFYQKSFLV + SAWAKIFKRELFDDIRFPVGKLFEDSAIMYLLFEKCETIAYSDAELYAYVHRDNSITT + KKFSDRDLDILEITNTIINHYGDNLRVYTAAVSYKVSACFRILLNSPSGEKYKKVQKE + CLSYILQNWRNILFNNNVRLKNKLALISITIFNPFVKFIYSKVNRWE" + misc_feature 9563..10075 + /gene="wchV" + /locus_tag="SPC23F_0010" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 9.1e-49" + gene 10526..11758 + /gene="wchW" + /locus_tag="SPC23F_0011" + CDS 10526..11758 + /gene="wchW" + /locus_tag="SPC23F_0011" + /note="member of homology group 110" + /codon_start=1 + /transl_table=11 + /product="putative transferase" + /protein_id="CAI33864.1" + /db_xref="GOA:Q9R924" + /db_xref="UniProtKB/TrEMBL:Q9R924" + /translation="MNKYEERYQENLSKNDFYKLINKSYLSDKELQVQQVKAGIVLPP + KAFETKLSNKLGLQKSLHGKGGVVDSNGNYIELSAQKAVGMRNRVYGPYKINYDNLPI + RNEKVIYLNYFIKQWGHFLLDVVGRLWYPLLQDNDTKLVYTCYAGTETKIEGNYLEFL + KLLGIDQSRLIMINCPTQFSEVIIPESSILPGGYYTKEYKQLFSSVVENIKLDKYDVN + AKMIYCSRSKLGIAKSKEFGEDGIEGIFKQNGYTSVYMETMSLEEQIKTLLSAKTIVL + TSGSLAHNLLFVNKDIDVFILNKTYRVNLHQFLINEISDATVRFVDIYRSPLPILYGY + GPFLMDLTKPLANFLDDNEFVYEKGTVLSKKDYFKYYLKWLWSYRFFLFRLNGIKEGN + SEFEKSFKIIRRYYKTGR" + gene 11760..13145 + /gene="wzx" + /locus_tag="SPC23F_0012" + CDS 11760..13145 + /gene="wzx" + /locus_tag="SPC23F_0012" + /note="member of homology group 111" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33865.1" + /db_xref="GOA:Q9R923" + /db_xref="InterPro:IPR002797" + 
/db_xref="UniProtKB/TrEMBL:Q9R923" + /translation="MSKYKELAKNTGIFALANFSSKILIFLLVPIYTRVLTTTEYGFY + DLVYTTIQLFVPILTLNISEAVMRFLMKDGVSKKSVFSIAVLDIFIGSIAFALLLLVN + NLFSLSDLISQYSIYIFVIFVFYTLNNFLIQFSKGIDKIGVTAISGVISTAVMLAMNV + ILLVVFDWGLLGFFIANVCGYVIPCIYIVSRLRLWELFEIKIDKKLQWEMVYYALPLV + LNILSWWVNNTSDRYIVTAIVGIQASAIISVAYKIPQILSTISAIFIQSWQISAIKIQ + EDKSDTTFVSNMLLYYNALLLIIASGIILFVKPISNILFGISFYSAWELVPFLIISSL + FNAISGCIGAIMGAKMDTHNIAKSALVGMIANIILNIVLTFLMGPQGITISTLIASFL + IFYMRKDSVKEINSETYRAIYLSWILLVVEACLLIYMDFIIGALIAMVINLFLLKDVI + KPLYLKIFKRN" + misc_feature 11778..12587 + /gene="wzx" + /locus_tag="SPC23F_0012" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 6.3e-67" + gene 13153..14301 + /gene="wchX" + /locus_tag="SPC23F_0013" + CDS 13153..14301 + /gene="wchX" + /locus_tag="SPC23F_0013" + /note="member of homology group 53" + /codon_start=1 + /transl_table=11 + /product="putative glycerol phosphotransferase" + /protein_id="CAI33866.1" + /db_xref="GOA:Q9R922" + /db_xref="InterPro:IPR007554" + /db_xref="UniProtKB/TrEMBL:Q9R922" + /translation="MIVLQYFKILARFVFMFLISAVLLPFKIKPNKIVFINFNGKGYG + DNPKSICEYLRTTYPDLDLVWLARDNEGFPDGVRVVKYGTFQAFYEQASSKVWVYNVR + AFARILKKRGQIYIQTWHGASSFKLIEKQADLPINYVLEAKYDARVTDIMISDSRKQT + EEFQKYFWYSGEIFEVGMPRNDALFHYKEDYDKLNNIRKELSIHSDDYVILYAPTFRD + DGDASYLDINFERLLQCVEHGIKKKCKFLIRLHPNHSHLCNNISFNKNIINATFYSDM + QELTLLADVLVTDYSSSIFDFMLLNKPYVRYVNDLEKYAELRGVSDTYYELPDSIIKT + AEELYDLLPKKIENFDYDSIKKYRNEILCPIFNGTASENVGRRIIQEL" + misc_feature 13741..14292 + /gene="wchX" + /locus_tag="SPC23F_0013" + /note="HMMPfam hit to PF04464, + CDP-Glycerol:Poly(glycerophosphate) gl, score 4.3e-73" + gene 14337..15365 + /gene="gtp1" + /locus_tag="SPC23F_0014" + CDS 14337..15365 + /gene="gtp1" + /locus_tag="SPC23F_0014" + /note="member of homology group 40" + /codon_start=1 + /transl_table=11 + /product="putative glycerol-2-phosphate dehydrogenase" + /protein_id="CAI33867.1" + /db_xref="GOA:Q9R921" + /db_xref="InterPro:IPR002658" + 
/db_xref="InterPro:IPR016205" + /db_xref="UniProtKB/TrEMBL:Q9R921" + /translation="MKNNDLKIGSGAIHQISATLSQNSISGKILYCADPVVDDLYGSI + VRSQIEEIGRVKEESCNYNTIAYAMNIAERAIATDIDCIVGMGGGRVLDVCKYASFIS + KRPYLSIPTTAANDGIASPVAVLKRQDDRPKSLGAAIPSMTLIDIDVIASGPIQNIKA + GIGDTISNYTALKDWELAVERGKDEMHGFAYLMSQNSLDALMKTKYNSITPDFIEVLV + NSLVLSGIAMDFAGSSRPVSGSEHLFSHALDYYGSTRNLHGIQVALGTVAVLKLIENS + VDTVVDYLQRFEVHINPKLLGIDEELFIYCMQHATKMRSNRYTYLHEVDLSTDRLKQI + YKELISEL" + misc_feature 14358..15278 + /gene="gtp1" + /locus_tag="SPC23F_0014" + /note="HMMPfam hit to PF01761, 3-dehydroquinate synthase, + score 2.9e-70" + gene 15381..16085 + /gene="gtp2" + /locus_tag="SPC23F_0015" + CDS 15381..16085 + /gene="gtp2" + /locus_tag="SPC23F_0015" + /note="member of homology group 41" + /codon_start=1 + /transl_table=11 + /product="putative nucleotidyl transferase" + /protein_id="CAI33868.1" + /db_xref="GOA:O85005" + /db_xref="InterPro:IPR005835" + /db_xref="UniProtKB/TrEMBL:O85005" + /translation="MKALILAAGLGTRLAPITNEVPKSLVPVNGKPILMKQIENLYQN + NITDITIIAGYKSSVLTDAVTEKYPEINIIDNVDFKTTNNMYSAYLGKAAMGDSDFLM + MNADVFYDASVIKSLLLHKAPNAIVTDLGIYIEESMKVVEKNGRLVEISKQISPEETL + GASIDVYKFSYEAGARFFEKCKEFIEDKRELQMWSEVALNAILSEVEFVACPLEGRWL + EIDNHEDLVAAEKLFA" + misc_feature 15384..16082 + /gene="gtp2" + /locus_tag="SPC23F_0015" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 1e-07" + gene 16100..16933 + /gene="gtp3" + /locus_tag="SPC23F_0016" + CDS 16100..16933 + /gene="gtp3" + /locus_tag="SPC23F_0016" + /note="member of homology group 42" + /codon_start=1 + /transl_table=11 + /product="putative phosphotransferase" + /protein_id="CAI33869.1" + /db_xref="GOA:Q4K0F2" + /db_xref="InterPro:IPR005834" + /db_xref="InterPro:IPR006357" + /db_xref="UniProtKB/TrEMBL:Q4K0F2" + /translation="MKLTNRVDYFGADISELQNKKLFLFDMDGTIYEEDRLFEGTLEL + LDYIHNIGGEYIFITNNSSKSVVDYVEKVNRLGIKAERDNFFTSAQATIVYIKENYPK + SKVYCQGTKSLIKELSDAGIDVTEQVSADIDVVLVGFDTELTSDKIRNTCEILSTKDV + PFIATNPDIRCPVSFGFIPDCGSICDMISKSVDRKPVYIGKPEPTMVDIVRKKLNYSL + 
FETVVIGDRLYTDIMTGINAGVTSVCVLTGEATVNDIQQDSIKPTYTFKNVKEMWKGI + V" + misc_feature 16157..16843 + /gene="gtp3" + /locus_tag="SPC23F_0016" + /note="HMMPfam hit to PF00702, haloacid dehalogenase-like + hydrolase, score 5.9e-25" + gene 17093..17962 + /gene="rmlA" + /locus_tag="SPC23F_0017" + CDS 17093..17962 + /gene="rmlA" + /locus_tag="SPC23F_0017" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI33870.1" + /db_xref="GOA:Q4K0F1" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q4K0F1" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLPRFKELLQDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFIGDDSV + ALILGDNIYHGPGLSTMLQKAAKKEKGATVFGYHVKDPERFGVVEFDENMNAISIEEK + PEYPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRRGYISREDVLALAQSLKKN + EYGQYLLRLIGEA" + misc_feature 17096..17812 + /gene="rmlA" + /locus_tag="SPC23F_0017" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 3.7e-121" + gene 17963..18556 + /gene="rmlC" + /locus_tag="SPC23F_0018" + CDS 17963..18556 + /gene="rmlC" + /locus_tag="SPC23F_0018" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI33871.1" + /db_xref="GOA:Q9AHA9" + /db_xref="HSSP:1NXM" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:Q9AHA9" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKNHPLLKDVKPLKKEDL" + misc_feature 17999..18529 + /gene="rmlC" + /locus_tag="SPC23F_0018" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 4.5e-16" + 
gene 18569..19618 + /gene="rmlB" + /locus_tag="SPC23F_0019" + CDS 18569..19618 + /gene="rmlB" + /locus_tag="SPC23F_0019" + /EC_number="4.2.1.46" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI33872.1" + /db_xref="GOA:Q9AHA8" + /db_xref="HSSP:1KEP" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q9AHA8" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPDVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAVD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 18584..19540 + /gene="rmlB" + /locus_tag="SPC23F_0019" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 9.7e-05" + misc_feature 18587..19327 + /gene="rmlB" + /locus_tag="SPC23F_0019" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 5.4e-77" + misc_feature 18590..19402 + /gene="rmlB" + /locus_tag="SPC23F_0019" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/iso, score 1.6e-05" + gene 19684..20535 + /gene="rmlD" + /locus_tag="SPC23F_0020" + CDS 19684..20535 + /gene="rmlD" + /locus_tag="SPC23F_0020" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI33873.1" + /db_xref="GOA:Q4K0E8" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K0E8" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITDAEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGRELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT 
+ TWYDFAVEILKGTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 19684..20532 + /gene="rmlD" + /locus_tag="SPC23F_0020" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 1.6e-147" + misc_feature 19687..20328 + /gene="rmlD" + /locus_tag="SPC23F_0020" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 9.3e-05" + misc_feature 19687..20316 + /gene="rmlD" + /locus_tag="SPC23F_0020" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 1.4e-19" + misc_feature 19690..20418 + /gene="rmlD" + /locus_tag="SPC23F_0020" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 1.4e-08" + gene order(20611..21552,21569..21784) + /gene="tnp" + /locus_tag="SPC23F_0021" + /pseudo + CDS join(20611..21552,21569..21784) + /gene="tnp" + /locus_tag="SPC23F_0021" + /note="member of homology group 12" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1670 transposase" + misc_feature 20617..21060 + /gene="tnp" + /locus_tag="SPC23F_0021" + /note="HMMPfam hit to PF03050, Transposase IS66 family, + score 7.7e-05" + /pseudo + gene 21980..>22330 + /gene="aliA" + /locus_tag="SPC23F_0022" + CDS 21980..>22330 + /gene="aliA" + /locus_tag="SPC23F_0022" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33875.1" + /db_xref="GOA:Q4K0E7" + /db_xref="InterPro:IPR000914" + /db_xref="UniProtKB/TrEMBL:Q4K0E7" + /translation="MMKSSKLFALAGVTLLAATTLAACSGSGSSTKGEKTFSYIYETD + PDNLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKD + AKWYTSEGEEYAAVK" + misc_feature 21980..22066 + /gene="aliA" + /locus_tag="SPC23F_0022" + /note="Signal peptide predicted for SPC1227 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.277 between residues 29 and 30" + misc_feature 22226..22294 + /gene="aliA" + /locus_tag="SPC23F_0022" + /note="PS01040 Bacterial extracellular solute-binding + proteins, family 5 signature." 
+ORIGIN + 1 cgaccgtcgc ttcctagttg tggctaactt gtccaatgaa gagcaagact tgacagtaga + 61 aggaaaagtc aaatctgtct tgattgaaaa caccctagct caagaagtct ttgaaaaaca + 121 aatcttagtt ccatgggatg ctttctgtgt ggaaatgact gactagaatg agcaaacctc + 181 aagtttttga agcttgaggt tttttactat agtggattga aactagaata gtgcacctct + 241 gcttctaaaa cattgttaga aatcgatttg actgtcccga tcgattcgtc ctattcttat + 301 ttcattttgc tatacttgta gttgaggaga attaagctcc tcactagtaa actcttcata + 361 atccttttta tttttatgaa gatattgttt gaaagatgtg agtttccacg gatgggtttg + 421 tggagggata tacttgcgtc tttctttttt tgttctggtt cttgttcaaa gtttttcgaa + 481 tagagttcat gatttagtag ctcctttgtg tgatagattt tgtcagcgat attgaggtag + 541 atgtctccgt caaatgcttt tataactaat gctttcgtct ttctgatgaa atagacttct + 601 tttccttgtt cggtagggat atagtaacga ttttggaatc ggatatggtg tccactatcg + 661 acgactctct ccgccagtct agccagaatg agattccttt cagaggggtt aggaacctcc + 721 tcgaagacag agagttttgt cttgtttcca aactgttcat taaaggtttg aatgtaggaa + 781 agcaggaagg tattggcttc ttccaaggta tgaatattgt tttgttccag ttcgataggc + 841 aggcgagatt gtagtgtctg attgagtctt tcgactctcc ctttagcttg agggatagag + 901 gttgtctcaa ggagaatccc tagttggtga caggcgtatc caaactgtgt atgggtatcg + 961 tcctccattt tcttagagtt ggaggcttga taggtaaaga ccgttctctt atctgtttta + 1021 atttgaaggg gaatgccgtg attggctaag atttgttcga ggacatgata gtaagcattc + 1081 aagttctctt gtttatcaaa ataagcgcct aggatattgc cagaagcatc atcaatggct + 1141 aagtgtaagt tagatgtttg ggctccaaac taggcatgag gactggcatc catttgaatg + 1201 agttcaccag caaatttctt tctgggtcta ctaggatgta cttttttagg gtcttcaagg + 1261 aagttttcag ccgtcggtaa gattggattg tctaggggtt gattcaggtt cagtttagct + 1321 tgttttctta ctctcttctt tgtctttcta tgggacttag gcgacaggat atttttctta + 1381 tagagtattt ttctaacagt agtatcagag agctgaattc cttcttcttc agctagcaat + 1441 tcacagaaat gaaggacatt tggtttatat gtttcatagg agaggtattt ttttaggaga + 1501 cgttctttga tttcatcagg gattgcatgt tttggttttc gatttctgtt tccgtgtctg + 1561 aaggcttctt tgtcctttca gttgataggc tagtagcaga cgattgattt gtctttcaga + 1621 aagattgagc tcgacacagg ctcgtttctt 
tgttttcttt ccttgggcta tagcttttat + 1681 cacaagatat tttttcgttt cattcatatt cagttggatc cttttcatat gactattcta + 1741 ccaaatggga cattttcacg ttcgatttac taaagacatt atcacattcg aattacacaa + 1801 gatgcagata gtaaaaaaaa tgtagacatt accgtaaaaa agtgatataa tcgtatgatg + 1861 ttcaaggtat aggtgttaat catgagtaga cgttttaaaa aatcacgttc acagaaagtg + 1921 aagcgaagtg ttaatatcgt tttgctgact atttatttat tgttagtttg ttttttattg + 1981 ttcttaatct ttaagtacaa tatccttgct tttagatatc ttaacctagt ggtaactgcg + 2041 ttagtcctac tagttgcctt ggtagggcta ctcttgatta tctataaaaa agctgaaaag + 2101 tttactattt ttctgttggt gttctctatc cttgtcagct ctgtgtcgct ctttgcagta + 2161 cagcagtttg ttggactgac caatcgttta aatgcgactt ctaattactc agaatattca + 2221 atcagtgtcg ctgttttagc agatagtgat atcgaaaatg ttacgcaact gacgagtgtg + 2281 acagcaccga ctgggactga taatgaaaat attcaaaaac tactagctga tattaagtca + 2341 agtcagaata ccgatttgac ggtcgaccag agttcgtctt acttggcagc ttacaagagt + 2401 ttgattgcag gggagactaa ggccattgtc ttaaatagtg tctttgaaaa tatcatcgag + 2461 tcagagtatc cagactacgc atcgaagata aaaaagattt ataccaaggg attcactaaa + 2521 aaagtagaag ctcctaagac gtctaagaat cagtctttta atatctatgt tagtggaatt + 2581 gacacctatg gtcctattag ttcggtgtcg cgatcagatg tcaatatcct gatgactgtc + 2641 aatcgagata ccaagaaaat cctcttgacc acaacgccac gtgatgccta tgtaccaata + 2701 gcagatggtg gaaataatca aaaagataaa ttaacccatg cgggcattta tggagttgat + 2761 tcgtccattc acaccttaga aaatctctat ggagtggata tcaattacta tgtgcgattg + 2821 aacttcactt ctttcttgaa aatgattgac ttattgggag gggtagatgt tcataatgat + 2881 caagagtttt cagctctaca tgggaagttc catttcccag tagggaatgt ccatctagac + 2941 tctgagcagg ctctaggttt tgtacgtgaa cgctactcac tagccgatgg agaccgtgac + 3001 cgtggtcgca accaacaaaa ggttattgta gctatccttc aaaaattaac gtcaaccgaa + 3061 gcactgaaaa attatagtac gatcattgat agcttgcaag attctatcca aacaaatatg + 3121 ccacttgaga ctatgataaa tttggtcaat gctcagttag aaagtggagg gaattataaa + 3181 gtaaattctc aagatttaaa aggtacaggt cggacggatc ttccttctta tgcaatgcca + 3241 gacagtaacc tctatgtgat ggaaatagat gatagtagtt tagctgtagt 
taaagcagct + 3301 atacaggatg tgatggaggg tagatgaaat gatagacatc cattcgcata tcgtttttga + 3361 tgtagatgac ggtcccaagt caagagagga aagcaaggct ctcttgacag aatcctacag + 3421 gcagggggtg cgaaccattg tctctacctc tcaccgtcgc aagggcatgt ttgaaactcc + 3481 ggaagagaag atagcagaaa actttcttca ggttcgggaa attgcaaaag aagtagcaga + 3541 tgatttagtc attgcttatg gcgcagagat atactatact ctggatgctc tagaaaagct + 3601 agaaaaaaaa gaaattccta ccctcaatga tagtcgttat gccttgatag agtttagtat + 3661 gaacactcct tatcgcgata ttcatagcgc cttgagcaag atcttgatgt tgggaattac + 3721 tccagtcatt gcccacattg agcgctatga tgctcttgaa aataacgaaa aacgtgttcg + 3781 tgaactgatt gatatgggct gttacacgca agtaaatagt tcacatgtcc tcaaacccaa + 3841 actttttggc gaacgttata aattcatgaa aaaaagagct cagtattttt tagagcagga + 3901 tttggtccat gtcattgcaa gtgatatgca caatctagac ggtagacctc ctcatatggc + 3961 agaagcatat gaccttgtta cccaaaaata cggagaagcg aaggctcagg aactttttat + 4021 agacaatcct cgaaaaattg taatggatca actaatttag gagaaatgat gaaagaacaa + 4081 aacacgatag aaatcgatgt atttcaatta tttaaaacct tgtggaaacg caagctaatg + 4141 attttaatag tggcacttgt gacaggtacg ggggcttttg catatagcac ttttattgtt + 4201 aagccagaat atacgagtac cacgcgaatt tatgtagtga atcgcaatca aggagacaag + 4261 ccggggttga caaatcagga tttgcaggca ggaacttatc tggtaaaaga ctaccgtgag + 4321 attatccttt cgcaggatgc attggaaaaa gtagcgacaa atttgaagtt ggatatgcca + 4381 gcaaaaacgt tagccagcaa agttcaagtg gctgtgccag ctgacactcg tatcgtctca + 4441 atctctgtca aggataaaca gccagaggaa gccagtcgta tcgctaattc tctacgagaa + 4501 gttgctgcag aaaagatcgt cgctgtaacg cgagtatctg atgtaacgac acttgaagaa + 4561 gcgcgaccag ctacgactcc ctcttctcca aatgttcgac gcaattcctt gtttggtttt + 4621 cttggaggag cagtcgtaac agtaattgct gttcttttga ttgagttgct cgacacccgt + 4681 gtgaaacgtc ctgaagatgt tgaagatgta ctgaaaattc cacttttagg gctcgttcca + 4741 gattttgaca aaataaaata ggaggaagtt atgccaacat tagaaatctc acaggcaaaa + 4801 ttggattctg taaaaaaggc agaggaatat tataacgctt tgtgcacgaa cctacagtta + 4861 agtggagatg gtttgaaagt attttctatc acttctgtga aaataggaga aggaaaatca + 4921 acgacttccg 
ccaatatcgc ttgggctttt gcgcgtgcag gttacaaaac gctgctgatt + 4981 gatggagata ttcgcaattc tgttatgtta ggtgtcttta aagcaaggaa taagattaca + 5041 ggcctgacag aatttttatc aggaactaca gacctatcac aagggctttg tgataccaat + 5101 atcgaaaatc tctttgtaat tcaggctggc tctgtgtcac cgaatccgac agctcttctt + 5161 caaagtaaga atttcactac aatgcttgaa accttgcgta aatattttga ctacatcatt + 5221 gtagatactg ctcctgttgg tgtcgtgatt gatgcggcta ttattacgcg aaactgcgat + 5281 gcttctattt tagtgacgga ggcaggtgaa ataaatcgac gggatattca aaaagcaaaa + 5341 gaacagttgg aacacacagg aaagccgttt ttgggaattg tgttgaataa attcgatact + 5401 tcagtagaca aatacggttc ttatggaaat tatggaaatt acgggaaaaa taaaaaatag + 5461 gtcaggggat agagatgaat gaaaaaatat taagatcttc attggccata attcagagtt + 5521 ttcttgttat tttattgact tatctactta gtgctgtgag agaaacggag attgtttcaa + 5581 caacagctat tgcactttgt atcctccatt attttgtctt ttatatcagt gattatggac + 5641 aggatttctt taaaaggaga tatttgattg aacttgtcca gacattgaaa tatatcctat + 5701 tctttgcact agcgattggt atttctaatt ttttcttaga ggatcgattt agtatttcca + 5761 gacgaggcat gatttacttc ctcacattac atgctctctt agtctatgtg ctaaacctat + 5821 ttatcaagtg gtattggaag cgggcttatc ccaactttaa aggaagtaag aagattctct + 5881 tacttacagc aacttctcgt gtcgaaaagg tactggatag attaatagaa tcaaatgagg + 5941 ttgttgggaa gttggtagcc gtcagtgtct tagataaacc agattttcag catgattgtt + 6001 taaaggtagt agcagagggg gggatagtaa actttgcgac tcacgaggtg gtcgatgaag + 6061 tctttatcaa tcttccaagt gaaaaataca atattggaga gcttgtctct cagtttgaaa + 6121 cgatgggaat tgatgtaata gtcaatctaa atgcttttga tcgtagtttg gcacgtaaca + 6181 agcaaattcg tgagatggca gggttaaacg ttgtgacttt ttctacaaca ttttataaga + 6241 ctagtcatgt aattgctaag cggattattg atatcgtggg tgcattggta gggctgatac + 6301 tatgtggttt agtcagtatt gtactggttc ctttgattcg aaaggatggg ggatctgcta + 6361 tttttgctca gacgcgtata ggaaaaaatg gtcgtcagtt cactttttat aagtttcgct + 6421 ctatgtgtgt agatgccgag gcgaaaaaaa gagaactcat ggaacaaaat accatgcaag + 6481 gtggaatgtt taaggtggac gatgatcctc gtatcacgaa aattggttgt tttatacgga + 6541 agactagctt ggacgagcta ccacagtttt 
ataatgttct aaagggagat atgagtttgg + 6601 ttggcacacg gccaccaaca gtggacgagt atgagcacta taccccagaa caaaaacgcc + 6661 gactaagttt taaacctggc ataacaggtt tatggcaggt cagcggacga agtgagatca + 6721 agaatttcga tgaagttgtc aaattagatg tggcctatat tgatggttgg acaatctgga + 6781 aagatattga aattttattg aagacagtta aagtagtatt tatgagagat ggagcgaagt + 6841 aatttctgta tatccatcat attaggagag aaatgaaaaa gtcagtttat atcattggtt + 6901 caaaaggaat tcctgctaag tatggaggat ttgaaacttt tgttgagaaa ttaacagcct + 6961 tccaacaaga taaggctatc caatattatg tggcttgtat gcgtgaaaac tctgcaaaat + 7021 cagggactac tgaggatgtt tttgaacata atggtgctat ctgttataac gtcgatgttc + 7081 ctaattttgg tccagcgcga gctatagcgt atgatatcgc tgcaattaac agagctattg + 7141 agattgccaa agaaaataag gatgaagatc caatcttcta tattttagct tgtcgaattg + 7201 gtccgttcat ccatggaatt aagaaaaaaa tccaggagat aggtgggact cttctagtta + 7261 atccagatgg ccacgagtgg ttgcgagcta agtggagtgc tcctgttcgt cgctactgga + 7321 aaatttctga aggtcttatg gtcaaacatg cagatctttt agtgtgtgat agtaaaaata + 7381 ttgaaaaata tatccaagaa gattataaac agtatcaacc taagacaacc tatatcgctt + 7441 atgggactga tacaacacgc tccgtattaa agagtagtga tgaaaaagta cgttcttggt + 7501 tcaaagagaa gaatgtttct gagaacgagt attatctagt tgtaggacgt tttgtaccag + 7561 aaaacaacta tgaatctatg attcgtggct ttttggcgtc taactctaag aaggactttg + 7621 tcttaatcac aaatgtagaa cagaataaat tttataatca gttgttggca aaaactggtt + 7681 ttgataagga cccacgagta aaatttgtag gtacagtcta tgagcaagag cttcttaaat + 7741 atattcgtga aaacgccttt gcttacttcc acgggcatga agttggtgga accaatcctt + 7801 cgcttttaga agctctggca tcaactaaac tgaatttatt gctagatgtt ggctttaacc + 7861 gagaagttgc tgaagatggt gccatttact ggaagaaaga taatcttcat gagattattg + 7921 aaacgagtga acaaaaaaca caaaaagaga ttgatgagaa agatatactt tcaataaaac + 7981 aagtgacgga gcggttctct tgggaattga tagttaatga gtatgagaaa ctttttttat + 8041 gtgagaaata atttacagtt tcatagaaat gttataaaaa attaactctg aagaataatt + 8101 acatattgga tttagaatgt tttttgctga ttcttgttgt ttatggattt gaaaaaataa + 8161 gagaagatgc ctcctttttg tcaggatatc tatgcaatgt atacagaaat 
aatgactatt + 8221 agctgattgt attattctcg aaattgtaat taaatataat tgtattttgt ttttactata + 8281 ttcgaaaata caagtgactt tatacaatca aatcaaaatc tttcttgtta tttaataaaa + 8341 ggaatcaagt gtgactataa aaattaataa tttgtttttt gtttgtctat ccttttttgg + 8401 gatagtttta agtagttcac aagtgatagt gaacttggga ttgtctagta ttattcagta + 8461 catttcttat tttatgttga tgttgtgtgt atttttaaca ttaattaaga atactctcaa + 8521 cgtgtttgca aatagaatca tatatttttt gattatttca tttttgttta ttattgggat + 8581 taatttacaa aatcttccat tatcaagaaa gatttattta tcattctcta tgttaattat + 8641 ttctagctta tccaccttac cgataaagct aataaataat ctcagtgatt taagaaggat + 8701 atcatattac ttattgcaca gcatattttt atctgtattt ttaggtttgg tttttaaaat + 8761 atctttagta acagttgctg tagagggaat tggcttttca tatggtttta atggaggttt + 8821 gactcataaa aatttttatg caattacaat tttagtttcc tatattctac tatatgtcag + 8881 cagaaaatat gacgctaaac atcagattga tagttttgta ttatggttag atcttttttt + 8941 acttttaata tctaatacgc gaacagttta tataatacta gttgtttttt ggattattat + 9001 taatagaaat tttataaata atattaaaaa agagcataga ctggtagtga cagcaacgac + 9061 aatagtcatc tctttactgg cgttaacatt ttttttcaaa catataatta ataatagtga + 9121 atcatatagc catcgagtgt taggtgttgt gaattttttt aaatattatg aatcagatag + 9181 gtttcatttg ttttttgggg atgctgaatt agcctttgga aatacgacga agggttatgg + 9241 acacaatatt agaagtgtgt taggttggga tggaacggta gagatgcctt tactcagtgt + 9301 aatgattaaa aatggttatg ttgggttagt tggttacatt atagtgctgt ttaagtttat + 9361 atcttcaata atctcagtta aaaatagcac aaaaaaaaat attggattat caatctttat + 9421 tccgttactt ctatctgcaa cagttgaaaa ttatatcgtc aacattagct ttgtattcat + 9481 gcctgtctgc ttttgtattt tatgttcaat taaaaatata aaattagtaa ataacagaaa + 9541 gtaatatatg gaaaaattag ttagtattat tctgcccgtc tacaatgtcg aacagtatat + 9601 aaaaaattgt ttagaatcaa ttcaacaaca aacttattca aatttggaag taatcattgt + 9661 taatgacggt tcaaccgata aaagcgttga atattgtgag caaatttgca agatagattc + 9721 taggttttct atcactcaca aagaaaatgg tggactttcc gatgcaagaa atgtcggtat + 9781 agataaatcc aagggagatt acctcatttt tgttgacagt gatgattttg tctctcaaga + 9841 tatggtatct 
tatttagtat cttgtatgga gaacaatgag gcagacattg ctatttgcga + 9901 tcctgttcat tattacagtg atcgtcaaaa caatgatctt aatatttttt ctccggcatc + 9961 aaacgttaag gtttacgaaa caacggaggc tctatgtgag atgttttatc aaaaatcttt + 10021 tttggtgtct gcctgggcca agatatttaa aagagagttg tttgatgata taagatttcc + 10081 tgtaggtaag ctatttgaag atagtgcgat tatgtatttg ctcttcgaaa aatgtgaaac + 10141 aattgcatac tctgatgcgg aattatatgc ttatgtacac agggataata gcatcacaac + 10201 aaagaaattt tcggatagag acttagatat tttggagatt acgaacacaa ttattaatca + 10261 ctatggtgat aatttacgcg tgtatactgc agcggtgtct tataaggtat ctgcatgttt + 10321 cagaattcta ttaaactcac cttctggaga aaagtataaa aaagtacaaa aagaatgtct + 10381 gagttatatt ttacaaaatt ggagaaacat attatttaat aataatgttc gattgaagaa + 10441 caagcttgcc ttaatttcta taactatttt caatcctttt gttaaattta tctatagtaa + 10501 agtaaacaga tgggaatgat agcaaatgaa caaatatgaa gaaagatatc aagaaaattt + 10561 atctaagaat gatttttata aattaattaa taagagttac ttatcagata aagaacttca + 10621 agtacaacaa gtaaaagctg ggatagtctt accaccaaag gcatttgaaa caaaattatc + 10681 aaataaactt ggcctacaaa aatctttgca tggaaagggt ggagttgtag actcaaatgg + 10741 aaattacatt gaactatctg cacaaaaagc agtcgggatg agaaatagag tctatggtcc + 10801 gtataaaatt aattacgata atctgccaat tagaaatgaa aaagtaatct atttgaacta + 10861 tttcatcaaa caatggggac attttttact ggatgttgtt ggaaggttat ggtatccatt + 10921 gctgcaggat aatgatacta agttagtcta tacctgctat gctggaacag aaacaaagat + 10981 tgagggaaac tatttagagt ttttgaagct tctcggcata gatcaatcac gtttaatcat + 11041 gataaactgt cccactcagt tctcagaagt cattattcct gaaagctcca ttttaccggg + 11101 gggatattat acaaaagagt ataaacaact attcagttcg gtagtagaaa atattaaatt + 11161 ggacaagtat gatgtgaatg ctaaaatgat ttattgttcg aggtctaaat tagggattgc + 11221 taaaagtaaa gaatttggcg aagacggtat tgaggggatt tttaaacaaa atggctacac + 11281 atctgtttac atggaaacaa tgtctttgga agagcaaata aaaaccttat tatcggctaa + 11341 gacaatagta ttaacgagtg gttcgttagc acataatctt ttatttgtaa ataaagatat + 11401 tgatgttttt attttgaata aaacctatag agtaaatctc catcaatttt taataaacga + 11461 gatctcagat 
gctacagtaa gatttgtaga tatctatcga tcacctttac cgattttata + 11521 cggatatgga ccatttttaa tggatcttac aaaacctttg gctaatttct tggacgataa + 11581 tgaatttgta tatgaaaaag gtactgtttt aagtaaaaaa gattatttta aatactattt + 11641 gaaatggttg tggagttata gattcttttt atttaggtta aatggtatta aagaaggaaa + 11701 tagtgaattc gagaagagtt ttaagataat taggagatac tataaaacag gacgatagaa + 11761 tgagtaaata taaggaatta gcaaaaaata caggtatttt tgctttggct aacttttcat + 11821 caaagatttt aatttttttg ttagtaccta tatatacacg ggtacttacc actacggaat + 11881 atggttttta tgacttagtc tatacaacta ttcagctttt tgtaccaatc ttgacattaa + 11941 atatatctga agccgttatg aggttcctaa tgaaagatgg tgtttctaaa aaatcagtct + 12001 tttcaattgc tgttttagat atatttattg gatcaattgc ttttgcttta ttgttgttag + 12061 taaataacct gttttcttta tcagatttaa tttctcaata cagtatttac atatttgtaa + 12121 tctttgtttt ctatacccta aataattttt tgatacaatt ttctaaggga attgataaaa + 12181 ttggtgttac agctatctct ggggtcataa gtacagcagt tatgcttgcc atgaatgtca + 12241 ttcttctagt agtatttgat tggggattgt taggtttctt tattgctaat gtttgtggat + 12301 atgttatacc ttgtatttat atagtttcta gattaagatt gtgggaatta tttgaaatta + 12361 agattgataa aaaattacaa tgggaaatgg tttactatgc tttgccatta gttttaaata + 12421 tattaagctg gtgggtaaat aatacttcag atagatatat tgtgactgca atagtaggta + 12481 tacaagctag tgcaattatt tcagtcgctt ataaaattcc acagattttg tctacgatta + 12541 gtgcaatttt tattcaatca tggcaaatct ctgcaattaa aatacaagaa gataagagcg + 12601 atactacatt tgtatcaaac atgctcctat actataatgc acttctattg attatagcga + 12661 gtggtatcat attatttgtc aaacctattt ctaatatatt gtttggtatt tccttctatt + 12721 ctgcgtggga gctggtacca tttttaataa ttagcagtct attcaatgca atttcaggtt + 12781 gtataggagc aattatggga gctaaaatgg atactcataa cattgcaaag tcggctttag + 12841 ttgggatgat tgcaaatatt attttaaata tagtgttaac attcttaatg ggtccacagg + 12901 gaattacaat ttctaccctg atagctagtt ttcttatttt ttatatgcga aaagatagtg + 12961 taaaagaaat taattcagaa acatatagag caatttattt atcgtggata ctattagttg + 13021 tagaggcctg tctgctaatt tatatggatt ttattattgg tgctttaata gcaatggtaa + 13081 taaacttatt 
tttactaaaa gatgttatca aacctttata tttaaaaatt ttcaaaagaa + 13141 attaggtaca aaatgattgt tttacaatac tttaagattt tagctagatt cgtttttatg + 13201 tttttgataa gtgcggtgtt actgcctttc aaaataaaac ctaataagat tgtttttatt + 13261 aatttcaatg ggaaaggata tggtgataat ccgaaaagta tttgtgagta tcttagaact + 13321 acttacccag atttagattt ggtttggctt gcaagagata acgaaggttt tccagatggg + 13381 gttagggttg ttaaatatgg gactttccaa gctttttatg agcaagcgag ttcgaaggtt + 13441 tgggtatata atgtaagagc ttttgcaaga atactaaaaa aacgaggaca gatttatatt + 13501 caaacttggc atggtgcttc tagttttaag ttgatagaaa aacaagctga tttaccaata + 13561 aattatgttt tagaagctaa gtatgatgca agagtcacag atataatgat ttcagatagc + 13621 agaaaacaaa ctgaagaatt tcaaaagtat ttttggtatt caggagaaat ttttgaggtg + 13681 gggatgccga gaaatgatgc cttgtttcac tataaggaag actacgacaa gttaaataat + 13741 atcagaaaag aactaagcat tcattcagat gattatgtta ttttatatgc ccctactttc + 13801 agagatgatg gggatgcatc ttatttagat ataaattttg aacggctttt gcaatgtgtt + 13861 gaacacggaa ttaaaaagaa atgtaaattc ttaattaggt tacaccctaa tcactcccat + 13921 ttgtgtaata atatttcatt taataagaat ataatcaatg ctacgtttta ttcagatatg + 13981 caagagctta ctttgttggc agatgtttta gtcacagatt attcttcctc gatatttgat + 14041 tttatgcttt taaacaagcc ttatgtcaga tatgtgaatg atttagaaaa atatgctgag + 14101 cttagggggg tatcagatac atattacgaa ttgccggatt cgattattaa aactgctgaa + 14161 gaattgtatg acttactgcc taaaaaaata gaaaattttg attatgattc tataaaaaaa + 14221 tatagaaatg aaatactgtg tccaatcttt aatggaaccg ctagtgaaaa tgtaggaagg + 14281 agaataattc aagagttgtg aagtaaaaca ttgggttatt tttaaggtaa cgagatttga + 14341 aaaataatga tttaaagata ggaagtggag ctattcatca aatttccgct acactttctc + 14401 aaaatagtat ttcgggaaag attttatatt gtgctgatcc agttgtcgat gacttgtacg + 14461 gttcgatagt acgttcacaa atagaggaaa ttggtcgggt aaaggaagaa agttgcaatt + 14521 ataatactat tgcttatgcg atgaatatag cagaacgggc tattgccaca gatattgact + 14581 gtattgtggg aatgggagga ggtcgtgttt tagatgtctg caagtatgca tcttttattt + 14641 cgaaacgtcc ttacctatcg attccgacaa cagcagcaaa tgatggcatt gcttccccag + 14701 ttgctgtttt 
gaaaaggcag gatgatagac caaaaagctt aggggcggct atcccctcaa + 14761 tgacactaat tgatattgat gttattgcat caggacctat acaaaatata aaagctggta + 14821 tcggtgatac aatatccaat tacactgcat tgaaagattg ggagttggca gttgagcgag + 14881 ggaaagatga gatgcatggt tttgcatatc taatgtcgca aaattcttta gatgctttaa + 14941 tgaaaacgaa gtataattct attacccctg attttattga agttttggta aactctttag + 15001 ttttatcagg cattgcaatg gattttgcgg gaagtagtag acctgtcagt gggtcagagc + 15061 acttatttag tcatgcatta gattactatg gttctacaag gaatcttcat ggaattcagg + 15121 ttgcattagg tacagtcgca gttttgaaat taattgaaaa ttctgttgat actgtagtgg + 15181 attacttgca aagatttgag gttcatatta acccgaaact tttggggata gatgaagagt + 15241 tgtttattta ttgtatgcaa catgctacaa aaatgagaag taatcgctat acctatctgc + 15301 atgaagttga tcttagcaca gatagattga aacaaatata taaggaactc ataagcgagt + 15361 tgtagagaag agaggaaaaa atgaaagcac ttattttagc agcagggtta ggaacacgtc + 15421 tagctccaat taccaatgag gtaccaaaat ctttggtacc agtcaatggt aagccaattt + 15481 tgatgaaaca aattgaaaat ttatatcaaa ataatattac agatattacg attattgctg + 15541 gatataagtc atctgtatta acagatgcag ttactgaaaa gtatccagaa attaatatta + 15601 ttgataatgt tgattttaaa acgactaata atatgtattc agcctatcta ggaaaagctg + 15661 caatgggtga tagtgacttc ttaatgatga atgcagatgt attttatgat gcttctgtta + 15721 ttaaaagtct gttgcttcat aaagctccaa atgcaattgt aactgattta ggtatttata + 15781 ttgaagagtc tatgaaagtc gtagaaaaaa atggtcgttt agtagaaatt tctaaacaga + 15841 tttcacctga ggaaacttta ggagcttcta ttgatgttta taaattctct tatgaagcag + 15901 gtgctcgatt ctttgaaaag tgtaaggaat ttattgaaga taaacgagaa cttcaaatgt + 15961 ggagtgaggt tgctcttaat gcaattcttt ctgaagttga atttgtagca tgtccattag + 16021 agggtcgttg gttagaaatt gataatcatg aagacttagt tgctgcagaa aaactatttg + 16081 cttgaaccga atacggagaa tgaaattgac aaatagagtt gattattttg gtgctgatat + 16141 tagtgaactt cagaataaaa aattattctt atttgatatg gatggtacca tttatgaaga + 16201 agataggttg tttgagggta ctctcgaatt attagactat attcataata ttggcggtga + 16261 gtatattttt attacaaaca attcatctaa gtctgttgtt gactatgttg aaaaagttaa + 16321 cagattaggt 
attaaagctg aacgagataa tttttttacc tctgctcaag ccacaattgt + 16381 ttatattaaa gaaaattatc ctaaatctaa agtttattgc caaggaacaa aatctttgat + 16441 aaaagaacta tctgacgcag gaattgatgt aactgagcaa gttagtgctg atatagatgt + 16501 tgttcttgtt ggttttgata cagaattaac cagtgataaa attcgcaata cctgcgagat + 16561 tctatcaaca aaggacgtac ctttcatagc tactaaccct gatattcgct gcccagtatc + 16621 gtttggattc atcccggatt gtggttctat ttgtgatatg attagtaaat cagtcgatag + 16681 gaaacctgtt tacataggta aacctgaacc tacgatggtt gatattgttc gaaaaaaatt + 16741 aaattattct ctatttgaaa cagttgtgat tggagatcgc ttgtatacgg atatcatgac + 16801 tggtataaat gcaggagtaa cttcagtttg tgtgctgaca ggagaagcaa cggtgaatga + 16861 tattcaacaa gatagtataa aaccgactta tacatttaaa aacgtgaaag aaatgtggaa + 16921 aggaattgtc tgattttttc attctgaata gtgaattcat gaatactgtc aaaatactcg + 16981 tatgtattta aattgatttt attattttaa taatggacaa attaaaatta tttttctccc + 17041 caaatcgttc gtgaacgtaa agtactcatc aacaaagaaa ggtacccctt ttatgaaagg + 17101 tattattcta gcaggtggtt cgggaactcg cttgtatcct ttgactcgcg ctgcatcaaa + 17161 acaacttatg ccggtttatg ataaaccgat gatttactac ccactttcaa cattaatgtt + 17221 ggctgggatt agggatattt tgattatctc aactcctcaa gatttgcctc gttttaaaga + 17281 gcttcttcaa gatggttctg agtttggtat taaactttct tatgctgagc aaccaagtcc + 17341 agatggtttg gcacaagcct ttatcattgg ggaagagttt atcggtgacg atagcgttgc + 17401 cttgatttta ggtgacaata tctaccatgg tcctggtctg agcacaatgc ttcaaaaagc + 17461 agccaagaaa gagaaaggtg cgactgtttt tggctaccat gtcaaggatc cagaacgctt + 17521 tggtgttgta gaatttgatg aaaatatgaa tgctatctcc atcgaagaaa agccagaata + 17581 ccctcgttca aactatgcag tgacaggact ctatttctat gataatgatg tagtagagat + 17641 tgccaaaagt attaaaccaa gtcctcgtgg tgaattggaa attacagatg tcaacaaggc + 17701 ttacttggat cgtggtgatt tgtctgttga gctcatggga cgtggttttg cttggttgga + 17761 tactggcact catgaaagtt tactagaggc ttcgcagtac atcgaaacag tccaacggat + 17821 gcaaaatgtt caggtagcaa acttagaaga aattgcttac cgtaggggct atatcagtcg + 17881 agaagatgta ttggccttag cccaatcact taagaaaaat gaatacggac agtatctgct + 17941 ccgtttgatt 
ggagaagcat agatgacaga taattttttc ggtaagacgc ttgcggcacg + 18001 caaggttgaa gctattccag gcatgttgga gtttgatatc cccgttcatg gagataatcg + 18061 tggctggttt aaagaaaatt tccaaaagga aaaaatgctt ccacttggat ttccagagtc + 18121 tttctttgca gaaggaaaat tgcaaaacaa tgtatccttc tcacgtaaaa atgtccttcg + 18181 aggcctccac gcagagcctt gggataagta catctctgta gcagatggag ggaaagttct + 18241 gggttcttgg gttgatctac gcgagggtga aacctttggg aatacctatc agacagtgat + 18301 tgatgcgagt aagggaatct ttgttcctcg aggcgtagct aatggcttcc aagttttatc + 18361 agatacagtg tcatatagct atctggtcaa tgattactgg gctcttgaac tcaaacccaa + 18421 gtatgccttt gtgaactacg ctgatccaag ccttggtatt gaatgggaaa atattgcaga + 18481 agcagaggtt tcagaagcag ataaaaatca tccactactt aaggatgtaa aacctttgaa + 18541 aaaagaagat ttgtaaaaag gaaagaatat gactgaatac aaaaatatta tcgtgacagg + 18601 tggagctggc tttatcggtt ctaactttgt ccattatgtt tacgagaact ttccagatgt + 18661 tcatgtgaca gtcctagata agttgactta tgctggaaac cgcgcgaata ttgaggaaat + 18721 tttaggtaat cgtgttgagt tagttgttgg tgacattgct gatgcggagt tggtagacaa + 18781 gttggctgct caagcagatg ctatcgttca ttatgcagcg gaaagccaca atgataattc + 18841 gctcaatgat ccatcgccat ttattcatac taacttcatc ggaacctata ctcttttaga + 18901 agctgctcgt aagtatgata ttcgcttcca ccatgtatcg acagatgaag tttatgggga + 18961 tctcccttta cgcgaagatt tgccaggtca tggtgaagga ccaggtgaga aatttactgc + 19021 tgaaacaaaa tacaacccaa gctctccgta ctcatcaacc aaggcagcct cagatttgat + 19081 tgtcaaagcc tgggtgcgtt cttttggagt caaggcaacg atttccaact gttcaaataa + 19141 ctacggtcct tatcaacata tcgaaaaatt catcccacgt cagattacta acatcctaag + 19201 tggaattaag ccaaaacttt acggtgaagg taagaatgtt cgtgactgga ttcataccaa + 19261 tgaccattct tcaggagttt ggacaatctt gacaaaaggg caaatcggtg aaacctactt + 19321 gattggggct gatggtgaga agaacaataa ggaagttttg gaacttatcc ttaaggaaat + 19381 gggacaagct gtggatgcct atgatcatgt gactgaccgt gcaggacatg accttcgcta + 19441 tgcgattgat gctagcaagc tccgtgatga gttggggtgg aaacctgaat ttaccaactt + 19501 tgaagctggg ctcaaggcaa caatcaagtg gtatacagat aaccaagaat ggtggaaagc + 19561 agaaaaagaa 
gctgttgaag ccaattatgc taagactcag gagattatta cagtataaaa + 19621 agcaggaaat agctgctttt tattgctata ttgggaagag ttacatatta gaaaggtcta + 19681 gagatgattt taattacagg ggcaaatggc caattaggaa cggaacttcg ctatttattg + 19741 gatgaacgta atgaagaata cgtggcagta gatgtggctg agatggacat taccgatgca + 19801 gaaatggttg agaaagtttt tgaagaggtg aaaccgactt tagtctacca ctgtgcagcc + 19861 tacaccgctg ttgatgcagc agaggatgaa ggaagagagt tggacttcgc catcaatgtg + 19921 acggggacaa aaaatgtcgc aaaagcatct gaaaagcatg gtgcaactct agtttatatt + 19981 tctacagact atgtctttga tggtaagaaa ccagttggac aagagtggga agttgatgac + 20041 cgaccagatc cacagacaga atatggccgt actaagcgta tgggggaaga gttagttgag + 20101 aagcatgtgt ctaatttcta tattatccgt actgcctggg tatttggaaa ttatggcaaa + 20161 aacttcgttt ttaccatgca aaatcttgcg aaaactcata agactttaac agttgtaaat + 20221 gaccagtacg gtcgtccgac ttggactcgt accttggctg agttcatgac ctacctagct + 20281 gaaaatcgta aggaatttgg ttattatcat ttgtcaaatg atgcgacaga agacacaaca + 20341 tggtatgatt ttgcagttga aattttgaaa ggtacagatg tcgaagtcaa gccagtagat + 20401 tccagtcaat ttccagccaa agctaaacgt ccgctaaact caacgatgag cctggccaaa + 20461 gccaaagcta ctggatttgt tattccaact tggcaagatg cattgcaaga attttacaaa + 20521 caagaagtga gataagtagt agaatgattt tctagtctaa taaaagaggc agataatgaa + 20581 ctccaaagga gcttaagatg tacgattatc ttgttgttgg tgctgatctc tttggcgcat + 20641 agctttggct cagtttctat tatcgctcac accatccatc agaagtttaa tctgaaggta + 20701 cccaattatc gccaagaaga agattgggct aggatgggtt taccaatcac acgtaaggaa + 20761 atctctaatt ggcatatcaa ggcaagtcaa tactatttag agtcccttta taacctttta + 20821 cgagaaaagt tgttagaaca acctcttctt catgcggatg aaacctctta tcgggtgcta + 20881 gagagtgata gccatctgac ctactattgg acctttttgt ctgggaaagc tgagaatcaa + 20941 gcaatcacgc tgtaccatca tgatcagcgt cggagtggtt tagtagtaca agaattccta + 21001 ggagattatt ctggctatgt gcattgtgat atgttgcggc agtaacttag gactttagtc + 21061 ctctagttct gcctatgcga tagcagtcca aggtttagga gcaaggcgac gctaagcttg + 21121 gtaaactaag cttatcgtca actggaagaa gctgaacttg ttggatgttg ggcacatgtg + 21181 agaaggaagt 
tttttgaagc gacccccaag caagcagata aatcatcctt aggagctaaa + 21241 ggtttagctt attgtgatca gttattttcc ctggaaagag actgggaggc tttgccagct + 21301 gatgaacgac tacagaaacg tcaagaacat ctccagccct taatggaaga cttctttgct + 21361 tagtgccggc gtcagtcagt tttagcaggt tcaaaactag gaagggcaat tgaatacagc + 21421 ctcaagtatg aagaaacctt taagactatt ttgaaagacg gacatctggt cctttccaat + 21481 aatctagctg aacgcgccat taaatcattg gttatgggac ggagtaaaag aattcagtgg + 21541 actcttttag cctaagctaa attttaaaaa gcgagggtgg ttattttctc aaagttttga + 21601 aggagctaaa gcaacagcta ttattatgag tttgttggaa acagctaaac gtcatcaatt + 21661 aaatagcgag aaatatctat tctatcttct agaatgtctt ccaaacgagg aaactctcgt + 21721 aaacaaagag gttttagagg cttatttacc atggactaaa gttgtacaag aaaagtgcaa + 21781 ataagaaatc tccagattag gaactatccg tgagttctct agtctggaga tttttcaata + 21841 tacttcgtta ttggacggtt acgatattca tattttttgc aaagatgttg tttgaaaaat + 21901 aattttcaaa aattctgaaa attctgttga caactttctg aaaagagtct ataatggaga + 21961 gaaagtttta aaggagaaaa tgatgaaaag ttcaaaacta tttgcccttg cgggcgtgac + 22021 attattggcg gcgactactt tagctgcatg ctctggatca ggttcaagca ctaaaggtga + 22081 gaagacattc tcatacattt atgagacaga ccctgataac ctcaactatt tgacaactgc + 22141 taaggctgcg acagcaaata ttaccagtaa cgtggttgat ggtttgctag aaaatgatcg + 22201 ctacgggaac tttgtgccgt ctatggctga ggattggtct gtatccaagg atggattgac + 22261 ttacacttat actatccgta aggatgcaaa atggtatact tctgaaggtg aagaatacgc + 22321 ggcagtcaaa +// + diff --git a/public/res/serotype_genbank/serotype_24A.gb b/public/res/serotype_genbank/serotype_24A.gb new file mode 100644 index 0000000..f9b72c9 --- /dev/null +++ b/public/res/serotype_genbank/serotype_24A.gb @@ -0,0 +1,1024 @@ +LOCUS CR931686 21907 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 2748/40 (serotype 24a). +ACCESSION CR931686 +VERSION CR931686.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. 
+REFERENCE 1 (bases 1 to 21907) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 21907) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..21907 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="2748/40" + /db_xref="taxon:1313" + gene <1..133 + /gene="dexB" + /locus_tag="SPC24A_0001" + CDS <1..133 + /gene="dexB" + /locus_tag="SPC24A_0001" + /codon_start=2 + /transl_table=11 + /protein_id="CAI33876.1" + /db_xref="GOA:Q4K0E6" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K0E6" + /translation="VHEEQDLTVEGKVKSVLIENTAAKEVLEKQVLAPWDAFCVELL" + gene complement(264..452) + /gene="tnp" + /locus_tag="SPC24A_0002" + /pseudo + CDS complement(264..452) + /gene="tnp" + /locus_tag="SPC24A_0002" + /note="Lone member of homology group 0244" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn transposase(fragment)" + gene 886..1839 + /gene="tnp" + /locus_tag="SPC24A_0003" + CDS 886..1839 + /gene="tnp" + /locus_tag="SPC24A_0003" + /note="member of homology group 39" + /codon_start=1 + /transl_table=11 + /product="putative IS1239 transposase" + 
/protein_id="CAI33878.1" + /db_xref="GOA:Q4K0E5" + /db_xref="InterPro:IPR001584" + /db_xref="InterPro:IPR012337" + /db_xref="UniProtKB/TrEMBL:Q4K0E5" + /translation="MQEHYTPKGKHLTIDNRRLIERWKNENKSNREIAGLLGKAPQTI + HTEVKRGTTLQQVRKGLYKKVYSADYAQTVYQFNRKRSVKKLILTKEIREKILHYHKQ + KFSPEMMVNKKQVKVGISTIYYWFHNGHLGLTKADMLYPRKRKGVKKQASPNFKPAGK + SIEERPDVINLRLENGHYEIDTVLLTKIKNYCLLVLTDRRSRHQIIRLIPNKTAESVN + QALTLLLGEHRILSITADNGSEFKRLSEVFPEEHIYYAHAYSSWERGSNENHNRLIRR + WLPKGTKKTTPKEVAFIENWINNYPKKCLDYKSPSEFLLGG" + misc_feature 1393..1830 + /gene="tnp" + /locus_tag="SPC24A_0003" + /note="HMMPfam hit to PF00665, Integrase core domain, + score 6.6e-23" + gene 1924..3378 + /gene="wzg" + /locus_tag="SPC24A_0004" + CDS 1924..3378 + /gene="wzg" + /locus_tag="SPC24A_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33879.1" + /db_xref="GOA:Q4K0E4" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K0E4" + /translation="MLIMSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNI + LAFRYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGL + TNRLNATSNYSEYSICVAVLADSDIENVTQLTSVTAPTGTDNENVQKLLADIKSSQNT + DLTVDQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKV + EAPKTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPI + ADGGNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVH + NDQEFTAHTNGKYYPAGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAIIKKL + TSTEVLKNYSSILQGLQDSLQTNMPIETMIDLVNTQLESGGNYKVNSQDLKGTGRMDL + PSYAMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1924..2049 + /gene="wzg" + /locus_tag="SPC24A_0004" + /note="Signal peptide predicted for SPC1231 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 42 and 43" + misc_feature 2137..2484 + /gene="wzg" + /locus_tag="SPC24A_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 1e-62" + misc_feature 2662..3105 + /gene="wzg" + 
/locus_tag="SPC24A_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 6.6e-69" + gene 3380..4111 + /gene="wzh" + /locus_tag="SPC24A_0005" + CDS 3380..4111 + /gene="wzh" + /locus_tag="SPC24A_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33880.1" + /db_xref="GOA:Q4K0E3" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K0E3" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAEAYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTLDALEKLEKKEIPTLNDS + RYALIEFSMHTSYRQIHTGLSNILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QINSYHVLKPKLFGERYKFMKKRARYFLERDLVHVVASDMHNLDSRPPYMQQAYDIIA + KKYGAKKAKELFVDNPRKIIMDQLI" + misc_feature 3383..3991 + /gene="wzh" + /locus_tag="SPC24A_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 1.5e-38" + gene 4120..4812 + /gene="wzd" + /locus_tag="SPC24A_0006" + CDS 4120..4812 + /gene="wzd" + /locus_tag="SPC24A_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33881.1" + /db_xref="GOA:Q4K0E2" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K0E2" + /translation="MQDQNTLEIDVFQLFRALWKRKLVILLVAIITSSVAFAYSTFII + KPEFTSTTRIYVVNRNQEEKSGLTNQDLQAGSYLVKDYREIILSQDVLEEVVSDLKLD + LTPKGLANKIKVTVPVDTRIVSISVNDRVPEEASRIANSLREVAAQKIISITRVSDVT + TLEEARPAISPSSPNIKRNTLIGFLAGVIGTSVIVLLLELLDTRVKRPEDIENTLQMT + LLGVVPNLNKLK" + misc_feature 4138..4554 + /gene="wzd" + /locus_tag="SPC24A_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 7.1e-54" + misc_feature 4660..4737 + /gene="wzd" + /locus_tag="SPC24A_0006" + /note="PS00217 Sugar transport proteins signature 2." 
+ gene 4822..5505 + /gene="wze" + /locus_tag="SPC24A_0007" + CDS 4822..5505 + /gene="wze" + /locus_tag="SPC24A_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33882.1" + /db_xref="GOA:Q4K0E1" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K0E1" + /translation="MPTLEIAQKKLEFIKKAEEYYNALCTNIQLSGDKLKVISVTSVN + PGEGKTTTSVNIAWSFARAGYKTLLIDGDTRNSVMSGVFKSREKITGLTEFLSGTADL + SHGLCDTNIENLFVVQSGTVTPNPTALLQSKNFNDMIETLRKYFDYIIVDTPPIGIVI + DAAIITQKCDASILITATGEANKRDVQKAKQQLEQTGKLFLGVVLNKLDISVDKYGVY + GSYGNYGKK" + gene 5521..6888 + /gene="wchA" + /locus_tag="SPC24A_0008" + CDS 5521..6888 + /gene="wchA" + /locus_tag="SPC24A_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI33883.1" + /db_xref="GOA:Q4K0E0" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K0E0" + /translation="MDEKGLKIFLAVLQSIIVILLVYFLSFVRETEVERSSMVILYLL + HFFVFYFSSYGNNFFKRGHLVEFNSTIRYIFFFAIAISVLNFFIAERFSISRRGMVYF + LTLEGISLYLLNFLVKKYWKHVFFNLKNSKKILLLTVTKNMEKVLDKLLESDELSWKL + VAVSVLDKSDFQHDKIPVIEKEKIIEFATHEVVDEVFVNLPGESYDVGEIISRFETMG + IDVTVNLKAFDKNLGRNKQIHEMVGLNVVTFSTNFYKTSHVISKRILDICGATIGLIL + FAIASLVLVPLIRKDGGPAIFAQTRIGKNGRHFTFYKFRSMRIDAEAIKEQLMDQNTM + QGGMFKIDNDPRVTKIGRFIRKTSLDELPQFWNVFIGDMSLVGTRPPTVDEYDQYTPE + QKRRLSFKPGITGLWQVSGRSKITDFDDVVKLDVAYIDNWTIWKDIEILLKTVKVVFM + RDGAK" + misc_feature 6304..6885 + /gene="wchA" + /locus_tag="SPC24A_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 1.2e-146" + gene 6919..8091 + /gene="wchF" + /locus_tag="SPC24A_0009" + CDS 6919..8091 + /gene="wchF" + /locus_tag="SPC24A_0009" + /note="member of homology group 15" + /codon_start=1 + /transl_table=11 + /product="putative rhamnosyl transferase WchF" + 
/protein_id="CAI33884.1" + /db_xref="GOA:Q4K0D9" + /db_xref="InterPro:IPR001296" + /db_xref="InterPro:IPR015393" + /db_xref="UniProtKB/TrEMBL:Q4K0D9" + /translation="MKKSVYIIGSKGIPAKYGGFETFVEKLTAFQQDKAIQYYVACMR + ENSAKSGTTEDVFEHNGAICYNVDVPNIGPARAIVYDIAAINRAIKIAKENKDEDPIF + YILACRIGPFIHGIKKKIQAIGGTLLVNPDGHEWLRAKWSAPVRRYWKISEGLMVKHA + DLLVCDSKNIEKYIQEDYKQYQPKTTYIAYGTDTTRSILKSSDEKVRSWFKEKNVSEN + EYYLVVGRFVPENNYESMIRGFLASNSKKDFVLITNVEQNKFYNQLLAKTGFDKDPRV + KFVGTVYEQELLKYIRENAFAYFHGHEVGGTNPSLLEALASTKLNLLLDVGFNREVGE + QSAIYWKKDELSQVIEKVEQFDAKMIDELDRQSNQRIADSFTWEKIVTDYEKVFKG" + gene 8097..8993 + /gene="wcxG" + /locus_tag="SPC24A_0010" + CDS 8097..8993 + /gene="wcxG" + /locus_tag="SPC24A_0010" + /note="member of homology group 79" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="CAI33885.1" + /db_xref="GOA:Q4K0D8" + /db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4K0D8" + /translation="MAVKLKYDKSDITFLDDDELKKYQSELLKMISDVFTFFDENRIA + YSLSGGSILGAIRHKGFIPWDDDVDINIPRESYDKLFSLFELDNSLSRKYYLQSAKSH + PELGLHVSQIRKKGTVARRKYDHSAEECGISIDLYIVENVYNNPVKRFFQGYTSMFLT + FALASVRETKNHALMKEMFRLEGRKLNYSAGKLMVGWFFGIIPIEKWLNWLDKCNSSC + KDSHTKYVSIPTGRKHFRRETYLRENMNIYKKVPFETLMVNVPVWSEEYLEMFYGKDY + MVVPPVDKREQHLFLELSYGEE" + misc_feature 8214..8915 + /gene="wcxG" + /locus_tag="SPC24A_0010" + /note="HMMPfam hit to PF04991, LICD Protein Family, score + 2.3e-19" + gene 8994..9713 + /gene="abp1" + /locus_tag="SPC24A_0011" + CDS 8994..9713 + /gene="abp1" + /locus_tag="SPC24A_0011" + /note="member of homology group 57" + /codon_start=1 + /transl_table=11 + /product="putative IspD-family transferase (arabinitol) + Abp1" + /protein_id="CAI33886.1" + /db_xref="GOA:Q4K0D7" + /db_xref="InterPro:IPR001228" + /db_xref="UniProtKB/TrEMBL:Q4K0D7" + /translation="MKVAILTASGIGSRIGQDIPKQFIHVENKPVIIYTLEKFQNHPE + IDEICIVILKGWDQMVKAYAEQFGITKLKMITFGGKSGQESIYNGLREVKKAHPNDDV + TVLIHDGNRPLVSNDIISNALATYQQFGNAVAAIPTTEVVFVLENPQSTSSTEALNRD + 
LLRRTQTPHVYHLDNILSLHEKALENGITDVAASCQLMQLFGEKSYFSLGTEKNLKIT + TVEDLDIFKALLSSTRDKWIK" + misc_feature 9000..9689 + /gene="abp1" + /locus_tag="SPC24A_0011" + /note="HMMPfam hit to PF01128, Uncharacterized protein + family UPF0007, score 2e-14" + gene 9716..10771 + /gene="abp2" + /locus_tag="SPC24A_0012" + CDS 9716..10771 + /gene="abp2" + /locus_tag="SPC24A_0012" + /note="member of homology group 58" + /codon_start=1 + /transl_table=11 + /product="putative dehydratase/epimerase (arabinitol) + Abp2" + /protein_id="CAI33887.1" + /db_xref="GOA:Q4K0D6" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K0D6" + /translation="MTLLLNKIYRQDVESSLETIVNINDLNGKSILITGASGLIGSSV + IDQLLLLNEIRNFNIKIFCCGREFESLEKRFGRQTEYLHFVFYDATKAPHFDFAVDYI + IHAASPASPELYVNQPVETMASNFLGMYNLLEYAKNAKVSNLVYISSSEVYGISTSNN + PLDENYIGTVDHLSVRSSYANSKRATETLCVSFASEYGIKIMIVRPGHIYGPSAKDSD + NRVSSFFMTEAIAGRDIVIKSTGSQLRSYCYSLDCASAILSVLLSGGSGQAYNVSNPN + SIITIKQMATCIADASGVRVLYDIPITQERKQENPMVNASLDSEKIESLGWSGLFSAE + VGFHHTFSILKELSSEK" + misc_feature 9803..10762 + /gene="abp2" + /locus_tag="SPC24A_0012" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.00052" + misc_feature 9806..10564 + /gene="abp2" + /locus_tag="SPC24A_0012" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.00074" + misc_feature 9806..10534 + /gene="abp2" + /locus_tag="SPC24A_0012" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 6.1e-44" + misc_feature 9809..10621 + /gene="abp2" + /locus_tag="SPC24A_0012" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 2.5e-05" + gene 10761..10895 + /gene="HG268" + /locus_tag="SPC24A_0013" + /pseudo + CDS 10761..10895 + /gene="HG268" + /locus_tag="SPC24A_0013" + /note="member of homology group 268" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative rhamnosyl transferase (fragment)" + gene complement(10986..11165) + /gene="tnp" + 
/locus_tag="SPC24A_0014" + /pseudo + CDS complement(10986..11165) + /gene="tnp" + /locus_tag="SPC24A_0014" + /note="Lone member of homology group 0245" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1381 transposase (fragment)" + gene 11505..12755 + /gene="wzy" + /locus_tag="SPC24A_0015" + CDS 11505..12755 + /gene="wzy" + /locus_tag="SPC24A_0015" + /note="member of homology group 112" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33890.1" + /db_xref="UniProtKB/TrEMBL:Q4K0D5" + /translation="MIDGDFMNRRLVIKKKSIMFFMLMLCVTAFYGTNYWYTNIYIYD + FMLITSCLLSIIVFVCNGIRIDKTYYKGTIILGIVMWFSGLIAAQGKGLPAIVIFKES + LYTITPIMIFLAFRPMIKSIKDTSLFLRTISAAGVICNLIACIEMFFAKRGFDFLNIS + VFEKLRNGTPRFIIGETIIVLSFFISCSVVFSKGGKRNRRIFHVLNIALTAINLVYII + KTRTLNLYILSTLMMMPVLKKNVKKQLKFWIVFLISIILTFVSAEYFIPIVKNLIHSD + HGIQIRFLTIEYYIEYFKNHYLLGAGYISSSPYFETYSIVTGPLGRYYPSDVGLIGLM + FRSGIIGLIWLISWFYTSLKIIKDNTIRIPAHYDLLMKLVIVFLMFSCINLIITDAPR + FPYIALAMLLFESSYTLSYENSSN" + gene 12794..13717 + /gene="wcxI" + /locus_tag="SPC24A_0016" + CDS 12794..13717 + /gene="wcxI" + /locus_tag="SPC24A_0016" + /note="member of homology group 113" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33891.1" + /db_xref="GOA:Q4K0B4" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K0B4" + /translation="MIKRLAILMATYNGEKYIKEQIESILNQDTDFDFTLIIRDDGST + DNTKNIIREYVDSGKIIFIEGQNKGAARGFISLLCDNPGYDYYAFSDQDDVWNHNKLQ + KGIWSLSKYTGPALYCSNCELVDSELNSIGRNTHRKRPNYTLESILCLASCAQGCTSV + FNKELASIIQENDVPDTFIMHDSLITCLCALIGGKIIYDEIPSMKYRMHDDNIFGMVS + AKQNVLNVIKDRISEITKKRTISMYDQAECLLKVYKKYIDSNNQDICRIVIDSKVSLK + ARLKLIFNKNLQHTTLNKTITKKLEILFGND" + misc_feature 12809..13300 + /gene="wcxI" + /locus_tag="SPC24A_0016" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 2.8e-23" + gene 13733..14512 + /gene="wcxJ" + /locus_tag="SPC24A_0017" + CDS 13733..14512 + /gene="wcxJ" + /locus_tag="SPC24A_0017" + 
/note="member of homology group 114" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33892.1" + /db_xref="GOA:Q4K0D3" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K0D3" + /translation="MKYQLIVSTMNQQDNSLIEKMNIKSDAIIINQSNSFSYHETKLK + NSIVKWYEFNERGIGLSRNTGFMRSDADIIQFADDDMIFTDTYYEDVLLEYQKHPEAD + VILFSNKCLNEDRMPYQVNNFGRINRFEGVKFGGARITARREKILHNNITFSLLFGGG + AKYGAGEDVTFIQDCIKAGLRVYKSPIIVSTMKQDSSTWFKGYDRKYYKDKGALLAAN + FPSISEVGVYIQAFKNRGGIYTFSELLRFYKEGINEFKINR" + gene 14522..15364 + /gene="wcxK" + /locus_tag="SPC24A_0018" + CDS 14522..15364 + /gene="wcxK" + /locus_tag="SPC24A_0018" + /note="member of homology group 115" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="CAI33893.1" + /db_xref="GOA:Q4K0D2" + /db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4K0D2" + /translation="MMRRFLIMPRNKVYNTGETDIELKNKYNYEGSELRKAQVRMIDM + LSFLNDICKENNITYFIAFGTLLGAIRHGGFIPWDDDLDIYINDKGLKKLRKIINNGN + YPYVIQDYSSDKGFVRYYSVLRDTNSEYIKDEYQHNQRKYRGVQIDLFPYGYGVMKWG + ERLIGKTYGFNEKIFLGKNKMLTALIFYLTKEVIIPFLKVISKINGRKKVGLGYETGD + PGYYYNSYDVFPLKTIDFEGLVVPCPNNPGLVLEVDYGPDYMELPNETQRDHHKIRNI + HFYD" + misc_feature 14675..15289 + /gene="wcxK" + /locus_tag="SPC24A_0018" + /note="HMMPfam hit to PF04991, LICD Protein Family, score + 3.2e-20" + gene 15415..16854 + /gene="wzx" + /locus_tag="SPC24A_0019" + CDS 15415..16854 + /gene="wzx" + /locus_tag="SPC24A_0019" + /note="member of homology group 47" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33894.1" + /db_xref="GOA:Q4K0D1" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K0D1" + /translation="MNIGKQRSVRKNAILSVIKQLFTLLFPMITFPYATQILGVANYG + KYTFSMSVVNYISYIAAAGILRYAVRECARVRDDKEALHKLVNEIYTINIITTMFAYL + LLFVVLTFVPLLEEYISWIILLSLSVLFTTIGTDWINSAFEDYLFITIRYIISQIFAL + FLLFLLVREQDNITQYAFVSIFAGILANILNIVHIRKTLGIVPRLMYSRQLFSHIKPI + LYLFASTIATFIYINSDVTFLRIYADDTSVGYYGVSTQFYQLIKQLINAAFIVVVPRI + 
SNELTKEKSLAYSRYSKILVITILLVIPCAAGLFMIRHNLVILFSGEEYVKAASSLAI + LAVALIPAMIANFFINIVMIPLGMEKQVMIATIISALVNIGLNFVLIPRFAENAAAFT + TLNAEIILILIAMFYCRDIKLKSVTKPIATSIVGSGVIIFICSVLNKNVSNYFVNVVL + CLMVCGILYSVVILFFYKTELKRIIKEIK" + misc_feature 15439..16254 + /gene="wzx" + /locus_tag="SPC24A_0019" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 2e-35" + gene 16939..17808 + /gene="rmlA" + /locus_tag="SPC24A_0020" + CDS 16939..17808 + /gene="rmlA" + /locus_tag="SPC24A_0020" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI33895.1" + /db_xref="GOA:Q4K1A5" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q4K1A5" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLHRFQELLQDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFISDDSV + ALILGDNIYHGSGLSKMLQKAASKESGATVFGYHVKDPERFGVVEFDQDMKAISIEEK + PEQPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLTLAQPLKKN + EYGQYLLRLIGEA" + misc_feature 16942..17658 + /gene="rmlA" + /locus_tag="SPC24A_0020" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 4.9e-120" + gene 17809..18402 + /gene="rmlC" + /locus_tag="SPC24A_0021" + CDS 17809..18402 + /gene="rmlC" + /locus_tag="SPC24A_0021" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI33896.1" + /db_xref="GOA:Q9AHA9" + /db_xref="HSSP:1NXM" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:Q9AHA9" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKNHPLLKDVKPLKKEDL" + misc_feature 
17845..18375 + /gene="rmlC" + /locus_tag="SPC24A_0021" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 4.5e-16" + gene 18415..19464 + /gene="rmlB" + /locus_tag="SPC24A_0022" + CDS 18415..19464 + /gene="rmlB" + /locus_tag="SPC24A_0022" + /EC_number="4.2.1.46" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI33897.1" + /db_xref="GOA:O54546" + /db_xref="HSSP:1KEP" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:O54546" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPDVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAAD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 18430..19386 + /gene="rmlB" + /locus_tag="SPC24A_0022" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.00012" + misc_feature 18433..19173 + /gene="rmlB" + /locus_tag="SPC24A_0022" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 5.4e-77" + misc_feature 18436..19248 + /gene="rmlB" + /locus_tag="SPC24A_0022" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/iso, score 1.4e-05" + gene 19530..20381 + /gene="rmlD" + /locus_tag="SPC24A_0023" + CDS 19530..20381 + /gene="rmlD" + /locus_tag="SPC24A_0023" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI33898.1" + /db_xref="GOA:O54665" + /db_xref="HSSP:1N2S" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:O54665" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITDAEMVEK + 
VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 19530..20378 + /gene="rmlD" + /locus_tag="SPC24A_0023" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 3.4e-148" + misc_feature 19533..20174 + /gene="rmlD" + /locus_tag="SPC24A_0023" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.0001" + misc_feature 19533..20162 + /gene="rmlD" + /locus_tag="SPC24A_0023" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 5.6e-19" + misc_feature 19536..20264 + /gene="rmlD" + /locus_tag="SPC24A_0023" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 1.8e-08" + gene 20732..21539 + /gene="glf" + /locus_tag="SPC24A_0024" + /pseudo + CDS join(20732..20950,20950..21036,21036..21539) + /gene="glf" + /locus_tag="SPC24A_0024" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /pseudo + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + misc_feature join(20879..20950,20950..21036,21036..21482) + /gene="glf" + /locus_tag="SPC24A_0024" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 7.3e-109" + /pseudo + gene 21860..>21907 + /gene="aliA" + /locus_tag="SPC24A_0025" + CDS 21860..>21907 + /gene="aliA" + /locus_tag="SPC24A_0025" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33900.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ89" + /translation="MMKSSKLLALAGVTLL" +ORIGIN + 1 tgtccatgaa gagcaagact tgacagtaga aggaaaagtc aaatctgtct tgattgaaaa + 61 cactgcggct aaagaagtac ttgaaaaaca ggtcttggct ccatgggatg ctttctgtgt + 121 ggaattacta taaatatttt ttgcagaaaa atttaaaatt gaaatcatgt aaaaacaagg + 181 gaggactgta taaaagacag aaatcctttg ttttttataa ccaaggttta taaactttca + 241 ttctcgaaat tcaattaact ttacaaattc ccactatttg cttggtggtt 
tagctctcct + 301 gttttctctt ttagctttaa ccagccataa atggtattac gtgagatttg gaaaacgtgt + 361 gatgcttctg ttatactacc tgttcgctca caataagaga gaactttttt acgaaaatct + 421 attggatatg ccataagaag attataccac attgtgtact atattgtatt gaaactagaa + 481 tagtacacct ctgcttctaa aacattgtta gaaatcgatt tgactgttct gaacgttttg + 541 tcctggtctt atttcatttt actatatttt tggttcgcgg gaagtctact aagatactta + 601 aagatgcaga tagtgaaaat aaaggttgaa agttctataa tgaagttagc caccttacct + 661 tagtcaagaa ttagatgttt cactatgttt gagtaagttg atgatttcat ttgataacag + 721 gtttgaaact gttaggctag gtggccaagg ctaatcatag ccttggttta gctgaaaaaa + 781 caggttcaag ggttcctgtt gtcaaatgaa atgtgattta aggtataaga aaacacctct + 841 gtgctatact tgttgttcac cacaaacaca aggaaaggca cagagatgca agaacattat + 901 accccaaaag ggaaacattt gacaatagat aaccgtcgct tgattgagcg gtggaagaat + 961 gaaaataagt ccaatcgtga aattgcaggc ttgttaggaa aggcgcctca aacgattcat + 1021 actgaagtca aaagaggtac aactttacaa caagtgagaa aagggctata caaaaaggtc + 1081 tattctgccg attacgcaca aactgtttac caattcaatc gaaaacggtc ggtgaaaaag + 1141 ttaattttaa caaaggaaat cagagagaag atcttacact atcataagca aaaattttcg + 1201 cctgaaatga tggttaacaa gaagcaagtg aaagttggta tttcaaccat ctactactgg + 1261 tttcataatg gtcatttagg attgacgaag gccgacatgc tttatcccag aaaaaggaaa + 1321 ggtgtcaaga agcaagctag tccgaacttt aagccggcag gtaaatctat cgaagaacgt + 1381 cctgacgtta ttaatcttcg cttggaaaat ggtcattatg aaattgatac cgtcctactg + 1441 actaagataa aaaattattg cctgttagtc ttaaccgacc ggcggagcag acaccaaatt + 1501 ataaggttaa ttccaaataa aactgctgaa tctgtcaatc aggcgcttac gttactatta + 1561 ggggagcatc gtattctgtc cattactgca gataatggtt cggagttcaa acgattgtct + 1621 gaggtatttc ctgaggaaca tatctactac gcacatgctt actcttcatg ggagagaggt + 1681 tcaaatgaaa atcataatcg attaattcgg agatggttac ctaaaggaac caagaaaacg + 1741 actccgaaag aagtagcttt tatcgaaaat tggattaaca actaccctaa aaaatgcttg + 1801 gactacaagt cgccaagtga atttcttttg ggtggctaac ttcaacttga aatttgggat + 1861 gaaaataaag gtgtagacat taccgtaaaa aagtgatata atcgaatgat gttgaatgta + 1921 taggtgttaa tcatgagtag 
acgttttaaa aaatcacgtt cacagaaagt gaagcgaagt + 1981 gttaatatag ttttgctgac tatttattta ttgttagttt gttttttatt gttcttaatc + 2041 tttaagtaca atatccttgc ttttagatat cttaatctag tggtaactgc gttagttcta + 2101 ctagttgcct tggtagggct actcttgatt atctataaaa aagctgaaaa gtttactatt + 2161 tttctgttgg tgttctctat ccttgtcagc tctgtgtcgc tctttgcagt acagcagttt + 2221 gttggactga ccaatcgttt aaatgcgact tctaattact cagaatattc aatctgtgtc + 2281 gctgttttag cagatagtga tatcgaaaat gttacgcaac tgacgagtgt gacagcaccg + 2341 actgggactg ataatgaaaa tgttcaaaaa ctactagctg atatcaagtc aagtcagaat + 2401 accgatttga cggtcgacca gagttcgtct tacttggcag cttacaagag tttgattgca + 2461 ggggagacca aggccattgt cttaaatagt gtctttgaaa atatcatcga gtcagagtat + 2521 ccagactacg catcgaagat aaaaaagatt tataccaagg gattcactaa aaaagtagaa + 2581 gctcctaaga cgtctaagaa tcagtctttc aatatctatg ttagtggaat tgacacctat + 2641 ggtcctatta gttcggtgtc gcgatcagat gtcaatatcc tgatgactgt caatcgagat + 2701 accaagaaaa tcctcttgac cacaacacca cgtgatgcct atgtaccaat cgcagatggt + 2761 ggaaataatc aaaaagataa attaacccat gcgggcattt atggagttga ttcgtccatt + 2821 cacaccttag aaaatctcta tggagtggat atcaattact atgtgcgatt gaacttcact + 2881 tctttcttga aaatgattga cttattggga ggggtagatg ttcataatga tcaagaattt + 2941 actgcccata cgaatggaaa gtattaccct gcaggcaatg ttcatcttga ctcagaacag + 3001 gctctcggtt ttgtacgtga acgctactca ctagccgatg gagaccgtga ccgtggtcgc + 3061 aaccaacaaa aggtcattgt agcaattatt aagaagttaa cttctacaga ggttttgaaa + 3121 aactatagta gtattcttca aggattgcag gattctcttc aaacaaatat gccgattgag + 3181 actatgatag atttagtgaa tactcagttg gaaagtgggg ggaattataa agtaaattct + 3241 caagatttaa aagggacagg tcggatggat cttccttctt atgcaatgcc agacagtaac + 3301 ctctatgtga tggaaataga tgatagtagt ttagctgtag ttaaagcagc tatacaggat + 3361 gtgatggagg gtagatgaaa tgatagacat ccattcgcat atcgtttttg atgtagatga + 3421 cggtcccaag tcaagagagg aaagcaaggc tctcttggca gaagcctaca gacagggggt + 3481 gcgaaccatt gtctctacct ctcaccgtcg caagggcatg tttgaaactc cggaagagaa + 3541 gatagcagaa aactttcttc aggttcggga aattgcaaaa 
gaagtagcag atgatttagt + 3601 cattgcttat ggcgcagaga tatactatac tctggatgct ctagaaaagc tagaaaaaaa + 3661 agaaattcct acccttaatg atagtcgtta tgccttgatt gagtttagca tgcatacttc + 3721 ctatcgtcag attcatacgg gattgagcaa tattttgatg ttgggaatta ctccagtcat + 3781 tgcccacatc gagcgctatg atgctcttga aaataatgaa aaacgcgttc gggaactgat + 3841 tgatatggga tgctatactc agataaatag ttatcatgtt ttaaaaccta agctctttgg + 3901 tgaaagatat aaatttatga aaaagagagc tcggtatttt ttggaacgtg atttagttca + 3961 tgtagttgca agtgatatgc acaatttaga cagtagacct ccatatatgc aacaggcata + 4021 tgatatcatt gctaagaaat atggagcgaa aaaagcgaaa gaactttttg tagataatcc + 4081 cagaaaaatt ataatggatc aattaattta ggagaaaata tgcaagatca aaacactttg + 4141 gaaatcgatg tatttcaact attcagagct ttatggaaaa gaaagttggt cattttatta + 4201 gtggcaatta taacttcttc agttgctttt gcctacagta cttttattat caaacctgag + 4261 tttactagta cgactcggat ttatgtagtt aaccgtaatc aggaagagaa gtctggttta + 4321 accaatcaag acttgcaggc aggatcatac ttggttaaag actatcgtga aattatccta + 4381 tcgcaggatg ttttggagga agttgtttct gatttgaaac tagatttgac gccaaaaggt + 4441 ttggctaata aaattaaagt gacagtacca gttgataccc gtattgtctc tatttcagtt + 4501 aatgatcgag ttcctgaaga ggcaagtcgt atcgctaact ctttgagaga agtagctgct + 4561 caaaaaatta tcagtatcac tcgtgtttct gatgtgacaa cactggagga ggcaagaccg + 4621 gcgatatcgc cgtcttcgcc aaatattaaa cgcaatacac taattggttt tttggcaggg + 4681 gtgattggaa ctagtgttat agttcttctt cttgaacttt tggacactcg tgtgaaacgt + 4741 ccggaagata tcgaaaatac attgcagatg acacttttgg gagttgtacc aaacttgaat + 4801 aagttgaaat aggagagaag gatgccgaca ttagaaatag cacaaaaaaa actggagttc + 4861 attaagaagg cagaagaata ttacaatgcc ttgtgtacaa atatacagtt gagcggagat + 4921 aaactaaaag taatttccgt tacttctgtt aaccctgggg aaggaaaaac aactacttct + 4981 gtaaatatag catggtcgtt tgcgcgtgca ggctataaaa ctcttttgat cgatggtgat + 5041 actcgaaatt cagttatgtc aggagttttt aaatctcgtg aaaaaattac agggctaaca + 5101 gaatttttat ctgggacagc tgatttatct catggtttat gtgatacaaa tattgaaaat + 5161 ttatttgtag ttcaatcggg aactgtaaca ccaaacccta cagccttgtt acaaagtaaa + 5221 
aattttaatg atatgattga aacattgcgt aaatattttg attatatcat tgttgataca + 5281 ccacctattg gaattgttat tgatgcggca attatcactc aaaagtgtga tgcgtctatc + 5341 ttgataacag caacaggtga ggcgaataaa cgtgatgtcc aaaaagcgaa acaacaatta + 5401 gaacaaacag ggaaactgtt cctgggagtt gttttaaata aattggatat ctcggttgat + 5461 aagtatggag tttacggttc ctatggaaat tatggtaaaa aataacttag aaaagatttt + 5521 atggatgaaa aaggattgaa aatttttctg gcagtattac agagtattat tgtcatttta + 5581 ttggtttatt ttcttagctt tgttagagag acagaagttg aacgttcttc gatggttata + 5641 ctataccttc tccacttttt tgtattctat tttagttcct atggtaacaa tttttttaaa + 5701 agagggcacc tagttgagtt taatagtact ataagatata tttttttctt tgcaatagct + 5761 ataagtgtat taaacttttt tatagcggaa cggtttagta tctctagaag aggaatggta + 5821 tacttcttaa ctttagaagg aatatcctta tacttgttaa atttcttagt aaaaaaatat + 5881 tggaagcatg tgttttttaa tctaaaaaat agcaagaaaa ttttactgtt aacagtaacg + 5941 aaaaatatgg aaaaagttct tgataaattg ctagaatctg atgaactttc atggaaattg + 6001 gtagcagtaa gtgttttgga taaatctgat tttcaacatg ataaaatacc tgtaattgaa + 6061 aaggaaaaaa ttattgaatt tgcaacgcat gaagttgtgg atgaggtgtt tgtcaatctt + 6121 ccaggagaga gctacgatgt tggagaaatt atctctaggt ttgagacaat ggggatagat + 6181 gtaactgtaa atcttaaagc atttgataag aatttgggtc gcaataaaca aattcatgag + 6241 atggtgggat tgaatgtagt cactttctct acaaattttt ataaaactag tcatgtgatt + 6301 tcaaagagaa ttctcgatat ttgtggtgcc actattggcc ttattctttt tgctatagct + 6361 agtctagttt tagttccatt gattcgtaaa gatggcggac cagctatttt tgctcaaact + 6421 cgtataggga aaaatggtcg acattttacc ttttataaat tccgttcgat gcggatcgat + 6481 gctgaagcta tcaaagaaca gttgatggat caaaatacga tgcaaggtgg tatgtttaag + 6541 atagacaatg atcctcgtgt tacaaaaatt ggtcgcttta ttcgtaaaac cagtttggat + 6601 gaattgccgc agttttggaa tgtctttata ggagatatga gtttggtggg aacacgtcca + 6661 cctacagtag acgagtatga tcagtatact ccagaacaga aacgtcgact cagctttaaa + 6721 cctggtatta caggtttatg gcaggttagc ggccgtagta aaataaccga ttttgacgat + 6781 gttgtaaaat tagatgtggc ttatattgat aattggacaa tctggaaaga tattgaaatt + 6841 ttgcttaaaa ctgttaaagt 
tgtatttatg agagatggag cgaagtaatt tctgtatatc + 6901 catcatatta ggagagaaat gaaaaagtca gtttatatca ttggttcaaa aggaattcct + 6961 gctaagtatg gaggatttga aacttttgtt gaaaaattaa cagccttcca acaagataag + 7021 gctatccaat attatgtggc ttgtatgcgt gaaaactctg caaaatcagg gactactgag + 7081 gatgtttttg aacataatgg tgctatctgt tataacgtcg atgttcctaa tattggtcca + 7141 gcgcgagcca tagtatatga tatcgcggca attaacagag ctattaaaat tgccaaagaa + 7201 aataaggatg aagatccaat cttctatatt ctagcttgtc gaatcggtcc gttcatccat + 7261 ggaattaaga aaaaaatcca ggcgataggt gggactcttc tagttaatcc agatggtcac + 7321 gagtggttac gagctaagtg gagcgctcca gttcgtcgtt attggaaaat ttccgaaggt + 7381 cttatggtca aacatgcaga tcttttagtg tgtgatagta agaatattga aaaatatatc + 7441 caagaagatt ataaacagta tcaacctaag acaacctata tcgcttatgg gactgataca + 7501 acacgctcca tattaaagag tagtgacgaa aaagtacgtt cttggttcaa agagaagaat + 7561 gtttctgaga acgagtatta tctagttgta ggacgttttg taccagaaaa caactatgaa + 7621 tctatgattc gtggcttttt ggcatctaac tctaagaagg actttgtctt aatcacaaat + 7681 gtagaacaga ataaatttta taatcagttg ttggcaaaaa ctggttttga taaggaccca + 7741 cgagtaaaat ttgtaggtac agtctatgag caagagcttc ttaaatatat tcgtgaaaac + 7801 gcctttgctt acttccacgg gcatgaagtt ggtggaacca atccttcact tttagaagct + 7861 ctggcatcaa ctaaactgaa tttattgcta gatgttggct ttaaccgaga agttggggag + 7921 caaagtgcga tttattggaa aaaagatgag ctttcccaag taatcgagaa agttgaacaa + 7981 tttgatgcaa aaatgattga tgagttagat agacaatcaa atcagagaat tgcggattct + 8041 ttcacttggg aaaagattgt cacagactac gagaaagtat ttaaaggtta gagttaatgg + 8101 cagtaaaatt aaaatatgat aaatcagata ttacattttt agatgatgac gaattgaaaa + 8161 aataccaatc agaattgttg aaaatgatat cagatgtgtt tacttttttt gatgaaaata + 8221 ggatagcgta ttctttaagt ggaggtagca ttttaggggc aatccgtcat aaaggcttta + 8281 tcccttggga tgatgatgtt gatatcaata ttccgaggga aagttacgat aaactatttt + 8341 ctctatttga gttagacaat agtcttagtc gtaaatatta tcttcaatca gcaaaaagtc + 8401 atccagaatt gggacttcat gtttctcaaa ttagaaaaaa aggaacagtt gctcgtagga + 8461 aatacgatca ttcggctgag gagtgcggta tttctataga 
tctttacatt gtagaaaatg + 8521 tatacaataa tccagtgaaa cgattctttc aaggttatac aagtatgttt ttgacttttg + 8581 ccttggcttc tgtacgagaa acaaagaatc atgccctgat gaaggaaatg tttagactgg + 8641 aaggtagaaa actaaattat tcagctggaa agttaatggt tggttggttt tttggaatta + 8701 ttccaattga aaagtggttg aattggcttg ataaatgtaa ttcaagctgt aaggattcac + 8761 atacaaaata tgtatccata cctacaggaa ggaaacactt tagacgcgag acttacttgc + 8821 gagagaatat gaatatttat aaaaaggttc cttttgaaac tttgatggtg aatgttcctg + 8881 tttggtcaga agagtattta gaaatgtttt acggtaaaga ttatatggtc gttcctcctg + 8941 ttgataagag agagcaacat ttgtttttag aattgagtta cggagaagaa tagatgaaag + 9001 tagcgatttt aacagcttca ggcattggaa gccgaattgg tcaagatatc cctaaacaat + 9061 ttattcatgt tgaaaataag ccagtcatta tctataccct tgaaaaattt caaaatcatc + 9121 cagaaattga tgaaatctgt attgttattt taaaaggctg ggatcagatg gttaaagctt + 9181 atgcggaaca atttggaatt acaaagttaa agatgataac ttttgggggg aagtctggtc + 9241 aagaatcaat ttataacggt cttagagaag ttaagaaagc tcatcccaat gatgatgtga + 9301 ctgtattaat tcatgacggg aatcgtcctt tagtgagcaa tgatattatt agcaacgctt + 9361 tagcaacata ccaacagttt ggaaatgctg ttgcagcgat accaacgact gaggtagtat + 9421 ttgttttaga aaacccacaa tcaacttcgt ccacagaagc attgaatcgt gacttgttga + 9481 gacgaacaca aactcctcat gtttaccatc ttgataatat tctatcgctt catgaaaaag + 9541 cattagaaaa tgggataact gatgttgcag catcatgcca actcatgcaa ctatttggtg + 9601 aaaagagtta tttctctctt ggaacagaga aaaacttgaa aattacgact gtagaagatc + 9661 tcgatatttt taaagcctta ttgagttcaa ctcgagataa gtggattaaa tagtaatgac + 9721 attattatta aataaaatat atagacaaga tgtagaatct tctctagaaa caatcgtcaa + 9781 tattaatgac ttgaatggca agtcaatttt aattactgga gcttctggtt tgattggttc + 9841 aagtgtcatt gaccagttat tattgctaaa tgaaataagg aattttaaca ttaaaatttt + 9901 ttgttgtgga agagagtttg aatcattaga aaaacgattt ggtagacaaa cagagtattt + 9961 acactttgtg ttctatgatg cgactaaagc acctcacttt gattttgcag tggactacat + 10021 tattcatgct gctagtcctg ctagtcctga attatacgtt aatcagcctg tagaaacaat + 10081 ggctagtaat tttctgggca tgtataatct actggaatac gccaaaaatg ctaaagtttc + 
10141 aaatctagtt tatatctcat ctagtgaagt ttatggaatt agcactagta ataatccttt + 10201 ggacgaaaat tatattggaa ctgttgatca tcttagcgta cggtcttctt atgccaattc + 10261 aaaaagagct actgaaacac tttgtgttag ttttgcttcc gagtatggaa tcaaaataat + 10321 gatagtaagg ccaggacata tctatggtcc tagtgccaag gactctgata atcgtgtatc + 10381 atcatttttt atgacagaag cgattgctgg gcgtgatatt gtcataaaaa gtacaggtag + 10441 tcagttaaga tcctattgtt atagtttgga ttgtgccagt gcaattctaa gtgttcttct + 10501 ttcgggtgga tcaggacaag cttataatgt ttccaatcca aattcaatta ttactataaa + 10561 acagatggca acttgcattg cagatgcttc aggagtcaga gttctttatg atatacctat + 10621 aactcaagag cgaaagcagg aaaatcctat ggtaaatgca agcttagata gtgagaaaat + 10681 tgagtccttg ggatggtcag gtctattttc agctgaagta ggcttccatc acacatttag + 10741 tattttaaag gagttatcaa gtgaaaaatg atagtatttt aatcatgatg acaacataca + 10801 atggagaaga atttatacgt gaacagttgg agagtattct ttttcaaacc attacagcat + 10861 ggaaactata gattcgtgat gacaattcta gtgatcaaat aagagcaatt attaaagaat + 10921 acgaagaaaa agatagtcaa tttttgatat aagctatcca agaggatttt ggagaagttt + 10981 ttttattgaa gagtggcctt aagaaggtct tctaggctta atttaggttt tcgtccacct + 11041 tttgcgtgtt taagttgata agctgttttt aatacagcta acatctcttc aaaaatggta + 11101 cgctgaacgt caacaagacg cttaaatcgt acatcagtta gttgtttact tgcttcataa + 11161 ttcatagaac tattatacca tattttattt cgcaggaaat ctattgaaaa aacgacacta + 11221 tagtatcaat ggggatgtta gggctatatg ttaaaaacat gcgagagtat cttttgttat + 11281 gaatgttatg agagtacata gaaagataga gattccactg atggaatttt atagagaagg + 11341 gaaaactgta tttatttgga tatattgaac tccgtggaat ggattgatta gggtatgtac + 11401 atatggtaaa tggatgtaac cctcaaacag aacacggatg gagtacacat ttgctaatta + 11461 cagagattca ttgaaaaata ttagagtttc aaataggaaa agtaatgatt gacggagatt + 11521 ttatgaatag aagacttgta ataaaaaaga aaagtataat gtttttcatg cttatgttat + 11581 gtgttacggc attttatggg acaaattatt ggtatacaaa tatctatata tatgatttta + 11641 tgcttataac atcatgctta ttatcaataa tagtatttgt atgtaatggt attagaattg + 11701 ataaaacata ttataaaggg acaataatac tgggtattgt aatgtggttt tcaggactta + 
11761 ttgctgcaca aggaaaaggg ctccctgcta ttgtaatctt taaagagagt ttatatacta + 11821 ttactccaat aatgatattt ttagctttcc gacctatgat aaagtcaata aaagacactt + 11881 cattattcct tcgtactatt tctgctgctg gtgttatatg taatttaatt gcttgtattg + 11941 aaatgttctt tgccaaaaga ggatttgatt ttctaaatat aagtgtattt gaaaaactta + 12001 gaaatggtac tcctagattt ataattggag aaacaataat agttcttagt ttttttatct + 12061 cctgtagtgt tgtttttagt aaagggggaa agagaaatag acgcattttc catgttctaa + 12121 atatagctct cacagctata aatttagtgt atattattaa aacaaggaca cttaatttat + 12181 atattttatc aacacttatg atgatgcctg ttttaaaaaa aaatgtaaag aaacaactta + 12241 agttttggat tgtgtttttg atatctataa ttcttacctt tgtttctgca gaatatttta + 12301 ttccaatagt caaaaattta attcatagtg atcatgggat tcaaattaga ttcttgacga + 12361 tagaatacta tatagagtat tttaaaaatc attacttact tggagcggga tatatttctt + 12421 ctagtccata ttttgaaact tattctattg ttaccggtcc attaggacgt tattatccaa + 12481 gtgatgtagg tctgattgga cttatgttta gaagtgggat tatcgggcta atttggttaa + 12541 taagttggtt ttatacaagc ctgaagataa ttaaagataa tacgattaga attccagctc + 12601 attatgactt attaatgaag ctagttatag tttttttgat gttttcttgt attaatttga + 12661 taatcactga tgcacctaga ttcccatata ttgcattagc tatgttactt tttgaatcaa + 12721 gttatacctt gagttatgaa aacagttcta attagaatgt atctcagata gttattttaa + 12781 aggatgaggg gaaatgatta agagattagc aatacttatg gccacatata atggcgaaaa + 12841 atatataaaa gagcaaattg aaagtattct caaccaagat acagattttg attttactct + 12901 aattattaga gatgacggtt caacagataa tactaaaaat ataattagag aatatgttga + 12961 tagtgggaaa attattttta tagaaggcca gaataaaggg gcagcaagag gatttatttc + 13021 tttgttatgt gataatccgg gatatgatta ctatgctttc tcggatcaag atgatgtttg + 13081 gaatcataat aaattacaga aaggtatatg gagtctttcc aaatatactg ggccagcact + 13141 ttattgttct aattgtgaat tagttgattc agagttaaat agtataggtc gtaatacaca + 13201 taggaagaga ccgaactata ctcttgaatc tattctttgt cttgctagtt gtgcacaagg + 13261 atgtacatct gtatttaata aagagctagc ttcgataatt caggagaatg atgtgcctga + 13321 tacttttatt atgcatgatt ctttgattac ttgtttatgt gcactgatag gtggaaagat + 
13381 aatttacgac gaaattccat caatgaaata tagaatgcat gatgataata tatttggaat + 13441 ggtgtcagct aagcaaaatg tactaaatgt tataaaagat cgtattagtg aaataacaaa + 13501 aaagcgaacg attagtatgt acgatcaagc agagtgttta ctaaaggttt ataaaaaata + 13561 tatagattct aacaatcaag atatatgtag aattgttatt gattctaaag tatcgctaaa + 13621 ggcaagactt aagctgattt ttaataaaaa tttgcagcat actacattaa ataaaaccat + 13681 aacaaaaaaa ttagagatat tatttggcaa tgactaataa aggagtttag atatgaagta + 13741 tcaactcatt gtatcaacaa tgaatcaaca ggataacagt ctgatagaga aaatgaatat + 13801 aaaatctgat gcaattatca ttaatcaatc aaactcattt tcttaccatg agacgaaatt + 13861 gaaaaattcg attgtaaaat ggtatgaatt caatgaaaga ggtattggtt taagtcgaaa + 13921 cacaggtttc atgagatcgg atgctgatat tattcaattt gctgatgacg atatgatttt + 13981 tacagataca tattacgaag acgtattatt agaatatcaa aaacatccag aagctgatgt + 14041 aattcttttt tcgaataaat gtcttaatga agatcgaatg ccttatcagg ttaataattt + 14101 tggacgtata aataggtttg aaggtgttaa gtttggtggt gctagaatta cagccaggag + 14161 agaaaagata ttgcataata acataacgtt ttctctttta tttggggggg gagcaaaata + 14221 cggtgcagga gaggacgtaa catttattca ggactgtatc aaggcaggat tacgggtata + 14281 taaatcacct attattgttt ctacaatgaa acaagattct tctacatggt ttaaaggata + 14341 tgatagaaaa tattataaag ataaaggtgc tttattagca gcaaatttcc cttctataag + 14401 tgaggtagga gtatatatac aagctttcaa aaataggggg gggatttata catttagtga + 14461 attacttaga ttttataagg aaggtattaa cgaatttaaa ataaatagat gataggttga + 14521 tatgatgagg aggtttttga ttatgccaag aaataaagtt tacaatactg gcgagacaga + 14581 cattgagttg aaaaataaat acaattatga aggtagtgag ttgaggaaag ctcaagttcg + 14641 tatgattgat atgctttctt ttttgaatga tatatgcaaa gaaaataaca tcacctattt + 14701 cattgctttt ggaactctat taggagctat tagacatgga ggctttattc catgggatga + 14761 tgatcttgat atttatatta atgataaagg tttaaaaaaa cttagaaaaa taattaacaa + 14821 tggaaactat ccctatgtta ttcaagacta ttctagtgat aaaggatttg tgaggtatta + 14881 tagtgttctc agagatacta actctgaata tataaaagat gaatatcaac ataatcagcg + 14941 caaatacaga ggtgtacaaa ttgatttatt cccttatggt tatggtgtaa tgaaatgggg + 
15001 cgaacgtctt attggaaaaa catatggttt taatgaaaaa atatttttag ggaaaaataa + 15061 aatgttgaca gcattaattt tttatttaac taaagaagtt ataattccat ttctgaaagt + 15121 aattagtaag attaacggaa gaaagaaagt gggacttgga tatgagactg gtgatcctgg + 15181 atactattat aattcctatg atgtatttcc gcttaaaact atagattttg aagggcttgt + 15241 tgttccttgt ccaaataatc ctgggcttgt attagaagtt gattatggac ctgactacat + 15301 ggagctacca aatgaaactc agagagatca ccacaagata cgtaatatcc atttttatga + 15361 ttaaaaatgt attgtcgtca tcatagttac ctttgaacta gaaatggaga tgtcatgaat + 15421 ataggaaagc aacgttcagt gaggaaaaat gcaattttga gtgtaataaa acaattgttt + 15481 acgcttctct ttccaatgat tacatttcca tatgcgactc aaatacttgg agttgctaat + 15541 tatgggaagt atacatttag tatgtctgtt gtaaattaca tctcttatat agcagctgcg + 15601 ggtattttac gatatgctgt gcgagagtgt gcacgtgtaa gagatgataa agaggcattg + 15661 cataaattag tcaatgaaat atatacaatc aacataataa ctacgatgtt tgcgtatctt + 15721 ttgctgtttg tagttctaac tttcgttccc ctgttagagg agtatatatc ttggataatt + 15781 ttgttaagtt tatctgtttt atttacgact ataggtacag attggattaa tagtgcattt + 15841 gaagactatt tatttataac gataagatat attattagtc agatatttgc tctttttctg + 15901 ttgtttttac tggttagaga acaagacaat attactcaat atgcatttgt aagtattttt + 15961 gctgggatat tagcaaatat tttaaatatt gtccatatta gaaaaacttt ggggatagtt + 16021 cctcgtttaa tgtattctag gcaattgttt agtcatatta agccgatatt atatctattt + 16081 gcgtctacta ttgcgacttt catttatatc aattcagatg ttacattttt acgaatttat + 16141 gcagatgaca cttccgtagg ttattatggt gtatcaactc aattttatca attaattaag + 16201 caattgataa atgctgcttt tattgttgtc gtcccaagaa tttcaaatga attgactaaa + 16261 gagaaatctt tagcctatag tcggtatagt aaaattctag taattactat tctattagta + 16321 attccatgtg ctgctggttt atttatgata agacataatt tagtgatact attttcaggt + 16381 gaggaatatg taaaagcagc ctcttctctt gcgattttag cagttgcatt aattccagca + 16441 atgatagcaa atttttttat taatatagtt atgattccac tcggaatgga aaaacaagta + 16501 atgattgcta ctataattag tgctttagtt aatattgggt tgaattttgt attaattcct + 16561 agatttgcgg aaaatgcggc agcgtttaca acattgaatg ctgaaattat tttgatatta + 
16621 attgctatgt tttattgtag agatataaaa ttaaagagtg ttactaagcc aattgctacc + 16681 agtatagttg gaagtggagt tattattttt atttgttccg tattaaacaa aaatgtgagt + 16741 aattactttg tcaatgttgt attatgttta atggtatgcg gaatacttta ctctgtagta + 16801 atactatttt tttataaaac agaattaaag agaattatta aagaaattaa atgaaaaaat + 16861 tgaatactac ttttcaagta gaacttatat acaattaaaa gtaatttact ctaaaataac + 16921 aaagaaaggt accctactat gaaaggtatt attctagcag gtggttcggg gacacgttta + 16981 tatcctttga ctcgcgctgc atcaaaacaa ctgatgccgg tttatgataa accgatgatt + 17041 tactacccac tttcaacatt gatgttggct gggattaggg atattttgat tatttccact + 17101 ccacaggatt tacatcgatt tcaagagctt cttcaagacg gatctgagtt tgggatcaaa + 17161 ctttcttatg cagagcaacc aagtccagat ggtttggcac aagcctttat cattggggaa + 17221 gagtttattt ctgatgatag cgttgcgcta atcttaggtg ataatatcta ccatggttct + 17281 gggctttcca agatgctaca aaaggcagcg agtaaggagt cgggagcaac tgtttttggc + 17341 taccatgtca aggatccaga gcgctttggt gtggttgagt ttgatcagga tatgaaggct + 17401 atttctattg aagaaaagcc agagcaacct cgttcaaact atgcagttac aggtctctat + 17461 ttctatgata atgatgtagt agagattgcc aagagtatta aaccaagtcc tcgtggtgaa + 17521 ctggaaatta cagatgtaaa caaagcttac ctagatcgtg gtgatttgtc tgttgagctt + 17581 atgggacgtg gctttgcttg gctggatact ggaactcatg aaagtttact agaggcttca + 17641 cagtacatcg aaacagtgca acggatgcaa aatgttcagg tagcaaactt agaagaaatt + 17701 gcctatcgca tgggttatat cagtcgtgaa gatgtattga ccttagccca accacttaag + 17761 aaaaatgaat acggacagta tctgctccgt ttgattggag aagcatagat gacagataat + 17821 tttttcggta agacgcttgc ggcacgcaag gttgaagcta ttccaggcat gttggagttt + 17881 gatatccccg ttcatggaga taatcgtggc tggtttaaag aaaatttcca aaaggaaaaa + 17941 atgcttccgc ttggatttcc agagtctttc tttgcagaag gaaaattgca aaacaatgta + 18001 tccttctcac gtaaaaatgt ccttcgaggc ctccacgcag agccttggga taagtacatc + 18061 tctgtagcag atggagggaa agttctgggt tcttgggttg atctacgcga gggtgaaacc + 18121 tttgggaata cctatcagac agtgattgat gcgagtaagg gaatctttgt tcctcgaggc + 18181 gtagctaatg gcttccaagt tttatcagat acagtgtcat atagctatct ggtcaatgat + 
18241 tactgggcgc ttgaactcaa acccaagtat gcctttgtga actacgctga tccaagcctt + 18301 ggtattgaat gggaaaatat tgcagaagca gaggtttcag aagcagataa aaatcatcca + 18361 ctacttaagg atgtaaaacc tttgaaaaaa gaagatttgt aaaaaggaaa gaatatgact + 18421 gaatacaaaa atattatcgt gacaggtgga gctggcttta tcggttctaa ctttgtccat + 18481 tatgtttacg agaactttcc agatgttcat gtgacagtcc tagataagtt gacttatgct + 18541 ggaaaccgcg cgaatattga ggaaatttta ggtaatcgtg ttgagttagt tgttggtgac + 18601 attgctgatg cggagttggt agacaagttg gctgctcaag cagatgctat cgttcattat + 18661 gcagcggaaa gccacaatga taattcgctc aatgatccat cgccatttat tcatactaac + 18721 ttcatcggaa cctatactct tttagaagct gctcgtaagt atgatattcg cttccaccat + 18781 gtatcgacag atgaagttta tggggatctc cctttacgcg aagatttgcc aggtcatggt + 18841 gaaggaccag gtgagaaatt tactgctgaa acaaaataca acccaagctc tccgtactca + 18901 tcaaccaagg ccgcatcaga cttgattgtc aaagcctggg tgcgttcttt tggagtcaag + 18961 gcaacgattt ccaactgttc aaataactac ggtccttatc aacatatcga aaaattcatc + 19021 ccacgtcaga ttactaacat cctaagtgga attaagccaa aactttacgg tgaaggtaag + 19081 aacgttcgtg actggattca taccaatgac cattcttcag gagtttggac aatcttgaca + 19141 aaagggcaaa tcggtgaaac ctacttgatt ggggctgatg gtgagaagaa caataaggaa + 19201 gttttggaac ttatccttaa ggaaatggga caagctgcgg atgcctatga tcatgtgact + 19261 gaccgtgcag gacatgacct tcgctatgcg attgatgcta gcaagctccg tgatgagttg + 19321 gggtggaaac ctgaatttac caactttgaa gctgggctca aggcaacaat caagtggtat + 19381 acagataacc aagaatggtg gaaagcagaa aaagaagctg ttgaagccaa ttatgctaag + 19441 actcaggaga ttattacagt ataaaaagca ggaaatagct gctttttatt gctatattgg + 19501 gaagagttac atattagaaa ggtctagaga tgattttaat tacaggggca aatggccaat + 19561 taggaacgga acttcgctat ttattggatg aacgtaatga agaatacgtg gcagtagatg + 19621 tggctgagat ggacattacc gatgcagaaa tggttgagaa agtttttgaa gaggtgaaac + 19681 cgactttagt ctaccactgt gcagcctaca ccgctgttga tgcagcagag gatgaaggaa + 19741 aagagttgga cttcgccatc aatgtgacgg ggacaaaaaa tgtcgcaaaa gcatctgaaa + 19801 agcatggtgc aactctagtt tatatttcta cggactatgt ctttgacggt aagaaaccag + 
19861 ttggacaaga gtgggaagtt gatgaccgac cagatccaca gacagaatat gggcgtacta + 19921 agcgtatggg ggaagagtta gttgagaagc atgtgtctaa tttctatatt atccgtactg + 19981 cctgggtatt tggaaattat ggcaaaaact tcgtttttac catgcaaaat cttgcgaaaa + 20041 ctcataagac tttaacagtt gtaaatgacc agtacggtcg tccgacttgg actcgtacct + 20101 tggctgagtt catgacctac ctagctgaaa atcgtaagga atttggttat tatcatttgt + 20161 caaatgatgc gacagaagac acaacatggt atgattttgc agttgaaatt ttgaaagata + 20221 cagatgtcga agtcaagcca gtagattcca gtcaatttcc agccaaagct aaacgtccgc + 20281 taaactcaac gatgagcctg gccaaagcca aagctactgg atttgttatt ccaacttggc + 20341 aagatgcatt gcaagaattt tacaaacaag aagtgagata agtagtagaa tgattttcta + 20401 gtctaataaa agaggcagat aatgaactcc aaaggagctt aagatataca attatcttgt + 20461 tgttggtgct ggtctctttg gtgcagtctt tgcccatgaa gcggccttaa aaggaaaaaa + 20521 agtaaaagtt attgaaaaac gaaatcatat cgcgggtaat atctatactc gtgaagagga + 20581 aggaattcaa gtttatcaat atggtgctca tatcttccat acttctgata aggagatctg + 20641 ggattatgta aatcagtttg cagagtttaa ccgttacata aattctcctg ttgcaaacta + 20701 taagggtgag atttataacc ttccttttaa tatgaatact ttcaataaac tctggggagt + 20761 tgtaacgcca gcagaagcac aagctaagat tgatgaacaa cgtgctattt taaatggtaa + 20821 aactcctgaa aatttggaag aacaggcgat ttctcttgta gctacagaca tctacgaaaa + 20881 attaatcaaa gactatacag agaaacagtg gggcaaacca actactgaac ttccatcctt + 20941 tattattgtt tgccagtacg cctgacctat gataacaact attttaacga tacctatcaa + 21001 gggattccaa ttggtggata cactcaaata gttgaaaaat gttggatcat gaaaatattg + 21061 atgtagaaac aaacgttgat ttctttgtga ataaagagca atatctgaaa gattttccta + 21121 agattgtctt tactggtatg attgatgaat tctttgacta taagttgggc gaactagagt + 21181 accgtagtct tcgttttgaa aatgagacct tggatatgga aaattaccaa ggaaatgcag + 21241 ttgtgaacta tacggatgca gaaaccccat atactcgcat tattgaacac aaacattttg + 21301 agtttgggag tcaagcaaag actatcatta ctaaagaaca ttctaaaaca tgggaaaaag + 21361 gtgatgagcc ttattatcca gttaataatg atcgtaataa tcatttgtat aaatcatata + 21421 aaaaacttgc tgatgagcaa gggaatgtta tctttggtgg ccgcttagga cactatcgtt + 
21481 attacgatat gcaccaagta attggagcag ctttgcagtg cgtgagaaat gagttaaatt + 21541 aatactcaat gaaaattaaa gagcaaacta ggaagctagc cacaggttgc tcaaaacact + 21601 gttttgaggt tgcagatgga agctgacgcg gtttgaagag attttcgaag agtataaaca + 21661 agtaaaactg actaccagtt attatttaga aatagtatta aaaattcctt gactatgtga + 21721 tatagttgag ggatttttaa atgatattca tattttttgc aaagatgttg tttgaaaaat + 21781 aattttcaaa aattctgaaa attctgttga catctttctg aaaagagtct ataatggaga + 21841 gaaagtttta aaggagaaaa tgatgaaaag ttcaaaacta cttgcccttg cgggcgtgac + 21901 attattg +// + diff --git a/public/res/serotype_genbank/serotype_24B.gb b/public/res/serotype_genbank/serotype_24B.gb new file mode 100644 index 0000000..0755438 --- /dev/null +++ b/public/res/serotype_genbank/serotype_24B.gb @@ -0,0 +1,1095 @@ +LOCUS CR931687 23976 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 2236/42 (serotype). +ACCESSION CR931687 +VERSION CR931687.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 23976) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 23976) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. 
For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..23976 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="2236/42" + /db_xref="taxon:1313" + gene <1..>151 + /gene="dexB" + /locus_tag="SPC24B_0001" + CDS <1..>151 + /gene="dexB" + /locus_tag="SPC24B_0001" + /codon_start=2 + /transl_table=11 + /protein_id="CAI33901.1" + /db_xref="GOA:Q4K0C5" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K0C5" + /translation="DRRFLVVANLSNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVP + WDAFCV" + gene 322..495 + /gene="aliB" + /locus_tag="SPC24B_0002" + /pseudo + CDS 322..495 + /gene="aliB" + /locus_tag="SPC24B_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + /db_xref="PSEUDO:CAI33902.1" + gene complement(order(511..1023,1025..1351)) + /gene="tnp" + /locus_tag="SPC24B_0003" + /pseudo + CDS complement(join(511..1023,1025..1351)) + /gene="tnp" + /locus_tag="SPC24B_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(join(961..1023,1025..1333)) + /gene="tnp" + /locus_tag="SPC24B_0003" + /note="HMMPfam hit to PF01710, Transposase, score 4.1e-23" + /pseudo + gene 1575..3029 + /gene="wzg" + /locus_tag="SPC24B_0004" + CDS 1575..3029 + /gene="wzg" + /locus_tag="SPC24B_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33904.1" + /db_xref="GOA:Q4K0C4" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K0C4" + /translation="MLIMSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNI + LAFRYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVLSILVSSVSLFAVQQFVGL + TNRLNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNT + DLTVNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKV + 
EAPKTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPI + ADGGNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVH + NDQEFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKL + TSTEALKNYSTIIDSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRMDL + PSYAMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1575..1700 + /gene="wzg" + /locus_tag="SPC24B_0004" + /note="Signal peptide predicted for SPC1258 by SignalP 2.0 + HMM (Signal peptide probability 0.991) with cleavage site + probability 0.537 between residues 42 and 43" + misc_feature 1788..2135 + /gene="wzg" + /locus_tag="SPC24B_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 3.2e-64" + misc_feature 2313..2756 + /gene="wzg" + /locus_tag="SPC24B_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 5.7e-70" + gene 3031..3762 + /gene="wzh" + /locus_tag="SPC24B_0005" + CDS 3031..3762 + /gene="wzh" + /locus_tag="SPC24B_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33905.1" + /db_xref="GOA:Q4K0C3" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K0C3" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLGKKRIPTLNDS + RYALIEFSMNTLYRDIHSALNKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRVQYFLERDLVHVVASDMHNLDSRPPYMQQAYDIIA + KKYGAKKAKELFVDNPRKIIMDQLI" + misc_feature 3034..3642 + /gene="wzh" + /locus_tag="SPC24B_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 4e-36" + gene 3771..4463 + /gene="wzd" + /locus_tag="SPC24B_0006" + CDS 3771..4463 + /gene="wzd" + /locus_tag="SPC24B_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33906.1" + /db_xref="GOA:Q4K0A1" + /db_xref="InterPro:IPR003856" + 
/db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K0A1" + /translation="MQDQNTLEIDVFQLFRALWKRKLVILLVAIITSSVAFAYSTFVI + KPEFTSTTRIYVVNRNQEEKSGLTNQDLQAGSYLVKDYREIILSQDVLEEVISDLKLD + LTPKGLANKIKVTVPVDTRIVSVSVNDRVPEEASRIANSLREVAAQKIISITRVSDVT + TLEEARPATSPSSPNIKRNTLIGFLAGGIGTSVIVLLLELLDTHVKRPEDIEDTLQMT + LLGVVPNLSKLK" + misc_feature 3789..4205 + /gene="wzd" + /locus_tag="SPC24B_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 4.9e-54" + misc_feature 4311..4388 + /gene="wzd" + /locus_tag="SPC24B_0006" + /note="PS00217 Sugar transport proteins signature 2." + gene 4473..5156 + /gene="wze" + /locus_tag="SPC24B_0007" + CDS 4473..5156 + /gene="wze" + /locus_tag="SPC24B_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33907.1" + /db_xref="GOA:Q4K0A0" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K0A0" + /translation="MPTLEIAQKKLEFIKKAEEYYNALCTNIQLSGDKLKVISVTSVN + PGEGKTTTSVNIARSFARAGYKTLLIDGDTRNSVISGVFKSREKITGLTEFLSGTADL + SHGLCDTNIENLFVIQSGSVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTPPIGIVI + DAAIITQKCDASILVTATGEANKRDVQKVKQQLEQTGKLFLGVVLNKLDISVDKYGVY + GSYGNYGKK" + gene 5172..6539 + /gene="wchA" + /locus_tag="SPC24B_0008" + CDS 5172..6539 + /gene="wchA" + /locus_tag="SPC24B_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI33908.1" + /db_xref="GOA:Q4K0C0" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K0C0" + /translation="MDEKGLKIFLAVLQSIIVILLVYFLSFVRETEVERSSMVILYLL + HFFVFYFSSYGNNFFKRGHLVEFNSTIRYIFFFAIAISVLNFFIAERFSISRRGMIYF + LTLEGISLYLLNFLVKKYWKHVFFNLKNSKKILLLTVTKNMEKVLDKLLESDELSWKL + VAVSVLDKSDFQHDKIPVIEKEKIIEFATHEVVDEVFVNLPGESYDVGEIISRFETMG + 
IDVTVNLKAFDKNLGRNKQIHEMVGLNVVTFSTNFYKTSHVILKRILDICGATIGLIL + FAIASLVLVPLIRKDGGPAIFAQTRIGKNGRHFTFYKFRSMRIDAEAIKEQLMDQNTM + QGGMFKIDNDPRVTKIGRFIRKTSLDELPQFWNVFIGDMSLVGTRPPTVDEYDQYTPE + QKRRLSFKPGITGLWQVSGRSKITNFDDVVKLDVAYIDNWTIWKDIEILLKTVKVVFM + RDGAK" + misc_feature 5955..6536 + /gene="wchA" + /locus_tag="SPC24B_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 8.2e-147" + gene 6570..7742 + /gene="wchF" + /locus_tag="SPC24B_0009" + CDS 6570..7742 + /gene="wchF" + /locus_tag="SPC24B_0009" + /note="member of homology group 15" + /codon_start=1 + /transl_table=11 + /product="putative rhamnosyl transferase WchF" + /protein_id="CAI33909.1" + /db_xref="GOA:Q4K098" + /db_xref="InterPro:IPR001296" + /db_xref="InterPro:IPR015393" + /db_xref="UniProtKB/TrEMBL:Q4K098" + /translation="MKKSVYIIGSKGIPAKYGGFETFVEKLTAFQQDKAIQYYVACMR + ENSAKSGTTEDVFKHNGAICYNVDIPNIGPARAIAYDIAAINRAIEFAKENKDEDPIF + YILACRIGPFIHGIKKKIQAIGGTLLVNPDGHEWLRAKWSAPVRRYWKISEGLMVKYA + DFLVCDSKNIEKYIQEDYKQYQPKTTYIAYGTDTTRSTLKSSDKKVRSWFKEKNVSEN + EYYLVVGRFVPENNYESMIRGFLASNSKKDFVLITNVEQNKFYNQLLAKTGFDKDPRV + KFVGTVYEQELLKYIRENAFAYFHGHEVGGTNPSLLEALASTKLNLLLDVGFNREVGE + QSAIYWKKDELSQIIEKVEQFDAKMIDELDRQSNQRIADSFTWEKIVTDYEKVFKG" + gene 7748..8644 + /gene="wcxG" + /locus_tag="SPC24B_0010" + CDS 7748..8644 + /gene="wcxG" + /locus_tag="SPC24B_0010" + /note="member of homology group 79" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="CAI33910.1" + /db_xref="GOA:Q4K0B8" + /db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4K0B8" + /translation="MAVKLKYDKSDIIFLDDDELKKYQSELLKMISDVFTFFDENGIA + YSLSGGSILGAIRHKGFIPWDDDVDINIPRESYDKLFSLFESDNSLSRKYYLQSAKSH + PELGLHVSQIRKKGTVARRKYDHSAEECGISIDLYIVENVYNNPVKRFFQGYTSMFLT + FALASVRETKNHALMKEMFRLEGRKLNYSAGKLMVGWFFGIIPIEKWLNWLDKCNSSC + KDSHTKYVSIPTGRKHFRRETYLRENMNIYKKVPFETLMVNVPVWSEEYLEMFYGKDY + MVVPPVDKREQHLFLELSYGEE" + misc_feature 7865..8566 + /gene="wcxG" + /locus_tag="SPC24B_0010" + 
/note="HMMPfam hit to PF04991, LICD Protein Family, score + 2.2e-21" + gene 8645..9363 + /gene="abp1" + /locus_tag="SPC24B_0011" + CDS join(8645..8947,8947..9363) + /gene="abp1" + /locus_tag="SPC24B_0011" + /note="member of homology group 57" + /codon_start=1 + /transl_table=11 + /product="putative IspD-family transferase (arabinitol) + Abp1" + /protein_id="CAI33911.1" + /db_xref="GOA:Q4K0B7" + /db_xref="InterPro:IPR001228" + /db_xref="UniProtKB/TrEMBL:Q4K0B7" + /translation="MKVAILTASGIGSRIGQDIPKQFIHVENKSVIIYTLEKFQNHPE + IDEICIVILKGWDQMVKAYAEQFGITKLKMITLGGKSGQESIITVLEKLRKLIPMRMV + TVLIHDGNRPLVSNDIISNALATYQQFGNAVAAIPTTEVVFVLENPQSTSSTEALNRD + LLRRTQTPHVYHLDNILSLHEKALENGITDVAASCQLMQLFGEESYFSLGTEKNLKIT + TVEDLDIFKALLSSTRDKWIK" + misc_feature join(8651..8947,8947..9339) + /gene="abp1" + /locus_tag="SPC24B_0011" + /note="HMMPfam hit to PF01128, Uncharacterized protein + family UPF0007, score 9.5e-12" + gene 9366..10421 + /gene="abp2" + /locus_tag="SPC24B_0012" + CDS 9366..10421 + /gene="abp2" + /locus_tag="SPC24B_0012" + /note="member of homology group 58" + /codon_start=1 + /transl_table=11 + /product="putative dehydratase/epimerase (arabinitol) + Abp2" + /protein_id="CAI33912.1" + /db_xref="GOA:Q4K0B6" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K0B6" + /translation="MTLLLNKIYRQDVESSLETIVNINDLNGKSILITGASGLIGSSV + IDQLLLLNEIRNFNIKIFCCGREFESLEKRFGRQTEYLHFVFYDATKAPHFDFAVDYI + IHAASPASPELYVNQPVETMASNFLGMYNLLEYAKNAKVSNLVYISSSEVYGISTSNN + PLDENYIGTVDHLSVRSSYASSKRATETLCVSFASEYGIKIMIVRPGHIYGPSAKDSD + NRVSSFFMTEAIAGRDIVMKSTGSQLRSYCYSLDCASAILSVLLSGGSGQAYNVSNPN + SIITIKQMATCIADTSGVRVLYDIPITQERKQENPMVNASLDSKKIESLGWSGLFSAE + VGFHHTFSILKELSSEK" + misc_feature 9453..10412 + /gene="abp2" + /locus_tag="SPC24B_0012" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.00085" + misc_feature 9456..10214 + /gene="abp2" + /locus_tag="SPC24B_0012" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, 
score 0.00092" + misc_feature 9456..10184 + /gene="abp2" + /locus_tag="SPC24B_0012" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 6.6e-45" + misc_feature 9459..10271 + /gene="abp2" + /locus_tag="SPC24B_0012" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 5.3e-05" + gene 10435..10636 + /gene="HG269" + /locus_tag="SPC24B_0013" + /pseudo + CDS 10435..10636 + /gene="HG269" + /locus_tag="SPC24B_0013" + /note="member of homology group 269" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative transferase (fragment)" + gene complement(10637..10810) + /gene="tnp" + /locus_tag="SPC24B_0014" + /pseudo + CDS complement(10637..10810) + /gene="tnp" + /locus_tag="SPC24B_0014" + /note="Lone member of homology group 0246" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1381 transposase (fragment)" + gene 11156..12406 + /gene="wzy" + /locus_tag="SPC24B_0015" + CDS 11156..12406 + /gene="wzy" + /locus_tag="SPC24B_0015" + /note="member of homology group 112" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33915.1" + /db_xref="UniProtKB/TrEMBL:Q4K094" + /translation="MIDGDFMNRRLVIKKKSIMFFMLMLCVTAFYGTNYWYTNIYIYD + FMIITSCLLSIIVFVCNGIRIDKTYYKGTIILGIVMWFSGLIAAQGKGLPAIVIFKES + LYTITPIMIFLAFRPMIKSIKDTSLFLRTISAAGVICNLIACIEMFFAKRGFDFLNIS + VFEKLRNGTPRFTIGETIIVLSFFISCSVVFSKGGKRNRRIFHVLNIALTAINLVYII + KTRTLNLYILSTLMMVPVLKKNVKKQLKFWIVFLISIILTFVSAEYFIPIVKNLIHSD + HGIQIRFLTIEYYIEYFKNHYLFGAGYISSSPYFETYSIVTGPLGRYYPSDVGLIGLM + FRSGIIGLIWLISWFYTSLKIIKDNTIRIPAHYDLLMKLVIVFLMFSCINLIITDAPR + FPYIALAMLLFESSYTLSYENSSN" + gene 12445..13368 + /gene="wcxI" + /locus_tag="SPC24B_0016" + CDS 12445..13368 + /gene="wcxI" + /locus_tag="SPC24B_0016" + /note="member of homology group 113" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33916.1" + /db_xref="GOA:Q4K0B4" + /db_xref="InterPro:IPR001173" + 
/db_xref="UniProtKB/TrEMBL:Q4K0B4" + /translation="MIKRLAILMATYNGEKYIKEQIESILNQDTDFDFTLIIRDDGST + DNTKNIIREYVDSGKIIFIEGQNKGAARGFISLLCDNPGYDYYAFSDQDDVWNHNKLQ + KGIWSLSKYTGPALYCSNCELVDSELNSIGRNTHRKRPNYTLESILCLASCAQGCTSV + FNKELASIIQENDVPDTFIMHDSLITCLCALIGGKIIYDEIPSMKYRMHDDNIFGMVS + AKQNVLNVIKDRISEITKKRTISMYDQAECLLKVYKKYIDSNNQDICRIVIDSKVSLK + ARLKLIFNKNLQHTTLNKTITKKLEILFGND" + misc_feature 12460..12951 + /gene="wcxI" + /locus_tag="SPC24B_0016" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 2.8e-23" + gene 13384..14163 + /gene="wcxJ" + /locus_tag="SPC24B_0017" + CDS 13384..14163 + /gene="wcxJ" + /locus_tag="SPC24B_0017" + /note="member of homology group 114" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33917.1" + /db_xref="GOA:Q4K092" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K092" + /translation="MKYQLIVSTMNQQDNSLIEKMNIKSDAIIINQSNSFSYHETKLK + NSIVKWYEFNERGIGLSRNTGFMRSDADIIQFADDDMIFTDTYYEDVLLEYQKHPEAD + VILFSNKCLNEDRMPYQVNNFRRINRFEGVKFGGARITVRREKILHNNITFSLLFGGG + AKYGAGEDVTFIQDCIKAGLRVYKSPIIVSTMKQDSSTWFKGYDRKYYKDKGALLAAN + FPSISEVGVYIQAFKNRGGIYTFSELLRFYKEGVNEFKINR" + gene 14173..14733 + /gene="wcxK" + /locus_tag="SPC24B_0018" + CDS 14173..14733 + /gene="wcxK" + /locus_tag="SPC24B_0018" + /note="member of homology group 115" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="CAI33918.1" + /db_xref="GOA:Q4K0B2" + /db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4K0B2" + /translation="MIKSFLIMPKNKVYNTGETDIELKNKYNYEGSELRKVQVRMIDM + LSFLNDICKENNITYFIAFGTLLGAIRHGGFIPWDDNLYIYIYINDKGLKKLRKIINN + GNYPYVIQDYSSDKGFVRYYSVLRDTNSEYIKNEYQHNQRKYRGVQIDLFPYGYGVMK + WGERLIGKIYGFNEKIFLGKIKCWQH" + gene 14718..15335 + /gene="wzy" + /locus_tag="SPC24B_0019" + CDS 14718..15335 + /gene="wzy" + /locus_tag="SPC24B_0019" + /note="member of homology group 65" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit 
polymerase Wzy + (fragment)" + /protein_id="CAI33919.1" + /db_xref="UniProtKB/TrEMBL:Q4K0B1" + /translation="MLAALIFYLTKEVIIPFLKVISKINGRKKVIYWLLTILGLWMIT + LTPIFENIVGAILKVDGVGRGSDSLTIRAIGRQLYWEQLNETTLKLLFGTGYPNYNYA + LAFQRTGFFKQYFFNRQWFYDIYIFGIVGSSIMGLLFLKYLKNSIKYDRQSADMIPLM + YIISLLIVAYNIILWYWNADGTFILVIMICALEHGEQLLHQKNGV" + gene 15340..17292 + /gene="rbsF" + /locus_tag="SPC24B_0020" + CDS 15340..17292 + /gene="rbsF" + /locus_tag="SPC24B_0020" + /note="member of homology group 49" + /codon_start=1 + /transl_table=11 + /product="putative phosphotransferase" + /protein_id="CAI33920.1" + /db_xref="GOA:Q4K089" + /db_xref="InterPro:IPR005834" + /db_xref="InterPro:IPR006439" + /db_xref="UniProtKB/TrEMBL:Q4K089" + /translation="MNLNKEVRWKDKQYIAFDFFDTTIHRNCHPEVILFEWSKKISIY + FSFKISATEIYSIRKKSEIHEKQEKQLEEIKYERLLQLVFYTILSRLKSDVTDYNLED + FLIYARTCEEEIELRHISIDTDTINFIEFLKQNGKKIILISDFYSDKKLIEKLMVSLG + IRDYFSKIFISSEIGLRKSSGNLYEYVINELSCKPINLLMIGDNIYSDVKVPKKLGID + SYHKSYSDSHVTVSPNDIVKAMNNVISQACTESLFNLYIPEILYFISKLYKELSVNKA + SDILFCSREGFFIKKLFDLYQKKMNLKLINSHYFYVSRKSTLYPSFKNIEDEDFEVIF + RQFPEITLENFLINLNFSNNDINNIAKQTEIKQTDKVSDKSIINKLKQNKLFKDVYEL + NCKEEKYSFREYLKSVGVENDNSIINMVDIGWKGTIQDNIQKAFPSLNIKGYYMGLNF + QRYSTRNSMNKTGILFTDDPQKTKFFNLFNYKYLFYERIFVADHGPTVRYEFMNGVGV + PTLDTDENHIEIYRFAEEFQITFFNTFEKILDLFNESLVTPDELFNEIANLSLKKHCI + YLPRLSVSIKKLDRAAKENFGIIKSTNRNSDNKVRNFWKNRDFLFLDYIYKAYGKNRL + LNPILDIYGYFVYLIKTLQIKIVGDI" + misc_feature 15373..16014 + /gene="rbsF" + /locus_tag="SPC24B_0020" + /note="HMMPfam hit to PF00702, haloacid dehalogenase-like + hydrolase, score 1.8e-07" + gene 17289..18749 + /gene="wzx" + /locus_tag="SPC24B_0021" + CDS 17289..18749 + /gene="wzx" + /locus_tag="SPC24B_0021" + /note="member of homology group 47" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33921.1" + /db_xref="GOA:Q4K0A9" + /db_xref="InterPro:IPR002528" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K0A9" + 
/translation="MMSMKEKSISKNAILNIILTLTNIVFPLITFPYISRILNPSGIG + AISFFSSIGSYGVLVASLGISTYGIRVIAKNRYHKDKITKIFQELIVINSVMSIIVTF + FLVLMSFRLEQLSSEKGLLIITCITILSSPFNLNWFYSGIEEYSYITKRSIFFKLVSL + ILTFLFVKSKDDYIIYAVIILFSTLASNFINILESRKYINFNLRRNLEFRYHLKPMWY + LFASLLAVNIYTNLDSVMLGIINGNDAVGIYSIASKVKWILLSVVTSVSLVLLPRLSF + YSNKYDETKFNNILRKSSTIIFMISIPLTIFFMIKAKESILLLGGEQYIQAVLAMQIL + MPILIISGFSNIIGNQILIPTGNEKYFMRAVSIGAIVNLCLNLLLMPILGIIGGAIAT + LCAESVQMIIQFYFSRNKLMGNISLNSIKKVAYSSIFAGILLIVIQNIIENFNSFLNL + AASSFLYFGVYFFLLVLFKESTIKKFLNQIFYKDIS" + misc_feature 17313..18122 + /gene="wzx" + /locus_tag="SPC24B_0021" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 2.3e-62" + gene 18889..19791 + /gene="rmlA" + /locus_tag="SPC24B_0022" + CDS 18889..19791 + /gene="rmlA" + /locus_tag="SPC24B_0022" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI33922.1" + /db_xref="GOA:Q4K0A8" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q4K0A8" + /translation="MKTNLKRRDYSMKGIILAGGSGTRLYPLTRAASKQLMPVYDKPM + IYYPLSTLMLAGIRDILIISTPQDLPRFKELLQDGSEFGIKLSYAEQPSPDGLAQAFI + IGEEFIGDDSVALILGDNIYHGPGLSTMLQKAAKKEKGATVFGYHVKDPERFGVVEFD + ENMNAISIEEKPEYPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDR + GDLSVELMGRGFAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISRED + VLALAQSLKKNEYGQYLLRLIGEA" + misc_feature 18925..19641 + /gene="rmlA" + /locus_tag="SPC24B_0022" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 3.7e-121" + gene 19792..20382 + /gene="rmlC" + /locus_tag="SPC24B_0023" + /pseudo + CDS 19792..20382 + /gene="rmlC" + /locus_tag="SPC24B_0023" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /pseudo + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase RmlC + (pseudogene)" + misc_feature 19828..20355 + /gene="rmlC" + /locus_tag="SPC24B_0023" + /note="HMMPfam 
hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 4.2e-15" + /pseudo + gene 20398..21447 + /gene="rmlB" + /locus_tag="SPC24B_0024" + CDS 20398..21447 + /gene="rmlB" + /locus_tag="SPC24B_0024" + /EC_number="4.2.1.46" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI33924.1" + /db_xref="GOA:Q4K0A7" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K0A7" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPDVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAVD + AYDHVTDRAGHDLRYAIDASKLREELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 20413..21369 + /gene="rmlB" + /locus_tag="SPC24B_0024" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 6.3e-05" + misc_feature 20416..21360 + /gene="rmlB" + /locus_tag="SPC24B_0024" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.0033" + misc_feature 20416..21156 + /gene="rmlB" + /locus_tag="SPC24B_0024" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 5.4e-77" + misc_feature 20419..21231 + /gene="rmlB" + /locus_tag="SPC24B_0024" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 1.6e-05" + gene 21513..22364 + /gene="rmlD" + /locus_tag="SPC24B_0025" + CDS 21513..22364 + /gene="rmlD" + /locus_tag="SPC24B_0025" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI33925.1" + /db_xref="GOA:Q4K1G6" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K1G6" + 
/translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITNEEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 21513..22361 + /gene="rmlD" + /locus_tag="SPC24B_0025" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 4e-147" + misc_feature 21516..22157 + /gene="rmlD" + /locus_tag="SPC24B_0025" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.00013" + misc_feature 21516..22145 + /gene="rmlD" + /locus_tag="SPC24B_0025" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 9.9e-19" + misc_feature 21519..22247 + /gene="rmlD" + /locus_tag="SPC24B_0025" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 2.9e-08" + gene order(22440..23393,23410..23625) + /gene="tnp" + /locus_tag="SPC24B_0026" + /pseudo + CDS join(22440..23393,23410..23625) + /gene="tnp" + /locus_tag="SPC24B_0026" + /note="member of homology group 12" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1670 transposase" + misc_feature 22446..22889 + /gene="tnp" + /locus_tag="SPC24B_0026" + /note="HMMPfam hit to PF03050, Transposase IS66 family, + score 8.9e-05" + /pseudo + gene 23824..>23976 + /gene="aliA" + /locus_tag="SPC24B_0027" + CDS 23824..>23976 + /gene="aliA" + /locus_tag="SPC24B_0027" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33927.1" + /db_xref="UniProtKB/TrEMBL:Q4K0A5" + /translation="MMKSSKLFALAGVTLLAATTLAACSGSGSSAKGEKTFSYIYETD + PDNLNYL" + misc_feature 23824..23916 + /gene="aliA" + /locus_tag="SPC24B_0027" + /note="Signal peptide predicted for SPC1281 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.782 between residues 31 and 32" +ORIGIN + 1 cgaccgtcgc ttcctagttg tggctaactt gtccaatgaa gagcaagact 
tgacagtaga + 61 aggaaaagtc aaatctgtct tgattgaaaa caccctagct caagaagtct ttgaaaaaca + 121 aatcttagtt ccatgggatg ctttctgtgt ggaattacta taaatatttt ttgcagaaaa + 181 atttaaaatt gaaatcatat aaaaacaagg gaggactgta taaaaagcag aaatcctttg + 241 ttttttataa ccaaggttta taaactttca ttctcgaaat tcaattaact ttacaaattc + 301 ccactattaa ggagaaagaa gatgaacata aagaagcgtg tccttagtgc aggcctgact + 361 tttgcatctg ctttgctttt agctgcttgc ggccaatcag gttcagatac aaaaacttac + 421 tcatcaacct ttagtggaaa tccaactacg tttaactatc tattagacta ttacgctgat + 481 aatataataa attgaaacaa gaacaagaca aaagcacctc aaaaaggtat tgcaacttgg + 541 taataccttt ttgaggtgct ttttgatatg agcccatgtt ttctcaatag gattgtactc + 601 aggcgagtag ggaggaagag gtaaaagttt atgcccaaac tcttcgcata aaagttatag + 661 cttccccatt ctatggaatc ttgcattatc cataataata accgatggtg tggttaatgt + 721 tggtaagaga aatttctgaa actaagcttc aaaaaagtcg ctcgtcatcg tctcttcgta + 781 agtcattgga gcgattaact caccattggt tagacctgca accaaagaaa tcctctgata + 841 tcttcttcca gatactttgc ctcttattaa ctgacctttt aatgagcgac catattctcg + 901 ataaaaataa gtatcgaatc ctgtttcgtc aatctaaaca ggtgctaggt gctttaaact + 961 attaaaattc ttaagaaata aggctacttt ttctgggtct tgttcatagt aggtgtggtt + 1021 ctttttttcg agtgtagccc atagctttga gcgcatagtg gatggtagtt ggatgacagc + 1081 caaagtcaga agctatttca gtcaaataag catctggatt gtcagtaaga tagtttttaa + 1141 gtctatctct atcaactttt cttggctttg ttccttttac ttggtggttt agctctcctg + 1201 ttttctcttt tagctttaac cagccataaa tggtattacg tgagatttgg aaaacgtgtg + 1261 atgcttctgt tatactacct gttcgctcac aataagagag aactttttta cgaaaatcta + 1321 ttgaatatgc cataaaaaga ttataccaca ttgtgtacta tagtagattg aaactagagt + 1381 agtacacctc tgcttctaaa acattgttag aaatcgattt gactgtcctg atcgatttgt + 1441 tatgttctta tttcatttta ttatattttt ggtttgcggg aagtctacta agatacttaa + 1501 agatgcagat agtaaaaaaa gatgtagaca ttaccgtaaa aaagtgatat aattgtatga + 1561 tgttcaatgt ataggtgtta atcatgagta gacgttttaa aaaatcaggt tcacagaaag + 1621 tgaagcgaag tgttaatatc gttttgctaa ctatttattt attgttagtt tgttttttat + 1681 tgttcttaat ctttaagtac 
aatatccttg cttttagata tcttaatctc gtggtaactg + 1741 cgttagtcct actagttgcc ttggtagggc tactcttgat tatctataaa aaagctgaaa + 1801 agtttactat ttttctgttg gtgctctcta tccttgtcag ctctgtgtcg ctctttgcag + 1861 tacagcagtt tgttggactg accaatcgtt taaatgcgac ttctaattac tcagaatatt + 1921 caatcagtgt cgctgtttta gcagatagtg agatcgaaaa tgttacgcaa ctgacgagtg + 1981 tgacagcacc gactgggact gataatgaaa atattcaaaa actactagct gatatcaagt + 2041 caagtcagaa tactgatttg acggtcaacc agagttcgtc ttacttggca gcttacaaga + 2101 gtttgattgc aggggagact aaggccattg tcctaaatag tgtctttgaa aatatcatcg + 2161 agtcagagta tccagactac gcatcgaaga taaaaaagat ttataccaag ggattcacta + 2221 aaaaagtaga agctcctaag acgtctaaga atcagtcttt caatatctat gttagtggaa + 2281 ttgacaccta tggtcctatt agttcggtgt cgcgatcaga tgtcaatatc ctgatgactg + 2341 tcaatcgaga taccaagaaa atcctcttga ccacaacacc acgtgatgcc tatgtaccaa + 2401 tcgcagatgg tggaaataat caaaaagata aattaaccca tgcgggcatt tatggagttg + 2461 attcgtccat tcacacctta gaaaatctct atggagtgga tatcaattac tatgtgcgat + 2521 tgaacttcac ttctttcttg aaaatgattg acttattggg aggggtagat gttcataatg + 2581 accaagagtt ttcagctcta catgggaagt tccatttccc agtagggaat gtccatctag + 2641 actctgagca agctctaggt tttgtacgtg aacgctactc actagccgat ggagaccgtg + 2701 accgtggtcg caaccaacaa aaggtgattg tggctatcct tcaaaaatta acgtcaaccg + 2761 aagcactgaa aaattatagt acgatcattg atagcttgca agattctatc caaacaaata + 2821 tgccacttga gaccatgata aatttggtca atgctcagtt agaaagtgga gggaattata + 2881 aagtaaattc tcaagattta aaaggtacag gtcggatgga tcttccttct tatgcaatgc + 2941 cagacagtaa cctctatgtg atggaaatag atgatagtag tttagctgta gttaaagcag + 3001 ctatacagga tgtgatggag ggtagatgaa atgatagaca tccattcgca tatcgttttt + 3061 gatgtagatg acggtcccaa gtcaagagag gaaagcaagg ctctcttggc agaatcctac + 3121 aggcaggggg tgcgaaccat tgtctctacc tctcaccgtc gcaagggcat gtttgaaact + 3181 ccggaagaga agatagcaga aaactttctt caggttcggg aaatagctaa ggaagtggcg + 3241 agtgacttag tcattgctta cggagctgaa atttactaca caccagatgt tctggataag + 3301 ctgggaaaaa agcggattcc gaccctcaat gatagtcgtt 
atgccttgat agagtttagt + 3361 atgaacactc tttatcgcga tattcatagc gccttgaaca agatcttgat gttgggaatt + 3421 actccagtca ttgcccacat cgaacgctat gatgctcttg aaaataatga aaaacgcgtt + 3481 cgggaactga tcgatatggg ctgttacacg caagtaaata gttcacatgt cctcaaaccc + 3541 aaactttttg gcgaacgtta taaattcatg aaaaaaagag ttcagtattt tttggaacgt + 3601 gatttagttc atgtagttgc aagtgatatg cacaatttag acagtagacc tccatatatg + 3661 caacaggcat atgatatcat tgctaagaaa tatggagcga aaaaagcgaa agaacttttt + 3721 gtagataatc ccagaaaaat tataatggat caattaattt aggagaaaat atgcaagatc + 3781 aaaacacttt ggaaatcgat gtatttcaac tattcagagc tttatggaaa agaaagttgg + 3841 tcattttatt agtggcaatt ataacttctt cagttgcttt tgcctacagt acttttgtta + 3901 tcaaacctga gtttactagt acgacccgga tttatgtagt taaccgtaat caggaagaga + 3961 aatctggttt aaccaatcaa gacttgcagg caggttcata cttggttaaa gactatcgtg + 4021 aaattatcct atcgcaggat gttttggagg aagttatttc tgatttgaaa ctagatttga + 4081 cgccaaaagg tttggctaat aaaattaaag taacagtacc agttgatacc cgtattgtat + 4141 ctgtttcagt taatgatcga gttcctgaag aggcaagccg tatcgctaac tctttgagag + 4201 aagtagctgc tcaaaaaatt atcagtatta ctcgtgtttc tgatgtgaca acactggagg + 4261 aggcaagacc ggcgacatca ccgtcttcgc caaatattaa acgcaataca ctaattggtt + 4321 ttttggcagg ggggattgga actagtgtta tagttcttct tcttgaactt ttggacactc + 4381 atgtgaaacg tccggaagat atcgaagata cactgcagat gacacttttg ggagttgtac + 4441 caaacttgag taagttgaaa taggagagag gaatgccgac attagaaata gcacaaaaaa + 4501 aactggagtt cattaagaag gcagaagaat attacaatgc cttgtgtaca aatatacagt + 4561 tgagcggaga taaactaaaa gtaatttccg ttacttctgt taaccctggg gaaggaaaaa + 4621 caactacttc cgtaaatata gcaaggtcgt ttgcgcgtgc aggctataaa actcttttga + 4681 tcgatggcga tactcgaaat tcagttatat caggagtttt taaatcgcgt gaaaaaatta + 4741 cagggctaac agaattttta tctgggacag ctgatttatc tcacggttta tgtgatacaa + 4801 atattgaaaa tttatttgta attcaatcgg gatctgtatc accaaaccct acggccttgt + 4861 tacaaagtaa aaattttaat gatatgattg aaacattgcg taaatatttt gattatatca + 4921 ttgttgatac accacctatt ggaattgtta ttgatgcggc aattatcact caaaagtgtg + 4981 
atgcgtccat cttggtaaca gcaacaggtg aggcgaataa acgtgatgtc caaaaagtga + 5041 aacaacaatt agaacaaaca gggaaactgt tcctgggagt tgttttaaat aaattggata + 5101 tctcggttga taagtatgga gtttacggtt cctatggaaa ttatggtaaa aaataactta + 5161 gaaaagattt tatggatgaa aaaggattga aaatttttct ggcagtatta cagagtatta + 5221 ttgtcatttt attggtttat tttcttagct ttgttagaga gacagaagtt gaacgttctt + 5281 cgatggttat actatacctt ctccactttt ttgtattcta ttttagttcc tatggtaaca + 5341 atttttttaa aagagggcac ctagttgagt ttaatagtac tataagatat atttttttct + 5401 ttgcaatagc tataagtgta ttaaactttt ttatagcgga acggtttagt atctctagaa + 5461 gaggaatgat atacttctta actttagaag gaatatcctt atacttgtta aatttcttag + 5521 taaaaaaata ttggaagcat gtgtttttta atctaaaaaa tagcaagaaa attttactgt + 5581 taacagtaac gaaaaatatg gaaaaagttc ttgataaatt gctagaatct gatgaacttt + 5641 catggaaatt ggtagcagta agtgttttgg ataaatctga ttttcaacat gataaaatac + 5701 ctgtaattga aaaggaaaaa attattgaat ttgcaacgca tgaagttgtg gatgaggtgt + 5761 ttgtcaatct tccaggagag agctacgatg ttggagaaat tatctctagg tttgagacaa + 5821 tggggataga tgtaactgta aatcttaaag catttgataa gaatttgggt cgcaataaac + 5881 aaattcatga gatggtggga ttgaatgtag tcactttctc tacaaatttt tataaaacta + 5941 gtcatgtgat tttaaagaga attctcgata tttgtggtgc cactattggc cttattcttt + 6001 ttgctatagc tagtctagtt ttagttccat tgattcgtaa agatggcgga ccagctattt + 6061 ttgctcaaac tcgtataggg aaaaatggtc gacattttac cttttataaa ttccgttcga + 6121 tgcggatcga tgctgaagct atcaaagaac agttgatgga tcaaaatacg atgcaaggtg + 6181 gtatgtttaa gatagacaat gatcctcgtg ttacaaaaat tggtcgcttt attcgtaaaa + 6241 ccagtttgga tgaattgccg cagttttgga atgtctttat aggagatatg agtttggtgg + 6301 gaacacgtcc acctacagta gacgagtatg atcagtatac tccagaacag aaacgtcgac + 6361 tcagctttaa acctggtatt acaggtttat ggcaggttag cggccgtagt aaaataacca + 6421 attttgacga tgttgtaaaa ttagatgtgg cttatattga taattggaca atctggaaag + 6481 atattgaaat tttgcttaaa actgttaaag ttgtatttat gagagatgga gcgaagtaat + 6541 ttctgtatat ccatcatatt aggagagaaa tgaaaaagtc agtttatatc attggttcaa + 6601 aaggaattcc tgctaagtat 
ggaggatttg aaacttttgt tgaaaaatta acagccttcc + 6661 aacaagataa ggctatccaa tattatgtgg cttgtatgcg tgaaaactct gcaaaatcag + 6721 ggactactga ggatgttttt aaacataatg gtgctatctg ttataacgtc gatattccta + 6781 atattggtcc agcgcgagct atagcgtatg atatcgctgc aattaacaga gctattgaat + 6841 ttgccaaaga aaataaggat gaagatccaa tcttctatat tttagcttgt cgaattggtc + 6901 cgttcatcca tggaattaag aaaaaaatcc aggcgatagg tgggactctt ctagttaatc + 6961 cagatggcca cgagtggtta cgagctaagt ggagtgctcc cgttcgtcgc tactggaaaa + 7021 tttctgaagg tcttatggtc aaatatgcag attttttagt gtgtgatagt aagaatattg + 7081 aaaaatatat ccaagaagat tataaacagt atcaacctaa aacaacctat atcgcttatg + 7141 gaacagatac aacacgctct acattaaaga gtagtgataa aaaagtacgt tcttggttca + 7201 aagagaagaa tgtttctgag aacgagtatt atctagttgt aggacgtttt gtaccagaaa + 7261 acaactatga atctatgatt cgtggctttt tggcgtctaa ctctaagaag gactttgtct + 7321 taatcacaaa tgtagaacag aataaatttt ataatcagtt gttggcaaaa actggttttg + 7381 ataaggaccc acgagtaaaa tttgtaggta cagtctatga gcaagagctt cttaaatata + 7441 ttcgtgaaaa cgcctttgct tacttccacg ggcatgaagt tggtggaacc aatccttcgc + 7501 ttttagaagc tctggcatca actaaactga atttattgct agatgttggc tttaaccgag + 7561 aagttgggga gcaaagtgcg atttattgga aaaaagatga gctttcccaa ataattgaga + 7621 aagttgaaca atttgatgca aaaatgattg atgagttaga tagacaatca aatcagagaa + 7681 ttgcggattc tttcacttgg gaaaagattg tcacagacta cgagaaagta tttaaaggtt + 7741 agagttaatg gcagtaaaat taaaatatga taaatcagat attatatttt tagatgatga + 7801 cgaattgaaa aaataccaat cagaattgtt gaaaatgata tcagatgtgt ttactttttt + 7861 tgatgaaaat gggatagcgt attctttaag tggaggtagc attttagggg caatccgtca + 7921 taaagggttt atcccttggg atgatgatgt tgatatcaat attccgaggg aaagttacga + 7981 taaactattt tctctatttg agtcagacaa tagtcttagt cgtaaatatt atcttcaatc + 8041 agcaaaaagt catccagaat taggacttca tgtttctcaa attagaaaaa aaggaacagt + 8101 tgctcgtagg aaatacgatc attcggctga ggagtgcggt atttctatag atctttacat + 8161 tgtagaaaat gtatacaata atccagtgaa acgattcttt caaggttata caagtatgtt + 8221 tttgactttt gccttggctt ctgtacgaga aacaaagaac 
catgccctga tgaaggaaat + 8281 gtttagactg gaaggtagaa aactaaatta ttcagctgga aagttaatgg ttggttggtt + 8341 ttttggaatt attccaattg aaaagtggtt gaattggctt gataaatgta attcaagctg + 8401 taaggattca catacaaaat atgtatccat acctacagga aggaaacact ttagacgcga + 8461 gacttacttg cgagagaata tgaatattta taaaaaggtt ccttttgaaa ctttgatggt + 8521 gaatgttcct gtttggtcag aagagtattt agaaatgttt tacggtaaag attatatggt + 8581 cgttcctcct gttgataaga gagagcaaca tttgttttta gagttgagtt acggagaaga + 8641 atagatgaaa gtagcgattt taacagcttc aggcattgga agccgaattg gtcaagatat + 8701 ccctaaacaa tttattcatg ttgaaaataa gtcagtcatt atctataccc ttgaaaaatt + 8761 tcaaaatcat ccagaaattg atgaaatctg tattgttatt ttaaaaggct gggaccagat + 8821 ggttaaagct tatgcggaac aatttggaat tacaaagtta aagatgataa ctttgggagg + 8881 gaagtctggt caagaatcaa ttataacggt cttagagaag ttaagaaagc tcatcccaat + 8941 gaggatgtga ctgtattaat tcatgacgga aatcgtcctt tagtgagcaa tgatattatt + 9001 agcaacgctt tagcaacata ccaacagttt ggaaatgctg ttgcagcgat accaacgact + 9061 gaggtagtat ttgttttaga aaacccacaa tcaacttcat ccacagaagc attgaatcgt + 9121 gacttgttga gacgaacaca aactcctcat gtttaccatc ttgataatat tctatcgctt + 9181 catgaaaaag cattagaaaa tgggataact gatgttgcag catcatgcca actcatgcaa + 9241 ctatttggtg aagagagtta tttctctctt ggaacagaga aaaacttgaa aattacgact + 9301 gtagaagatc ttgatatttt taaagcttta ttgagttcaa ctagagataa gtggattaaa + 9361 tagtaatgac attattatta aataaaatat atagacaaga tgtagaatct tctctagaaa + 9421 caatcgtcaa tattaatgac ttgaatggca agtcaatttt aattactgga gcttctggtt + 9481 tgattggttc aagtgtcatt gaccagttat tattgctaaa tgaaataagg aattttaaca + 9541 ttaaaatttt ttgttgtgga agagagtttg aatcattaga aaaacgattt ggtagacaaa + 9601 cagagtattt acactttgtg ttctatgatg cgactaaagc acctcacttt gattttgcag + 9661 tggactacat tattcatgct gctagtcctg ctagtcctga attatacgtt aatcagcctg + 9721 tagaaacaat ggctagtaat tttctgggca tgtataatct actggaatac gccaaaaatg + 9781 ctaaagtttc aaatctagtt tatatctcat ctagtgaagt ttatggaatt agcactagta + 9841 ataatccttt ggacgaaaat tatattggaa ctgttgatca tcttagcgta cggtcttctt + 9901 
atgccagttc aaaaagagct actgaaacac tttgtgttag ttttgcttcc gagtatggaa + 9961 tcaaaataat gatagtaagg ccaggacata tctatggccc tagtgccaag gactctgata + 10021 atcgtgtatc atcatttttt atgacagaag cgattgctgg gcgtgatatt gtcatgaaaa + 10081 gtacaggtag tcagttaaga tcctattgtt atagtttgga ttgtgccagt gcaattctaa + 10141 gtgttcttct ttcgggtgga tcaggacaag cttataatgt ttccaatcca aattcaatta + 10201 ttactataaa acagatggca acttgcattg cagatacttc aggagtcaga gttctttatg + 10261 atatacctat aactcaagag cgaaaacagg aaaatcctat ggtaaatgca agcttagata + 10321 gtaagaaaat tgagtccttg ggatggtcag gtctattttc agctgaagta ggcttccatc + 10381 acacatttag tattttaaag gagttatcaa gtgaaaaatg atagtatttt aattatgatg + 10441 acaacataca atggagaaga atttatacgt gaacagttgg agagtatcct ttttcaaacc + 10501 attacagcat ggaaactata gattcgtgat gacaattcta gtgatcaaat aagagcaatt + 10561 attaaagaat acgaagaaaa agatagtcaa tttttgatat aagctagcca agggggattt + 10621 tggagaagtt tttttattga agagtggcca taagaaggtc ttctaggctt aatttaggtt + 10681 ttagtccacc ttttgcgtgt ttaagttgat aagctgtttt taatacagct aacatctctt + 10741 caaaaatggt acgctgaacg tcaacaagac gcttaaatcg tacatcagtt agttgtttac + 10801 ttgcttcata attcatagaa ctattatacc atattttatt tcgcaggaaa tctattgaaa + 10861 aaacgacact atattatcaa tggggatgtt aggactatat gttaaaaaca tgcgagagta + 10921 tcttttgtta tgaatattat gagagtacat agaaagatag agatttcact gatggaattt + 10981 tatagagaag ggaaaactgt atttatttgg atatattgaa ctcagtggaa tggattgatt + 11041 agggtatata catatggtaa atggatgtaa cccgcaaaca gaacacggat ggagtacaca + 11101 tttgctaatt acagagattc attgaaaaat attagagttt caaataggaa aagtaatgat + 11161 tgacggagat tttatgaata gaagacttgt aataaaaaag aaaagtataa tgtttttcat + 11221 gcttatgtta tgtgttacgg cattttatgg gacaaattat tggtatacaa atatatatat + 11281 atatgatttt atgattataa catcatgctt attatcaata atagtatttg tatgtaatgg + 11341 tattagaatt gataaaacat attataaagg gacaataata ctgggtattg taatgtggtt + 11401 ttcaggactt attgctgcac aaggaaaagg gctccctgct attgtaatct ttaaagagag + 11461 tttatatact attactccaa taatgatatt tttagctttc cgacctatga taaagtcaat + 11521 
aaaagacact tcattattcc ttcgtactat ttctgctgcc ggtgttatat gtaatttaat + 11581 tgcttgtatt gaaatgttct ttgccaaaag aggatttgat tttctaaata taagtgtatt + 11641 tgaaaaactt agaaatggta ctcctagatt tacaattgga gaaacaataa tagttcttag + 11701 tttttttatc tcctgtagtg ttgtttttag taaaggggga aagagaaata gacgcatttt + 11761 ccatgttcta aatatagctc tcacagctat aaatttagtg tatattatta aaacaaggac + 11821 actgaattta tatattttat caacacttat gatggtgcct gttttaaaaa aaaatgtaaa + 11881 gaaacaactt aagttttgga ttgtgttttt gatatctata attcttactt ttgtttctgc + 11941 agaatatttt attccaatag tcaaaaattt aattcatagt gatcatggga ttcaaattag + 12001 attcttgacg atagaatact atatagagta ttttaaaaat cattacttat ttggagcggg + 12061 atatatttct tctagtccat attttgaaac ttattctatt gttaccggtc cattaggacg + 12121 ttattatcca agcgatgtag gtttgattgg acttatgttt agaagtggga ttatcgggct + 12181 aatttggtta ataagttggt tttatacaag cttgaagata attaaagata atacgattag + 12241 aattccagct cattatgact tattaatgaa gctagttata gtttttttga tgttttcttg + 12301 tattaatttg ataatcactg atgcacctag attcccatat attgcattag ctatgttact + 12361 ttttgaatca agttatacct tgagttatga aaacagttct aattagaatg tatttcagat + 12421 agttatttta aaggatgagg ggaaatgatt aagagattag caatacttat ggccacatat + 12481 aatggcgaaa aatatataaa agagcaaatt gaaagtattc tcaaccaaga tacagatttt + 12541 gattttactc taattattag agatgacggt tcaacagata atactaaaaa tataattaga + 12601 gaatatgttg atagtgggaa aattattttt atagaaggcc agaataaagg ggcggcaaga + 12661 ggatttattt ctttgttatg tgataatcct ggatatgatt actatgcttt ctcggatcaa + 12721 gatgatgttt ggaatcataa taaattacag aaaggtatat ggagtctttc caaatatact + 12781 gggccagcac tttattgttc taattgtgaa ttagttgatt cagagttaaa tagtataggt + 12841 cgtaatacac ataggaagag accgaactat actcttgaat ctattctttg tcttgctagt + 12901 tgtgcacaag gatgtacatc tgtatttaat aaagagctag cttcgataat tcaggagaat + 12961 gatgtgcctg atacttttat tatgcatgat tctttgatta cttgtttatg tgcactgata + 13021 ggtggaaaga taatttacga cgaaattcca tcaatgaaat atagaatgca tgatgataat + 13081 atatttggaa tggtgtcagc taagcaaaat gtactaaatg ttataaaaga tcgtattagt + 13141 
gaaataacaa aaaagcgaac gattagtatg tacgatcaag cagagtgttt actaaaggtt + 13201 tataaaaaat atatagattc taacaatcaa gatatatgta gaattgttat tgattctaaa + 13261 gtatcgctaa aggcaagact taagctgatt tttaataaaa atttgcagca tactacatta + 13321 aataaaacca taacaaaaaa attagagata ttatttggca atgactaata aaggagttta + 13381 gctatgaagt atcaactcat tgtatcaaca atgaatcaac aggataacag tctgatagag + 13441 aaaatgaata taaaatctga tgcaattatc attaatcaat caaactcatt ttcttaccat + 13501 gagacgaaat tgaaaaattc gattgtaaaa tggtatgaat tcaatgaaag aggtattggt + 13561 ttaagtcgaa acacaggttt catgagatcg gatgctgata ttattcaatt tgctgatgac + 13621 gatatgattt ttacagatac atattatgaa gacgtattat tagaatatca aaaacatcca + 13681 gaagctgatg taattctttt ttcgaataaa tgtcttaatg aagatcgaat gccttatcag + 13741 gttaataatt ttagacgtat aaataggttt gaaggtgtta agtttggtgg tgctagaatt + 13801 acagtcagga gagaaaagat attgcataat aacataacgt tttctctttt atttgggggg + 13861 ggagcaaaat acggtgcagg agaggacgta acatttattc aggactgtat caaggcagga + 13921 ttacgggtat ataaatcacc tattattgtt tctacaatga aacaagattc ttctacatgg + 13981 tttaaaggat atgatagaaa atattataaa gataaaggtg ctttattagc agcaaatttc + 14041 ccttctataa gtgaggtagg agtatatata caagctttca aaaatagggg gggaatttat + 14101 acatttagtg aattacttag attttataag gaaggtgtta acgaatttaa aataaataga + 14161 tgataaattg atatgataaa gagttttttg attatgccaa aaaataaagt ttataatact + 14221 ggcgagacag acattgagtt gaaaaataaa tacaattatg aaggtagtga gttgaggaaa + 14281 gttcaagttc gtatgattga tatgctttct tttttgaatg atatatgcaa agaaaataac + 14341 atcacctatt tcattgcttt tggaactcta ttaggagcta ttagacatgg aggctttatt + 14401 ccatgggatg ataatcttta tatttatatt tatattaatg ataaaggttt aaaaaaactt + 14461 agaaaaataa ttaataatgg aaactatccc tatgttattc aagactattc tagtgataaa + 14521 ggatttgtaa ggtattatag tgttctcaga gatactaact ctgaatatat aaaaaatgaa + 14581 tatcaacata atcagcgtaa atacagaggt gtacaaattg acttattccc ttatggttat + 14641 ggtgtaatga aatggggtga acgtcttatt ggaaaaatat atggttttaa tgaaaaaata + 14701 tttttaggga aaataaaatg ttggcagcat taatttttta tttaactaaa gaagttataa + 14761 
ttccatttct gaaagtaatt agtaagatta acggaagaaa gaaagtaatt tattggttgc + 14821 tgacaatttt gggactgtgg atgattactc taacacctat ttttgaaaat attgttggag + 14881 ctattttaaa agtagatgga gtaggtagag gaagtgattc attgactatt cgagcaattg + 14941 gacgacagtt atattgggaa caattgaatg agacaacttt aaaacttctt tttggaacag + 15001 gataccctaa ttataattat gctttagcct ttcaacgtac aggttttttc aagcaatatt + 15061 tttttaacag acaatggttt tatgatatat atatatttgg tattgtgggt tcctcaatta + 15121 tgggattatt atttttaaaa tatcttaaaa attcaataaa gtatgataga caatctgcag + 15181 atatgattcc gttgatgtat attatttctt tactaattgt agcctataat attattcttt + 15241 ggtattggaa tgcggacggt acttttatat tagtaatcat gatttgcgca ttggagcatg + 15301 gagaacaatt attacatcag aagaatggag tgtgattgga tgaatttaaa taaagaagtt + 15361 agatggaagg ataagcaata tattgctttt gatttttttg atacaactat ccatagaaat + 15421 tgtcatcctg aagtgatttt atttgaatgg tctaaaaaaa tttctattta tttctctttc + 15481 aaaatatctg ctacagaaat ttattcaatt aggaaaaaat ctgaaataca tgagaagcaa + 15541 gaaaaacaat tggaagaaat taaatatgaa agattacttc aacttgtttt ttatactatt + 15601 ttaagtcgtt tgaagtcaga tgttaccgac tataatcttg aagatttttt aatttatgca + 15661 agaacgtgtg aagaggaaat agaattaaga catattagta ttgatacaga tacaattaat + 15721 tttattgaat ttttaaaaca aaatgggaaa aaaataattt taatttcaga tttttattct + 15781 gataaaaagc taattgaaaa attaatggtt tcattaggga ttagagatta tttctctaaa + 15841 atatttattt caagtgaaat tgggttacgt aagtcatcag gaaatttata tgaatatgtg + 15901 atcaatgaat tgagctgtaa gcctataaat ttacttatga ttggtgataa tatttattct + 15961 gatgtaaaag ttccaaaaaa actaggaata gattcttatc ataaatctta ttcagattca + 16021 catgtgactg tgagtcctaa cgatattgta aaagcgatga ataatgttat ttctcaagct + 16081 tgtactgaat ctttatttaa tctctatata cctgaaatac tttattttat ttcaaagtta + 16141 tacaaagaat tatctgttaa caaagctagt gatatattat tttgttcaag agaaggtttt + 16201 tttataaaaa aattatttga tctttatcaa aaaaaaatga acttaaagct tattaactca + 16261 cattattttt atgtttctag aaaatcaacg ctatatccat catttaaaaa tattgaggat + 16321 gaagattttg aagttatttt tagacaattt cctgaaatta ctttagaaaa ttttttgatt + 16381 
aatttaaatt tttccaataa tgatattaac aatattgcta agcaaacaga aattaaacaa + 16441 acagacaaag tatcagataa atctattatt aacaaattaa aacaaaataa attatttaaa + 16501 gacgtttatg aattgaactg taaagaagaa aaatattctt ttagagaata tttaaagtct + 16561 gtaggagttg agaatgacaa ttctataata aatatggtag atattggttg gaaaggtacg + 16621 atacaagaca atattcaaaa agcttttcca tctttaaata taaaagggta ttatatgggg + 16681 ttgaattttc aacggtattc tactaggaat agtatgaata agacgggaat actgtttact + 16741 gatgatcctc aaaaaacaaa gttttttaac ttatttaatt ataaatattt attctatgaa + 16801 agaatttttg ttgcagatca tggaccgaca gttagatatg aatttatgaa tggtgttggg + 16861 gtaccaacat tggatacaga tgaaaatcat atagaaattt atagatttgc tgaggaattt + 16921 cagattacat ttttcaacac atttgagaaa attttagatt tgttcaatga atcactagta + 16981 acaccagatg aattatttaa cgaaatagct aatttatcat taaaaaaaca ttgcatctat + 17041 ttaccaaggc tttcagtaag tataaaaaaa ttagatagag cagcaaaaga aaattttggt + 17101 attataaaat ctactaacag gaatagtgat aataaggtaa gaaatttttg gaaaaataga + 17161 gattttttat ttttagatta tatatataaa gcgtatggaa agaatagatt gttaaaccct + 17221 atattggata tttacggata ttttgtatat ctgattaaaa cactgcaaat aaaaatagta + 17281 ggggatattt gatgagcatg aaagaaaaat caataagtaa aaatgctatt ttgaatatta + 17341 ttttaacact aacaaatatt gtgtttccat taattacttt tccttatatt tctagaattc + 17401 tgaatccgtc aggaataggc gcaatctctt ttttttcatc tattggttct tatggtgttt + 17461 tagttgcctc gcttggaatt tcaacttatg ggattcgggt gattgcaaag aatcgttatc + 17521 ataaagataa gataactaaa atattccaag aattgatagt tattaatagt gtaatgtcta + 17581 ttatagtgac gttcttcctt gttttaatga gtttccgatt agagcagtta agttcagaaa + 17641 aaggtttatt aataatcaca tgtattacta ttttgtcctc tccttttaat ttgaattggt + 17701 tttatagtgg aatagaagag tattcatata taacaaaacg ttcaatattt tttaaattag + 17761 tttcattgat attaaccttt ttatttgtta aaagtaaaga cgattatatt atatatgctg + 17821 tgataatatt gttttcaaca ttggcttcca attttataaa tattttggag agtagaaaat + 17881 acatcaattt taatttgaga aggaatttag aatttagata tcatctaaaa ccaatgtggt + 17941 atttatttgc ttcgttactt gcagttaata tttatacaaa tttggattct gtgatgttag + 18001 
gaattattaa tggaaatgat gcggtaggta tttactcaat cgcatcaaaa gtaaaatgga + 18061 ttttattatc agtcgttact tcagtgagtt tagttttatt acccagatta tcattttata + 18121 gcaataagta tgacgaaacg aagtttaata atattttgag aaagtcatct acaataattt + 18181 ttatgatttc aattcctcta acaatttttt ttatgataaa agcgaaagag agtatattat + 18241 tgttaggtgg agagcagtat attcaggcag ttttagcaat gcaaatatta atgccgatct + 18301 tgataatatc aggtttttcc aatattatag gtaatcagat attgatccct actggtaatg + 18361 agaaatattt tatgagagca gtttctatag gggcaatagt aaatttatgt ttaaatttgt + 18421 tgcttatgcc tattttggga attatcggag gtgcaatcgc aactctttgt gcagaatcag + 18481 tccaaatgat tattcaattt tatttttctc gtaataaatt aatgggtaat atttcattaa + 18541 attcaatcaa aaaagtagcc tattcatcaa tttttgcggg tatactgtta atagtaatac + 18601 aaaatattat agagaatttt aatagcttct taaatttagc tgcttctagt ttcctatatt + 18661 ttggagtata ttttttctta ttggtattgt ttaaagaaag tacaattaag aaatttctaa + 18721 atcaaatttt ttataaggat atttcatgaa tttattacca attatttatg gagcgattct + 18781 tgatttaata ttaataattt tttaaagtga ataaaatcaa agcaataaaa gattaaaaaa + 18841 taaattgcta tctattatgt ttttctcaaa ctaagtaaaa cataacttat gaaaacaaat + 18901 ttaaaaagga gggactatag tatgaaaggt attattctag caggtggttc gggaactcgc + 18961 ttgtatcctt tgactcgcgc tgcatcaaaa caacttatgc cggtttatga taaaccgatg + 19021 atttactacc cactttcaac attaatgttg gctgggatta gggatatttt gattatctca + 19081 actcctcaag atttgcctcg ttttaaagag cttcttcaag atggttctga gtttggtatt + 19141 aaactttctt atgctgagca accaagtcca gatggtttgg cacaagcctt tatcattggg + 19201 gaagagttta tcggtgacga tagcgttgcc ttgattttag gtgacaatat ctaccatggt + 19261 cctggtttga gcacaatgct tcaaaaagca gccaagaaag agaaaggtgc gactgttttt + 19321 ggctaccatg tcaaggatcc agaacgcttt ggtgttgtag aatttgatga aaatatgaat + 19381 gctatctcca tcgaagaaaa gccagaatac cctcgttcaa actatgcagt gacaggactc + 19441 tatttctatg ataatgatgt agtagagatt gccaaaagta ttaaaccaag tcctcgtggt + 19501 gaattggaaa ttacagatgt caacaaggct tacttggatc gtggtgattt gtctgttgag + 19561 ctcatgggac gtggttttgc ttggttggat actggcactc atgaaagttt actagaggct + 19621 
tcgcagtaca tcgaaacagt ccaacggatg caaaatgttc aggtagcaaa cttagaagaa + 19681 attgcttacc gtatgggcta tatcagtcga gaagatgtat tggccttagc ccaatcactt + 19741 aagaaaaatg aatacggaca gtatctgctc cgtttgattg gagaagcata gatgacagat + 19801 aattttttcg gtaagacgct tgcggcacgc aaggttgaag ctattccagg catgttggag + 19861 tttgatatcc ccgttcatgg agataatcgt ggctggttta aagaaaattt ccaaaaggaa + 19921 aaaatgcttc cacttggatt tccagagtct ttctttgcag aaggaaaatt gcaaaacaat + 19981 gtatccttct cacgtaaaaa tgtccttcga ggcctccacg cagagccttg ggataagtac + 20041 atctctgtag cagatggagg gaaagttctg ggttcttggg ttgatctacg cgagggtgaa + 20101 acctttggga atacctatca gacagtgatt gatgcgagta agggaatctt tgttccttga + 20161 ggcgtagcta atggcttcca agttttatca gatacagtgt catatagcta tctggtcaat + 20221 gattactggg ctcttgaact caaacccaag tatgcctttg tgaactacgc tgatccaagc + 20281 cttggtattg aatgggaaaa tattgcagaa gcagaggttt cagaagcaga taaaaatcat + 20341 ccactactta aggatgtaaa acctttgaaa aaagaagatt tgtaaaaagg aaagaatatg + 20401 actgaataca aaaatattat cgtgacaggt ggagctggct ttatcggttc taactttgtc + 20461 cattatgttt acgagaactt tccagatgtt catgtgacag tcctagataa gttgacttat + 20521 gctggaaacc gcgcgaatat tgaggaaatt ttaggtaatc gtgttgagtt agttgttggt + 20581 gacattgctg atgcggagtt ggtagacaag ttggctgctc aagcagatgc tatcgttcat + 20641 tatgcagcgg aaagccacaa tgataattcg ctcaatgatc catcgccatt tattcatact + 20701 aacttcatcg gaacctatac tcttttagaa gctgctcgta agtatgatat tcgcttccac + 20761 catgtatcga cagatgaagt ttatggggat ctccctttac gcgaagattt gccaggtcat + 20821 ggtgaaggac caggtgagaa atttactgct gaaacaaaat acaacccaag ctctccgtac + 20881 tcatcaacca aggcagcctc agatttgatt gtcaaagcct gggtgcgttc ttttggagtc + 20941 aaggcaacga tttccaactg ttcaaataac tacggtcctt atcaacatat cgaaaaattc + 21001 atcccacgtc agattactaa catcctaagt ggaattaagc caaaacttta cggtgaaggt + 21061 aagaatgttc gtgactggat tcataccaat gaccattctt caggagtttg gacaatcttg + 21121 acaaaagggc aaatcggtga aacctacttg attggggctg atggtgagaa gaacaataag + 21181 gaagttttgg aacttatcct taaggaaatg ggacaagctg tggatgccta tgatcatgtg + 21241 
actgaccgtg caggacatga ccttcgctat gcgattgatg ccagcaagct ccgtgaggag + 21301 ttggggtgga aacctgaatt taccaacttt gaagctgggc tcaaggcaac aatcaagtgg + 21361 tatacagata accaagaatg gtggaaagca gaaaaagaag ctgttgaagc caattatgct + 21421 aagactcagg agattattac agtataaaaa gcaggaaaca gctgcttttt attgctatat + 21481 tgggaagagt tacatattag aaaggtctag agatgatttt aattacaggg gcaaatggcc + 21541 aattaggaac ggaacttcgc tatttattgg atgaacgtaa tgaagaatac gtggcagtag + 21601 atgtggctga gatggacatt accaatgaag aaatggttga aaaagttttt gaagaggtga + 21661 aaccgacttt agtctaccac tgtgcagcct acaccgctgt tgatgcagca gaggatgaag + 21721 gaaaagagtt ggacttcgcc atcaatgtga cggggacaaa aaatgtcgca aaagcatctg + 21781 aaaagcatgg tgcaactcta gtttatattt ctacggacta tgtctttgac ggtaagaaac + 21841 cagttggaca agagtgggaa gttgatgacc gaccagatcc acagacagaa tatggacgca + 21901 ctaagcgtat gggggaagag ttagttgaga agcatgtgtc taatttctat attatccgta + 21961 ctgcctgggt atttggaaat tatggcaaaa acttcgtttt taccatgcaa aatcttgcga + 22021 aaactcataa gactttaaca gttgtaaatg accagtacgg tcgtccgact tggactcgta + 22081 ccttggctga gttcatgacc tacctagctg aaaatcgtaa ggaatttggt tattatcatt + 22141 tgtcaaatga tgcgacagaa gacacaacat ggtatgattt tgcagttgaa attttgaaag + 22201 atacagatgt cgaagtcaag ccagtagatt ccagtcaatt tccagccaaa gctaaacgtc + 22261 cgctaaactc aacgatgagc ctggccaaag ccaaagctac tggatttgtt attccaactt + 22321 ggcaagatgc attgcaagaa ttttacaaac aagaagtgag ataagtagta gaatgatttt + 22381 ctagtctaat aaaagaggca gataatgaac tccaaaggag cttaagatgt acgattatct + 22441 tgttgttggt gctggtctct ttggcgcata gctttggctc agtttctatt atcgctcaca + 22501 tcatccatca gaagattaat ctgaaggtac ccaattatcg ccaagaagaa gattgggcta + 22561 ggatgggttt accaatcaca cgtaaggaaa tctctaattg gcatatcaag gcaagtcaat + 22621 actatttaga gtccctttat aaccttttac gagaaaagtt gttagaacaa cctcttcttc + 22681 atgcggatga aacctcttat cgggttctag agagtgatag ccatctgacc tactattgga + 22741 cctttttgtc tgggaaagct gagaatcaag caatcacgct gtaccatcat gatcagcgtc + 22801 ggagtggttt agtagtccaa gaattcctag gagattattc tggctatgtg cattgtgata + 22861 
tgttgcggca gtaacttagg actttagtcc tctagttctg cctatgcgat agcagtccaa + 22921 ggtttaggag caaggcgacg ctaagcttgg taaactgcga acctctagaa gcttatcgtc + 22981 aactggaaga agctgaactt gttggatgtt gggcacatgt gagaaggaag ttttttgaag + 23041 cgacccccaa gcaagcagat aaatcatcct tagaagctaa aggtttagct tattgtgatc + 23101 agttattttc cctggaaaga gactgggagg ctttgccagc tgatgaacga ctacagaaac + 23161 gtcaagaaga gctccaaccc ctaatggaag acttctttgc ttagtgccgg cgtcagtcag + 23221 ttttagcagg ttcaaaacta ggaagggcaa ttgaatacag cctcaagtat gaagaaacct + 23281 ttaagactat tttgaaagac ggacatctgg tcctttccaa taatctagct gaacgcgcca + 23341 ttaaatcatt ggttatggga cggagtaaaa gagttcagtg gactctttta gcctaagcta + 23401 aattttaaaa agcgagggtg gttattttct caaagttttg aaggagctaa agcaacagct + 23461 attattatga gtttgttgga agcagctaaa cgtcatcaat taaatagcga gaaatatcta + 23521 ttctatcttc tagaatgtct tccaaacgag gaaactctcg taaacaaaga ggttttagag + 23581 gcttatttac catggactaa agttgtacaa gaaaagtgca aataagaaat ctccagatta + 23641 ggaactatcc gtgagttctc tagtctggag atttttcaat atacttcgtt attgggcgct + 23701 tacaatgata ttcatatttt ttgcaaagat gttgtttgaa aaataatttt caaaaattct + 23761 gaaaattctg ttgacaactt tctgaaaaga gtctataatg gagagaaagt tttaaaggag + 23821 aaaatgatga aaagttcaaa actatttgcc cttgcgggcg tgacattatt ggcggcgact + 23881 actttagctg catgctctgg atcaggttca agcgctaaag gtgagaagac attctcatac + 23941 atttatgaga cagaccctga taacctcaac tatttg +// + diff --git a/public/res/serotype_genbank/serotype_24C.gb b/public/res/serotype_genbank/serotype_24C.gb new file mode 100644 index 0000000..d067314 --- /dev/null +++ b/public/res/serotype_genbank/serotype_24C.gb @@ -0,0 +1,858 @@ +LOCUS MW683298 23524 bp DNA linear BCT 08-MAY-2021 +DEFINITION Streptococcus pneumoniae strain MNY585 capsular polysaccharide gene + locus, partial sequence. +ACCESSION MW683298 +VERSION MW683298.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. 
+REFERENCE 1 (bases 1 to 23524) + AUTHORS Ganaie,F., Maruhn,K., Li,C., Porambo,R.J., Elverdal,P.L., + Abeygunwardana,C., van der Linden,M., Duus,J.O., Sheppard,C.L. and + Nahm,M.H. + TITLE Emergent Streptococcus pneumoniae serogroup 24 has a new serotype + (24C) with a variable structure + JOURNAL Unpublished +REFERENCE 2 (bases 1 to 23524) + AUTHORS Ganaie,F., Maruhn,K., Li,C., Porambo,R.J., Elverdal,P.L., + Abeygunwardana,C., van der Linden,M., Duus,J.O., Sheppard,C.L. and + Nahm,M.H. + TITLE Direct Submission + JOURNAL Submitted (26-FEB-2021) German National Reference Center for + Streptococci, Department of Medical Microbiology, University + Hospital RWTH Aachen, Pauwelsstrasse 30, Aachen 52074, Germany +COMMENT ##Assembly-Data-START## + Assembly Method :: SPAdes v. 3.11.1 + Sequencing Technology :: Illumina + ##Assembly-Data-END## +FEATURES Location/Qualifiers + source 1..23524 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="MNY585" + /serotype="24C(24X)" + /isolation_source="blood" + /db_xref="taxon:1313" + /collection_date="08-Dec-2012" + misc_feature <1..>23524 + /note="capsular polysaccharide gene locus" + gene <1..134 + /locus_tag="MNY585_0001" + CDS <1..134 + /locus_tag="MNY585_0001" + /note="dexB" + /codon_start=3 + /transl_table=11 + /product="DexB" + /protein_id="QUP73981.1" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVELL" + gene 299..466 + /gene="aliB" + /locus_tag="MNY585_0002" + /note="unknown" + /pseudo + gene complement(459..797) + /gene="tnp" + /locus_tag="MNY585_0003" + /note="unknown" + /pseudo + gene 1210..2664 + /gene="wzg" + /locus_tag="MNY585_0004" + CDS 1210..2664 + /gene="wzg" + /locus_tag="MNY585_0004" + /note="member of homology group 0; wzg" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="QUP73982.1" + /db_xref="GOA:Q4K0C4" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K0C4" + 
/translation="MLIMSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNI + LAFRYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGL + TNRLNATSNYSEYSLSVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKLSQNT + DLTVDQSSSYLVAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKV + EAPKTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPI + ADGGNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVH + NDQEFSALHGKFHFPVGNVHLDSEQALSFVRERYSLADGDRDRGRNQQKVIVAILQKL + TSTEALKNYSTIIDSLQDSIQTNMPLETMIDLVNAQLESGGTYKVNSQDLKGTGRMDL + PSYAMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + gene 2666..3397 + /gene="wzh" + /locus_tag="MNY585_0005" + CDS 2666..3397 + /gene="wzh" + /locus_tag="MNY585_0005" + /EC_number="3.1.3.48" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="QUP73983.1" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLGKKRIPTLNDS + RYALIEFSMNTLYRDIHSALNKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRVQYFLERDLVHVVASDMHNLDSRPPYMQQAYDIIA + KKYGAKKAKELFVDNPRKIIMDQLI" + gene 3406..4098 + /gene="wzd" + /locus_tag="MNY585_0006" + CDS 3406..4098 + /gene="wzd" + /locus_tag="MNY585_0006" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="QUP73984.1" + /translation="MQDQNTLEIDVFQLFRALWKRKLVILLVAIITSSVAFAYSTFVI + KPEFTSTTRIYVVNRNQEEKSGLTNQDLQAGSYLVKDYREIILSQDVLEEVVSDLKLD + LTPKGLANKIKVTVPVDTRIVSVSVNDRVPEEASRIANSLREVAAQKIISITRVSDVT + TLEEARPATSPSSPNIKRNTLIGFLAGGIGTSVIVLLLELLDTHVKRPEDIEDTLQMT + LLGVVPNLSKLK" + gene 4108..4791 + /gene="wze" + /locus_tag="MNY585_0007" + CDS 4108..4791 + /gene="wze" + /locus_tag="MNY585_0007" + /EC_number="2.7.10.1" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="QUP73985.1" + /translation="MPTLEIAQKKLEFIKKAEEYYNALCTNIQLSGDKLKVISVTSVN + PGEGKTTTSVNIARSFARAGYKTLLIDGDTRNSVISGVFKSREKITGLTEFLSGTADL + SHGLCDTNIENLFVIQSGSVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTPPIGIVI + 
DAAIITQKCDASILVTATGEANKRDVQKVKQQLEQTGKLFLGVVLNKLDISVDKYGVY + GSYGNYGKK" + gene 4807..6174 + /gene="wchA" + /locus_tag="MNY585_0008" + CDS 4807..6174 + /gene="wchA" + /locus_tag="MNY585_0008" + /note="initial sugar transferase" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA" + /protein_id="QUP73986.1" + /translation="MDEKGLKIFLAVLQSIIVILLVYFLSFVRETEVERSSMVILYLL + HFFVFYFSSYGNNFFKRGHLVEFNSTIRYIFFFAIAISVLNFFIAERFSISRRGMIYF + LTLEGISLYLLNFLVKKYWKHVFFNLKNSKKILLLTVTKNMEKVLDKLLESDELSWKL + VAVSVLDKSDFQHDKIPVIEKEKIIEFATHEVVDEVFVNLPGESYDVGEIISRFETMG + IDVTVNLKAFDKNLGRNKQIHEMVGLNVVTFSTNFYKTSHVISKRILDICGATIGLIL + FAIASLVLVPLIRKDGGPAIFAQTRIGKNGRHFTFYKFRSMRIDAEAIKEQLMDQNTM + QGGMFKIDNDPRVTKIGRFIRKTSLDELPQFWNVFIGDMSLVGTRPPTVDEYDQYTPE + QKRRLSFKPGITGLWQVSGRSKITDFDDVVKLDVAYIDNWTIWKDIEILLKTVKVVFM + RDGAK" + gene 6205..7377 + /gene="wchF" + /locus_tag="MNY585_0009" + CDS 6205..7377 + /gene="wchF" + /locus_tag="MNY585_0009" + /codon_start=1 + /transl_table=11 + /product="putative rhamnosyl transferase WchF" + /protein_id="QUP73987.1" + /translation="MKKSVYIIGSKGIPAKYGGFETFVEKLTAFQQDKAIQYYVACMR + ENSAKSGTTEDVFEHNGAICYNVDVPNIGPARAIVYDIAAINRAIKIAKENKDEDPIF + YILACRIGPFIHGIKKKIQAIGGTLLVNPDGHEWLRAKWSAPVRRYWKISEGLMVKHA + DLLVCDSKNIEKYIQEDYKQYQPKTTYIAYGTDTTRSILKSSDEKVRSWFKEKNVSEN + EYYLVVGRFVPENNYESMIRGFLASNSKKDFVLITNVEQNKFYNQLLAKTGFDKDPRV + KFVGTVYEQELLKYIRENAFAYFHGHEVGGTNPSLLEALASTKLNLLLDVGFNREVGE + QSAIYWKKDELSQVIEKVEQFDAKMIDELDRQSNQRIADSFTWEKIVTDYEKVFKG" + gene 7383..8279 + /gene="wcxG" + /locus_tag="MNY585_0010" + CDS 7383..8279 + /gene="wcxG" + /locus_tag="MNY585_0010" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="QUP73988.1" + /translation="MAVKLKYDKSDITFLDDDELKKYQSELLKMISDVFTFFDENRIA + YSLSGGSILGAIRHKGFIPWDDDVDINIPRESYDKLFSLFELDNSLSRKYYLQSAKSH + PELGLHVSQIRKKGTVARRKYDHSAEECGISIDLYIVENVYNNPVKRFFQGYTSMFLT + FALASVRETKNHALMKEMFRLEGRKLNYSAGKLMVGWFFGIIPIEKWLNWLDKCNSSC + 
KDSHTKYVSIPTGRKHFRRETYLRENMNIYKKVPFETLMVNVPVWSEEYLEMFYGKDY + MVVPPVDKREQHLFLELSYGEE" + gene 8280..8999 + /gene="abpA" + /locus_tag="MNY585_0011" + CDS 8280..8999 + /gene="abpA" + /locus_tag="MNY585_0011" + /note="arabinitol" + /codon_start=1 + /transl_table=11 + /product="putative IspD-family transferase Abp1" + /protein_id="QUP73989.1" + /translation="MKVAILTASGIGSRIGQDIPKQFIHVENKPVIIYTLEKFQNHPE + IDEICIVILKGWDQMVKAYAEQFGITKLKMITFGGKSGQESIYNGLREVKKAHPNDDV + TVLIHDGNRPLVSNDIISNALATYQQFGNAVAAIPTTEVVFVLENPQSTSSTEALNRD + LLRRTQTPHVYHLDNILSLHEKALENGITDVAASCQLMQLFGEKSYFSLGTEKNLKIT + TVEDLDIFKALLSSTRDKWIK" + gene 9002..10057 + /gene="abpB" + /locus_tag="MNY585_0012" + CDS 9002..10057 + /gene="abpB" + /locus_tag="MNY585_0012" + /note="arabinitol" + /codon_start=1 + /transl_table=11 + /product="putative dehydratase/epimerase Abp2" + /protein_id="QUP73990.1" + /translation="MTLLLNKIYRQDVESSLETIVNINDLNGKSILITGASGLIGSSV + IDQLLLLNEIRNFNIKIFCCGREFESLEKRFGRQTEYLHFVFYDATKAPHFDFAVDYI + IHAASPASPELYVNQPVETMASNFLGMYNLLEYAKNAKVSNLVYISSSEVYGISTSNN + PLDENYIGTVDHLSVRSSYASSKRATEILCVSFASEYGIKIMIVRPGHIYGPSAKDSD + NRVSSFFMTEAIAGRDIVIKSTGSQLRSYCYSLDCASAILSVLLSGGSGQAYNVSNPN + SIITIKQMATCIADASGVRVLYDIPITQERKRENPMVNASLDSEKIESLGWSGLFSAE + VGFHHTFSILKELSSEK" + gene 10071..10271 + /gene="HG26X" + /locus_tag="MNY585_0013" + /note="unknown; label: HG26X" + /pseudo + gene complement(10269..10451) + /gene="tnp" + /locus_tag="MNY585_0014" + /note="unknown" + /pseudo + gene 10791..12041 + /gene="wzy" + /locus_tag="MNY585_0015" + CDS 10791..12041 + /gene="wzy" + /locus_tag="MNY585_0015" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="QUP73991.1" + /translation="MIDGDFMNRRLVIKKKSIMFFMLMLCVTAFYGTNYWYTNIYIYD + FMIITSCLLSIIVFVCNGIRIDKTYYKGTIILGIVMWFSGLIAAQGKGLPAIVIFKES + LYTITPIMIFLAFRPMIKSIKDTSLFLRTISAAGVICNLIACIEMFFAKRGFDFLNIS + VFEKLRNGTPRFTIGETIIVLSFFISCSVVFSKGGKRNRRIFHVLNIALTAINLVYII + KTRTLNLYILSTLMMVPVLKKNVKKQLKFCIVFLISIILTFVSAEYFIPIVKNLIHSD 
+ HGIQIRFLTIEYYIEYFKNHYLFGAGYISSSPYFETYSIVTGPLGRYYPSDVGLIGLM + FRSGIIGLIWLISWFYTSLKIIKDNTIRIPAHYDLLMKLVIVFLMFSCINLIITDAPR + FPYIALAMLLFESSYTLSYENSSN" + gene 12080..13003 + /gene="wcxI" + /locus_tag="MNY585_0016" + CDS 12080..13003 + /gene="wcxI" + /locus_tag="MNY585_0016" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="QUP73992.1" + /translation="MIKRLAILMATYNGEKYIKEQIESILNQDTDFDFTLIIRDDGST + DNTKNIIREYVDSGKIIFIEGQNKGAARGFISLLCDNPGYDYYAFSDQDDVWNHNKLQ + KGIWSLSKYTGPALYCSNCELVDSELNSIGRNTHRKRPNYTLESILCLASCAQGCTSV + FNKELASIIQENDVPDTFIMHDSLITCLCALIGGKIIYDEIPSMKYRMHDDNIFGMVS + AKQNVLNVIKDRISEITKKRTISMYDQAECLLKVYKKYIDSNNQDICRIVIDSKVSLK + ARLKLIFNKNLQHTTLNKTITKKLEILFGND" + gene 13019..13798 + /gene="wcxJ" + /locus_tag="MNY585_0017" + CDS 13019..13798 + /gene="wcxJ" + /locus_tag="MNY585_0017" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="QUP73993.1" + /translation="MKYQLIVSTMNQQDNSLIEKMNIKSDAIIINQSNSFSYHETKLK + NSIVKWYEFNERGIGLSRNTGFMRSDADIIQFADDDMIFTDTYYEDVLLEYQKHPEAD + VILFSNKCLNEDRMPYQVNNFRRINRFEGVKFGGARITVRREKILHNNITFSLLFGGG + AKYGAGEDVTFIQDCIKAGLRVYKSPIIVSTMKQDSSTWFKGYDRKYYKDKGALLAAN + FPSISEVGVYIQAFKNRGGIYTFSELLRFYKEGVNEFKINR" + gene 13808..14368 + /gene="wcxKs" + /locus_tag="MNY585_0018" + CDS 13808..14368 + /gene="wcxKs" + /locus_tag="MNY585_0018" + /note="member of homology group 115; wcxKs" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="QUP73994.1" + /db_xref="GOA:Q4K0B2" + /db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4K0B2" + /translation="MIKSFLIMPKNKVYNTGETDIELKNKYNYEGSELRKVQVRMIDM + LSFLNDICKENNITYFIAFGTLLGAIRHGGFIPWDDNLYIYIYINDKGLKKLRKIINN + GNYPYVIQDYSSDKGFVRYYSVLRDTNSEYIKNEYQHNQRKYRGVQIDLFPYGYGVMK + WGERLIGKIYGFNEKIFLGKIKCWQH" + gene 14353..14970 + /gene="wzys" + /locus_tag="MNY585_0019" + CDS 14353..14970 + /gene="wzys" + /locus_tag="MNY585_0019" + /note="fragment" + /codon_start=1 + 
/transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="QUP73995.1" + /translation="MLAALIFYLTKEVIIPFLKVISKINGRKKVIYWLLTILGLWMIT + LTPIFENIVGAILKVDGVGRGSDSLTIRAIGRQLYWEQLNETTLKLLFGTGYPNYNYA + LAFQRTGFFKQYFFNRQWFYDIYIFGIVGSSIMGLLFLKYLKNSIKYDRQSADMIPLM + YIISLLIVAYNIILWYWNADGTFILVIMICALEHGEQLLHQKNGV" + gene 14975..16927 + /gene="rbsF" + /locus_tag="MNY585_0020" + CDS 14975..16927 + /gene="rbsF" + /locus_tag="MNY585_0020" + /codon_start=1 + /transl_table=11 + /product="putative phosphotransferase" + /protein_id="QUP73996.1" + /translation="MNLNKEVRWKDKQYIAFDFFDTTIHRNCHPEVILFEWSKKISIY + FSFKISATEIYSIRKKSEIHEKQEKQLEEIKYERLLQLVFYTILSRLKSDVTDYNLED + FLIYARTCEEEIELRHISIDTDTINFIEFLKQNGKKIILISDFYSDKKLIEKLMVSLG + IRDYFSKIFISSEIGLRKSSGNLYEYVINELSCKPINLLMIGDNIYSDVKVPKKLGID + SYHKSYSDSHVTVSPNDIVKAMNNVISQACTESLFNLYIPEILYFISKLYKELSVNKA + SDILFCSREGFFIKKLFDLYQKKMNLKLINSHYFYVSRKSTLYPSFKNIEDEDFEVIF + RQFPEITLENFLINLNFSNNDINNIAKQTEIKQTDKVSDKSIINKLKQNKLFKDVYEL + NCKEEKYSFREYLKSVGVENDNSIINMVDIGWKGTIQDNIQKAFPSLNIKGYYMGLNF + QRYSTRNSMNKTGILFTDDPQKTKFFNLFNYKYLFYERIFVADHGPTVRYEFMNGVGV + PTLDTDENHIEIYRFAEEFQITFFNTFEKILDLFNESLVTPDELFNEIANLSLKKHCI + YLPRLSVSIKKLDRAAKENFGIIKSTNRNSDNKVRNFWKNRDFLFLDYIYKAYGKNRL + LNPILDIYGYFVYLIKTLQIKIVGDI" + gene 16927..18384 + /gene="wzx" + /locus_tag="MNY585_0021" + CDS 16927..18384 + /gene="wzx" + /locus_tag="MNY585_0021" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="QUP73997.1" + /translation="MSMKEKSISKNAILNIILTLTNIVFPLITFPYISRILNPSGIGA + ISFFSSIGSYGVLVASLGISTYGIRVIAKNRYHKDKITKIFQELIVINSVMSIIVTFF + LVLMSFRLEQLSSEKGLLIITCITILSSPFNLNWFYSGIEEYSYITKRSIFFKLVLLI + LTFLFVKSKDDYIIYAVIILFSTLASNFINILESRKYINFNLRRNLEFRYHLKPMWYL + FASLLAVNIYTNLDSVMLGIINGNDAVGIYSIASKVKWILLSVVTSVSLVLLPRLSFY + SNKYDETKFNNILRKSSTIIFMISIPLTIFFMIKAKESILLLGGEQYIQAVLAMQILM + PILIISGFSNIIGNQILIPTGNEKYFMRAVSIGAIVNLCLNLLLMPILGIIGGAIATL + CAESVQMIIQFYFSRNKLMGNISLNSIKKVAYSSIFAGILLIVIQNIIENFNSFLNLA + ASSFLYFGVYFFLLVLFKESTIKKFLNQIFYKDIS" + 
gene 18557..19426 + /gene="rmlA" + /locus_tag="MNY585_0022" + CDS 18557..19426 + /gene="rmlA" + /locus_tag="MNY585_0022" + /EC_number="2.7.7.24" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="QUP73998.1" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLPRFKELLQDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFIGDDSV + ALILGDNIYHGPGLSKMLQKAAKKEKGATVFGYHVKDPERFGVVEFDENMNAISIEEK + PEYPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLTLAQPLKKN + EYGQYLLRLIGEA" + gene 19427..20023 + /gene="rmlC" + /locus_tag="MNY585_0023" + CDS 19427..20023 + /gene="rmlC" + /locus_tag="MNY585_0023" + /EC_number="5.1.3.13" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="QUP73999.1" + /translation="MTDNFFGKMLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPASFFAAGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKHHPLLKDVKPLKKEDLE" + gene 20033..21082 + /gene="rmlB" + /locus_tag="MNY585_0024" + CDS 20033..21082 + /gene="rmlB" + /locus_tag="MNY585_0024" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="QUP74000.1" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPDVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAAD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKTEKE + AVEANYAKTQEIITV" + gene 21148..21999 + /gene="rmlD" + /locus_tag="MNY585_0025" + CDS 21148..21999 + /gene="rmlD" + /locus_tag="MNY585_0025" + /EC_number="1.1.1.133" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="QUP74001.1" + 
/translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAKMDITNEEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNIAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + gene 22349..22582 + /gene="glf_1" + /locus_tag="MNY585_0026" + CDS 22349..22582 + /gene="glf_1" + /locus_tag="MNY585_0026" + /EC_number="5.4.99.9" + /note="glf 1" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="QUP74002.1" + /translation="MNTFNKLWGVVTPAEAQAKIEEQRAILNGKTPENLEEQAISLVG + TDIYEKLIKDYTEKQWGKSTTELPSFIIVCQYA" + gene 22656..23159 + /gene="glf_2" + /locus_tag="MNY585_0027" + CDS 22656..23159 + /gene="glf_2" + /locus_tag="MNY585_0027" + /EC_number="5.4.99.9" + /note="glf 2" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="QUP74003.1" + /translation="MLDHENIDVETNVDFFVNKEQYLKDFPKIVFTGMIDEFFDYKLG + ELEYCSLRFENETLDMENYQGNAVVNYTDAETPYTRIIEHKHFEFGSQAKTIITKEHS + KTWEKGDEPYYPVNNDRNNHLYKSYKKLADEQGNVIFGGRLGHYRYYDMHQVIGAALQ + CVRNELD" + gene 23477..>23524 + /gene="aliA" + /locus_tag="MNY585_0028" + CDS 23477..>23524 + /gene="aliA" + /locus_tag="MNY585_0028" + /codon_start=1 + /transl_table=11 + /product="AliA" + /protein_id="QUP74004.1" + /db_xref="UniProtKB/TrEMBL:Q4K1C2" + /translation="MMKSSKLFALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcgta taaaaacaag + 181 ggaggactgt ataaaaggca gaaatccttt gttttttata accaaggttt ataaaccttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga agacgaacat + 301 aaagaagcgt atccttagtg caggcctgac ttttacatct gctttgcttt tagctgcttg + 361 cgaccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaactat ctattagact attacgctga taatatagtc aattgaaaca 
agaacaagac + 481 aaaagagcct cataaaaggt attgcaactt ggtaatacct ttttgaggtg ctttttgata + 541 tgagcccatg ttttctcaat aggattgtac tcaggtgagt agggaggaag aggtaaaagt + 601 ttatgcccaa actcttcgca taaaagttct agcttcccca ttctatggaa tcttgcatta + 661 tccataataa taaccgatgg tgtggttaat gttggtaaga aaaacttctg aaaccatact + 721 tcaaaaaagt cgctcgtcat catctcttcg taagtcattg gagcgattaa ttcaccattt + 781 gttagacctg caaccaaaga aatcctctga tatcttcttc cagatacttt gcctcttctt + 841 aactgacctt ttaatgagcg accatattct cgataaaaat aagtatcgaa tcctgtttca + 901 tcaatctaaa caggtgctag gtgctttaaa ctattaaaat tcttaagaaa taaggctact + 961 tttctgggtc ttgttcataa ttagattgaa actagagtag tagacctctg cttctaaaac + 1021 attgttagaa atcgatttga ctgtcctgat cgatttgtca tgttcttatt tcattttact + 1081 atatttttgt ttcgcgggaa gtctactaag atacttaaag atgcagatag taaaaaaaga + 1141 tgcagatagt aaaaaaatgt agacattacc gtaaaaaagt gatataatca taagatgttc + 1201 aatgtatagg tgttaatcat gagtagacgt tttaaaaaat caggttcaca gaaagtgaag + 1261 cgaagtgtta atatagtttt gctgactatt tatttattgt tagtttgttt tttattgttc + 1321 ttaatcttta agtacaatat ccttgctttt agatatctta atctagtggt aactgcgtta + 1381 gtcttactag tagccttggt agggctactc ttgattatct ataaaaaagc tgaaaaattt + 1441 actatttttc tgttggtgtt ctctatcctt gtcagctcag tgtcgctctt tgcagtacag + 1501 cagtttgttg gactgaccaa tcgtttaaat gcgacttcta attactcaga atattcgctc + 1561 agtgtcgctg ttttagcaga tagtgagatc gaaaatgtta cgcaactgac gagtgtgaca + 1621 gcaccgactg ggactgataa tgaaaatatt caaaaactac tagctgatat caagttaagt + 1681 cagaataccg atttgacagt cgaccagagt tcgtcttact tggttgctta caagagtttg + 1741 attgcagggg agactaaggc cattgtccta aatagtgtct ttgaaaatat catcgagtca + 1801 gagtatccag actacgcatc gaagataaag aagatttata ccaagggatt tactaaaaaa + 1861 gtagaagctc ctaagacgtc taagaatcag tctttcaata tctatgttag tggaattgac + 1921 acctatggtc ctattagttc ggtgtcgcga tcagatgtca atatcctgat gactgtcaat + 1981 cgtgatacca agaaaatcct cttgaccaca acgccacgtg atgcctatgt accaatcgca + 2041 gatggtggaa ataatcaaaa agataaatta acccatgcgg gcatttatgg agttgattcg + 2101 tccattcaca 
ccttagaaaa tctctatgga gtggatatca attactatgt gcgattgaac + 2161 ttcacttctt tcttgaaaat gattgactta ttgggagggg tagatgttca taatgatcaa + 2221 gagttttcag ctctacatgg gaagttccat ttcccagtag ggaatgtcca cctagactct + 2281 gagcaggctc taagttttgt acgtgaacgc tactcactag ccgatggaga ccgtgaccgt + 2341 ggtcgcaacc aacaaaaggt gattgtggct atccttcaaa aattaacgtc aaccgaagca + 2401 ctgaaaaatt atagtacgat cattgatagc ttgcaagatt ctatccaaac aaatatgcca + 2461 cttgagacca tgatagattt ggtcaatgct cagttagaaa gtggtggaac ttacaaagtg + 2521 aattcgcaag acttgaaagg tacaggtcgg atggatcttc cttcttatgc aatgccagac + 2581 agtaacctct atgtgatgga aatagatgat agtagtttag ctgtagttaa agcagctata + 2641 caggatgtga tggagggtag atgaaatgat agacatccat tcgcatatcg tttttgatgt + 2701 agatgacggt cccaagtcaa gagaggaaag caaggctctc ttggcagaat cctacaggca + 2761 gggggtgcga accattgtct ctacctctca ccgtcgcaag ggcatgtttg aaactccgga + 2821 agagaagata gcagaaaact ttcttcaggt tcgggaaata gctaaggaag tggcgagtga + 2881 cttagtcatt gcttacgggg ctgaaattta ctacacacca gatgttctgg ataagctggg + 2941 aaaaaagcgg attccgaccc tcaatgatag tcgttatgcc ttgatagagt ttagtatgaa + 3001 cactctttat cgcgatattc atagcgcctt gaacaagatc ttgatgttgg gaattactcc + 3061 agtcattgcc cacatcgaac gctatgatgc tcttgaaaat aatgaaaaac gcgttcggga + 3121 gctgatcgat atgggctgtt acacgcaagt aaatagttca catgtcctca aacccaaact + 3181 ttttggcgaa cgttataaat tcatgaaaaa aagagttcag tattttttgg aacgtgattt + 3241 agttcatgta gttgcaagtg atatgcacaa tttagacagt agacctccat atatgcaaca + 3301 ggcatatgat atcattgcta agaaatatgg agcgaaaaaa gcgaaagaac tttttgtaga + 3361 taatcccaga aaaattataa tggatcaatt aatttaggag aaaatatgca agatcaaaac + 3421 actttggaaa tcgatgtatt tcaactattc agagctttat ggaaaagaaa gttggtcatt + 3481 ttattagtgg caattataac ttcttcagtt gcttttgcct acagtacttt tgttatcaaa + 3541 cctgagttta ctagtacgac ccggatttat gtagttaacc gtaatcagga agagaaatct + 3601 ggtttaacca atcaagactt gcaggcaggt tcatacttgg ttaaagacta tcgtgaaatt + 3661 atcctatcgc aggatgtttt ggaggaagtt gtttctgatt tgaaactaga tttgacgcca + 3721 aaaggtttgg ctaataaaat taaagtaaca 
gtaccagttg atacccgtat tgtatctgtt + 3781 tcagttaatg atcgagttcc tgaagaggca agccgtatcg ctaactcttt gagagaagta + 3841 gctgctcaaa aaattatcag tattactcgt gtttctgatg tgacaacact ggaggaggca + 3901 agaccggcga catcaccgtc ttcgccaaat attaaacgca atacactaat tggttttttg + 3961 gcagggggga ttggaactag tgttatagtt cttcttcttg aacttttgga cactcatgtg + 4021 aaacgtccgg aagatatcga agatacactg cagatgacac ttttgggagt tgtaccaaac + 4081 ttgagtaagt tgaaatagga gagaggaatg ccgacattag aaatagcaca aaaaaaactg + 4141 gagttcatta agaaggcaga agaatattac aatgccttgt gtacaaatat acagttgagc + 4201 ggagataaac taaaagtaat ttccgttact tctgttaacc ctggggaagg aaaaacaact + 4261 acttccgtaa atatagcaag gtcgtttgcg cgtgcaggct ataaaactct tttgatcgat + 4321 ggcgatactc gaaattcagt tatatcagga gtttttaaat cgcgtgaaaa aattacaggg + 4381 ctaacagaat ttttatctgg gacagctgat ttatctcacg gtttatgtga tacaaatatt + 4441 gaaaatttat ttgtaattca atcgggatct gtatcaccaa accctacggc cttgttacaa + 4501 agtaaaaatt ttaatgatat gattgaaaca ttgcgtaaat attttgatta tatcattgtt + 4561 gatacaccac ctattggaat tgttattgat gcggcaatta tcactcaaaa gtgtgatgcg + 4621 tccatcttgg taacagcaac aggtgaggcg aataaacgtg atgtccaaaa agtgaaacaa + 4681 caattagaac aaacagggaa actgttcctg ggagttgttt taaataaatt ggatatctcg + 4741 gttgataagt atggagttta cggttcctat ggaaattatg gtaaaaaata acttagaaaa + 4801 gattttatgg atgaaaaagg attgaaaatt tttctggcag tattacagag tattattgtc + 4861 attttattgg tttattttct tagctttgtt agagagacag aagttgaacg ttcttcgatg + 4921 gttatactat accttctcca cttttttgta ttctatttta gttcctatgg taacaatttt + 4981 tttaaaagag ggcacctagt tgagtttaat agtactataa gatatatttt tttctttgca + 5041 atagctataa gtgtattaaa cttttttata gcggaacggt ttagtatctc tagaagagga + 5101 atgatatact tcttaacttt agaaggaata tccttatact tgttaaattt cttagtaaaa + 5161 aaatattgga agcatgtgtt ttttaatcta aaaaatagca agaaaatttt actgttaaca + 5221 gtaacgaaaa atatggaaaa agttcttgat aaattgctag aatctgatga actttcatgg + 5281 aaattggtag cagtaagtgt tttggataaa tctgattttc aacatgataa aatacctgta + 5341 attgaaaagg aaaaaattat tgaatttgca acgcatgaag ttgtggatga 
ggtgtttgtc + 5401 aatcttccag gagagagcta cgatgttgga gaaattatct ctaggtttga gacaatgggg + 5461 atagatgtaa ctgtaaatct taaagcattt gataagaatt tgggtcgcaa taaacaaatt + 5521 catgagatgg tgggattgaa tgtagtcact ttctctacaa atttttataa aactagtcat + 5581 gtgatttcaa agagaattct cgatatttgt ggtgccacta ttggccttat tctttttgct + 5641 atagctagtc tagttttagt tccattgatt cgtaaagatg gcggaccagc tatttttgct + 5701 caaactcgta tagggaaaaa tggtcgacat tttacctttt ataaattccg ttcgatgcgg + 5761 atcgatgctg aagctatcaa agaacagttg atggatcaaa atacgatgca aggtggtatg + 5821 tttaagatag acaatgatcc tcgtgttaca aaaattggtc gctttattcg taaaaccagt + 5881 ttggatgaat tgccgcagtt ttggaatgtc tttataggag atatgagttt ggtgggaaca + 5941 cgtccaccta cagtagacga gtatgatcag tatactccag aacagaaacg tcgactcagc + 6001 tttaaacctg gtattacagg tttatggcag gttagcggcc gtagtaaaat aaccgatttt + 6061 gatgatgttg taaaattaga tgtggcttat attgataatt ggacaatctg gaaagatatt + 6121 gaaattttgc ttaaaactgt taaagttgta tttatgagag atggagcgaa gtaatttctg + 6181 tatatccatc atattaggag agaaatgaaa aagtcagttt atatcattgg ttcaaaagga + 6241 attcctgcta agtatggagg atttgaaact tttgttgaaa aattaacagc cttccaacaa + 6301 gataaggcta tccaatatta tgtggcttgt atgcgtgaaa actctgcaaa atcagggact + 6361 actgaggatg tttttgaaca taatggtgct atctgttata acgtcgatgt tcctaatatt + 6421 ggtccagcgc gagccatagt atatgatatc gcggcaatta acagagctat taaaattgcc + 6481 aaagaaaata aggatgaaga tccaatcttc tatattctag cttgtcgaat cggtccgttc + 6541 atccatggaa ttaagaaaaa aatccaggcg ataggtggga ctcttctagt taatccagat + 6601 ggtcacgagt ggttacgagc taagtggagc gctccagttc gtcgttattg gaaaatttcc + 6661 gaaggtctta tggtcaaaca tgcagatctt ttagtgtgtg atagtaagaa tattgaaaaa + 6721 tatatccaag aagattataa acagtatcaa cctaagacaa cctatatcgc ttatgggact + 6781 gatacaacac gctccatatt aaagagtagt gacgaaaaag tacgttcttg gttcaaagag + 6841 aagaatgttt ctgagaacga gtattatcta gttgtaggac gttttgtacc agaaaacaac + 6901 tatgaatcta tgattcgtgg ctttttggca tctaactcta agaaggactt tgtcttaatc + 6961 acaaatgtag aacagaataa attttataat cagttgttgg caaaaactgg ttttgataag + 7021 gacccacgag 
taaaatttgt aggtacagtc tatgagcaag agcttcttaa atatattcgt + 7081 gaaaacgcct ttgcttactt ccacgggcat gaagttggtg gaaccaatcc ttcactttta + 7141 gaagctctgg catcaactaa actgaattta ttgctagatg ttggctttaa ccgagaagtt + 7201 ggggagcaaa gtgcgattta ttggaaaaaa gatgagcttt cccaagtaat cgagaaagtt + 7261 gaacaatttg atgcaaaaat gattgatgag ttagatagac aatcaaatca gagaattgcg + 7321 gattctttca cttgggaaaa gattgtcaca gactacgaga aagtatttaa aggttagagt + 7381 taatggcagt aaaattaaaa tatgataaat cagatattac atttttagat gatgacgaat + 7441 tgaaaaaata ccaatcagaa ttgttgaaaa tgatatcaga tgtgtttact ttttttgatg + 7501 aaaataggat agcgtattct ttaagtggag gtagcatttt aggggcaatc cgtcataaag + 7561 ggtttatccc ttgggatgat gatgttgata tcaatattcc gagggaaagt tacgataaac + 7621 tattttctct atttgagtta gacaatagtc ttagtcgtaa atattatctt caatcagcaa + 7681 aaagtcatcc agaattggga cttcatgttt ctcaaattag aaaaaaagga acagttgctc + 7741 gtaggaaata cgatcattcg gctgaggagt gcggtatttc tatagatctt tacattgtag + 7801 aaaatgtata caataatcca gtgaaacgat tctttcaagg ttatacaagt atgtttttga + 7861 cttttgcctt ggcttctgta cgagaaacaa agaatcatgc cctgatgaag gaaatgttta + 7921 gactggaagg tagaaaacta aattattcag ctggaaagtt aatggttggt tggttttttg + 7981 gaattattcc aattgaaaag tggttgaatt ggcttgataa atgtaattca agctgtaagg + 8041 attcacatac aaaatatgta tccataccta caggaaggaa acactttaga cgcgagactt + 8101 acttgcgaga gaatatgaat atttataaaa aggttccttt tgaaactttg atggtgaatg + 8161 ttcctgtttg gtcagaagag tatttagaaa tgttttacgg taaagattat atggtcgttc + 8221 ctcctgttga taagagagag caacatttgt ttttagaatt gagttacgga gaagaataga + 8281 tgaaagtagc gattttaaca gcttcaggca ttggaagccg aattggtcaa gatatcccta + 8341 aacaatttat tcatgttgaa aataagccag tcattatcta tacccttgaa aaatttcaaa + 8401 atcatccaga aattgatgaa atctgtattg ttattttaaa aggctgggat cagatggtta + 8461 aagcttatgc ggaacaattt ggaattacaa agttaaagat gataactttt ggggggaagt + 8521 ctggtcaaga atcaatttat aacggtctta gagaagttaa gaaagctcat cccaatgatg + 8581 atgtgactgt attaattcat gacgggaatc gtcctttagt gagcaatgat attattagca + 8641 acgctttagc aacataccaa cagtttggaa 
atgctgttgc agcgatacca acgactgagg + 8701 tagtatttgt tttagaaaac ccacaatcaa cttcgtccac agaagcattg aatcgtgact + 8761 tgttgagacg aacacaaact cctcatgttt accatcttga taatattcta tcgcttcatg + 8821 aaaaagcatt agaaaatggg ataactgatg ttgcagcatc atgccaactc atgcaactat + 8881 ttggtgaaaa gagttatttc tctcttggaa cagagaaaaa cttgaaaatt acgactgtag + 8941 aagatctcga tatttttaaa gccttattga gttcaactcg agataagtgg attaaatagt + 9001 aatgacatta ttattaaata aaatatatag acaagatgta gaatcttctc tagaaacaat + 9061 cgtcaatatt aatgacttga atggcaagtc aattttaatt actggagctt ctggtttgat + 9121 tggttcaagt gtcattgacc agttattatt gctaaatgaa ataaggaatt ttaacattaa + 9181 aattttttgt tgtggaagag agtttgaatc attagaaaaa cgatttggta gacaaacaga + 9241 gtatttacac tttgtgttct atgatgcgac taaagcacct cactttgatt ttgcagtgga + 9301 ctacattatt catgctgcta gtcctgctag tcctgaatta tacgttaatc agcctgtaga + 9361 aacaatggct agtaattttc tgggtatgta taatctactg gaatacgcca aaaatgctaa + 9421 agtttcaaat ctagtttata tctcatctag tgaagtttat ggaattagca ctagtaataa + 9481 tcctttggac gaaaattata ttggaactgt tgatcatctt agcgtacggt cttcttatgc + 9541 cagttcaaaa agagctactg aaatactttg tgttagtttt gcttccgagt atggaatcaa + 9601 aataatgata gtaaggccag gacatatcta tggtcctagt gccaaggact ctgataatcg + 9661 tgtatcatca ttttttatga cagaagcgat tgctgggcgt gatattgtca taaaaagtac + 9721 aggtagtcag ttaagatcct attgttatag tttggattgt gccagtgcaa ttctaagtgt + 9781 tcttctttcg ggtggatcag gacaagctta taatgtttcc aatccaaatt caattattac + 9841 tataaaacag atggcaactt gcattgcaga tgcttcagga gtcagagttc tttatgatat + 9901 acctataact caagagcgaa agcgggaaaa tcctatggta aatgcaagct tagatagtga + 9961 gaaaattgag tccttgggat ggtcaggtct attttcagct gaagtaggct tccatcacac + 10021 atttagtatt ttaaaggagt tatcaagtga aaaatgatag tattttaatc atgatgacaa + 10081 catacaatgg agaagaattt atacgtgaac agttggagag tatccttttt caaaccatta + 10141 cagcatggaa actatagatt cgtgatgaca attctagtga tcaaataaga gcaattatta + 10201 aagaatacga agaaaaagat agtcaatttt tgatataagc tatccaagag gattttggag + 10261 aagttttttt attgaagagt ggccttaaga aggtcttcta ggcttaattt 
aggtttttgt + 10321 ccaccttttg cgtgtttaag ttgataagct gtttttaata cagctaacat ctcttcaaaa + 10381 atggtacgct gaacgtcaac aagacgctta aatcgtacat cagttagttg tttacttgct + 10441 tcataattca tagaactatt ataccatatt ttatttcgca ggaaatctat tgaaaaaacg + 10501 acactatatt atcaatgggg atgttaggac tatatgttaa aaacatgcga gagtatcttt + 10561 tgttatgaat attatgagag tacatagaaa gatagagatt ccactgatgg aattttatag + 10621 agaagggaaa actgtattta tttggatata ttgaactccg tggaatggat tgattagggt + 10681 atgtacatat ggtaaatgga tgtaacccgc aaacagaaca cggatggagt acacatttgc + 10741 taattacaga gattcattga aaaatattag agtttcaaat aggaaaagta atgattgacg + 10801 gagattttat gaatagaaga cttgtaataa aaaagaaaag tataatgttt ttcatgctta + 10861 tgttatgtgt tacggcattt tatgggacaa attattggta tacaaatata tatatatatg + 10921 attttatgat tataacatca tgcttattat caataatagt atttgtatgt aatggtatta + 10981 gaattgataa aacatattat aaagggacaa taatactggg tattgtaatg tggttttcag + 11041 gacttattgc tgcacaagga aaagggctcc ctgctattgt aatctttaaa gagagtttat + 11101 atactattac tccaataatg atatttttag ctttccgacc tatgataaag tcaataaaag + 11161 acacttcatt attccttcgt actatttctg ctgccggtgt tatatgtaat ttaattgctt + 11221 gtattgaaat gttctttgcc aaaagaggat ttgattttct aaatataagt gtatttgaaa + 11281 aacttagaaa tggtactcct agatttacaa ttggagaaac aataatagtt cttagttttt + 11341 ttatctcctg tagtgttgtt tttagtaaag ggggaaagag aaatagacgc attttccatg + 11401 ttctaaatat agctctcaca gctataaatt tagtgtatat tattaaaaca aggacactga + 11461 atttatatat tttatcaaca cttatgatgg tgcctgtttt aaaaaaaaat gtaaagaaac + 11521 aacttaagtt ttgtattgtg tttttgatat ctataattct tacttttgtt tctgcagaat + 11581 attttattcc aatagtcaaa aatttaattc atagtgatca tgggattcaa attagattct + 11641 tgacgataga atactatata gagtatttta aaaatcatta cttatttgga gcgggatata + 11701 tttcttctag tccatatttt gaaacttatt ctattgttac cggtccatta ggacgttatt + 11761 atccaagcga tgtaggtttg attggactta tgtttagaag tgggattatc gggctaattt + 11821 ggttaataag ttggttttat acaagcttga agataattaa agataatacg attagaattc + 11881 cagctcatta tgacttatta atgaagctag ttatagtttt tttgatgttt 
tcttgtatta + 11941 atttgataat cactgatgca cctagattcc catatattgc attagctatg ttactttttg + 12001 aatcaagtta taccttgagt tatgaaaaca gttctaatta gaatgtattt cagatagtta + 12061 ttttaaagga tgaggggaaa tgattaagag attagcaata cttatggcca catataatgg + 12121 cgaaaaatat ataaaagagc aaattgaaag tattctcaac caagatacag attttgattt + 12181 tactctaatt attagagatg acggttcaac agataatact aaaaatataa ttagagaata + 12241 tgttgatagt gggaaaatta tttttataga aggccagaat aaaggggcgg caagaggatt + 12301 tatttctttg ttatgtgata atcctggata tgattactat gctttctcgg atcaagatga + 12361 tgtttggaat cataataaat tacagaaagg tatatggagt ctttccaaat atactgggcc + 12421 agcactttat tgttctaatt gtgaattagt tgattcagag ttaaatagta taggtcgtaa + 12481 tacacatagg aagagaccga actatactct tgaatctatt ctttgtcttg ctagttgtgc + 12541 acaaggatgt acatctgtat ttaataaaga gctagcttcg ataattcagg agaatgatgt + 12601 gcctgatact tttattatgc atgattcttt gattacttgt ttatgtgcac tgataggtgg + 12661 aaagataatt tacgacgaaa ttccatcaat gaaatataga atgcatgatg ataatatatt + 12721 tggaatggtg tcagctaagc aaaatgtact aaatgttata aaagatcgta ttagtgaaat + 12781 aacaaaaaag cgaacgatta gtatgtacga tcaagcagag tgtttactaa aggtttataa + 12841 aaaatatata gattctaaca atcaagatat atgtagaatt gttattgatt ctaaagtatc + 12901 gctaaaggca agacttaagc tgatttttaa taaaaatttg cagcatacta cattaaataa + 12961 aaccataaca aaaaaattag agatattatt tggcaatgac taataaagga gtttagatat + 13021 gaagtatcaa ctcattgtat caacaatgaa tcaacaggat aacagtctga tagagaaaat + 13081 gaatataaaa tctgatgcaa ttatcattaa tcaatcaaac tcattttctt accatgagac + 13141 gaaattgaaa aattcgattg taaaatggta tgaattcaat gaaagaggta ttggtttaag + 13201 tcgaaacaca ggtttcatga gatcggatgc tgatattatt caatttgctg atgacgatat + 13261 gatttttaca gatacatatt atgaagacgt attattagaa tatcaaaaac atccagaagc + 13321 tgatgtaatt cttttttcga ataaatgtct taatgaagat cgaatgcctt atcaggttaa + 13381 taattttaga cgtataaata ggtttgaagg tgttaagttt ggtggtgcta gaattacagt + 13441 caggagagaa aagatattgc ataataacat aacgttttct cttttatttg gggggggagc + 13501 aaaatacggt gcaggagagg acgtaacatt tattcaggac tgtatcaagg 
caggattacg + 13561 ggtatataaa tcacctatta ttgtttctac aatgaaacaa gattcttcta catggtttaa + 13621 aggatatgat agaaaatatt ataaagataa aggtgcttta ttagcagcaa atttcccttc + 13681 tataagtgag gtaggagtat atatacaagc tttcaaaaat agggggggaa tttatacatt + 13741 tagtgaatta cttagatttt ataaggaagg tgttaacgaa tttaaaataa atagatgata + 13801 aattgatatg ataaagagtt ttttgattat gccaaaaaat aaagtttata atactggcga + 13861 gacagacatt gagttgaaaa ataaatacaa ttatgaaggt agtgagttga ggaaagttca + 13921 agttcgtatg attgatatgc tttctttttt gaatgatata tgcaaagaaa ataacatcac + 13981 ctatttcatt gcttttggaa ctctattagg agctattaga catggaggct ttattccatg + 14041 ggatgataat ctttatattt atatttatat taatgataaa ggtttaaaaa aacttagaaa + 14101 aataattaat aatggaaact atccctatgt tattcaagac tattctagtg ataaaggatt + 14161 tgtaaggtat tatagtgttc tcagagatac taactctgaa tatataaaaa atgaatatca + 14221 acataatcag cgtaaataca gaggtgtaca aattgactta ttcccttatg gttatggtgt + 14281 aatgaaatgg ggtgaacgtc ttattggaaa aatatatggt tttaatgaaa aaatattttt + 14341 agggaaaata aaatgttggc agcattaatt ttttatttaa ctaaagaagt tataattcca + 14401 tttctgaaag taattagtaa gattaacgga agaaagaaag taatttattg gttgctgaca + 14461 attttgggac tgtggatgat tactctaaca cctatttttg aaaatattgt tggagctatt + 14521 ttaaaagtag atggagtagg tagaggaagt gattcattga ctattcgagc aattggacga + 14581 cagttatatt gggaacaatt gaatgagaca actttaaaac ttctttttgg aacaggatac + 14641 cctaattata attatgcttt agcctttcaa cgtacaggtt ttttcaagca atattttttt + 14701 aacagacaat ggttttatga tatatatata tttggtattg tgggttcctc aattatggga + 14761 ttattatttt taaaatatct taaaaattca ataaagtatg atagacaatc tgcagatatg + 14821 attccgttga tgtatattat ttctttacta attgtagcct ataatattat tctttggtat + 14881 tggaatgcgg acggtacttt tatattagta atcatgattt gcgcattgga gcatggagaa + 14941 caattattac atcagaagaa tggagtgtga ttggatgaat ttaaataaag aagttagatg + 15001 gaaggataag caatatattg cttttgattt ttttgataca actatccata gaaattgtca + 15061 tcctgaagtg attttatttg aatggtctaa aaaaatttct atttatttct ctttcaaaat + 15121 atctgctaca gaaatttatt caattaggaa aaaatctgaa atacatgaga 
agcaagaaaa + 15181 acaattggaa gaaattaaat atgaaagatt acttcaactt gttttttata ctattttaag + 15241 tcgtttgaag tcagatgtta ccgactataa tcttgaagat tttttaattt atgcaagaac + 15301 gtgtgaagag gaaatagaat taagacatat tagtattgat acagatacaa ttaattttat + 15361 tgaattttta aaacaaaatg ggaaaaaaat aattttaatt tcagattttt attctgataa + 15421 aaagctaatt gaaaaattaa tggtttcatt agggattaga gattatttct ctaaaatatt + 15481 tatttcaagt gaaattgggt tacgtaagtc atcaggaaat ttatatgaat atgtgatcaa + 15541 tgaattgagc tgtaagccta taaatttact tatgattggt gataatattt attctgatgt + 15601 aaaagttcca aaaaaactag gaatagattc ttatcataaa tcttattcag attcacatgt + 15661 gactgtgagt cctaacgata ttgtaaaagc gatgaataat gttatttctc aagcttgtac + 15721 tgaatcttta tttaatctct atatacctga aatactttat tttatttcaa agttatacaa + 15781 agaattatct gttaacaaag ctagtgatat attattttgt tcaagagaag gtttttttat + 15841 aaaaaaatta tttgatcttt atcaaaaaaa aatgaactta aagcttatta actcacatta + 15901 tttttatgtt tctagaaaat caacgctata tccatcattt aaaaatattg aggatgaaga + 15961 ttttgaagtt atttttagac aatttcctga aattacttta gaaaattttt tgattaattt + 16021 aaatttttcc aataatgata ttaacaatat tgctaagcaa acagaaatta aacaaacaga + 16081 caaagtatca gataaatcta ttattaacaa attaaaacaa aataaattat ttaaagacgt + 16141 ttatgaattg aactgtaaag aagaaaaata ttcttttaga gaatatttaa agtctgtagg + 16201 agttgagaat gacaattcta taataaatat ggtagatatt ggttggaaag gtacgataca + 16261 agacaatatt caaaaagctt ttccatcttt aaatataaaa gggtattata tggggttgaa + 16321 ttttcaacgg tattctacta ggaatagtat gaataagacg ggaatactgt ttactgatga + 16381 tcctcaaaaa acaaagtttt ttaacttatt taattataaa tatttattct atgaaagaat + 16441 ttttgttgca gatcatggac cgacagttag atatgaattt atgaatggtg ttggggtacc + 16501 aacattggat acagatgaaa atcatataga aatttataga tttgctgagg aatttcagat + 16561 tacatttttc aacacatttg agaaaatttt agatttgttc aatgaatcac tagtaacacc + 16621 agatgaatta tttaacgaaa tagctaattt atcattaaaa aaacattgca tctatttacc + 16681 aaggctttca gtaagtataa aaaaattaga tagagcagca aaagaaaatt ttggtattat + 16741 aaaatctact aacaggaata gtgataataa ggtaagaaat ttttggaaaa 
atagagattt + 16801 tttattttta gattatatat ataaagcgta tggaaagaat agattgttaa accctatatt + 16861 ggatatttac ggatattttg tatatctgat taaaacactg caaataaaaa tagtagggga + 16921 tatttgatga gcatgaaaga aaaatcaata agtaaaaatg ctattttgaa tattatttta + 16981 acactaacaa atattgtgtt tccattaatt acttttcctt atatttctag aattctgaat + 17041 ccgtcaggaa taggcgcaat ctcttttttt tcatctattg gttcttatgg tgttttagtt + 17101 gcctcgcttg gaatttcaac ttatgggatt cgggtgattg caaagaatcg ttatcataaa + 17161 gataagataa ctaaaatatt ccaagaattg atagttatta atagtgtaat gtctattata + 17221 gtgacgttct tccttgtttt aatgagtttc cgattagagc agttaagttc agaaaaaggt + 17281 ttattaataa tcacatgtat tactattttg tcctctcctt ttaatttgaa ttggttttat + 17341 agtggaatag aagagtattc atatataaca aaacgttcaa tattttttaa attagtttta + 17401 ttgatattaa cctttttatt tgttaaaagt aaagacgatt atattatata tgctgtgata + 17461 atattgtttt caacattggc ttccaatttt ataaatattt tggagagtag aaaatacatc + 17521 aattttaatt tgagaaggaa tttagaattt agatatcatc taaaaccaat gtggtattta + 17581 tttgcttcgt tacttgcagt taatatttat acaaatttgg attctgtgat gttaggaatt + 17641 attaatggaa atgatgcggt aggtatttac tcaatcgcat caaaagtaaa atggatttta + 17701 ttatcagtcg ttacttcagt gagtttagtt ttattaccca gattatcatt ttatagcaat + 17761 aagtatgacg aaacgaagtt taataatatt ttgagaaagt catctacaat aatttttatg + 17821 atttcaattc ctctaacaat tttttttatg ataaaagcga aagagagtat attattgtta + 17881 ggtggagagc agtatattca ggcagtttta gcaatgcaaa tattaatgcc gatcttgata + 17941 atatcaggtt tttccaatat tataggtaat cagatattga tccctactgg taatgagaaa + 18001 tattttatga gagcagtttc tataggggca atagtaaatt tatgtttaaa tttgttgctt + 18061 atgcctattt tgggaattat cggaggtgca atcgcaactc tttgtgcaga atcagtccaa + 18121 atgattattc aattttattt ttctcgtaat aaattaatgg gtaatatttc attaaattca + 18181 atcaaaaaag tagcctattc atcaattttt gcgggtatac tgttaatagt aatacaaaat + 18241 attatagaga attttaatag cttcttaaat ttagctgctt ctagtttcct atattttgga + 18301 gtatattttt tcttattggt attgtttaaa gaaagtacaa ttaagaaatt tctaaatcaa + 18361 attttttata aggatatttc atgaatttat taccaattat ttatggagcg 
attcttgatt + 18421 taatattaat aattttttaa agtgaataaa atcaaagcaa taaaagatta aaaaataaat + 18481 tgctatctat tatgtttttc tcaaactaag taaaacataa cttatgaaaa caaatttaaa + 18541 aaggagggac tatagtatga aaggtattat tcttgcaggt ggttcgggga cacgattata + 18601 tcctttgact cgggctgcat caaaacaact tatgccggtt tatgataaac ccatgattta + 18661 ctatccactt tcaacattga tgttggctgg gattagggat attttgataa tctcaactcc + 18721 tcaagatttg cctcgtttta aagagcttct tcaagacgga tctgagtttg gtattaaact + 18781 ttcttatgca gagcaaccaa gtccagatgg tttggcacaa gcctttatca ttggggaaga + 18841 gtttattggt gatgatagtg ttgctttgat cttgggggac aatatctatc acggtcctgg + 18901 tttgagcaaa atgcttcaaa aagcagccaa gaaagagaaa ggtgcgactg tctttggcta + 18961 ccatgtcaag gatccagaac gctttggtgt tgtagaattt gatgaaaata tgaatgctat + 19021 ctccatcgaa gaaaagccag aataccctcg ttcaaactat gcagtgacag gactctattt + 19081 ctatgataat gatgttgtcg aaattgccaa gagtatcaaa ccaagtcctc gcggagaatt + 19141 agaaatcaca gatgtcaaca aggcttactt ggatcgtgga gacttatccg ttgagcttat + 19201 gggacgtggt tttgcttggt tggatactgg cactcatgaa agtttactag aggcttcgca + 19261 gtacatcgaa acagtccaac ggatgcaaaa tgttcaggta gcaaacttgg aagaaattgc + 19321 ctatcgcatg ggttatatca gtcgtgaaga tgtattgacc ttagcccaac cacttaagaa + 19381 aaatgaatac ggacagtatc tgctccgttt gattggagaa gcatagatga cagataattt + 19441 tttcggtaag atgcttgcgg cacgcaaggt tgaagctatt ccaggcatgt tggagtttga + 19501 tatccccgtt catggagata atcgtggctg gtttaaagaa aatttccaaa aggaaaaaat + 19561 gcttccactt ggatttccag cgtctttctt tgcagcagga aaattgcaaa acaatgtatc + 19621 cttctcacgt aaaaatgtcc ttcgaggcct ccacgcagag ccttgggata agtacatctc + 19681 tgtagcagat ggagggaaag ttctgggttc ttgggttgat ctacgcgagg gtgaaacctt + 19741 tgggaatacc tatcagacag tgattgatgc gagtaaggga atctttgttc ctcgaggcgt + 19801 agctaatggc ttccaagttt tatcagatac agtgtcatat agctatctgg tcaatgatta + 19861 ctgggctctt gaactcaaac ccaagtatgc ctttgtgaac tacgctgatc caagccttgg + 19921 tattgaatgg gaaaatattg cagaagcaga ggtttcagaa gcagataaac atcatcccct + 19981 acttaaggac gtgaagcctt tgaaaaaaga agatttggaa taaggaaaga 
atatgactga + 20041 atacaaaaat attatcgtga caggtggagc tggctttatc ggttctaact ttgtccatta + 20101 tgtttacgag aactttccag atgttcacgt gacagtccta gataagttga cttatgctgg + 20161 aaaccgcgcg aatattgagg aaattttagg taatcgtgtt gagttagttg ttggtgacat + 20221 tgctgatgcg gagttggtag acaagttggc tgctcaagca gatgctatcg ttcattatgc + 20281 agcggaaagc cacaatgata attcgctcaa tgatccatcg ccatttattc atactaactt + 20341 catcggaacc tatactcttt tagaagctgc tcgtaagtat gatattcgct tccaccatgt + 20401 atcgacagat gaagtttatg gagatctccc tttacgcgaa gatttgccag gtcatggaga + 20461 agggccgggt gagaaattta cggctgaaac caagtacaat ccaagctcgc cttactcatc + 20521 aaccaaggca gcctcagatt tgattgtcaa agcctgggtg cgttcttttg gagtcaaggc + 20581 aacgatttcc aactgttcaa ataactacgg tccttatcaa catatcgaaa aattcatccc + 20641 acgtcagatt actaacatcc taagtggtat caagccaaaa ctttacggtg aaggtaaaaa + 20701 cgttcgtgac tggattcata ccaatgacca ttcttcagga gtttggacaa tcttgacaaa + 20761 agggcaaatc ggtgaaacct acttgattgg ggctgatggt gagaagaaca ataaggaagt + 20821 tttggaactt atccttaagg aaatgggaca agctgcggat gcctatgatc atgtgactga + 20881 ccgtgcagga catgaccttc gctatgcgat tgatgctagc aagctccgtg atgagttggg + 20941 gtggaaacct gaatttacca actttgaagc tgggctcaag gcaacaatca agtggtatac + 21001 agataaccaa gaatggtgga aaacagaaaa agaagctgtt gaagccaatt atgctaagac + 21061 tcaggagatt attacagtat aaaaagcagg aaatagctgc tttttattgc tatattggga + 21121 agagttacat attagaaagg tctagagatg attttaatta caggggcaaa tggccaatta + 21181 ggaacggaac ttcgctattt attggatgaa cgtaatgaag aatacgtggc agtagatgtg + 21241 gctaagatgg acattaccaa tgaagaaatg gttgagaaag tttttgaaga ggtgaaaccg + 21301 actttagtct accattgtgc agcctacacc gctgttgatg cagcagagga tgaaggaaaa + 21361 gagttggact tcgccatcaa tgtgacgggg acaaaaaata tcgcaaaagc atctgaaaag + 21421 catggtgcaa ctctagttta tatttctacg gactatgtct ttgacggtaa gaaaccagtt + 21481 ggacaagagt gggaagttga tgaccgacca gatccacaga cagaatatgg acgcactaag + 21541 cgtatggggg aagagttagt tgagaagcat gtgtctaatt tctatattat ccgtactgcc + 21601 tgggtatttg gaaattatgg caaaaacttc gtttttacca tgcaaaatct 
tgcgaaaact + 21661 cataagactt taacagttgt aaatgaccag tacggtcgtc cgacttggac tcgtaccttg + 21721 gctgagttca tgacctacct agctgaaaat cgtaaggaat ttggttatta tcatttgtca + 21781 aatgatgcga cagaagatac aacatggtat gattttgcag ttgaaatttt gaaagataca + 21841 gatgtcgaag tcaagccagt agattccagt caatttccag ccaaagctaa acgtccgcta + 21901 aactcaacga tgagcctggc caaagccaaa gctactggat ttgttattcc aacttggcaa + 21961 gatgcattgc aagaatttta caaacaagaa gtgagataag tagtagaatg attttctagt + 22021 ctaataaaag aggcagataa tgaactccaa aggagcttaa gatatacaat tatcttgttg + 22081 ttggtgctgg tctctttggt gcagtctttg cccatgaagc agccttaaaa ggaaaaaagt + 22141 aaaagttatt gaaaaacgaa atcatatcgc gggtaatatc tatactcgtg aagaggaagg + 22201 aattcaagtt catcaatatg gtgctcatat cttccatact tctgataagg agatctggga + 22261 gtatgtaaat cagtttgcag agtttaaccg ttataccaat tctcctgttg caaactataa + 22321 gggtgagatt tataaccttc cttttaatat gaatactttc aataaactct ggggagttgt + 22381 aacgccagca gaagcacaag ctaagattga ggaacaacgt gctattttaa atggtaaaac + 22441 tcctgaaaat ttggaagaac aggcgatttc tcttgtaggt acagacatct acgaaaaatt + 22501 aatcaaagac tatacagaga aacagtgggg caaatcaact actgaacttc catcctttat + 22561 tattgtttgc cagtacgcct gacctatgat aacaactatt ttaacgatac ctatcaaggg + 22621 attccaattg gtggatacac tcaaatagtt gaaaaatgtt ggatcatgaa aatattgatg + 22681 tagaaacaaa cgttgatttc tttgtgaata aagagcaata tctgaaagat tttcctaaga + 22741 ttgtctttac tggtatgatt gatgaattct ttgactataa gttgggcgaa ctagagtact + 22801 gtagtcttcg ttttgaaaat gagaccttgg atatggaaaa ttaccaagga aatgcagttg + 22861 tgaactatac ggatgcagaa accccatata ctcgcattat tgaacacaaa cattttgagt + 22921 ttgggagtca agcaaagact atcattacta aagaacattc taaaacatgg gaaaaaggtg + 22981 atgagcctta ttatccagtt aataatgatc gtaataatca tttgtataaa tcgtataaaa + 23041 aacttgctga tgagcaaggg aatgttatct ttggtggtcg cttaggacac tatcgttatt + 23101 acgatatgca ccaagtaatt ggagcagctt tgcagtgcgt gagaaatgag ttagattaat + 23161 actcaatgaa aatcaaagag caaactagga agctagccac aggttgctca aaatactgtt + 23221 ttgaggttgc agatggaagc tgacgcggtt tgaagagatt ttcgaagagt 
ataaacaagt + 23281 aaaactgact accagttatt atttagaaat agtattaaaa attccttgac tatgtgatat + 23341 agttgaggga tttttaaatg atattcatat tttttgcaaa gatgttgttt gaaaaataat + 23401 tttcaaaaat tctgaaaatt ctgttgacaa ctttctgaaa agagtctata atggagagaa + 23461 agttttaaag gagaaaatga tgaaaagttc aaaactattt gcccttgcgg gcgtgacatt + 23521 attg +// + diff --git a/public/res/serotype_genbank/serotype_24F.gb b/public/res/serotype_genbank/serotype_24F.gb new file mode 100644 index 0000000..adea984 --- /dev/null +++ b/public/res/serotype_genbank/serotype_24F.gb @@ -0,0 +1,1094 @@ +LOCUS CR931688 24165 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 24F L (serotype 24f). +ACCESSION CR931688 +VERSION CR931688.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 24165) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 24165) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..24165 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="24F L" + /db_xref="taxon:1313" + gene <1..137 + /gene="dexB" + /locus_tag="SPC24F_0001" + CDS <1..137 + /gene="dexB" + /locus_tag="SPC24F_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI33928.1" + /db_xref="UniProtKB/TrEMBL:Q4K2K9" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVEMTD + " + gene complement(order(268..1140,1141..1548,1550..1678)) + /gene="tnp" + /locus_tag="SPC24F_0002" + /pseudo + CDS complement(join(268..1140,1141..1548,1550..1678)) + /gene="tnp" + /locus_tag="SPC24F_0002" + /note="member of homology group 17" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1202 transposase" + misc_feature complement(order(694..1140,1141..1194)) + /gene="tnp" + /locus_tag="SPC24F_0002" + /note="HMMPfam hit to PF00665, Integrase core domain, + score 1.8e-21" + /pseudo + gene 1844..3298 + /gene="wzg" + /locus_tag="SPC24F_0003" + CDS 1844..3298 + /gene="wzg" + /locus_tag="SPC24F_0003" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33930.1" + /db_xref="GOA:Q4K0A3" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K0A3" + /translation="MLITSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNI + LAFRYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGL + TNRLNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNT + DLTVDQSSSYLAAYKSLIAGDTKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKV + EAPKTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPI + ADGGNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVH + NDQEFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAIIQKL + TSTEVLKNYSSILQGLQDSLQTNMPIETMIDLVNTQLESGGNYKVNSQDLKGTGRIDL + PSYAMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1844..1969 + /gene="wzg" + /locus_tag="SPC24F_0003" + /note="Signal peptide predicted for SPC1285 by SignalP 2.0 + HMM 
(Signal peptide probability 0.998) with cleavage site + probability 0.540 between residues 42 and 43" + misc_feature 2057..2404 + /gene="wzg" + /locus_tag="SPC24F_0003" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 2.1e-64" + misc_feature 2582..3025 + /gene="wzg" + /locus_tag="SPC24F_0003" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 3.5e-70" + gene 3300..4031 + /gene="wzh" + /locus_tag="SPC24F_0004" + CDS 3300..4031 + /gene="wzh" + /locus_tag="SPC24F_0004" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33931.1" + /db_xref="GOA:Q4K0A2" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K0A2" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KDMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTLDALEKLEKKEIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRVQYFLERDLVHVVASDMHNLDSRPPYMQQAYDIIA + KKYGGKKAKELFVDNPRKIIMDQLI" + misc_feature 3303..3911 + /gene="wzh" + /locus_tag="SPC24F_0004" + /note="HMMPfam hit to PF02811, PHP domain, score 1e-38" + gene 4040..4732 + /gene="wzd" + /locus_tag="SPC24F_0005" + CDS 4040..4732 + /gene="wzd" + /locus_tag="SPC24F_0005" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33932.1" + /db_xref="GOA:Q4K0A1" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K0A1" + /translation="MQDQNTLEIDVFQLFRALWKRKLVILLVAIITSSVAFAYSTFVI + KPEFTSTTRIYVVNRNQEEKSGLTNQDLQAGSYLVKDYREIILSQDVLEEVISDLKLD + LTPKGLANKIKVTVPVDTRIVSVSVNDRVPEEASRIANSLREVAAQKIISITRVSDVT + TLEEARPATSPSSPNIKRNTLIGFLAGGIGTSVIVLLLELLDTHVKRPEDIEDTLQMT + LLGVVPNLSKLK" + misc_feature 4058..4474 + /gene="wzd" + /locus_tag="SPC24F_0005" + /note="HMMPfam hit to PF02706, Chain 
length determinant + protein, score 4.9e-54" + misc_feature 4580..4657 + /gene="wzd" + /locus_tag="SPC24F_0005" + /note="PS00217 Sugar transport proteins signature 2." + gene 4742..5425 + /gene="wze" + /locus_tag="SPC24F_0006" + CDS 4742..5425 + /gene="wze" + /locus_tag="SPC24F_0006" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33933.1" + /db_xref="GOA:Q4K0A0" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K0A0" + /translation="MPTLEIAQKKLEFIKKAEEYYNALCTNIQLSGDKLKVISVTSVN + PGEGKTTTSVNIARSFARAGYKTLLIDGDTRNSVISGVFKSREKITGLTEFLSGTADL + SHGLCDTNIENLFVIQSGSVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTPPIGIVI + DAAIITQKCDASILVTATGEANKRDVQKVKQQLEQTGKLFLGVVLNKLDISVDKYGVY + GSYGNYGKK" + gene 5441..6808 + /gene="wchA" + /locus_tag="SPC24F_0007" + CDS 5441..6808 + /gene="wchA" + /locus_tag="SPC24F_0007" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI33934.1" + /db_xref="GOA:Q4K099" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K099" + /translation="MDEKGLKIFLAVLQSIIVILLVYFLSFVRETEVERSSMVILYLL + HFFVFYFSSYGNNFFKRGHLVEFNSTIRYIFFFAIAISVLNFFIAERFSISRRGMIYF + LTLEGISLYLLNFLVKKYWKHVFFNLKNSKKILLLTVTKNMEKVLDKLLESDELSWKL + VAVSVLDKSDFQHDKIPVIEKEKIIEFATHEVVDEVFVNLPGESYDVGEIISRFETMG + IDVTVNLKAFDKNLGRNKQIHEMVGLNVVTFSTNFYKTSHVISKRILDICGATIGLIL + FAIASLVLVPLIRKDGGPAIFAQTRIGKNGRHFTFYKFRSMRIDAEAIKEQLMDQNTM + QGGMFKIDNDPRVTKIGRFIRKTSLDELPQFWNVFIGDMSLVGTRPPTVDEYDQYTPE + QKRRLSFKPGITGLWQVSGRSKITNFDDVVKLDVAYIDNWTIWKDIEILLKTVKVVFM + RDGAK" + misc_feature 6224..6805 + /gene="wchA" + /locus_tag="SPC24F_0007" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 8.2e-147" + gene 6839..8011 + /gene="wchF" + /locus_tag="SPC24F_0008" + CDS 6839..8011 + 
/gene="wchF" + /locus_tag="SPC24F_0008" + /note="member of homology group 15" + /codon_start=1 + /transl_table=11 + /product="putative rhamnosyl transferase WchF" + /protein_id="CAI33935.1" + /db_xref="GOA:Q4K098" + /db_xref="InterPro:IPR001296" + /db_xref="InterPro:IPR015393" + /db_xref="UniProtKB/TrEMBL:Q4K098" + /translation="MKKSVYIIGSKGIPAKYGGFETFVEKLTAFQQDKAIQYYVACMR + ENSAKSGTTEDVFKHNGAICYNVDIPNIGPARAIAYDIAAINRAIEFAKENKDEDPIF + YILACRIGPFIHGIKKKIQAIGGTLLVNPDGHEWLRAKWSAPVRRYWKISEGLMVKYA + DFLVCDSKNIEKYIQEDYKQYQPKTTYIAYGTDTTRSTLKSSDKKVRSWFKEKNVSEN + EYYLVVGRFVPENNYESMIRGFLASNSKKDFVLITNVEQNKFYNQLLAKTGFDKDPRV + KFVGTVYEQELLKYIRENAFAYFHGHEVGGTNPSLLEALASTKLNLLLDVGFNREVGE + QSAIYWKKDELSQIIEKVEQFDAKMIDELDRQSNQRIADSFTWEKIVTDYEKVFKG" + gene 8017..8913 + /gene="wcxG" + /locus_tag="SPC24F_0009" + CDS 8017..8913 + /gene="wcxG" + /locus_tag="SPC24F_0009" + /note="member of homology group 79" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="CAI33936.1" + /db_xref="GOA:Q4K097" + /db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4K097" + /translation="MAVKLKYDKSNITFLDDDELKKYQSELLKMISDVFTFFDENGIA + YSLSGGSILGAIRHKGFIPWDDDVDINIPRESYDKLFSLFELDSSLSRKYYLQSAKSH + PELGLHVSQIRKTGTVARRKYDHSAEECGISIDLYIVENVYNNPVKRFFQGYTSMFLT + FALASVRETKNHALMKEMFRLEGRKLNYSAGKLMVGWFFGIIPIEKWLNWLDKCNSSC + KDSHTKYVSIPTGRKHFRRETYLRDNMNIYKKVPFETLMVNVPVWSEEYLEMFYGKDY + MVVPPVDKREQHLFLELSYGEE" + misc_feature 8134..8835 + /gene="wcxG" + /locus_tag="SPC24F_0009" + /note="HMMPfam hit to PF04991, LICD Protein Family, score + 1.3e-19" + gene 8914..9633 + /gene="abp1" + /locus_tag="SPC24F_0010" + CDS 8914..9633 + /gene="abp1" + /locus_tag="SPC24F_0010" + /note="member of homology group 57" + /codon_start=1 + /transl_table=11 + /product="putative IspD-family transferase (arabinitol) + Abp1" + /protein_id="CAI33937.1" + /db_xref="GOA:Q4K096" + /db_xref="InterPro:IPR001228" + /db_xref="UniProtKB/TrEMBL:Q4K096" + 
/translation="MKVAILTASGIGSRIGQDIPKQFIHVENKPVIIYTLEKFQNHPE + IDEICIVILKGWDQMVKAYAEQFGITKLKMITLGGKSGQESIYNGLREVKKAHPNEDV + TVLIHDGNRPLVSNDIISNALATYQQFGNAVAAIPTTEVVFVLENPQSTSSTEALNRD + LLRRTQTPHVYHLDNILSLHEKALENGITDVAASCQLMQLFGEKSYFSLGTEKNLKIT + TVEDLDIFKALLSSTRDKWIK" + misc_feature 8920..9609 + /gene="abp1" + /locus_tag="SPC24F_0010" + /note="HMMPfam hit to PF01128, Uncharacterized protein + family UPF0007, score 4.8e-15" + gene 9636..10691 + /gene="abp2" + /locus_tag="SPC24F_0011" + CDS 9636..10691 + /gene="abp2" + /locus_tag="SPC24F_0011" + /note="member of homology group 58" + /codon_start=1 + /transl_table=11 + /product="putative dehydratase/epimerase (arabinitol) + Abp2" + /protein_id="CAI33938.1" + /db_xref="GOA:Q4K095" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K095" + /translation="MTLLLNKIYRQDVESSLETIVNINDLNGKSILITGASGLIGSSV + IDQLLLLNEIRNFNIKIFCCGREFESLEKRFGRQTEYLHFVFYDATKAPHFDFAVDYI + IHAASPASPELYVNQPVETMASNFLGMYNLLEYAKNAKVSNLVYISSSEVYGISTSNN + PLDENYIGTVDHLSVRSSYASSKRATETLCVSFASEYGIKIMIVRPGHIYGPSAKDSD + NRVSSFFMTEAIAGRDIVMKSTGSQLRSYCYSLDCASAILSVLLSGGSGQAYNVSNPN + SIITIKQMATCIADASGVRVLYDIPITQERKQENPMVNASLDSKKIESLGWSGLFSAE + VGFHHTFSILKELSSEK" + misc_feature 9723..10682 + /gene="abp2" + /locus_tag="SPC24F_0011" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.00073" + misc_feature 9726..10484 + /gene="abp2" + /locus_tag="SPC24F_0011" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.00092" + misc_feature 9726..10454 + /gene="abp2" + /locus_tag="SPC24F_0011" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 6.6e-45" + misc_feature 9729..10541 + /gene="abp2" + /locus_tag="SPC24F_0011" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 3.6e-05" + gene 10681..10902 + /gene="HG267" + /locus_tag="SPC24F_0012" + /pseudo + CDS 10681..10902 + /gene="HG267" + /locus_tag="SPC24F_0012" + /note="member of 
homology group 267" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase (fragment)" + gene complement(10904..11086) + /gene="tnp" + /locus_tag="SPC24F_0013" + /pseudo + CDS complement(10904..11086) + /gene="tnp" + /locus_tag="SPC24F_0013" + /note="Lone member of homology group 0247" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1381 transposase (fragment)" + /db_xref="PSEUDO:CAI33940.1" + gene 11426..12676 + /gene="wzy" + /locus_tag="SPC24F_0014" + CDS 11426..12676 + /gene="wzy" + /locus_tag="SPC24F_0014" + /note="member of homology group 112" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33941.1" + /db_xref="UniProtKB/TrEMBL:Q4K094" + /translation="MIDGDFMNRRLVIKKKSIMFFMLMLCVTAFYGTNYWYTNIYIYD + FMIITSCLLSIIVFVCNGIRIDKTYYKGTIILGIVMWFSGLIAAQGKGLPAIVIFKES + LYTITPIMIFLAFRPMIKSIKDTSLFLRTISAAGVICNLIACIEMFFAKRGFDFLNIS + VFEKLRNGTPRFTIGETIIVLSFFISCSVVFSKGGKRNRRIFHVLNIALTAINLVYII + KTRTLNLYILSTLMMVPVLKKNVKKQLKFWIVFLISIILTFVSAEYFIPIVKNLIHSD + HGIQIRFLTIEYYIEYFKNHYLFGAGYISSSPYFETYSIVTGPLGRYYPSDVGLIGLM + FRSGIIGLIWLISWFYTSLKIIKDNTIRIPAHYDLLMKLVIVFLMFSCINLIITDAPR + FPYIALAMLLFESSYTLSYENSSN" + gene 12715..13638 + /gene="wcxI" + /locus_tag="SPC24F_0015" + CDS 12715..13638 + /gene="wcxI" + /locus_tag="SPC24F_0015" + /note="member of homology group 113" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33942.1" + /db_xref="GOA:Q4K0B4" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K0B4" + /translation="MIKRLAILMATYNGEKYIKEQIESILNQDTDFDFTLIIRDDGST + DNTKNIIREYVDSGKIIFIEGQNKGAARGFISLLCDNPGYDYYAFSDQDDVWNHNKLQ + KGIWSLSKYTGPALYCSNCELVDSELNSIGRNTHRKRPNYTLESILCLASCAQGCTSV + FNKELASIIQENDVPDTFIMHDSLITCLCALIGGKIIYDEIPSMKYRMHDDNIFGMVS + AKQNVLNVIKDRISEITKKRTISMYDQAECLLKVYKKYIDSNNQDICRIVIDSKVSLK + ARLKLIFNKNLQHTTLNKTITKKLEILFGND" + misc_feature 12730..13221 + /gene="wcxI" + /locus_tag="SPC24F_0015" + 
/note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 2.8e-23" + gene 13654..14433 + /gene="wcxJ" + /locus_tag="SPC24F_0016" + CDS 13654..14433 + /gene="wcxJ" + /locus_tag="SPC24F_0016" + /note="member of homology group 114" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33943.1" + /db_xref="GOA:Q4K092" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K092" + /translation="MKYQLIVSTMNQQDNSLIEKMNIKSDAIIINQSNSFSYHETKLK + NSIVKWYEFNERGIGLSRNTGFMRSDADIIQFADDDMIFTDTYYEDVLLEYQKHPEAD + VILFSNKCLNEDRMPYQVNNFRRINRFEGVKFGGARITVRREKILHNNITFSLLFGGG + AKYGAGEDVTFIQDCIKAGLRVYKSPIIVSTMKQDSSTWFKGYDRKYYKDKGALLAAN + FPSISEVGVYIQAFKNRGGIYTFSELLRFYKEGVNEFKINR" + gene 14443..15003 + /gene="wcxK" + /locus_tag="SPC24F_0017" + CDS 14443..15003 + /gene="wcxK" + /locus_tag="SPC24F_0017" + /note="member of homology group 115" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="CAI33944.1" + /db_xref="GOA:Q4K091" + /db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4K091" + /translation="MIKRFLIMPKNKVYNTGETDIELKNKYNYEGSELRKVQVRMIDM + LSFLNDICKENNITYFIAFGTLLGAIRHGGFIPWDDDLYIYIYINDKGLKKLRKIINN + GNYPYVIQDYSSDKGFVRYYSVLRDTNSEYIKNEYQHNQRKYRGVQIDLFPYGYGVMK + WGERLIGKIYGFNEKIFLGKIKCWQH" + gene 14988..15605 + /gene="wzy" + /locus_tag="SPC24F_0018" + CDS 14988..15605 + /gene="wzy" + /locus_tag="SPC24F_0018" + /note="member of homology group 65" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy + (fragment)" + /protein_id="CAI33945.1" + /db_xref="UniProtKB/TrEMBL:Q4K090" + /translation="MLAALIFYLTKEVIIPFLKVISKINGRKKVIYWLLTILGLWMIT + LTPIFENIVGAILKVDGVGRGSDSLTIRAIGRQLYWEQLNETTLKLLFGTGYPNYNYA + LAFQRTGFFKQYFFNRQWFYDIYIFGIVGSSIMGLLFLKYLKNSIKYDRQSADMIPLM + YIISLLIVAYNIILWYWNADGTFILVIMICALEHGEQLLHQRNGV" + gene 15610..17562 + /gene="rbsF" + /locus_tag="SPC24F_0019" + CDS 15610..17562 + /gene="rbsF" + /locus_tag="SPC24F_0019" + 
/note="member of homology group 49" + /codon_start=1 + /transl_table=11 + /product="putative phosphotransferase" + /protein_id="CAI33946.1" + /db_xref="GOA:Q4K089" + /db_xref="InterPro:IPR005834" + /db_xref="InterPro:IPR006439" + /db_xref="UniProtKB/TrEMBL:Q4K089" + /translation="MNLNKEVRWKDKQYIAFDFFDTTIHRNCHPEVILFEWSKKISIY + FSFKISATEIYSIRKKSEIHEKQEKQLEEIKYERLLQLVFYTILSRLKSDVTDYNLED + FLIYARTCEEEIELRHISIDTDTINFIEFLKQNGKKIILISDFYSDKKLIEKLMVSLG + IRDYFSKIFISSEIGLRKSSGNLYEYVINELSCKPINLLMIGDNIYSDVKVPKKLGID + SYHKSYSDSHVTVSPNDIVKAMNNVISQACTESLFNLYIPEILYFISKLYKELSVNKA + SDILFCSREGFFIKKLFDLYQKKMNLKLINSHYFYVSRKSTLYPSFKNIEDEDFEVIF + RQFPEITLENFLINLNFSNNDINNIAKQTEIKQTDKVSDKSIINKLKQNKLFKDVYEL + NCKEEKYSFREYLKSVGVENDNSIINMVDIGWKGTIQDNIQKAFPSLNIKGYYMGLNF + QRYSTRNSMNKTGILFTDDPQKTKFFNLFNYKYLFYERIFVADHGPTVRYEFMNGVGV + PTLDTDENHIEIYRFAEEFQITFFNTFEKILDLFNESLVTPDELFNEIANLSLKKHCI + YLPRLSVSIKKLDRAAKENFGIIKSTNRNSDNKVRNFWKNRDFLFLDYIYKAYGKNRL + LNPILDIYGYFVYLIKTLQIKIVGDI" + misc_feature 15643..16284 + /gene="rbsF" + /locus_tag="SPC24F_0019" + /note="HMMPfam hit to PF00702, haloacid dehalogenase-like + hydrolase, score 1.8e-07" + gene 17562..19019 + /gene="wzx" + /locus_tag="SPC24F_0020" + CDS 17562..19019 + /gene="wzx" + /locus_tag="SPC24F_0020" + /note="member of homology group 47" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33947.1" + /db_xref="GOA:Q4K088" + /db_xref="InterPro:IPR002528" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K088" + /translation="MSMKEKSISKNAILNIILTLTNIVFPLITFPYISRILNPSGIGA + ISFFSSIGSYGVLVASLGISTYGIRVIAKNRYHKDKITKIFQELIVINSVMSIIVTFF + LVLMSFRLEQLSSEKGLLIITCITILSSPFNLNWFYSGIEEYSYITKRSIFFKLVSLI + LTFLFVKSKDDYILYAVIILFSTLASNFINILESRKYINFNLRRNLEFRYHLKPMWYL + FASLLAVNIYTNLDSVMLGIINGNDAVGIYSIASKVKWILLSVVTSVSLVLLPRLSFY + SNKYDETKFNNILRKSSTIIFMISIPLTIFFMIKAKESILLLGGEQYIQAVLAMQILM + PILIISGFSNIIGNQILIPTGNEKYFMRAVSIGAIVNLCLNLLLMPILGIIGGAIATL + CAESVQMIIQFYFSRNKLMGNISLNSIKKVAYSSIFAGILLIVIQNIIENFNSFLNLA + 
ASSFLYFGVYFFLLVLFKESTIKKFLNQIFYKDIS" + misc_feature 17583..18392 + /gene="wzx" + /locus_tag="SPC24F_0020" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 2.2e-62" + gene 19193..20062 + /gene="rmlA" + /locus_tag="SPC24F_0021" + CDS 19193..20062 + /gene="rmlA" + /locus_tag="SPC24F_0021" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI33948.1" + /db_xref="GOA:Q8RSF0" + /db_xref="HSSP:1FXO" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q8RSF0" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLPRFKELLQDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFIGDDSV + ALILGDNIYHGPGLSKMLQKAAKKEKGATVFGYQVKDPERFGVVEFDTDMNAISIEEK + PEYPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLALAQPLKKN + EYGQYLLRLIGEA" + misc_feature 19196..19912 + /gene="rmlA" + /locus_tag="SPC24F_0021" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 3.3e-120" + gene 20063..20659 + /gene="rmlC" + /locus_tag="SPC24F_0022" + CDS 20063..20659 + /gene="rmlC" + /locus_tag="SPC24F_0022" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI33949.1" + /db_xref="GOA:Q8RSE9" + /db_xref="HSSP:1NXM" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:Q8RSE9" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKNHPLLKDVKPLKKEDLE" + misc_feature 20099..20629 + /gene="rmlC" + /locus_tag="SPC24F_0022" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 4.5e-16" + gene 
20669..21718 + /gene="rmlB" + /locus_tag="SPC24F_0023" + CDS 20669..21718 + /gene="rmlB" + /locus_tag="SPC24F_0023" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI33950.1" + /db_xref="GOA:O54546" + /db_xref="HSSP:1KEP" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:O54546" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPDVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAAD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 20684..21640 + /gene="rmlB" + /locus_tag="SPC24F_0023" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.00012" + misc_feature 20687..21427 + /gene="rmlB" + /locus_tag="SPC24F_0023" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 5.4e-77" + misc_feature 20690..21502 + /gene="rmlB" + /locus_tag="SPC24F_0023" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/iso, score 1.4e-05" + gene 21784..22635 + /gene="rmlD" + /locus_tag="SPC24F_0024" + CDS 21784..22635 + /gene="rmlD" + /locus_tag="SPC24F_0024" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI33951.1" + /db_xref="GOA:Q9AH81" + /db_xref="HSSP:1N2S" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q9AH81" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAKMDITNEEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + 
TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 21784..22632 + /gene="rmlD" + /locus_tag="SPC24F_0024" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 4.3e-146" + misc_feature 21787..22428 + /gene="rmlD" + /locus_tag="SPC24F_0024" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.00011" + misc_feature 21787..22416 + /gene="rmlD" + /locus_tag="SPC24F_0024" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 2e-18" + misc_feature 21790..22518 + /gene="rmlD" + /locus_tag="SPC24F_0024" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 3.6e-08" + gene 22698..23800 + /gene="glf" + /locus_tag="SPC24F_0025" + CDS join(22698..23294,23294..23800) + /gene="glf" + /locus_tag="SPC24F_0025" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI33952.1" + /db_xref="GOA:Q4K083" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K083" + /translation="MYDYLIVGAGLFGAVFAHESALKGKKVKVIEKRNHIAGNIYTRE + EEGIQVHQYGAHIFHTSDKEIWDYVNQFAEFNRYTNSPVANYKGEIYNLPFNMNTFNK + LWGVVTPAEAQAKIEEQRAILNGKTPENLKEQAISLVGTDIYEKLIKDYTEKQWGKPT + TELPSFIIRRLPVHLTYDNNYFNDTYQGIPIGGYTQIVEKMLDYENIDVETNVDFFVN + KEQYLKDFPKIVFTGMIDEFFDYKLGELEYRSLRFENETLDMENYQGNAVVNYTDAET + PYTRIIEHKHFEFGSQAKTIITKEHSKTWEKGDEPYYPVNNDRNNHLYKSYKKFADEQ + GNVIFGGRLGHYRYYDMHQVIGAALQCVRNELD" + misc_feature order(23133..23294,23294..23740) + /gene="glf" + /locus_tag="SPC24F_0025" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 1.9e-107" + gene 24118..>24165 + /gene="aliA" + /locus_tag="SPC24F_0026" + CDS 24118..>24165 + /gene="aliA" + /locus_tag="SPC24F_0026" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33953.1" + /db_xref="UniProtKB/TrEMBL:Q4K1C2" + /translation="MMKSSKLFALAGVTLL" +ORIGIN + 
1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaaatgac tgactagaat gagtaaacct caagtttttg aagcttgagg ttttttacta + 181 tagtggattg aaactagaat agtgcacctc tgcttctaaa acattgttag aaatcgattt + 241 gactgtcccg atcgatttgt cctattctta tttcattttg ctatacttgt agttgaggag + 301 aattaagctc ctcactagta aactcttcat aatccttttt atttttatga agatattgtt + 361 tgaaagatgt gagtttccac ggatgggttt gtggagggat atacttgcgt ctttcttttt + 421 ttgttctggt tcttgttcaa agtttttcga atagagttca tgatttagta gctcctttgt + 481 gtgatagatt ttgtcagcga tattgaggta gatgtctccg tcaaatgctt ttataactaa + 541 tgctttcgtc tttctgatga aatagacttc ttttccttgt tcggtaggga tatagtaacg + 601 attttggaat cggatatggt gttcactatc gacgactctc tccgccagtc tagccagaat + 661 gagattcctt tcagaggggt taggaacctc ctcgaagaca gagagttttg tcttgtttcc + 721 aaactgttca ttaaaggttt gaatgtagga aagcaggaag gtattggctt cttccaaggt + 781 atgaatattg ttttgttcca gttcgatagg caggcgagat tgtagtgtct gattgagtct + 841 ttcgactctc cctttagctt gagggataga ggttgtctca aggagaatcc ctagttggtg + 901 acaggcgtat ccaaactgtg tatgggtatc gtcctccatt ttcttagagt tggaggcttg + 961 ataggtaaag accgttctct tatctgtttt aatttgaagg ggaatgccgt gattggctaa + 1021 gatttgttcg aggacatgat agtaagcatt caagttctct tgtttatcaa aataagcgcc + 1081 taggatattg ccagaagcat catcaatggc taagtgtaag ttagatgttt gggctccaaa + 1141 ctaggcatga ggactggcat ccatttgaat gagttcacca gcaaatttct ttctgggtct + 1201 actaggatat acttttttag ggtcttcaag gaagttttca gccgtcggta agattggatt + 1261 gtctaggggt tgattcaggt tcagtttagc ttgttttctt actctcttct ttgtctttct + 1321 atgggactta ggcgacagga tatttttctt atagagtatt tttctaacag tagtatcaga + 1381 gagctgaatt ccttcttctt cagctagcaa ttcacagaaa tgaaggacat ttggtttata + 1441 tgtttcatag gagaggtatt tttttaggag acgttctttg atttcatcag ggattgcatg + 1501 ttttggtttt cgatttctgt ttccgtgtct gaaggcttct ttgtcctttc agttgatagg + 1561 ctagtagcag acgattgatt tgtctttcag aaagattgag ctcgacacag gctcgtttct + 1621 ttgttttctt tccttgggct atagctttta tcacaagata 
ttttttcgtt tcattcatat + 1681 tcagttggat ccttttcata tgactattct accaaatggg acattttcac gttcgattta + 1741 ctaaagacat tatcacattc gaattacaca agatgcagat agtaaaaaaa atgtagacat + 1801 taccgtaaaa aagtgatata atcgtatgat gttcaaggta taggtgttaa tcacgagtag + 1861 acgttttaaa aaatcacgtt cacagaaagt gaagcgaagt gttaatatcg ttttgctgac + 1921 tatttattta ttgttagttt gttttttatt gttcttaatc tttaagtaca atatccttgc + 1981 ttttagatat cttaacctag tggtaactgc gttagtccta ctagttgcct tggtagggct + 2041 actcttgatt atctataaaa aagctgaaaa gtttactatt tttctgttgg tgttctctat + 2101 ccttgtcagc tctgtgtcgc tctttgcagt acagcagttt gttggactga ccaatcgttt + 2161 aaatgcgact tctaattact cagaatattc aatcagtgtc gctgttttag cagatagtga + 2221 gatcgaaaat gttacgcaac tgacgagtgt gacagcaccg actgggactg ataatgaaaa + 2281 tattcaaaaa ctactagctg atatcaagtc aagtcagaat accgatttga cggtcgacca + 2341 gagttcgtct tacttggctg cttacaagag tctgattgca ggtgacacca aggccattgt + 2401 cttaaatagt gtctttgaaa atatcatcga gtcagagtat ccagactacg catcgaagat + 2461 aaaaaagatt tataccaagg gattcactaa aaaagtagaa gctcctaaga cgtctaagaa + 2521 tcagtctttc aatatctatg ttagtggaat tgacacctat ggtcctatta gttcggtgtc + 2581 gcgatcagat gtcaatatcc tgatgactgt caatcgagat accaagaaaa tcctcttgac + 2641 cacaacacca cgtgacgcct atgtaccaat cgcagatggt ggaaataatc aaaaagataa + 2701 attaacccat gcgggcattt atggagttga ttcgtccatt cacaccttag aaaatctcta + 2761 tggagtggat atcaattact atgtgcgatt gaacttcact tctttcttga aaatgattga + 2821 cttattggga ggggtagatg ttcataatga ccaagagttt tcagctctac atgggaagtt + 2881 ccatttccca gtagggaatg tccatctaga ctctgagcaa gctttaggtt ttgtacgtga + 2941 acgctactca ctagccgatg gagaccgtga ccgtggtcgc aaccaacaaa aggtcattgt + 3001 agcaattatt cagaagttaa cttctacaga ggtcttgaaa aactatagta gtattcttca + 3061 aggattgcag gattctcttc aaacaaatat gccgattgag actatgatag atttagtgaa + 3121 tactcagttg gaaagtggag ggaattataa agtaaattct caagatttaa aagggacagg + 3181 tcggatagat cttccttctt atgcaatgcc agacagtaac ctctatgtga tggaaataga + 3241 tgatagtagt ttagctgtag ttaaagcagc tatacaggat gtgatggagg gtagatgaaa + 3301 
tgatagacat ccattcgcat atcgtttttg atgtagatga cggtcccaag tcaagagagg + 3361 aaagcaaggc tctcttggca gaatcctaca ggcagggggt gcgaaccatt gtctctacct + 3421 ctcaccgtcg caaggacatg tttgaaactc cggaagagaa gatagcagaa aactttcttc + 3481 aggttcggga aattgcaaaa gaagtagcag atgatttagt cattgcttat ggcgcagaga + 3541 tatactatac tctggatgct ctagaaaagc tagaaaaaaa agaaattcct acccttaatg + 3601 atagtcgtta tgccttgata gagtttagta tgaacactcc ttatcgcgat attcatagcg + 3661 ccttgagcaa gatcttgatg ttgggaatta ctccagtcat tgcccacatc gagcgctatg + 3721 atgctcttga aaataatgaa aaacgcgttc gggaactgat cgatatgggc tgttacacgc + 3781 aagtaaatag ttcacatgtc ctcaaaccca aactttttgg cgaacgttat aaattcatga + 3841 aaaaaagagt tcagtatttt ttggaacgtg atttagttca tgtagttgca agtgacatgc + 3901 acaatttaga cagtagacct ccatatatgc aacaggcata tgatatcatt gctaagaaat + 3961 atggagggaa aaaagcgaaa gaactttttg tagataatcc cagaaaaatt ataatggatc + 4021 aattaattta ggagaaaata tgcaagatca aaacactttg gaaatcgatg tatttcaact + 4081 attcagagct ttatggaaaa gaaagttggt cattttatta gtggcaatta taacttcttc + 4141 agttgctttt gcctacagta cttttgttat caaacctgag tttactagta cgacccggat + 4201 ttatgtagtt aaccgtaatc aggaagagaa atctggttta accaatcaag acttgcaggc + 4261 aggttcatac ttggttaaag actatcgtga aattatccta tcgcaggatg ttttggagga + 4321 agttatttct gatttgaaac tagatttgac gccaaaaggt ttggctaata aaattaaagt + 4381 aacagtacca gttgataccc gtattgtctc tgtttcagtt aatgatcgag ttcctgaaga + 4441 ggcaagccgt atcgctaact ctttgagaga agtagctgct caaaaaatta tcagtattac + 4501 tcgtgtttct gatgtgacaa cactggagga ggcaagaccg gcgacatcac cgtcttcgcc + 4561 aaatattaaa cgcaatacac taattggttt tttggcaggg gggattggaa ctagtgttat + 4621 agttcttctt cttgaacttt tggacactca tgtgaaacgt ccggaagata tcgaagatac + 4681 actgcagatg acacttttgg gagttgtacc aaacttgagt aagttgaaat aggagagagg + 4741 aatgccgaca ttagaaatag cacaaaaaaa actggagttc attaagaagg cagaagaata + 4801 ttacaatgcc ttgtgtacaa atatacagtt gagcggagat aaactaaaag taatttccgt + 4861 tacttctgtt aaccctgggg aaggaaaaac aactacttcc gtaaatatag caaggtcgtt + 4921 tgcgcgtgca ggctataaaa 
ctcttttgat cgatggcgat actcgaaatt cagttatatc + 4981 aggagttttt aaatcgcgtg aaaaaattac agggctaaca gaatttttat ctgggacagc + 5041 tgatttatct cacggtttat gtgatacaaa tattgaaaat ttatttgtaa ttcaatcggg + 5101 atctgtatca ccaaacccta cggccttgtt acaaagtaaa aattttaatg atatgattga + 5161 aacattgcgt aaatattttg attatatcat tgttgataca ccacctattg gaattgttat + 5221 tgatgcggca attatcactc aaaagtgtga tgcgtccatc ttggtaacag caacaggtga + 5281 ggcgaataaa cgtgatgtcc aaaaagtgaa acaacaatta gaacaaacag ggaaactgtt + 5341 cctgggagtt gttttaaata aattggatat ctcggttgat aagtatggag tttacggttc + 5401 ctatggaaat tatggtaaaa aataacttag aaaagatttt atggatgaaa aaggattgaa + 5461 aatttttctg gcagtattac agagtattat tgtcatttta ttggtttatt ttcttagctt + 5521 tgttagagag acagaagttg aacgttcttc gatggttata ctataccttc tccacttttt + 5581 tgtattctat tttagttcct atggtaacaa tttttttaaa agagggcacc tagttgagtt + 5641 taatagtact ataagatata tttttttctt tgcaatagct ataagtgtat taaacttttt + 5701 tatagcggaa cggtttagta tctctagaag aggaatgata tacttcttaa ctttagaagg + 5761 aatatcctta tacttgttaa atttcttagt aaaaaaatat tggaagcatg tgttttttaa + 5821 tctaaaaaat agcaagaaaa ttttactgtt aacagtaacg aaaaatatgg aaaaagttct + 5881 tgataaattg ctagaatctg atgaactttc atggaaattg gtagcagtaa gtgttttgga + 5941 taaatctgat tttcaacatg ataaaatacc tgtaattgaa aaggaaaaaa ttattgaatt + 6001 tgcaacgcat gaagttgtgg atgaggtgtt tgtcaatctt ccaggagaga gctacgatgt + 6061 tggagaaatt atctctaggt ttgagacaat ggggatagat gtaactgtaa atcttaaagc + 6121 atttgataag aatttgggtc gcaataaaca aattcatgag atggtgggat tgaatgtagt + 6181 cactttctct acaaattttt ataaaactag tcatgtgatt tcaaagagaa ttctcgacat + 6241 ttgtggtgcc actattggcc ttattctttt tgctatagct agtctagttt tagttccatt + 6301 gattcgtaaa gatggcggac cagctatttt tgctcaaact cgtataggga aaaatggtcg + 6361 acattttacc ttttataaat tccgttcgat gcggatcgat gctgaagcta tcaaagaaca + 6421 gttgatggat caaaatacga tgcaaggtgg tatgtttaag atagacaatg atcctcgtgt + 6481 tacaaaaatt ggtcgcttta ttcgtaaaac cagtttggat gaattgccgc agttttggaa + 6541 tgtctttata ggagatatga gtttggtggg aacacgtcca 
cctacagtag acgagtatga + 6601 tcagtatact ccagaacaga aacgtcgact cagctttaaa cctggtatta caggtttatg + 6661 gcaggttagc ggccgtagta aaataaccaa ttttgacgat gttgtaaaat tagatgtggc + 6721 ttatattgat aattggacaa tctggaaaga tattgaaatt ttgcttaaaa ctgttaaagt + 6781 tgtatttatg agagatggag cgaagtaatt tctgtatatc catcatatta ggagagaaat + 6841 gaaaaagtca gtttatatta ttggttcaaa aggaattcct gctaagtatg gaggatttga + 6901 aacttttgtt gaaaaattaa cagccttcca acaagataag gctatccaat attatgtggc + 6961 ttgtatgcgt gaaaactctg caaaatcagg gactactgag gatgttttta aacataatgg + 7021 tgctatctgt tataacgtcg atattcctaa tattggtcca gcgcgagcta tagcgtatga + 7081 tatcgctgca attaacagag ctattgaatt tgccaaagaa aataaggatg aagatccaat + 7141 cttctatatt ttagcttgtc gaattggtcc gttcatccat ggaattaaga aaaaaatcca + 7201 ggcgataggt gggactcttc tagttaatcc agatggccac gagtggttac gagctaagtg + 7261 gagtgctccc gttcgtcgct actggaaaat ttctgaaggt cttatggtca aatatgcaga + 7321 ttttttagtg tgtgatagta agaatattga aaaatatatc caagaagatt ataaacagta + 7381 tcaacctaaa acaacctata tcgcttatgg aacagataca acacgctcta cattaaagag + 7441 tagtgataaa aaagtacgtt cttggttcaa agagaagaat gtttctgaga acgagtatta + 7501 tctagttgta ggacgttttg taccagaaaa caactatgaa tctatgattc gtggcttttt + 7561 ggcgtctaac tctaagaagg actttgtctt aatcacaaat gtagaacaga ataaatttta + 7621 taatcagttg ttggcaaaaa ctggttttga taaggaccca cgagtaaaat ttgtaggtac + 7681 agtctatgag caagagcttc ttaaatatat tcgtgaaaac gcctttgctt acttccacgg + 7741 gcatgaagtt ggtggaacca atccttcgct tttagaagct ctggcatcaa ctaaactgaa + 7801 tttattgcta gatgttggct ttaaccgaga agttggggag caaagtgcga tttattggaa + 7861 aaaagatgag ctttcccaaa taattgagaa agttgaacaa tttgatgcaa aaatgattga + 7921 tgagttagat agacaatcaa atcagagaat tgcggattct ttcacttggg aaaagattgt + 7981 cacagactac gagaaagtat ttaaaggtta gagttaatgg cagtaaaatt aaaatatgat + 8041 aaatcaaata ttacattttt agatgatgac gaattgaaaa aataccaatc agaattgttg + 8101 aaaatgatat cagatgtgtt tacttttttt gatgaaaatg ggatagcgta ttctttaagt + 8161 ggaggtagca ttttaggggc aatccgtcat aaagggttta tcccttggga tgatgatgtt + 8221 
gatatcaata ttccgaggga aagttacgat aaactatttt ctctatttga gttagacagt + 8281 agtcttagtc gtaaatatta tcttcaatca gcaaagagtc atccagaatt gggacttcat + 8341 gtttctcaaa ttagaaaaac aggaacagtt gctcgtagga aatacgatca ttcggctgag + 8401 gagtgcggta tttctataga tctttacatt gtagaaaatg tatacaataa tccagtgaaa + 8461 cgattctttc aaggttatac aagtatgttt ttgacttttg ccttggcttc tgtacgagaa + 8521 acaaagaatc atgccctgat gaaggaaatg tttagactgg aaggtagaaa actaaattat + 8581 tcagctggaa agttaatggt tggttggttt tttggaatta ttccaattga aaagtggttg + 8641 aattggcttg ataaatgtaa ttcaagctgt aaggattcac atacaaaata tgtatccata + 8701 cctacaggaa ggaaacactt tagacgcgag acttacttgc gagataatat gaatatttat + 8761 aaaaaggttc cttttgaaac tttgatggtg aatgttcctg tttggtcaga agagtattta + 8821 gaaatgtttt acggtaaaga ttatatggtc gttcctcctg ttgataagag agagcaacat + 8881 ttgtttttag agttgagtta cggagaagaa tagatgaaag tagcgatttt aacagcttca + 8941 ggcattggaa gccgaattgg tcaagatatc cctaaacaat ttattcatgt tgaaaataag + 9001 ccagtcatta tctataccct tgaaaaattt caaaatcatc cagaaattga tgaaatctgt + 9061 attgttattt taaaaggctg ggaccagatg gttaaagctt atgcggaaca atttggaatt + 9121 acaaagttaa agatgataac tttgggaggg aagtctggtc aagaatcaat ttataacggt + 9181 cttagagaag ttaagaaagc tcatcccaat gaggatgtga ctgtattaat tcatgacgga + 9241 aatcgtcctt tagtgagcaa tgatattatt agcaacgctt tagcaacata ccaacagttt + 9301 ggaaatgctg ttgcagcgat accaacgact gaggtagtat ttgttttaga aaacccacaa + 9361 tcaacttcat ccacagaagc attgaatcgt gacttgttga gacgaacaca aactcctcat + 9421 gtttaccatc ttgataatat tctatcgctt catgaaaaag cattagaaaa tgggataact + 9481 gatgttgcag catcatgcca actcatgcaa ctatttggtg aaaagagtta tttctctctt + 9541 ggaacagaga aaaacttgaa aattacgact gtagaagatc ttgatatttt taaagcttta + 9601 ttgagttcaa ctagagataa gtggattaaa tagtaatgac attattatta aataaaatat + 9661 atagacaaga tgtagaatct tctctagaaa caatcgtcaa tattaatgac ttgaatggca + 9721 agtcaatttt aattactgga gcttctggtt tgattggttc aagtgtcatt gaccagttat + 9781 tattgctaaa tgaaataagg aattttaaca ttaaaatttt ttgttgtgga agagagtttg + 9841 aatcattaga aaaacgattt 
ggtagacaaa cagagtattt acactttgtg ttctatgatg + 9901 cgactaaagc acctcacttt gattttgcag tggactacat tattcatgct gctagtcctg + 9961 ctagtcctga attatacgtt aatcagcctg tagaaacaat ggctagtaat tttctgggca + 10021 tgtataatct actggaatac gccaaaaatg ctaaagtttc aaatctagtt tatatctcat + 10081 ctagtgaagt ttatggaatt agcactagta ataatccttt ggacgaaaat tatattggaa + 10141 ctgttgatca tcttagcgta cggtcttctt atgccagttc aaaaagagct actgaaacac + 10201 tttgtgttag ttttgcttcc gagtatggaa tcaaaataat gatagtaagg ccaggacata + 10261 tctatggtcc tagtgccaag gactctgata atcgtgtatc atcatttttt atgacagaag + 10321 cgattgctgg gcgtgatatt gtcatgaaaa gtacaggtag tcagttaaga tcctattgtt + 10381 atagtttgga ttgtgccagt gcaattctaa gtgttcttct ttcgggtgga tcaggacaag + 10441 cttataatgt ttccaatcca aattcaatta ttactataaa acagatggca acttgcattg + 10501 cagatgcttc aggagtcaga gttctttatg atatacctat aactcaagag cgaaaacagg + 10561 aaaatcctat ggtaaatgca agcttagata gtaagaaaat tgagtccttg ggatggtcag + 10621 gtctattttc agctgaagta ggcttccatc acacatttag tattttaaag gagttatcaa + 10681 gtgaaaaatg atagtatttt aattatgatg acaacataca atggagaaga atttatacgt + 10741 gaacagttgg agagtatcct ttttcaaacc attacagcat ggaaactata gattcgtgat + 10801 gacaattcta gtgatcaaat aagagcaatt attaaagaat acgaagaaaa agatagtcaa + 10861 tttttgatat aagctagcca agggggattt tggagaagtt tttttattga agagtggcca + 10921 taagaaggtc ttctaggctt aatttaggtt ttcgtccacc ttttgcgtgt ttaagttgat + 10981 aagctgtttt taatacagct aacatctctt caaaaatggc acgctgaaca ccaacaagac + 11041 gcttaaatcg tgcatcagtt agttgtttac ttgcttcata attcatagaa ctattatacc + 11101 atattttatt tcgcaggaaa tctattgaaa aaacgacact atattatcaa tggggatgtt + 11161 aggactatat gttaaaaaca tgcgagagta tcttttgtta tgaatattat gagagtacat + 11221 agaaagatag agatttcact gatggaattt tatagagaag ggaaaactgt atttatttgg + 11281 atatattgaa ctcagtggaa tggattgatt agggtatata catatggtaa atggatgtaa + 11341 cccgcaaaca gaacacggat ggagtacaca tttgctaatt acagagattc attgaaaaat + 11401 attagagttt caaataggaa aagtaatgat tgacggagat tttatgaata gaagacttgt + 11461 aataaaaaag aaaagtataa 
tgtttttcat gcttatgtta tgtgttacgg cattttatgg + 11521 gacaaattat tggtatacaa atatatatat atatgatttt atgattataa catcatgctt + 11581 attatcaata atagtatttg tatgtaatgg tattagaatt gataaaacat attataaagg + 11641 gacaataata ctgggtattg taatgtggtt ttcaggactt attgctgcac aaggaaaagg + 11701 gctccctgct attgtaatct ttaaagagag tttatatact attactccaa taatgatatt + 11761 tttagctttc cgacctatga taaagtcaat aaaagacact tcattattcc ttcgtactat + 11821 ttctgctgcc ggtgttatat gtaatttaat tgcttgtatt gaaatgttct ttgccaaaag + 11881 aggatttgat tttctaaata taagtgtatt tgaaaaactt agaaatggta ctcctagatt + 11941 tacaattgga gaaacaataa tagttcttag tttttttatc tcctgtagtg ttgtttttag + 12001 taaaggggga aagagaaata gacgcatttt ccatgttcta aatatagctc tcacagctat + 12061 aaatttagtg tatattatta aaacaaggac actgaattta tatattttat caacacttat + 12121 gatggtgcct gttttaaaaa aaaatgtaaa gaaacaactt aagttttgga ttgtgttttt + 12181 gatatctata attcttactt ttgtttctgc agaatatttt attccaatag tcaaaaattt + 12241 aattcatagt gatcatggga ttcaaattag attcttgacg atagaatact atatagagta + 12301 ttttaaaaat cattacttat ttggagcggg atatatttct tctagtccat attttgaaac + 12361 ttattctatt gttactggtc cattaggacg ttattatcca agcgatgtag gtttgattgg + 12421 acttatgttt agaagtggga ttatcgggct aatttggtta ataagttggt tttatacaag + 12481 cttgaagata attaaagata atacgattag aattccagct cattatgact tattaatgaa + 12541 gctagttata gtttttttga tgttttcttg tattaatttg ataatcactg atgcacctag + 12601 attcccatat attgcattag ctatgttact ttttgaatca agttatacct tgagttatga + 12661 aaacagttct aattagaatg tatttcagat agttatttta aaggatgagg ggaaatgatt + 12721 aagagattag caatacttat ggccacatat aatggcgaaa aatatataaa agagcaaatt + 12781 gaaagtattc tcaaccaaga tacagatttt gattttactc taattattag agatgacggt + 12841 tcaacagata atactaaaaa tataattaga gaatatgttg atagtgggaa aattattttt + 12901 atagaaggcc agaataaagg ggcggcaaga ggatttattt ctttgttatg tgataatccg + 12961 ggatatgatt actatgcttt ctcggatcaa gatgatgttt ggaatcataa taaattacag + 13021 aaaggtatat ggagtctttc caaatatact gggccagcac tttattgttc taattgtgaa + 13081 ttagttgatt cagagttaaa 
tagtataggt cgtaatacac ataggaagag accgaactat + 13141 actcttgaat ctattctttg tcttgctagt tgtgcacaag gatgtacatc tgtatttaat + 13201 aaagagctag cttcgataat tcaggagaat gatgtgcctg atacttttat tatgcatgat + 13261 tctttgatta cttgtttatg tgcactgata ggtggaaaga taatttacga cgaaattcca + 13321 tcaatgaaat atagaatgca tgatgataat atatttggaa tggtgtcagc taagcaaaat + 13381 gtactaaatg ttataaaaga tcgtattagt gaaataacaa aaaagcgaac gattagtatg + 13441 tacgatcaag cagagtgttt actaaaggtt tataaaaaat atatagattc taacaatcaa + 13501 gatatatgta gaattgttat tgattctaaa gtatcgctaa aggcaagact taagctgatt + 13561 tttaataaaa atttgcagca tactacatta aataaaacca taacaaaaaa attagagata + 13621 ttatttggca atgactaata aaggagttta gatatgaagt atcaactcat tgtatcaaca + 13681 atgaatcaac aggataacag tctgatagag aaaatgaata taaaatctga tgcaattatc + 13741 attaatcaat caaattcatt ttcttaccat gagacgaaat tgaaaaattc gattgtaaaa + 13801 tggtatgaat tcaatgaaag aggtattggt ttaagtcgaa acacaggttt catgagatcg + 13861 gatgctgata ttattcaatt tgctgatgac gatatgattt ttacagatac atattatgaa + 13921 gacgtattat tagaatatca aaaacatcca gaagctgatg taattctttt ttcgaataaa + 13981 tgtcttaatg aagatcgaat gccttatcag gttaataatt ttagacgtat aaataggttt + 14041 gaaggtgtta agtttggtgg tgctagaatt acagtcagga gagaaaagat attgcataat + 14101 aacataacgt tttctctttt atttgggggg ggagcaaaat acggtgcagg agaggacgta + 14161 acatttattc aggactgtat caaggcagga ttacgggtat ataaatcacc tattattgtt + 14221 tctacaatga aacaagattc ttctacatgg tttaaaggat atgatagaaa atattataaa + 14281 gataaaggtg ctttattagc agcaaatttc ccttctataa gtgaggtagg agtatatata + 14341 caagctttca aaaatagggg gggaatttat acatttagtg aattacttag attttataag + 14401 gaaggtgtta acgaatttaa aataaataga tgatagattg atatgataaa gaggtttttg + 14461 attatgccaa aaaataaagt ttataatact ggcgagacag acattgagtt gaaaaataaa + 14521 tacaattatg aaggtagtga gttgaggaaa gttcaagttc gtatgattga tatgctttct + 14581 tttttgaatg atatatgcaa agaaaataac atcacctatt tcattgcttt tggaactcta + 14641 ttaggagcta ttagacatgg aggctttatt ccatgggatg atgatcttta tatttatatt + 14701 tatattaatg ataaaggttt 
aaaaaaactt agaaaaataa ttaataatgg aaactatccc + 14761 tatgttattc aagactattc tagtgataaa ggatttgtaa ggtattatag tgttctcaga + 14821 gatactaact ctgaatatat aaaaaatgaa tatcaacata atcagcgtaa atacagaggt + 14881 gtacaaattg acttattccc ttatggttat ggtgtaatga aatggggtga acgtcttatt + 14941 ggaaaaatat atggttttaa tgaaaaaata tttttaggga aaataaaatg ttggcagcat + 15001 taatttttta tttaactaaa gaagttataa ttccatttct gaaagtaatt agtaagatta + 15061 acggaagaaa gaaagtaatt tattggttgc tgacaatttt gggactgtgg atgattactc + 15121 taacacctat ttttgaaaat attgttggag ctattttaaa agtagatgga gtaggtagag + 15181 gaagtgattc attgactatt cgagcaattg gacgacagtt atattgggaa caattgaatg + 15241 agacaacttt aaaacttctt tttggaacag gataccctaa ttataattat gctttagcct + 15301 ttcaacgtac aggttttttc aagcaatatt tttttaacag acaatggttt tatgatatat + 15361 atatatttgg tattgtgggt tcctcaatta tgggattatt atttttaaaa tatcttaaaa + 15421 attcaataaa gtatgataga caatctgcag atatgattcc gttgatgtat attatttctt + 15481 tactaattgt agcctataat attattcttt ggtattggaa tgcggacggt acttttatat + 15541 tagtaatcat gatttgcgca ttggagcatg gagaacaatt attacatcag aggaatggag + 15601 tgtgattgga tgaatttaaa taaagaagtt agatggaagg ataagcaata tattgctttt + 15661 gatttttttg atacaactat ccatagaaat tgtcatcctg aagtgatttt atttgaatgg + 15721 tctaaaaaaa tttctattta tttctctttc aaaatatctg ctacagaaat ttattcaatt + 15781 aggaaaaaat ctgaaataca tgagaagcaa gaaaaacaat tggaagaaat taaatatgaa + 15841 agattacttc aacttgtttt ttatactatt ttaagtcgtt tgaagtcaga tgttaccgac + 15901 tataatcttg aagatttttt aatttatgca agaacgtgtg aagaggaaat agaattaaga + 15961 catattagta ttgatacaga tacaattaat tttattgaat ttttaaaaca aaatgggaaa + 16021 aaaataattt taatttcaga tttttattct gataaaaagc taattgaaaa attaatggtt + 16081 tcattaggga ttagagatta tttctctaaa atatttattt caagtgaaat tgggttacgt + 16141 aagtcatcag gaaatttata tgaatatgtg atcaatgaat tgagctgtaa gcctataaat + 16201 ttacttatga ttggtgataa tatttattct gatgtaaaag ttccaaaaaa actaggaata + 16261 gattcttatc ataaatctta ttcagattca catgtgactg tgagtcctaa cgatattgta + 16321 aaagcgatga ataatgttat 
ttctcaagct tgtactgaat ctttatttaa tctctatata + 16381 cctgaaatac tttattttat ttcaaagttg tacaaagaat tatctgttaa caaagctagt + 16441 gatatattat tttgttcaag agaaggtttt tttataaaaa aattatttga tctttatcaa + 16501 aaaaaaatga acttaaagct tattaactca cattattttt atgtttctag aaaatcaacg + 16561 ctatatccat catttaaaaa tattgaggat gaagattttg aagttatttt tagacaattt + 16621 cctgaaatta ctttagaaaa ttttttgatt aatttaaatt tttccaataa tgatattaac + 16681 aatattgcta agcaaacaga aattaaacaa acagacaaag tatcagataa atctattatt + 16741 aacaaattaa aacaaaataa attatttaaa gacgtttatg aattgaactg taaagaagaa + 16801 aaatattctt ttagagaata tttaaagtct gtaggagttg agaatgacaa ttctataata + 16861 aatatggtag atattggttg gaaaggcacg atacaagaca atattcaaaa agcttttcca + 16921 tctttaaata taaaagggta ttatatgggg ttgaattttc aacggtattc tactaggaat + 16981 agtatgaata agacgggaat actgtttact gatgatcctc aaaaaacaaa gttttttaac + 17041 ttatttaatt ataaatattt attctatgaa agaatttttg ttgcagatca tggaccgaca + 17101 gttagatatg aatttatgaa tggtgttggg gtaccaacat tggatacaga tgaaaatcat + 17161 atagaaattt atagatttgc tgaggaattt cagattacat ttttcaacac atttgagaaa + 17221 attttagatt tgttcaatga atcactagta acaccagatg aattatttaa cgaaatagct + 17281 aatttatcat taaaaaaaca ttgcatctat ttaccaaggc tttcagtaag tataaaaaaa + 17341 ttagatagag cagcaaaaga aaattttggt attataaaat ctactaacag gaatagtgat + 17401 aataaggtaa gaaatttttg gaaaaataga gattttttat ttttagatta tatatataaa + 17461 gcgtatggaa agaatagatt gttaaaccct atattggata tttacggata ttttgtatat + 17521 ctgattaaaa cactgcaaat aaaaatagta ggggatattt gatgagcatg aaagaaaaat + 17581 caataagtaa aaatgctatt ttgaatatta ttttaacact aacaaatatt gtgtttccat + 17641 taattacttt tccttatatt tctagaattc tgaatccgtc aggaataggc gcaatctctt + 17701 ttttttcatc tattggttct tatggtgttt tagttgcctc gcttggaatt tcaacttatg + 17761 ggattcgggt gattgcaaag aatcgttatc ataaagataa gataactaaa atattccaag + 17821 aattgatagt tattaatagt gtaatgtcta ttatagtgac gttcttcctt gttttaatga + 17881 gtttccgatt agagcagtta agttcagaaa aaggtttatt aataatcaca tgtattacta + 17941 ttttatcctc tccttttaat 
ttgaattggt tttatagtgg aatagaagag tattcatata + 18001 taacaaaacg ttcaatattt tttaaattag tttcattgat attaaccttt ttatttgtta + 18061 aaagtaaaga cgattatatt ctatatgctg tgataatatt gttttcaaca ttggcttcca + 18121 attttataaa tattttggag agtagaaaat acatcaattt taatttgaga aggaatttag + 18181 aatttagata tcatctaaaa ccaatgtggt atttatttgc ttcgttactt gcagttaata + 18241 tttatacaaa tttggattct gtgatgttag gaattattaa tggaaatgat gcggtaggta + 18301 tttactcaat cgcatcaaaa gtaaaatgga ttttattatc agtcgttact tcagtgagtt + 18361 tagttttatt acccagatta tcattttata gcaataagta tgacgaaacg aagtttaata + 18421 atattttgag aaagtcatct acaataattt ttatgatttc aattcctcta acaatttttt + 18481 ttatgataaa agcgaaagag agtatattat tgttaggtgg agagcagtat attcaggcag + 18541 ttttagcaat gcaaatatta atgccgatct tgataatatc aggtttttcc aatattatag + 18601 gtaatcagat attgatccct actggtaatg agaaatattt tatgagagca gtttctatag + 18661 gggcaatagt aaatttatgt ttaaatttgt tgcttatgcc tattttggga attatcggag + 18721 gtgcaatcgc aactctttgt gcagaatcag tccaaatgat tattcaattt tatttttctc + 18781 gtaataaatt aatgggtaat atttcattaa attcaatcaa aaaagtagcc tattcatcaa + 18841 tttttgcggg tatactgtta atagtaatac aaaatattat agagaatttt aatagcttct + 18901 taaatttagc tgcttctagt tttctatatt ttggagtata ttttttctta ttggtattgt + 18961 ttaaagaaag tacaattaag aaatttctaa atcaaatttt ttataaggat atttcatgaa + 19021 tttattacca attatttatg gagcgattct tgatttaata ttagaataat tttttaaagt + 19081 gaatgaaatc aaagcaataa aagactaaaa ataaattgct atctattatg tttttctcaa + 19141 actaagtaaa acataactca tgaaaacaaa tttaaaaagg agggactata gtatgaaagg + 19201 tattattctt gcaggtggtt cggggacacg attatatcct ttgactcggg ctgcatcaaa + 19261 acaacttatg ccggtttatg ataaaccgat gatttactat ccactttcaa cattgatgtt + 19321 ggctgggatt agggatattt tgataatctc aactcctcaa gatttgcctc gttttaaaga + 19381 gcttcttcaa gacggatctg agtttgggat taaactttct tatgcagagc aaccaagtcc + 19441 agatggtttg gcacaagcct ttatcattgg ggaagagttt attggtgatg atagtgttgc + 19501 tttgattttg ggggacaata tctatcacgg ccctggtttg agcaaaatgc ttcaaaaagc + 19561 agccaagaaa gagaaaggtg 
cgactgtttt tggctaccaa gtgaaggatc cagagcgttt + 19621 tggtgtggtt gagtttgata cagacatgaa tgctatctcc atcgaagaaa agccagaata + 19681 ccctcgttca aactatgcag tgacaggact ctatttctat gataatgatg tagtagagat + 19741 tgccaagagt atcaaaccaa gtcctcgcgg agaattagaa atcacagatg tcaacaaggc + 19801 ttacttggat cgtggagact tatccgttga gcttatggga cgtggctttg cttggctgga + 19861 tactggaact catgaaagtt tactagaggc ttcacagtac atcgaaacag tgcaacggat + 19921 gcaaaatgtt caggtagcaa acttagaaga aattgcttac cgtatgggct atatcagtcg + 19981 agaagatgta ttggccttag cccaaccact taagaaaaat gaatacggac agtatctgct + 20041 ccgtttgatt ggagaagcat agatgacaga taattttttc ggtaagacgc ttgcggcacg + 20101 caaggttgaa gctattccag gcatgttgga gtttgatatc cccgttcatg gagataatcg + 20161 tggctggttt aaagaaaatt tccaaaagga aaaaatgctt ccacttggat ttccagagtc + 20221 tttctttgca gaaggaaaat tgcaaaacaa tgtatccttc tcacgtaaaa atgtccttcg + 20281 aggcctccac gcagagcctt gggataagta catctctgta gcagatggag ggaaagttct + 20341 gggttcttgg gttgatctac gcgagggtga aacctttggg aatacctatc agacagtgat + 20401 tgatgcgagt aagggaatct ttgttcctcg aggcgtagct aatggcttcc aagttttatc + 20461 agatacagtg tcatatagct atctggtcaa tgattactgg gctcttgaac tcaaacccaa + 20521 gtatgccttt gtgaactacg ctgatccaag ccttggtatt gaatgggaaa atattgcaga + 20581 agcagaggtt tcagaagcag ataaaaatca tccactactt aaggatgtaa aacctttgaa + 20641 aaaagaagat ttggaataag gaaagaatat gactgaatac aaaaatatta tcgtgacagg + 20701 tggagctggc tttatcggtt ctaactttgt ccattatgtt tacgagaact ttccagatgt + 20761 tcacgtgaca gtcctagata agttgactta tgctggaaac cgcgcgaata ttgaggaaat + 20821 tttaggtaat cgtgttgagt tagttgttgg tgacattgct gatgcggagt tggtagacaa + 20881 gttggctgct caagcagatg ctatcgttca ttatgcagcg gaaagccaca atgataattc + 20941 gctcaatgat ccatcgccat ttattcatac taacttcatt ggaacctata ctcttttaga + 21001 agctgctcgt aagtatgata ttcgcttcca ccatgtatcg acagatgaag tttatgggga + 21061 tctcccttta cgcgaagatt tgccaggtca tggagaaggg ccgggtgaga aatttacggc + 21121 tgaaaccaag tacaatccaa gctcgcctta ctcatcaacc aaggcagcct cagatttgat + 21181 tgtcaaagcc tgggtgcgtt 
cttttggagt caaggcaacg atttccaact gttcaaataa + 21241 ctacggtcct tatcaacata tcgaaaaatt catcccacgt cagattacta acatcctaag + 21301 tggtatcaag ccaaaacttt acggtgaagg taaaaacgtt cgtgactgga ttcataccaa + 21361 tgaccattct tcaggagttt ggacaatctt gacaaaaggg caaatcggtg aaacctactt + 21421 gattggggct gatggtgaga agaacaataa ggaagttttg gaacttatcc ttaaggaaat + 21481 gggacaagct gcggatgcct atgatcatgt gactgaccgt gcaggacatg accttcgcta + 21541 tgcgattgat gctagcaagc tccgtgatga gttggggtgg aaacctgaat ttaccaactt + 21601 tgaagctggg ctcaaggcaa caatcaagtg gtatacagat aaccaagaat ggtggaaagc + 21661 agaaaaagaa gctgttgaag ccaattatgc taagactcag gagattatta cagtataaaa + 21721 agcaggaaat agctgctttt tattgctata ttgggaagag ttacatatta gaaaggtcta + 21781 gagatgattt taattacagg ggcaaatggc caattaggaa cggaacttcg ctatttattg + 21841 gatgaacgta atgaagaata cgtggcagta gatgtggcta agatggacat taccaatgaa + 21901 gaaatggttg agaaagtttt tgaagaggtg aaaccgactt tagtctacca ttgtgcagcc + 21961 tacaccgctg ttgatgcagc agaggatgaa ggaaaagagt tggacttcgc catcaatgtg + 22021 acggggacaa aaaatgtcgc aaaagcatct gaaaagcatg gtgcaactct agtttatatt + 22081 tctacggact atgtctttga cggtaagaaa ccagttggac aagagtggga agttgatgac + 22141 cgaccagatc cacagacaga atatggacgc actaagcgta tgggggaaga gttagttgag + 22201 aagcatgtgt ctaatttcta tattatccgt actgcctggg tatttggaaa ttatggcaaa + 22261 aacttcgttt ttaccatgca aaatcttgcg aaaactcata agactttaac agttgtaaat + 22321 gaccagtacg gtcgtccgac ttggactcgt accttggctg agttcatgac ctacctagct + 22381 gaaaatcgta aggaatttgg ttattatcat ttgtcaaatg atgcgacaga agacacaaca + 22441 tggtatgatt ttgcagttga aattttgaaa gatacagatg tcgaagtcaa gccagtagat + 22501 tccagtcaat ttccagccaa agctaaacgt ccgctaaact caacgatgag cctggccaaa + 22561 gccaaagcta ctggatttgt tattccaact tggcaagatg cattgcaaga attttacaaa + 22621 caagaagtga gataagtagt agaatgattt tctagtctaa taaaagaggc agagaatgaa + 22681 ctccaaagga gcataagatg tacgattatc ttatcgttgg tgccggtctt tttggtgcag + 22741 tatttgccca tgaatcagcc ttaaaaggaa aaaaagtaaa agttattgaa aaacgaaatc + 22801 atattgcggg taatatctat 
actcgtgaag aggaaggaat tcaagttcat cagtatggtg + 22861 ctcatatctt tcatacttct gataaggaga tctgggatta tgtgaaccag tttgcagagt + 22921 ttaaccgtta tacaaattct cctgttgcaa actataaggg agagatttat aacttacctt + 22981 ttaatatgaa taccttcaat aaactctggg gagttgtgac gccagcagaa gcacaagcta + 23041 agattgagga acaacgtgct attttaaatg gtaaaactcc tgaaaatttg aaagaacagg + 23101 cgatttctct tgtaggtaca gacatctacg aaaaattaat caaagactat acagagaaac + 23161 agtggggcaa accaactact gaacttccat cctttattat tcgccgttta ccagtacacc + 23221 tgacctatga taacaactat tttaacgata cctatcaagg gattccaatt ggtggataca + 23281 ctcaaatagt tgaaaaatgt tggattatga aaatattgat gtagaaacaa atgttgattt + 23341 ctttgtgaac aaagagcaat atctgaaaga ttttcctaag attgtcttta ctggtatgat + 23401 tgatgaattc tttgactata agttgggcga actagagtac cgtagtcttc gttttgaaaa + 23461 tgagaccttg gatatggaaa attaccaagg aaatgcagtt gtgaactata cggatgcaga + 23521 aaccccatat actcgcatta ttgaacacaa acattttgag tttgggagtc aagcaaagac + 23581 tatcattact aaagaacatt ctaaaacatg ggaaaaaggt gatgagcctt attatccagt + 23641 taataatgat cgtaataatc atttgtataa atcgtataaa aaatttgctg atgagcaagg + 23701 gaatgttatc tttggtggcc gcttaggaca ctatcgttat tacgatatgc accaagtaat + 23761 tggagcagct ttgcagtgcg tgagaaatga gttagattaa tactcaatga aaatcaaaga + 23821 gcaaactagg aagctagcca caggttgctc aaaatactgt tttgaggttg cagatggaag + 23881 ctgacgcggt ttgaagagat tttcgaagag tataaacaag taaaactgac taccagttat + 23941 tatttagaaa tagtattaaa aattccttga ctatgtgata tagttgaggg atttttaaat + 24001 gatattcata ttttttgcaa agatgttgtt tgaaaaataa ttttcaaaaa ttctgaaaat + 24061 tctgttgaca actttctgaa aagagtctat aatggagaga aagttttaaa ggagaaaatg + 24121 atgaaaagtt caaaactatt tgcccttgcg ggcgtgacat tattg +// + diff --git a/public/res/serotype_genbank/serotype_25A.gb b/public/res/serotype_genbank/serotype_25A.gb new file mode 100644 index 0000000..5a3d65c --- /dev/null +++ b/public/res/serotype_genbank/serotype_25A.gb @@ -0,0 +1,1175 @@ +LOCUS CR931689 28466 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain tp 25/38, 
sp 65/81 (serotype 25a). +ACCESSION CR931689 +VERSION CR931689.2 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 28466) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 28466) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT On Mar 17, 2006 this sequence version replaced CR931689.1. + NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..28466 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="tp 25/38, sp 65/81" + /db_xref="taxon:1313" + gene <1..163 + /gene="dexB" + /locus_tag="SPC25A_0001" + CDS <1..163 + /gene="dexB" + /locus_tag="SPC25A_0001" + /codon_start=2 + /transl_table=11 + /protein_id="CAI33954.2" + /db_xref="GOA:Q4JZD8" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4JZD8" + /translation="DRRFLVVANLSNEEQDLTVEGKVKSVLIENTAAKEVLEKQVLAP + WDAFCVELL" + gene order(322..1752,1788..2273) + /gene="aliB" + /locus_tag="SPC25A_0002" + /pseudo + CDS join(322..1752,1788..2273) + /gene="aliB" + /locus_tag="SPC25A_0002" + /note="member of homology group 169; + old_tribe:0162 2" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + misc_feature join(538..1752,1788..1871) + /gene="aliB" + /locus_tag="SPC25A_0002" + /note="HMMPfam hit to PF00496, Bacterial extracellular + solute-binding prot, score 4.5e-36" + /pseudo + gene complement(order(2417..2998,3052..3740)) + /gene="tnp" + /locus_tag="SPC25A_0003" + /pseudo + CDS complement(join(2417..2998,3052..3225,3225..3740)) + /gene="tnp" + /locus_tag="SPC25A_0003" + /note="member of homology group 13; + old_tribe:0015 22" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1167 transposase" + misc_feature complement(join(2918..2998,3052..3225,3225..3248)) + /gene="tnp" + /locus_tag="SPC25A_0003" + /note="HMMPfam hit to PF01610, Transposase, score 2.3e-31" + /pseudo + gene 3778..3999 + /gene="tnp" + /locus_tag="SPC25A_0004" + /pseudo + CDS 3778..3999 + /gene="tnp" + /locus_tag="SPC25A_0004" + /note="Lone member of homology group 0248" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1381 transposase (fragment)" + gene 4276..5373 + /gene="glf" + /locus_tag="SPC25A_0005" + CDS 4276..5373 + /gene="glf" + /locus_tag="SPC25A_0005" + /EC_number="5.4.99.9" + /note="member of homology 
group 6; + old_tribe:0006 56" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI33958.2" + /db_xref="GOA:Q4K079" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR006076" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K079" + /translation="MYDYLIVGAGLSGAIFAYEATKRGKKVKVIDKRNHIGGNIYCEN + IEGVNVHKYGAHIFHTSNKKVWDYVNQFAEFNNYINSPVANYKGSLYNLPFNMNTFYA + TWGTKTPQEVKNKIAEQTAHMKDVEPKNLEEQAIKLIGPDIYEKLIKGYTEKQWGRSA + TDLPPFIIKRLPVRLTFDNNYFNDRYQGIPIGGYNVIIENMLKGVEVELGVDFFANRQ + ELEASAEKVVFTGMIDQYFDYKHGELEYRSLRFEHEVLDKENYQGNAVVNYTEREIPY + TRIIEHKHFEYGTQDKTVITREYPADWKRGDEPYYPINDERNNAMFAKYQEEAVQNDK + VIFCGRLADYKYYDMHVVIERALEVVRNEFS" + misc_feature 4711..5313 + /gene="glf" + /locus_tag="SPC25A_0005" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 2.4e-135" + gene 5691..6371 + /gene="wzd" + /locus_tag="SPC25A_0006" + CDS 5691..6371 + /gene="wzd" + /locus_tag="SPC25A_0006" + /note="member of homology group 2; + old_tribe:0002 80" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33959.2" + /db_xref="GOA:Q4JZ56" + /db_xref="InterPro:IPR003856" + /db_xref="UniProtKB/TrEMBL:Q4JZ56" + /translation="MNNRIVDISLFDLLNVLWLRKWIIVFVSFVFGCISFLYYQFFVP + KTYTSDTRIYVVSKGDNKNLSNADLQAGSALTKDYKEIILSDEVLEETISDLKLESTL + ESLASKIKISIPAETRIISISVTNTNSDEAARIANGIRKVAALKIKEVTQVTDVTTLQ + TARPPQTPSGPHVRKSTTAGLVLGAFLTVFLVVAKEILDDRIKRFEELEKLGIPILGS + IPLSKNIK" + misc_feature 5706..6116 + /gene="wzd" + /locus_tag="SPC25A_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 2.5e-41" + gene 6378..7067 + /gene="wze" + /locus_tag="SPC25A_0007" + CDS 6378..7067 + /gene="wze" + /locus_tag="SPC25A_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3; + old_tribe:0003 80" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33960.2" + 
/db_xref="GOA:Q4JZ55" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4JZ55" + /translation="MGKLELTRKYYQLYNETKEYFNALQTNIQLSGDGLKVISVTSTV + KNEGKSTISVGLSMSLALSGYKVLLLDVDLRNSVMSGMFHSRERITGLTEYLSGKAGM + ADSMQETTLDNLYILQAGVVSPNPLSLLRSVKFETLIDSMKKYFDYIIVDTPPIGQVI + DAAIIAQQCDGIFLVTEMRKTTRRQIFSSLQQLEQTGVPVLGLVANKAIIKKDSYGYY + GKNTASETERY" + gene order(7258..7568,7590..7655,7660..7977) + /gene="tnp" + /locus_tag="SPC25A_0008" + /pseudo + CDS join(7258..7374,7374..7568,7590..7655,7660..7977) + /gene="tnp" + /locus_tag="SPC25A_0008" + /note="member of homology group 19; + old_tribe:0021 15" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1381 transposase" + misc_feature join(7503..7568,7590..7655,7660..7971) + /gene="tnp" + /locus_tag="SPC25A_0008" + /note="HMMPfam hit to PF01609, Transposase DDE domain, + score 2.1e-09" + /pseudo + gene 8198..9649 + /gene="wzg" + /locus_tag="SPC25A_0009" + CDS 8198..9649 + /gene="wzg" + /locus_tag="SPC25A_0009" + /note="member of homology group 0; + old_tribe:0000 80" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33962.2" + /db_xref="GOA:Q4K075" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K075" + /translation="MRYFMSREKKRGTAVHLKSYINSVLLILYTGIASLFLFQIFRYN + ILNFRNLNLLVALLVVLVFILGVSLIVRKKAEKLTMLLLILAVASSSISLLAVQQFIG + FTSRLNATSNVSEYAISLVVLKDSEISELEQVSHVMAPTDTDYEAIQSLLADIKEKQG + KDLIVDKSKSYLEAYKSLISGDTKVIFLNSIFEHMIESDFPDFRDKIKKIYTKEMTKK + VEAPKVSKGQAFTIYFSGIDTYGPINSVSRSDVNILMTVNSETKKILLTTTPRDSYVA + IADGGKNRKDKLTHAGIYGIDSSIHTLEHLYGVEINYYVRVNFTSFLKIVDLLNGIDV + DDSQEFTIDGNDYPVGNLHLNSKSALGFVRERHSLADGDRDRGRNQQKVLAAIIQKLT + SIESLKNYRQIMQGLEDSIQTNLSPTTIMDLANTQLESGGNYKINSQDLKGTGRMDLP + SYAMPDSQLYMMEIDENSLSAIKENIQAVLEGR" + misc_feature 8414..8761 + /gene="wzg" + /locus_tag="SPC25A_0009" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 9.5e-40" + 
misc_feature 8939..9376 + /gene="wzg" + /locus_tag="SPC25A_0009" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 6.7e-63" + gene 9588..10382 + /gene="wzh" + /locus_tag="SPC25A_0010" + CDS 9588..10382 + /gene="wzh" + /locus_tag="SPC25A_0010" + /EC_number="3.1.3.48" + /note="member of homology group 1; + old_tribe:0001 80" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33963.2" + /db_xref="GOA:Q4JZ53" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4JZ53" + /translation="MMRIASQLSKKIFRLFWRVGKMIDVHSHIIFDVDDGPKSIEDSR + ALLLEAYDQGIRTIVSTSHRRQGMFETPEDKIAENFRAVQKIARDIADDLTILYGAEI + YYTQDIINKLEKKTFPTLNGSRYALIEFSSETSYRSIHSALQQLLLSGITPLIAHIER + YDALENNKQAVLELIRMGCYTQINSSHLLKKKLFKDDAKIMKKRVHYFLKHDLVHIVA + SDMHNLDTRPPYMAEAYEIISKRYGKEKAEEFFIKNPQRILMDQLI" + misc_feature 9654..10262 + /gene="wzh" + /locus_tag="SPC25A_0010" + /note="HMMPfam hit to PF02811, PHP domain, score 3.6e-36" + gene 10401..10988 + /gene="wciI" + /locus_tag="SPC25A_0011" + CDS 10401..10988 + /gene="wciI" + /locus_tag="SPC25A_0011" + /note="member of homology group 29; + old_tribe:0034 8" + /codon_start=1 + /transl_table=11 + /product="putative initial sugar transferase" + /protein_id="CAI33964.2" + /db_xref="GOA:Q4K061" + /db_xref="InterPro:IPR003362" + /db_xref="UniProtKB/TrEMBL:Q4K061" + /translation="MYKVIKRFIDIALALLGIVLLSPLFLGIIVFIKLESKGPIFFKQ + KRIGLHKKEFYILKFRTMRIDTPSAVPTHLLKNPYQWITKVGKVLRRTSLDELPQIWN + ILVGHMSLVGPRPALWNQFDLIEERDKYGANDILPGLTGWAQINGRDELSIPVKAKFD + GYYVKNCSFVLDCRCVVESFLVVFKRYGHREGGAD" + misc_feature 10416..10970 + /gene="wciI" + /locus_tag="SPC25A_0011" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 3e-32" + gene 11001..12131 + /gene="wcyA" + /locus_tag="SPC25A_0012" + CDS 11001..12131 + /gene="wcyA" + /locus_tag="SPC25A_0012" + /note="member of homology group 170; + old_tribe:0163 2" + /codon_start=1 + /transl_table=11 + 
/product="putative glycosyl transferase" + /protein_id="CAI33965.2" + /db_xref="GOA:Q4K060" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K060" + /translation="MGNRKKVFVVANVVKEHILKFHIPTIKEMTKRGWTVDVGASGDE + TVPYCHQQYSLPHQRSPFHLGTLKSIWKLRKILKSGGYDIVYCHTPVGGLVGRLASLG + LRKQGTRVIYFAHGYHFYKGATFFNWLVYYPIEKLLSLFTDSIILINQEDYHLTKTKF + KQVQSYLVSGMGVKQERFSPQSNQVRERYRKELKLPEDATVLIYCAELIKNKNQTFLL + HAMKKLVDQGENLYCLLVGIDYTKGEMVECIQSLNLSDRVLLLGWREDIANLYACSDI + CVATSIREGFGLNIVEAMFCHVPVVATINRGHASIIQDGQNGLLVQLGNTKQLVEAIY + VLMKDTKKKQELVEQASANLEQYHSQKIVNSLLEIIEQTAMK" + misc_feature 11556..12071 + /gene="wcyA" + /locus_tag="SPC25A_0012" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 3.5e-40" + gene 12128..13558 + /gene="wzy" + /locus_tag="SPC25A_0013" + CDS 12128..13558 + /gene="wzy" + /locus_tag="SPC25A_0013" + /note="member of homology group 171; + old_tribe:0164 2" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33966.2" + /db_xref="UniProtKB/TrEMBL:Q4K059" + /translation="MSEGCEKVKIQIDKIYYLFFWLVVSFGYFFMMPTFTEDLEGVVS + ASLVQLLLFIIGYVYVSYLNRSFISLYSIFMIVFYLFQNGQVLLYSLGVEYDYFYVLR + YDETIVLQSVIFSTQCLIAAFMAGVFSTKKEVSKPLYSYMDQLEREKLITAGKLFWGA + FAIFALPFMMMKFVITSTSGYFAMIRFVGSLPTITVLFEKMFIASSVFLVVYLKSEET + WSKFLKVVILGWSIMAALTGDRTVGLAGIVTLALIQTLIGNRKKKIKFSQYALLVGAA + VVVMYLMSFAFQFRMQQDSKVSGLQTAVVEMIGTLGFSFFPLVLTIRIVPTSINFFRG + KSYIAAIITGLIPSNFDFLHLTKTLSEWNAYPTELLDTIYHYGFGLDYSLIAEAYINF + GSYGWIAIFFLCSLIAYFVRDVDFKRKDNLFSQYASLILLYSWFTLPRRKSYFIFNNF + FWYVLFFGLALILVSRSIKQRKEFKK" + gene 13555..14322 + /gene="wcyB" + /locus_tag="SPC25A_0014" + CDS 13555..14322 + /gene="wcyB" + /locus_tag="SPC25A_0014" + /note="member of homology group 172; + old_tribe:0165 2" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33967.2" + /db_xref="GOA:Q4K058" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K058" + 
/translation="MKISIIMGIHNGEKRFETAVQSIFNQTYDNWEFIICDDASTDKT + FEKLQGLYGQDSRFILLKNEKNVGLSATLNRCIEASSGEFIARMDDDDICYPERFERQ + VDYLFHHPEIDFVSSSIDIFDGEVVVGTRILLDFPSKKDLIWNSPFVHPVTMFRRDAL + LEVGGYRVSPETVRGQDYDLFMRLYSREKKGGNILEPLFRYTIDQNTMKRRTFKARIG + EMIIRYKGYRAMKVPFYNYVFIFKPLVAHLVTLVKRR" + misc_feature 13564..14046 + /gene="wcyB" + /locus_tag="SPC25A_0014" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 3.2e-39" + gene 14322..15503 + /gene="wcyC" + /locus_tag="SPC25A_0015" + CDS 14322..15503 + /gene="wcyC" + /locus_tag="SPC25A_0015" + /note="member of homology group 173; + old_tribe:0166 2" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33968.2" + /db_xref="GOA:Q4K057" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K057" + /translation="MFMKILITTHTYLPNKDGVQFVNQYLAEGLVKKGHQVTVLTYCY + PSRTRVPREVINGVRVIRWNARTSCTFHKGEKLAYQNFILNSQSDYDVLVNVGTQTAL + TDWLFPIFSQITIPKVLYIHSIWDFNWLHWHRQSFKRFVAKTWANVRWKYYYWKQTVI + FKQYNEVIQLHPKDYSVAFFKEKYDIESQILGNAADASFFQNKNAIKKQSYIVNVSNF + NDLKNQKKAVEYFLKSNLSSEWKFVLVGSEKNDYLQSVQDFEKELRNQLGITSGKEIE + YRIGLSREEVVKTVKEASFCLLTSIREAFPISLIEVMAAGIPFISSDVGIVNYLSGGI + TACSDQEFIRAIEEFATYPEVRNQYGKKGQMEAKEHYQVDDKVKEFETLLQKFVKEEE + D" + misc_feature 14910..15419 + /gene="wcyC" + /locus_tag="SPC25A_0015" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 1.2e-13" + gene 15500..16465 + /gene="wcyD" + /locus_tag="SPC25A_0016" + CDS 15500..16465 + /gene="wcyD" + /locus_tag="SPC25A_0016" + /note="member of homology group 174; + old_tribe:0167 2" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33969.2" + /db_xref="GOA:Q4K056" + /db_xref="UniProtKB/TrEMBL:Q4K056" + /translation="MKKIVFLCPYFGTLPPHTQLWLNSCKMNPSVTWYLFTDDKRTFD + YPENVQVFYTTLEETKALYQRKFDFEISLEGAYKLGDYKPLFGYLYEEMIQEFDAWGH + IDVYDEIYGDIRAFVTDELLDKYDKLMFFGHMGIYRNSPEVNRRFKLSSDLDRTYQEI + FSSSQFYNFEEYVAGSITRVYQKNGFPIGRLDKVIADLSGLSYHFRRGYYSDDFETFT + 
YLPNLPMIFSWEDGKTYCYSVQNNQVQKNEFLYVHFKRRKMIQSISNDVSAYLIVPNG + FVEMPKEITVDLIQKYSQKKLFYPVYFQEKWKGVKRLLKKIGRSE" + gene order(16462..16557,16565..17089,17122..17160) + /gene="wcyE" + /locus_tag="SPC25A_0017" + /pseudo + CDS join(16462..16557,16565..17089,17122..17160) + /gene="wcyE" + /locus_tag="SPC25A_0017" + /note="member of homology group 175" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + gene 17151..18566 + /gene="wzx" + /locus_tag="SPC25A_0018" + CDS 17151..18566 + /gene="wzx" + /locus_tag="SPC25A_0018" + /note="member of homology group 176; + old_tribe:0168 2" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAJ84825.1" + /db_xref="GOA:Q4K055" + /db_xref="InterPro:IPR002528" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K055" + /translation="METKEKRLVNNTIIFTIGSLGSKFIQFLLVPLYTYTLTAAQFGI + TEILLTAVNLLIPVFSISIADGLLRFGLDKTLRRENVLKSAFIISILGTILSIISIPI + FSLYPTLSEWMVYFIIILNLRMYRDVFAIQLKVEGKNTLFACDSMIYTFVLSLASIVF + LVPFSLGISGYFFAYIVSNGISIFFILFFGGVWKSFTSGRFEKQLMIQLLKYSAPMIL + NGIAWWITNASDRFMLQWFMDDRAVGLYGVVAKLPLLIGTFTGVFNQAWIISAVEEFE + EENEEWFYQKVFHQYYAALFLSVSVFLLLLQPFMKVYVSPSFYEAWQYAPFLLLSSVV + SGIAAFMTGFYVAQKKNLNIIYTTIAGAFANILLNAMFIPMLGVLGASIATFLSWFVI + AIYRMKDVENFACFPLDKKVFWYLFLLCIQTITMTFLPILGIVFSVVLIPYFFYQEQE + FLAVLFDKGRKKVCSFKKSKR" + misc_feature 17172..17975 + /gene="wzx" + /locus_tag="SPC25A_0018" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 3.4e-10" + gene 18539..19201 + /gene="wcyF" + /locus_tag="SPC25A_0019" + CDS 18539..19201 + /gene="wcyF" + /locus_tag="SPC25A_0019" + /note="member of homology group 177; + old_tribe:0169 2" + /codon_start=1 + /transl_table=11 + /product="conserved hypothetical protein" + /protein_id="CAJ84826.1" + /db_xref="InterPro:IPR015037" + /db_xref="UniProtKB/TrEMBL:Q4JZ44" + /translation="MFIQKIKKIIRVFLRKSLVKDYRQRIQNKEFTLITSNCVGGLIS + HDLGLQFRSPTINMYIEAADFIQFCSHLERYLKEDLSFIEVNQDGHFVALCGDIKIYI + 
VHYNSFEEFAKKWSERAKRVDFDQLYLMMSERDGCRYEDIVKFDTLPYKNKVIFTSKK + MPEIQSAFYIPGIETKNNQKHKVKSVTTYLNSFTGKRYIDLFDFVEFLNTGRKQLSKY + EK" + gene 19191..20273 + /gene="gla" + /locus_tag="SPC25A_0020" + CDS 19191..20273 + /gene="gla" + /locus_tag="SPC25A_0020" + /note="member of homology group 96; + old_tribe:0170 2" + /codon_start=1 + /transl_table=11 + /product="putative epimerase" + /protein_id="CAJ84827.1" + /db_xref="GOA:Q4JZ43" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR008089" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JZ43" + /translation="MKSKIILKNKTILVTGAAGFIGANLVMSLLQEENPLQIIGIDNL + NDYYDVSLKEYRLSTIQEECQSSLNKKWVFIKGDIADSDLMEEIFETYRPQIVVNLAA + QAGVRYSITNPDVYMKSNIIGFHTILEKCRKYQENIEHLVYASSSSVYGGNTKIPFSE + LDAVDNPVSLYAVTKKTNELEAHAYSKLYNIPTTGLRFFTVYGPAGRPDMAYFSFTKQ + LIDKKPIEIFNYGNCQRDFTYIDDIVEGVKRVMTGAPQKEIGEDGLPIPPYAIYNIGN + HQPENLLNFVEILQEKLIAASILPEDYDFSSAQKLVPMQAGDVVATYADISLLEKDFN + FKPKTSLRNGLRNFAEWYRNFYQRGE" + misc_feature 19221..20252 + /gene="gla" + /locus_tag="SPC25A_0020" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.00023" + misc_feature 19224..20129 + /gene="gla" + /locus_tag="SPC25A_0020" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 7.1e-05" + misc_feature 19224..20015 + /gene="gla" + /locus_tag="SPC25A_0020" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 8.3e-55" + misc_feature 19227..20093 + /gene="gla" + /locus_tag="SPC25A_0020" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 5.4e-09" + gene 20233..21501 + /gene="ugd" + /locus_tag="SPC25A_0021" + CDS 20233..21501 + /gene="ugd" + /locus_tag="SPC25A_0021" + /note="member of homology group 20; + old_tribe:0020 15" + /codon_start=1 + /transl_table=11 + /product="UDP-glucose 6-dehydrogenase Ugd" + /protein_id="CAJ84828.1" + /db_xref="GOA:Q4JZ42" + /db_xref="InterPro:IPR001732" + /db_xref="InterPro:IPR008927" + /db_xref="InterPro:IPR013328" + 
/db_xref="InterPro:IPR014026" + /db_xref="InterPro:IPR014027" + /db_xref="InterPro:IPR014028" + /db_xref="InterPro:IPR016040" + /db_xref="InterPro:IPR017476" + /db_xref="UniProtKB/TrEMBL:Q4JZ42" + /translation="MQNGIEIFIKGVNRMKITVVGMGYVGLSLAVLLAQHHEVTALDI + IDKKIQLINEKKSPIQDEYIEQYFLEKNLHLSATTNEVEAYKDAEMIIIAAPTDYDTH + KNFFDTSAVEQVIENIISMNNEALIVIKSTVPVGYTESIREKYGKKNILFSPEFLREA + NGLYDNLYPNRIIVGTDLNDGALVSKAHEFVSLLQEGALKENIDTLIMGFSEAEAVKL + FSNAYLALRVSYFNELDTYAELKGLNTKAIIDGVGLDPRIGQFYNNPSFGYGGYCLPK + DSKQLLSNYHDVPENIISAIVSSNETRKKFIAERILEIVGANHIDEYYNLKQEIVVGI + YRLVMKKGSDNFRHSSIQGIIKRLKANGVTLMIYEPSLPDGQLFFGSEVVHDFPKFKE + KSHLIVANRFDETLMDVKDKVYTRDLFGRD" + misc_feature 20275..20832 + /gene="ugd" + /locus_tag="SPC25A_0021" + /note="HMMPfam hit to PF03721, UDP-glucose/GDP-mannose + dehydrogenase, score 1.3e-45" + misc_feature 20275..20673 + /gene="ugd" + /locus_tag="SPC25A_0021" + /note="HMMPfam hit to PF01210, NAD-dependent + glycerol-3-phosphate deh, score 0.0013" + misc_feature 20860..21141 + /gene="ugd" + /locus_tag="SPC25A_0021" + /note="HMMPfam hit to PF00984, UDP-glucose/GDP-mannose + dehydrogenase, score 1.6e-35" + misc_feature 21241..21480 + /gene="ugd" + /locus_tag="SPC25A_0021" + /note="HMMPfam hit to PF03720, UDP-glucose/GDP-mannose + dehydrogenase, score 8.5e-05" + gene complement(order(21633..22214,22271..22956)) + /gene="tnp" + /locus_tag="SPC25A_0022" + /pseudo + CDS complement(join(21633..22214,22271..22441,22441..22956)) + /gene="tnp" + /locus_tag="SPC25A_0022" + /note="member of homology group 13; + old_tribe:0015 22" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1167 transposase" + misc_feature complement(join(22134..22214,22271..22441,22441..22464)) + /gene="tnp" + /locus_tag="SPC25A_0022" + /note="HMMPfam hit to PF01610, Transposase, score 1.2e-31" + /pseudo + gene 23942..25219 + /gene="intron" + /locus_tag="SPC25A_0023" + CDS 23942..25219 + /gene="intron" + /locus_tag="SPC25A_0023" + /note="member of homology group 108; + 
old_tribe:0103 3" + /codon_start=1 + /transl_table=11 + /product="putative group II intron protein" + /protein_id="CAJ84830.1" + /db_xref="GOA:Q4K051" + /db_xref="InterPro:IPR000477" + /db_xref="InterPro:IPR013597" + /db_xref="InterPro:IPR015706" + /db_xref="UniProtKB/TrEMBL:Q4K051" + /translation="MSKLLDKILSRENMLEAYNQVKSNKGSAGIDGMTIEEMDNYLRQ + NWRLTKELIKQRKYKPQPVLKVEIPKPDGGIRQLGIPTVMDRMIQQAIVQVMSPICEP + HFSDTSYDFRPNRSCEKAIMKLLEYLNDGYEWIVDIDLEKFFDTVPQDRLMSLVHNII + EDGDTESLIRKYLHSGVIINGQRYKTLVGTPQGGNLSPLLSNIMLNELDKELEKRGLR + FVRYADDCVITVGSEAASKRVMYSVSRFIEKRLGLKVNMTKTKITRPRELKYLGFGFW + KSSDGWKSRPHQDSVRRFKFKLKKLTQRKWSIDLTRRIEQLNLSIRGWINYFSLGNMK + SIVASIDERLRTRLRVIIWKQWKKKSRRLWGLLKLGVPKWIADKVSGWGDHYQLVAQK + SVLKRAISKPVLEKRGLVSCLDYYLERHALKVS" + misc_feature 24116..24766 + /gene="intron" + /locus_tag="SPC25A_0023" + /note="HMMPfam hit to PF00078, Reverse transcriptase + (RNA-dependent DNA pol, score 6.4e-63" + misc_feature 24812..25063 + /gene="intron" + /locus_tag="SPC25A_0023" + /note="HMMPfam hit to PF08388, Group II intron, + maturase-specific domain, score 3.5e-30" + gene complement(order(25279..25752,25754..26080)) + /gene="tnp" + /locus_tag="SPC25A_0024" + /pseudo + CDS complement(join(25279..25752,25754..26080)) + /gene="tnp" + /locus_tag="SPC25A_0024" + /note="member of homology group 4; + old_tribe:0004 68" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(join(25690..25752,25754..26062)) + /gene="tnp" + /locus_tag="SPC25A_0024" + /note="HMMPfam hit to PF01710, Transposase, score 2.2e-23" + /pseudo + gene 26341..26442 + /gene="tnp" + /locus_tag="SPC25A_0025" + /pseudo + CDS 26341..26442 + /gene="tnp" + /locus_tag="SPC25A_0025" + /note="member of homology group 0019 18; + member of homology group 0022 16; + old_tribe:0171 2; + old_tribe:0021 15" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1381 transposase" + /db_xref="PSEUDO:CAJ84832.1" + gene 
order(26442..26657,26674..27165) + /gene="tnp" + /locus_tag="SPC25A_0026" + /pseudo + CDS join(26442..26657,26674..27165) + /gene="tnp" + /locus_tag="SPC25A_0026" + /note="member of homology group 19; + member of homology group 19; + old_tribe:0171 2; + old_tribe:0021 15" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1381 transposase" + misc_feature join(26586..26657,26674..27048) + /gene="tnp" + /locus_tag="SPC25A_0026" + /note="HMMPfam hit to PF01609, Transposase DDE domain, + score 0.0004" + /pseudo + gene 27311..28294 + /gene="tnp" + /locus_tag="SPC25A_0028" + /pseudo + CDS 27311..28294 + /gene="tnp" + /locus_tag="SPC25A_0028" + /note="member of homology group 39; + old_tribe:0051 6" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1239 transposase" + misc_feature 27815..28249 + /gene="tnp" + /locus_tag="SPC25A_0028" + /note="HMMPfam hit to PF00665, Integrase core domain, + score 1.1e-18" + /pseudo + gene 28371..>28466 + /gene="aliA" + /locus_tag="SPC25A_0029" + CDS 28371..>28466 + /gene="aliA" + /locus_tag="SPC25A_0029" + /codon_start=1 + /transl_table=11 + /protein_id="CAJ84835.1" + /db_xref="UniProtKB/TrEMBL:Q20WL5" + /translation="MMKSSKLFALAGVTLLAATTLAACSGSGSSAK" +ORIGIN + 1 cgaccgtcgc ttcctagttg tggctaactt gtccaatgaa gagcaagact tgacagtaga + 61 aggaaaagtc aaatctgtct tgattgaaaa cactgcggct aaagaagtac ttgaaaaaca + 121 ggtcttggct ccatgggatg ctttctgtgt ggaattacta taaatatttt ttgcagaaaa + 181 atttaaaatt gaaatcatat aaaaacaagg gaggactgta taaaaagcag aaatcctttg + 241 ttttttataa ccaaggttta taaactttca ttctcgaaat tcaattaact ttacaaattc + 301 ccactattaa ggagaaagaa gatgaacata aagaagcgtg tccttagtgc aggtctgact + 361 tttgcatctg ctttgctttt agctgcttgc ggccaatcag gttcagatac aaaaacttac + 421 tcatcaacct ttagtggaaa tccaactaca tttaactatc tattagacta ttacgctgat + 481 aatacattga ttatcaccaa tctagttgat ggtttgcttg aaaatgacaa tcacggaaac + 541 ctagttccat ctttgccaga ggactggtct gtttcgagcg acggtctgac ttatacttac + 601 aaattgagaa aagatgccaa atggttcaca 
gctgacggtg aagagtactc cccagtcaag + 661 gcccaggatt ttgtgacagg tatcaagtac gtagtggata ataaatcaca ggctattgac + 721 ttgattcaaa actcgatcaa aggtttgaat gattatatta caggagcgga ttctgacttt + 781 tctaaggttg ggatgaaggc cattgacaac cagactgttg agtatacttt ggtacgccca + 841 gaaccttact ggaactcaaa aacaaccaac agtattcttt tcccggtaaa ctaagagttt + 901 ctaaattcaa aagggaaaga ttttgggacc ctatctccag atagtattct ctacagcggt + 961 ccttatttgt taaaagattt cacatcaaaa tcatttatcg agtatgtgaa aaacccacat + 1021 tactatgatc atgccaaagt atcgattgaa cacgtgaaat tggcttactt taatggatca + 1081 gatcaagaat tgactatccg taactttgaa agtggagctt attctatcgc tggagtttat + 1141 ccaaatagtt cgaactttgc taagaccaag gagaaatata aggataatat cgtctatagc + 1201 ttgcaggaca agacttcttg gtatttaaat ttcaatgtca atcgcgaggc ttgcaatcac + 1261 actactaaaa cgacagatga gccgaagaag tcaactgaga cagctgtctt gaacaaaaac + 1321 ttccgccaag cagtaaactt tgccttggac cgcacagccc attctgccca gtcaaatggg + 1381 gaagaggcgg ctagcaagac ccttcgtaac accttggtgc tcctacattt gtccaagttg + 1441 gagacaagac ctttggagaa gtagttgctt ctaaattggt caactatggt acagaatgga + 1501 ggtattgact tggcagatgc tcaggatgcc tatttcaaca aagaaaaagc ccaagcaaaa + 1561 tttgcggaag ctaaaaaaga attggcaagt caaggtgtga ctttccctat tcacgtgaat + 1621 gtggcagtag atcagacaag taaaaatgcc gttacaggca tgaactcagt taagcagact + 1681 ctggagtcag ttttaggtgc tgataacatt gttattgatg ttcagcaact ttcaacagat + 1741 gattttaata atgtaccttc ttggcaccga tgccagctga tagaggctat gatttgagct + 1801 ttgatggttg ggtgggtgac tatcaggatc catcaactta tctcaatcct ttcaatgcag + 1861 agaatggctt ctatctcaaa atttttggac cggatgccaa ggaagataag gaaaaaatca + 1921 ctagcctagg tcttgatacc tacactaaga tgctcaaaga tgcagatagt gaaaacaaag + 1981 atgtagccaa acgctatgaa aaatatgctg aagcacaggc ttggatgatt gacaattctc + 2041 tcattatgtc agctatgtca agtggtggca cagcatctgt aaccaaagtg atgccattta + 2101 caagagggca ttaattggtt ggtattaagg gtgatggcaa taactacaag tacatgaaac + 2161 tgcaaaaaga tactgtaaca accaaacggt ttgaaaaagc taagaccaaa tgggagcaag + 2221 aaagcaaaaa agcaatcgaa aaagcccaaa aagaagcaga aaaacatgtt aaatagttat + 
2281 aaatagcttt ttcaaggaga attaaaaaga caaacatcag ttttggtgct tgtcttttta + 2341 aatcactcgg ttattgaaaa ttagacttct tgcgaaacag gctctttgtc aactgtagtg + 2401 ggttgaagaa aagctaagct cgagaaagga caaatttcgt cctttctttt ttgatattca + 2461 gagcgataaa aatccgtttt ttgaagtttt caaagttccg aaaaccaaag gcattgcgct + 2521 tgataagttt gatgagatta ttggtcgctt ccaatttggc gtttgaatag ggtagttgaa + 2581 gggcgttgac gattttctct ttgtccttta gaaaggtttt aaagacagtc tgaaaaatag + 2641 gatgaacctg cttaagattg tcctcaatga gtccgaaaaa tttctcaggg tctttgttct + 2701 gaaagtgaaa aagtaagagt tgatagatct gatagtggtg tttcaagtct tctgaatagc + 2761 ttaaaatctt gtcaagaatt tctttatttg ttaagtgcat gcgaaaagta gggcgataaa + 2821 atcgcttatc actcagttta cggctatcct gttgaatgag tttccagtag cgcttgatag + 2881 ccttgtattc atgggatttt cgatgaaact gattcatgat ttggacatgc acacgactca + 2941 tagcacggct aagatgttgt acaatgtgaa agcgatcaag aacgatttta gcattcggga + 3001 gtgaaacagc ctgggagact gtttcagcct gagcctagaa atttgaaagc gaagctgttt + 3061 agccaagtca tagtaagggc taaacatatc catagtaatg attttgacgc gacatcggac + 3121 ggctctatca tatttaagaa agtgatctcg gatgacagct tgtgttctac cctcaagaac + 3181 agtgatgata tcgagctttt caaaatcttg cgcaataaag ctcatctcca tctcccgatt + 3241 gaaacagtca ctccccggac tgtttcaacg tcccaggaca taatctcagg aagacaagaa + 3301 aaatcatgtt taaagtgaaa atcattgagc tttcgaatga cagttgaagt tgaaatggcc + 3361 agctgatggg caatatcggt catagaattc ttttcaatta acttttgagc aatcttttgg + 3421 ttgatgatac gagggatttg gtgattcttc ttgacgatag aagtttcagc gaccatcatt + 3481 tttgaacagt gatagcactt gaatcgacgc tttctaagga gaattctagt aggcatacca + 3541 gtcgtttcaa gataaggaat tttagaaggt ttttgaaagt catatttctt catttgactt + 3601 ccgcactcag ggcaagatgg ggcgtcgtag tccagtttgg cgatgatttc cttgtgtgta + 3661 tccttattga tgatgtctaa aatctggata ttagggtctt taatgtctag taattttgtg + 3721 ataaaatgta attgttccat atgaatcttt ctaatgagtt gtttgatcgc ttttcatttg + 3781 gccactcttc aatatgtgcg agaatatcgc acttatgaac aaattgcggc tgattttggt + 3841 attcacgaaa gcaacttaat ccgtcggagc caatgggttg aagtaactct tgttcaaagt + 3901 ggttttacga tttcaagaac 
tcctctcagt tctgaggaca cggtaatgat tgatgcgacg + 3961 gaagtaaaaa tcaatcgccc taaaaaaaga attagcaaat tattctggta aaaagaaatg + 4021 ccgcgctatg gaaaaatgat ttgttttgtg ctaaaataga ttgaaactaa tactcaatga + 4081 aaatcaaaga gtaacttgga agttagctca aagtacagct ttaaggtggt agatagaact + 4141 gacgaagtca gctcaaaata ctgttttgag gttgcagatg gacgctgacg tggtttgaag + 4201 agattttcga agagtataag atcctctctt ttgctatagt taaggagatg agaggtaaat + 4261 gataagggag agactatgta cgactatcta atcgttggtg ctggtttgtc gggagcaatt + 4321 tttgcttatg aagcaaccaa gcgtggaaaa aaagtaaaag ttattgataa acgtaaccac + 4381 attggtggaa atatctactg tgagaatata gaaggagtta atgttcataa atatggtgca + 4441 catatcttcc atacttctaa taagaaagtc tgggattatg tgaatcaatt tgctgaattt + 4501 aacaactaca tcaactcgcc tgtagctaat tacaagggta gcctttataa tctacctttc + 4561 aatatgaata ctttctatgc tacgtggggg acaaaaactc ctcaagaagt gaaaaataag + 4621 attgctgagc aaacggctca catgaaagac gttgaaccga aaaacttgga agaacaggct + 4681 atcaagttga tcggtccaga tatttatgaa aagttgatta aaggatatac tgaaaagcaa + 4741 tggggacgtt ccgcgactga ccttccaccg tttatcatca aacgtctacc agttcgtttg + 4801 acttttgata ataactactt taatgaccgt taccaaggta ttccaatcgg tggctataat + 4861 gtcattatcg aaaatatgct gaaaggtgtt gaagtagaac ttggagttga cttttttgcc + 4921 aatcgtcagg aattagaagc ttctgctgaa aaagttgtct ttacagggat gattgaccaa + 4981 tatttcgatt ataaacatgg tgagctagaa taccgtagtc ttcgttttga gcatgaagtt + 5041 ctagataagg aaaattatca aggaaatgcc gttgttaatt atacagaacg agaaattcct + 5101 tatactcgca ttattgagca caaacatttt gagtacggaa cacaagataa aacggttatt + 5161 actcgtgaat acccagctga ttggaaacgt ggagatgaac cttattatcc aatcaatgat + 5221 gagagaaaca atgccatgtt tgctaaatat caagaagaag cagtacagaa tgataaggta + 5281 attttctgtg gacgtttggc tgattataaa tactacgaca tgcatgtggt tattgaacgg + 5341 gctttggaag tggtaaggaa tgagttctca tgagagaaac aggcatatat gaaagttaat + 5401 gtagaggagt tgagcttttt atttgaatat tgggtgaaaa agtagtatac ttagatagtc + 5461 tgtttttaaa aatcaaaatg gggaaatcga ttcttatcaa cttcagagtg aactgaatta + 5521 aaactgcata ggagtatata aaatgctgaa gtaagattta 
cagaacatgg tatgataagt + 5581 gttcgacagc ttgtttggca ggagttcgaa tattcaagta attgagaggg tttttgaact + 5641 tctgataaga tagatagtag attactttcg agtaaaggat agttgagaaa atgaataatc + 5701 gtatagtaga catcagtttg tttgatttat tgaatgtctt atggcttcgt aaatggatca + 5761 ttgtttttgt atcatttgtt tttggatgta tttctttttt atattatcaa ttttttgtac + 5821 ccaaaaccta tacaagtgat actcgtatat atgtggtaag caaaggggat aataaaaatc + 5881 tgtctaatgc agatttgcaa gcaggaagtg ctctaacaaa ggattacaaa gaaatcattt + 5941 tatcagatga agtgttagaa gaaacaattt ctgatttaaa actagaatca actttggaat + 6001 ctctagcttc gaaaattaaa atttctatcc ctgcggaaac tcgaattatt tccattagtg + 6061 ttacaaatac gaactcagat gaagctgctc gaatagcaaa tgggataagg aaggtagctg + 6121 cccttaaaat caaggaagta actcaagtta cagatgtcac cactttacag actgcacgcc + 6181 ctccccaaac tccgtcagga ccgcatgtgc gaaaatctac tacagcaggg cttgttcttg + 6241 gtgcattctt aacagtcttt ctagtagttg ccaaggaaat attagatgat cgcataaaac + 6301 gttttgaaga acttgaaaaa ttgggaatcc ctattttagg ctcaatacct ttatcaaaaa + 6361 atataaagta gaaaatcatg ggaaaattag aactaacacg taagtactat caattgtaca + 6421 atgaaacgaa agaatatttt aatgccttac agaccaatat tcaacttagt ggtgatggac + 6481 tgaaagtcat ttctgttact tccacagtaa aaaacgaagg caaatcgact atatcagttg + 6541 gcttgtccat gtccttggcc ttatcaggct ataaagtcct gttactggat gtggatttac + 6601 gtaattcagt gatgtcagga atgtttcatt ctagggaaag aataacaggt ttgactgaat + 6661 atttatctgg caaagcggga atggcggatt ctatgcagga aactacttta gataatctct + 6721 atatattaca agcaggagtc gtttcaccga atcccttatc tctattaagg agtgttaagt + 6781 ttgaaacctt gatagattct atgaaaaagt actttgacta tattatagta gatactccac + 6841 caatcggcca agtaatagat gctgcaatta ttgcccaaca atgtgatggg atatttttgg + 6901 tcactgaaat gaggaaaacg acacgcagac aaattttttc ttccctccag caattggaac + 6961 aaactggagt tcccgttttg ggccttgtgg ccaataaagc aattataaaa aaagatagct + 7021 atggctatta tggaaaaaac accgcgagcg agactgaaag atattgatgg actacctcct + 7081 ctacctcaca aattgcattt tttgtgaggt agaggagtaa gttgatacta ttatatatta + 7141 gacttcctgc gaaacaaaat atggtatagt agttctatga attatgaagc aagtaaacaa + 7201 
ctaactgatg cacgatttaa gcgtcttgtt ggtgttcagc gtaccacttt tgaagagatg + 7261 ttagctgtat taaaaacagc ttatcaactt aaacacgcaa aaggtggacg aaaacctaaa + 7321 ttaagcctag aagaccttct tatggctact cttcaatatg tgcgagaata cccacttatg + 7381 aagaaattgc ggctgatttt ggtattcacg aaagcaactt actccgtcgg agccaatggg + 7441 ttgaagtaac tcttgttcaa agtggtgtta cgatttcaag aactcctctc agctctgagg + 7501 acacggtaat gattgatgcg acggaagtac aaatcaatcg ccctaaaaaa agaattagcg + 7561 aattattctg ataaaaaaaa tgccacgcta tgaaggctca agcgattgtc acaagtcaag + 7621 ggagaattgt ttctttggat atcgctgtga actatttgtt atgatatgaa gttgttcaaa + 7681 atgagtcgca gaaatatcgg acaagctggt aaaatcttgg ctgacagtgg ttatcaaggg + 7741 ctcatgaaga tatatcctca agcacaaact ccacgtaaat ccagcaaact caagccgcta + 7801 acagctgaag ataaagcctg taaccatgcg ctatccaagg agagaagcat ggttgagaac + 7861 atctttgcca aagtaaaaac gtttaaaatg ttttcaacaa cctatcgaaa tcatcgtaaa + 7921 cgcttcggat tacgaatgaa tttgattgct gctattatca atcatgaact aggattctag + 7981 tttggcagga agtctatttt ggaatgctat tatgtttagt tgtgctcaat gaaaatgaaa + 8041 gaactagtaa gctaggcgca gtcagctcaa aacagtgttt tgaggttgta gatagaactg + 8101 acgaagtcag taacatatat atgacaaacc gatgctgacg tggtttgaag agatttttga + 8161 agagtataag acggtatttt aagggaatga ttactatttg aggtatttta tgagtagaga + 8221 gaaaaaaaga ggaacagcag tccacttgaa atcttatatc aatagtgtgc tgctaatcct + 8281 gtacacagga atagcgagcc tatttctttt tcagatattc cgatacaata ttttaaattt + 8341 taggaatctc aatttattag tagctctgct agtagtattg gtatttattt taggagtgag + 8401 tttgattgtc cgaaaaaaag ctgaaaagtt gacaatgctt ctcctaatct tagctgtcgc + 8461 aagtagttca atatcgcttt tggctgttca acaatttatc ggttttacaa gtcgcttaaa + 8521 tgcaacttca aacgtttcag aatatgctat tagtcttgta gttttgaaag atagcgaaat + 8581 tagtgaacta gaacaagtat cacatgtgat ggcgcctacc gatacagatt atgaagctat + 8641 tcaaagtttg ttagcagata taaaagaaaa gcaaggtaaa gatctaatag tagataaaag + 8701 caaatcttat ttagaagcct ataagagttt gatttcaggt gacaccaagg tgattttttt + 8761 aaatagtatt tttgaacata tgattgagtc ggattttcct gactttagag acaaaattaa + 8821 gaaaatatat acaaaagaaa 
tgacaaagaa agtagaagct ccaaaggttt caaaggggca + 8881 ggcttttact atttatttca gtgggattga tacttatgga ccaattaact ctgtatcacg + 8941 ttcggatgtc aatattttga tgacagtcaa tagcgagacc aaaaaaattc ttttgacaac + 9001 tacacctcgt gactcctatg tcgcaattgc agatggagga aagaatcgaa aagataaatt + 9061 gactcatgct ggaatttatg gtattgattc ttccattcat accttggaac atttatatgg + 9121 tgtagagatt aactactatg ttcgtgtaaa tttcacctct ttcttaaaga tagttgattt + 9181 attgaatggt attgatgtgg acgatagtca agaatttaca attgacggga acgactatcc + 9241 tgttggaaat ctccatctaa attctaagtc agcacttggt ttcgttcgag aacgtcattc + 9301 tctagcagat ggagatcgtg atcgaggacg gaatcaacag aaggtgctcg ctgcaattat + 9361 tcaaaaatta acctcaatag aatcattgaa aaattatcgt caaatcatgc aaggattaga + 9421 ggattcaata caaacaaatc tctctccaac aactatcatg gacttagcca atactcaatt + 9481 ggaaagtgga gggaattata aaataaattc tcaagattta aaagggacag ggcggatgga + 9541 tcttccttct tatgcaatgc ctgatagtca gttgtatatg atggaaattg atgagaatag + 9601 cctctcagct atcaaagaaa atattcaggc tgttctggag ggtaggtaag atgatagatg + 9661 ttcattctca cattattttt gatgtggatg atgggccaaa gtccatagaa gatagtagag + 9721 ctttgttgtt agaagcctat gatcaaggaa ttcggacaat tgtttcaaca tcccaccgcc + 9781 gtcaaggtat gtttgaaaca ccagaagaca agattgcgga aaattttcgt gcggtacaga + 9841 aaatagctag agatattgca gatgatttaa caattttata tggtgcagaa atctactata + 9901 ctcaagacat tatcaataaa cttgaaaaga aaactttccc aactttaaat gggagtcgat + 9961 atgccttgat tgaatttagt agcgagactt cttatcgttc tattcatagc gctcttcagc + 10021 agttgctttt gtcaggaatt accccgctta tcgcccatat cgaacgttat gatgctcttg + 10081 aaaacaataa acaagcagtt ctcgaattga ttcgtatggg ctgttataca cagattaata + 10141 gttcccatct actcaaaaaa aaattattta aagatgatgc aaaaatcatg aagaaacgag + 10201 ttcactattt tttgaaacat gatttagtcc atattgtagc aagtgacatg cataatcttg + 10261 atactagacc gccttatatg gcggaagctt atgaaatcat ttctaaaaga tacggaaaag + 10321 aaaaagctga agaatttttt ataaaaaatc cgcaacgaat cctaatggat caattgattt + 10381 aatgaaaaag gaaacaacaa atgtataaag ttatcaaacg atttatagat atagctttag + 10441 ccttgctagg aattgtatta ttatcaccac 
tatttttagg aattatagtg ttcataaaat + 10501 tagaatctaa agggcctatt ttctttaaac aaaaaagaat tgggctacat aaaaaagaat + 10561 tttacattct aaaatttaga acgatgagaa ttgacactcc ttcagctgtc cctacacatc + 10621 ttttaaaaaa tccttatcaa tggattacaa aggttggtaa agtcttacgt agaacctctc + 10681 tggatgaatt gccacagatt tggaatattt tggtcggtca catgtcgctt gtaggaccaa + 10741 gacctgccct ttggaatcaa tttgatttga ttgaagaaag agacaaatat ggagcaaatg + 10801 atattttacc tggtttaaca ggttgggcac aaatcaatgg aagagatgaa ttatctattc + 10861 cagtcaaagc caaatttgat ggctactatg tgaagaactg ttcatttgtt ttagattgtc + 10921 gatgtgttgt agaaagtttt ttagtagtat ttaagagata tgggcatcga gaaggtggtg + 10981 cagattagag gaactgatat atgggaaatc gtaaaaaagt ttttgtagta gccaatgtag + 11041 tcaaagaaca tattctaaaa tttcacattc cgactatcaa agaaatgaca aaaagagggt + 11101 ggacggtaga cgtaggtgct tctggggatg aaacagttcc ctattgtcac caacaatatt + 11161 cactgcccca ccaacgttct ccgtttcatc taggcactct caaaagtatc tggaaattga + 11221 gaaaaatttt gaagtctgga ggctatgata ttgtttactg tcatactcct gttggaggtt + 11281 tggtgggacg actggcttct ttaggattgc gaaaacaagg aacaagagtc atttattttg + 11341 ctcatggata tcatttttac aaaggagcaa cttttttcaa ttggttagtg tattacccaa + 11401 ttgaaaagct actgtccctt tttacagata gtatcattct aatcaatcaa gaagattatc + 11461 atctcacaaa aacaaaattt aaacaggttc aatcctatct agtgagtgga atgggagtaa + 11521 aacaagaacg gttttcaccc caatcaaatc aagttagaga acgttatcgt aaagaattga + 11581 aactgcctga ggatgcgact gttttaattt attgtgctga gctaataaaa aataaaaatc + 11641 aaacattttt acttcatgct atgaaaaagc ttgtggatca gggagagaat ctttattgct + 11701 tattagtagg aattgattat accaagggtg aaatggtaga atgtattcaa tccttgaatt + 11761 tatccgatcg agttttactt ttagggtgga gagaagatat tgccaatctt tacgcttgtt + 11821 ctgatatatg tgttgcaaca agtattcgag aaggatttgg attaaatata gtggaagcaa + 11881 tgttttgtca cgttccagtt gttgcgacca tcaatagagg acacgccagt attatacaag + 11941 atggacaaaa cggtctatta gtccaattag gaaatacaaa gcaattagta gaggctattt + 12001 atgtactaat gaaggatact aagaagaagc aagaattagt ggagcaagct agtgcgaatt + 12061 tagaacaata tcatagtcag aaaattgtaa 
atagcttact agaaataata gaacagactg + 12121 caatgaagtg agtgaaggat gtgaaaaagt gaaaatacaa attgataaaa tatactatct + 12181 atttttttgg ctggtagttt cctttggata tttttttatg atgccaacct ttacagaaga + 12241 tttagaaggc gttgtcagtg ctagtttagt acaattgtta ttatttatta taggatatgt + 12301 atatgtatct tatttaaatc gttcttttat ctcactgtat agtatcttta tgattgtgtt + 12361 ttaccttttt caaaatggac aggtattgtt atattcactt ggagtagagt atgattactt + 12421 ttatgtttta agatatgatg aaaccatcgt actacaatca gttatttttt caacacaatg + 12481 tcttattgca gcctttatgg ctggagtctt ttctacgaag aaagaggtat caaaacccct + 12541 ttattcttat atggatcaat tagaacgaga aaaactgatt actgctggaa agttattttg + 12601 gggtgcgttt gcgatttttg ctttaccctt tatgatgatg aagtttgtta tcaccagtac + 12661 atctgggtat tttgcgatga tacgtttcgt tggaagccta cctacaataa cagtgttatt + 12721 tgaaaaaatg ttcattgctt caagtgtttt tttggttgtt tatttaaaat ctgaggaaac + 12781 ttggagcaag tttttaaaag ttgttatctt aggttggagt ataatggctg ctttaacagg + 12841 agatagaacc gtaggtttag cagggattgt tacgttagct ttaattcaaa cattaattgg + 12901 taatcgtaaa aaaaagatta agttttctca gtatgccttg ttagttgggg cagctgttgt + 12961 agtgatgtat ttaatgtcct ttgcttttca atttaggatg caacaagatt ctaaagtttc + 13021 aggactacaa actgcggtag tagaaatgat aggaactcta gggtttagtt ttttcccact + 13081 cgtattaacg attagaattg ttccaacttc tattaacttt tttagaggaa aatcatatat + 13141 tgcagccatc attacaggac taattccatc taattttgat tttttacatt taacaaagac + 13201 attatcagaa tggaatgcat atccaacgga attattagat acaatctatc attatggttt + 13261 cggattagat tattctttaa ttgcggaagc ctatattaat tttggttctt atggatggat + 13321 agcgattttt ttcctttgtt ctctaatagc ttattttgta agagatgtgg attttaaaag + 13381 gaaggacaac ttattctcac aatatgctag cttgattttg ctgtattcat ggtttaccct + 13441 tccaagaaga aaatcttatt ttatttttaa taattttttt tggtatgtat tattttttgg + 13501 actagcactc atacttgtct ctcgttctat taaacaacga aaggaattta aaaaatgaaa + 13561 atttcaatta ttatgggcat tcataatggt gaaaagcgct ttgaaacagc tgttcaaagt + 13621 attttcaatc aaacttatga taattgggaa tttattattt gtgatgatgc ttccacagat + 13681 aaaacgtttg aaaagttaca aggattatat 
ggacaggatt cacgttttat cttattaaaa + 13741 aatgaaaaaa atgtaggtct ttccgcgaca ttaaaccgtt gcattgaagc aagtagtgga + 13801 gaatttattg ctagaatgga tgatgatgat atttgttatc ccgagcgctt tgaaagacaa + 13861 gtcgactatt tgttccatca tccagagatt gattttgttt cttcatctat tgatattttt + 13921 gatggagaag tagttgtagg tacacggatt ttacttgatt ttcctagtaa aaaggatttg + 13981 atttggaata gcccctttgt tcatcctgtt accatgtttc gtagagatgc cttgcttgaa + 14041 gttggcggtt atagagtttc tccagaaact gttcgtgggc aagattatga tttgtttatg + 14101 agactatatt cacgcgagaa aaaaggtgga aatattttag aaccactatt tcgctatacg + 14161 attgatcaaa atacgatgaa gcgacgtacg tttaaagctc gaattgggga aatgattatt + 14221 cgctataaag gttatcgtgc gatgaaagtt ccattttata attatgtttt tatatttaaa + 14281 ccattagtag ctcatctagt aacactcgtt aaaaggagat aatgtttatg aaaattttaa + 14341 taaccactca tacttatctt cctaataaag atggtgttca atttgttaat caatatttag + 14401 cagaaggatt ggttaaaaag ggtcatcaag taacagtgct gacctattgt tatccatcac + 14461 gtacaagggt acctagagaa gtgataaatg gtgttagagt cattcgttgg aatgctcgaa + 14521 caagctgtac tttccataaa ggagaaaaat tagcttatca aaatttcatc ttaaattccc + 14581 aatcggatta tgatgtttta gtgaatgttg ggacacagac tgctttaaca gattggttat + 14641 ttccgatatt ttctcagata acaattccaa aagtcttata tattcattcg atatgggatt + 14701 tcaactggct gcattggcat agacaatcat tcaagcgatt tgttgctaaa acttgggcaa + 14761 atgtacgctg gaaatattat tattggaaac agactgttat ctttaaacaa tataatgaag + 14821 taattcagct acacccaaaa gattatagtg tggctttctt taaagaaaaa tatgatatag + 14881 aaagtcagat tttaggaaat gccgctgatg cttccttttt tcaaaataaa aacgctatca + 14941 aaaagcaatc ttacattgta aatgtttcta attttaatga tctaaaaaat caaaagaaag + 15001 cggttgagta ttttttgaaa agcaatcttt caagtgagtg gaagttcgtt ttagttggtt + 15061 cagaaaagaa tgattattta caaagcgtac aagattttga aaaagaactc cgaaaccaat + 15121 taggtatcac ttctggtaaa gaaatagagt atcgcatcgg attgtcaaga gaagaagttg + 15181 taaaaactgt aaaagaagcc tctttttgtt tactgacgag tatacgggaa gcttttccaa + 15241 tttcattaat tgaagtaatg gcagcaggaa ttccttttat ctcttctgat gtaggaattg + 15301 tcaactattt gtctggagga atcactgctt 
gtagtgatca agaatttata agagctattg + 15361 aagagtttgc tacttatccc gaggtcagaa atcaatatgg caaaaagggg caaatggaag + 15421 cgaaagaaca ttatcaagta gatgataaag tgaaagagtt tgaaactttg ttacaaaagt + 15481 tcgtaaagga agaagaagat tgaaaaaaat agtatttttg tgtccctatt ttgggacttt + 15541 accaccccat acgcagttat ggttgaattc ttgtaaaatg aatccgtctg taacatggta + 15601 tctatttaca gatgacaaga ggacatttga ttatccggaa aatgtgcaag ttttctatac + 15661 tactttggaa gaaacaaagg cgttgtatca aagaaaattt gactttgaga tttctttaga + 15721 gggtgcttat aaactaggag attataagcc tttattcggc tatctttatg aggaaatgat + 15781 acaagagttt gatgcttggg gacatattga tgtttatgat gaaatctatg gagatattcg + 15841 tgcatttgta acagatgagt tattagataa atacgataaa ttgatgtttt ttggacatat + 15901 gggtatttat agaaattctc ctgaagttaa tcgcagattt aaattatcgt ctgatttgga + 15961 tcgtacttat caagaaatat tttcttcatc acaattttat aattttgaag aatatgttgc + 16021 aggaagtatc actcgtgttt atcaaaaaaa tggattccca ataggaagat tagataaagt + 16081 gattgcagat ctttctggtt taagttatca tttccgacgt gggtattatt cagatgattt + 16141 tgagacattt acctatttac caaatctacc tatgattttt tcttgggaag atggaaaaac + 16201 ttattgttat tcggtacaaa acaatcaagt gcaaaaaaat gagttcttgt atgtacactt + 16261 taagcgtaga aaaatgattc agtctatttc aaatgatgtt tctgcttatt taatcgttcc + 16321 aaatggtttt gttgagatgc ctaaagagat aactgttgat ttgattcaaa aatatagtca + 16381 gaaaaaatta ttttatccag tctattttca ggaaaagtgg aaaggtgtca aacgattatt + 16441 gaagaaaata gggaggtcag aatgaaggac attttaaaaa agttgataca acaattaccg + 16501 gataaactat ttctacaaat taaatactac tacgttttta aaaaagaaat taaatttaca + 16561 gaatcctaaa acctttaata aaaaaacaca atgattaaaa ttatataatc ggaaaccttt + 16621 ttatacaatt ttagcggata aaattttagt gaagaactat attgcccata tacttgggga + 16681 agaaaatatt attccgactc tgggtgttta taatcgtttt gatgagattc attttgtttc + 16741 gcaggaagtc tattgaagaa tttgtaacag atgagtcgaa acgagaatta aaggaatata + 16801 agattgtttt ctttatactg ttcctaagtt ttttcaatta gattataacc gctttacaaa + 16861 tcataagaga aatatttatg ataccaacta gaatcagcag gactttattt atgcttaccc + 16921 atcaagtaaa gataagataa tagatagtcc 
cgctggactt actgcaatac tcgagtttgc + 16981 gagtaaatta tcaaaagata ttccattttt gaggtgcgat ttttatattg tgaatgataa + 17041 aatattattt gaagagatta cgttttttcc agaatcaggt tttggaaaat ttagtccaga + 17101 gcattataat ttagagtttg gaaaggatat tactttactg gagaagcaag atggaaacaa + 17161 aagaaaaacg tttagtgaat aatacgatta tttttacaat tggaagttta ggttcaaaat + 17221 ttatacagtt tttgttagta cctttatata cctatacttt aacagctgct cagtttggga + 17281 ttaccgaaat tttattaacc gctgtgaatc ttttaatacc tgtattttct atttccattg + 17341 ctgatggatt attaagattt ggattagata agaccttaag aagagaaaat gtcttgaaat + 17401 cagcttttat catttcgata cttgggacta ttttatccat tatttcgatt ccaatttttt + 17461 cgctctatcc tactttgtca gagtggatgg tttattttat catcattttg aacttgagaa + 17521 tgtatcggga tgtttttgcg attcaattga aagttgaagg gaaaaataca ttatttgctt + 17581 gcgatagtat gatttataca tttgttttat ctttagcgag tattgtcttt ctagttcctt + 17641 tttctttagg catttcaggt tattttttcg cttatattgt cagtaatgga atttccattt + 17701 tctttatctt atttttcgga ggagtctgga aaagttttac tagcggaaga tttgaaaaac + 17761 aattgatgat acaactattg aaatattcag cacccatgat tttaaatggt attgcatggt + 17821 ggattacaaa tgcctcagat cggtttatgt tgcaatggtt tatggatgat agagcggtag + 17881 gtttgtatgg tgttgttgca aagttaccct tattaatcgg aacgtttact ggagtattta + 17941 atcaggcatg gattatttca gcagtagaag agtttgaaga agaaaatgaa gaatggtttt + 18001 atcaaaaagt ttttcaccaa tattatgcag cactcttttt aagtgtttca gtatttttgc + 18061 ttctacttca accatttatg aaagtatatg ttagtccaag cttttatgaa gcatggcaat + 18121 atgctccgtt tttattattg tcaagtgtag tttcaggaat cgccgcattt atgacaggtt + 18181 tttatgttgc gcaaaagaaa aatttgaata ttatatacac gacgattgct ggtgcttttg + 18241 cgaatatttt gttaaatgcg atgtttattc ctatgcttgg agtattaggc gcttccattg + 18301 cgacctttct atcatggttt gttattgcaa tctatcgtat gaaagatgtt gaaaactttg + 18361 cttgttttcc attagataaa aaagtttttt ggtatttatt tctattatgt attcagacca + 18421 ttacgatgac ttttctgcca atccttggca ttgttttttc agtcgtattg attccttatt + 18481 tcttttacca agaacaggaa tttctagcag ttttatttga taaaggaagg aaaaaagtat + 18541 gttcattcaa aaaatcaaaa agataataag 
agtattttta aggaaatctt tagtaaaaga + 18601 ttatcgacaa agaattcaaa ataaagagtt tactcttatt acttctaatt gtgtgggtgg + 18661 actgattagt catgatttgg gtctacaatt tcgttctccc actatcaata tgtatataga + 18721 agcagcagac tttattcagt tttgttcaca tttagaacgc tatttaaaag aagacttatc + 18781 ttttattgaa gtaaatcaag atggacattt tgtagctctt tgtggggata taaaaattta + 18841 tattgttcat tataatagct ttgaagagtt tgctaaaaaa tggtctgaac gtgccaaaag + 18901 agtagatttt gatcaattat atcttatgat gtctgaacga gatggctgtc gttatgaaga + 18961 tattgtgaag tttgatacgt taccctataa gaataaagta atttttacaa gtaaaaagat + 19021 gccagaaatt caatccgctt tttatatacc aggtattgaa acaaaaaata atcaaaaaca + 19081 taaggtgaaa tcagtaacaa cttatcttaa ctcctttaca ggaaaacgat atatagattt + 19141 attcgacttt gtagagtttt tgaatacagg aaggaaacaa ttaagtaagt atgaaaagta + 19201 agataatatt aaaaaataaa acaattcttg ttacaggagc agctggcttt attggtgcta + 19261 atcttgtcat gagtttatta caagaagaaa atccattaca gattattgga atagataatt + 19321 tgaatgatta ttatgatgtt tctttaaaag agtatcgttt atcaacaatt caagaggagt + 19381 gtcaatcatc tttaaataaa aaatgggtat ttatcaaagg agatattgct gattctgatt + 19441 tgatggaaga aatttttgag acgtatagac ctcaaattgt agtgaatttg gcagcacaag + 19501 caggtgttcg ttattctatc actaatcctg atgtttatat gaaaagtaat atcattggat + 19561 ttcatactat tcttgaaaaa tgtagaaagt atcaagaaaa tattgaacat ttagtttatg + 19621 catcatcctc ttctgtttat ggtggaaata caaaaattcc tttttctgaa ttagatgcag + 19681 tagacaatcc tgtttcttta tatgcagtta cgaagaaaac aaatgaatta gaagcacatg + 19741 cgtattcaaa attgtacaat attccaacaa caggcctgag attttttaca gtttatggac + 19801 cagctggaag acctgatatg gcttatttta gttttacaaa gcaattaatt gataaaaagc + 19861 caattgaaat tttcaattat gggaattgtc aacgtgattt tacttatatt gacgatattg + 19921 ttgaaggcgt taaaagagtg atgactggag ctcctcaaaa agaaattgga gaagatgggt + 19981 taccaattcc tccttatgct atctataata ttggaaatca ccaaccagaa aatttattga + 20041 attttgtcga aatcttgcaa gaaaaattga tagctgcttc tattttacca gaagattatg + 20101 atttctcatc tgctcagaaa cttgttccaa tgcaagctgg tgatgtagtt gcaacctatg + 20161 cagatataag tctattggag aaggatttta 
atttcaaacc taagactagt cttagaaatg + 20221 gcttgagaaa ttttgcagaa tggtatagaa atttttatca aaggggtgaa tagaatgaaa + 20281 attactgtag taggaatggg atatgtcgga ttgtccttgg cggtattatt agcgcaacat + 20341 catgaagtaa cagcgttaga tattattgat aaaaaaattc aactcatcaa tgagaaaaaa + 20401 tctccaattc aagatgagta tattgaacaa tactttttag aaaaaaatct tcatttaagc + 20461 gcaacaacaa acgaagtaga ggcgtataaa gatgcggaaa tgattattat agctgctcct + 20521 acagattatg atacacacaa aaatttcttt gatacatctg ccgtagaaca agtaatcgaa + 20581 aatattattt ctatgaataa cgaggcttta attgtcatta aatcaactgt tcctgttggc + 20641 tatacggagt cgattcgaga aaaatatggt aaaaagaata tactgtttag cccagaattt + 20701 cttcgtgaag caaatggatt gtatgataat ctttatccta atcgaattat cgtaggtaca + 20761 gatttgaatg atggagcatt agtttctaaa gcacatgaat ttgtgtcttt attacaagaa + 20821 ggtgctctca aagagaatat tgatacttta atcatgggat tttctgaagc agaagctgtg + 20881 aaattatttt ccaatgctta tctggcttta agagtgtctt attttaatga gttggatact + 20941 tatgctgaac tgaaaggatt gaatacgaaa gccattattg atggagtagg attggatcct + 21001 agaattggtc agttttataa caatccatcc tttggttatg gtggttactg tttaccaaag + 21061 gatagtaagc aactgttgtc aaattatcat gatgttcctg aaaatattat ttcagcaatt + 21121 gtttctagta atgaaactcg taaaaaattt attgcagaac gtattcttga aatagtcgga + 21181 gctaatcata ttgatgaata ctataatttg aagcaggaaa tcgttgtagg tatttatcgt + 21241 ttagtcatga aaaaaggttc ggataatttt agacattctt ctatccaagg aattataaag + 21301 agactaaaag cgaatggagt gacattaatg atctatgaac cttcacttcc agatggacaa + 21361 ttattttttg gaagtgaagt tgttcatgat tttccaaaat ttaaagaaaa aagccacctt + 21421 attgtagcca atcgttttga tgaaacatta atggatgtaa aggataaagt atatacaagg + 21481 gatttgtttg gaagagatta agggagatag gttttgaaca agttctattc ccaaaaaatc + 21541 acaccgttac tatcttcgaa taaattaaaa gcaaagcaag tgattgatag aaaatcggct + 21601 ctttgtcaac tgtagtgggt tgaagtcagc taagctcgag aaaggacaaa ttttgtcctt + 21661 tcttttttga tattcagagc gataaaaatc cgttttttga agttttcaaa gttccgaaaa + 21721 ccaaaggcat tgcgcttgat aagtttgatg agattattgg tcgcttccaa tttggcgttt + 21781 gaatagggta gttgaagggc gttgacgatt 
ttctctttgt cctttagaaa ggttttaaag + 21841 acagtctgaa aaagaggatg aacctgctta agattgtcct caataagtcc gaaaaatttc + 21901 tctggttcct tattctgaaa gtgaaacagc aagagttgat agagctgata gtgatgtttc + 21961 aagtcttgtg aatagctcaa aagcttgtct aaaatctctt tattggttaa atgcatacga + 22021 aaagtagggc gataaaaatg tttatcgctg agtttacgac tatcctgttg tatgagcttc + 22081 cagtagcgct tgatagcctt gtattcatga gactatcgat ccaattgatt catgatttga + 22141 acacgcacac gactcatagc acgactaaga tgttgtacaa tgtgaaagcg atcaagaacg + 22201 attttagcat tcgggagtga aacagtctgg gagactgttt cagcctgagc ctagaaattt + 22261 gaaagcgagg ctgtttagct aagtcatagt aaggactaaa catatccata gtaataattt + 22321 tgacgcgaca tcggacaact ctatcgtagc gaagaaagtg atttcgaatg atagcttgtg + 22381 ttctaccctc aagaacagtg atgatatcga gcttttcaaa atcttgcgca atgaagctca + 22441 tctccatctc ccgattgaaa cagtcactcc ccggactgtt tcaacgtccc aagacataat + 22501 ctcaggaaga cgcgaaaaat catgtttaaa gtgaaaatca ttgagcttac gaataacagt + 22561 tgaagttgag atggaaagct gatgggcaat atcagtcata gaaatctttt caattaactt + 22621 ttgagcaatc ttttggttga tgatacgagg gatttggtga ttcttcttga cgatagaagt + 22681 ttcagcgacc atcatttttg aacagtgata gcacttgaat cgacgctttc taaggagaat + 22741 tctagtaggc ataccagtcg tttcaagata aggaatttta gaaggttttt gaaagtcata + 22801 tttcttcatt tgacttccgc actcagggca agatggggcg tcgtagtcca gtttggcgat + 22861 gatttccttg tgtgtatcct tattgatgat gtctaaaatc tggatattag ggtctttaat + 22921 gtctagtaat tttgtgataa aatgtaattg ttccatatga atctttctaa tgagttgttt + 22981 gatcgctttt cattatagac cttatgggac tttttttcta cacaaaaata ggctccataa + 23041 tatccatagg gaatttaccc actacaaata ttatagagcc agaaaatcac ctgctttttg + 23101 tatcaatgtt ttttcacaaa atctaaaata taatggattg aatttggaat agaacactat + 23161 ggtttctaaa gcattgttag aaattatagt caattgaaac aagagcagga caaaagagcc + 23221 tcgtaaaagg tattgcaact tggtaatacc tttttgatgt acgacgggca tgtcgtatat + 23281 ctgaggtgta agtcctcggt gggcacctgc taccggtgaa cccaatagcg attcccaagc + 23341 ctgactatcg tgaggtagca gggagaggaa gggatagcga aatcgtggct ctacgaacag + 23401 gaacgtgata gtaaggcgta tatagcggat 
aaggaggttt caaactctaa agtccaaaaa + 23461 ggtagtcgta acctatatgt gtaaatcacg agagtaattg aattcggact aaggtttgtg + 23521 tgaaaaagat aaatctttct agagtctaaa gactctgcgt cagatttcct attttcactg + 23581 taacctttta acgtcctcat atcttgtata aacgaggaaa gatgtacaac ttatcccgtg + 23641 aggtttcatg ggcgctgaaa gcgtagtaac aacgaatcat gagaagtcag ccgagcccat + 23701 agtagtgagg aaacttctgt agtggaagtg gagcgaaggg gtgaatactc aaacagtctg + 23761 gggagagact gtttgaggtc tgtcgctaga aagagaaaac gacagatcga agtaatccta + 23821 cttcacttgt gtctgtaaaa tgagtggtct gatagaactg gactttgaca cgtaatgact + 23881 agatgaaggt tcaccaatat aagatgtccc tcaggcacca aaacaagaaa ggaatacgca + 23941 catgtcaaaa ctgctagata agatattatc acgcgaaaat atgctggaag cctacaatca + 24001 agtaaaatcc aataaaggct cagctgggat tgatggaatg actatcgaag agatggataa + 24061 ttatctcaga caaaactggc gcttgactaa ggaactgata aaacagagaa aatataagcc + 24121 tcaaccagtt cttaaagttg agatacctaa accagacgga ggcatccgtc aactaggaat + 24181 tccaacagtt atggatagaa tgattcaaca ggccattgtc caagtcatga gccccatttg + 24241 tgaaccccat ttctcagata cgagttatga tttcagacca aataggtcat gtgaaaaagc + 24301 catcatgaag ctcttagaat acttaaatga cggctatgag tggatagtgg atatagacct + 24361 agagaaattt ttcgatacag ttcctcaaga tagattgatg tccttagtac ataacattat + 24421 cgaagacgga gatacggaat ccttgattcg taagtatctt cattcaggtg ttatcattaa + 24481 tggtcaacgt tataaaacac tagttggtac accacaggga ggaaatttat ctcctctctt + 24541 atctaatatc atgcttaatg aattggacaa ggaattagaa aagaggggac ttcgatttgt + 24601 gcgctacgca gatgattgtg tgattacggt cggaagcgag gcagcctcta agcgtgtgat + 24661 gtattcagtc agtcgtttta ttgagaaacg gctaggtttg aaagtaaaca tgaccaagac + 24721 taagattacc agaccaagag agttgaaata tctaggtttt gggttctgga aatcatcaga + 24781 tggttggaaa agccgtccac atcaagatag tgttcggaga tttaagttta aattgaagaa + 24841 actaacacag aggaaatgga gtatagacct aacaagacgt attgagcaac tgaatttgtc + 24901 tattcgagga tggataaact atttctcatt gggaaatatg aaaagtatag tcgccagcat + 24961 agatgagcgc ttgcgtactc gcctacgagt gattatctgg aagcaatgga agaagaaatc + 25021 gagacgatta tggggattgc ttaagttagg 
agttcctaaa tggatagcag ataaggtatc + 25081 tggctggggc gaccattatc aattagtagc tcagaagtcg gtacttaaac gtgctatatc + 25141 aaaaccagtc ctggaaaaac gtggactggt ttcgtgtttg gattattacc ttgaacgaca + 25201 tgcgttaaaa gttagttgaa ccgccgtatg ccgaacggca cgtacggtgg tgtgagaggg + 25261 gctagagatt atcccctact ctatgtgctt tttgatatga gcccatgttt tctcaatagg + 25321 attgtactca ggtgagtagg gaggaagagg taaaagttta tgcccaaact ctttgcataa + 25381 aagttctagc ttccccattc tatggaatct tgcattatcc ataataataa ccgatggtgt + 25441 ggttaatgtt ggtaagagaa acttctgaaa ccaagcttca aaaaagtcgc tcgtcatcat + 25501 ctcttcgtaa gtcattggag cgattaactc accatttgtt agacctgcaa ccaaagaaat + 25561 cctctgatat cttcttccag atactttgcc tcttcttaac tgacctttta atgagcgact + 25621 atattctcga taaaaataag tatcgaatcc tgtttcatca atctaaacag gtgataggtg + 25681 ctttaaacta ttaaaattct taagaaataa ggctactttt tctgggtctt gttcatagta + 25741 ggtgtggttc tttttttcga gtgtagtcca tagctttgag cgcatagtgg atggtagttg + 25801 gatgacagcc aaattcagaa gctatttcag tcaaataagc gtctggattg tcagtaagat + 25861 agtttttaag tctatctcta tcaacttttc ttggttttgt tccttttact tggtggttta + 25921 gctctcctgt tttctctttt agctttaacc agccataaat agtattacgt gagatttgga + 25981 aaacgtgtga tgcttctgtt atactacctg ttcgctcaca ataagagaga acttttttac + 26041 gaaaatctat tgaatatgcc ataagaagat tataccacat tgtgtactat ttttggttca + 26101 ttttactata atttaaaatt ccctcatcga tttgttcaca ttctattgca atcaactgta + 26161 aatatgcttt tcagaatata tcaaatataa caaatataac aaataactaa aagttctata + 26221 atagactccc tgcgaaacaa aatatggtat agtagttcta tgaatgatga agcaagtaaa + 26281 caactaaccg atgcacgatt taagcgtctt gttggtgttc agcgtaccac ttttgaagag + 26341 atgttagctg tattaaaaac agcttatcaa cttaaacacg caaaaggtgg acgaaaacct + 26401 aaattaagcc tagaagacct tcttatggcc actcttcaat agtgcgagaa tatcgaactt + 26461 atgaagaaat tgcggctgat tttggtattc acgaaagcaa cttaatccgt cggagccaat + 26521 gggttgaagt aactcttgtt caaagtggtt ttacgatttc aagaacttct ctcagttctg + 26581 aggacacggt aatgattgat gcgacagaag taaaaatcaa tcgccctaaa aaaagaatta + 26641 gcgaattatt ctggtaaaaa gaaatgccac 
gctatgaagt ctcaggcgat tgtcacaagt + 26701 caagggagaa ttgtttcttt ggatatcact gtgaactatt gtcatgatat gaagttgttc + 26761 aaaatgagtt gcagaaatat cggacaagct ggtaaaatct tggccgacag tggttatcaa + 26821 gggctcatga agatatatcc tcaagcacaa actccacgta aatccagcaa actcaagccg + 26881 ctaacagctg aagataaagc ctgtaaccat gcgctatcta aggagagaag caaggttgag + 26941 aacatctttg ccaaagcata gtatattgaa actagaatag tacacctcta cttctaaaac + 27001 attgttagaa atcgatttga ctgccctgat cgattcgtcc tattcttgtt tcattttgat + 27061 ataaaaacgt ttaaaatgtt ttcaacaact tatcgaaatc atcgtaaacg cttcggatta + 27121 cgaatgaatt tgattgctgc tattatcaat catgaactag gattctagtt ttgcaggaag + 27181 tttaatgaag ttagccaccc agccctccta aaaattagat ggttcagcta gctgaaagct + 27241 cttgtaggca taagaaaaca cctctgtgtt atacttgttg ttcaaccaca aacacaagaa + 27301 aggcacagaa atgcaagaca attatactac aaaaggtaaa catttgacaa tcgatagccg + 27361 tcgcttaatc gaaagatgga aaaaagaagg aaaatcaaat agagaaattg cctctctact + 27421 tggaaaagct cctcaaacta tccacactga aatcaagcgt aggacagtcc gaaaatgtct + 27481 tggaaaaggg cgcttcaaag aggtttattc tgccgactat gctcaacagt cttatgaaaa + 27541 taatcgcaag cactcggtca agagatcaag cgtgaccaag gaactaaagg aaaagattct + 27601 ccactatcat aaccaaaaat ttttgcctga aatgatggtt atggctaaag gggttaacgt + 27661 gggaatttca accatttact attggattca tcatggaaaa ttgggattaa gcaaatagga + 27721 tctgctttac cctagaaaag gaaaagcgct taagaaacag gctagcacca actttaaacc + 27781 tgctggtcaa tccatcgaac agcggcctga agctatcaat cttcgcttgg agaatgggca + 27841 ttatgagatt gatacggttc tacttacgag atcgaaaaac tactgcttgc ttgtcttgac + 27901 ggatcgaaag agtagacatc agatcatccg attgattcca aataaaagtg ctgaggtggt + 27961 caatcaggct ctaaaactca tcttaaaaca acacaagatt ctttccatca cggcagataa + 28021 tggaacggaa ttcaatcgct tgtttgatat attttctgag gagcacatct attatgcgca + 28081 cccctatgcc tcttgggaaa ggggaactaa tgagaatcac aacaggctca ttcgtagata + 28141 gttacctaag ggaaccaaga aaatgactcc caaagaagtc gcattcatcg aaaagtggat + 28201 taacaactat cctaaaaaat gcttggacta caagtcaccc agagaagact tctggatggc + 28261 taacttgaac ttgaaattta gctataacaa 
ataactctta aaattctgaa aattctgttg + 28321 acaactttct gaaaagagtc tataatggag agaaagtttt aaaggagaaa atgatgaaaa + 28381 gttcaaaact atttgccctt gctggcgtga cattattggc ggcgactact ttagctgcat + 28441 gctctggatc aggttcaagc gctaaa +// + diff --git a/public/res/serotype_genbank/serotype_25F.gb b/public/res/serotype_genbank/serotype_25F.gb new file mode 100644 index 0000000..22751bc --- /dev/null +++ b/public/res/serotype_genbank/serotype_25F.gb @@ -0,0 +1,1145 @@ +LOCUS CR931690 28389 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 601/62 (serotype 25f). +ACCESSION CR931690 +VERSION CR931690.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 28389) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 28389) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..28389 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="601/62" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC25F_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC25F_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI33971.1" + /db_xref="GOA:Q4K1T1" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K1T1" + /translation="SNEEQDLTVEGKVKSVLIENTAAKEVLEKQVLAPWDAFCVELL" + gene order(293..1723,1759..2244) + /gene="aliB" + /locus_tag="SPC25F_0002" + /pseudo + CDS join(293..1723,1759..2244) + /gene="aliB" + /locus_tag="SPC25F_0002" + /note="member of homology group 169" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + misc_feature join(509..1723,1759..1842) + /gene="aliB" + /locus_tag="SPC25F_0002" + /note="HMMPfam hit to PF00496, Bacterial extracellular + solute-binding prot, score 4.5e-36" + /pseudo + gene complement(order(2388..2969,3023..3711)) + /gene="tnp" + /locus_tag="SPC25F_0003" + /pseudo + CDS complement(join(2388..2969,3023..3196,3196..3711)) + /gene="tnp" + /locus_tag="SPC25F_0003" + /note="member of homology group 13" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1167 transposase" + misc_feature complement(join(2889..2969,3023..3196,3196..3219)) + /gene="tnp" + /locus_tag="SPC25F_0003" + /note="HMMPfam hit to PF01610, Transposase, score 2.3e-31" + /pseudo + gene 3749..3970 + /gene="tnp" + /locus_tag="SPC25F_0004" + /pseudo + CDS 3749..3970 + /gene="tnp" + /locus_tag="SPC25F_0004" + /note="Lone member of homology group 0248" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1381 transposase (fragment)" + gene 4247..5344 + /gene="glf" + /locus_tag="SPC25F_0005" + CDS 4247..5344 + /gene="glf" + /locus_tag="SPC25F_0005" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + 
/product="UDP-galactopyranose mutase Glf" + /protein_id="CAI33975.1" + /db_xref="GOA:Q4JZ57" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR006076" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JZ57" + /translation="MYDYLIVGAGLSGAIFAYEATKRGKKVKVIDKRNHIGGNIYCEN + IEGVNVHKYGAHIFHTSNKKVWDYVNQFAEFNNYINSPVANYKGSLYNLPFNMNTFYA + MWGTKTPQEVKNKIAEQTAHMKDVEPKNLEEQAIKLIGPDIYEKLIKGYTEKQWGRSA + TDLPPFIIKRLPVRLTFDNNYFNDRYQGIPIGGYNVIIENMLKDVEVELGVDFFANRQ + ELEASAEKVVFTGMIDQYFDYKHGELEYRSLRFEHEVLDKENYQGNAVVNYTEREIPY + TRIIEHKHFEYGTQDKTVITREYPADWKRGDEPYYPINDERNNAMFAKYQEEAVQNDK + VIFCGRLADYKYYDMHVVIERALEVVRNEFS" + misc_feature 4682..5284 + /gene="glf" + /locus_tag="SPC25F_0005" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 1.1e-135" + gene 5662..6342 + /gene="wzd" + /locus_tag="SPC25F_0006" + CDS 5662..6342 + /gene="wzd" + /locus_tag="SPC25F_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33976.1" + /db_xref="GOA:Q4JZ56" + /db_xref="InterPro:IPR003856" + /db_xref="UniProtKB/TrEMBL:Q4JZ56" + /translation="MNNRIVDISLFDLLNVLWLRKWIIVFVSFVFGCISFLYYQFFVP + KTYTSDTRIYVVSKGDNKNLSNADLQAGSALTKDYKEIILSDEVLEETISDLKLESTL + ESLASKIKISIPAETRIISISVTNTNSDEAARIANGIRKVAALKIKEVTQVTDVTTLQ + TARPPQTPSGPHVRKSTTAGLVLGAFLTVFLVVAKEILDDRIKRFEELEKLGIPILGS + IPLSKNIK" + misc_feature 5677..6087 + /gene="wzd" + /locus_tag="SPC25F_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 2.5e-41" + gene 6349..7038 + /gene="wze" + /locus_tag="SPC25F_0007" + CDS 6349..7038 + /gene="wze" + /locus_tag="SPC25F_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33977.1" + /db_xref="GOA:Q4JZ55" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4JZ55" + 
/translation="MGKLELTRKYYQLYNETKEYFNALQTNIQLSGDGLKVISVTSTV + KNEGKSTISVGLSMSLALSGYKVLLLDVDLRNSVMSGMFHSRERITGLTEYLSGKAGM + ADSMQETTLDNLYILQAGVVSPNPLSLLRSVKFETLIDSMKKYFDYIIVDTPPIGQVI + DAAIIAQQCDGIFLVTEMRKTTRRQIFSSLQQLEQTGVPVLGLVANKAIIKKDSYGYY + GKNTASETERY" + gene order(7229..7539,7561..7626,7631..7948) + /gene="tnp" + /locus_tag="SPC25F_0008" + /pseudo + CDS join(7229..7345,7345..7539,7561..7626,7631..7948) + /gene="tnp" + /locus_tag="SPC25F_0008" + /note="member of homology group 19; + member of homology group 19" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1381 transposase" + misc_feature join(7474..7539,7561..7626,7631..7942) + /gene="tnp" + /locus_tag="SPC25F_0008" + /note="HMMPfam hit to PF01609, Transposase DDE domain, + score 2.1e-09" + /pseudo + gene 8169..9620 + /gene="wzg" + /locus_tag="SPC25F_0009" + CDS 8169..9620 + /gene="wzg" + /locus_tag="SPC25F_0009" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33979.1" + /db_xref="GOA:Q4K063" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K063" + /translation="MRYFMSREKKRGTAVHLKSYINSVLLILYTGIASLFLFQIFRYN + ILNFRNLNLLVALLVVLVFILGVSLIVRKKAEKLTMLLLILAVASSSISLLAVQQFIG + FTSRLNATSNVSEYAISLVVLKDSEISELEQVSHVMAPTDTDYEAIQSLLADIKEKQG + KDLIVDKSKSYLEAYKSLISGDTKVIFLNSIFEHMIESDFPDFRDKIKKIYTKEMTKK + VEAPKVSKGQAFTIYFSGIDTYGPINSVSRSDVNILMTVNSETKKILLTTTPRDSYVA + IADGGKNQKDKLTHAGIYGIDSSIHTLEHLYGVEINYYVRVNFTSFLKIVDLLNGIDV + DNSQEFTIDGNDYPVGNLHLNSKSALGFVRERHSLADGDRDRGRNQQKVLAAIIQKLT + SIESLKNYRQIMQGLEDSIQTNLSPTTIMDLANTQLESGGNYKINSQDLKGTGRMDLP + SYAMPDSQLYMMEIDENSLSAIKENIQAVLEGR" + misc_feature 8385..8732 + /gene="wzg" + /locus_tag="SPC25F_0009" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 9.5e-40" + misc_feature 8910..9347 + /gene="wzg" + /locus_tag="SPC25F_0009" + /note="HMMPfam hit to PF03816, Cell envelope-related + 
transcriptional a, score 2.5e-65" + gene 9559..10353 + /gene="wzh" + /locus_tag="SPC25F_0010" + CDS 9559..10353 + /gene="wzh" + /locus_tag="SPC25F_0010" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33980.1" + /db_xref="GOA:Q4JZ53" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4JZ53" + /translation="MMRIASQLSKKIFRLFWRVGKMIDVHSHIIFDVDDGPKSIEDSR + ALLLEAYDQGIRTIVSTSHRRQGMFETPEDKIAENFRAVQKIARDIADDLTILYGAEI + YYTQDIINKLEKKTFPTLNGSRYALIEFSSETSYRSIHSALQQLLLSGITPLIAHIER + YDALENNKQAVLELIRMGCYTQINSSHLLKKKLFKDDAKIMKKRVHYFLKHDLVHIVA + SDMHNLDTRPPYMAEAYEIISKRYGKEKAEEFFIKNPQRILMDQLI" + misc_feature 9625..10233 + /gene="wzh" + /locus_tag="SPC25F_0010" + /note="HMMPfam hit to PF02811, PHP domain, score 3.6e-36" + gene 10372..10959 + /gene="wciI" + /locus_tag="SPC25F_0011" + CDS 10372..10959 + /gene="wciI" + /locus_tag="SPC25F_0011" + /note="member of homology group 29" + /codon_start=1 + /transl_table=11 + /product="putative initial sugar transferase" + /protein_id="CAI33981.1" + /db_xref="GOA:Q4K061" + /db_xref="InterPro:IPR003362" + /db_xref="UniProtKB/TrEMBL:Q4K061" + /translation="MYKVIKRFIDIALALLGIVLLSPLFLGIIVFIKLESKGPIFFKQ + KRIGLHKKEFYILKFRTMRIDTPSAVPTHLLKNPYQWITKVGKVLRRTSLDELPQIWN + ILVGHMSLVGPRPALWNQFDLIEERDKYGANDILPGLTGWAQINGRDELSIPVKAKFD + GYYVKNCSFVLDCRCVVESFLVVFKRYGHREGGAD" + misc_feature 10372..10473 + /gene="wciI" + /locus_tag="SPC25F_0011" + /note="Signal peptide predicted for SPC1337 by SignalP 2.0 + HMM (Signal peptide probability 0.966) with cleavage site + probability 0.671 between residues 34 and 35" + misc_feature 10387..10941 + /gene="wciI" + /locus_tag="SPC25F_0011" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 3e-32" + gene 10972..12102 + /gene="wcyA" + /locus_tag="SPC25F_0012" + CDS 10972..12102 + /gene="wcyA" + /locus_tag="SPC25F_0012" + /note="member of homology group 
170" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33982.1" + /db_xref="GOA:Q4K060" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K060" + /translation="MGNRKKVFVVANVVKEHILKFHIPTIKEMTKRGWTVDVGASGDE + TVPYCHQQYSLPHQRSPFHLGTLKSIWKLRKILKSGGYDIVYCHTPVGGLVGRLASLG + LRKQGTRVIYFAHGYHFYKGATFFNWLVYYPIEKLLSLFTDSIILINQEDYHLTKTKF + KQVQSYLVSGMGVKQERFSPQSNQVRERYRKELKLPEDATVLIYCAELIKNKNQTFLL + HAMKKLVDQGENLYCLLVGIDYTKGEMVECIQSLNLSDRVLLLGWREDIANLYACSDI + CVATSIREGFGLNIVEAMFCHVPVVATINRGHASIIQDGQNGLLVQLGNTKQLVEAIY + VLMKDTKKKQELVEQASANLEQYHSQKIVNSLLEIIEQTAMK" + misc_feature 11527..12042 + /gene="wcyA" + /locus_tag="SPC25F_0012" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 3.5e-40" + gene 12099..13529 + /gene="wzy" + /locus_tag="SPC25F_0013" + CDS 12099..13529 + /gene="wzy" + /locus_tag="SPC25F_0013" + /note="member of homology group 171" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33983.1" + /db_xref="UniProtKB/TrEMBL:Q4K059" + /translation="MSEGCEKVKIQIDKIYYLFFWLVVSFGYFFMMPTFTEDLEGVVS + ASLVQLLLFIIGYVYVSYLNRSFISLYSIFMIVFYLFQNGQVLLYSLGVEYDYFYVLR + YDETIVLQSVIFSTQCLIAAFMAGVFSTKKEVSKPLYSYMDQLEREKLITAGKLFWGA + FAIFALPFMMMKFVITSTSGYFAMIRFVGSLPTITVLFEKMFIASSVFLVVYLKSEET + WSKFLKVVILGWSIMAALTGDRTVGLAGIVTLALIQTLIGNRKKKIKFSQYALLVGAA + VVVMYLMSFAFQFRMQQDSKVSGLQTAVVEMIGTLGFSFFPLVLTIRIVPTSINFFRG + KSYIAAIITGLIPSNFDFLHLTKTLSEWNAYPTELLDTIYHYGFGLDYSLIAEAYINF + GSYGWIAIFFLCSLIAYFVRDVDFKRKDNLFSQYASLILLYSWFTLPRRKSYFIFNNF + FWYVLFFGLALILVSRSIKQRKEFKK" + gene 13526..14293 + /gene="wcyB" + /locus_tag="SPC25F_0014" + CDS 13526..14293 + /gene="wcyB" + /locus_tag="SPC25F_0014" + /note="member of homology group 172" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33984.1" + /db_xref="GOA:Q4K058" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K058" + 
/translation="MKISIIMGIHNGEKRFETAVQSIFNQTYDNWEFIICDDASTDKT + FEKLQGLYGQDSRFILLKNEKNVGLSATLNRCIEASSGEFIARMDDDDICYPERFERQ + VDYLFHHPEIDFVSSSIDIFDGEVVVGTRILLDFPSKKDLIWNSPFVHPVTMFRRDAL + LEVGGYRVSPETVRGQDYDLFMRLYSREKKGGNILEPLFRYTIDQNTMKRRTFKARIG + EMIIRYKGYRAMKVPFYNYVFIFKPLVAHLVTLVKRR" + misc_feature 13535..14017 + /gene="wcyB" + /locus_tag="SPC25F_0014" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 3.2e-39" + gene 14293..15474 + /gene="wcyC" + /locus_tag="SPC25F_0015" + CDS 14293..15474 + /gene="wcyC" + /locus_tag="SPC25F_0015" + /note="member of homology group 173" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33985.1" + /db_xref="GOA:Q4K057" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K057" + /translation="MFMKILITTHTYLPNKDGVQFVNQYLAEGLVKKGHQVTVLTYCY + PSRTRVPREVINGVRVIRWNARTSCTFHKGEKLAYQNFILNSQSDYDVLVNVGTQTAL + TDWLFPIFSQITIPKVLYIHSIWDFNWLHWHRQSFKRFVAKTWANVRWKYYYWKQTVI + FKQYNEVIQLHPKDYSVAFFKEKYDIESQILGNAADASFFQNKNAIKKQSYIVNVSNF + NDLKNQKKAVEYFLKSNLSSEWKFVLVGSEKNDYLQSVQDFEKELRNQLGITSGKEIE + YRIGLSREEVVKTVKEASFCLLTSIREAFPISLIEVMAAGIPFISSDVGIVNYLSGGI + TACSDQEFIRAIEEFATYPEVRNQYGKKGQMEAKEHYQVDDKVKEFETLLQKFVKEEE + D" + misc_feature 14881..15390 + /gene="wcyC" + /locus_tag="SPC25F_0015" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 1.2e-13" + gene 15471..16436 + /gene="wcyD" + /locus_tag="SPC25F_0016" + CDS 15471..16436 + /gene="wcyD" + /locus_tag="SPC25F_0016" + /note="member of homology group 174" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33986.1" + /db_xref="GOA:Q4K056" + /db_xref="UniProtKB/TrEMBL:Q4K056" + /translation="MKKIVFLCPYFGTLPPHTQLWLNSCKMNPSVTWYLFTDDKRTFD + YPENVQVFYTTLEETKALYQRKFDFEISLEGAYKLGDYKPLFGYLYEEMIQEFDAWGH + IDVYDEIYGDIRAFVTDELLDKYDKLMFFGHMGIYRNSPEVNRRFKLSSDLDRTYQEI + FSSSQFYNFEEYVAGSITRVYQKNGFPIGRLDKVIADLSGLSYHFRRGYYSDDFETFT + 
YLPNLPMIFSWEDGKTYCYSVQNNQVQKNEFLYVHFKRRKMIQSISNDVSAYLIVPNG + FVEMPKEITVDLIQKYSQKKLFYPVYFQEKWKGVKRLLKKIGRSE" + gene order(16433..17117,17120..17146) + /gene="wcyE" + /locus_tag="SPC25F_0017" + /pseudo + CDS join(16433..16516,16515..17117,17120..17146) + /gene="wcyE" + /locus_tag="SPC25F_0017" + /note="member of homology group 175" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + gene 17122..18537 + /gene="wzx" + /locus_tag="SPC25F_0018" + CDS 17122..18537 + /gene="wzx" + /locus_tag="SPC25F_0018" + /note="member of homology group 176" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33988.1" + /db_xref="GOA:Q4K055" + /db_xref="InterPro:IPR002528" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K055" + /translation="METKEKRLVNNTIIFTIGSLGSKFIQFLLVPLYTYTLTAAQFGI + TEILLTAVNLLIPVFSISIADGLLRFGLDKTLRRENVLKSAFIISILGTILSIISIPI + FSLYPTLSEWMVYFIIILNLRMYRDVFAIQLKVEGKNTLFACDSMIYTFVLSLASIVF + LVPFSLGISGYFFAYIVSNGISIFFILFFGGVWKSFTSGRFEKQLMIQLLKYSAPMIL + NGIAWWITNASDRFMLQWFMDDRAVGLYGVVAKLPLLIGTFTGVFNQAWIISAVEEFE + EENEEWFYQKVFHQYYAALFLSVSVFLLLLQPFMKVYVSPSFYEAWQYAPFLLLSSVV + SGIAAFMTGFYVAQKKNLNIIYTTIAGAFANILLNAMFIPMLGVLGASIATFLSWFVI + AIYRMKDVENFACFPLDKKVFWYLFLLCIQTITMTFLPILGIVFSVVLIPYFFYQEQE + FLAVLFDKGRKKVCSFKKSKR" + misc_feature 17143..17946 + /gene="wzx" + /locus_tag="SPC25F_0018" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 3.4e-10" + gene 18510..19172 + /gene="wcyF" + /locus_tag="SPC25F_0019" + CDS 18510..19172 + /gene="wcyF" + /locus_tag="SPC25F_0019" + /note="member of homology group 177" + /codon_start=1 + /transl_table=11 + /product="conserved hypothetical protein" + /protein_id="CAI33989.1" + /db_xref="InterPro:IPR015037" + /db_xref="UniProtKB/TrEMBL:Q4JZ44" + /translation="MFIQKIKKIIRVFLRKSLVKDYRQRIQNKEFTLITSNCVGGLIS + HDLGLQFRSPTINMYIEAADFIQFCSHLERYLKEDLSFIEVNQDGHFVALCGDIKIYI + VHYNSFEEFAKKWSERAKRVDFDQLYLMMSERDGCRYEDIVKFDTLPYKNKVIFTSKK + 
MPEIQSAFYIPGIETKNNQKHKVKSVTTYLNSFTGKRYIDLFDFVEFLNTGRKQLSKY + EK" + gene 19162..20244 + /gene="gla" + /locus_tag="SPC25F_0020" + CDS 19162..20244 + /gene="gla" + /locus_tag="SPC25F_0020" + /note="member of homology group 96" + /codon_start=1 + /transl_table=11 + /product="putative epimerase" + /protein_id="CAI33990.1" + /db_xref="GOA:Q4JZ43" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR008089" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JZ43" + /translation="MKSKIILKNKTILVTGAAGFIGANLVMSLLQEENPLQIIGIDNL + NDYYDVSLKEYRLSTIQEECQSSLNKKWVFIKGDIADSDLMEEIFETYRPQIVVNLAA + QAGVRYSITNPDVYMKSNIIGFHTILEKCRKYQENIEHLVYASSSSVYGGNTKIPFSE + LDAVDNPVSLYAVTKKTNELEAHAYSKLYNIPTTGLRFFTVYGPAGRPDMAYFSFTKQ + LIDKKPIEIFNYGNCQRDFTYIDDIVEGVKRVMTGAPQKEIGEDGLPIPPYAIYNIGN + HQPENLLNFVEILQEKLIAASILPEDYDFSSAQKLVPMQAGDVVATYADISLLEKDFN + FKPKTSLRNGLRNFAEWYRNFYQRGE" + misc_feature 19162..19251 + /gene="gla" + /locus_tag="SPC25F_0020" + /note="Signal peptide predicted for SPC1346 by SignalP 2.0 + HMM (Signal peptide probability 0.974) with cleavage site + probability 0.471 between residues 30 and 31" + misc_feature 19192..20223 + /gene="gla" + /locus_tag="SPC25F_0020" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.00023" + misc_feature 19195..20100 + /gene="gla" + /locus_tag="SPC25F_0020" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 7.1e-05" + misc_feature 19195..19986 + /gene="gla" + /locus_tag="SPC25F_0020" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 8.3e-55" + misc_feature 19198..20064 + /gene="gla" + /locus_tag="SPC25F_0020" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 5.4e-09" + gene 20204..21472 + /gene="ugd" + /locus_tag="SPC25F_0021" + CDS 20204..21472 + /gene="ugd" + /locus_tag="SPC25F_0021" + /note="member of homology group 20" + /codon_start=1 + /transl_table=11 + /product="UDP-glucose 6-dehydrogenase Ugd" + /protein_id="CAI33991.1" 
+ /db_xref="GOA:Q4JZ42" + /db_xref="InterPro:IPR001732" + /db_xref="InterPro:IPR008927" + /db_xref="InterPro:IPR013328" + /db_xref="InterPro:IPR014026" + /db_xref="InterPro:IPR014027" + /db_xref="InterPro:IPR014028" + /db_xref="InterPro:IPR016040" + /db_xref="InterPro:IPR017476" + /db_xref="UniProtKB/TrEMBL:Q4JZ42" + /translation="MQNGIEIFIKGVNRMKITVVGMGYVGLSLAVLLAQHHEVTALDI + IDKKIQLINEKKSPIQDEYIEQYFLEKNLHLSATTNEVEAYKDAEMIIIAAPTDYDTH + KNFFDTSAVEQVIENIISMNNEALIVIKSTVPVGYTESIREKYGKKNILFSPEFLREA + NGLYDNLYPNRIIVGTDLNDGALVSKAHEFVSLLQEGALKENIDTLIMGFSEAEAVKL + FSNAYLALRVSYFNELDTYAELKGLNTKAIIDGVGLDPRIGQFYNNPSFGYGGYCLPK + DSKQLLSNYHDVPENIISAIVSSNETRKKFIAERILEIVGANHIDEYYNLKQEIVVGI + YRLVMKKGSDNFRHSSIQGIIKRLKANGVTLMIYEPSLPDGQLFFGSEVVHDFPKFKE + KSHLIVANRFDETLMDVKDKVYTRDLFGRD" + misc_feature 20246..20803 + /gene="ugd" + /locus_tag="SPC25F_0021" + /note="HMMPfam hit to PF03721, UDP-glucose/GDP-mannose + dehydrogenase, score 1.3e-45" + misc_feature 20246..20644 + /gene="ugd" + /locus_tag="SPC25F_0021" + /note="HMMPfam hit to PF01210, NAD-dependent + glycerol-3-phosphate deh, score 0.0013" + misc_feature 20831..21112 + /gene="ugd" + /locus_tag="SPC25F_0021" + /note="HMMPfam hit to PF00984, UDP-glucose/GDP-mannose + dehydrogenase, score 1.6e-35" + misc_feature 21212..21451 + /gene="ugd" + /locus_tag="SPC25F_0021" + /note="HMMPfam hit to PF03720, UDP-glucose/GDP-mannose + dehydrogenase, score 8.5e-05" + gene complement(order(21604..22185,22242..22927)) + /gene="tnp" + /locus_tag="SPC25F_0022" + /pseudo + CDS complement(join(21604..22185,22242..22412,22412..22927)) + /gene="tnp" + /locus_tag="SPC25F_0022" + /note="member of homology group 13" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1167 transposase" + misc_feature complement(join(22105..22185,22242..22412,22412..22435)) + /gene="tnp" + /locus_tag="SPC25F_0022" + /note="HMMPfam hit to PF01610, Transposase, score 1.2e-31" + /pseudo + gene 23913..25190 + /gene="intron" + /locus_tag="SPC25F_0023" + CDS 
23913..25190 + /gene="intron" + /locus_tag="SPC25F_0023" + /note="member of homology group 108" + /codon_start=1 + /transl_table=11 + /product="putative group II intron protein" + /protein_id="CAI33993.1" + /db_xref="GOA:Q4K051" + /db_xref="InterPro:IPR000477" + /db_xref="InterPro:IPR013597" + /db_xref="InterPro:IPR015706" + /db_xref="UniProtKB/TrEMBL:Q4K051" + /translation="MSKLLDKILSRENMLEAYNQVKSNKGSAGIDGMTIEEMDNYLRQ + NWRLTKELIKQRKYKPQPVLKVEIPKPDGGIRQLGIPTVMDRMIQQAIVQVMSPICEP + HFSDTSYDFRPNRSCEKAIMKLLEYLNDGYEWIVDIDLEKFFDTVPQDRLMSLVHNII + EDGDTESLIRKYLHSGVIINGQRYKTLVGTPQGGNLSPLLSNIMLNELDKELEKRGLR + FVRYADDCVITVGSEAASKRVMYSVSRFIEKRLGLKVNMTKTKITRPRELKYLGFGFW + KSSDGWKSRPHQDSVRRFKFKLKKLTQRKWSIDLTRRIEQLNLSIRGWINYFSLGNMK + SIVASIDERLRTRLRVIIWKQWKKKSRRLWGLLKLGVPKWIADKVSGWGDHYQLVAQK + SVLKRAISKPVLEKRGLVSCLDYYLERHALKVS" + misc_feature 24087..24737 + /gene="intron" + /locus_tag="SPC25F_0023" + /note="HMMPfam hit to PF00078, Reverse transcriptase + (RNA-dependent DNA pol, score 6.4e-63" + misc_feature 24783..25034 + /gene="intron" + /locus_tag="SPC25F_0023" + /note="HMMPfam hit to PF08388, Group II intron, + maturase-specific domain, score 3.5e-30" + gene complement(order(25250..25723,25725..26051)) + /gene="tnp" + /locus_tag="SPC25F_0024" + /pseudo + CDS complement(join(25250..25723,25725..26051)) + /gene="tnp" + /locus_tag="SPC25F_0024" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(join(25661..25723,25725..26033)) + /gene="tnp" + /locus_tag="SPC25F_0024" + /note="HMMPfam hit to PF01710, Transposase, score 2.2e-23" + /pseudo + gene order(26312..26628,26645..27136) + /gene="tnp" + /locus_tag="SPC25F_0025" + /pseudo + CDS join(26312..26413,26413..26628,26645..27136) + /gene="tnp" + /locus_tag="SPC25F_0025" + /note="member of homology group 19; + member of homology group 19" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1381 transposase" + 
misc_feature join(26554..26628,26645..27016) + /gene="tnp" + /locus_tag="SPC25F_0025" + /note="HMMPfam hit to PF01609, Transposase DDE domain, + score 0.0004" + /pseudo + gene 27282..28265 + /gene="tnp" + /locus_tag="SPC25F_0026" + /pseudo + CDS 27282..28265 + /gene="tnp" + /locus_tag="SPC25F_0026" + /note="member of homology group 39" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1239 transposase" + misc_feature 27786..28220 + /gene="tnp" + /locus_tag="SPC25F_0026" + /note="HMMPfam hit to PF00665, Integrase core domain, + score 1.1e-18" + /pseudo + gene 28342..>28389 + /gene="aliA" + /locus_tag="SPC25F_0027" + CDS 28342..>28389 + /gene="aliA" + /locus_tag="SPC25F_0027" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33997.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ89" + /translation="MMKSSKLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acactgcggc taaagaagta cttgaaaaac aggtcttggc tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcata taaaaacaag + 181 ggaggactgt ataaaaagca gaaatccttt gttttttata accaaggttt ataaactttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga agatgaacat + 301 aaagaagcgt gtccttagtg caggtctgac ttttgcatct gctttgcttt tagctgcttg + 361 cggccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaactat ctattagact attacgctga taatacattg attatcacca atctagttga + 481 tggtttgctt gaaaatgaca atcacggaaa cctagttcca tctttgccag aggactggtc + 541 tgtttcgagc gacggtctga cttatactta caaattgaga aaagatgcca aatggttcac + 601 agctgacggt gaagagtact ccccagtcaa ggcccaggat tttgtgacag gtatcaagta + 661 cgtagtggat aataaatcac aggctattga cttgattcaa aactcgatca aaggtttgaa + 721 tgattatatt acaggagcgg attctgactt ttctaaggtt gggatgaagg ccattgacaa + 781 ccagactgtt gagtatactt tggtacgccc agaaccttac tggaactcaa aaacaaccaa + 841 cagtattctt ttcccggtaa actaagagtt tctaaattca aaagggaaag attttgggac + 901 cctatctcca gatagtattc tctacagcgg tccttatttg ttaaaagatt tcacatcaaa + 961 
atcatttatc gagtatgtga aaaacccaca ttactatgat catgccaaag tatcgattga + 1021 acacgtgaaa ttggcttact ttaatggatc agatcaagaa ttgactatcc gtaactttga + 1081 aagtggagct tattctatcg ctggagttta tccaaatagt tcgaactttg ctaagaccaa + 1141 ggagaaatat aaggataata tcgtctatag cttgcaggac aagacttctt ggtatttaaa + 1201 tttcaatgtc aatcgcgagg cttgcaatca cactactaaa acgacagatg agccgaagaa + 1261 gtcaactgag acagctgtct tgaacaaaaa cttccgccaa gcagtaaact ttgccttgga + 1321 ccgcacagcc cattctgccc agtcaaatgg ggaagaggcg gctagcaaga cccttcgtaa + 1381 caccttggtg ctcctacatt tgtccaagtt ggagacaaga cctttggaga agtagttgct + 1441 tctaaattgg tcaactatgg tacagaatgg aggtattgac ttggcagatg ctcaggatgc + 1501 ctatttcaac aaagaaaaag cccaagcaaa atttgcggaa gctaaaaaag aattggcaag + 1561 tcaaggtgtg actttcccta ttcacgtgaa tgtggcagta gatcagacaa gtaaaaatgc + 1621 cgttacaggc atgaactcag ttaagcagac tctggagtca gttttaggtg ctgataacat + 1681 tgttattgat gttcagcaac tttcaacaga tgattttaat aatgtacctt cttggcaccg + 1741 atgccagctg atagaggcta tgatttgagc tttgatggtt gggtgggtga ctatcaggat + 1801 ccatcaactt atctcaatcc tttcaatgca gagaatggct tctatctcaa aatttttgga + 1861 ccggatgcca aggaagataa ggaaaaaatc actagcctag gtcttgatac ctacactaag + 1921 atgctcaaag atgcagatag tgaaaacaaa gatgtagcca aacgctatga aaaatatgct + 1981 gaagcacagg cttggatgat tgacaattct ctcattatgt cagctatgtc aagtggtggc + 2041 acagcatctg taaccaaagt gatgccattt acaagagggc attaattggt tggtattaag + 2101 ggtgatggca ataactacaa gtacatgaaa ctgcaaaaag atactgtaac aaccaaacgg + 2161 tttgaaaaag ctaagaccaa atgggagcaa gaaagcaaaa aagcaatcga aaaagcccaa + 2221 aaagaagcag aaaaacatgt taaatagtta taaatagctt tttcaaggag aattaaaaag + 2281 acaaacatca gttttggtgc ttgtcttttt aaatcactcg gttattgaaa attagacttc + 2341 ttgcgaaaca ggctctttgt caactgtagt gggttgaaga aaagctaagc tcgagaaagg + 2401 acaaatttcg tcctttcttt tttgatattc agagcgataa aaatccgttt tttgaagttt + 2461 tcaaagttcc gaaaaccaaa ggcattgcgc ttgataagtt tgatgagatt attggtcgct + 2521 tccaatttgg cgtttgaata gggtagttga agggcgttga cgattttctc tttgtccttt + 2581 agaaaggttt taaagacagt 
ctgaaaaata ggatgaacct gcttaagatt gtcctcaatg + 2641 agtccgaaaa atttctcagg gtctttgttc tgaaagtgaa aaagtaagag ttgatagatc + 2701 tgatagtggt gtttcaagtc ttctgaatag cttaaaatct tgtcaagaat ttctttattt + 2761 gttaagtgca tgcgaaaagt agggcgataa aatcgcttat cactcagttt acggctatcc + 2821 tgttgaatga gtttccagta gcgcttgata gccttgtatt catgggattt tcgatgaaac + 2881 tgattcatga tttggacatg cacacgactc atagcacggc taagatgttg tacaatgtga + 2941 aagcgatcaa gaacgatttt agcattcggg agtgaaacag cctgggagac tgtttcagcc + 3001 tgagcctaga aatttgaaag cgaagctgtt tagccaagtc atagtaaggg ctaaacatat + 3061 ccatagtaat gattttgacg cgacatcgga cggctctatc atatttaaga aagtgatctc + 3121 ggatgacagc ttgtgttcta ccctcaagaa cagtgatgat atcgagcttt tcaaaatctt + 3181 gcgcaataaa gctcatctcc atctcccgat tgaaacagtc actccccgga ctgtttcaac + 3241 gtcccaggac ataatctcag gaagacaaga aaaatcatgt ttaaagtgaa aatcattgag + 3301 ctttcgaatg acagttgaag ttgaaatggc cagctgatgg gcaatatcgg tcatagaatt + 3361 cttttcaatt aacttttgag caatcttttg gttgatgata cgagggattt ggtgattctt + 3421 cttgacgata gaagtttcag cgaccatcat ttttgaacag tgatagcact tgaatcgacg + 3481 ctttctaagg agaattctag taggcatacc agtcgtttca agataaggaa ttttagaagg + 3541 tttttgaaag tcatatttct tcatttgact tccgcactca gggcaagatg gggcgtcgta + 3601 gtccagtttg gcgatgattt ccttgtgtgt atccttattg atgatgtcta aaatctggat + 3661 attagggtct ttaatgtcta gtaattttgt gataaaatgt aattgttcca tatgaatctt + 3721 tctaatgagt tgtttgatcg cttttcattt ggccactctt caatatgtgc gagaatatcg + 3781 cacttatgaa caaattgcgg ctgattttgg tattcacgaa agcaacttaa tccgtcggag + 3841 ccaatgggtt gaagtaactc ttgttcaaag tggttttacg atttcaagaa ctcctctcag + 3901 ttctgaggac acggtaatga ttgatgcgac ggaagtaaaa atcaatcgcc ctaaaaaaag + 3961 aattagcaaa ttattctggt aaaaagaaat gccgcgctat ggaaaaatga tttgttttgt + 4021 gctaaaatag attgaaacta atactcaatg aaaatcaaag agtaacttgg aagttagctc + 4081 aaagtacagc tttaaggtgg tagatagaac tgacgaagtc agctcaaaat actgttttga + 4141 ggttgcagat ggacgctgac gtggtttgaa gagattttcg aagagtataa gatcctctct + 4201 tttgctatag ttaaggagat gagaggtaaa tgataaggga 
gagactatgt acgactatct + 4261 aatcgttggt gctggtttgt cgggagcaat ttttgcttat gaagcaacca agcgtggaaa + 4321 aaaagtaaaa gttattgata aacgtaacca cattggtgga aatatctact gtgagaatat + 4381 agaaggagtt aatgttcata aatatggtgc acatatcttc catacttcta ataagaaagt + 4441 ctgggattat gtgaatcaat ttgctgaatt taacaactac atcaactcgc ctgtagctaa + 4501 ttacaagggt agcctttata atctaccttt caatatgaat actttctatg ctatgtgggg + 4561 gacaaaaact cctcaagaag tgaaaaataa gattgctgag caaacggctc acatgaaaga + 4621 cgttgaaccg aaaaacttgg aagaacaggc tatcaagttg atcggtccag atatttatga + 4681 aaagttgatt aaaggatata ctgaaaagca atggggacgt tccgcgactg accttccacc + 4741 gtttatcatc aaacgtctac cagttcgttt gacttttgat aataactact ttaatgaccg + 4801 ttaccaaggt attccaatcg gtggctataa tgtcattatc gaaaatatgc tgaaagatgt + 4861 tgaagtagaa cttggagttg acttttttgc caatcgtcag gaattagaag cttctgctga + 4921 aaaagttgtc tttacaggga tgattgacca atatttcgat tataaacatg gtgagctaga + 4981 ataccgtagt cttcgttttg agcatgaagt tctagataag gaaaattatc aaggaaatgc + 5041 cgttgttaat tatacagaac gagaaattcc ttatactcgc attattgagc acaaacattt + 5101 tgagtacgga acacaagata aaacggttat tactcgtgaa tacccagctg attggaaacg + 5161 tggagatgaa ccttattatc caatcaatga tgagagaaac aatgccatgt ttgctaaata + 5221 tcaagaagaa gcagtacaga atgataaggt aattttctgt ggacgtttgg ctgattataa + 5281 atactacgac atgcatgtgg ttattgaacg ggctttggaa gtggtaagga atgagttctc + 5341 atgagagaaa caggcatata tgaaagttaa tgtagaggag ttgagctttt tatttgaata + 5401 ttgggtgaaa aagtagtata cttagatagt ctgtttttaa aaatcaaaat ggggaaatcg + 5461 attcttatca acttcagagt gaactgaatt aaaactgcat aggagtatat aaaatgctga + 5521 agtaagattt acagaacatg gtatgataag tgttcgacag cttgtttggc aggagttcga + 5581 atattcaagt aattgagagg gtttttgaac ttctgataag atagatagta gattactttc + 5641 gagtaaagga tagttgagaa aatgaataat cgtatagtag acatcagttt gtttgattta + 5701 ttgaatgtct tatggcttcg taaatggatc attgtttttg tatcatttgt ttttggatgt + 5761 atttcttttt tatattatca attttttgta cccaaaacct atacaagtga tactcgtata + 5821 tatgtggtaa gcaaagggga taataaaaat ctgtctaatg cagatttgca agcaggaagt + 5881 
gctctaacaa aggattacaa agaaatcatt ttatcagatg aagtgttaga agaaacaatt + 5941 tctgatttaa aactagaatc aactttggaa tctctagctt cgaaaattaa aatttctatc + 6001 cctgcggaaa ctcgaattat ttccattagt gttacaaata cgaactcaga tgaagctgct + 6061 cgaatagcaa atgggataag gaaggtagct gcccttaaaa tcaaggaagt aactcaagtt + 6121 acagatgtca ccactttaca gactgcacgc cctccccaaa ctccgtcagg accgcatgtg + 6181 cgaaaatcta ctacagcagg gcttgttctt ggtgcattct taacagtctt tctagtagtt + 6241 gccaaggaaa tattagatga tcgcataaaa cgttttgaag aacttgaaaa attgggaatc + 6301 cctattttag gctcaatacc tttatcaaaa aatataaagt agaaaatcat gggaaaatta + 6361 gaactaacac gtaagtacta tcaattgtac aatgaaacga aagaatattt taatgcctta + 6421 cagaccaata ttcaacttag tggtgatgga ctgaaagtca tttctgttac ttccacagta + 6481 aaaaacgaag gcaaatcgac tatatcagtt ggcttgtcca tgtccttggc cttatcaggc + 6541 tataaagtcc tgttactgga tgtggattta cgtaattcag tgatgtcagg aatgtttcat + 6601 tctagggaaa gaataacagg tttgactgaa tatttatctg gcaaagcggg aatggcggat + 6661 tctatgcagg aaactacttt agataatctc tatatattac aagcaggagt cgtttcaccg + 6721 aatcccttat ctctattaag gagtgttaag tttgaaacct tgatagattc tatgaaaaag + 6781 tactttgact atattatagt agatactcca ccaatcggcc aagtaataga tgctgcaatt + 6841 attgcccaac aatgtgatgg gatatttttg gtcactgaaa tgaggaaaac gacacgcaga + 6901 caaatttttt cttccctcca gcaattggaa caaactggag ttcccgtttt gggccttgtg + 6961 gccaataaag caattataaa aaaagatagc tatggctatt atggaaaaaa caccgcgagc + 7021 gagactgaaa gatattgatg gactacctcc tctacctcac aaattgcatt ttttgtgagg + 7081 tagaggagta agttgatact attatatatt agacttcctg cgaaacaaaa tatggtatag + 7141 tagttctatg aattatgaag caagtaaaca actaactgat gcacgattta agcgtcttgt + 7201 tggtgttcag cgtaccactt ttgaagagat gttagctgta ttaaaaacag cttatcaact + 7261 taaacacgca aaaggtggac gaaaacctaa attaagccta gaagaccttc ttatggctac + 7321 tcttcaatat gtgcgagaat acccacttat gaagaaattg cggctgattt tggtattcac + 7381 gaaagcaact tactccgtcg gagccaatgg gttgaagtaa ctcttgttca aagtggtgtt + 7441 acgatttcaa gaactcctct cagctctgag gacacggtaa tgattgatgc gacggaagta + 7501 caaatcaatc gccctaaaaa 
aagaattagc gaattattct gataaaaaaa atgccacgct + 7561 atgaaggctc aagcgattgt cacaagtcaa gggagaattg tttctttgga tatcgctgtg + 7621 aactatttgt tatgatatga agttgttcaa aatgagtcgc agaaatatcg gacaagctgg + 7681 taaaatcttg gctgacagtg gttatcaagg gctcatgaag atatatcctc aagcacaaac + 7741 tccacgtaaa tccagcaaac tcaagccgct aacagctgaa gataaagcct gtaaccatgc + 7801 gctatccaag gagagaagca tggttgagaa catctttgcc aaagtaaaaa cgtttaaaat + 7861 gttttcaaca acctatcgaa atcatcgtaa acgcttcgga ttacgaatga atttgattgc + 7921 tgctattatc aatcatgaac taggattcta gtttggcagg aagtctattt tggaatgcta + 7981 ttatgtttag ttgtgctcaa tgaaaatgaa agaactagta agctaggcgc agtcagctca + 8041 aaacagtgtt ttgaggttgt agatagaact gacgaagtca gtaacatata tatgacaaac + 8101 cgatgctgac gtggtttgaa gagatttttg aagagtataa gacggtattt taagggaatg + 8161 attactattt gaggtatttt atgagtagag agaaaaaaag aggaacagca gtccacttga + 8221 aatcttatat caatagtgtg ctgctaatcc tgtacacagg aatagcgagc ctatttcttt + 8281 ttcagatatt ccgatacaat attttaaatt ttaggaatct caatttatta gtagctctgc + 8341 tagtagtatt ggtatttatt ttaggagtga gtttgattgt ccgaaaaaaa gctgaaaagt + 8401 tgacaatgct tctcctaatc ttagctgtcg caagtagttc aatatcgctt ttggctgttc + 8461 aacaatttat cggttttaca agtcgcttaa atgcaacttc aaacgtttca gaatatgcta + 8521 ttagtcttgt agttttgaaa gatagcgaaa ttagtgaact agaacaagta tcacatgtga + 8581 tggcgcctac cgatacagat tatgaagcta ttcaaagttt gttagcagat ataaaagaaa + 8641 agcaaggtaa agatctaata gtagataaaa gcaaatctta tttagaagcc tataagagtt + 8701 tgatttcagg tgacaccaag gtgatttttt taaatagtat ttttgaacat atgattgagt + 8761 cggattttcc tgactttaga gacaaaatta agaaaatata tacaaaagaa atgacaaaga + 8821 aagtagaagc tccaaaggtt tcaaaggggc aggcttttac tatttatttc agtgggattg + 8881 atacttatgg accaattaac tctgtatcac gttcggatgt caatattttg atgacagtca + 8941 atagcgagac caaaaaaatt cttttgacaa ctacacctcg tgactcctat gtcgcaattg + 9001 cagatggagg aaagaatcaa aaagataaat tgactcatgc tggaatttat ggtattgatt + 9061 cttccattca taccttggaa catttatatg gtgtagagat taactactat gttcgtgtaa + 9121 atttcacttc tttcttaaag atagttgatt tattgaatgg 
tattgatgtg gacaatagtc + 9181 aagaatttac aattgacggg aacgactatc ctgttggaaa tctccatcta aattctaagt + 9241 cagcacttgg tttcgttcga gaacgtcatt ctctagcaga tggagatcgt gatcgaggac + 9301 ggaatcaaca gaaggtgctc gctgcaatta ttcaaaaatt aacctcaata gaatcattga + 9361 aaaattatcg tcaaatcatg caaggattag aggattcaat acaaacaaat ctctctccaa + 9421 caactatcat ggacttagcc aatactcaat tggaaagtgg agggaattat aaaataaatt + 9481 ctcaagattt aaaagggaca gggcggatgg atcttccttc ttatgcaatg cctgatagtc + 9541 agttgtatat gatggaaatt gatgagaata gcctctcagc tatcaaagaa aatattcagg + 9601 ctgttctgga gggtaggtaa gatgatagat gttcattctc acattatttt tgatgtggat + 9661 gatgggccaa agtccataga agatagtaga gctttgttgt tagaagccta tgatcaagga + 9721 attcggacaa ttgtttcaac atcccaccgc cgtcaaggta tgtttgaaac accagaagac + 9781 aagattgcgg aaaattttcg tgcggtacag aaaatagcta gagatattgc agatgattta + 9841 acaattttat atggtgcaga aatctactat actcaagaca ttatcaataa acttgaaaag + 9901 aaaactttcc caactttaaa tgggagtcga tatgccttga ttgaatttag tagcgagact + 9961 tcttatcgtt ctattcatag cgctcttcag cagttgcttt tgtcaggaat taccccgctt + 10021 atcgcccata tcgaacgtta tgatgctctt gaaaacaata aacaagcagt tctcgaattg + 10081 attcgtatgg gctgttatac acagattaat agttcccatc tactcaaaaa aaaattattt + 10141 aaagatgatg caaaaatcat gaagaaacga gttcactatt ttttgaaaca tgatttagtc + 10201 catattgtag caagtgacat gcataatctt gatactagac cgccttatat ggcggaagct + 10261 tatgaaatca tttctaaaag atacggaaaa gaaaaagctg aagaattttt tataaaaaat + 10321 ccgcaacgaa tcctaatgga tcaattgatt taatgaaaaa ggaaacaaca aatgtataaa + 10381 gttatcaaac gatttataga tatagcttta gccttgctag gaattgtatt attatcacca + 10441 ctatttttag gaattatagt gttcataaaa ttagaatcta aagggcctat tttctttaaa + 10501 caaaaaagaa ttgggctaca taaaaaagaa ttttacattc taaaatttag aacgatgaga + 10561 attgacactc cttcagctgt ccctacacat cttttaaaaa atccttatca atggattaca + 10621 aaggttggta aagtcttacg tagaacctct ctggatgaat tgccacagat ttggaatatt + 10681 ttggtcggtc acatgtcgct tgtaggacca agacctgccc tttggaatca atttgatttg + 10741 attgaagaaa gagacaaata tggagcaaat gatattttac ctggtttaac 
aggttgggca + 10801 caaatcaatg gaagagatga attatctatt ccagtcaaag ccaaatttga tggctactat + 10861 gtgaagaact gttcatttgt tttagattgt cgatgtgttg tagaaagttt tttagtagta + 10921 tttaagagat atgggcatcg agaaggtggt gcagattaga ggaactgata tatgggaaat + 10981 cgtaaaaaag tttttgtagt agccaatgta gtcaaagaac atattctaaa atttcacatt + 11041 ccgactatca aagaaatgac aaaaagaggg tggacggtag acgtaggtgc ttctggggat + 11101 gaaacagttc cctattgtca ccaacaatat tcactgcccc accaacgttc tccgtttcat + 11161 ctaggcactc tcaaaagtat ctggaaattg agaaaaattt tgaagtctgg aggctatgat + 11221 attgtttact gtcatactcc tgttggaggt ttggtgggac gactggcttc tttaggattg + 11281 cgaaaacaag gaacaagagt catttatttt gctcatggat atcattttta caaaggagca + 11341 acttttttca attggttagt gtattaccca attgaaaagc tactgtccct ttttacagat + 11401 agtatcattc taatcaatca agaagattat catctcacaa aaacaaaatt taaacaggtt + 11461 caatcctatc tagtgagtgg aatgggagta aaacaagaac ggttttcacc ccaatcaaat + 11521 caagttagag aacgttatcg taaagaattg aaactgcctg aggatgcgac tgttttaatt + 11581 tattgtgctg agctaataaa aaataaaaat caaacatttt tacttcatgc tatgaaaaag + 11641 cttgtggatc agggagagaa tctttattgc ttattagtag gaattgatta taccaagggt + 11701 gaaatggtag aatgtattca atccttgaat ttatccgatc gagttttact tttagggtgg + 11761 agagaagata ttgccaatct ttacgcttgt tctgatatat gtgttgcaac aagtattcga + 11821 gaaggatttg gattaaatat agtggaagca atgttttgtc acgttccagt tgttgcgacc + 11881 atcaatagag gacacgccag tattatacaa gatggacaaa acggtctatt agtccaatta + 11941 ggaaatacaa agcaattagt agaggctatt tatgtactaa tgaaggatac taagaagaag + 12001 caagaattag tggagcaagc tagtgcgaat ttagaacaat atcatagtca gaaaattgta + 12061 aatagcttac tagaaataat agaacagact gcaatgaagt gagtgaagga tgtgaaaaag + 12121 tgaaaataca aattgataaa atatactatc tatttttttg gctggtagtt tcctttggat + 12181 atttttttat gatgccaacc tttacagaag atttagaagg cgttgtcagt gctagtttag + 12241 tacaattgtt attatttatt ataggatatg tatatgtatc ttatttaaat cgttctttta + 12301 tctcactgta tagtatcttt atgattgtgt tttacctttt tcaaaatgga caggtattgt + 12361 tatattcact tggagtagag tatgattact tttatgtttt aagatatgat 
gaaaccatcg + 12421 tactacaatc agttattttt tcaacacaat gtcttattgc agcctttatg gctggagtct + 12481 tttctacgaa gaaagaggta tcaaaacccc tttattctta tatggatcaa ttagaacgag + 12541 aaaaactgat tactgctgga aagttatttt ggggtgcgtt tgcgattttt gctttaccct + 12601 ttatgatgat gaagtttgtt atcaccagta catctgggta ttttgcgatg atacgtttcg + 12661 ttggaagcct acctacaata acagtgttat ttgaaaaaat gttcattgct tcaagtgttt + 12721 ttttggttgt ttatttaaaa tctgaggaaa cttggagcaa gtttttaaaa gttgttatct + 12781 taggttggag tataatggct gctttaacag gagatagaac cgtaggttta gcagggattg + 12841 ttacgttagc tttaattcaa acattaattg gtaatcgtaa aaaaaagatt aagttttctc + 12901 agtatgcctt gttagttggg gcagctgttg tagtgatgta tttaatgtcc tttgcttttc + 12961 aatttaggat gcaacaagat tctaaagttt caggactaca aactgcggta gtagaaatga + 13021 taggaactct agggtttagt tttttcccac tcgtattaac gattagaatt gttccaactt + 13081 ctattaactt ttttagagga aaatcatata ttgcagccat cattacagga ctaattccat + 13141 ctaattttga ttttttacat ttaacaaaga cattatcaga atggaatgca tatccaacgg + 13201 aattattaga tacaatctat cattatggtt tcggattaga ttattcttta attgcggaag + 13261 cctatattaa ttttggttct tatggatgga tagcgatttt tttcctttgt tctctaatag + 13321 cttattttgt aagagatgtg gattttaaaa ggaaggacaa cttattctca caatatgcta + 13381 gcttgatttt gctgtattca tggtttaccc ttccaagaag aaaatcttat tttattttta + 13441 ataatttttt ttggtatgta ttattttttg gactagcact catacttgtc tctcgttcta + 13501 ttaaacaacg aaaggaattt aaaaaatgaa aatttcaatt attatgggca ttcataatgg + 13561 tgaaaagcgc tttgaaacag ctgttcaaag tattttcaat caaacttatg ataattggga + 13621 atttattatt tgtgatgatg cttccacaga taaaacgttt gaaaagttac aaggattata + 13681 tggacaggat tcacgtttta tcttattaaa aaatgaaaaa aatgtaggtc tttccgcgac + 13741 attaaaccgt tgcattgaag caagtagtgg agaatttatt gctagaatgg atgatgatga + 13801 tatttgttat cccgagcgct ttgaaagaca agtcgactat ttgttccatc atccagagat + 13861 tgattttgtt tcttcatcta ttgatatttt tgatggagaa gtagttgtag gtacacggat + 13921 tttacttgat tttcctagta aaaaggattt gatttggaat agcccctttg ttcatcctgt + 13981 taccatgttt cgtagagatg ccttgcttga agttggcggt tatagagttt 
ctccagaaac + 14041 tgttcgtggg caagattatg atttgtttat gagactatat tcacgcgaga aaaaaggtgg + 14101 aaatatttta gaaccactat ttcgctatac gattgatcaa aatacgatga agcgacgtac + 14161 gtttaaagct cgaattgggg aaatgattat tcgctataaa ggttatcgtg cgatgaaagt + 14221 tccattttat aattatgttt ttatatttaa accattagta gctcatctag taacactcgt + 14281 taaaaggaga taatgtttat gaaaatttta ataaccactc atacttatct tcctaataaa + 14341 gatggtgttc aatttgttaa tcaatattta gcagaaggat tggttaaaaa gggtcatcaa + 14401 gtaacagtgc tgacctattg ttatccatca cgtacaaggg tacctagaga agtgataaat + 14461 ggtgttagag tcattcgttg gaatgctcga acaagctgta ctttccataa aggagaaaaa + 14521 ttagcttatc aaaatttcat cttaaattcc caatcggatt atgatgtttt agtgaatgtt + 14581 gggacacaga ctgctttaac agattggtta tttccgatat tttctcagat aacaattcca + 14641 aaagtcttat atattcattc gatatgggat ttcaactggc tgcattggca tagacaatca + 14701 ttcaagcgat ttgttgctaa aacttgggca aatgtacgct ggaaatatta ttattggaaa + 14761 cagactgtta tctttaaaca atataatgaa gtaattcagc tacacccaaa agattatagt + 14821 gtggctttct ttaaagaaaa atatgatata gaaagtcaga ttttaggaaa tgccgctgat + 14881 gcttcctttt ttcaaaataa aaacgctatc aaaaagcaat cttacattgt aaatgtttct + 14941 aattttaatg atctaaaaaa tcaaaagaaa gcggttgagt attttttgaa aagcaatctt + 15001 tcaagtgagt ggaagttcgt tttagttggt tcagaaaaga atgattattt acaaagcgta + 15061 caagattttg aaaaagaact ccgaaaccaa ttaggtatca cttctggtaa agaaatagag + 15121 tatcgcatcg gattgtcaag agaagaagtt gtaaaaactg taaaagaagc ctctttttgt + 15181 ttactgacga gtatacggga agcttttcca atttcattaa ttgaagtaat ggcagcagga + 15241 attcctttta tctcttctga tgtaggaatt gtcaactatt tgtctggagg aatcactgct + 15301 tgtagtgatc aagaatttat aagagctatt gaagagtttg ctacttatcc cgaggtcaga + 15361 aatcaatatg gcaaaaaggg gcaaatggaa gcgaaagaac attatcaagt agatgataaa + 15421 gtgaaagagt ttgaaacttt gttacaaaag ttcgtaaagg aagaagaaga ttgaaaaaaa + 15481 tagtattttt gtgtccctat tttgggactt taccacccca tacgcagtta tggttgaatt + 15541 cttgtaaaat gaatccgtct gtaacatggt atctatttac agatgacaag aggacatttg + 15601 attatccgga aaatgtgcaa gttttctata ctactttgga agaaacaaag 
gcgttgtatc + 15661 aaagaaaatt tgactttgag atttctttag agggtgctta taaactagga gattataagc + 15721 ctttattcgg ctatctttat gaggaaatga tacaagagtt tgatgcttgg ggacatattg + 15781 atgtttatga tgaaatctat ggagatattc gtgcatttgt aacagatgag ttattagata + 15841 aatacgataa attgatgttt tttggacata tgggtattta tagaaattct cctgaagtta + 15901 atcgcagatt taaattatcg tctgatttgg atcgtactta tcaagaaata ttttcttcat + 15961 cacaatttta taattttgaa gaatatgttg caggaagtat cactcgtgtt tatcaaaaaa + 16021 atggattccc aataggaaga ttagataaag tgattgcaga tctttctggt ttaagttatc + 16081 atttccgacg tgggtattat tcagatgatt ttgagacatt tacctattta ccaaatctac + 16141 ctatgatttt ttcttgggaa gatggaaaaa cttattgtta ttcggtacaa aacaatcaag + 16201 tgcaaaaaaa tgagttcttg tatgtacact ttaagcgtag aaaaatgatt cagtctattt + 16261 caaatgatgt ttctgcttat ttaatcgttc caaatggttt tgttgagatg cctaaagaga + 16321 taactgttga tttgattcaa aaatatagtc agaaaaaatt attttatcca gtctattttc + 16381 aggaaaagtg gaaaggtgtc aaacgattat tgaagaaaat agggaggtca gaatgaagga + 16441 cattttaaaa aagttgatac aacaattacc ggataaacta tttctacaaa ttaaatacta + 16501 ctacgttttt aaaaaagaaa ttaaatttac agaatcctaa aacctttaat aaaaaaacac + 16561 aatgattaaa attatataat cggaaacctt tttatacaat tttagcggat aaaattttag + 16621 tgaagaacta tattgcccat atacttgggg aagaaaatat tattccgact ctgggtgttt + 16681 ataatcgttt tgatgagatt cattttgttt cgcaggaagt ctattgaaga atttgtaaca + 16741 gatgagtcga aacgagaatt aaaggaatat aagattgttt tctttatact gttcctaagt + 16801 tttttcaatt agattataac cgctttacaa atcataagag aaatatttat gataccaact + 16861 agaatcagca ggactttatt tatgcttacc catcaagtaa agataagata atagatagtc + 16921 ccgctggact tactgcaata ctcgagtttg cgagtaaatt atcaaaagat attccatttt + 16981 tgaggtgcga tttttatatt gtgaatgata aaatattatt tgaagagatt acgttttttc + 17041 cagaatcagg ttttggaaaa tttagtccag agcattataa tttagagttt ggaaaggata + 17101 ttactttact ggagaagcaa gatggaaaca aaagaaaaac gtttagtgaa taatacgatt + 17161 atttttacaa ttggaagttt aggttcaaaa tttatacagt ttttgttagt acctttatat + 17221 acctatactt taacagctgc tcagtttggg attaccgaaa ttttattaac 
cgctgtgaat + 17281 cttttaatac ctgtattttc tatttccatt gctgatggat tattaagatt tggattagat + 17341 aagaccttaa gaagagaaaa tgtcttgaaa tcagctttta tcatttcgat acttgggact + 17401 attttatcca ttatttcgat tccaattttt tcgctctatc ctactttgtc agagtggatg + 17461 gtttatttta tcatcatttt gaacttgaga atgtatcggg atgtttttgc gattcaattg + 17521 aaagttgaag ggaaaaatac attatttgct tgcgatagta tgatttatac atttgtttta + 17581 tctttagcga gtattgtctt tctagttcct ttttctttag gcatttcagg ttattttttc + 17641 gcttatattg tcagtaatgg aatttccatt ttctttatct tatttttcgg aggagtctgg + 17701 aaaagtttta ctagcggaag atttgaaaaa caattgatga tacaactatt gaaatattca + 17761 gcacccatga ttttaaatgg tattgcatgg tggattacaa atgcctcaga tcggtttatg + 17821 ttgcaatggt ttatggatga tagagcggta ggtttgtatg gtgttgttgc aaagttaccc + 17881 ttattaatcg gaacgtttac tggagtattt aatcaggcat ggattatttc agcagtagaa + 17941 gagtttgaag aagaaaatga agaatggttt tatcaaaaag tttttcacca atattatgca + 18001 gcactctttt taagtgtttc agtatttttg cttctacttc aaccatttat gaaagtatat + 18061 gttagtccaa gcttttatga agcatggcaa tatgctccgt ttttattatt gtcaagtgta + 18121 gtttcaggaa tcgccgcatt tatgacaggt ttttatgttg cgcaaaagaa aaatttgaat + 18181 attatataca cgacgattgc tggtgctttt gcgaatattt tgttaaatgc gatgtttatt + 18241 cctatgcttg gagtattagg cgcttccatt gcgacctttc tatcatggtt tgttattgca + 18301 atctatcgta tgaaagatgt tgaaaacttt gcttgttttc cattagataa aaaagttttt + 18361 tggtatttat ttctattatg tattcagacc attacgatga cttttctgcc aatccttggc + 18421 attgtttttt cagtcgtatt gattccttat ttcttttacc aagaacagga atttctagca + 18481 gttttatttg ataaaggaag gaaaaaagta tgttcattca aaaaatcaaa aagataataa + 18541 gagtattttt aaggaaatct ttagtaaaag attatcgaca aagaattcaa aataaagagt + 18601 ttactcttat tacttctaat tgtgtgggtg gactgattag tcatgatttg ggtctacaat + 18661 ttcgttctcc cactatcaat atgtatatag aagcagcaga ctttattcag ttttgttcac + 18721 atttagaacg ctatttaaaa gaagacttat cttttattga agtaaatcaa gatggacatt + 18781 ttgtagctct ttgtggggat ataaaaattt atattgttca ttataatagc tttgaagagt + 18841 ttgctaaaaa atggtctgaa cgtgccaaaa gagtagattt tgatcaatta 
tatcttatga + 18901 tgtctgaacg agatggctgt cgttatgaag atattgtgaa gtttgatacg ttaccctata + 18961 agaataaagt aatttttaca agtaaaaaga tgccagaaat tcaatccgct ttttatatac + 19021 caggtattga aacaaaaaat aatcaaaaac ataaggtgaa atcagtaaca acttatctta + 19081 actcctttac aggaaaacga tatatagatt tattcgactt tgtagagttt ttgaatacag + 19141 gaaggaaaca attaagtaag tatgaaaagt aagataatat taaaaaataa aacaattctt + 19201 gttacaggag cagctggctt tattggtgct aatcttgtca tgagtttatt acaagaagaa + 19261 aatccattac agattattgg aatagataat ttgaatgatt attatgatgt ttctttaaaa + 19321 gagtatcgtt tatcaacaat tcaagaggag tgtcaatcat ctttaaataa aaaatgggta + 19381 tttatcaaag gagatattgc tgattctgat ttgatggaag aaatttttga gacgtataga + 19441 cctcaaattg tagtgaattt ggcagcacaa gcaggtgttc gttattctat cactaatcct + 19501 gatgtttata tgaaaagtaa tatcattgga tttcatacta ttcttgaaaa atgtagaaag + 19561 tatcaagaaa atattgaaca tttagtttat gcatcatcct cttctgttta tggtggaaat + 19621 acaaaaattc ctttttctga attagatgca gtagacaatc ctgtttcttt atatgcagtt + 19681 acgaagaaaa caaatgaatt agaagcacat gcgtattcaa aattgtacaa tattccaaca + 19741 acaggcctga gattttttac agtttatgga ccagctggaa gacctgatat ggcttatttt + 19801 agttttacaa agcaattaat tgataaaaag ccaattgaaa ttttcaatta tgggaattgt + 19861 caacgtgatt ttacttatat tgacgatatt gttgaaggcg ttaaaagagt gatgactgga + 19921 gctcctcaaa aagaaattgg agaagatggg ttaccaattc ctccttatgc tatctataat + 19981 attggaaatc accaaccaga aaatttattg aattttgtcg aaatcttgca agaaaaattg + 20041 atagctgctt ctattttacc agaagattat gatttctcat ctgctcagaa acttgttcca + 20101 atgcaagctg gtgatgtagt tgcaacctat gcagatataa gtctattgga gaaggatttt + 20161 aatttcaaac ctaagactag tcttagaaat ggcttgagaa attttgcaga atggtataga + 20221 aatttttatc aaaggggtga atagaatgaa aattactgta gtaggaatgg gatatgtcgg + 20281 attgtccttg gcggtattat tagcgcaaca tcatgaagta acagcgttag atattattga + 20341 taaaaaaatt caactcatca atgagaaaaa atctccaatt caagatgagt atattgaaca + 20401 atacttttta gaaaaaaatc ttcatttaag cgcaacaaca aacgaagtag aggcgtataa + 20461 agatgcggaa atgattatta tagctgctcc tacagattat gatacacaca 
aaaatttctt + 20521 tgatacatct gccgtagaac aagtaatcga aaatattatt tctatgaata acgaggcttt + 20581 aattgtcatt aaatcaactg ttcctgttgg ctatacggag tcgattcgag aaaaatatgg + 20641 taaaaagaat atactgttta gcccagaatt tcttcgtgaa gcaaatggat tgtatgataa + 20701 tctttatcct aatcgaatta tcgtaggtac agatttgaat gatggagcat tagtttctaa + 20761 agcacatgaa tttgtgtctt tattacaaga aggtgctctc aaagagaata ttgatacttt + 20821 aatcatggga ttttctgaag cagaagctgt gaaattattt tccaatgctt atctggcttt + 20881 aagagtgtct tattttaatg agttggatac ttatgctgaa ctgaaaggat tgaatacgaa + 20941 agccattatt gatggagtag gattggatcc tagaattggt cagttttata acaatccatc + 21001 ctttggttat ggtggttact gtttaccaaa ggatagtaag caactgttgt caaattatca + 21061 tgatgttcct gaaaatatta tttcagcaat tgtttctagt aatgaaactc gtaaaaaatt + 21121 tattgcagaa cgtattcttg aaatagtcgg agctaatcat attgatgaat actataattt + 21181 gaagcaggaa atcgttgtag gtatttatcg tttagtcatg aaaaaaggtt cggataattt + 21241 tagacattct tctatccaag gaattataaa gagactaaaa gcgaatggag tgacattaat + 21301 gatctatgaa ccttcacttc cagatggaca attatttttt ggaagtgaag ttgttcatga + 21361 ttttccaaaa tttaaagaaa aaagccacct tattgtagcc aatcgttttg atgaaacatt + 21421 aatggatgta aaggataaag tatatacaag ggatttgttt ggaagagatt aagggagata + 21481 ggttttgaac aagttctatt cccaaaaaat cacaccgtta ctatcttcga ataaattaaa + 21541 agcaaagcaa gtgattgata gaaaatcggc tctttgtcaa ctgtagtggg ttgaagtcag + 21601 ctaagctcga gaaaggacaa attttgtcct ttcttttttg atattcagag cgataaaaat + 21661 ccgttttttg aagttttcaa agttccgaaa accaaaggca ttgcgcttga taagtttgat + 21721 gagattattg gtcgcttcca atttggcgtt tgaatagggt agttgaaggg cgttgacgat + 21781 tttctctttg tcctttagaa aggttttaaa gacagtctga aaaagaggat gaacctgctt + 21841 aagattgtcc tcaataagtc cgaaaaattt ctctggttcc ttattctgaa agtgaaacag + 21901 caagagttga tagagctgat agtgatgttt caagtcttgt gaatagctca aaagcttgtc + 21961 taaaatctct ttattggtta aatgcatacg aaaagtaggg cgataaaaat gtttatcgct + 22021 gagtttacga ctatcctgtt gtatgagctt ccagtagcgc ttgatagcct tgtattcatg + 22081 agactatcga tccaattgat tcatgatttg aacacgcaca cgactcatag 
cacgactaag + 22141 atgttgtaca atgtgaaagc gatcaagaac gattttagca ttcgggagtg aaacagtctg + 22201 ggagactgtt tcagcctgag cctagaaatt tgaaagcgag gctgtttagc taagtcatag + 22261 taaggactaa acatatccat agtaataatt ttgacgcgac atcggacaac tctatcgtag + 22321 cgaagaaagt gatttcgaat gatagcttgt gttctaccct caagaacagt gatgatatcg + 22381 agcttttcaa aatcttgcgc aatgaagctc atctccatct cccgattgaa acagtcactc + 22441 cccggactgt ttcaacgtcc caagacataa tctcaggaag acgcgaaaaa tcatgtttaa + 22501 agtgaaaatc attgagctta cgaataacag ttgaagttga gatggaaagc tgatgggcaa + 22561 tatcagtcat agaaatcttt tcaattaact tttgagcaat cttttggttg atgatacgag + 22621 ggatttggtg attcttcttg acgatagaag tttcagcgac catcattttt gaacagtgat + 22681 agcacttgaa tcgacgcttt ctaaggagaa ttctagtagg cataccagtc gtttcaagat + 22741 aaggaatttt agaaggtttt tgaaagtcat atttcttcat ttgacttccg cactcagggc + 22801 aagatggggc gtcgtagtcc agtttggcga tgatttcctt gtgtgtatcc ttattgatga + 22861 tgtctaaaat ctggatatta gggtctttaa tgtctagtaa ttttgtgata aaatgtaatt + 22921 gttccatatg aatctttcta atgagttgtt tgatcgcttt tcattataga tcttatggga + 22981 ctttttttct acacaaaaat aggctccata atatccatag ggaatttacc cactacaaat + 23041 attatagagc cagaaaatca cctgcttttt gtatcaatgt tttttcacaa aatctaaaat + 23101 ataatggatt gaatttggaa tagaacacta tggtttctaa agcattgtta gaaattatag + 23161 tcaattgaaa caagagcagg acaaaagagc ctcgtaaaag gtattgcaac ttggtaatac + 23221 ctttttgatg tacgacgggc atgtcgtata tctgaggtgt aagtcctcgg tgggcacctg + 23281 ctaccggtga acccaatagc gattcccaag cctgactatc gtgaggtagc agggagagga + 23341 agggatagcg aaatcgtggc tctacgaaca ggaacgtgat agtaaggcgt atatagcgga + 23401 taaggaggtt tcaaactcta aagtccaaaa aggtagtcgt aacctatatg tgtaaatcac + 23461 gagagtaatt gaattcggac taaggtttgt gtgaaaaaga taaatctttc tagagtctaa + 23521 agactctgcg tcagatttcc tattttcact gtaacctttt aacgtcctca tatcttgtat + 23581 aaacgaggaa agatgtacaa cttatcccgt gaggtttcat gggcgctgaa agcgtagtaa + 23641 caacgaatca tgagaagtca gccgagccca tagtagtgag gaaacttctg tagtggaagt + 23701 ggagcgaagg ggtgaatact caaacagtct ggggagagac tgtttgaggt 
ctgtcgctag + 23761 aaagagaaaa cgacagatcg aagtaatcct acttcacttg tgtctgtaaa atgagtggtc + 23821 tgatagaact ggactttgac acgtaatgac tagatgaagg ttcaccaata taagatgtcc + 23881 ctcaggcacc aaaacaagaa aggaatacgc acatgtcaaa actgctagat aagatattat + 23941 cacgcgaaaa tatgctggaa gcctacaatc aagtaaaatc caataaaggc tcagctggga + 24001 ttgatggaat gactatcgaa gagatggata attatctcag acaaaactgg cgcttgacta + 24061 aggaactgat aaaacagaga aaatataagc ctcaaccagt tcttaaagtt gagataccta + 24121 aaccagacgg aggcatccgt caactaggaa ttccaacagt tatggataga atgattcaac + 24181 aggccattgt ccaagtcatg agccccattt gtgaacccca tttctcagat acgagttatg + 24241 atttcagacc aaataggtca tgtgaaaaag ccatcatgaa gctcttagaa tacttaaatg + 24301 acggctatga gtggatagtg gatatagacc tagagaaatt tttcgataca gttcctcaag + 24361 atagattgat gtccttagta cataacatta tcgaagacgg agatacggaa tccttgattc + 24421 gtaagtatct tcattcaggt gttatcatta atggtcaacg ttataaaaca ctagttggta + 24481 caccacaggg aggaaattta tctcctctct tatctaatat catgcttaat gaattggaca + 24541 aggaattaga aaagagggga cttcgatttg tgcgctacgc agatgattgt gtgattacgg + 24601 tcggaagcga ggcagcctct aagcgtgtga tgtattcagt cagtcgtttt attgagaaac + 24661 ggctaggttt gaaagtaaac atgaccaaga ctaagattac cagaccaaga gagttgaaat + 24721 atctaggttt tgggttctgg aaatcatcag atggttggaa aagccgtcca catcaagata + 24781 gtgttcggag atttaagttt aaattgaaga aactaacaca gaggaaatgg agtatagacc + 24841 taacaagacg tattgagcaa ctgaatttgt ctattcgagg atggataaac tatttctcat + 24901 tgggaaatat gaaaagtata gtcgccagca tagatgagcg cttgcgtact cgcctacgag + 24961 tgattatctg gaagcaatgg aagaagaaat cgagacgatt atggggattg cttaagttag + 25021 gagttcctaa atggatagca gataaggtat ctggctgggg cgaccattat caattagtag + 25081 ctcagaagtc ggtacttaaa cgtgctatat caaaaccagt cctggaaaaa cgtggactgg + 25141 tttcgtgttt ggattattac cttgaacgac atgcgttaaa agttagttga accgccgtat + 25201 gccgaacggc acgtacggtg gtgtgagagg ggctagagat tatcccctac tctatgtgct + 25261 ttttgatatg agcccatgtt ttctcaatag gattgtactc aggtgagtag ggaggaagag + 25321 gtaaaagttt atgcccaaac tctttgcata aaagttctag cttccccatt 
ctatggaatc + 25381 ttgcattatc cataataata accgatggtg tggttaatgt tggtaagaga aacttctgaa + 25441 accaagcttc aaaaaagtcg ctcgtcatca tctcttcgta agtcattgga gcgattaact + 25501 caccatttgt tagacctgca accaaagaaa tcctctgata tcttcttcca gatactttgc + 25561 ctcttcttaa ctgacctttt aatgagcgac tatattctcg ataaaaataa gtatcgaatc + 25621 ctgtttcatc aatctaaaca ggtgataggt gctttaaact attaaaattc ttaagaaata + 25681 aggctacttt ttctgggtct tgttcatagt aggtgtggtt ctttttttcg agtgtagtcc + 25741 atagctttga gcgcatagtg gatggtagtt ggatgacagc caaattcaga agctatttca + 25801 gtcaaataag cgtctggatt gtcagtaaga tagtttttaa gtctatctct atcaactttt + 25861 cttggttttg ttccttttac ttggtggttt agctctcctg ttttctcttt tagctttaac + 25921 cagccataaa tagtattacg tgagatttgg aaaacgtgtg atgcttctgt tatactacct + 25981 gttcgctcac aataagagag aactttttta cgaaaatcta ttgaatatgc cataagaaga + 26041 ttataccaca ttgtgtacta tttttggttc attttactat aatttaaaat tccctcatcg + 26101 atttgttcac attctattgc aatcaactgt aaatatgctt ttcagaatat atcaaatata + 26161 acaaatataa caaataacta aaagttctat aatagactcc ctgcgaaaca aaatatggta + 26221 tagtagttct atgaatgatg aagcaagtaa acaactaacc gatgcacgat ttaagcgtct + 26281 tgttggtgtt cagcgtacca cttttgaaga gatgttagct gtattaaaaa cagcttatca + 26341 acttaaacac gcaaaaggtg gacgaaaacc taaattaagc ctagaagacc ttcttatggc + 26401 cactcttcaa tagtgcgaga atatcgaact tatgaagaaa ttgcggctga ttttggtatt + 26461 cacgaaagca acttaatccg tcggagccaa tgggttgaag taactcttgt tcaaagtggt + 26521 tttacgattt caagaactcc tctcagttct gaggacacgg taatgattga tgcgacagaa + 26581 gtaaaaatca atcgccctaa aaaaagaatt agcgaattat tctggtaaaa agaaatgcca + 26641 cgctatgaag tctcaggcga ttgtcacaag tcaagggaga attgtttctt tggatatcac + 26701 tgtgaactat tgtcatgata tgaagttgtt caaaatgagt tgcagaaata tcggacaagc + 26761 tggtaaaatc ttggccgaca gtggttatca agggctcatg aagatatatc ctcaagcaca + 26821 aactccacgt aaatccagca aactcaagcc gctaacagct gaagataaag cctgtaacca + 26881 tgcgctatct aaggagagaa gcaaggttga gaacatcttt gccaaagcat agtatattga + 26941 aactagaata gtacacctct acttctaaaa cattgttaga aatcgatttg 
actgccctga + 27001 tcgattcgtc ctattcttgt ttcattttga tataaaaacg tttaaaatgt tttcaacaac + 27061 ttatcgaaat catcgtaaac gcttcggatt acgaatgaat ttgattgctg ctattatcaa + 27121 tcatgaacta ggattctagt tttgcaggaa gtttaatgaa gttagccacc cagccctcct + 27181 aaaaattaga tggttcaact agctgaaagc tcttgtaggc ataagaaaac acctctgtgt + 27241 tatacttgtt gttcaaccac aaacacaaga aaggcacaga aatgcaagac aattatacta + 27301 caaaaggtaa acatttgaca atcgatagcc gtcgcttaat cgaaagatgg aaaaaagaag + 27361 gaaaatcaaa tagagaaatt gcctctctac ttggaaaagc tcctcaaact atccacactg + 27421 aaatcaagcg taggacagtc cgaaaatgtc ttggaaaagg gcgcttcaaa gaggtttatt + 27481 ctgccgacta tgctcaacag tcttatgaaa ataatcgcaa gcactcggtc aagagatcaa + 27541 gcgtgaccaa ggaactaaag gaaaagattc tccactatca taaccaaaaa tttttgcctg + 27601 aaatgatggt tatggctaaa ggggttaacg tgggaatttc aaccatttac tattggattc + 27661 atcatggaaa attgggatta agcaaatagg atctgcttta ccctagaaaa ggaaaagcgc + 27721 ttaagaaaca ggctagcacc aactttaaac ctgctggtca atccatcgaa cagcggcctg + 27781 aagctatcaa tcttcgcttg gagaatgggc attatgagat tgatacggtt ctacttacga + 27841 gatcgaaaaa ctactgcttg cttgtcttga cggatcgaaa gagtagacat cagatcatcc + 27901 gattgattcc aaataaaagt gctgaggtgg tcaatcaggc tctaaaactc atcttaaaac + 27961 aacacaagat tctttccatc acggcagata atggaacgga attcaatcgc ttgtttgata + 28021 tattttctga ggagcacatc tattatgcgc acccctatgc ctcttgggaa aggggaacta + 28081 atgagaatca caacaggctc attcgtagat agttacctaa gggaaccaag aaaatgactc + 28141 ccaaagaagt cgcattcatc gaaaagtgga ttaacaacta tcctaaaaaa tgcttggact + 28201 acaagtcacc cagagaagac ttctggatgg ctaacttgaa cttgaaattt agctataaca + 28261 aataactctt aaaattctga aaattctgtt gacaactttc tgaaaagagt ctataatgga + 28321 gagaaagttt taaaggagaa aatgatgaaa agttcaaaac tacttgccct tgcgggcgtg + 28381 acattattg +// + diff --git a/public/res/serotype_genbank/serotype_27.gb b/public/res/serotype_genbank/serotype_27.gb new file mode 100644 index 0000000..222ea49 --- /dev/null +++ b/public/res/serotype_genbank/serotype_27.gb @@ -0,0 +1,943 @@ +LOCUS CR931691 20135 bp DNA linear 
BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain nr. 34371 (serotype 27). +ACCESSION CR931691 +VERSION CR931691.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 20135) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 20135) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..20135 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="nr. 
34371" + /db_xref="taxon:1313" + gene <1..33 + /gene="dexB" + /locus_tag="SPC27_0001" + CDS <1..33 + /gene="dexB" + /locus_tag="SPC27_0001" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33998.1" + /db_xref="UniProtKB/TrEMBL:Q4JZU9" + /translation="PWDAFCVELL" + gene 192..362 + /gene="aliB" + /locus_tag="SPC27_0002" + /pseudo + CDS 192..362 + /gene="aliB" + /locus_tag="SPC27_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(361..881) + /gene="tnp" + /locus_tag="SPC27_0003" + /pseudo + CDS complement(join(361..681,674..802,810..881)) + /gene="tnp" + /locus_tag="SPC27_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase (fragment)" + gene 1096..2550 + /gene="wzg" + /locus_tag="SPC27_0004" + CDS 1096..2550 + /gene="wzg" + /locus_tag="SPC27_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI34001.1" + /db_xref="GOA:Q4K048" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K048" + /translation="MLIMSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNI + LAFRYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGL + TNRLNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNT + DLTVDQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKV + EAPKTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPI + ADGGNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVH + NDQEFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKL + TSTEALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRMDL + PSYAMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1096..1221 + /gene="wzg" + /locus_tag="SPC27_0004" + /note="Signal peptide predicted for SPC1360 by SignalP 2.0 + HMM (Signal peptide probability 0.991) with cleavage site + probability 0.537 between residues 42 and 43" + misc_feature 1309..1656 + 
/gene="wzg" + /locus_tag="SPC27_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 9.8e-65" + misc_feature 1834..2277 + /gene="wzg" + /locus_tag="SPC27_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 5.7e-70" + gene 2552..3283 + /gene="wzh" + /locus_tag="SPC27_0005" + CDS 2552..3283 + /gene="wzh" + /locus_tag="SPC27_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34002.1" + /db_xref="GOA:Q4K047" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K047" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNTLYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEKDLVHIIASDMHNLDGRPPHMAEAYDLVT + QKHGEAKAQELFIDNPRKIVIDQLI" + misc_feature 2555..3163 + /gene="wzh" + /locus_tag="SPC27_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 3.1e-36" + gene 3289..3984 + /gene="wzd" + /locus_tag="SPC27_0006" + CDS 3289..3984 + /gene="wzd" + /locus_tag="SPC27_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34003.1" + /db_xref="GOA:Q4K046" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K046" + /translation="MMKEQNTTEIDVFQLVKTLWKRKLMILLVALVTGAGAFVYSTFI + VRPEYTSVTRIYIVNRNQGDKAGLTNQDLQAGTYLVKDYREIILSQDVLEKVAANLKL + DMPAKTLTSKVQVTVPADTRVVSISVKDKQPEEASRIANSLREVATEKIVAVTRVSDV + TTLEEARPATTPSSPDVRRNSMFGFLGGAAVTAIAVFLIELLDTRVKRPEDVEDVLQI + PLLGIIPDLDKMK" + misc_feature 3310..3726 + /gene="wzd" + /locus_tag="SPC27_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 1.1e-53" + misc_feature 3832..3909 + /gene="wzd" + /locus_tag="SPC27_0006" + /note="PS00217 Sugar 
transport proteins signature 2." + gene 3994..4695 + /gene="wze" + /locus_tag="SPC27_0007" + CDS 3994..4695 + /gene="wze" + /locus_tag="SPC27_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34004.1" + /db_xref="GOA:Q4K045" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K045" + /translation="MPTLEISQAKLDFVKKVEENYNALCTNLQLSGDDLKVFSITSVK + LGEGKSMTSTSIAWTFARAGYKTLLIDGDIRNSVMLGVFKARDKITGLTEFLSGTTDL + SQGLCDTNIENLFVIPAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRKCDASILVTEAGGVNRRDIQKAKEQLEHTGKPFLGVVLNKFDTSVDKYGSY + GKYGDYEKNKKYVEG" + gene 4698..6065 + /gene="wchA" + /locus_tag="SPC27_0008" + CDS 4698..6065 + /gene="wchA" + /locus_tag="SPC27_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI34005.1" + /db_xref="GOA:Q4K044" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K044" + /translation="MNGKIVKSSLAIIQSFLVILLTYLLSAVREAEIVSTTAIALYIL + HYFVFYISDYGQDFFKRGYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGVIYF + LTLHALLVYVLNLFIKWYWKRAYPNFKGSKKILLLTATYRVEKVLDRLIESNEVVGEL + VAVSVLDKPDFQHDCLEVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + IDVTVNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHVIAKRIIDIVGALVGLIL + CGLVSIVLVPLIRKDGGSTIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVLM + KDGAK" + misc_feature 4698..4790 + /gene="wchA" + /locus_tag="SPC27_0008" + /note="Signal peptide predicted for SPC1364 by SignalP 2.0 + HMM (Signal peptide probability 0.902) with cleavage site + probability 0.355 between residues 31 and 32" + misc_feature 5481..6062 + /gene="wchA" + /locus_tag="SPC27_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + 
transferase, score 7.9e-158" + gene 6069..7268 + /gene="wchF" + /locus_tag="SPC27_0009" + CDS 6069..7268 + /gene="wchF" + /locus_tag="SPC27_0009" + /note="member of homology group 15" + /codon_start=1 + /transl_table=11 + /product="putative rhamnosyl transferase WchF" + /protein_id="CAI34006.1" + /db_xref="GOA:Q4K043" + /db_xref="InterPro:IPR001296" + /db_xref="InterPro:IPR015393" + /db_xref="UniProtKB/TrEMBL:Q4K043" + /translation="MPLSLVRREMKQSVYIIGSKGIPAKYGGFETFVEKLTEYQKDDN + IQYYVACMRENSAKSGFTADTFEYNGAICYNIDVPNIGPSRAIAYDIAAVNKAIELAK + ENKDEAPIFYILACRIGPFISGLKKKIRSIGGRLLVNPDGHEWLRAKWSLSVRKYWKF + SEQLMVKHADLLVCDSKNIEKYIQEDYKQYQPKTVYIAYGTDTTPSSLKSEDAKVRNW + HREKGVSENGYYLVVGRFVPENNYETMIREFMKSNSKKDFVLITNVEQNKFYDQLLKD + TGFDKDPRVKFVGTVYDQELLKYIRENAFAYFHGHEVGGTNPSLLEALASTKLSLLLD + VGFNREVGEDGAIYWKKDELAHVIEEVERFDEGDISELDEKSSQRIADAFTWEKIVTS + YETIFNS" + misc_feature 6711..7205 + /gene="wchF" + /locus_tag="SPC27_0009" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 0.0022" + gene 7451..8479 + /gene="whaK" + /locus_tag="SPC27_0010" + CDS 7451..8479 + /gene="whaK" + /locus_tag="SPC27_0010" + /note="member of homology group 199" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34007.1" + /db_xref="GOA:Q4K042" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K042" + /translation="MIHLSIIVPVYNTAIDKLEQCFQSIKTFMDKNSALNMECVIIDD + GSKGKVSDWCREFSETKADFKFYKKVNEGVSVARNMGISLSKGQYIIFVDSDDLLVSF + NELEQYLLDGKYDLIFSDLATDIQQKHMWKAFEGDSREIDFETVISRIVSDGTLNGPV + CKIIRKNLLDQHHIEFDKTMITGEDLVFLIHILLQKPKMYYISQCTYIYKLDTNTSNN + RLKNCSKVFIKNNVVAYKHMIQLINQFSSNQHKQIFEKRATEIYIKQLFNSLADLLEM + GLLSQELKDYTVQLLSELDKQTVDLIQGQKLSKSNLQLTVLLNKWWLLLAVASRMRIL + YLKIKNSL" + misc_feature 7463..7960 + /gene="whaK" + /locus_tag="SPC27_0010" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 6.8e-23" + gene 8489..9613 + /gene="wzy" + /locus_tag="SPC27_0011" + CDS 8489..9613 + /gene="wzy" + /locus_tag="SPC27_0011" + 
/note="member of homology group 249" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI34008.1" + /db_xref="UniProtKB/TrEMBL:Q4K041" + /translation="MLPYLGVFFASSSLIALSEKIKKNQRLFFVILALALPCMLAGFR + ADHIGTDTGVYLMPTINAATSSHSFSEYLNTSWYRIWRFLSVKDFERGFTLVVYVTTK + LLGAFWTKFILELLMTTPTYLAIKKYGKYPAWLGMMVFYLTTYNSTLNMMRQSIAVAF + TLLGILYFIERNKKGFVTCLLLGCSFHTSGLVLLMIAAMFYFIKPNQQLDTLFSRRVE + LQKVALILVLGIASLFSLGVVSSILKIIGLGSYVNYIGGTFHFVQNQFLSRFPIMLLM + LISWYKWNEGESYARFFIVMFILEVLCLQLTSVNVYSGRIAYFFSSMNVLTYPSLCYC + RPQKGRRFFMISALLVYLFFYWWFYYGIQGIDATIPYMMI" + misc_feature 8489..8623 + /gene="wzy" + /locus_tag="SPC27_0011" + /note="Signal peptide predicted for SPC1367 by SignalP 2.0 + HMM (Signal peptide probability 0.877) with cleavage site + probability 0.373 between residues 45 and 46" + gene 9630..10739 + /gene="whaL" + /locus_tag="SPC27_0012" + CDS 9630..10739 + /gene="whaL" + /locus_tag="SPC27_0012" + /note="member of homology group 200" + /codon_start=1 + /transl_table=11 + /product="putative transferase" + /protein_id="CAI34009.1" + /db_xref="GOA:Q4K040" + /db_xref="InterPro:IPR007345" + /db_xref="UniProtKB/TrEMBL:Q4K040" + /translation="MEIFVRGFFHVNLGDDLFLYILAKRYPNHNFHVILNEEYTKVFR + DEKNIIVHPYKKIRRGLDRFLINCNKDYYVEIEKKCQLNVVIGGSIFQENVDDVVARE + RLARMPQLNPTYILGANFGPYVTEEYRLLVKDYLTKSEDVCFRDEWSKQKFPELTKVR + FAPDIVFGIQSIIPKVNEKKKRIFVSVVDCFKKAGGIKKYAPNYEAFILRCINYYNEQ + GYEIILSSFCKMEGDKEVIDRILEKLPSDKQSEISILNYNGENWREVVAAIQQSEKII + ASRFHSMILGMVFGVSVLPIAYNKKFKQFLANFDLSHYCISVSDIDHQVPKNLNYLLF + DGNTDIAEQANEHFMKLDERLMRGTLWNNEYYKNK" + gene 10717..12207 + /gene="wzx" + /locus_tag="SPC27_0013" + CDS 10717..12207 + /gene="wzx" + /locus_tag="SPC27_0013" + /note="member of homology group 250" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI34010.1" + /db_xref="InterPro:IPR004268" + /db_xref="UniProtKB/TrEMBL:Q4K039" + /translation="MSTTKISNQNKKTAIQLTLMIILTCLSQIVALYKSRFTAVNFGA + 
TDYMDAYNFSLEIATFIFSFMTGGVTTVIIPAYVKKNSSKAVNTFITLTYGCILLLSV + GIIIFRTPLLSSLTVRGTDFIAIASGFLIVSFVIQGILSLLAVTTAYYQSEDRYNIPK + IIVLIVNMIVLTILLLGVIDNIYLYFSLLIAGSVLNLILDFIVAIKIGFRYKFCFDFK + NPEFKNMLIVFLPTVLSSGVYKLHTMVDTTIATNLAEGQATILTYASQIITMVNTVIV + GNLTVYVYPKIIANLKSKNTSKYFWDYCILFHAVLAIIIAGFINVGFEGLSLLFVGGK + FTLENANVLYMCACIYISGQQFNVIRDLIYRYFYANSNTKETFKNSVIVSIINIILSL + LLVSLFRVYGIVLGTVLSNMISLALIYIRFKKNFGIDVKISYISIEIIKNILAMVGSV + IVIHWLKTFLAINNNILSIIVYGTGTVIVYLVLILLLQTKIRHIKL" + misc_feature 10717..10815 + /gene="wzx" + /locus_tag="SPC27_0013" + /note="Signal peptide predicted for SPC1369 by SignalP 2.0 + HMM (Signal peptide probability 0.853) with cleavage site + probability 0.554 between residues 33 and 34" + misc_feature 10834..12138 + /gene="wzx" + /locus_tag="SPC27_0013" + /note="HMMPfam hit to PF03023, MviN-like protein, score + 1.6e-11" + gene 12333..13289 + /gene="wcyS" + /locus_tag="SPC27_0014" + CDS 12333..13289 + /gene="wcyS" + /locus_tag="SPC27_0014" + /note="member of homology group 118" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34011.1" + /db_xref="GOA:Q4K038" + /db_xref="InterPro:IPR008441" + /db_xref="UniProtKB/TrEMBL:Q4K038" + /translation="MSIFATLIKKKGAEIFKNLIQSRVLFRTIAILPLVGFSKKSLEI + VRLNNSNIVLSRLRRNYRSAIQKFREENQYSLVYDQQDSSTSSKIWICWFQGLDVAPH + VVRECIASVRKQLADREVVVLTDDNYHHYVTFPDHIKAKIDQGIISKTHLSDLLRLEL + LTKYGGTWIDGTVFCSSSDIPVYMLDSDLFLFQNLKPGLDGQALAISTWFMTAAKLHH + PLLELTKDLLYLYWKKNNTMVDYFLIHHFFQLSIEEFPEYWSRVVPFNNSTPHILQLR + LFEEFDETMYRHILEQTPFHKLTYKFEGEKSSIPNTYYKHLF" + misc_feature 12468..13283 + /gene="wcyS" + /locus_tag="SPC27_0014" + /note="HMMPfam hit to PF05704, Capsular polysaccharide + synthesis protein, score 1.4e-64" + gene 13366..14187 + /gene="wcrN" + /locus_tag="SPC27_0015" + CDS 13366..14187 + /gene="wcrN" + /locus_tag="SPC27_0015" + /note="member of homology group 119" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="CAI34012.1" + 
/db_xref="GOA:Q4K037" + /db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4K037" + /translation="MKELTTREMQEVSLEILHTIASICEKQHLRYALIYGTLIGAVRH + KGYIPWDDDVDIMMPRPDYDSLLQYLKENIADYPYLKVFNREECPEYPYMITRISDQR + YRIEMENEKPFGLGVFIDIYPYDGLGDTKQESVAFGLKGDRLSSFCYQATREHFAIET + TISAFRKFIKYPVYLFSKMIGKNYFQSQLDKLARVKDYDNSNFVGCVIWLSWGEKDIF + PREWFDETILVPFEKYEFRIPKEFDKILRHEYGDYMILPPEKDRVGHHYFKAYKK" + misc_feature 13435..14118 + /gene="wcrN" + /locus_tag="SPC27_0015" + /note="HMMPfam hit to PF04991, LICD Protein Family, score + 7.3e-42" + gene 14347..14613 + /gene="HG270" + /locus_tag="SPC27_0016" + /pseudo + CDS 14347..14613 + /gene="HG270" + /locus_tag="SPC27_0016" + /note="member of homology group 270" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative transferase (fragment)" + misc_feature 14350..14403 + /gene="HG270" + /locus_tag="SPC27_0016" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 0.18" + /pseudo + misc_feature 14434..14487 + /gene="HG270" + /locus_tag="SPC27_0016" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 0.26" + /pseudo + misc_feature 14488..14541 + /gene="HG270" + /locus_tag="SPC27_0016" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 0.019" + /pseudo + gene 15021..15953 + /gene="rmlA" + /locus_tag="SPC27_0017" + CDS 15021..15953 + /gene="rmlA" + /locus_tag="SPC27_0017" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI34014.1" + /db_xref="GOA:Q4K036" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q4K036" + /translation="MILVYKHGKIKVQITKKGTPFMKGIILAGGSGTRLYPLTRAASK + QLMPVYDKPMIYYPLSTLMLAGIRDILIISTPQDLHRFQELLQDGSEFGIKLSYAEQP + SPDGLAQAFIIGEEFISDDSVALILGDNIYHGSGLSKMLQKAASKESGATVFGYHVKD + PERFGVVEFDQDMKAISIEEKPEQPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEI + 
TDVNKAYLERGDLSVELMGRGFAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIA + YRMGYISRKDVLTLAQPLKKNEYGQYLLRLIGEA" + misc_feature 15087..15803 + /gene="rmlA" + /locus_tag="SPC27_0017" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 3.2e-120" + gene 15954..16547 + /gene="rmlC" + /locus_tag="SPC27_0018" + CDS 15954..16547 + /gene="rmlC" + /locus_tag="SPC27_0018" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI34015.1" + /db_xref="GOA:Q7BTQ6" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:Q7BTQ6" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKHHPLLKDVKPLKKEDL" + misc_feature 15990..16520 + /gene="rmlC" + /locus_tag="SPC27_0018" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 8.8e-16" + gene 16560..17609 + /gene="rmlB" + /locus_tag="SPC27_0019" + CDS 16560..17609 + /gene="rmlB" + /locus_tag="SPC27_0019" + /EC_number="4.2.1.46" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI34016.1" + /db_xref="GOA:Q4K034" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K034" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPGVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGERPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAAD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 16575..17531 + /gene="rmlB" + /locus_tag="SPC27_0019" + 
/note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.00011" + misc_feature 16578..17318 + /gene="rmlB" + /locus_tag="SPC27_0019" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 3.3e-76" + misc_feature 16581..17393 + /gene="rmlB" + /locus_tag="SPC27_0019" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/iso, score 1.7e-05" + gene 17675..18526 + /gene="rmlD" + /locus_tag="SPC27_0020" + CDS 17675..18526 + /gene="rmlD" + /locus_tag="SPC27_0020" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI34017.1" + /db_xref="GOA:Q4K2P3" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K2P3" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITDAEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVNPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 17675..18523 + /gene="rmlD" + /locus_tag="SPC27_0020" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 5.7e-148" + misc_feature 17678..18319 + /gene="rmlD" + /locus_tag="SPC27_0020" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.0001" + misc_feature 17678..18307 + /gene="rmlD" + /locus_tag="SPC27_0020" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 5.6e-19" + misc_feature 17681..18409 + /gene="rmlD" + /locus_tag="SPC27_0020" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 1.9e-08" + gene order(18602..19555,19566..19784) + /gene="tnp" + /locus_tag="SPC27_0021" + /pseudo + CDS join(18602..19555,19566..19784) + /gene="tnp" + /locus_tag="SPC27_0021" + /note="member of homology group 12" + /pseudo + /codon_start=1 + 
/transl_table=11 + /product="putative IS1670 transposase" + misc_feature 18608..19051 + /gene="tnp" + /locus_tag="SPC27_0021" + /note="HMMPfam hit to PF03050, Transposase IS66 family, + score 0.00049" + /pseudo + gene 19983..>20135 + /gene="aliA" + /locus_tag="SPC27_0022" + CDS 19983..>20135 + /gene="aliA" + /locus_tag="SPC27_0022" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34019.1" + /db_xref="UniProtKB/TrEMBL:Q4K0S2" + /translation="MMKSSKLFALAGVTLLAATTLAACSGSGSSTKGEKTFSYIYETD + PDNLNYL" + misc_feature 19983..20069 + /gene="aliA" + /locus_tag="SPC27_0022" + /note="Signal peptide predicted for SPC1381 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.277 between residues 29 and 30" +ORIGIN + 1 ccatgggatg ctttctgtgt ggaattacta taaatatttt ttgcagaaaa atttaaaatt + 61 gaaatcgtat aaaaacaagg gaggactgta taaaaagcag aaatcctttg ttttttataa + 121 ccaaggttta taaactttca ttctcgaaat tcaattaact ttacaaattc ccactattga + 181 ggagaaagaa gatgaacata aagaagcgtg tccttagtgc aggcctgact tttgcatctg + 241 ttttgctttt agttgcttgc ggccaatcag gttcagatac aaaaacttac tcatcaacct + 301 ttagtggaaa tccaactaca tttaactatc tattagacta ttacgctgat aatatagtta + 361 attgaaacaa gagcaggaca aaagagcctc gtaaaaggta ttgcaacttg gtaatacctt + 421 tttgaggtgc tttttgatat gagcctatgt tttctcaata ggattgtatt caggcgagta + 481 gggaggaaga ggtaaaagtt tatgcccaaa ctcttcgcac aagagttcta gcttccccat + 541 tctatggaat cttacattat ccataataat aaccgatagt gtggttaatg ttggtaagag + 601 aaacttctga aaccaagctt caaaaaagtc gctcgtcatc gtctcttcgt aagtcattgg + 661 agcgattaac tcaccattca tttgttagac ctgcaaccaa agaaatcctc tgatatcttc + 721 ttccagatac tttgcctctt cttaactgac cttttaatga gcgaccatat tctcgataaa + 781 aataagtatc gaatcctgtt tccaatataa acaggtgcta ggtgctttaa actattaaaa + 841 ttcttaagaa atatggctac tttttctggg tcttgttcat aattagattg aaactagaat + 901 agtacacatc tgcttctaaa acattgttag aaaacgattt gactgtcctg aacaatttgt + 961 catgttcttg tttcatttta ctatattttt ggttcgcggg aagtctacta agatacttaa + 1021 agatgcagat 
agtgaaaaaa aggtgtagac attaccgtaa aaaagtgata taatcgtata + 1081 atgttcaatg tataggtgtt aatcatgagt agacgtttta aaaaatcagg ttcacagaaa + 1141 gtgaagcgaa gtgttaatat cgttttgttg actatttatt tattgttagt ttgtttttta + 1201 ttgttcttaa tctttaagta caatatcctt gcttttagat atcttaatct agtggtaact + 1261 gcgttagtcc tactagttgc cttggtaggg ctactcctga ttatctataa aaaagctgaa + 1321 aaatttacta tttttctgtt ggtgttctct atccttgtca gctctgtgtc gctctttgca + 1381 gtacagcagt ttgttggact gaccaatcgt ttaaatgcga cttctaatta ctcagaatat + 1441 tcaatcagtg tcgctgtttt agcagatagt gagatcgaaa atgttacgca actgacgagt + 1501 gtgacagcac cgactgggac tgataatgaa aatattcaaa aactactagc tgatatcaag + 1561 tcaagtcaga ataccgattt gacggtcgac cagagttcgt cttacttggc agcttataag + 1621 agtttgattg caggtgagac taaggccatt gtcttaaata gtgtctttga aaatatcatc + 1681 gagtcagagt atccagacta tgcatcgaag ataaaaaaga tttataccaa gggatttact + 1741 aaaaaagtag aagctcctaa gacgtctaag aatcagtctt tcaatatcta tgttagtgga + 1801 attgacacct atggtcctat tagttcggtg tcgcgatcag atgtcaatat cctgatgact + 1861 gtcaatcgag ataccaagaa aatcctcttg accacaacac cacgtgatgc ctatgtacca + 1921 atcgcagatg gtggaaataa tcaaaaagat aaattaaccc atgcgggcat ttatggagtt + 1981 gattcgtcca ttcacacctt agaaaatctc tatggagtgg atatcaatta ctatgtgcga + 2041 ttgaacttca cttctttctt gaaaatgatt gacttattgg gaggggtaga tgttcataat + 2101 gatcaagagt tttcagctct acatgggaag ttccatttcc cagtagggaa tgtccatcta + 2161 gactctgagc aggctctagg ttttgtacgt gaacgctact cactagcaga tggcgatcgt + 2221 gaccgcgggc gcaatcaaca aaaggtcatt gtggctatcc ttcaaaaatt aacgtcaacc + 2281 gaagcactga aaaattatag tacgatcatt aatagcttgc aagattctat ccaaacaaat + 2341 atgccacttg agactatgat aaatttggtc aatgctcagt tagaaagtgg agggaattat + 2401 aaagtaaatt ctcaagattt aaaaggtaca ggtcggatgg atcttccttc ttatgcaatg + 2461 ccagacagta acctctatgt gatggaaata gatgatagta gtttagctgt agttaaagca + 2521 gctatacagg atgtgatgga aggtagatga aatgatagac atccattcgc atatcgtttt + 2581 tgatgtagat gacggtccca agtcaagaga ggaaagcaag gctctcttgg cagaatccta + 2641 caggcagggg gtgcgaacca ttgtctctac 
ctctcaccgt cgcaagggca tgtttgaaac + 2701 tccggaagag aagatagcag aaaactttct tcaggttcgg gaaattgcaa aagaagtagc + 2761 agatgattta gtcattgctt atggggctga aatttactac acaccagatg ttctggataa + 2821 gctggaaaaa aagcggattc cgaccctcaa tgatagtcgt tatgccttga tagagtttag + 2881 tatgaacact ctttatcgcg atattcatag cgccttgagc aagatcttga tgttgggaat + 2941 tactccagtc attgcccaca tcgaacgcta tgatgctctt gaaaataatg aaaaacgcgt + 3001 tcgggaactg atcgatatgg gttgttacac gcaagtaaat agttcacatg tcctcaaacc + 3061 caaacttttt ggcgaacgtt ataaattcat gaaaaaaaga gctcagtatt ttttagagaa + 3121 ggatttggtt catatcattg caagtgatat gcacaatcta gacggtagac ctcctcatat + 3181 ggcagaagca tatgaccttg ttacccaaaa acacggagaa gcgaaggctc aggaactttt + 3241 tatagacaat cctcgaaaaa ttgtaataga tcaactaatt taggagaaat gatgaaagaa + 3301 caaaacacga cagaaatcga tgtatttcaa ttagttaaaa ccttgtggaa acgcaagcta + 3361 atgattttat tagtggcact tgtgacaggt gcgggggctt ttgtatatag cacttttatt + 3421 gttaggccag aatatacgag tgtcacgcga atttacatag tgaatcgcaa tcaaggagac + 3481 aaggcggggc tgacaaatca ggatttgcaa gcaggaactt atctggtaaa agactaccgt + 3541 gagattatcc tttcgcagga tgtattggaa aaagtagcgg caaatttgaa gttggatatg + 3601 ccagcaaaaa cgttaaccag caaagttcaa gtgactgtac cagctgacac tcgtgtcgtc + 3661 tcaatctctg tcaaggataa acagccagag gaagccagtc gtatcgctaa ttctctacga + 3721 gaagttgcta cagaaaagat cgtcgctgta acgcgagtat ctgatgtaac gacacttgaa + 3781 gaagcgcgac cagctacgac tccctcttct ccagatgttc gacgcaattc catgtttggt + 3841 tttcttggag gagcagccgt aacagcaatt gctgtttttt tgattgagtt gctcgacacc + 3901 cgtgtaaaac gtcctgaaga tgtcgaagat gtactgcaaa ttccactttt agggatcatt + 3961 ccagatttgg acaaaatgaa ataggaggaa attatgccaa cgttagaaat ttcacaggca + 4021 aaattggatt ttgtaaaaaa ggtagaggaa aattataacg ctttgtgcac gaacctacag + 4081 ttaagtggag atgatttgaa agtattttct atcacttctg tgaaactagg agaaggaaaa + 4141 tcaatgactt ccaccagtat cgcttggact tttgcgcgtg caggttacaa aacgctgctg + 4201 attgatggag atattcgcaa ttctgttatg ttaggtgtct ttaaagcaag ggataagatt + 4261 acaggcctga cagaattttt atcaggaact acagacctat cacaagggct 
ttgtgatacc + 4321 aatatcgaaa atctctttgt aattccggct ggctctgtgt caccgaatcc gacagctctt + 4381 cttcaaagta agaatttcag tacaatgctt gaaaccttgc gtaaatattt tgactacatc + 4441 attgtagata ctgctcctgt cggtgtcgtg attgatgcgg ctattattac gcgaaaatgc + 4501 gatgcttcta ttttagtgac ggaggcaggt ggagtaaatc gacgggatat tcaaaaagca + 4561 aaagaacagt tggaacacac agggaagccg tttttgggag ttgtgttgaa taaattcgat + 4621 acttcagtag acaaatacgg ttcttatgga aaatatggag attacgagaa aaataaaaaa + 4681 tatgttgagg gatagagatg aatggaaaaa tagtaaagtc ttcattggcc ataatccaga + 4741 gttttcttgt tattttattg acttatctac ttagtgctgt gagagaagcg gagattgttt + 4801 caacaacagc tattgcactt tatatcctcc attattttgt cttttatatc agtgattatg + 4861 gacaggattt ctttaaaagg ggatatttga ttgaacttgt ccagacattg aaatatatcc + 4921 tattctttgc actagcgatt agtatttcta attttttctt agaggatcga tttagtattt + 4981 ccagacgagg cgtgatttac ttcctcacat tacatgctct cttagtctat gtgctaaacc + 5041 tatttatcaa gtggtattgg aagcgggctt atcccaactt taaaggaagt aagaagattc + 5101 tcctacttac agcaacttat cgtgtcgaaa aggtactgga tagattaata gaatcaaatg + 5161 aggttgttgg ggagttggta gccgtcagtg tcttagataa accagatttt cagcatgatt + 5221 gtttagaagt agtagcagag ggggagatag taaactttgc gactcatgag gtggtcgatg + 5281 aagtctttat caatcttcca agtgaaaaat acaatattgg agagcttgtc tctcagtttg + 5341 aaacgatggg aattgatgta acagtcaatc taaatgcttt tgatcgtagt ttggcacgta + 5401 acaagcaaat tcgtgagatg gcaggattaa acgttgtgac tttttctaca acattttata + 5461 agactagtca tgtaattgct aagcggatta ttgatatcgt gggtgcattg gtagggctga + 5521 tactatgtgg tttagtcagt attgtactgg ttcctttgat tcgaaaggat gggggctcta + 5581 ctatttttgc tcagacgcgt ataggaaaaa atggtcgtca gttcactttt tataagtttc + 5641 gctctatgtg tgtagatgcc gaggcgaaaa aaagagaact catggaacaa aataccatgc + 5701 agggtggaat gtttaaggtg gacgatgatc ctcgtatcac gaaaattggt cgttttatac + 5761 ggaagactag cttggacgag ctaccacagt tttataatgt tctaaaggga gatatgagtt + 5821 tggttggcac acgaccacca acagtggacg agtatgaaca ctatacccca gaacaaaaac + 5881 gtcggctaag ttttaaacct ggtataacag gcttatggca ggtcagtgga cgaagtgaga + 5941 ttaagaattt 
tgatgaagtt gtcaaattag atgtagccta tatagacgat tggacaattt + 6001 ggaaagacat tgaaatttta ttgaagacag ttaaagttgt attgatgaag gatggagcga + 6061 agtgattttt gcccctcagt cttgttagga gagagatgaa acagtcagtt tatatcattg + 6121 gttcaaaggg gattcctgcc aagtatggag gatttgaaac ctttgttgaa aaattaacag + 6181 aatatcaaaa agatgataac atccaatact atgttgcctg catgcgtgaa aattcggcaa + 6241 agtcaggatt tacagcagat acatttgagt acaacggtgc tatttgttac aacattgatg + 6301 tgcctaatat tggtccttct agagccattg cttacgatat tgcagcggtc aataaggcta + 6361 ttgaattggc taaggaaaac aaggacgagg ctcccatttt ttacattcta gcttgtcgta + 6421 tcgggccttt tatttctgga cttaagaaaa aaattcgttc gatcggaggc cgactactgg + 6481 taaatccaga tggccatgag tggctccggg ctaaatggag cctgtcagtt cggaagtatt + 6541 ggaagttttc ggaacagttg atggtcaaac atgcagattt attagtctgt gatagcaaaa + 6601 atatcgaaaa atatatccaa gaggactata aacagtatca gcctaaaacg gtctatatcg + 6661 cttatggcac agatactacc ccctcgagcc tgaaatcaga agatgccaaa gttcgaaact + 6721 ggcatcgtga aaagggagta agcgaaaatg gctattatct agtggtggga cgattcgttc + 6781 ccgaaaacaa ctatgaaacc atgattcgtg aatttatgaa gtctaattct aaaaaagact + 6841 ttgttctcat tacaaatgta gaacaaaata agttttacga tcagttgctc aaggatacag + 6901 gcttcgacaa agatccaaga gtcaaatttg tgggaacagt ctatgaccaa gaattgctca + 6961 agtatatccg tgaaaatgct ttcgcctatt tccatggaca tgaagttggg ggtaccaatc + 7021 catcgcttct tgaagcttta gcatccacta aacttagctt gttgttggat gtcggcttta + 7081 accgtgaagt tggtgaagac ggagccattt attggaaaaa agatgagcta gcgcatgtaa + 7141 tcgaagaagt ggaacgattt gatgaaggtg atatttcgga attagacgaa aagtctagcc + 7201 aacgaattgc ggatgcattt acgtgggaaa agattgtcac tagctatgag acgattttca + 7261 attcgtgaaa cgtattaata gatggtagaa ttatctccta ttgatttttt actattgcgc + 7321 taattcattt actgtatctt gttattgttt caggctttta gtaaatgata cgattggata + 7381 atggttttac gatattattc tggaatgttg tgagagataa gctaatattt ttgaagagaa + 7441 agaggagagt atgatacatt tgagcatcat tgttcctgtt tacaatacag ctatagataa + 7501 attagaacaa tgctttcagt ctatcaaaac ttttatggat aagaatagtg ccttaaatat + 7561 ggaatgtgtt atcattgatg acggttcaaa 
gggtaaggta tctgattggt gtcgagagtt + 7621 ttcagagaca aaggctgatt ttaaatttta taaaaaagtt aacgaaggtg ttagcgtagc + 7681 gagaaatatg gggattagcc tttctaaagg acaatacatt atcttcgttg attcagatga + 7741 tcttcttgtt tcctttaatg agctggagca gtatcttttg gatggcaagt atgaccttat + 7801 ttttagcgat ttagcgactg atatccaaca aaagcatatg tggaaggcgt ttgaaggtga + 7861 ctcacgcgag atcgattttg agacagtaat tagtagaatt gtcagcgatg ggaccttaaa + 7921 tggtcctgtt tgcaagatta tcagaaaaaa tttgttagac caacaccata tagagttcga + 7981 caaaacgatg ataacgggag aagatttggt ttttttaatt catatcttat tacaaaaacc + 8041 taaaatgtat tatatttctc aatgtaccta tatctataaa ttagacacaa atacgtctaa + 8101 caaccgcttg aaaaattgct cgaaagtttt tataaaaaat aatgttgttg cctataaaca + 8161 tatgattcag ttgattaatc aattttccag caatcaacat aaacaaatat ttgaaaaaag + 8221 ggcaacagag atatatataa agcaattatt caattctctt gcagatttgc tagaaatggg + 8281 cttgttgtcg caagagttaa aagactacac agtacagttg ttgtcagagt tggataagca + 8341 gacagtagat ttgattcaag gacaaaaact gtctaaatca aatttgcaat taacagtatt + 8401 actcaacaag tggtggctac tgttagcagt agctagtaga atgaggattc tatacttgaa + 8461 aattaaaaat agcttataag gagtagggat gttaccttat cttggtgtct tttttgcctc + 8521 tagttctttg atagcattgt cagagaaaat aaagaaaaat caaagacttt tttttgttat + 8581 attagcttta gctctcccat gcatgcttgc aggatttaga gcagatcata ttggaactga + 8641 tacaggggtt tacttaatgc cgacgattaa tgcagccacc tcttctcatt ctttttcaga + 8701 atatttgaat actagttggt atagaatttg gcgtttttta tccgtaaaag attttgaacg + 8761 aggtttcaca cttgtagtct atgtaactac aaaattatta ggcgctttct ggacaaagtt + 8821 tattttggaa ctgcttatga caactccaac ctatctagct ataaaaaaat atgggaaata + 8881 tccagcatgg ctagggatga tggtgtttta tcttactacc tataattcaa ccttgaatat + 8941 gatgagacaa tcaatagcag tcgcattcac tttattggga attttatact ttattgagag + 9001 aaataagaag ggctttgtta cttgtttatt gttgggttgt tccttccata cttctgggct + 9061 tgttttgtta atgattgcag cgatgtttta ctttataaaa ccaaatcagc aacttgacac + 9121 gctattctca aggagagttg agcttcaaaa agttgctctc atactggttt taggtatagc + 9181 ctccctgttt tccttaggag tagtgtctag cattttaaaa attataggtt 
taggaagcta + 9241 cgtaaattat attggcggaa catttcattt tgtacagaat caattcttga gtcggtttcc + 9301 aattatgctc cttatgctta tcagctggta taagtggaat gaaggggaaa gttatgctag + 9361 atttttcata gtgatgttta ttctagaggt cttgtgtttg caactaacta gtgtaaatgt + 9421 atactcagga agaattgcct actttttctc ttctatgaat gttttgacct atccttcctt + 9481 gtgttactgc agaccgcaaa aagggcgtcg ctttttcatg attagtgcct tacttgtcta + 9541 ccttttcttt tattggtggt tttactatgg aatacaagga atagatgcga ctattccata + 9601 tatgatgata taaggaggaa gtatatataa tggaaatatt tgtcagaggt ttttttcatg + 9661 ttaatttagg tgacgatcta tttttgtata ttcttgcaaa acgatatcca aatcataatt + 9721 ttcatgtgat tcttaatgaa gaatatacaa aggtatttcg tgatgaaaaa aatatcattg + 9781 tccatccata taaaaaaata agaagaggct tagatcgttt tttaattaac tgtaataaag + 9841 attactatgt agaaatagag aaaaagtgcc aactcaatgt tgtgattggg ggatctattt + 9901 ttcaggaaaa tgtagatgat gtggttgctc gtgaacgttt agctagaatg cctcaattaa + 9961 atcctactta tattttagga gcaaatttcg gtccctatgt aacggaagag tatcgcttgc + 10021 ttgttaaaga ttatcttact aaatcagaag atgtctgttt ccgtgatgaa tggtccaagc + 10081 aaaaatttcc agaattaaca aaggttcgtt ttgcaccaga tattgttttt gggatacaga + 10141 gtatcattcc gaaagtgaac gagaaaaaga aaagaatttt tgtttctgtc gtagactgtt + 10201 ttaaaaaagc tggaggcata aaaaaatatg cccccaacta tgaggcattt attcttcgtt + 10261 gcataaatta ttataatgaa caggggtatg aaattatcct ctcttctttt tgtaaaatgg + 10321 aaggtgataa agaggtaatt gatagaattc tagagaagct accatcagat aaacaatctg + 10381 aaatatctat tttgaattat aatggagaga attggagaga ggtcgttgct gctattcaac + 10441 aatcagaaaa aatcattgct tcacgattcc atagcatgat tctcggcatg gtctttggtg + 10501 tgtcagttct ccctattgct tataataaaa aattcaaaca atttttagca aattttgact + 10561 tatctcacta ttgtatttcg gtttcagata tagatcatca agtgcccaaa aatttgaatt + 10621 atttattatt tgacggaaat acggatatag ctgaacaagc taatgaacac tttatgaaac + 10681 tagatgaacg actaatgaga ggcacacttt ggaataatga gtactacaaa aataagtaat + 10741 caaaacaaaa aaacagctat tcaattaacc ttgatgatta tactaacgtg cttgtctcaa + 10801 attgtggcct tatataaatc taggtttaca gctgttaact ttggtgcaac cgactacatg + 
10861 gatgcttaca atttttcttt agaaattgca acatttattt tttcatttat gacgggcgga + 10921 gtaaccactg taataattcc ggcttatgtg aaaaaaaatt cttctaaagc agtgaatact + 10981 ttcatcaccc ttacctacgg ttgtatctta ttgttaagtg tggggattat tatctttcga + 11041 acacctttac tatcttcgct aactgtcaga gggactgact ttatagctat cgcttcaggt + 11101 tttttgatag tttcatttgt gattcaaggc attctatctt tgttagctgt aaccacggcc + 11161 tactatcagt ctgaggatag atataatatc ccaaagataa tcgtgctgat tgtcaatatg + 11221 attgtattaa ctattttact gcttggggtg attgataata tctatttata cttctcgctt + 11281 ttgattgcgg gatcagttct caatttgatt ttagatttta ttgttgctat caaaataggc + 11341 tttagataca agttctgctt tgatttcaag aatccagaat ttaaaaatat gctgattgta + 11401 tttttgccaa ccgtattaag ttcaggagtt tataagttgc atacaatggt agatactacg + 11461 attgcaacga atttagcaga aggacaggct acaatcctaa cttatgcttc acagatcatt + 11521 acgatggtaa atacggttat tgttgggaat ttaacagtgt atgtctatcc taaaatcata + 11581 gcaaatttaa agagtaaaaa tacatctaaa tatttttggg attattgcat acttttccat + 11641 gctgtcttag cgattattat tgcaggtttt ataaatgttg gttttgaagg actatcttta + 11701 ctatttgttg gtgggaaatt tacacttgaa aatgcgaatg ttctttatat gtgtgcctgt + 11761 atttatatca gcgggcaaca gtttaatgtt atccgtgact tgatttatcg atatttttac + 11821 gcaaattcca acacaaaaga aacctttaag aatagtgtta tcgtcagcat cataaatatt + 11881 atactgagct tgttgttggt tagtcttttt agagtttatg gtattgttct tggaaccgtg + 11941 ttatctaata tgatttcgct tgctctcatc tatattcgct ttaaaaagaa tttcggtata + 12001 gatgtaaaga ttagctatat atccattgag ataattaaaa atattttggc aatggtagga + 12061 tcagtcatcg ttatacattg gctaaagact ttcttagcta tcaataataa tattttatct + 12121 attattgtat atggtaccgg gacagttata gtatatttgg tactgatttt gctattacag + 12181 acaaaaataa gacacataaa attataagaa acatagggac tacactatct aaagaaaata + 12241 ctaggtattg ttgagatatc cttaatattt ttcttaaagg ttcaacacga atataccaga + 12301 atatatgctt atggtttaga aaggatgttt tagtgagtat ttttgccaca ttgattaaaa + 12361 aaaagggtgc agagattttt aaaaacttaa tacaatcaag agtgcttttt cgaacgatag + 12421 ctattttacc gctggttggt ttttcaaaaa aatcattaga gatagtccgt ctaaataata + 
12481 gcaatatagt tctttcaaga ttgagaagga actatagatc cgctattcaa aaatttagag + 12541 aagaaaatca gtattcactt gtgtatgacc agcaagatag tagcacttcc tcaaagatat + 12601 ggatttgttg gtttcaagga ttagatgttg cccctcatgt agttcgggag tgtatcgctt + 12661 cggtaagaaa gcagctagca gacagagaag tggttgtttt aacagacgat aattaccatc + 12721 actatgtgac tttcccagat cacattaaag caaaaattga tcagggaatt atttccaaga + 12781 ctcacttgtc agatttattg cgtttggagt tgctgactaa atatggtggg acatggattg + 12841 atggaacagt attttgttcg agttccgata ttcccgttta tatgctagat tctgatttat + 12901 ttctgtttca aaatttaaaa ccgggtcttg atgggcaagc tttggctatt tcaacttggt + 12961 ttatgacagc tgctaaactt catcatccac ttttagagtt aacaaaggat ttgctttatc + 13021 tgtactggaa aaagaataac acgatggttg actattttct aatccaccac ttcttccagt + 13081 tatctatcga agagtttcct gaatactgga gtagagtagt tcctttcaat aattcaactc + 13141 ctcatatttt gcagttgcgc ttatttgaag agtttgacga aacaatgtat cgtcatattc + 13201 ttgaacagac accattccat aagctaacat acaaatttga aggagaaaag tcaagcatac + 13261 cgaatactta ctataaacac ttattttgat aaaaatgatc gtagttgatt taaaaactgc + 13321 tgttaggtat agaacataat taagatatta tcgggagggt acgatatgaa agaactaact + 13381 actcgagaga tgcaagaagt atcgttggag attttacata cgattgctag tatttgtgaa + 13441 aagcaacatt tgcgctatgc tttgatttat ggaaccttaa tcggtgcggt tagacataaa + 13501 ggttatattc cttgggatga tgacgttgac attatgatgc cccgacccga ttatgatagt + 13561 ctattacaat acttgaagga aaatatcgct gattatccat atttaaaagt atttaatcgc + 13621 gaagagtgcc cagaatatcc ctacatgatt actagaatta gcgatcagag ataccggatt + 13681 gagatggaaa acgagaaacc ttttggttta ggagttttca tcgatatcta tccctatgat + 13741 ggtttgggag atacgaaaca agaatcggtt gccttcggtt tgaaggggga tcgtttatca + 13801 tcattttgtt atcaggcaac tagagaacat tttgcgattg aaacgacaat atcagctttt + 13861 aggaagttta ttaaataccc ggtttatctg ttttctaaaa tgattggaaa aaattacttt + 13921 caaagtcaat tagataagtt agcgagagtc aaagattatg acaacagtaa ctttgttggt + 13981 tgtgtgattt ggttgtcatg gggagaaaaa gacatctttc cacgtgagtg gtttgatgag + 14041 actattttgg tcccttttga aaaatatgaa tttagaatcc ctaaagagtt tgacaaaatt + 
14101 ttgcgacatg aatatggaga ttatatgatt ttacctcctg aaaaggatag ggtgggacat + 14161 cactatttta aagcttataa aaaatgataa tttgctaagc aaagaaaagg aaaatcatga + 14221 aattatttta tttacaattg gagtaggaag tttaaaggtg gagtttctct gctcagagtt + 14281 ctatatgatt tcgagtgccc gcgtaaagct aaaattggga ataacgtcaa tttttcacat + 14341 cgtgggatgg gaacagttgt aagtagtaat gctatcatcg ggaacaatgt gaccatacaa + 14401 catcatgtaa cattagggat taaaaacgat gatagaatta tcatcgggga gaactgtttt + 14461 ataggagcct atgcatttat cttgggaaat gtaaaaattg gtgcaaattc taagattgga + 14521 gcaggtacga tagttttaca tgatgtccca gatggaagca cagtggttaa tccagtggaa + 14581 ctaaaagcgc tcgcttcaga agcaaatgtt cagtaataga gaaatgaata gaatattgaa + 14641 aacaatgtta gaggaaagtt atggtaacgc ttgataatac tgaaaatttc attcattttt + 14701 ttaacacatt agggttaatg tttactccac agatttaatt gaattattta ataaaaagat + 14761 taagagacaa gcaaaaaaag attatcttcc tgaatggaga agccgtagat tgttgtctag + 14821 ttccggtgaa tacaaagtaa aatataaaaa ttgcaataac aaagaattcg aattttgttc + 14881 aggtgcttta taaagcctat ttgagtaatt aaatagcaac ttgacactgt gattacataa + 14941 aattattgat aagcctaatt tttatttaat cgtatggatc atttataaaa aatgtataaa + 15001 attgaatata aatgtgaggt gtgattttgg tctataaaca tgggaaaata aaagtgcaaa + 15061 taacaaagaa aggtacccct tttatgaaag gtattattct agcaggtggt tcgggaactc + 15121 gcttgtatcc tttgactcga gccgcatcaa aacaacttat gccggtttat gataaaccga + 15181 tgatttacta cccactttca acattgatgt tggctgggat tagggatatt ttgattattt + 15241 ccactccaca ggatttacat cgatttcaag agcttcttca agacggatct gagtttggga + 15301 tcaaactttc ttatgcagag caaccaagtc cagatggttt ggcacaagcc tttatcattg + 15361 gggaagagtt tatttctgat gatagcgttg cgctaatctt aggtgataat atctaccatg + 15421 gttctgggct ttccaagatg ctacaaaagg cagcgagtaa ggagtcggga gcaactgttt + 15481 ttggctacca tgtcaaggat ccagagcgct ttggtgtggt tgagtttgat caggatatga + 15541 aggctatttc tattgaagaa aagccagagc aacctcgttc aaactatgca gttacaggtc + 15601 tctatttcta tgataatgat gtagtagaga ttgccaaaag tattaaacca agtcctcgtg + 15661 gtgaattgga aattacagac gttaacaagg cttatctaga acgtggtgat ttgtctgttg + 
15721 agcttatggg acgtggcttt gcttggttgg atactggcac tcatgaaagt ttactagagg + 15781 cttcgcagta catcgaaaca gtccaacgga tgcaaaatgt tcaggtagca aacttagaag + 15841 aaattgccta tcgcatgggt tatatcagtc gtaaagatgt attgacctta gcccaaccac + 15901 ttaagaaaaa tgaatacgga cagtatctgc tccgtttgat tggagaagca tagatgacag + 15961 ataatttttt cggtaagacg cttgcggcac gcaaggttga agctattcca ggcatgttgg + 16021 agtttgatat ccccgttcat ggagataatc gtggctggtt taaagaaaat ttccaaaagg + 16081 aaaaaatgct tccacttgga tttccagagt ctttctttgc agaaggaaaa ttgcaaaaca + 16141 atgtatcctt ctcacgtaaa aatgtccttc gaggcctcca cgcagagcct tgggataagt + 16201 acatctctgt agcagatgga gggaaagttc tgggttcttg ggttgatcta cgcgagggtg + 16261 aaacctttgg gaatacctat cagacagtaa ttgatgcaag caagggaatc tttgttcctc + 16321 gaggcgtagc taatggcttc caagttctat cagatacagt gtcatatagc tatctggtca + 16381 atgattactg ggctctcgag ctcaaaccca agtatgcctt tgtgaactac gctgatccaa + 16441 gccttggtat tgaatgggaa aatattgcag aagcagaggt ttcagaagca gataaacatc + 16501 atcccctact taaggatgta aaacctttga aaaaagaaga tttgtaaaaa ggaaagaata + 16561 tgactgaata caaaaatatt atcgtgacag gtggagctgg ctttatcggt tctaactttg + 16621 tccattatgt ttacgagaac tttccaggtg ttcacgtgac agtcctagat aagttgactt + 16681 atgctggaaa tcgcgcgaat attgaggaaa ttttaggtaa tcgtgttgag ttagttgttg + 16741 gtgacattgc tgatgcggag ttggtagaca agttggctgc tcaagcagat gctatcgttc + 16801 attatgcagc ggaaagccac aatgataatt cgctcaatga tccatcgcca tttattcata + 16861 ctaacttcat cggaacctat actcttttag aagctgctcg taagtatgat attcgcttcc + 16921 accatgtatc gacagatgaa gtttatgggg atctcccttt acgcgaagat ttgccaggtc + 16981 atggtgaaag accaggtgag aaatttacgg ctgaaacaaa atacaaccca agctctccgt + 17041 actcatcaac caaggcagcc tcagatttga ttgtcaaagc ctgggtgcgt tctttcggag + 17101 tcaaggcaac gatttccaac tgttcaaata actacggtcc ttatcaacat atcgaaaaat + 17161 tcatcccacg tcagattact aacatcctaa gtggtatcaa gccaaaactt tacggtgaag + 17221 gtaagaacgt tcgtgattgg attcatacca atgaccattc ttcaggagtt tggacaatct + 17281 tgacaaaagg gcaaatcggt gaaacctact tgattggggc tgatggtgag aagaacaata + 
17341 aggaagtttt ggaacttatc cttaaggaaa tgggacaagc tgcggatgcc tatgatcatg + 17401 tgactgaccg tgcaggacat gaccttcgct atgcgattga tgctagcaag ctccgtgatg + 17461 agttggggtg gaaacctgaa tttaccaact ttgaagctgg gctcaaggca acaatcaagt + 17521 ggtatacaga taaccaagaa tggtggaaag cagaaaaaga agctgttgaa gccaattatg + 17581 ctaagactca ggagattatt acagtataaa aagcaggaaa tagctgcttt ttattgctat + 17641 attgggaaga gttacatatt agaaaggtct agagatgatt ttaattacag gggcaaatgg + 17701 ccaattagga acggaacttc gctatttatt ggatgaacgt aatgaagaat acgtggcagt + 17761 agatgtggct gagatggaca ttaccgatgc agaaatggtt gagaaagttt ttgaagaggt + 17821 gaaaccgact ttagtctacc actgtgcagc ctacaccgct gttgatgcag cagaggatga + 17881 aggaaaagag ttggacttcg ccatcaatgt gacggggaca aaaaatgtcg caaaagcatc + 17941 tgaaaagcat ggtgcaactc tagtttatat ttctacggac tatgtctttg acggtaagaa + 18001 accagttgga caagagtggg aagttgatga ccgaccagat ccacagacag aatatggccg + 18061 tactaagcgt atgggggaag agttagttga gaagcatgtg tctaatttct atattatccg + 18121 tactgcctgg gtatttggaa attatggcaa aaacttcgtt tttaccatgc aaaatcttgc + 18181 gaaaactcat aagactttaa cagttgtaaa tgaccagtac ggtcgtccga cttggactcg + 18241 taccttggct gagttcatga cctacctagc tgaaaatcgt aaggaatttg gttattatca + 18301 tttgtcaaat gatgcgacag aagacacaac atggtatgat tttgcagttg aaattttgaa + 18361 agatacagat gtcgaagtca atccagtaga ttccagtcaa tttccagcca aagctaaacg + 18421 tccgctaaac tcaacgatga gcctggccaa agccaaagct actggatttg ttattccaac + 18481 ttggcaagat gcattgcaag aattttacaa acaagaagtg agataagtag tagaatgatt + 18541 ttctagtcta ataaaagagg cagataatga actccaaagg agcttaagat gtacgattat + 18601 cttgttgttg gtgctggtct ctttggcgca tagctttggc tcagtttcta ttatcgctca + 18661 caccatccat cagaagttta atctgaaggt acccaattat cgccaagaag aagattgggc + 18721 taggaggggt ttaccaatca cacgtaagga aatctctaat tggcatatca aggcaagtca + 18781 atactattta gagtcccttt ataagctttt acgagaaaag ttgttagaac aacctcttct + 18841 tcctgcggat gaaacctctt atcgggttct agagagtgat agccatctga cctactattg + 18901 gacctttttg tctgggaaag ctgagaatca agcaatcacg ctgtaccatc atggtcagtg + 
18961 tcgaagtggt ttagtagtac aagaattcct aggagattat tctggctatg tgcattgtga + 19021 tatgttgcgg cagtaactta ggactttagt cctctagttc tgcctatgcg atagcagtcc + 19081 aaggtttagg agcaaggcga cgctaagctt ggtaaactgc gaaccgctag aagcttatcg + 19141 tcaactggaa gaagctgaac ttgttggatg ttgggcacat gtgagaagga agttttttga + 19201 agcgaccccc aagcaagcgg ataaatcatc gttaggagct aaaggtttag cttattgtaa + 19261 tcagttattt tccttggaaa gagactggga ggctttgcca gctgatgaac gactacagaa + 19321 acgtcaagaa gagctccaac ccctaatgga agacttcttt gcttggtgcc gccgtcagtc + 19381 agttttatcg ggttcaaaac taggaagggc aattgaatac agcctcaagt ataaagaaac + 19441 ctttaagact attttgaaag acggacatct ggtcctttcc aataatctag ctgaatgcgc + 19501 cattaaatca ttggttatgg gacggagtaa aagagttcag tggactcttt tagcctaagc + 19561 tcagtttaaa aaagcgaggg tggttatttt ctcaaaattt tgaaggagct aaagcaagag + 19621 ctattattat gagtttgttg gaaacagcta aacgtcatca attaaatagc gagaaatatc + 19681 tattctatct tctagaatgt cttccaaacg aggaaactct cgtaaacaaa gaggttttag + 19741 aggcttattt accatggact aaagttgtac aagaaaagtg caaataagaa atctccagat + 19801 taggaactat ccgtgagttc tctagtctgg agatttttca atatacttcg ttattggacg + 19861 gttacgatat tcatattttt tgcaaagatg ttgtttgaaa aataattttc aaaaattctg + 19921 aaaattctgt tgacaacttt ctgaaaagag tctataatgg agagaaagtt ttaaaggaga + 19981 aaatgatgaa aagttcaaaa ctatttgccc ttgcgggcgt gacattattg gcggcgacta + 20041 ctttagctgc atgctctgga tcaggttcaa gcactaaagg tgagaagaca ttctcataca + 20101 tttatgagac agaccctgat aacctcaact atttg +// + diff --git a/public/res/serotype_genbank/serotype_28A.gb b/public/res/serotype_genbank/serotype_28A.gb new file mode 100644 index 0000000..e740f36 --- /dev/null +++ b/public/res/serotype_genbank/serotype_28A.gb @@ -0,0 +1,1072 @@ +LOCUS CR931692 22978 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 1982/45 (serotype 28A). +ACCESSION CR931692 +VERSION CR931692.1 +KEYWORDS . 
+SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 22978) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 22978) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..22978 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="1982/45" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC28A_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC28A_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI34020.1" + /db_xref="UniProtKB/TrEMBL:Q4JZI8" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVELL" + gene 293..461 + /gene="aliB" + /locus_tag="SPC28A_0002" + /pseudo + CDS 293..461 + /gene="aliB" + /locus_tag="SPC28A_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(order(462..977,979..1305)) + /gene="tnp" + /locus_tag="SPC28A_0003" + /pseudo + CDS complement(join(462..977,979..1305)) + /gene="tnp" + /locus_tag="SPC28A_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(join(915..977,979..1287)) + /gene="tnp" + /locus_tag="SPC28A_0003" + /note="HMMPfam hit to PF01710, Transposase, score 6e-23" + /pseudo + gene 1527..2981 + /gene="wzg" + /locus_tag="SPC28A_0004" + CDS 1527..2981 + /gene="wzg" + /locus_tag="SPC28A_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI34023.1" + /db_xref="GOA:Q4K030" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K030" + /translation="MLIMSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNI + LAFRYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGL + TNRLNATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNT + DLTVDQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKV + EAPKTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPI + ADGGNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGVDVH + NDQEFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKL + 
TSTEALKNYSTIIDSLQDSIQTNMPLETMINLVNAQLESGGTYKVNSQDLKGTGRMDL + PSYAMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1527..1652 + /gene="wzg" + /locus_tag="SPC28A_0004" + /note="Signal peptide predicted for SPC1385 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 42 and 43" + misc_feature 1740..2087 + /gene="wzg" + /locus_tag="SPC28A_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 6.7e-65" + misc_feature 2265..2708 + /gene="wzg" + /locus_tag="SPC28A_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 8.4e-70" + gene 2983..3714 + /gene="wzh" + /locus_tag="SPC28A_0005" + CDS 2983..3714 + /gene="wzh" + /locus_tag="SPC28A_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34024.1" + /db_xref="GOA:Q4K029" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K029" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAEAYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLGKKRIPTLNDS + RYALIEFSMNTLYRDIHSALSKILMLGITPVIAHIERYAALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEKDLVHIIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 2986..3594 + /gene="wzh" + /locus_tag="SPC28A_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 1.6e-37" + gene 3720..4415 + /gene="wzd" + /locus_tag="SPC28A_0006" + CDS 3720..4415 + /gene="wzd" + /locus_tag="SPC28A_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34025.1" + /db_xref="GOA:Q4K028" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K028" + /translation="MMKEQNMIEIDVFQLFKTLWKRKLMILLVALVTGAGAFAYSTFI + VKPEYTSTTRIYVVNRNQGDSPGLTNQDLQAGSYLVKDYREIILSQDVLEKVATNLKL + 
DMPAKTLASKVQVTVPADTRIVSISVKDKQPEEASRIANSLREAAAEKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIELLDTRVKRPEDVEDVLQI + PLLGVVPDLNKMK" + misc_feature 3720..3836 + /gene="wzd" + /locus_tag="SPC28A_0006" + /note="Signal peptide predicted for SPC1387 by SignalP 2.0 + HMM (Signal peptide probability 0.774) with cleavage site + probability 0.498 between residues 39 and 40" + misc_feature 3741..4157 + /gene="wzd" + /locus_tag="SPC28A_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 2.7e-56" + misc_feature 4263..4340 + /gene="wzd" + /locus_tag="SPC28A_0006" + /note="PS00217 Sugar transport proteins signature 2." + gene 4425..5114 + /gene="wze" + /locus_tag="SPC28A_0007" + CDS 4425..5114 + /gene="wze" + /locus_tag="SPC28A_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34026.1" + /db_xref="GOA:Q4K005" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K005" + /translation="MPTLEISQAKLDFVKKAEENYNALCTNLQLSGDDLKVFSITSVK + AGEGKSMTSTNIAWAFAHAGYKTLLIDGDIRNSVMLGVFKARDKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRKCDASILVTEAGEVNRRDIQKAKEQLEHTGKPFLGIVLNKFDTSVDKYGSY + GNYGDYGKNKK" + gene 5129..6496 + /gene="wchA" + /locus_tag="SPC28A_0008" + CDS 5129..6496 + /gene="wchA" + /locus_tag="SPC28A_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI34027.1" + /db_xref="GOA:Q4K026" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K026" + /translation="MNGKILRSSLAIIQSFLVILLTYLLSAVRETEIVSTTAIALYIL + HYFVFYISDYGQDFFKRRYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYF + LTLHALLVYVLNLFIKWYWKRAYPNFKGSKKILLLTATSRVEKVLDRLIESNEVVGKL + VAVSVLDKPDFQHDCLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + 
IDVIVNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHVIAKRIIDIVGALVGLIL + CGLVSIVLVPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKIGCFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVLM + KDGAK" + misc_feature 5129..5215 + /gene="wchA" + /locus_tag="SPC28A_0008" + /note="Signal peptide predicted for SPC1389 by SignalP 2.0 + HMM (Signal peptide probability 0.844) with cleavage site + probability 0.429 between residues 29 and 30" + misc_feature 5912..6493 + /gene="wchA" + /locus_tag="SPC28A_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 2.8e-160" + gene 6527..7699 + /gene="wchF" + /locus_tag="SPC28A_0009" + CDS 6527..7699 + /gene="wchF" + /locus_tag="SPC28A_0009" + /note="member of homology group 15" + /codon_start=1 + /transl_table=11 + /product="putative rhamnosyl transferase WchF" + /protein_id="CAI34028.1" + /db_xref="GOA:Q4K025" + /db_xref="InterPro:IPR001296" + /db_xref="InterPro:IPR015393" + /db_xref="UniProtKB/TrEMBL:Q4K025" + /translation="MKKSVYIIGSKGIPAKYGGFETFVEKLTAFQQDKAIQYYVACMR + ENSAKSGITEDVFEHNGAICYNVDVPNIGPARAIAYDIAAINRAIEIAKENKDEDPIF + YILACRIGPFIHGIKKRIQAIGGALLVNPDGHEWLREKWSLPVRKYWKYSERLMVKHA + DLLVCDSKNIEKYIQEDYKQYQPKTTYIAYGTDTTRSILKSSDEKVRSWFKEKNVSEN + EYYLVVGRFVPENNYEAMIRGFLASNSKKDFVLITNVEQNKFYNQLLAKTGFDKDPRV + KFVGTVYEQELLKYIRENAFAYFHGHEVGGTNPSLLEALASTKLNLLLDVGFNREVGE + QSAIYWKKDELSQVIEKVEQFDAKMIDELDRQSNQRIVDFFTWEKIVTDYEKLFKK" + gene 7696..8967 + /gene="wciU" + /locus_tag="SPC28A_0010" + CDS 7696..8967 + /gene="wciU" + /locus_tag="SPC28A_0010" + /note="member of homology group 59" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34029.1" + /db_xref="GOA:Q4K024" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K024" + /translation="MKILHYTLGFQPQRTGGLVKYAEDLMIEQIAQGYQVAALCPGRI + KFFSKKIEIIKATSRQFECYELLNSLPIALFGGISDPTAFMTPCDKNVYRTFLEKVQP + DIIHIHSFMGLHKEFLEIAKNLNIRVVFTSHDYYGLAPVPHFYFNGVDYSDKNTNLTW + 
NIMSSNALSVKKLRLFQVSFYPTIRKLLKLLGKNPKSKKNLVIRDVIEEQDYSELRYY + YNEMFHLIDGYLFNSRLAKKVYEINEIQPVNSVVLSITSSSIKHHQRLTTTNNKIRVA + YIGSDEEYKGYFDFIDFAGTLEQESYEVVTYGHLPNEECPSFIEQKGYFTKETIDSVY + ENIDILIIASKCKETFGLITVEALSYGVNVFVSENVGSKDLLPETHVFKNQNDLVVKF + LKNDIENTKLKTLDEHSIEVIQYYERVINDS" + misc_feature 8470..8931 + /gene="wciU" + /locus_tag="SPC28A_0010" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 0.00061" + gene 8957..9643 + /gene="wcxM" + /locus_tag="SPC28A_0011" + CDS 8957..9643 + /gene="wcxM" + /locus_tag="SPC28A_0011" + /note="member of homology group 105" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI34030.1" + /db_xref="GOA:Q4K001" + /db_xref="InterPro:IPR011004" + /db_xref="UniProtKB/TrEMBL:Q4K001" + /translation="MIVKSFIKKITGKTVDIHPDVPLSYILQRGINYGFGLFRGVVRG + IGFGQNDKRLFIGQGVSILAKRKLFVGKNVRIGKKVSIDALSKEGIHFADNVKIGDYS + QIIGTGSIKNMGIGLKIGKNSSFSEYSLFGSAGGITIGDNVIAGQNVRFHAENHNYSD + LDKLIVEQGVSRKGISVGDNCWIGAGSVFLDGSSIGSGCVVAANSVITKNFPDNVIVA + GVPAKIIKMK" + misc_feature 9155..9208 + /gene="wcxM" + /locus_tag="SPC28A_0011" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 16" + misc_feature 9221..9274 + /gene="wcxM" + /locus_tag="SPC28A_0011" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 13" + misc_feature 9362..9415 + /gene="wcxM" + /locus_tag="SPC28A_0011" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 10" + misc_feature 9476..9529 + /gene="wcxM" + /locus_tag="SPC28A_0011" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 11" + misc_feature 9530..9583 + /gene="wcxM" + /locus_tag="SPC28A_0011" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 1.7" + gene 9655..10533 + /gene="wcxN" + /locus_tag="SPC28A_0012" + CDS 9655..10533 + /gene="wcxN" + /locus_tag="SPC28A_0012" + /note="member of homology group 154" + 
/codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34031.1" + /db_xref="GOA:Q4K000" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K000" + /translation="MGKEIKAVYAILNYNTWEDTARLAQKVATFQHIQSVIIVDNLST + DDSYHYLKRLEGEKISVYQTQRNGGYSVGNNVAARKAYNMGVDILFISNPDVDIDEKD + SLMIAQNLYKNSSYALLSGIEYNAMKEIDLPIVWHENSYYDDLLDCLFLTRKLRRKKE + DINLSMIKSSIIDVDLVKGSFFAVRLSDFHDVGYFDESVFLFCEERILAKKLQKANKK + IGILPEAKYYHNHSTSINEKYKKKKEQIVLLYNARYYYNVTYQNISFLKKICLKLFMF + LSIIEYSILDYIKRKG" + gene 10542..11774 + /gene="wzy" + /locus_tag="SPC28A_0013" + CDS 10542..11774 + /gene="wzy" + /locus_tag="SPC28A_0013" + /note="member of homology group 251" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI34032.1" + /db_xref="InterPro:IPR007016" + /db_xref="UniProtKB/TrEMBL:Q4K021" + /translation="MVINFSKYNWILILILSSSELFSKETNLFLLLFILLYYVLVRGG + RLPISIPGAKYYFTLLMVGLFIGIGNVIINENTVFNFVKHFIYYLLPLFFWQFGCVLS + NNDNLSYKQNNIKESIVITAFLLSSYDLIGSIISFLSRTKEIVDLYSLRSEFGRGSYI + PIIALYLVLVYSREIKLSKNFKGFLLLLFTISILIHFSRTHFIILLILVFFSGFEKNM + KSIKKIMFAGTLILAGVGVLYLYFPNLVIDFYNKISQSTTEITFSKSSWSHKDIIWNW + RGYEMYSALNHFKSSTLLEQILGGGFGTVLYIGEYAYFVSDLPYLLFLHNGYFTTLLV + FGVSGVILFVLWVLSLFSYSKYVNDTQDSNFIKGLAVVILFTTYFVNGPLFSVSQATF + LLYFALFSNNHGELDEDF" + gene 11761..12921 + /gene="wcxP" + /locus_tag="SPC28A_0014" + CDS 11761..12921 + /gene="wcxP" + /locus_tag="SPC28A_0014" + /note="member of homology group 155" + /codon_start=1 + /transl_table=11 + /product="putative glycerol phosphotransferase" + /protein_id="CAI34033.1" + /db_xref="GOA:Q4JZZ8" + /db_xref="InterPro:IPR007554" + /db_xref="UniProtKB/TrEMBL:Q4JZZ8" + /translation="MKIFKKIKFILMLLYTSTFPRCEKILIFGSWLGEKYADNPRYLF + EYVIKNRPDLKAIWITSNQDVFKELQKKQYPVMMADESEAHKIMKKAKYIFTTTGIFD + IGVENSRLIGGAFLINLWHGIPLKKIMYDDKHSALHKRSKLVTWVEKIPLRNYFVIST + STAITQIYQSAFRVKKSNILELGQPRNDYFYDESYPVSSLIQELKSKNIILYMPTHRN + EGKKQIPLDNLMDLNRLNKWCEETNSIFVIKKHFYHSKEKTLEKEYSSIIDVTNEKVD + 
AQELLKYSKILITDYSSCYIDYLLLDRPIIFFNYDYDDYLRIDRSLYFPYEKVTPGEK + CQNFDELLVTLQNLYLGKDDYRKKRENIKTFFYSSETQKSVSEKIINHVLNL" + misc_feature 12349..12915 + /gene="wcxP" + /locus_tag="SPC28A_0014" + /note="HMMPfam hit to PF04464, + CDP-Glycerol:Poly(glycerophosphate) gl, score 4.5e-32" + gene 12927..14378 + /gene="wzx" + /locus_tag="SPC28A_0015" + CDS 12927..14378 + /gene="wzx" + /locus_tag="SPC28A_0015" + /note="member of homology group 52" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI34034.1" + /db_xref="GOA:Q4JZZ7" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4JZZ7" + /translation="MESVMKKILNKYYSLSNPVKASIWFTICNVLQKGISMITVPIFT + RLLTTEQYGVYSVYQSWYSIIGVFATLNLYYGVFNNGMVKYEKDKNAFTSSMQGLTTT + VTAIFLVIYLIGIDFWNSLLGLPTLLILVMFFDLFFTPAYSFWATRQRFEYQYRNLVF + ITLIIAIGSPIIGISSVVLSTYKAEARVISFVLVQSCIGLYFYVLNLYRGKYFFCKKY + WLYALNFNLPLIPHYLSQSVLNQSDRIMINSMVGMGEAAIYSVAYSISTLMVLVTSAI + NSSFIPYTYKCIRDKKYTELGKSANLLITLVGIGSILTISLGPEIIQLFAPKQYYEAI + WIIPPVALSVYFMFLYPIFGNIEFYFEANHFVMWASIGGAIMNIFLNFIFIKHFGYIA + AGYTTLLCYILFALGHYIFMRRALYQNLSGIQIYDSRYIFFFSFLLLILMLLIVTIYP + FVLIRYIAISLILGGCFLKRRKIMSSIVMIKKQ" + misc_feature 12978..13790 + /gene="wzx" + /locus_tag="SPC28A_0015" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 2.9e-12" + gene 14388..15200 + /gene="wcxQ" + /locus_tag="SPC28A_0016" + CDS 14388..15200 + /gene="wcxQ" + /locus_tag="SPC28A_0016" + /note="member of homology group 156" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="CAI34035.1" + /db_xref="GOA:Q4JZZ6" + /db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4JZZ6" + /translation="MTEINKQLHETLIEILDFVKEICEKHELTYFLIYGTALGAKRHC + GFIPWDDDVDIALPREHYNILIDVLSKMEQSIFSLQNEDNEPNYFLPFAKLRKNNTIF + IEKILDVEYENNGIYIDIFPLDFVENPDSFNFKMRRTMFNYIKHILKFSSCRSFYKNK + YSSVRYLMENIMSIPTLFFSNRRLLFLANNLISSTNKANFIGQYDESSERAIMPSSYY + FPSRSAVFEGKIYSVPAKLEDYLKYFYGSDYMELPPIEKRVTHQPIKLRFKK" + misc_feature 14454..15125 + 
/gene="wcxQ" + /locus_tag="SPC28A_0016" + /note="HMMPfam hit to PF04991, LICD Protein Family, score + 1.4e-36" + gene 15276..16304 + /gene="gtp1" + /locus_tag="SPC28A_0017" + CDS 15276..16304 + /gene="gtp1" + /locus_tag="SPC28A_0017" + /note="member of homology group 40" + /codon_start=1 + /transl_table=11 + /product="putative glycerol-2-phosphate dehydrogenase" + /protein_id="CAI34036.1" + /db_xref="GOA:Q9R921" + /db_xref="InterPro:IPR002658" + /db_xref="InterPro:IPR016205" + /db_xref="UniProtKB/TrEMBL:Q9R921" + /translation="MKNNDLKIGSGAIHQISATLSQNSISGKILYCADPVVDDLYGSI + VRSQIEEIGRVKEESCNYNTIAYAMNIAERAIATDIDCIVGMGGGRVLDVCKYASFIS + KRPYLSIPTTAANDGIASPVAVLKRQDDRPKSLGAAIPSMTLIDIDVIASGPIQNIKA + GIGDTISNYTALKDWELAVERGKDEMHGFAYLMSQNSLDALMKTKYNSITPDFIEVLV + NSLVLSGIAMDFAGSSRPVSGSEHLFSHALDYYGSTRNLHGIQVALGTVAVLKLIENS + VDTVVDYLQRFEVHINPKLLGIDEELFIYCMQHATKMRSNRYTYLHEVDLSTDRLKQI + YKELISEL" + misc_feature 15297..16217 + /gene="gtp1" + /locus_tag="SPC28A_0017" + /note="HMMPfam hit to PF01761, 3-dehydroquinate synthase, + score 2.9e-70" + gene 16320..17024 + /gene="gtp2" + /locus_tag="SPC28A_0018" + CDS 16320..17024 + /gene="gtp2" + /locus_tag="SPC28A_0018" + /note="member of homology group 41" + /codon_start=1 + /transl_table=11 + /product="putative nucleotidyl transferase" + /protein_id="CAI34037.1" + /db_xref="GOA:O85005" + /db_xref="InterPro:IPR005835" + /db_xref="UniProtKB/TrEMBL:O85005" + /translation="MKALILAAGLGTRLAPITNEVPKSLVPVNGKPILMKQIENLYQN + NITDITIIAGYKSSVLTDAVTEKYPEINIIDNVDFKTTNNMYSAYLGKAAMGDSDFLM + MNADVFYDASVIKSLLLHKAPNAIVTDLGIYIEESMKVVEKNGRLVEISKQISPEETL + GASIDVYKFSYEAGARFFEKCKEFIEDKRELQMWSEVALNAILSEVEFVACPLEGRWL + EIDNHEDLVAAEKLFA" + misc_feature 16323..17021 + /gene="gtp2" + /locus_tag="SPC28A_0018" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 1e-07" + gene 17021..17872 + /gene="gtp3" + /locus_tag="SPC28A_0019" + CDS 17021..17872 + /gene="gtp3" + /locus_tag="SPC28A_0019" + /note="member of homology group 42" + /codon_start=1 + 
/transl_table=11 + /product="putative phosphotransferase" + /protein_id="CAI34038.1" + /db_xref="GOA:Q4K015" + /db_xref="InterPro:IPR005834" + /db_xref="InterPro:IPR006357" + /db_xref="UniProtKB/TrEMBL:Q4K015" + /translation="MNRIRRMKLTNRVDYFGADISELQNKKLFLFDMDGTIYEEDRLF + EGTLELLDYIHNIGGEYIFITNNSSKSVVDYVEKVNRLGIKAERDNFFTSAQATIVYI + KENYPKSKVYCQGTKSLIKELSDAGIDVTEQVSADIDVVLVGFDTELTSDKIRNTCEI + LSTKDVPFIATNPDIRCPVSFGFIPDCGSICDMISKSVDRKPVYIGKPEPTMVDIVRK + KLNYSLFETVVIGDRLYTDIMTGINAGVTSVCVLTGEATVNDIQQDSIKPTYTFKNVK + EMWKGIV" + misc_feature 17096..17782 + /gene="gtp3" + /locus_tag="SPC28A_0019" + /note="HMMPfam hit to PF00702, haloacid dehalogenase-like + hydrolase, score 5.9e-25" + gene 18032..18901 + /gene="rmlA" + /locus_tag="SPC28A_0020" + CDS 18032..18901 + /gene="rmlA" + /locus_tag="SPC28A_0020" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI34039.1" + /db_xref="GOA:Q4JZZ2" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q4JZZ2" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLHRFQELLQDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFISDDSV + ALILGDNIYHGSGLSKMLQKAASKESGATVFGYHVKDPERFGVVEFDQDMKAISIEEK + PEQPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLERGDLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLTLAQPLKKN + EYGQYLLRLIGEA" + misc_feature 18035..18751 + /gene="rmlA" + /locus_tag="SPC28A_0020" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 3.2e-120" + gene 18902..19495 + /gene="rmlC" + /locus_tag="SPC28A_0021" + CDS 18902..19495 + /gene="rmlC" + /locus_tag="SPC28A_0021" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI34040.1" + /db_xref="GOA:Q4K013" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + 
/db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:Q4K013" + /translation="MTDNFFGKTLAARKVETIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKYHPLLKDVKPLKKEDL" + misc_feature 18938..19468 + /gene="rmlC" + /locus_tag="SPC28A_0021" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 1.3e-15" + gene 19508..20557 + /gene="rmlB" + /locus_tag="SPC28A_0022" + CDS 19508..20557 + /gene="rmlB" + /locus_tag="SPC28A_0022" + /EC_number="4.2.1.46" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI34041.1" + /db_xref="GOA:Q4K2P4" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K2P4" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPGVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAAD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 19523..20479 + /gene="rmlB" + /locus_tag="SPC28A_0022" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.0001" + misc_feature 19526..20266 + /gene="rmlB" + /locus_tag="SPC28A_0022" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 2.7e-76" + misc_feature 19529..20341 + /gene="rmlB" + /locus_tag="SPC28A_0022" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/iso, score 1.7e-05" + gene 20623..21474 + /gene="rmlD" + /locus_tag="SPC28A_0023" + CDS 20623..21474 + /gene="rmlD" + /locus_tag="SPC28A_0023" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + 
/product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI34042.1" + /db_xref="GOA:Q4K011" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K011" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDIIDAEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 20623..21471 + /gene="rmlD" + /locus_tag="SPC28A_0023" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 3.3e-146" + misc_feature 20626..21267 + /gene="rmlD" + /locus_tag="SPC28A_0023" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.00014" + misc_feature 20626..21255 + /gene="rmlD" + /locus_tag="SPC28A_0023" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 8.4e-17" + misc_feature 20629..21357 + /gene="rmlD" + /locus_tag="SPC28A_0023" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 3.2e-08" + gene order(21550..22506,22514..22735) + /gene="tnp" + /locus_tag="SPC28A_0024" + /pseudo + CDS join(21550..22506,22514..22735) + /gene="tnp" + /locus_tag="SPC28A_0024" + /note="member of homology group 12; + member of homology group 12" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1670 transposase" + misc_feature 21556..21999 + /gene="tnp" + /locus_tag="SPC28A_0024" + /note="HMMPfam hit to PF03050, Transposase IS66 family, + score 0.00014" + /pseudo + gene 22931..>22978 + /gene="aliA" + /locus_tag="SPC28A_0025" + CDS 22931..>22978 + /gene="aliA" + /locus_tag="SPC28A_0025" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34044.1" + /db_xref="UniProtKB/TrEMBL:Q4K2C2" + /translation="MMKSSRLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac 
aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcgta taaaaacaag + 181 ggaggactgt ataaaagaca gaaatccttt gttttttata accaaggttt ataaactttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga aaatgaacat + 301 aaagaagcgt gtccttagtg caggtctgac ttttgcatct gctttgcttt tagctgcttg + 361 cgaccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaattac ctgttagact attacgctga taatatagtc aattgaaaca agagcaggac + 481 aaaagagcct cgtaaaaggt attgcaactt ggtaatacct tttacgaggc tttttgatat + 541 gagcccatgt tttctcaata ggattgtact caggtgagta gggaggaaga aggtaaaagt + 601 ttatgcccaa actcttcgca taaaagttct agcttcccca ttctatggaa tcttgcatta + 661 tccataataa taaccgatgg tgtggttaat gttggtaaga gaaacttctg aaaccaagct + 721 tcaaaaaagt cgctcgtaat cgtctcttcg taagtcattg gagcgattaa ctcaccattt + 781 gttagacctg caaccaaaga aatcctctga tatcttcttc ttaactgacc ttttaaagag + 841 cgaccatatt ctcgataaaa ataagtatca aatcctgttt cgtcaatcta aacagctgct + 901 aggtgcttta aactattaaa attcttaaga aataaggcta ctttttctgg gtcttgttca + 961 tagtaggtgt ggttcttttt ttcgagtgta gcccatagct ttgagcgcat agtggatggt + 1021 agttggatga cagccaaatt cagaagctat ttcagtcaaa taagcgtctg gattatcagt + 1081 aagatagttt ttaagtctat ctctatcaac ttttcttggt tttattcctt ttacttggtg + 1141 gtttagctct cctgttttct cttttagctt taaccagcca taaatggtat tacgtgagat + 1201 ttggaaaacg tgtgatgctt ctgttatact acctgttcgc tcacaataag agagaacttt + 1261 tttacgaaaa tctattgaat atgccataaa aagattatac cacattgtgt actatattag + 1321 attgaaacta gagtagtaca cctctgcttc taaaaaattt ttagaaatcg atttaactgt + 1381 cctgatcgat ttgtcatgtt cttatttcat tttactatat ttttgtttcg cgggaagtct + 1441 actaagatac ttaaagatgc agatagtaaa aaaatgtaga cattaccgta aaaaagtgat + 1501 ataattgtac gatgttcaag gtataggtgt taatcatgag tagacgtttt aaaaaatcac + 1561 gttcacagaa agtgaagcga agtgttaata tcgttttgct gactatttat ttattgttag + 1621 tttgtttttt attgttctta atctttaagt acaatatcct tgcttttaga tatcttaacc + 1681 tagtggtaac tgcgttagtc ctactagttg ccttggtagg gctactcttg attatctata + 1741 
aaaaagctga aaagtttact atttttctgt tggtgttctc tatccttgtc agctctgtgt + 1801 cgctctttgc agtacagcag tttgttggac tgaccaatcg tttaaatgcg acttctaatt + 1861 actcagaata ttcaatcagt gtcgctgttt tagcagatag tgatatcgaa aatgttacgc + 1921 aactgacgag tgtgacagca ccgactggga ctgataatga aaatattcaa aaactactag + 1981 ctgatattaa gtcaagtcag aataccgatt tgacggtcga ccagagttcg tcttacttgg + 2041 cagcttacaa gagtttgatt gcaggggaga ctaaggccat tgtcttaaat agtgtctttg + 2101 aaaatatcat cgagtcagag tatccagact acgcatcgaa gataaaaaag atttatacca + 2161 agggattcac taaaaaagta gaagctccta agacgtctaa gaatcagtct ttcaatatct + 2221 atgttagtgg aattgacacc tatggtccta ttagttcggt gtcgcgatca gatgtcaata + 2281 tcctgatgac tgtcaatcga gataccaaga aaatcctctt gactacaaca ccacgtgatg + 2341 cctatgtacc aatcgcagat ggtggaaata atcaaaaaga taaattaacc catgcgggca + 2401 tttatggagt tgattcgtcc attcataccc tagagaacct ttatggtgta gatattaatt + 2461 attatgttcg tttgaatttt acctcatttt tgaaattgat tgacttattg ggaggggtag + 2521 atgttcataa tgatcaagag ttttcagctc tacatgggaa gttccatttc ccagtaggga + 2581 atgtccatct agactctgag caagctttag gttttgttcg tgagcgctac tccctagcag + 2641 atggcgatcg tgaccgtggt cgcaaccaac aaaaggtgat tgtggctatc cttcaaaaat + 2701 taacgtcaac cgaagcactg aaaaattata gtacgatcat tgatagcttg caagattcta + 2761 tccaaacaaa tatgccactt gagaccatga taaatttggt caatgctcag ttagaaagtg + 2821 gtggaactta caaagtgaat tcgcaagact tgaaaggtac aggtcggatg gatcttcctt + 2881 cttatgcaat gccagacagt aacctctatg tgatggaaat agatgatagt agtttagctg + 2941 tagttaaagc agctatacag gatgtgatgg aggggagatg aaatgataga catccattca + 3001 catatcgttt ttgatgtaga tgacggtccc aagtcaagag aggaaagcaa ggctctcttg + 3061 gcagaagcct acagacaggg ggtgagaacc attgtctcta cctctcaccg tcgcaagggc + 3121 atgtttgaaa ctccggaaga gaagatagca gaaaactttc ttcaggttcg ggaaatagct + 3181 aaggaagtgg cgagtgactt agtcattgct tacggagctg aaatttacta cacaccagat + 3241 gttctggata agctgggaaa aaagcggatt ccgaccctca atgatagtcg ttatgccttg + 3301 atagagttta gtatgaacac tctttatcgc gatattcata gcgccttgag caagatcttg + 3361 atgttgggaa ttactccagt 
cattgcccac atcgaacgct atgctgctct tgaaaataat + 3421 gaaaaacgcg ttcgggagct gattgatatg ggctgttaca cgcaagtaaa tagttcacat + 3481 gtcctcaaac ccaaactttt tggcgaacgt tataaattca tgaaaaaaag agctcagtat + 3541 tttttagaga aagatttggt tcatatcatt gcaagtgata tgcacaatct agacggtaga + 3601 cctcctcata tggcagaagc atatgacctt gttacccaaa aatacggaga agcgaaggct + 3661 caggaacttt ttatagataa tcctcgaaaa attgtaatgg atcaactaat ttaggagaaa + 3721 tgatgaaaga acaaaacatg atagaaatcg atgtatttca attatttaaa accttgtgga + 3781 aacgcaagct aatgatttta ttagtggcac ttgtgacagg tgcgggggct tttgcatata + 3841 gcacttttat tgttaagcca gaatatacga gtaccacgcg aatttacgta gtgaatcgca + 3901 atcaaggaga cagtccgggg ctgacaaatc aggatttgca ggcaggatct tatctggtaa + 3961 aagactaccg tgagattatc ctttcgcagg atgtattgga aaaagtagcg acaaatttga + 4021 agctggatat gccagccaaa acgttagcca gcaaagttca agtgactgta ccagctgaca + 4081 ctcgtatcgt ctcaatctct gtcaaggata aacagccaga ggaagccagt cgtatcgcta + 4141 attctctacg agaagctgct gcagaaaaga tcgtcgctgt aacgcgagta tctgatgtaa + 4201 cgacacttga agaagcgcga ccagctacga ctccctcttc tccaaatgtt cgacgcaatt + 4261 ccttgtttgg ttttcttgga ggagcagtcg taacagtaat tgctgttctt ttgattgagt + 4321 tgctcgacac ccgtgtgaaa cgtcctgaag atgtcgaaga tgtactgcaa attccacttt + 4381 taggggtcgt tccagatttg aacaaaatga aataggagga agttatgcca acattagaaa + 4441 tctcacaggc aaaattggat tttgtaaaaa aggcagagga aaattataac gctttgtgca + 4501 cgaacctaca gttaagtgga gatgatttga aagtattttc tatcacttct gtgaaagcag + 4561 gagaaggaaa atcaatgact tccaccaata tcgcttgggc ttttgcgcat gcaggttaca + 4621 aaacgctgct gattgatgga gatattcgca attctgttat gttaggtgtc tttaaagcaa + 4681 gggataagat tacaggcctg acagaatttt tatcaggaac tacagaccta tcacaagggc + 4741 tttgtgatac caatatcgaa aatctctttg taattcaggc tggctctgtg tcaccgaatc + 4801 cgacagctct tcttcaaagt aagaatttca gtacaatgct tgaaaccttg cgtaaatatt + 4861 ttgactacat cattgtagat actgctcctg tcggtgtcgt gattgatgcg gctattatta + 4921 cgcgaaaatg cgatgcttct attttagtga cggaggcagg tgaagtaaat cgtcgggata + 4981 ttcaaaaagc aaaagaacag ttggaacaca caggaaagcc 
gtttttggga attgtgttga + 5041 ataaattcga tacttcagta gacaaatacg gttcttatgg aaattatgga gattacggga + 5101 aaaataaaaa ataggtcggg ggatagagat gaatggaaaa atattaaggt cttcattggc + 5161 cataatccag agttttcttg ttattttatt gacttatcta cttagtgctg tgagagaaac + 5221 ggagattgtt tcaacaacag ctattgcact ttatatcctc cattattttg tcttttatat + 5281 cagtgattat ggacaggatt tctttaaaag gagatatttg attgaacttg tccagacatt + 5341 gaaatatatc ctattctttg cactagcgat tagtatttct aattttttct tagaggatcg + 5401 atttagtatt tccagacgag gcatgattta cttcctcaca ttacatgctc tcttagtcta + 5461 tgtgctaaac ctatttatca agtggtattg gaagcgggct tatcccaact ttaaaggaag + 5521 taagaagatt ctcctactta cagcaacttc tcgtgtcgaa aaggtactgg atagattaat + 5581 agaatcaaat gaggttgttg ggaagttggt agccgtcagt gtcttagata aaccagattt + 5641 tcagcatgat tgtttaaagg tagtagcaga gggggagata gtaaactttg cgactcatga + 5701 ggtggtcgat gaagtcttta tcaatcttcc aagtgaaaaa tacaatattg gagagcttgt + 5761 ctctcagttt gaaacgatgg gaattgatgt aatagtcaat ctaaatgctt ttgatcgtag + 5821 tttggcacgt aacaagcaaa ttcgtgagat ggcagggtta aacgttgtga ctttttctac + 5881 aacattttat aagactagtc atgtaattgc taagcggatt attgatatcg tgggtgcatt + 5941 ggtagggctg atactatgtg gtttagtcag tattgtactg gttcctttga ttcgaaagga + 6001 tgggggatct gctatttttg ctcagacgcg tataggaaaa aatggtcgtc agttcacttt + 6061 ttataagttt cgctctatgt gtgtagatgc cgaggcgaaa aaaagagaac ttatggaaca + 6121 aaataccatg caaggtggaa tgtttaaggt ggacgatgat cctcgtatca cgaaaattgg + 6181 ttgttttata cggaagacta gcttggacga gctaccacag ttttataatg ttctaaaggg + 6241 agatatgagt ttggttggca cacggccacc aacagtggac gagtatgagc actatacccc + 6301 agaacaaaaa cgccgactaa gttttaaacc tggcataaca ggtttatggc aggtcagcgg + 6361 acgaagtgag atcaagaatt tcgatgaagt tgtcaaatta gatgtagcct atatagacga + 6421 ttggacaatt tggaaagata ttgagatttt attgaagaca gttaaagttg tattgatgaa + 6481 ggatggagcg aagtaatttc tgtatatcca tcatattagg agagaaatga aaaagtcagt + 6541 ttatatcatt ggttcaaaag gaattcctgc taagtatgga ggatttgaaa cttttgttga + 6601 aaaattaaca gccttccaac aagataaggc tatccaatat tatgtggctt gtatgcgtga + 6661 
aaattctgca aaatcaggga ttactgagga tgtttttgaa cataatggtg ctatctgtta + 6721 taacgtcgat gttcctaata ttggtccagc gcgagctata gcgtatgata tcgctgcaat + 6781 taacagagct attgaaattg ccaaagaaaa taaggatgaa gatccaatct tctatatttt + 6841 agcttgtcga attggtccgt ttatccatgg aattaagaaa agaattcaag caataggtgg + 6901 ggctcttctg gttaatccgg atggtcatga atggctacga gaaaaatgga gtttacctgt + 6961 tcgcaaatat tggaaatact ctgaaagact tatggtcaaa catgcagatc ttttagtgtg + 7021 tgatagtaag aatattgaaa aatatatcca agaagattat aaacagtatc aacctaagac + 7081 aacctatatc gcttatggga ctgatacaac acgctccata ttaaagagta gtgacgaaaa + 7141 agtacgttct tggttcaaag agaagaatgt ttctgaaaac gagtattacc tagttgtagg + 7201 acgttttgtt ccagaaaata actatgaggc tatgatacgt gggtttttag catctaattc + 7261 taagaaggac tttgtcttaa tcacaaatgt agaacagaat aaattttata atcagttgtt + 7321 ggcaaaaact ggttttgata aggacccacg agtaaaattt gtaggtacag tctatgagca + 7381 agagcttctt aaatatattc gtgaaaacgc ctttgcttac ttccacgggc atgaagttgg + 7441 tggaaccaat ccttcgcttt tagaagctct ggcatcaact aaactgaatt tattgctaga + 7501 tgttggcttt aaccgagaag ttggggagca aagtgcaatc tattggaaaa aagatgagct + 7561 ttcccaagta atcgagaaag ttgaacaatt tgatgcaaaa atgattgatg agttagatag + 7621 acaatcaaat cagagaattg tggatttttt cacttgggaa aagattgtca cagactacga + 7681 gaaattattt aaaaaatgaa aatattacat tatactttag gatttcaacc ccagcgaaca + 7741 ggtggtttgg ttaaatatgc tgaggattta atgatagagc aaattgctca aggttatcaa + 7801 gtagccgccc tatgtccagg gagaattaag ttcttttcaa aaaaaataga aataattaaa + 7861 gcgacgtcaa ggcagtttga gtgttatgaa ctgcttaata gcttacctat agctttattt + 7921 ggaggtatat ccgatccaac tgctttcatg acaccttgtg acaaaaatgt ttatcgtact + 7981 tttttagaaa aagtacaacc cgacattata catattcact cgtttatggg attgcataaa + 8041 gaattcctcg aaattgctaa aaacttgaat attagagtgg tttttacgag ccatgattat + 8101 tatggattag cacccgtacc tcatttctat tttaatgggg tggattatag tgataaaaat + 8161 acaaacttaa catggaatat tatgtcttcc aatgctttaa gtgtgaaaaa actaagactt + 8221 tttcaagttt cattttatcc tactattcgt aaacttttga aactattagg gaaaaatcca + 8281 aaatctaaaa agaatttagt 
tattcgagat gttattgagg aacaagatta tagtgaactt + 8341 cgatactatt ataatgagat gtttcactta atagatggtt atttgtttaa tagtagactt + 8401 gcaaagaagg tatatgagat aaacgagatt caaccagtta atagtgtagt attatctata + 8461 acaagtagtt caattaaaca tcatcagaga ttaacgacta caaataataa gattagggtt + 8521 gcttatattg gttcagacga agaatataaa ggttactttg attttattga ctttgctgga + 8581 actttagaac aagaatcata tgaagtggta acttatggtc atttaccaaa tgaagagtgc + 8641 ccttcattca ttgaacaaaa aggatatttt accaaggaaa cgattgacag tgtctatgaa + 8701 aatattgata ttttgattat agcaagcaaa tgtaaagaaa cctttggatt gataacagta + 8761 gaagcattat cctatggggt aaatgttttt gtgagtgaaa atgttggatc aaaagacttg + 8821 cttccagaaa cacatgtttt taaaaatcag aatgatttag tagttaaatt tttaaaaaat + 8881 gatatagaaa atacaaaatt gaaaacttta gatgaacact cgatagaagt gattcagtat + 8941 tatgaaagag tgataaatga tagttaagag tttcataaaa aagattactg gaaaaacagt + 9001 agacattcat ccagatgtac ctttgtcgta tatactacaa agaggtataa actatggttt + 9061 cggactcttt cgtggggttg tacgtggaat cggatttggt caaaacgaca aacgtttatt + 9121 cattggacaa ggagtttcta tcttagcaaa gcgtaaatta tttgttggaa aaaatgttcg + 9181 aattggtaaa aaggtgtcta tagatgcact gtcaaaagaa ggaatccatt ttgcagataa + 9241 tgtaaagatt ggagattatt ctcaaattat tggcacaggt tctataaaaa atatggggat + 9301 tggcttgaaa atcggtaaga actcatcttt ttcagaatat agtttatttg gttctgctgg + 9361 aggtatcaca attggtgata atgttatcgc aggtcagaat gttcgttttc atgctgaaaa + 9421 tcataattat agtgatttag ataaactcat tgttgaacaa ggggtatctc gaaagggaat + 9481 ttcagtaggt gataattgtt ggattggtgc tggatctgtt tttttggatg ggtccagcat + 9541 tggttcaggt tgtgttgtag ctgcaaattc tgtaattacg aaaaactttc cagataacgt + 9601 tattgttgct ggagtaccag ctaaaattat aaaaatgaaa tgataggatg ttaaatgggg + 9661 aaagaaatta aagctgttta tgcgatatta aattacaata cttgggaaga tactgcgcgt + 9721 ttagcacaga aagttgcaac atttcagcat attcaatctg tgataatagt ggataatcta + 9781 tcaacagatg attcatacca ttatttaaaa agacttgagg gagagaaaat ttcagtttat + 9841 caaacacaaa gaaatggtgg atattctgtt ggaaataatg ttgcagcacg aaaagcttat + 9901 aatatgggag ttgatattct tttcatttca aatccagacg 
ttgatattga tgaaaaagat + 9961 tccttgatga ttgcacaaaa tttgtataaa aatagttcat atgcactgct atcaggtata + 10021 gaatataatg ctatgaagga gatagatttg ccaattgtct ggcatgaaaa ttcctattac + 10081 gatgacttac ttgattgttt gtttttaacc agaaaattgc gaagaaaaaa agaagatatc + 10141 aatttgtcaa tgattaaatc atctataata gatgtagatc ttgttaaagg ctcgtttttt + 10201 gctgtaaggc tgtctgattt tcatgatgtt ggttattttg atgaatctgt atttcttttt + 10261 tgtgaagaga gaatattagc caaaaagtta caaaaagcaa ataaaaaaat aggtattctg + 10321 cctgaagcga aatattacca caatcattca acttctataa acgagaagta taaaaagaaa + 10381 aaagaacaga tagttttact atataatgct cgttattatt acaatgtgac gtatcaaaat + 10441 attagctttt tgaaaaaaat ttgcctaaaa ctattcatgt ttttatctat tattgaatac + 10501 tcgatactag attatattaa acgaaaggga tagttatttt tatggttatt aactttagta + 10561 aatataattg gattttaatt ttaattttat cgagctcaga actgttttct aaagaaacaa + 10621 atctattttt attactattt attctactat actatgtttt agttcgtgga ggtagactac + 10681 caatttcaat tccaggagcg aaatattatt ttactttatt aatggtgggg ctatttatag + 10741 gtattgggaa tgtaataatt aacgaaaata cagtatttaa ttttgtaaag cattttatct + 10801 attacttatt acctctattt ttttggcagt ttggatgtgt tctgtcaaat aacgataatt + 10861 tatcttacaa gcaaaacaat attaaggaat caattgttat aacagcattt ctattatctt + 10921 cttatgattt aataggttca atcattagtt tcttgtctag aactaaggaa attgttgatt + 10981 tatatagttt acggtcagag tttggtcgag gttcctatat accaattatt gcactgtatt + 11041 tagttcttgt ttattctaga gaaataaagt tgagcaaaaa ttttaaggga tttttgttat + 11101 tactgtttac aatctcgatt ttgatacatt tttctaggac acattttatt attttattga + 11161 ttctagtatt tttttcagga tttgaaaaaa atatgaaaag tattaaaaaa ataatgtttg + 11221 caggaacatt gatattagca ggtgtaggtg ttttatattt atattttcca aatttagtta + 11281 tagattttta taataaaata tctcaatcaa cgacggaaat cacgttttct aaatcgtcat + 11341 ggtcccataa agatatcata tggaattggc gtggatatga aatgtactct gccttaaatc + 11401 attttaaatc ttcaacttta ttagagcaaa ttttaggagg aggatttgga acagttttat + 11461 acataggcga atatgcgtat ttcgtaagcg atttaccgta tcttcttttt ttacataatg + 11521 gatatttcac tactttactt gtttttggtg ttagtggggt 
catactattc gttttatggg + 11581 tacttagttt atttagttat agcaagtatg ttaatgatac ccaagattca aattttataa + 11641 aaggtcttgc tgtggttata ttatttacca catattttgt aaatggtcct cttttttctg + 11701 tttcacaagc caccttcttg ctttattttg cactttttag taataatcat ggagaattag + 11761 atgaagattt ttaaaaaaat taaatttata ttaatgctgc tttatacctc aacttttcca + 11821 agatgtgaga aaatactgat ttttggatca tggttaggtg aaaaatatgc agacaatcca + 11881 agatatttgt ttgagtatgt gattaagaat cgtcccgatt taaaagctat atggattaca + 11941 agtaatcaag atgtttttaa agaattacag aagaaacaat atcccgtgat gatggcagat + 12001 gagagtgaag ctcataaaat tatgaagaaa gctaaatata tttttacaac tacaggtatt + 12061 tttgatatcg gagtagaaaa tagtaggttg attggcggtg cttttttaat taacctttgg + 12121 catggcattc ctttgaaaaa aatcatgtat gatgataaac attcagcgct tcacaaacgt + 12181 agtaaactag tgacttgggt agaaaaaatt cctcttcgaa actattttgt tatttctact + 12241 agtacggcaa taactcaaat ttatcagtct gcttttcgcg taaagaaatc taatatatta + 12301 gaacttggac agcctagaaa tgactatttt tatgatgagt cttatccagt aagttcgcta + 12361 atacaagaat taaaaagtaa aaatattatc ttatatatgc cgacacatcg caatgaagga + 12421 aagaaacaaa ttcctctaga taatttaatg gatttaaatc gattaaataa atggtgtgaa + 12481 gaaacaaatt caatttttgt aattaaaaaa cacttctatc attcaaaaga aaaaacactt + 12541 gagaaagaat attcatcaat aattgatgtg acaaatgaga aggtcgatgc tcaagaatta + 12601 ctcaaatatt caaagatctt aataactgac tactcgagct gctatattga ctacttattg + 12661 ttggatcgac caattatatt ttttaattat gactatgatg attatttgag gattgatcgt + 12721 tcgctatatt ttccatatga gaaggttact ccaggggaga aatgtcaaaa ctttgatgaa + 12781 ttattagtga ctctgcaaaa tctatatcta ggaaaagatg attataggaa aaagcgtgaa + 12841 aatattaaaa ctttctttta ttctagtgaa actcagaagt cagtttctga aaaaatcatt + 12901 aatcacgtac taaatctata actttattgg aatctgtaat gaaaaaaata ttaaataagt + 12961 attattcttt atctaatcct gtaaaagctt caatttggtt tactatttgc aatgttcttc + 13021 aaaaaggaat ttcaatgatt actgttccaa tttttactag attattgaca acggaacaat + 13081 atggtgtata ctctgtatat caatcatggt attcaataat tggagttttt gcaacactaa + 13141 acctatatta tggagtcttt aataatggaa tggttaaata 
cgagaaagat aaaaatgcct + 13201 ttacttcctc tatgcaggga ctaacaacaa cagttacagc tatattttta gtgatatatt + 13261 taatagggat tgatttttgg aactcgttgt taggcttacc tacgctacta atcttagtga + 13321 tgttctttga tttgtttttt actcctgctt attctttttg ggctacgcgt cagagatttg + 13381 aatatcaata tcgaaactta gtatttatca cacttattat agcgattgga agccctatta + 13441 ttggtatttc ttcagttgtt ttatcgactt ataaagcgga ggctagagtt atctcatttg + 13501 tgttagttca atcttgtata ggattatatt tctatgtttt gaacctttac cgaggtaaat + 13561 attttttttg taaaaaatat tggctctatg ctttgaattt taatttacct cttattcctc + 13621 attatttatc gcaatcagtt ttaaatcaat cggatagaat aatgattaat tcaatggtag + 13681 gaatgggaga agcagctatt tatagtgttg cttacagcat atcaactttg atggttttag + 13741 tgacaagtgc tataaacagc tcttttattc cttacacata taagtgtatt cgagataaga + 13801 aatatactga actagggaaa agtgcaaatc ttttaattac tctggtaggc attggttcga + 13861 ttttaactat ttctcttgga ccagaaatca ttcaattatt tgcaccaaaa caatattacg + 13921 aagcaatatg gattattcct ccagttgctc tttcagtata tttcatgttc ttatatccca + 13981 tttttggtaa cattgagttt tactttgaag caaatcattt tgtaatgtgg gcttcaatag + 14041 gtggagcaat tatgaatatt tttttgaatt ttatttttat aaaacacttt ggctatattg + 14101 cggcaggcta tacaacttta ttatgttata ttttatttgc attgggacat tacattttta + 14161 tgagaagagc attgtatcag aatctttcgg gtatccaaat ttatgattct cgatatattt + 14221 tctttttttc gtttcttctt ctgattctaa tgctactaat cgtgactatt tatccatttg + 14281 tgttgattcg ttatattgct atctcactca tcctaggagg atgtttttta aagaggagaa + 14341 agataatgag ttcgatagtc atgataaaaa aacagtgagg tacacgaatg acagaaataa + 14401 ataaacagtt acatgaaaca ttaatcgaaa ttttagactt tgtaaaagaa atttgtgaaa + 14461 aacatgaatt aacttatttt ttgatctatg gtacggcact cggtgcaaaa cgccattgtg + 14521 gatttattcc ttgggatgat gatgttgata ttgctttacc gcgagagcac tacaatatat + 14581 taatcgacgt gttatctaag atggaacaat ctatatttag tcttcaaaat gaagataacg + 14641 agccgaacta ttttttacca tttgctaaat taagaaaaaa caatacgatt tttattgaaa + 14701 agattcttga tgttgaatat gagaataacg gtatttacat tgatattttt ccactagatt + 14761 tcgtagagaa tccggactct tttaatttta agatgaggag 
aactatgttt aattatataa + 14821 agcatatttt aaaattttca agttgcagaa gtttttataa aaataaatac agtagcgtac + 14881 gttatttgat ggaaaatatt atgagtattc ctaccctgtt tttttcaaat aggagattac + 14941 tattcttagc gaataattta atttcatcaa cgaataaagc taattttatt ggtcaatatg + 15001 atgaaagtag cgaaagagct atcatgcctt caagctatta tttcccgtct agatccgctg + 15061 tgtttgaagg aaagatttat agtgttcctg cgaaattaga agattattta aaatattttt + 15121 atggttcgga ttatatggaa ttaccaccaa tagaaaaaag agtcactcat caaccaataa + 15181 aacttagatt caaaaaataa ttggctattc tgtagaagga gaataattca agagttgtga + 15241 agtaaaacat tgggttattt ttaaggtaac gagatttgaa aaataatgat ttaaagatag + 15301 gaagtggagc tattcatcaa atttccgcta cactttctca aaatagtatt tcgggaaaga + 15361 ttttatattg tgctgatcca gttgtcgatg acttgtacgg ttcgatagta cgttcacaaa + 15421 tagaggaaat tggtcgggta aaggaagaaa gttgcaatta taatactatt gcttatgcga + 15481 tgaatatagc agaacgggct attgccacag atattgactg tattgtggga atgggaggag + 15541 gtcgtgtttt agatgtctgc aagtatgcat cttttatttc gaaacgtcct tacctatcga + 15601 ttccgacaac agcagcaaat gatggcattg cttccccagt tgctgttttg aaaaggcagg + 15661 atgatagacc aaaaagctta ggggcggcta tcccctcaat gacactaatt gatattgatg + 15721 ttattgcatc aggacctata caaaatataa aagctggtat cggtgataca atatccaatt + 15781 acactgcatt gaaagattgg gagttggcag ttgagcgagg gaaagatgag atgcatggtt + 15841 ttgcatatct aatgtcgcaa aattctttag atgctttaat gaaaacgaag tataattcta + 15901 ttacccctga ttttattgaa gttttggtaa actctttagt tttatcaggc attgcaatgg + 15961 attttgcggg aagtagtaga cctgtcagtg ggtcagagca cttatttagt catgcattag + 16021 attactatgg ttctacaagg aatcttcatg gaattcaggt tgcattaggt acagtcgcag + 16081 ttttgaaatt aattgaaaat tctgttgata ctgtagtgga ttacttgcaa agatttgagg + 16141 ttcatattaa cccgaaactt ttggggatag atgaagagtt gtttatttat tgtatgcaac + 16201 atgctacaaa aatgagaagt aatcgctata cttatctgca tgaagttgat cttagcacag + 16261 atagattgaa acaaatatat aaggaactca taagcgagtt gtagaaaaga gaggaaaaaa + 16321 tgaaagcact tattttagca gcagggttag gaacacgtct agctccaatt accaatgagg + 16381 taccaaaatc tttggtacca gtcaatggta agccaatttt 
gatgaaacaa attgaaaatt + 16441 tatatcaaaa taatattaca gatattacga ttattgctgg atataagtca tctgtattaa + 16501 cagatgcagt tactgaaaag tatccagaaa ttaatattat tgataatgtt gattttaaaa + 16561 cgactaataa tatgtattca gcctatctag gaaaagctgc aatgggtgat agtgacttct + 16621 taatgatgaa tgcagatgta ttttatgatg cttctgttat taaaagtctg ttgcttcata + 16681 aagctccaaa tgcaattgta actgatttag gtatttatat tgaagagtct atgaaagtcg + 16741 tagaaaaaaa tgggcgttta gtagaaattt ctaaacagat ttcacctgag gaaactttag + 16801 gagcttctat tgatgtttat aaattctctt atgaagcagg tgctcgattc tttgaaaagt + 16861 gtaaggaatt tattgaagat aaacgagaac ttcaaatgtg gagtgaggtt gctcttaatg + 16921 caattctttc tgaagttgaa tttgtagcat gtccattaga gggtcgttgg ttagaaattg + 16981 ataatcatga agacttagtt gctgcagaaa aactatttgc ttgaaccgaa tacggagaat + 17041 gaaattgaca aatagagttg attattttgg tgctgatatt agtgaacttc agaataaaaa + 17101 attattctta tttgatatgg atggtaccat ttatgaagaa gataggttgt ttgagggtac + 17161 tctcgaatta ttagactata ttcataatat tggcggtgag tatattttta ttacaaacaa + 17221 ttcatctaag tctgttgttg actatgttga aaaagttaac agattaggta ttaaagctga + 17281 acgagataat ttttttacct ctgctcaggc cacaattgtt tatattaaag aaaattatcc + 17341 taaatctaaa gtttattgcc aaggaacaaa atctttgata aaagaactat ctgacgcagg + 17401 aattgatgta actgagcaag ttagtgctga tatagatgtt gttcttgttg gttttgatac + 17461 agaattaacc agtgataaaa ttcgcaatac ctgcgagatt ctatcaacaa aggacgtacc + 17521 tttcatagct actaaccctg atattcgctg cccagtatcg tttggattca tcccggattg + 17581 tggttctatt tgtgatatga ttagtaaatc agtcgatagg aaacctgttt acataggtaa + 17641 acctgaacct acgatggttg atattgttcg aaaaaaatta aattattctc tatttgaaac + 17701 agttgtgatt ggagatcgct tgtatacgga tatcatgact ggtataaatg caggagtaac + 17761 ttcagtttgt gtgctgacag gagaagcaac ggtgaatgat attcaacaag atagtataaa + 17821 accgacttat acatttaaaa acgtgaaaga aatgtggaaa ggaattgtct gattttttca + 17881 ttctgaatag tgaattcatg aatactgtca aaatactcgt atgtatttaa attgatttca + 17941 ttattttaat aatggacaaa ttaaaattat ttttctcccc aaatcgttcg tgaacgtaaa + 18001 gtactcatca acaaagaaag gtaccccttt tatgaaaggt 
attattctag caggtggttc + 18061 gggaactcgc ttgtatcctt tgactcgagc cgcatcaaaa caacttatgc cggtttatga + 18121 taaaccgatg atttactacc cactttcaac attgatgttg gctgggatta gggatatttt + 18181 gattatttcc actccacagg atttacatcg atttcaagag cttcttcaag acggatctga + 18241 gtttgggatc aaactttctt atgcagagca accaagtcca gatggtttgg cacaagcctt + 18301 tatcattggg gaagagttta tttctgatga tagcgttgcg ctaatcttag gtgataatat + 18361 ctaccatggt tctgggcttt ccaagatgct acaaaaggca gcgagtaagg agtcgggagc + 18421 aactgttttt ggctaccatg tcaaggatcc agagcgcttt ggtgtggttg agtttgatca + 18481 ggatatgaag gctatttcta ttgaagaaaa gccagagcaa cctcgttcaa actatgcagt + 18541 tacaggtctc tatttctatg ataatgatgt agtagagatt gccaaaagta ttaaaccaag + 18601 tcctcgtggt gaattggaaa ttacagacgt taacaaggct tatctagaac gtggtgattt + 18661 gtctgttgag cttatgggac gtggctttgc ttggttggat actggcactc atgaaagttt + 18721 actagaggct tcgcagtaca tcgaaacagt ccaacggatg caaaatgttc aggtagcaaa + 18781 cttagaagaa attgcctatc gcatgggtta tatcagtcgt gaagatgtat tgaccttagc + 18841 ccaaccactt aagaaaaatg aatacggaca gtatctgctc cgtttgattg gagaagcata + 18901 gatgacagat aattttttcg gtaagacgct tgcggcacgc aaggttgaaa ctattccagg + 18961 catgttggag tttgatatcc ccgttcatgg agataatcgt ggctggttta aagaaaattt + 19021 ccaaaaggaa aaaatgcttc cacttggatt tccagagtct ttctttgcag aaggaaaatt + 19081 gcaaaacaat gtatccttct cacgtaaaaa tgtccttcga ggcctccacg cagagccttg + 19141 ggataagtac atctctgtag cagatggagg gaaagttctg ggttcttggg ttgatctacg + 19201 cgagggtgaa acctttggga atacctatca gacagtaatt gatgcaagca agggaatctt + 19261 tgttcctcga ggcgtagcta atggcttcca agttctatca gatacagtgt catatagcta + 19321 tctggtcaat gattactggg ctctcgagct caaacccaag tatgcctttg tgaactacgc + 19381 tgatccaagc cttggtattg aatgggaaaa tattgcagaa gcagaggttt cagaagcaga + 19441 taaatatcat cccctactta aggatgtaaa acctttgaaa aaagaagatt tgtaaaaagg + 19501 aaagaatatg actgaataca aaaatattat cgtgacaggt ggagctggct ttatcggttc + 19561 taactttgtc cattatgttt acgagaactt tccaggtgtt cacgtgacag tcctagataa + 19621 gttgacttat gctggaaatc gcgcgaatat tgaggaaatt 
ttaggtaatc gtgttgagtt + 19681 agttgttggt gacattgctg atgcggagtt ggtagacaag ttggctgctc aagcagatgc + 19741 tatcgttcat tatgcagcgg aaagccacaa tgataattcg ctcaatgatc catcgccatt + 19801 tattcatact aacttcatcg gaacctatac tcttttagaa gctgctcgta agtatgatat + 19861 tcgcttccac catgtatcga cagatgaagt ttatggggat ctccctttac gcgaagattt + 19921 gccaggtcat ggagaagggc cgggtgagaa atttacggct gaaaccaagt acaatccaag + 19981 ctcgccttac tcatcaacca aggcagcctc agatttgatt gtcaaagcct gggtccgttc + 20041 ttttggagtc aaggcaacga tttccaactg ttcaaataac tacggtcctt atcaacatat + 20101 cgaaaaattc atcccacgtc agattactaa catcctaagt ggaattaagc caaaacttta + 20161 cggtgaaggt aagaacgttc gtgactggat tcataccaat gaccattctt caggagtttg + 20221 gacaatcttg acaaaagggc aaattggtga aacctacttg attggggctg atggtgagaa + 20281 gaacaataag gaagttttgg aacttatcct taaggaaatg ggacaagctg cggatgccta + 20341 tgatcatgtg actgaccgtg caggacatga ccttcgctat gcgattgatg ctagcaagct + 20401 ccgtgatgag ttggggtgga aacctgaatt taccaacttt gaagctgggc tcaaggcaac + 20461 aatcaagtgg tatacagata accaagaatg gtggaaagca gaaaaagaag ctgttgaagc + 20521 caattatgct aagactcagg agattattac agtataaaaa gcaggaaata gctgcttttt + 20581 attgctatat tgggaagagt tacatattag aaaggtctag agatgatttt aattacaggg + 20641 gcaaatggcc aattaggaac ggaacttcgc tatttattgg atgaacgtaa tgaagaatac + 20701 gtggcagtag atgtggctga gatggacatt atcgatgcag aaatggttga gaaagttttt + 20761 gaagaggtga aaccgacttt agtctaccac tgtgcagcct acaccgctgt tgatgcagca + 20821 gaggatgaag gaaaagagtt ggacttcgcc atcaatgtga cggggacaaa aaatgtcgca + 20881 aaagcatctg aaaaacatgg tgcaactcta gtttatattt ctacggacta tgtctttgac + 20941 ggtaagaaac cagttgggca agagtgggaa gttgatgacc gaccagatcc acagacagaa + 21001 tatggccgta ctaagcgtat gggggaagag ttagttgaga agcatgtgtc taatttctat + 21061 attatccgta ctgcctgggt atttggaaat tatggcaaaa acttcgtttt taccatgcaa + 21121 aatcttgcga aaactcataa gactttaaca gttgtaaatg accagtacgg tcgtccgact + 21181 tggactcgta ccttggctga gttcatgacc tacctagctg aaaatcgtaa ggaatttggt + 21241 tattatcatt tgtcaaatga tgcgacagaa gacacaacat 
ggtatgattt tgcagttgaa + 21301 attttgaaag atacagatgt cgaagtcaag ccagtagatt ccagtcaatt tccagccaaa + 21361 gctaaacgtc cgctaaactc aacgatgagc ctggccaaag ccaaagctac tggatttgtt + 21421 attccaactt ggcaagatgc attgcaagaa ttttacaaac aagaagtgag ataagtagta + 21481 gaatgatttt ctagtctaat aaaagaggta gataatgaac tccaaaggag cttaagatat + 21541 acgattatct tgttgttggt gctggtctct ttggtgcata gctatggctc agtttctatt + 21601 atcgctcaca ccatccatca gaagtttaat ctgaaggtac ccaattatcg ccaagaagaa + 21661 gattgggcta agatgggttt accaatcaca cgcaaggaaa tctctaattg gcatatcaag + 21721 acgagtcaat actatttgga gcccctctat aacctcttgc gagagagact attgactcag + 21781 cccttacttc atgcggatga aacttcttat agggtgctag agagtgatag tcagctgact + 21841 tactattgga cttttttgtc aggtaaatca gagaaacaag ggattacgct ttaccaccat + 21901 gatcagtgtc gaagtggttc agtagtacaa gaattcctag gagattattc tggctatgtg + 21961 cattgtgata tgttgtggca gtaacttagg actttagtcc tctagttctg cctatgcgat + 22021 agcagtccaa agtttaggag taaggcgacg ctaagcttgg taaactgcga acagctagaa + 22081 gcttatcgtc aactggaaga agctgcactt gttggatgtt gggcgcatgt gagaaggaag + 22141 ttttttgaag cgacccccaa gcaagcagat aaatcatcct taggagctaa aggtttagtt + 22201 tattgtgatc agttattttc cttggaaaga gactgggagg ctttgccagc tgatgaacga + 22261 ctacagaaac gtcaagaaca tctccaaccc ctactggaag acttctttgc ttggtgccgg + 22321 cgtcagtcag ttttatcggg ttcaaaacta ggaagggcaa ttgaatacag cctcaagtat + 22381 aaagaaacct ttaagaccat tttgaaagac ggacatctgg tcctttccaa taatctagct + 22441 gaatgcacca ttaaatcatt ggttatggga cggagtaaaa gagtccagtg gactctttta + 22501 gcctaagctc agtttaaaaa agcgagggtg gttattttct caaagttttg aaggagctaa + 22561 agcaagagct attattatga gtttgttgga aacagctaaa cgtcatcaat taaatagcga + 22621 gaaatatcta ttctatcttc tagaatgtct tccaaacgag gaaactctcg taaacaaaga + 22681 ggttttagag gtttatttat catggactaa agttgtacaa gaaaagtgca aataagaaat + 22741 ctccagatta ggaactatcc gtgagttctc tagtctggag atttttcaat atacttcgtt + 22801 attgggcggt tacgatattc atattttttg caaagatgtt gtttgaaaaa taattttcaa + 22861 aaattctgaa aattctgttg acaactttct gaaaagagtc 
tataatggag agaaagtttt + 22921 aaaggagaaa atgatgaaaa gttcaagact acttgccctt gcgggcgtga cattattg +// + diff --git a/public/res/serotype_genbank/serotype_28F.gb b/public/res/serotype_genbank/serotype_28F.gb new file mode 100644 index 0000000..30a6258 --- /dev/null +++ b/public/res/serotype_genbank/serotype_28F.gb @@ -0,0 +1,1045 @@ +LOCUS CR931693 21839 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 34372 (serotype 28f). +ACCESSION CR931693 +VERSION CR931693.2 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 21839) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 21839) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT On Mar 17, 2006 this sequence version replaced CR931693.1. + NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..21839 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="34372" + /db_xref="taxon:1313" + gene <1..163 + /gene="dexB" + /locus_tag="SPC28F_0001" + CDS <1..163 + /gene="dexB" + /locus_tag="SPC28F_0001" + /codon_start=2 + /transl_table=11 + /protein_id="CAI34045.2" + /db_xref="GOA:Q4K2R1" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K2R1" + /translation="DRRFLVVANLSNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVP + WDAFCVELL" + gene 321..489 + /gene="aliB" + /locus_tag="SPC28F_0002" + /pseudo + CDS 321..489 + /gene="aliB" + /locus_tag="SPC28F_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(490..1007) + /gene="tnp" + /locus_tag="SPC28F_0003" + /pseudo + CDS complement(join(490..618,618..1007)) + /gene="tnp" + /locus_tag="SPC28F_0003" + /note="member of homology group 4; + old_tribe:0004 68" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + gene 1219..2673 + /gene="wzg" + /locus_tag="SPC28F_0004" + CDS 1219..2673 + /gene="wzg" + /locus_tag="SPC28F_0004" + /note="member of homology group 0; + old_tribe:0000 80" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI34048.2" + /db_xref="GOA:Q4K008" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K008" + /translation="MLIMSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNI + LAFRYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGL + TNRLNATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNT + DLTVNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKV + EAPKTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPI + ADGGNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGVDVH + NDQEFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKL + TSTEALKNYSTIIDSLQDSIQTNMPLETMINLVNAQLESGGTYKVNSQDLKGTGRMDL + PSYAMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + 
misc_feature 1432..1779 + /gene="wzg" + /locus_tag="SPC28F_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 1.6e-64" + misc_feature 1957..2400 + /gene="wzg" + /locus_tag="SPC28F_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 8.4e-70" + gene 2675..3406 + /gene="wzh" + /locus_tag="SPC28F_0005" + CDS 2675..3406 + /gene="wzh" + /locus_tag="SPC28F_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1; + old_tribe:0001 80" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34049.2" + /db_xref="GOA:Q4K007" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K007" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAEAYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLGKKRIPTLNDS + RYALIEFSMNTLYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEKDLVHIIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 2678..3286 + /gene="wzh" + /locus_tag="SPC28F_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 2.7e-37" + gene 3412..4107 + /gene="wzd" + /locus_tag="SPC28F_0006" + CDS 3412..4107 + /gene="wzd" + /locus_tag="SPC28F_0006" + /note="member of homology group 2; + old_tribe:0002 80" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34050.2" + /db_xref="GOA:Q4K006" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K006" + /translation="MMKEQNMIEIDVFQLFKTLWKRKLMILLVALVTGAGAFAYSTFI + VKPEYTSTTRIYVVNRNQGDNPGLTNQDLQAGSYLVKDYREIILSQDVLEKVATNLKL + DMPAKTLASKVQVTVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIELLDTRVKRPEDVEDVLQI + PLLGVVPDLNKMK" + misc_feature 3433..3849 + /gene="wzd" + /locus_tag="SPC28F_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 1.1e-56" + gene 4117..4806 
+ /gene="wze" + /locus_tag="SPC28F_0007" + CDS 4117..4806 + /gene="wze" + /locus_tag="SPC28F_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3; + old_tribe:0003 80" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34051.2" + /db_xref="GOA:Q4K005" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K005" + /translation="MPTLEISQAKLDFVKKAEENYNALCTNLQLSGDDLKVFSITSVK + AGEGKSMTSTNIAWAFAHAGYKTLLIDGDIRNSVMLGVFKARDKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRKCDASILVTEAGEVNRRDIQKAKEQLEHTGKPFLGIVLNKFDTSVDKYGSY + GNYGDYGKNKK" + gene 4821..6188 + /gene="wchA" + /locus_tag="SPC28F_0008" + CDS 4821..6188 + /gene="wchA" + /locus_tag="SPC28F_0008" + /note="member of homology group 5; + old_tribe:0005 59" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI34052.2" + /db_xref="GOA:Q4K004" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K004" + /translation="MNGKILRSSLAIIQSFLVILLTYLLSAVRETEIVSTTAIALYIL + HYFVFYISDYGQDFFKRRYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYF + LTLHALLVYVLNLFIKWYWKRAYPNFKGSKKILLLTETSRVEKVLDRLIESNEVVGKL + VAVSVLDKPDFQHDCLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + IDVIVNLNAFDRSLACNKQIREMAGLNVVTFSTTFYKTSHVIAKRIIDIVGALVGLIL + CGLVSIVLVPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKIGCFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVLM + KDGAK" + misc_feature 5604..6185 + /gene="wchA" + /locus_tag="SPC28F_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 2.8e-160" + gene 6219..7391 + /gene="wchF" + /locus_tag="SPC28F_0009" + CDS 6219..7391 + /gene="wchF" + /locus_tag="SPC28F_0009" + /note="member of homology group 15; + old_tribe:0014 23" + /codon_start=1 + /transl_table=11 + 
/product="putative rhamnosyl transferase WchF" + /protein_id="CAI34053.2" + /db_xref="GOA:Q4K003" + /db_xref="InterPro:IPR001296" + /db_xref="InterPro:IPR015393" + /db_xref="UniProtKB/TrEMBL:Q4K003" + /translation="MKKSVYIIGSKGIPAKYGGFETFVEKLTAFQQDKAIQYYVACMR + ENSAKSGITEDVFEHNGAICYNVDVPNIGPARAIAYDIAAINRAIEIAKENKDEDPIF + YILACRIGPFIHGIKKRIQAIGGTLLVNPDGHEWLREKWSLPVRKYWKYSERLMVKHA + DLLVCDSKNIEKYIQEDYKQYQPKTTYIAYGTDTTRSILKSSDEKVRSWFKEKNVSEN + EYYLVVGRFVPENNYEAMIRGFLASNSKKDFVLITNVEQNKFYNQLLAKTGFDKDPRV + KFVGTVYEQELLKYIRENAFAYFHGHEVGGTNPSLLEALASTKLNLLLDVGFNREVGE + QSAIYWKKDELSQVIEKVEQFDAKMIDELDRQSNQRIVDFFTWEKIVTDYEKIFKK" + gene 7388..8659 + /gene="wciU" + /locus_tag="SPC28F_0010" + CDS 7388..8659 + /gene="wciU" + /locus_tag="SPC28F_0010" + /note="member of homology group 59; + old_tribe:0042 7" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34054.2" + /db_xref="GOA:Q4K002" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K002" + /translation="MKILHYTLGFQPQRTGGLVKYAEDLMLEQIAQGYQVAALYPGRI + KFFSKKIEIIKAMSRQFECYELLNSLPMALFGGISDPTAFLTPCDKNVYRTFLEKVQP + DIIHIHSFMGLHKEFLEIAKNLNIRVVFTSHDYYGLAPVPHFYFNGVDYSNKSTNLTW + NIMSSNALSVKKLRLFQVSFYPTIRKLLKLLGKNPKSKKNLVIRDVIEEQDYSELRYY + YNEMFHLIDGYLFNSRLAKKVYEINEIKSANSIVLSITNSSINHHQRLTTTNNKIRVA + YIGPDEEYKGYFDFIDFVETLDRESYEVATYGHLPNGECPSFIEQKGYFTKEMIDSVY + ENIDILIVPSKWKETFGLITVEALSYGVNVFVSENVGSKDLLPESHVFKNQNDLVVKF + LKNDIENTKLKTLDEHSIEVIQYYERVINDS" + misc_feature 8162..8623 + /gene="wciU" + /locus_tag="SPC28F_0010" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 0.0016" + gene 8649..9335 + /gene="wcxM" + /locus_tag="SPC28F_0011" + CDS 8649..9335 + /gene="wcxM" + /locus_tag="SPC28F_0011" + /note="member of homology group 105; + old_tribe:0078 4" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI34055.2" + /db_xref="GOA:Q4K001" + /db_xref="InterPro:IPR011004" + /db_xref="UniProtKB/TrEMBL:Q4K001" + 
/translation="MIVKSFIKKITGKTVDIHPDVPLSYILQRGINYGFGLFRGVVRG + IGFGQNDKRLFIGQGVSILAKRKLFVGKNVRIGKKVSIDALSKEGIHFADNVKIGDYS + QIIGTGSIKNMGIGLKIGKNSSFSEYSLFGSAGGITIGDNVIAGQNVRFHAENHNYSD + LDKLIVEQGVSRKGISVGDNCWIGAGSVFLDGSSIGSGCVVAANSVITKNFPDNVIVA + GVPAKIIKMK" + misc_feature 8847..8900 + /gene="wcxM" + /locus_tag="SPC28F_0011" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 16" + misc_feature 8913..8966 + /gene="wcxM" + /locus_tag="SPC28F_0011" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 13" + misc_feature 9054..9107 + /gene="wcxM" + /locus_tag="SPC28F_0011" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 10" + misc_feature 9168..9221 + /gene="wcxM" + /locus_tag="SPC28F_0011" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 11" + misc_feature 9222..9275 + /gene="wcxM" + /locus_tag="SPC28F_0011" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 1.7" + gene 9347..10225 + /gene="wcxN" + /locus_tag="SPC28F_0012" + CDS 9347..10225 + /gene="wcxN" + /locus_tag="SPC28F_0012" + /note="member of homology group 154; + old_tribe:0096 3" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34056.2" + /db_xref="GOA:Q4K000" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K000" + /translation="MGKEIKAVYAILNYNTWEDTARLAQKVATFQHIQSVIIVDNLST + DDSYHYLKRLEGEKISVYQTQRNGGYSVGNNVAARKAYNMGVDILFISNPDVDIDEKD + SLMIAQNLYKNSSYALLSGIEYNAMKEIDLPIVWHENSYYDDLLDCLFLTRKLRRKKE + DINLSMIKSSIIDVDLVKGSFFAVRLSDFHDVGYFDESVFLFCEERILAKKLQKANKK + IGILPEAKYYHNHSTSINEKYKKKKEQIVLLYNARYYYNVTYQNISFLKKICLKLFMF + LSIIEYSILDYIKRKG" + gene 10234..11466 + /gene="wzy" + /locus_tag="SPC28F_0013" + CDS 10234..11466 + /gene="wzy" + /locus_tag="SPC28F_0013" + /note="old_tribe:0172 2; + member of homology group 251" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide 
repeat unit polymerase Wzy" + /protein_id="CAI34057.2" + /db_xref="InterPro:IPR007016" + /db_xref="UniProtKB/TrEMBL:Q4JZZ9" + /translation="MVINFSKYNWILILILSSSELFSKETNLFLLLFILLYYVLVRGG + RLPISIPGAKYYFTLLMVGLFIGIGNVIINENTVFNFVKHFIYYLLPLFFWQFGCILS + NNDNLSYKQNNIKESIVITAFLLSSYDLIGSIISFLSRTKEIVDLYSLRSEFGRGSYI + PIIALYLVLVYSREIKLSKNFKGFLLLLFTISILIHFSRTHFIILLILVFFSGFEKNM + KSIKKIMFAGTLILAGVGVLYLYFPNLVIDFYNKISQSTTEITFSKSSWSHKDIIWNW + RGYEMYSALNHFKSSTLLEQILGGGFGTVLYIGEYAYLVSDLPYLLFLHNGYFTTLLV + FGVSGVILFVLWVLSLFSYSKYVNDTQDSNFIKGLAVVILFTTYFVNGPLFSVSQATF + LLYFALFSNNHGELDEDF" + gene 11453..12613 + /gene="wcxP" + /locus_tag="SPC28F_0014" + CDS 11453..12613 + /gene="wcxP" + /locus_tag="SPC28F_0014" + /note="member of homology group 155; + old_tribe:0097 3" + /codon_start=1 + /transl_table=11 + /product="putative glycerol phosphotransferase" + /protein_id="CAI34058.2" + /db_xref="GOA:Q4JZZ8" + /db_xref="InterPro:IPR007554" + /db_xref="UniProtKB/TrEMBL:Q4JZZ8" + /translation="MKIFKKIKFILMLLYTSTFPRCEKILIFGSWLGEKYADNPRYLF + EYVIKNRPDLKAIWITSNQDVFKELQKKQYPVMMADESEAHKIMKKAKYIFTTTGIFD + IGVENSRLIGGAFLINLWHGIPLKKIMYDDKHSALHKRSKLVTWVEKIPLRNYFVIST + STAITQIYQSAFRVKKSNILELGQPRNDYFYDESYPVSSLIQELKSKNIILYMPTHRN + EGKKQIPLDNLMDLNRLNKWCEETNSIFVIKKHFYHSKEKTLEKEYSSIIDVTNEKVD + AQELLKYSKILITDYSSCYIDYLLLDRPIIFFNYDYDDYLRIDRSLYFPYEKVTPGEK + CQNFDELLVTLQNLYLGKDDYRKKRENIKTFFYSSETQKSVSEKIINHVLNL" + misc_feature 12041..12607 + /gene="wcxP" + /locus_tag="SPC28F_0014" + /note="HMMPfam hit to PF04464, + CDP-Glycerol:Poly(glycerophosphate) gl, score 4.5e-32" + gene 12619..14070 + /gene="wzx" + /locus_tag="SPC28F_0015" + CDS 12619..14070 + /gene="wzx" + /locus_tag="SPC28F_0015" + /note="member of homology group 52; + old_tribe:0058 5" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI34059.2" + /db_xref="GOA:Q4JZZ7" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4JZZ7" + /translation="MESVMKKILNKYYSLSNPVKASIWFTICNVLQKGISMITVPIFT + 
RLLTTEQYGVYSVYQSWYSIIGVFATLNLYYGVFNNGMVKYEKDKNAFTSSMQGLTTT + VTAIFLVIYLIGIDFWNSLLGLPTLLILVMFFDLFFTPAYSFWATRQRFEYQYRNLVF + ITLIIAIGSPIIGISSVVLSTYKAEARVISFVLVQSCIGLYFYVLNLYRGKYFFCKKY + WLYALNFNLPLIPHYLSQSVLNQSDRIMINSMVGMGEAAIYSVAYSISTLMVLVTSAI + NSSFIPYTYKCIRDKKYTELGKSANLLITLVGIGSILTISLGPEIIQLFAPKQYYEAI + WIIPPVALSVYFMFLYPIFGNIEFYFEANHFVMWASIGGAIMNIFLNFIFIKHFGYIA + AGYTTLLCYILFALGHYIFMRRALYQNLSGIQIYDSRYIFFFSFLLLILMLLIVTIYP + FVLIRYIAISLILGGCFLKRRKIMSSIVMIKKQ" + misc_feature 12670..13482 + /gene="wzx" + /locus_tag="SPC28F_0015" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 2.9e-12" + gene 14080..14892 + /gene="wcxQ" + /locus_tag="SPC28F_0016" + CDS 14080..14892 + /gene="wcxQ" + /locus_tag="SPC28F_0016" + /note="member of homology group 156; + old_tribe:0098 3" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="CAI34060.2" + /db_xref="GOA:Q4JZZ6" + /db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4JZZ6" + /translation="MTEINKQLHETLIEILDFVKEICEKHELTYFLIYGTALGAKRHC + GFIPWDDDVDIALPREHYNILIDVLSKMEQSIFSLQNEDNEPNYFLPFAKLRKNNTIF + IEKILDVEYENNGIYIDIFPLDFVENPDSFNFKMRRTMFNYIKHILKFSSCRSFYKNK + YSSVRYLMENIMSIPTLFFSNRRLLFLANNLISSTNKANFIGQYDESSERAIMPSSYY + FPSRSAVFEGKIYSVPAKLEDYLKYFYGSDYMELPPIEKRVTHQPIKLRFKK" + misc_feature 14146..14817 + /gene="wcxQ" + /locus_tag="SPC28F_0016" + /note="HMMPfam hit to PF04991, LICD Protein Family, score + 1.4e-36" + gene 14968..15996 + /gene="gtp1" + /locus_tag="SPC28F_0017" + CDS 14968..15996 + /gene="gtp1" + /locus_tag="SPC28F_0017" + /note="member of homology group 40; + old_tribe:0030 9" + /codon_start=1 + /transl_table=11 + /product="putative glycerol-2-phosphate dehydrogenase" + /protein_id="CAI34061.2" + /db_xref="GOA:Q6X849" + /db_xref="InterPro:IPR002658" + /db_xref="InterPro:IPR016205" + /db_xref="UniProtKB/TrEMBL:Q6X849" + /translation="MKNNDLKIGSGAIHQISATLSQNNISGKILYCADPVVDDLYGSI + VRSQIEEIGRVKEESCNYNTIAYAMNIAERAIATDIDCIVGMGGGRVLDVCKYASFIS + 
KRPYLSIPTTAANDGIASPVAVLKRQDDRPKSLGAAIPSMTLIDIDVIASGPIQNIKA + GIGDTISNYTALKDWELAVERGKDEMHGFAYLMSQNSLDALMKTKYNSITPDFIEVLV + NSLVLSGIAMDFAGSSRPVSGSEHLFSHALDYYGSTRNLHGIQVALGTVAVLKLIENS + VDTVVDYLQRFEVHINPKLLGIDEELFIYCMQHATKMRSNRYTYLHEVDLSTDRLKQI + YKELISEL" + misc_feature 14989..15909 + /gene="gtp1" + /locus_tag="SPC28F_0017" + /note="HMMPfam hit to PF01761, 3-dehydroquinate synthase, + score 3.1e-70" + gene 16012..16716 + /gene="gtp2" + /locus_tag="SPC28F_0018" + CDS 16012..16716 + /gene="gtp2" + /locus_tag="SPC28F_0018" + /note="member of homology group 41; + old_tribe:0031 9" + /codon_start=1 + /transl_table=11 + /product="putative nucleotidyl transferase" + /protein_id="CAI34062.2" + /db_xref="GOA:Q4K1J4" + /db_xref="InterPro:IPR005835" + /db_xref="UniProtKB/TrEMBL:Q4K1J4" + /translation="MKALILAAGLGTRLAPITNEVPKSLVPVNGKPILMKQIENLYQN + NITDITIIAGYKSSVLTDAVTEKYPEINIIDNVDFKTTNNMYSAYLGKAAMGDSDFLM + MNADVFYDASVIKSLLLHKAPNAIVTDLGTYIEESMKVVEKNGRLVEISKQISPEEAL + GASIDVYKFSYEAGARFFEKCKEFIEDKRELQMWSEVALNAILPEVEFIACPLDGRWL + EIDNHEDLAVAEKLFA" + misc_feature 16015..16704 + /gene="gtp2" + /locus_tag="SPC28F_0018" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 8.9e-08" + gene 16731..17564 + /gene="gtp3" + /locus_tag="SPC28F_0019" + CDS 16731..17564 + /gene="gtp3" + /locus_tag="SPC28F_0019" + /note="member of homology group 42; + old_tribe:0032 9" + /codon_start=1 + /transl_table=11 + /product="putative phosphotransferase" + /protein_id="CAI34063.2" + /db_xref="GOA:Q4JZZ3" + /db_xref="InterPro:IPR005834" + /db_xref="InterPro:IPR006357" + /db_xref="UniProtKB/TrEMBL:Q4JZZ3" + /translation="MKLTNRVDYFGADISELQNKKLFLFDMDGTIYEEDRLFEGTLEL + LDYIHNIGGEYIFITNNSSKSVVDYVEKVNRLGIKAERDNFFTSAQATIVYIKENYPK + SKVYCQGTKSLIKELSDAGIDVTEQVSADIDVVLVGFDTELTSDKIRNTCEILSTKDA + PFIATNPDIRCPVSFGFIPDCGSICDMISKSVDREPVYIGKPEPTMVDIVRKKLNYSL + FETVVIGDRLYTDIMTGINAGVTSVCVLTGEATVNDIQQGSIKPTYTFKNVKEMWKGI + V" + misc_feature 16788..17474 + /gene="gtp3" + /locus_tag="SPC28F_0019" + /note="HMMPfam 
hit to PF00702, haloacid dehalogenase-like + hydrolase, score 6.5e-25" + gene 17724..18593 + /gene="rmlA" + /locus_tag="SPC28F_0020" + CDS 17724..18593 + /gene="rmlA" + /locus_tag="SPC28F_0020" + /EC_number="2.7.7.24" + /note="member of homology group 10; + old_tribe:0009 35" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI34064.2" + /db_xref="GOA:Q4JZZ2" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q4JZZ2" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLHRFQELLQDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFISDDSV + ALILGDNIYHGSGLSKMLQKAASKESGATVFGYHVKDPERFGVVEFDQDMKAISIEEK + PEQPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLERGDLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLTLAQPLKKN + EYGQYLLRLIGEA" + misc_feature 17727..18443 + /gene="rmlA" + /locus_tag="SPC28F_0020" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 3.2e-120" + gene 18594..19202 + /gene="rmlC" + /locus_tag="SPC28F_0021" + CDS 18594..19202 + /gene="rmlC" + /locus_tag="SPC28F_0021" + /EC_number="5.1.3.13" + /note="member of homology group 11; + old_tribe:0010 35" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI34065.2" + /db_xref="GOA:Q4JZZ1" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:Q4JZZ1" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEAEVSEADKHHPLLKDVKPLKKEDL" + misc_feature 18630..19175 + /gene="rmlC" + /locus_tag="SPC28F_0021" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 2.4e-15" + gene 19215..20264 + /gene="rmlB" + /locus_tag="SPC28F_0022" + CDS 19215..20264 + /gene="rmlB" + /locus_tag="SPC28F_0022" + 
/EC_number="4.2.1.46" + /note="member of homology group 8; + old_tribe:0008 36" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI34066.2" + /db_xref="GOA:Q4JYY6" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JYY6" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPGVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGERPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAAD + AYDHVTDRAGHDLRYAIDASKLREELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 19230..20186 + /gene="rmlB" + /locus_tag="SPC28F_0022" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 7.3e-05" + misc_feature 19233..20177 + /gene="rmlB" + /locus_tag="SPC28F_0022" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.0047" + misc_feature 19233..19973 + /gene="rmlB" + /locus_tag="SPC28F_0022" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 3.3e-76" + misc_feature 19236..20048 + /gene="rmlB" + /locus_tag="SPC28F_0022" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 1.7e-05" + gene 20330..21181 + /gene="rmlD" + /locus_tag="SPC28F_0023" + CDS 20330..21181 + /gene="rmlD" + /locus_tag="SPC28F_0023" + /EC_number="1.1.1.133" + /note="member of homology group 9; + old_tribe:0011 35" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI34067.2" + /db_xref="GOA:Q4JZY9" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JZY9" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITNAEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPEPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + 
FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 20330..21178 + /gene="rmlD" + /locus_tag="SPC28F_0023" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 2.9e-147" + misc_feature 20333..20974 + /gene="rmlD" + /locus_tag="SPC28F_0023" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.00013" + misc_feature 20333..20962 + /gene="rmlD" + /locus_tag="SPC28F_0023" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 1.2e-18" + misc_feature 20336..21064 + /gene="rmlD" + /locus_tag="SPC28F_0023" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 4.5e-08" + gene 21257..21837 + /gene="tnp" + /locus_tag="SPC28F_0024" + /pseudo + CDS join(21257..21667,21655..21837) + /gene="tnp" + /locus_tag="SPC28F_0024" + /note="member of homology group 12; + old_tribe:0012 28" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1670 transposase" + misc_feature join(21263..21655,21667..21702) + /gene="tnp" + /locus_tag="SPC28F_0024" + /note="HMMPfam hit to PF03050, Transposase IS66 family, + score 0.00017" + /pseudo +ORIGIN + 1 cgaccgtcgc ttcctagttg tggctaactt gtccaatgaa gagcaagact tgacagtaga + 61 aggaaaagtc aaatctgtct tgattgaaaa caccctagct caagaagtct ttgaaaaaca + 121 aatcttagtt ccatgggatg ctttctgtgt ggaattacta taaatatttt ttgcagaaaa + 181 atttaaaatt gaaatcgtat aaaaacaagg gaggactgta taaaagacag aaatcctttg + 241 tttttataac caaggtttat aaactttcat tctcgaaatt caattaactt tacaaattcc + 301 cactattaag gagaaagaag atgaacataa agaagcgtgt ccttagtgca ggcctgactt + 361 ttgcatctgc tttgctttta gctgcttgcg gccaatcagg ttcagataca aaaacttact + 421 catcaacctt tagtggaaat ccaactacat ttaattacct gttagactat tacgctgata + 481 atatagtcaa ttgaaacaag agcaggacaa aagagcctca taaaaggtat tgcaacttgt + 541 aatacctttt tgaggtgctt tttgatatga gcccatgttt tctcaatagg attgtactca + 601 ggtgagtagg gaggaagagg taaaagttta 
tacccaaact cttcacacaa gagttctaac + 661 ttacccattc tatggaatct tgcattatcc ataataataa ccgatggtgt gtttaatgtt + 721 ggtaagagaa atttctgaaa ctaagcttca aaaaagtcgc tcgtcatcgt ctcttcgtaa + 781 gtcattggag cgattaactc accatttgtt agacctgcaa ccaaagaaat cctctgatat + 841 cttcttccag atactttgcc tcttcttaac tgacctttta atgagcgacc atattctcga + 901 taaaaataag tatcaaatcc tgtttcgtca atctaaacag gtactaggtg ctttaaacta + 961 ttaaaattct taagaaataa ggctactttt tctgggtctt gttcataatt agattgaaac + 1021 tagaatagta cacctctgct tctaaaacat tgttagaaat cgatttgact gtcctgatcg + 1081 atttgtcatg ttcttatttt attttactat atttttgttt cgcgggaagt ctactaagat + 1141 acttaaagat gcagatagta aaaaaatgta gacattaccg taaaaaagtg atataatcgt + 1201 atgatgttca aggtataggt gttaatcatg agtagacgtt ttaaaaaatc aggttcacag + 1261 aaagtgaagc gaagtgttaa tatcgttttg ctgactattt atttattgtt agtttgtttt + 1321 ttattgttct taatctttaa gtacaatatc cttgctttta gatatcttaa cctagtggta + 1381 actgcgttag tcctactagt tgccttggta gggctactct tgattatcta taaaaaagct + 1441 gaaaagttta ctatttttct gttggtgttc tctatccttg tcagctctgt gtcgctcttt + 1501 gcagtacagc agtttgttgg actgaccaat cgtttaaatg cgacttctaa ttactcagaa + 1561 tattcaatca gtgtcgctgt tttagcagat agtgatatcg aaaatgttac gcaactgacg + 1621 agtgtgacag caccgactgg gactgataat gaaaatattc aaaaactact agctgatatc + 1681 aagtcaagtc agaataccga tttgacggtc aaccagagtt cgtcttactt ggcagcttac + 1741 aagagtttga ttgcagggga gactaaggcc attgtcctaa atagtgtctt tgaaaatatc + 1801 atcgagtcag agtatccaga ctacgcatcg aagataaaaa agatttatac caagggattc + 1861 actaaaaaag tagaagctcc taagacgtct aagaatcagt ctttcaatat ctatgttagt + 1921 ggaattgaca cctatggtcc tattagttcg gtgtcgcgat cagatgtcaa tatcctgatg + 1981 actgtcaatc gagataccaa gaaaatcctc ttgactacaa caccacgtga tgcctatgta + 2041 ccaatcgcag atggtggaaa taatcaaaaa gataaattaa cccatgcggg catttatgga + 2101 gttgattcgt ccattcatac cctagagaac ctttatggtg tagatattaa ttattatgtt + 2161 cgtttgaatt ttacctcatt tttgaaattg attgacttat tgggaggggt agatgttcat + 2221 aatgatcaag agttttcagc tctacatggg aagttccatt tcccagtagg gaatgtccat + 
2281 ctagactctg agcaagcttt aggttttgtt cgtgagcgct actccctagc agatggcgat + 2341 cgtgaccgtg gtcgcaacca acaaaaggtg attgtggcta tccttcaaaa attaacgtca + 2401 accgaagcac tgaaaaatta tagtacgatc attgatagct tgcaagattc tatccaaaca + 2461 aatatgccac ttgagaccat gataaatttg gtcaatgctc agttagaaag tggtggaact + 2521 tacaaagtga attcgcaaga cttgaaaggt acaggtcgga tggatcttcc ttcttatgca + 2581 atgccagaca gtaacctcta tgtgatggaa atagatgata gtagtttagc tgtagttaaa + 2641 gcagctatac aggatgtgat ggaggggaga tgaaatgata gacatccatt cacatatcgt + 2701 ttttgatgta gatgacggtc ccaagtcaag agaggaaagc aaggctctct tggcagaagc + 2761 ctacagacag ggggtgagaa ccattgtctc tacctctcac cgtcgcaagg gcatgtttga + 2821 aactccggaa gagaagatag cagaaaactt tcttcaggtt cgggaaatag ctaaggaagt + 2881 ggcgagtgac ttagtcattg cttacggagc tgaaatttac tacacaccag atgttctgga + 2941 taagctggga aaaaagcgga ttccgaccct caatgatagt cgttatgcct tgatagagtt + 3001 tagtatgaac actctttatc gcgatattca tagcgccttg agcaagatct tgatgttggg + 3061 aattactcca gtcattgccc acatcgaacg ctatgatgct cttgaaaata atgaaaaacg + 3121 cgttcgggag ctgattgata tgggctgtta cacgcaagta aatagttcac atgtcctcaa + 3181 acccaaactt tttggcgaac gttataaatt catgaaaaaa agagctcagt attttttaga + 3241 gaaagatttg gttcatatca ttgcaagtga tatgcacaat ctagacggta gacctcctca + 3301 tatggcagaa gcatatgacc ttgttaccca aaaatacgga gaagcgaagg ctcaggaact + 3361 ttttatagat aatcctcgaa aaattgtaat ggatcaacta atttaggaga aatgatgaaa + 3421 gaacaaaaca tgatagaaat cgatgtattt caattattta aaaccttgtg gaaacgcaag + 3481 ctaatgattt tattagtggc acttgtgaca ggtgcggggg cttttgcata tagcactttt + 3541 attgttaagc cagaatatac gagtaccacg cgaatttacg tagtgaatcg caatcaagga + 3601 gacaatccgg ggctgacaaa tcaggatttg caggcaggat cttatctggt aaaagactac + 3661 cgtgagatta tcctttcgca ggatgtattg gaaaaagtag cgacaaattt gaagctggat + 3721 atgccagcca aaacgttagc cagcaaagtt caagtgactg taccagctga cactcgtatc + 3781 gtctcaatct ctgtcaagga taaacagcca gaggaagcca gtcgtatcgc taattctcta + 3841 cgagaagttg ctgcagaaaa gatcgtcgct gtaacgcgag tatctgatgt aacgacactt + 3901 gaagaagcgc gaccagctac 
gactccctct tctccaaatg ttcgacgcaa ttccttgttt + 3961 ggttttcttg gaggagcagt cgtaacagta attgctgttc ttttgattga gttgctcgac + 4021 acccgtgtga aacgtcctga agatgtcgaa gatgtactgc aaattccact tttaggggtc + 4081 gttccagatt tgaacaaaat gaaataggag gaagttatgc caacattaga aatctcacag + 4141 gcaaaattgg attttgtaaa aaaggcagag gaaaattata acgctttgtg cacgaaccta + 4201 cagttaagtg gagatgattt gaaagtattt tctatcactt ctgtgaaagc aggagaagga + 4261 aaatcaatga cttccaccaa tatcgcttgg gcttttgcgc atgcaggtta caaaacgctg + 4321 ctgattgatg gagatattcg caattctgtt atgttaggtg tctttaaagc aagggataag + 4381 attacaggcc tgacagaatt tttatcagga actacagacc tatcacaagg gctttgtgat + 4441 accaatatcg aaaatctctt tgtaattcag gctggctctg tgtcaccgaa tccgacagct + 4501 cttcttcaaa gtaagaattt cagtacaatg cttgaaacct tgcgtaaata ttttgactac + 4561 atcattgtag atactgctcc tgtcggtgtc gtgattgatg cggctattat tacgcgaaaa + 4621 tgcgatgctt ctattttagt gacggaggca ggtgaagtaa atcgtcggga tattcaaaaa + 4681 gcaaaagaac agttggaaca cacaggaaag ccgtttttgg gaattgtgtt gaataaattc + 4741 gatacttcag tagacaaata cggttcttat ggaaattatg gagattacgg gaaaaataaa + 4801 aaataggtcg ggggatagag atgaatggaa aaatattaag gtcttcattg gccataatcc + 4861 agagttttct tgttatttta ttgacttatc tacttagtgc tgtgagagaa acggagattg + 4921 tttcaacaac agctattgca ctttatatcc tccattattt tgtcttttat atcagtgatt + 4981 atggacagga tttctttaaa aggagatatt tgattgaact tgtccagaca ttgaaatata + 5041 tcctattctt tgcactagcg attagtattt ctaatttttt cttagaggat cgatttagta + 5101 tttccagacg aggcatgatt tacttcctca cattacatgc tctcttagtc tatgtgctaa + 5161 acctatttat caagtggtat tggaagcggg cttatcccaa ctttaaagga agtaagaaga + 5221 ttctcctact tacagaaact tctcgtgtcg aaaaggtact ggatagatta atagaatcaa + 5281 atgaggttgt tgggaagttg gtagccgtca gtgtcttaga taaaccagat tttcagcatg + 5341 attgtttaaa ggtagtagca gagggggaga tagtaaactt tgcgactcat gaggtggtcg + 5401 atgaagtctt tatcaatctt ccaagtgaaa aatacaatat tggagagctt gtctctcagt + 5461 ttgaaacgat gggaattgat gtaatagtca atctaaatgc ttttgatcgt agtttggcat + 5521 gtaacaagca aattcgtgag atggcagggt taaacgttgt 
gactttttct acaacatttt + 5581 ataagactag tcatgtaatt gctaagcgga ttattgatat cgtgggtgca ttggtagggc + 5641 tgatactatg tggtttagtc agtattgtac tggttccttt gattcgaaag gatgggggat + 5701 ctgctatttt tgctcagacg cgtataggaa aaaatggtcg tcagttcact ttttataagt + 5761 ttcgctctat gtgtgtagat gccgaggcga aaaaaagaga acttatggaa caaaatacca + 5821 tgcaaggtgg aatgtttaag gtggacgatg atcctcgtat cacgaaaatt ggttgtttta + 5881 tacggaagac tagcttggac gagctaccac agttttataa tgttctaaag ggagatatga + 5941 gtttggttgg cacacggcca ccaacagtgg acgagtatga gcactatacc ccagaacaaa + 6001 aacgccgact aagttttaaa cctggcataa caggtttatg gcaggtcagc ggacgaagtg + 6061 agatcaagaa tttcgatgaa gttgtcaaat tagatgtagc ctatatagac gattggacaa + 6121 tttggaaaga tattgagatt ttattgaaga cagttaaagt tgtattgatg aaggatggag + 6181 cgaagtaatt tctgtatatc catcatatta ggagagaaat gaaaaagtca gtttatatca + 6241 ttggttcaaa aggaattcct gctaagtatg gaggatttga aacttttgtt gaaaaattaa + 6301 cagccttcca acaagataag gctatccaat attatgtggc ttgtatgcgt gaaaattctg + 6361 caaaatcagg gattactgag gatgtttttg aacataatgg tgctatctgt tataacgtcg + 6421 atgttcctaa tattggtcca gcgcgagcta tagcgtatga tatcgctgca attaacagag + 6481 ctattgaaat tgccaaagaa aataaggatg aagatccaat cttctatatt ttagcttgtc + 6541 gaattggtcc gtttatccat ggaattaaga aaagaattca agcaataggt gggactcttc + 6601 tggttaatcc ggatggtcat gaatggctac gagaaaaatg gagtttacct gttcgcaaat + 6661 attggaaata ctctgaaaga cttatggtca aacatgcaga tcttttagtg tgtgatagta + 6721 agaatattga aaaatatatc caagaagatt ataaacagta tcaacctaag acaacctata + 6781 tcgcttatgg gactgataca acacgctcca tattaaagag tagtgacgaa aaagtacgtt + 6841 cttggttcaa agagaagaat gtttctgaaa acgagtatta cctagttgta ggacgttttg + 6901 ttccagaaaa taactatgag gctatgatac gtgggttttt agcatctaat tctaagaagg + 6961 actttgtctt aatcacaaat gtagaacaga ataaatttta taatcagttg ttggcaaaaa + 7021 ctggttttga taaggaccca cgagtaaaat ttgtaggtac agtctatgag caagagcttc + 7081 ttaaatatat tcgtgaaaac gcctttgctt acttccacgg gcatgaagtt ggtggaacca + 7141 atccttcgct tttagaagct ctggcatcaa ctaaactgaa tttattgcta gatgttggct + 7201 
ttaaccgaga agttggggag caaagtgcaa tctattggaa aaaagatgag ctttcccaag + 7261 taatcgagaa agttgaacaa tttgatgcaa aaatgattga tgagttagat agacaatcaa + 7321 atcagagaat tgtggatttt ttcacttggg aaaagattgt cacagactac gagaaaatat + 7381 ttaaaaaatg aaaatattac attatacttt aggatttcaa ccccagcgaa caggtggttt + 7441 ggttaaatat gctgaggatt taatgctaga gcaaattgct caaggttatc aagtggctgc + 7501 cctatatcca ggaagaatta agttcttttc aaaaaaaata gaaataatta aagcgatgtc + 7561 aagacagttt gagtgttatg agctgcttaa tagcttacct atggctttat ttggaggtat + 7621 atccgatcca actgctttcc tgacaccttg tgacaaaaat gtttatcgta cttttttaga + 7681 aaaagtacaa cccgacatta tacatattca ctcgtttatg ggattgcata aagaattcct + 7741 cgaaattgct aaaaacttga atattagagt ggtttttacg agccatgatt attatggatt + 7801 agcacccgta cctcatttct attttaatgg ggtggattat agtaataaaa gtacaaactt + 7861 aacatggaat attatgtctt ccaatgcttt aagtgtgaaa aaactaagac tttttcaggt + 7921 ttcattttat cctactattc gtaaactttt gaaactatta gggaaaaatc caaaatctaa + 7981 aaagaattta gttattcgag atgttattga ggagcaagat tacagtgagc ttcgatacta + 8041 ttataatgag atgtttcact taatagatgg ttatttgttt aatagtagac ttgcaaagaa + 8101 ggtatatgag ataaatgaga ttaagtcagc taatagtata gtattatcta taacaaatag + 8161 ttcaattaat catcatcaga gattgacaac tacaaataat aaaattagag ttgcttatat + 8221 tggtccagat gaagaatata aaggatattt tgattttatt gactttgttg aaactttaga + 8281 tcgagagtcc tatgaagtgg caacttatgg ccatttacca aatggagagt gtccttcatt + 8341 cattgaacaa aaaggatatt ttactaagga aatgattgac agtgtctatg aaaatattga + 8401 tattcttatt gttccaagta agtggaagga gacatttgga ttgataacag tagaagcatt + 8461 atcctatggg gtaaatgttt tcgtgagtga aaatgttgga tcaaaagact tacttccaga + 8521 atcgcatgtt tttaaaaatc agaatgattt agtagttaaa tttttaaaaa atgatataga + 8581 aaatacaaaa ttgaaaactt tagatgaaca ctcgatagaa gtgattcagt attatgaaag + 8641 agtgataaat gatagttaag agtttcataa aaaagattac tggaaaaaca gtagacattc + 8701 atccagatgt acctttgtcg tatatactac aaagaggtat aaactatggt ttcggactct + 8761 ttcgtggggt tgtacgtgga atcggatttg gtcaaaacga caaacgttta ttcattggac + 8821 aaggagtttc tatcttagca 
aagcgtaaat tatttgttgg aaaaaatgtt cgaattggta + 8881 aaaaggtgtc tatagatgca ctgtcaaaag aaggaatcca ttttgcagat aatgtaaaga + 8941 ttggagatta ttctcaaatt attggcacag gttctataaa aaatatgggg attggcttga + 9001 aaatcggtaa gaactcatct ttttcagaat atagtttatt tggttctgct ggaggtatca + 9061 caattggtga taatgttatc gcaggtcaga atgttcgttt tcatgctgaa aatcataatt + 9121 atagtgattt agataaactc attgttgaac aaggggtatc tcgaaaggga atttcagtag + 9181 gtgataattg ttggattggt gctggatctg tttttttgga tgggtccagc attggttcag + 9241 gttgtgttgt agctgcaaat tctgtaatta cgaaaaactt tccagataac gttattgttg + 9301 ctggagtacc agctaaaatt ataaaaatga aatgatagga tgttaaatgg ggaaagaaat + 9361 taaagctgtt tatgcgatat taaattacaa tacttgggaa gatactgcgc gtttagcaca + 9421 gaaagttgca acatttcagc atattcaatc tgtgataata gtggataatc tatcaacaga + 9481 tgattcatac cattatttaa aaagacttga gggagagaaa atttcagttt atcaaacaca + 9541 aagaaatggt ggatattctg ttggaaataa tgttgcagca cgaaaagctt ataatatggg + 9601 agttgatatt cttttcattt caaatccaga cgttgatatt gatgaaaaag attccttgat + 9661 gattgcacaa aatttgtata aaaatagttc atatgcactg ctatcaggta tagaatataa + 9721 tgctatgaag gagatagatt tgccaattgt ctggcatgaa aattcctatt acgatgactt + 9781 acttgattgt ttgtttttaa ccagaaaatt gcgaagaaaa aaagaagata tcaatttgtc + 9841 aatgattaaa tcatctataa tagatgtaga tcttgttaaa ggctcgtttt ttgctgtaag + 9901 gctgtctgat tttcatgatg ttggttattt tgatgaatct gtatttcttt tttgtgaaga + 9961 gagaatatta gccaaaaagt tacaaaaagc aaataaaaaa ataggtattc tgcctgaagc + 10021 gaaatattac cacaatcatt caacttctat aaacgagaag tataaaaaga aaaaagaaca + 10081 gatagtttta ctatataatg ctcgttatta ttacaatgtg acgtatcaaa atattagctt + 10141 tttgaaaaaa atttgcctaa aactattcat gtttttatct attattgaat actcgatact + 10201 agattatatt aaacgaaagg gatagttatt tttatggtta ttaactttag taaatataat + 10261 tggattttaa ttttaatttt atcgagctca gaactgtttt ctaaagaaac aaatctattt + 10321 ttattactat ttattctact atactatgtt ttagttcgtg gaggtagact accaatttca + 10381 attccaggag cgaaatatta ttttacttta ttaatggtgg ggctatttat aggtattggg + 10441 aatgtaataa ttaacgaaaa tacagtattt 
aattttgtaa agcattttat ctattactta + 10501 ttacctctat ttttttggca gtttggatgt attctgtcaa ataacgataa tttatcttac + 10561 aagcaaaaca atattaagga atcaattgtt ataacagcat ttctattatc ttcttatgat + 10621 ttaataggtt caatcattag tttcttgtct agaactaagg aaattgttga tttatatagt + 10681 ttacggtcag agtttggtcg aggttcctat ataccaatta ttgcactgta tttagttctt + 10741 gtttattcta gagaaataaa gttgagcaaa aattttaagg gatttttgtt attactgttt + 10801 acaatctcga ttttgataca tttttctagg acacatttta ttattttatt gattctagta + 10861 tttttttcag gatttgaaaa aaatatgaaa agtattaaaa aaataatgtt tgcaggaaca + 10921 ttgatattag caggtgtagg tgttttatat ttatattttc caaatttagt tatagatttt + 10981 tataataaaa tatctcaatc aacgacggaa atcacgtttt ctaaatcgtc atggtcccat + 11041 aaagatatca tatggaattg gcgtggatat gaaatgtact ctgccttaaa tcattttaaa + 11101 tcttcaactt tattagagca aattttagga ggaggatttg gaacagtttt atacataggc + 11161 gaatatgcgt atttggtaag cgatttaccg tatcttcttt ttttacataa tggatatttc + 11221 actactttac ttgtttttgg tgttagtggg gtcatactat tcgttttatg ggtacttagt + 11281 ttatttagtt atagcaagta tgttaatgat acccaagatt caaattttat aaaaggtctt + 11341 gctgtggtta tattatttac cacatatttt gtaaatggtc ctcttttttc tgtttcacaa + 11401 gccaccttct tgctttattt tgcacttttt agtaataatc atggagaatt agatgaagat + 11461 ttttaaaaaa attaaattta tattaatgct gctttatacc tcaacttttc caagatgtga + 11521 gaaaatactg atttttggat catggttagg tgaaaaatat gcagacaatc caagatattt + 11581 gtttgagtat gtgattaaga atcgtcccga tttaaaagct atatggatta caagtaatca + 11641 agatgttttt aaagaattac agaagaaaca atatcccgtg atgatggcag atgagagtga + 11701 agctcataaa attatgaaga aagctaaata tatttttaca actacaggta tttttgatat + 11761 cggagtagaa aatagtaggt tgattggcgg tgctttttta attaaccttt ggcatggcat + 11821 tcctttgaaa aaaatcatgt atgatgataa acattcagcg cttcacaaac gtagtaaact + 11881 agtgacttgg gtagaaaaaa ttcctcttcg aaactatttt gttatttcta ctagtacggc + 11941 aataactcaa atttatcagt ctgcttttcg cgtaaagaaa tctaatatat tagaacttgg + 12001 acagcctaga aatgactatt tttatgatga gtcttatcca gtaagttcgc taatacaaga + 12061 attaaaaagt aaaaatatta tcttatatat 
gccgacacat cgcaatgaag gaaagaaaca + 12121 aattcctcta gataatttaa tggatttaaa tcgattaaat aaatggtgtg aagaaacaaa + 12181 ttcaattttt gtaattaaaa aacacttcta tcattcaaaa gaaaaaacac ttgagaaaga + 12241 atattcatca ataattgatg tgacaaatga gaaggtcgat gctcaagaat tactcaaata + 12301 ttcaaagatc ttaataactg actactcgag ctgctatatt gactacttat tgttggatcg + 12361 accaattata ttttttaatt atgactatga tgattatttg aggattgatc gttcgctata + 12421 ttttccatat gagaaggtta ctccagggga gaaatgtcaa aactttgatg aattattagt + 12481 gactctgcaa aatctatatc taggaaaaga tgattatagg aaaaagcgtg aaaatattaa + 12541 aactttcttt tattctagtg aaactcagaa gtcagtttct gaaaaaatca ttaatcacgt + 12601 actaaatcta taactttatt ggaatctgta atgaaaaaaa tattaaataa gtattattct + 12661 ttatctaatc ctgtaaaagc ttcaatttgg tttactattt gcaatgttct tcaaaaagga + 12721 atttcaatga ttactgttcc aatttttact agattattga caacggaaca atatggtgta + 12781 tactctgtat atcaatcatg gtattcaata attggagttt ttgcaacact aaacctatat + 12841 tatggagtct ttaataatgg aatggttaaa tacgagaaag ataaaaatgc ctttacttcc + 12901 tctatgcagg gactaacaac aacagttaca gctatatttt tagtgatata tttaataggg + 12961 attgattttt ggaactcgtt gttaggctta cctacgctac taatcttagt gatgttcttt + 13021 gatttgtttt ttactcctgc ttattctttt tgggctacgc gtcagagatt tgaatatcaa + 13081 tatcgaaact tagtatttat cacacttatt atagcgattg gaagccctat tattggtatt + 13141 tcttcagttg ttttatcgac ttataaagcg gaggctagag ttatctcatt tgtgttagtt + 13201 caatcttgta taggattata tttctatgtt ttgaaccttt accgaggtaa atattttttt + 13261 tgtaaaaaat attggctcta tgctttgaat tttaatttac ctcttattcc tcattattta + 13321 tcgcaatcag ttttaaatca atcggataga ataatgatta attcaatggt aggaatggga + 13381 gaagcagcta tttatagtgt tgcttacagc atatcaactt tgatggtttt agtgacaagt + 13441 gctataaaca gctcttttat tccttacaca tataaatgta ttcgagataa gaaatatact + 13501 gaactaggga aaagtgcaaa tcttttaatt actctggtag gcattggttc gattttaact + 13561 atttctcttg gaccagaaat cattcaatta tttgcaccaa aacaatatta cgaagcaata + 13621 tggattattc ctccagttgc tctttcagta tatttcatgt tcttatatcc catttttggt + 13681 aacattgagt tttactttga agcaaatcat 
tttgtaatgt gggcttcaat aggtggagca + 13741 attatgaata tttttttgaa ttttattttt ataaaacact ttggctatat tgcggcaggc + 13801 tatacaactt tattatgtta tattttattt gcattgggac attacatttt tatgagaaga + 13861 gcattgtatc agaatctttc gggtatccaa atttatgatt ctcgatatat tttctttttt + 13921 tcgtttcttc ttctgattct aatgctacta atcgtgacta tttatccatt tgtgttgatt + 13981 cgttatattg ctatctcact catcctagga ggatgttttt taaagaggag aaagataatg + 14041 agttcgatag tcatgataaa aaaacagtga ggtacacgaa tgacagaaat aaataaacag + 14101 ttacatgaaa cattaatcga aattttagac tttgtaaaag aaatttgtga aaaacatgaa + 14161 ttaacttatt ttttgatcta tggtacggca ctcggtgcaa aacgccattg tggatttatt + 14221 ccttgggatg atgatgttga tattgcttta ccgcgagagc actacaatat attaatcgac + 14281 gtgttatcta agatggaaca atctatattt agtcttcaaa atgaagataa cgagccgaac + 14341 tattttttac catttgctaa attaagaaaa aacaatacga tttttattga aaagattctt + 14401 gatgttgaat atgagaataa cggtatttac attgatattt ttccactaga tttcgtagag + 14461 aatccggact cttttaattt taagatgagg agaactatgt ttaattatat aaagcatatt + 14521 ttaaaatttt caagttgcag aagtttttat aaaaataaat acagtagcgt acgttatttg + 14581 atggaaaata ttatgagtat tcctaccctg tttttttcaa ataggagatt actattctta + 14641 gcgaataatt taatttcatc aacgaataaa gctaatttta ttggtcaata tgatgaaagt + 14701 agcgaaagag ctatcatgcc ttcaagctat tatttcccgt ctagatccgc tgtgtttgaa + 14761 ggaaagattt atagtgttcc tgcgaaatta gaagattatt taaaatattt ttatggttcg + 14821 gattatatgg aattaccacc aatagaaaaa agagtcactc atcaaccaat aaaacttaga + 14881 ttcaaaaaat aattggctat tctgtagaag gagaataatt caagagttgt gaagtaaaac + 14941 attgggttat ttttaaggta acgagatttg aaaaataatg atttaaagat aggaagtgga + 15001 gctattcatc aaatctccgc tacactttct caaaataata tttcgggaaa gattttatat + 15061 tgtgctgatc cagttgtcga tgacttgtac ggttcgatag tacgttcaca aatagaggaa + 15121 attggtcggg taaaggaaga aagttgcaat tataatacta ttgcttatgc gatgaatata + 15181 gcagaaaggg ctattgccac agatattgac tgtattgtgg gaatgggagg aggtcgtgtt + 15241 ttagatgtct gcaagtatgc atcttttatt tcgaaacgtc cttacctatc gattccgaca + 15301 acagcagcaa atgatggcat tgcttcccca 
gttgctgttt tgaaaaggca ggatgataga + 15361 ccaaaaagct taggggcggc tatcccctca atgacactaa ttgatattga tgttattgca + 15421 tcaggaccta tacaaaacat aaaagctggt atcggtgata caatatccaa ttacactgca + 15481 ttgaaagatt gggagttggc agttgagcga gggaaagatg agatgcatgg ttttgcatat + 15541 ctaatgtcgc aaaattcttt agatgcttta atgaaaacga agtataattc tattacccct + 15601 gattttattg aagttttggt aaactcttta gttttatcag gcattgcaat ggattttgcg + 15661 ggaagtagta gacctgtcag tgggtcagag catttattta gtcatgcatt agattactat + 15721 ggttctacaa ggaatcttca tggaattcag gttgcattag gtacagtcgc agttttgaaa + 15781 ttaattgaaa attctgttga tactgtagtg gattacttgc aaagatttga ggttcatatt + 15841 aacccgaaac ttttggggat agatgaagag ttgtttattt attgtatgca acatgctaca + 15901 aaaatgagaa gtaatcgcta tacctatctg catgaagttg atcttagcac agatagattg + 15961 aaacaaatat ataaggaact cataagcgag ttgtagaaaa gagaggaaaa aatgaaagca + 16021 cttattttag cagcagggtt aggaacacgt ctagccccaa ttaccaatga ggtaccaaaa + 16081 tctttggtac cagtcaacgg taagccaatt ttgatgaaac aaattgaaaa tttatatcaa + 16141 aataatatta cagatattac gattattgct ggatataagt catctgtatt aacagatgca + 16201 gttactgaaa agtatccaga aattaatatt attgataatg ttgattttaa aacgactaat + 16261 aatatgtatt cagcctatct aggaaaagct gcaatgggtg atagtgactt cttaatgatg + 16321 aatgcagatg tattttatga tgcttctgtt attaaaagtc tgttgcttca taaagctcca + 16381 aatgcaattg taactgattt aggtacttat attgaagagt ctatgaaagt cgtagaaaaa + 16441 aatgggcgtt tagtggaaat ttctaaacag atttcacctg aggaggcttt aggggcttct + 16501 attgatgttt ataaattctc ttatgaagca ggtgctcgat tctttgaaaa gtgtaaggaa + 16561 tttattgaag ataaacgaga acttcaaatg tggagtgagg ttgctcttaa tgcaatcctt + 16621 ccagaagttg aatttatagc atgtccattg gatggtcgtt ggttagaaat tgataatcat + 16681 gaagacctag ctgttgcaga aaaactattt gcttaaaccg aatatggaga atgaaattga + 16741 caaatagagt tgattatttt ggtgctgata ttagtgaact tcagaataaa aaattattct + 16801 tatttgatat ggatggtacc atttatgaag aagatagatt gtttgagggt actctcgaat + 16861 tattagacta tattcataat attggcggtg agtatatttt tattacaaac aattcatcta + 16921 agtctgttgt tgactatgtt gaaaaagtta 
acagattagg tattaaagct gaacgagata + 16981 atttttttac ctctgctcaa gccacaattg tttatattaa agaaaattat cctaaatcta + 17041 aagtttattg ccaaggaaca aaatctttga taaaagaact atctgacgca ggaattgatg + 17101 taactgagca agttagtgct gatatagatg ttgttcttgt tggttttgat acagaattaa + 17161 ccagtgataa aattcgcaat acctgcgaga ttctatcaac aaaggacgca cctttcatag + 17221 ctactaaccc tgatattcgc tgcccagtat cgtttggatt catcccagat tgtggttcta + 17281 tttgtgatat gattagtaaa tcagtcgata gggaacctgt ttacataggt aaacctgaac + 17341 ctacgatggt tgatattgtt cgaaaaaaat taaattattc tctatttgaa acagttgtga + 17401 ttggagatcg cttgtatacg gatatcatga ctggtataaa tgcaggagta acttcagttt + 17461 gtgtgctgac aggagaagca acggtgaatg atattcaaca aggtagtata aaaccgactt + 17521 atacatttaa aaacgtgaaa gaaatgtgga aaggaattgt ctgatttttt cattctgaat + 17581 agtgaattca tgaatactgt caaaatactc gtatgtattt aaattgattt cattatttta + 17641 ataatggaca aattaaaatt atttttctcc ccaaatcgtt cgtgaacgta aagtactcat + 17701 caacaaagaa aggtacccct tttatgaaag gtattattct agcaggtggt tcgggaactc + 17761 gcttgtatcc tttgactcga gccgcatcaa aacaacttat gccggtttat gataaaccga + 17821 tgatttacta cccactttca acattgatgt tggctgggat tagggatatt ttgattattt + 17881 ccactccaca ggatttacat cgatttcaag agcttcttca agacggatct gagtttggga + 17941 tcaaactttc ttatgcagag caaccaagtc cagatggttt ggcacaagcc tttatcattg + 18001 gggaagagtt tatttctgat gatagcgttg cgctaatctt aggtgataat atctaccatg + 18061 gttctgggct ttccaagatg ctacaaaagg cagcgagtaa ggagtcggga gcaactgttt + 18121 ttggctacca tgtcaaggat ccagagcgct ttggtgtggt tgagtttgat caggatatga + 18181 aggctatttc tattgaagaa aagccagagc aacctcgttc aaactatgca gttacaggtc + 18241 tctatttcta tgataatgat gtagtagaga ttgccaaaag tattaaacca agtcctcgtg + 18301 gtgaattgga aattacagac gttaacaagg cttatctaga acgtggtgat ttgtctgttg + 18361 agcttatggg gcgtggcttt gcttggttgg atactggcac tcatgaaagt ttactagagg + 18421 cttcgcagta catcgaaaca gtccaacgga tgcaaaatgt tcaggtagca aacttagaag + 18481 aaattgccta tcgcatgggt tatatcagtc gtgaagatgt attgacctta gcccaaccac + 18541 ttaagaaaaa tgaatacgga cagtatctgc 
tccgtttgat tggagaagca tagatgacag + 18601 ataatttttt cggtaagacg cttgcggcac gcaaggttga agctattcca ggcatgttgg + 18661 agtttgatat ccccgttcat ggagataatc gtggctggtt taaagaaaat ttccaaaagg + 18721 aaaaaatgct tccacttgga tttccagagt ctttctttgc agaaggaaaa ttgcaaaaca + 18781 atgtatcctt ctcacgtaaa aatgtccttc gaggcctcca cgcagagcct tgggataagt + 18841 acatctctgt agcagatgga gggaaagttc tgggttcttg ggttgatcta cgcgagggtg + 18901 aaacctttgg gaatacctat cagacagtaa ttgatgcaag caagggaatc tttgttcctc + 18961 gaggcgtagc taatggcttc caagttctat cagatacagt gtcatatagc tatctggtca + 19021 atgattactg ggctctcgag ctcaaaccca agtatgcctt tgtgaactac gctgatccaa + 19081 gccttggtat tgaatgggaa aatattgcag aagcagaggt ttcagaagca gaggtttcag + 19141 aagcagataa acatcatccc ctacttaagg atgtaaaacc tttgaaaaaa gaagatttgt + 19201 aaaaaggaaa gaatatgact gaatacaaaa atattatcgt gacaggtgga gctggcttta + 19261 tcggttctaa ctttgtccat tatgtttacg agaactttcc aggtgttcac gtgacagtcc + 19321 tagataagtt gacttatgct ggaaatcgcg cgaatattga ggaaatttta ggtaatcgtg + 19381 ttgagttagt tgttggtgac attgctgatg cggagttggt agacaagttg gctgctcaag + 19441 cagatgctat cgttcattat gcagcggaaa gccacaatga taattcgctc aatgatccat + 19501 cgccatttat tcatactaac ttcatcggaa cctatactct tttagaagct gctcgtaagt + 19561 atgatattcg cttccaccat gtatcgacag atgaagttta tggggatctc cctttacgcg + 19621 aagatttgcc aggtcatggt gaaagaccag gtgagaaatt tacggctgaa acaaaataca + 19681 acccaagctc tccgtactca tcaaccaagg cagcctcaga tttgattgtc aaagcctggg + 19741 tgcgttcttt tggagtcaag gcaacgattt ccaactgttc aaataactac ggtccttatc + 19801 aacatatcga aaaattcatc ccacgtcaga ttactaacat cctaagtggt atcaagccaa + 19861 aactttacgg tgaaggtaag aacgttcgtg attggattca taccaatgac cattcttcag + 19921 gagtttggac aatcttgaca aaagggcaaa tcggtgaaac ctacttgatt ggggctgatg + 19981 gtgagaagaa caataaggaa gttttggaac ttatccttaa ggaaatggga caagctgcgg + 20041 atgcctatga tcatgtgact gaccgtgcag gacatgacct tcgctatgcg attgatgcca + 20101 gcaagctccg tgaggagttg gggtggaaac ctgaatttac caactttgaa gctgggctca + 20161 aggcaacaat caagtggtat acagataacc 
aagaatggtg gaaagcagaa aaagaagctg + 20221 ttgaagccaa ttatgctaag actcaggaga ttattacagt ataaaaagca ggaaatagct + 20281 gctttttatt gctatattgg gaagagttac atattagaaa ggtctagaga tgattttaat + 20341 tacaggggca aatggccaat taggaacgga acttcgctat ttattggatg aacgtaatga + 20401 agaatacgtg gcagtagatg tggctgagat ggacattacc aatgcagaaa tggttgagaa + 20461 agtttttgaa gaggtgaaac cgactttagt ctaccactgt gcagcctaca ccgctgttga + 20521 tgcagcagag gatgaaggaa aagagttgga cttcgccatc aatgtgacgg ggacaaaaaa + 20581 tgtcgcaaaa gcatctgaaa agcatggtgc aactctagtt tatatttcta cggactatgt + 20641 ctttgacggt aagaaaccag ttggacaaga gtgggaagtt gatgaccgac cagaaccaca + 20701 gacagaatat ggacgcacta agcgtatggg ggaagagtta gttgagaagc atgtgtctaa + 20761 tttctatatt atccgtactg cctgggtatt tggaaattat ggcaaaaact tcgtttttac + 20821 catgcaaaat cttgcgaaaa ctcataagac tttaacagtt gtaaatgacc agtacggtcg + 20881 tccgacttgg actcgtacct tggctgagtt catgacctac ctagctgaaa atcgtaagga + 20941 atttggttat tatcatttgt caaatgatgc gacagaagac acaacatggt atgattttgc + 21001 agttgaaatt ttgaaagata cagatgtcga agtcaagcca gtagattcca gtcaatttcc + 21061 agccaaagct aaacgtccgc taaactcaac gatgagcctg gccaaagcca aagctactgg + 21121 atttgttatt ccaacttggc aagatgcatt gcaagaattt tacaaacaag aagtgagata + 21181 agtagtagaa tgattttcta gtctaataaa agaggcagat aatgaactcc aaaggagctt + 21241 aagatgtacg attatcttgt tgttggtgct ggtctctttg gcgcatagct ttggctcagt + 21301 ttctattatc gctcacacca tccatcagaa gtttaatctg aaggtaccca attatcgcca + 21361 agaagaagat tgggctagga tgggtttacc aatcacacgt aaggaaatct ctaattggca + 21421 tatcaaggca agtcaatact atttagagtc cctttataac cttttacgag aaaagttgtt + 21481 agaacaacct cttcttcatg cggatgaaac ctcttatcgg gttctagaga gtgatagcca + 21541 tctgacctac tattggacct ttttgtctgg gaaatcagag aaacaaggga ttacgcttta + 21601 ccatcatgat cagcgtcgga gtggttcggt agtgcaagaa ttcctaggaa attattctgc + 21661 ctatgcgata gcagtccaaa gtttaggagc aaggcgacgc taagcttggt aaactacgaa + 21721 ccgctagaag cttatcgtca actggaagaa gctgaacttg ttggatgttg ggcgcatgtg + 21781 agaaggaagt tttttgaagc gccccccaag 
caagcggata aatcatcgtt aggaaagaa +// + diff --git a/public/res/serotype_genbank/serotype_29.gb b/public/res/serotype_genbank/serotype_29.gb new file mode 100644 index 0000000..0aef144 --- /dev/null +++ b/public/res/serotype_genbank/serotype_29.gb @@ -0,0 +1,669 @@ +LOCUS CR931694 15096 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 34373 (serotype 29). +ACCESSION CR931694 +VERSION CR931694.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 15096) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 15096) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..15096 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="34373" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC29_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC29_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI34071.1" + /db_xref="UniProtKB/TrEMBL:Q4JZI8" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVELL" + gene 293..445 + /gene="aliB" + /locus_tag="SPC29_0002" + /pseudo + CDS 293..445 + /gene="aliB" + /locus_tag="SPC29_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + /db_xref="PSEUDO:CAI34072.1" + gene complement(459..980) + /gene="tnp" + /locus_tag="SPC29_0003" + /pseudo + CDS complement(459..980) + /gene="tnp" + /locus_tag="SPC29_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase (fragment)" + gene 1203..2648 + /gene="wzg" + /locus_tag="SPC29_0004" + CDS 1203..2648 + /gene="wzg" + /locus_tag="SPC29_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI34074.1" + /db_xref="GOA:Q4JZY4" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4JZY4" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSICVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGIDINYYVRLNFTSFLKLIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIINSLQDSIQTNMPLETMIKLVNAQLESRGNYKVNSQDLKGTGRMDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQNVMEGR" + misc_feature 1203..1319 + /gene="wzg" + /locus_tag="SPC29_0004" + /note="Signal peptide predicted 
for SPC1437 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 39 and 40" + misc_feature 1407..1754 + /gene="wzg" + /locus_tag="SPC29_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 1.9e-63" + misc_feature 1932..2375 + /gene="wzg" + /locus_tag="SPC29_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 6.6e-70" + gene 2650..3381 + /gene="wzh" + /locus_tag="SPC29_0005" + CDS 2650..3381 + /gene="wzh" + /locus_tag="SPC29_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34075.1" + /db_xref="GOA:Q4JZY3" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4JZY3" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTLDALEKLEKKEIPTLNDS + RYALIEFSMHTSYRQIHTGLSNILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QINSYHVLKPKLFGERYKFMKKRARYFLERDLVHVVASDMHNLNKRPPYMKEAYELIS + KQYGERRARELFIENPRLILSDQII" + misc_feature 2653..3261 + /gene="wzh" + /locus_tag="SPC29_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 1.3e-37" + gene 3390..4082 + /gene="wzd" + /locus_tag="SPC29_0006" + CDS 3390..4082 + /gene="wzd" + /locus_tag="SPC29_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34076.1" + /db_xref="GOA:Q4JZY2" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4JZY2" + /translation="MKENKEITIDVFQLFKVLWKKKTSIILTAIVAAVLAFAVSSFVL + TPEYSSTTRIYVVNRNQSEKAGLTNQDLQAGTYLVKDYKEIIISQDVLEEVISNLKLE + KTVKELSKKIQVTVPVDTRIVSITVKNAQPEEASRIANALREVAAEKIISVTRVSDVT + TLEEARPALSPSSPNIRRNTLLAFLVGGAVMVVSVLLLELLDDHVKRPEDVEEVMQIA + LLGIIPDLNKLK" + misc_feature 3390..3536 + /gene="wzd" + /locus_tag="SPC29_0006" + /note="Signal 
peptide predicted for SPC1439 by SignalP 2.0 + HMM (Signal peptide probability 0.987) with cleavage site + probability 0.704 between residues 49 and 50" + misc_feature 3408..3824 + /gene="wzd" + /locus_tag="SPC29_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 1.8e-46" + gene 4093..4776 + /gene="wze" + /locus_tag="SPC29_0007" + CDS 4093..4776 + /gene="wze" + /locus_tag="SPC29_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34077.1" + /db_xref="GOA:Q4JZY1" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4JZY1" + /translation="MPTLAIEQKRLDFAKKAEENYNALRTNIQLSGDNLKVLSISSVK + PGEGKSVTSMNIAWAFARAGYKALLVDADIRNSIMSGVFKSREKITGLTDFLAGTTDL + SHGLCDTNIENLFVIQAGPVSPNPTALLQSENFATMIDTMRKYFDYVIVDTAPIGMVI + DAAIITQKCDASILVTAARETKRRDILKAKEQLEQTGVPFLGVILNKFNTEVEKYGAY + GVYGDYRKG" + gene 4787..5419 + /gene="wcjH" + /locus_tag="SPC29_0008" + CDS 4787..5419 + /gene="wcjH" + /locus_tag="SPC29_0008" + /note="member of homology group 61" + /codon_start=1 + /transl_table=11 + /product="putative initial sugar transferase" + /protein_id="CAI34078.1" + /db_xref="GOA:Q4JZY0" + /db_xref="InterPro:IPR003362" + /db_xref="UniProtKB/TrEMBL:Q4JZY0" + /translation="MYFVLKNILDRFLAFFLFITLIIIPIIPITILLIWIEDPGDIFF + FQDRIGLNGKNFKVIKFRSMYKDADQRIKESIISGEIDRLNFKEHSQSMTTKVGKVIR + KLSIDELPQLVNIIKGDMAIVGPRPLQQFEITHHILTHKETGTTLKMSKRLSVKPGLL + CYWQVAPNKNDMPFSDRMNLDLLYIDNVSFKTDFLLILKGFYTVLMGNNN" + misc_feature 4802..5410 + /gene="wcjH" + /locus_tag="SPC29_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 1.5e-23" + gene 5421..6212 + /gene="wciB" + /locus_tag="SPC29_0009" + CDS 5421..6212 + /gene="wciB" + /locus_tag="SPC29_0009" + /note="member of homology group 16" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34079.1" + /db_xref="GOA:Q4JZX9" + 
/db_xref="UniProtKB/TrEMBL:Q4JZX9" + /translation="MKNIKILVATHKKYKIPSDTSLYLPIHVGCEGKKKIGFQGDNSG + ENISNLNPYYCELTGLFWAWKNLDYDYLGLVHYRRYFTSRRQSYREDLNMDSIILSKS + EVEKMMLDYDVVVPRKRKYYIETLYSHYAHTHDRSHLDVTRQIISELNPDYIDTFDKV + MNRRSGYMFNMFIMSKDNVNAYCEWLFPIINELYKRLDITGYSAFDARLFGRVSERLF + NVWLAKQNLRIKETPFIYMEKINLLEKGKSFLQAKFFGKKYGQSF" + gene 6231..7412 + /gene="wzy" + /locus_tag="SPC29_0010" + CDS 6231..7412 + /gene="wzy" + /locus_tag="SPC29_0010" + /note="member of homology group 45" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI34080.1" + /db_xref="UniProtKB/TrEMBL:Q4JZX8" + /translation="MKIVIQRRSLPEILALSALTIFLVMSIFDVTFYVQYLPKIVHRI + LIAILLILLVIKESYKRKLDYRTIISLFSTVLIYLLIGKMSTFSSNIAIGFIFIYVLR + DIPFKSVAKISLAVSVFMLLFVIASAKLGVIINYLEISGPRVRSYLGFRYALYPSILL + MNVIAITLYLKQNNIRYWQWLLLTLSVYWVYGQTDSRLTFYNSCILLVFNILIKWFPD + ILSKLGNVFKIFRLTFIINAIISFWISINYLGSNNSFVNSFLFKLNHMLGGRLFLANK + SLELFGFGLFGKQVDWNGNGLTIEGVRNYQTYLYVDNLYIQILQKFGLLVLVLMLALL + TLTLFKAIKKDQWVIAFILIVMSFQSMIDDLNMYLHYNIFWILIGSLIYTQYHYSNEG + T" + misc_feature 6231..6332 + /gene="wzy" + /locus_tag="SPC29_0010" + /note="Signal peptide predicted for SPC1443 by SignalP 2.0 + HMM (Signal peptide probability 0.972) with cleavage site + probability 0.932 between residues 34 and 35" + gene 7469..8596 + /gene="wcrJ" + /locus_tag="SPC29_0011" + CDS 7469..8596 + /gene="wcrJ" + /locus_tag="SPC29_0011" + /note="member of homology group 129" + /codon_start=1 + /transl_table=11 + /product="putative glycerol phosphotransferase" + /protein_id="CAI34081.1" + /db_xref="GOA:Q4JZX7" + /db_xref="InterPro:IPR007554" + /db_xref="UniProtKB/TrEMBL:Q4JZX7" + /translation="MNKRDRNYYVGLVMKIVTKPLKMLKVREERILFKSYDAENISCN + PKYIYNELKKNNRYELIWVLKNPEKTPEVKAIKYMSLKWLYYIATSKYVITNTGFNFW + LPKKKEQIYLNTWHGGGAYKDSDNLSNISKAQITQTQKSAELEDYFISSCAVFTKEYA + EKRLGFKGKILEVGTPRNDYLIHNHDNASLKNSIRRRLNIADDHFIVIYAPTWRDDAS + TIEDLDYDSLLECLREKYSEVTILVRGHHLQKNLVCIKNSNIINVSDYDDMQELLLIS + 
DLLVTDYSSSIWDMIHGGKKVLLYTPDLDEYLKYREFHVDIKEWSIPYFKTNEELIHF + IFSNGFTNMDEVMKNHMNRFGSFEHGNATQKIVELIEKGNK" + misc_feature 8048..8584 + /gene="wcrJ" + /locus_tag="SPC29_0011" + /note="HMMPfam hit to PF04464, + CDP-Glycerol:Poly(glycerophosphate) gl, score 9e-36" + gene 8593..9573 + /gene="wcrM" + /locus_tag="SPC29_0012" + CDS 8593..9573 + /gene="wcrM" + /locus_tag="SPC29_0012" + /note="member of homology group 117" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34082.1" + /db_xref="GOA:Q4JZX6" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JZX6" + /translation="MKVSVIIPIYNVEKYLRRCLESIVNQTYKDIEIILVNDGSPDNS + KEICEEYVVKYSNIQLINQNNAGLGAARNKGLQYVTGDAITFVDSDDWLELDAIEYYV + ESMKKSDADIVVTKMIRKKEYTPSEEIKKSPVTEEVLTQKQFAKKYFKIDGNNIEYYA + CAKLYKKEIACEVKYPVGLFAEDVPAAFSYIIRSQNIFYSTKVTYNYFFNDNSLTANF + TNKDFDLEKIWDLVTEEAEDFGNEDYILYSKINRYRIDFNLLCRIALSEDKTDIETYV + KKIEELLGKVKRNKKILLEYLPFSRKVILRLFLVNYKLGRNVLRMFKNIM" + misc_feature 8602..9105 + /gene="wcrM" + /locus_tag="SPC29_0012" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 2.8e-47" + gene 9597..10664 + /gene="wcrH" + /locus_tag="SPC29_0013" + CDS 9597..10664 + /gene="wcrH" + /locus_tag="SPC29_0013" + /note="member of homology group 51" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34083.1" + /db_xref="GOA:Q4JZX5" + /db_xref="InterPro:IPR016503" + /db_xref="UniProtKB/TrEMBL:Q4JZX5" + /translation="MGMYYFIKVEKDLKNTAGIKAPDDIERISKELGMQELLFPKFPF + EKNKVFQKLWLFSVIGYKWTSLLWKLKTNDVVIYQHPMYGVRVSNCLIPLLKKCKNIK + FIAVIHDLESLRKGIQGVIEDNETTNTIADTELLSKFDKIISHNSKMTNYLEGIGIKK + ENLVDLEIFDYLDPSEMKEKTEDGVVIAGNLAKGKSSYIYKLIEKKPGFKLNLFGPNF + NIEELPENVKYYGSLTPNELPQKLVGKFGLVWDGDSLDTCGGNTGNYLKFNNPHKTSL + YLASGIPVIIWKEAALAEFIENNNVGFTVNSLSEIEIVLKNISANDYSLMKANTMEVG + KKLREGYFYRQSIYKCKNDLK" + gene 10837..12261 + /gene="wzx" + /locus_tag="SPC29_0014" + CDS 10837..12261 + /gene="wzx" + /locus_tag="SPC29_0014" + 
/note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI34084.1" + /db_xref="GOA:Q4JZX4" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4JZX4" + /translation="MKVLKNYAYNLSYQLLIIILPIITTPYVTRVFSSDDLGSYGYFN + SIVTYFILLATLGVANYGTKVISGHRKNIEKNFWGIYSLQLGATVLSLLFYVILCLSI + SFMKNPTAYILGLSLISKGLDISWLFQGIEDFRKITVRNITVKVIGVTSVFLFVKSAS + DLYLYVFLLTIFELLGQLSMWVPAREFTGKPHFDWLYAKQHLKPVILLFLPQVAISLY + VTLDSTMLGSLSSIRDVGIYDQSLKLVKILLTLVTSLGSVMLPRVSNLLSSGDHKAVN + KMHEMSFLVYNLVIFPIMAGMLIVNDDFVTFFLGQDFQEARYAIAIMIFRMFFIGWTN + IMGIQILIPHNKNKEFMLSTTIPAIVSVGLNLLLLPKLGYIGAAIVSVLTEVLVWLIQ + LFYTRSYLREVPILGSLIKIIISSGVMYGILLFIKQFLNVSPIINVGLYAILGAMIYL + VLILIFRIINPNELKQQLLKNKGA" + misc_feature 10843..11637 + /gene="wzx" + /locus_tag="SPC29_0014" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 5.8e-66" + gene 12263..13366 + /gene="glf" + /locus_tag="SPC29_0015" + CDS 12263..13366 + /gene="glf" + /locus_tag="SPC29_0015" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI34085.1" + /db_xref="GOA:Q4JZX3" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JZX3" + /translation="MYDYLVVGAGLFGAVFAHEAALKGKKVKVIEKRNHIAGNIYTRE + EEGIQVHQYGAHIFHTSDKEIWEYVNQFAEFNRYTNSPVANYKGEIYNLPFNMNTFNK + LWGVVTPAEAQVKIEEQRAILNGKAPENLEEQAISLVGTDIYEKLIKDYTEKQWGKPT + TELPAFIIRRLPVRLTYDNNYFNDTYQGIPIGGYTQIVEKMLDHENIDVETNVDFFVN + KEQYLKDFPKIVFTGMIDEFFDYKLGELEYRSLRFENETLDMENYQGNAVVNYTDAET + PYTRIIEHKHFEFGSQAKTIITKEHSKTWEKGDEPYYPVNNDRNNHLYKSYKKLADEQ + GNVIFGGRLGHYRYYDMHQVIGAALQCVRNELN" + misc_feature 12698..13306 + /gene="glf" + /locus_tag="SPC29_0015" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 9.6e-115" + gene complement(order(13567..14151,14205..14766)) + /gene="tnp" + /locus_tag="SPC29_0016" + /pseudo + CDS 
complement(join(13567..14151,14205..14378,14378..14722, + 14719..14766)) + /gene="tnp" + /locus_tag="SPC29_0016" + /note="member of homology group 13" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1167 transposase" + /db_xref="PSEUDO:CAI34086.1" + misc_feature complement(join(14071..14151,14205..14378,14378..14401)) + /gene="tnp" + /locus_tag="SPC29_0016" + /note="HMMPfam hit to PF01610, Transposase, score 1.1e-33" + /pseudo + gene 15049..>15096 + /gene="aliA" + /locus_tag="SPC29_0017" + CDS 15049..>15096 + /gene="aliA" + /locus_tag="SPC29_0017" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34087.1" + /db_xref="UniProtKB/TrEMBL:Q4K2C2" + /translation="MMKSSRLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcgta taaaaacaag + 181 ggagtactgt ataaaagaca gaaatccttt gttttttata actaaggttt ataaactttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga aaatgaacat + 301 aaagaagcgt gtccttagtg caggtctgac ttttgcatct gctttgcttt tagctgcttg + 361 cggccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaattac ctgttagact attaagctga taatatagtc aattgaaaca agagcaggac + 481 aaaagagcct cgtaaaaggt attgcaactt ggtaatacct ttttgaggtg ctttttgata + 541 tgagcccatg ttttctcaat aggattgtac tcaggtgagt agggaggaag aggtaaaagt + 601 ttatgcccaa actcttcgca taaaagttct agcttcccca ttctatggaa tcttgcatta + 661 tccataataa taaccgatgg tgtgtttaat gttggtaaga gaaatttctg aaactaagct + 721 tcaaaaaagt cgctcgtcat cgtctcttcg taagtcattg gagcgattaa ctcaccattt + 781 gttagacctg caaccaaaga aatcctctga tatcttcttc cagatacttt gcctcttctt + 841 aactgacctt ttaatgagcg accatattct cgataaaaat aagtatcaaa tcctgtttcg + 901 tcaatctaaa caggtgctag gtgctttaaa ctattaaaat tcttaagaaa taaggctact + 961 ttttctgggt tttgttcata attagattga aactagaata gtagacctct gcttctaaaa + 1021 cattgttaga aatcgatttg actgtcctga tagatttgtc atgttcttat 
ttcattttac + 1081 tatatttttg tttcgcggga agtctactaa tgatacttaa agatgcagat agtaaaaaaa + 1141 atgtagacat taccgtaaaa aagtgatata atcgtatgat gttcaaggta taggtgttaa + 1201 tcatgagtag acgttttaaa aaatcacgtt cacagaaagt gaagcgaagt gttaatatcg + 1261 ttttgctgac tatttattta ttgttagttt gttttttatt gttcttaatc tttaagtaca + 1321 atatccttgc ttttagatat cttaacctag tggtaactgc gttagtccta ctagttgcct + 1381 tggtagggct actcttgatt atctataaaa aagctgaaaa gtttactatt tttctgttgg + 1441 tgttctctat ccttgtcagc tctgtgtcgc tctttgcagt acagcagttt gttggactga + 1501 ccaatcgttt aaatgcgact tctaattact cagaatattc aatctgtgtc gctgttttag + 1561 cagatagtga tatcgaaaat gttacgcaac tgacgagtgt gacagcaccg actgggactg + 1621 ataatgaaaa tattcaaaaa ctactagctg atattaagtc aagtcagaat accgatttga + 1681 cggtcaacca gagttcgtct tacttggcag cttacaagag tttgattgca ggggagacta + 1741 aggccattgt cctaaatagt gtctttgaaa acatcatcga gtcagagtat ccagactacg + 1801 catcgaagat aaaaaagatt tataccaagg gattcactaa aaaagtagaa gctcctaaga + 1861 cgtctaagaa tcagtctttc aatatctatg ttagtggaat tgacacctat ggtcctatta + 1921 gttcggtgtc gcgatcagat gtcaatatcc tgatgactgt caatcgagat accaagaaaa + 1981 tcctcttgac cacaacgccg cgtgatgcct atgtaccaat cgcagatggt ggaaataatc + 2041 aaaaggataa attgactcat gctggtatat atggggttga ttcatccatt cataccttag + 2101 aaaaccttta tggtatagat attaattatt atgttcgttt gaattttacc tcatttttga + 2161 aattgattga cttattggga ggggtagatg ttcataatga tcaagagttt tcagctctac + 2221 atgggaagtt ccatttccca gtagggaatg tccatctaga ctctgagcag gctctaggtt + 2281 ttgtacgtga acgctactca ctagccgatg gagaccgtga ccgtggtcgc aaccaacaaa + 2341 aggtgattgt ggctatcctt caaaaattaa cgtcaaccga agcactgaaa aattatagta + 2401 cgatcattaa tagcttgcaa gattctatcc aaacaaatat gccacttgag actatgataa + 2461 aattggtcaa tgctcagtta gaaagtagag ggaattataa agtaaattct caagatttaa + 2521 aaggtacagg tcggatggat cttccttctt atgcaatgcc agacagtaac ctctatgtga + 2581 tggaaataga tgatagtagt ttagctgtag ttaaagcagc tatacagaat gtgatggagg + 2641 gtagatgaaa tgatagacat ccattcgcat atcgtttttg atgtagatga cggtcccaag + 2701 tcaagagagg 
aaagcaaggc tctcttggca gaatcctaca ggcagggggt gcgaaccatt + 2761 gtctctacct ctcaccgtcg caagggcatg tttgaaactc cggaagagaa gatagcagaa + 2821 aactttcttc aggttcggga aattgcaaaa gaagtagcag atgatttagt cattgcttat + 2881 ggcgcagaga tatactatac tctggatgct ctagaaaagc tagaaaaaaa agaaattcct + 2941 acccttaatg atagtcgtta tgccttgatt gagtttagca tgcatacttc ctatcgtcag + 3001 attcatacgg gattgagcaa tattttgatg ttgggaatta ctccagtcat tgcccacatc + 3061 gagcgctatg atgctcttga aaataatgaa aaacgcgttc gggaactgat tgatatgggg + 3121 tgctatactc agataaatag ttatcatgtt ttaaaaccta agctctttgg tgaaagatat + 3181 aaatttatga aaaagagagc tcggtatttt ttggaacgtg atttagttca tgtagttgca + 3241 agtgatatgc acaatttgaa caaacgtccc ccttatatga aagaagccta tgaacttatc + 3301 tcaaaacaat acggtgaaag aagagcgaga gaattattta ttgaaaatcc tcgcttaatc + 3361 ttatctgatc aaattattta ggagttgaca tgaaagaaaa taaagaaatt acgattgatg + 3421 tttttcaatt gtttaaagtc ctttggaaga agaaaacctc tattatacta actgcgattg + 3481 tagcagctgt cctagctttt gctgtaagta gttttgtact gacacctgag tattctagta + 3541 cgacacgtat ttatgtggtc aatcgaaatc aatcggaaaa agcagggttg acgaaccagg + 3601 atttgcaggc tgggacctat ctggtaaagg actataagga aatcatcatc tctcaagatg + 3661 tacttgagga agtcatttca aatcttaaac tagagaaaac agttaaggaa ttaagcaaga + 3721 agattcaggt aacagtacct gtggatactc gtatcgtatc aattactgta aaaaatgcac + 3781 aaccagaaga agctagccgt atcgcaaatg ctcttcgtga agtggctgct gaaaaaatca + 3841 tttctgtaac tcgtgtatct gatgtgacaa cattggaaga agcaaggcca gccctaagtc + 3901 cttcatcacc taatattcgt cgtaataccc tgctagcttt tctagtggga ggagcagtga + 3961 tggtagtttc agtcttgtta cttgagttgt tggatgatca tgttaaacga ccagaagacg + 4021 tggaagaagt aatgcagatt gcacttctag ggattattcc agatttgaat aagttaaaat + 4081 aagggagaaa atatgccaac attagcaata gaacaaaaac gtttagattt tgcgaaaaaa + 4141 gcagaagaga attacaatgc tttgcgaaca aatattcaat tgagtggtga taatctgaaa + 4201 gttctttcca tctcgtctgt taaacctggt gaggggaaat cggtaacatc aatgaatatt + 4261 gcttgggcct ttgcgcgtgc aggctataaa gctttattgg tggatgcgga tattcgtaat + 4321 tctatcatgt caggagtctt taaatcaaga 
gaaaaaatta ctgggctaac ggattttctg + 4381 gcaggtacca ctgacctttc tcatggactt tgtgatacaa atattgaaaa tttatttgtt + 4441 attcaggcag gacctgtatc ccctaaccca acagcacttt tacagagtga aaactttgcc + 4501 actatgattg atactatgcg taagtatttt gactatgtca ttgtcgatac tgcaccgatt + 4561 gggatggtca ttgatgctgc tattatcaca caaaaatgtg atgcttctat tttggtaaca + 4621 gcagcgaggg aaacaaagcg tcgtgatatt ttgaaagcaa aggaacagtt agaacagaca + 4681 ggagtacctt ttttaggagt tattctaaat aaattcaaca cagaagttga aaaatatgga + 4741 gcttatggtg tctatggaga ttataggaag ggataattga taaaaagtgt attttgtttt + 4801 aaaaaatatt ttagatagat ttttggcgtt tttcctattt atcacactga taatcatacc + 4861 gattattccg ataacaattc tgcttatttg gatagaagat ccaggagata tatttttctt + 4921 tcaagataga attggtttaa atgggaagaa ctttaaagta ataaagtttc ggagtatgta + 4981 taaagatgcc gatcaaagaa taaaggaaag tattattagt ggtgaaattg atcgtctaaa + 5041 ttttaaagaa cattctcaaa gtatgactac aaaagtcggt aaagtgatac gaaaactttc + 5101 aattgatgaa ttgcctcaat tagtgaatat tataaaaggt gatatggcta tagtgggacc + 5161 tcgtccatta caacaatttg aaataactca tcatattctt acccataaag aaacggggac + 5221 tactttaaag atgtctaaaa gattgtctgt gaaacctggt ttgctttgtt attggcaagt + 5281 tgcgccgaat aaaaatgaca tgccttttag tgatagaatg aatctagatt tattatacat + 5341 tgataatgta tctttcaaga ctgatttctt gcttattttg aagggattct atacagtttt + 5401 aatgggtaat aacaattaac atgaaaaata taaaaatatt agtagcaaca cataaaaaat + 5461 ataaaatacc cagtgataca agtttgtatc taccaattca tgtaggatgt gaaggaaaga + 5521 aaaaaattgg atttcaaggt gacaattcag gagaaaatat ttctaattta aatccttatt + 5581 attgtgaatt gactggcttg ttttgggctt ggaaaaactt agattatgat tatcttggat + 5641 tagtacacta tcgtagatat tttacttcaa gacgtcaatc ttatcgtgaa gatctcaaca + 5701 tggatagtat cattttatct aaatcagagg ttgaaaaaat gatgctggac tatgatgttg + 5761 ttgttccacg taaaagaaaa tattatattg aaactctcta ttctcactat gcacatactc + 5821 atgatcgaag tcatttagat gttactcgcc aaatcattag tgagttaaat ccggattata + 5881 ttgatacgtt tgataaagtg atgaatcgtc gtagcggcta tatgtttaac atgtttatca + 5941 tgtcaaaaga taatgtgaat gcatattgtg agtggttatt cccaattatt 
aatgagttat + 6001 ataaacggtt ggatattaca ggctattcgg cttttgatgc gagattgttt ggacgtgtca + 6061 gtgaacgctt atttaatgtt tggttagcta agcaaaattt gcgcataaaa gagacgcctt + 6121 ttatttatat ggagaaaatc aacttacttg aaaaagggaa atccttcctt caagcaaaat + 6181 tctttggtaa aaagtatgga cagagttttt agttgggaat aaaaatagtg atgaaaatag + 6241 taatacaaag aaggtctttg ccagaaattt tagctcttag tgcactaact atatttttag + 6301 ttatgtcaat ttttgatgtg actttttatg ttcagtatct gccgaaaatt gttcacagga + 6361 tactgatagc tattttgctt attctgcttg ttataaaaga gtcgtacaaa agaaagcttg + 6421 attatagaac tatcataagt ctattttcta ctgttttaat ttatctcctt atagggaaga + 6481 tgagtacttt tagttctaat attgcaatag gtttcatttt tatttatgtt ttacgcgata + 6541 tcccttttaa aagtgtggca aaaatttctt tagcggtaag tgtgttcatg ttactctttg + 6601 ttatagctag cgcaaagttg ggagttatta taaattattt agagatttct gggccccgag + 6661 tccgtagcta tctaggtttc agatatgcct tgtatccatc aatcctactt atgaatgtca + 6721 ttgcgattac actttattta aagcaaaaca atataaggta ttggcagtgg ttattactaa + 6781 ccttgtctgt ttactgggta tatggacaaa ctgattctcg cttaacattt tacaattctt + 6841 gtatattatt agtcttcaat atactaataa agtggttccc tgatattttg tctaagttag + 6901 gaaatgtgtt taaaattttt aggctgacct ttattataaa tgcaataatt agcttttgga + 6961 tttcaataaa ttatctcgga tcaaacaatt cttttgtaaa cagtttctta ttcaagttaa + 7021 atcacatgtt aggtggtcga cttttcttag ctaataaatc tctagaatta ttcggttttg + 7081 gtttgtttgg aaaacaggtt gactggaatg gaaatggtct gaccattgaa ggagtcagga + 7141 attatcagac ctatctttat gtcgataatt tgtatattca aattctacaa aaatttggtt + 7201 tactcgttct agttttaatg ttagcgttgt taacgttaac actgtttaaa gctataaaga + 7261 aagatcagtg ggtcattgct tttattttaa tcgtaatgag ttttcaatcc atgatagacg + 7321 atctaaacat gtaccttcat tacaatatct tttggatttt gataggaagt ttaatataca + 7381 ctcagtatca ctattctaat gaggggactt aaaagtttta gaataagtag tttgataaat + 7441 aaagaggaaa gttttaacag ggattgaaat gaataaaaga gataggaatt actatgttgg + 7501 attagtaatg aagattgtta ctaaaccttt aaaaatgttg aaggtaaggg aagaacgcat + 7561 tttatttaaa agctatgatg cagaaaatat atcgtgtaat ccaaaatata tttataatga + 7621 actaaaaaaa 
aataatcgtt atgaattgat ttgggttttg aaaaaccctg aaaaaacccc + 7681 ggaggtaaaa gctataaagt atatgtcatt gaaatggttg tattatatag caacatctaa + 7741 gtatgtgata acaaatacag gttttaattt ttggttacct aaaaagaaag aacagatata + 7801 tctgaacaca tggcacgggg gtggagcgta taaagatagt gacaatctaa gtaatataag + 7861 taaagcgcaa ataacccaaa ctcaaaaaag tgctgaattg gaagattatt ttatttcgag + 7921 ttgtgccgtt tttacaaagg agtacgcaga gaaaagacta ggattcaaag gaaaaatttt + 7981 agaggtgggt acgccgagaa atgattatct aattcataac catgataatg cttctttaaa + 8041 aaatagtatt agaagaagat taaatattgc agatgatcat ttcatagtaa tctatgctcc + 8101 aacatggcgt gatgacgctt ctactataga ggatttagat tatgatagtt tgctagagtg + 8161 tttaagagaa aaatattcag aagtgactat tttagtccga gggcatcacc ttcaaaagaa + 8221 cttggtatgt attaagaatt caaatattat taatgtatca gattatgatg atatgcaaga + 8281 attattactt atatcagatt tgttagtaac tgattactca tcatcaattt gggatatgat + 8341 tcatggaggt aagaaagttt tgttatatac tccagattta gatgaatact taaaatatcg + 8401 tgaatttcat gtagatataa aagaatggag tattccatat tttaagacta atgaggagtt + 8461 gattcatttt atattttcaa atggatttac taacatggac gaagtaatga agaatcatat + 8521 gaatagattt ggtagttttg aacatgggaa cgctacccaa aaaatagtag aattaataga + 8581 aaagggaaat aaatgaaggt tagtgtaata atacctatct ataatgtaga aaagtattta + 8641 agaaggtgtc tagaatccat tgttaatcag acatataagg acattgaaat aattttagta + 8701 aatgatggtt ctccagataa ttcaaaagaa atatgtgaag aatatgtagt taaatattcc + 8761 aatattcaat taataaatca aaataatgca ggtttaggtg cggctagaaa taaaggtttg + 8821 cagtatgtaa caggtgatgc gattactttc gtagattccg atgattggct tgaattagac + 8881 gcaattgaat attacgtgga atctatgaaa aagagtgatg cagatattgt agttactaaa + 8941 atgattagga aaaaagagta tactcctagt gaagaaatta agaagtcgcc ggtaacagag + 9001 gaagttctaa ctcagaaaca gtttgcgaaa aaatatttta aaatagatgg aaataatata + 9061 gaatattatg cttgtgccaa actttataag aaagaaattg cttgtgaggt taaatatcca + 9121 gttggtttat ttgctgaaga tgtacccgca gctttcagct atattatacg ttcacaaaat + 9181 atattctata gcacaaaagt aacttataat tattttttta acgataatag tttaacagcg + 9241 aattttacaa ataaagattt tgatttagag 
aagatttggg atttagtaac tgaagaagct + 9301 gaggattttg gaaacgagga ttatatttta tattctaaga taaataggta tagaatagac + 9361 tttaatcttt tgtgtaggat agcactatca gaagataaaa cagatattga aacatatgtt + 9421 aaaaaaatag aggaactact tggtaaagtt aaaagaaata agaaaatctt attagagtat + 9481 ttaccgtttt ctagaaaagt gatattgaga ttatttttgg ttaattacaa actaggaaga + 9541 aatgttttga gaatgtttaa aaatattatg tagttaataa atggtaatat aaggggatgg + 9601 gaatgtatta ttttataaaa gtagaaaaag atttaaaaaa tactgccgga ataaaagctc + 9661 cggatgatat agagagaatt tcaaaagaat taggaatgca agaattacta ttccctaaat + 9721 ttccatttga aaaaaataaa gtatttcaaa aactctggct ttttagtgtc ataggctaca + 9781 agtggacgag ccttttatgg aaacttaaaa ccaatgatgt agttatatat caacacccaa + 9841 tgtacggagt gagagtgtcc aattgtttga ttccattgtt aaaaaaatgc aaaaacatta + 9901 aatttatagc agtaatacat gatttggaat cactaagaaa aggtattcaa ggagttatcg + 9961 aagataatga aacaacaaat actattgcag atacagagtt gctatcgaaa ttcgataaaa + 10021 taatctctca taattcaaaa atgacaaatt atttggaagg gattggaata aaaaaagaaa + 10081 atttagttga tttagaaata tttgattatc tggacccatc ggaaatgaaa gaaaaaactg + 10141 aagatggagt agttatagct ggcaatctag ctaaaggtaa gagctcctat atttacaagc + 10201 taattgaaaa aaaaccagga tttaaattga acctttttgg tccgaatttt aatattgaag + 10261 aattgccaga gaatgttaaa tactatggta gtttaacacc aaatgaatta cctcaaaaac + 10321 tagtaggtaa gtttggattg gtttgggatg gtgatagttt agatacctgt ggcggaaaca + 10381 ctggtaatta tctgaaattt aataatccgc acaaaacatc cctatatctt gcttctggaa + 10441 taccagtgat tatatggaaa gaagctgcct tagcggaatt tattgaaaat aataatgttg + 10501 gatttactgt aaatagttta tcagaaatag aaattgtgtt aaaaaatata tcagcaaatg + 10561 attattcttt gatgaaagca aatacaatgg aagtgggaaa gaaattaaga gagggttatt + 10621 tttatcgtca atctatatat aaatgcaaaa atgatttgaa atagtagtag aattactaat + 10681 cgaaagccca taagctccta gtaactaatg tatactactg tccaaaaata ttatttacat + 10741 taaatgaaaa attgtgcgca aatagataat ttgagttttt gcaaacataa aacagagctc + 10801 taaaaataat aatttatatg gaaactgtaa acactaatga aagtattaaa aaactatgcc + 10861 tacaaccttt cttatcagtt gttgataatt atactcccta 
tcattactac tccctatgtg + 10921 acacgagtct tttcttcgga tgatttagga tcatatggtt atttcaattc gatagtgact + 10981 tattttatct tgttagcaac acttggggtt gctaactatg gtacaaaggt aatttcagga + 11041 catcgtaaaa acattgaaaa gaacttttgg ggcatctatt cgttacaatt aggtgcgaca + 11101 gttctttcac tgttattcta tgtcattcta tgtctctcta tatcttttat gaaaaatcca + 11161 acagcctata ttcttggatt gagtttaata tcaaaaggct tggatatttc ctggcttttt + 11221 caagggatag aggattttcg aaaaattaca gtaagaaata taactgtaaa agtcattggg + 11281 gtaacctcgg ttttcttatt tgtaaaatca gctagcgacc tctatcttta tgtttttctt + 11341 ttaacgatat ttgagttatt agggcaactt agtatgtggg taccagctcg ggaatttact + 11401 gggaaaccgc actttgactg gttgtatgct aaacaacatt tgaaaccagt tatcttatta + 11461 tttttaccac aggtcgctat atcgctttat gtgactttag atagtactat gcttggttct + 11521 ctatcttcaa ttagagatgt aggaatttat gatcaatctt tgaaacttgt caaaatatta + 11581 ttaacattag taacttcatt aggaagtgtc atgttgccac gagtttcaaa tcttttatct + 11641 tcaggggatc ataaagcagt taataaaatg catgagatgt catttctggt ttataacttg + 11701 gttatttttc ctattatggc aggaatgcta attgtaaatg atgactttgt aacctttttc + 11761 ctcgggcaag attttcaaga ggcacgttat gcgatagcaa ttatgatttt tagaatgttc + 11821 tttattggtt ggaccaatat tatggggatt caaattttga tacctcataa taaaaataaa + 11881 gaatttatgc tgtcaacaac aattcctgct attgttagtg taggcttaaa tcttctcttg + 11941 cttccaaagc tgggctatat aggtgcggca attgtatctg ttttaacaga ggtactagta + 12001 tggctgatac agttattcta tactcgttct tatttgagag aggtgcccat tctaggttca + 12061 ttgatcaaaa ttataatctc atctggagtt atgtatggta tcttgttatt tataaaacaa + 12121 ttcctaaatg tatcaccgat aatcaatgtg ggactatatg ctattctggg agcaatgatc + 12181 tatctcgtat taattttgat ttttaggatt ataaatccaa atgagttaaa acaacaatta + 12241 ttaaaaaata aaggagcata aaatgtacga ttatcttgtt gttggtgctg gtctctttgg + 12301 tgcagtcttt gcccatgaag cagccttaaa aggaaaaaaa gtaaaagtta ttgaaaaacg + 12361 aaatcatatc gcgggtaata tctatactcg tgaagaggaa ggaattcaag ttcatcaata + 12421 tggtgctcat atcttccata cttctgataa ggagatctgg gagtatgtaa atcagtttgc + 12481 agagtttaac cgttatacca attctcctgt tgcaaactat 
aagggagaga tttataactt + 12541 accttttaat atgaatacct tcaataaact ctggggagtt gtgacgccag cagaagcaca + 12601 agttaagatt gaggaacaac gtgctatttt aaatggtaaa gctcctgaaa atttggaaga + 12661 acaagcgatt tctcttgtag gtacagacat ctacgaaaaa ttaatcaaag actatacaga + 12721 gaaacagtgg ggcaaaccaa ctactgaact tccagccttt attattcgcc gtttgccagt + 12781 acgtctgacc tatgataaca actattttaa cgatacctat caagggattc caattggtgg + 12841 atacactcaa atagttgaaa aaatgttgga tcatgaaaat attgatgtag aaacaaatgt + 12901 tgatttcttt gtgaataaag agcaatatct gaaagatttt cctaagattg tctttactgg + 12961 tatgattgat gaattctttg actataagtt gggcgaacta gagtaccgta gtcttcgttt + 13021 tgaaaatgag accttggata tggaaaatta ccaaggaaat gcagttgtga actatacgga + 13081 tgcagaaacc ccatatactc gcattattga acacaaacat tttgagtttg ggagtcaagc + 13141 aaagactatc attactaaag aacattctaa aacatgggaa aaaggtgatg agccttatta + 13201 tccagttaat aatgatcgta ataatcattt gtataaatca tataaaaaac ttgctgatga + 13261 gcaagggaat gttatctttg gtggccgctt aggacactat cgttattacg atatgcacca + 13321 agtaattgga gcagctttgc agtgcgtgag aaatgagtta aattaatact caatgaaaat + 13381 taaagagcaa actaggaagc tagccacagg ttgctcaaaa cactgttttg aggttgcaga + 13441 tggaagctga cgcggtttga agagattttc gaagagtata aacaagtaaa actgactacc + 13501 agttattatt tagaaatagt attataaatt ccggctcttt gtcaactgta gtgggttgaa + 13561 aaaaagctaa gctcgagaaa ggacaaattt cgtcctttct tttttgatgt tcagagcgat + 13621 aaaaatccgt tttttgaagt tttcaaagtt tcgaaaacca aaggcattgc gcttgataag + 13681 tttgatgaga ttattggtcg cttccaattt ggcgttagaa tagtgtagtt gaagggcgtt + 13741 gacgattttc tctttgtcct ttagaaaggt tttaaagaca gtctgaaaaa gaggatgaac + 13801 ctgcttaaga ttgtcctcaa tgagtccgaa aaatttctct ggttccttat tctgaaagtg + 13861 aaacagcaag agttgataga gctgatagtg atgtttcaag tcttgtgaat agctcaaaag + 13921 cttgtctaaa atctctttat tggttaaatg catacgaaaa gtagggcgat aaaaatgttt + 13981 atcgctgagt ttacgactat cctgttgtat gagtttccag tagcgcttga tagccttgta + 14041 ttcatgggat tttcgatgaa actgattcat gatttggaca cgcacacgac tcatagcacg + 14101 gctaagatgt tgtacaatat gaaagcgatc aagaacgatt 
ttagcattcg ggagtgaaac + 14161 agtctgggag actgtttcag cctgagccta gaaatttgaa agcgaagctg tttagctaag + 14221 tcatagtaag gactaaacat atccatagta ataattttga cgcgacatcg gacggctcta + 14281 tcatatttaa gaaagtgatc tcggatgaca gcttgtgttc taccctcaag aacagtgatg + 14341 atatcgagct tttcaaaatc ttgcgcaata aagctcatct ccatctcccg attgaaacag + 14401 tcactccccg gactgtttca acgtcccaag acataatctt aggcagattt ctaaaattac + 14461 actcaaagtg gaagtcattg agctttcgaa tgacagttga agttgaaatg gccagctgat + 14521 gggcaatatc ggtcatagaa atcttttcaa ttaacttttg cgcaatcttt tggttgataa + 14581 tacgaggaat ttggtgattt ttcttgacga tagaagtttc agcgaccatc attttcaagc + 14641 aatgatagca cttaaaacga cgttttctaa ggagaattct agtaggcata ccagtcgttt + 14701 caaggtaagg aattttatag ggtctttaat gtctagtaat tttgtgataa aatgtaattg + 14761 ttccatatga ttctttctaa tgagttgttt tgtcgctttt cattatagat cttatgggac + 14821 tttttttcta cccaaaatag gctccataat atccataggg aatttaccca ctacaaatat + 14881 tatagagcct aaattccttg actatgtgat atagttgagg gatttttaaa tgatattcat + 14941 attttttgca aagatgttgt ttgaaaaata attttcaaaa attctgaaaa ttctgttgac + 15001 atctttctga aaagagtcta taatggagag aaagttttaa aggagaaaat gatgaaaagt + 15061 tcaagactac ttgcccttgc gggcgtgaca ttattg +// + diff --git a/public/res/serotype_genbank/serotype_29X.gb b/public/res/serotype_genbank/serotype_29X.gb new file mode 100755 index 0000000..62c61e5 --- /dev/null +++ b/public/res/serotype_genbank/serotype_29X.gb @@ -0,0 +1,737 @@ +LOCUS MK606434 18991 bp DNA linear BCT 30-SEP-2020 +DEFINITION Streptococcus pneumoniae strain GPS_MW_BQN1M5 cps gene cluster, + complete sequence. +ACCESSION MK606434 +VERSION MK606434.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. 
+REFERENCE 1 (bases 1 to 18991) + AUTHORS van Tonder,A.J., Gladstone,R.A., Lo,S.W., Nahm,M.H., du Plessis,M., + Cornick,J., Kwambana-Adams,B., Madhi,S.A., Hawkins,P.A., + Benisty,R., Dagan,R., Everett,D., Antonio,M., Klugman,K.P., von + Gottberg,A., Breiman,R.F., McGee,L., Bentley,S.D. and The Global + Pneumococcal Sequencing,C.O. + TITLE Putative novel cps loci in a large global collection of pneumococci + JOURNAL Microb Genom 5 (7) (2019) + PUBMED 31184299 +REFERENCE 2 (bases 1 to 18991) + AUTHORS van Tonder,A.J. + TITLE Direct Submission + JOURNAL Submitted (06-MAR-2019) Parasites and Microbes, Wellcome Sanger + Institute, Wellcome Genome Campus, Hinxton, Cambridge CB10 1SA, + United Kingdom +COMMENT ##Assembly-Data-START## + Assembly Method :: Velvet v. 1.2 + Sequencing Technology :: Illumina + ##Assembly-Data-END## +FEATURES Location/Qualifiers + source 1..18991 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="GPS_MW_BQN1M5" + /isolation_source="nasopharyngeal swab" + /host="Homo sapiens" + /db_xref="taxon:1313" + /geo_loc_name="Malawi" + /collection_date="2015" + misc_feature 1..18991 + /note="cps gene cluster" + gene 1..1608 + /gene="dexB" + CDS 1..1608 + /gene="dexB" + /EC_number="3.2.1.70" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3280" + /inference="protein motif:CLUSTERS:PRK10933" + /inference="protein motif:Pfam:PF00128.18" + /inference="protein motif:TIGRFAMs:TIGR02403" + /inference="similar to AA sequence:RefSeq:YP_004326655.1" + /inference="similar to AA sequence:UniProtKB:Q99040" + /note="trehalose-6-phosphate hydrolase; maltooligosyl + trehalose synthase; alpha,alpha-phosphotrehalase; alpha + amylase catalytic domain protein" + /codon_start=1 + /transl_table=11 + /product="glucan 1,6-alpha-glucosidase" + /protein_id="QCO91986.1" + /translation="MQEKWWHNAVVYQVYPKSFMDSNGDGIGDLPGITSKLDYLAKLG + ITAIWLSPVYDSPMDDNGYDIADYQAIAAIFGTMEDMDELIAEAKKRDIRIIMDLVVN + 
HTSDEHAWFVEACENPNSPERDYYIWRDEPNDLDSIFSGSAWEYDEKSGQYYLHFFSK + KQPDLNWENEKLRQKIYEMMNFWIDKGIGGFRMDVIDMIGKIPDEKVVNNGPMLHPYL + KEMNQATFGAKDLLTVGETWGATPEIAKLYSDPKGQELSMVFQFEHIGLQYQEGQPKW + HYQKELNIAKLKEIFNKWQTELGVEDGWNSLFWNNHDLPRIVSIWGNDQEYREKSAKA + FAILLHLMRGTPYIYQGEEIGMTNYPFETLDQVEDIESLNYAREALEKGVPIEEIMDS + IRVIGRDNARTPMQWDESKNAGFSTGQPWLAVNPNYEMISVQEALANPDSIFYTYQKL + VQIRKENSWLVRADFELLDTADKVFAYIRKDGDRRFLVVANLSNEEQDLTVEGKVKSV + LIENTAAKEVLEKQVLAPWDAFCVELL" + CDS 2165..2413 + /inference="ab initio prediction:Prodigal:2.60" + /codon_start=1 + /transl_table=11 + /product="hypothetical protein" + /protein_id="QCO91987.1" + /translation="MLVREISETKLQKSRSSSSLRKSLEQLTHHLLDLQPKKSSDIFF + QILCLLLTDLLMSDHILDKNKYRILFRQSKQVLGALNY" + gene 2681..4126 + /gene="wzg" + CDS 2681..4126 + /gene="wzg" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK09379" + /inference="protein motif:Pfam:PF03816.8" + /inference="protein motif:TIGRFAMs:TIGR00350" + /inference="similar to AA sequence:RefSeq:YP_001835063.1" + /inference="similar to AA sequence:UniProtKB:Q7WY78" + /note="putative transcriptional regulator ywtF; + membrane-bound transcriptional regulator LytR; cell + envelope-related function transcriptional attenuator + common domain; cell envelope-related transcriptional + attenuator domain protein" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Cps14A" + /protein_id="QCO91988.1" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKRAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSVSVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLMST + KALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + gene 
4128..4859 + /gene="wzh" + CDS 4128..4859 + /gene="wzh" + /EC_number="3.1.3.48" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG4464" + /inference="protein motif:Pfam:PF02811.13" + /inference="similar to AA sequence:RefSeq:YP_003878593.1" + /inference="similar to AA sequence:UniProtKB:Q9AHD4" + /note="capsular polysaccharide biosynthesis protein; PHP + domain protein" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein phosphatase wzh" + /protein_id="QCO91989.1" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLAIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKSKLFGERYKFMKKRAQYFLEQDLVHVIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + gene 4865..5560 + /gene="wzd" + CDS 4865..5560 + /gene="wzd" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3944" + /inference="protein motif:Pfam:PF02706.9" + /inference="protein motif:TIGRFAMs:TIGR01006" + /inference="similar to AA sequence:RefSeq:YP_003724090.1" + /inference="similar to AA sequence:UniProtKB:P72367" + /note="capsular polysaccharide type 8 biosynthesis protein + cap8A; capsular polysaccharide biosynthesis protein; MPA1 + family polysaccharide export protein; chain length + determinant protein" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + wzd" + /protein_id="QCO91990.1" + /translation="MMKEQNTIEIDVFQLFKTLWKRKLMILLVALVTGAGAFVYSAFI + VKPEYTSTTRIYVVNRDQGDKSGLTNQDLQAGTYLVKDYREIILSQNVLEKVATNLKL + DIPAKTLARKVQVTVPVDTRIVSISVKDKQPEEASRIANSLREVAAEKIIAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIELFDIRVKRPEDVEDVLQI + PLLGVVPDLNKMK" + gene 5570..6253 + /gene="wze" + CDS 5570..6253 + /gene="wze" + /EC_number="2.7.10.1" + /EC_number="2.7.10.2" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3944" + /inference="protein motif:CLUSTERS:PRK11519" + 
/inference="protein motif:Pfam:PF01656.17" + /inference="protein motif:TIGRFAMs:TIGR01007" + /inference="similar to AA sequence:RefSeq:YP_002510377.1" + /inference="similar to AA sequence:UniProtKB:Q54520" + /note="tyrosine-protein kinase CpsD; tyrosine kinase; + capsular polysaccharide biosynthesis protein; capsular + exopolysaccharide family protein; CobQ/CobB/MinD/ParA + nucleotide binding domain" + /codon_start=1 + /transl_table=11 + /product="capsule biosynthesis tyrosine-protein kinase + Wze" + /protein_id="QCO91991.1" + /translation="MPTLEISQAKLDFVKKAEENYNALCTNLQLSGDDLKVFSITSVK + QGEGKSTTSTNIAWAFARAGYKTLLIDGDIRNSVMLGVFKARDKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVI + DAAIITQKCDASILVTKAGEINRRDIQKAKEQLEHTGVPFLGVVLNKFNTEVEKYGAY + GVYGNYKKG" + gene 6453..6896 + /gene="wcaJ" + CDS 6453..6896 + /gene="wcaJ" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK15204" + /inference="protein motif:Pfam:PF02397.10" + /inference="protein motif:TIGRFAMs:TIGR03025" + /inference="similar to AA sequence:RefSeq:YP_139560.1" + /inference="similar to AA sequence:UniProtKB:P71241" + /note="putative colanic biosynthesis UDP-glucose lipid + carrier transferase; undecaprenyl-phosphate galactose + phosphotransferase; exopolysaccharide biosynthesis + polyprenyl glycosylphosphotransferase; bacterial sugar + transferase" + /codon_start=1 + /transl_table=11 + /product="truncated exopolysaccharide biosynthesis + protein" + /protein_id="QCO91992.1" + /translation="MYKDADQRIKGSIISGEIDRLNFKEHSQSMTTKVGKVIRKLSID + ELPQLVNIIKGDMAIVGPRPLQQFEINHHILTHKEMGTTLKMSKRLSVKPGLLCYWQV + TPNKNDMPFSDRMNLDLLYIDNVSFKTDFLLILKGFYTVLMGNNN" + gene 6898..7689 + /gene="wciB" + CDS 6898..7689 + /gene="wciB" + /inference="ab initio prediction:Prodigal:2.60" + /inference="similar to AA sequence:RefSeq:YP_004326647.1" + /codon_start=1 + /transl_table=11 + /product="glycosyl transferase WciB" + /protein_id="QCO91993.1" + 
/translation="MKNIKILVATHKKYKIPSDTSLYLPIHVGCEGKKKIGFQGDNSG + ENISNLNPYYCELTGLFWAWKNLDYDYLGLVHYRRYFTSRRQSYREDLNMDSIILSKS + EVEKMMLDYDVVVPRKRKYYIETLYSHYAHTHDRSHLDVTRQIISELNPDYIDTFDKV + MNRRSGYMFNMFIMSKDNVNAYCEWLFPIINELYKRLDITGYSAFDARLFGRVSERLF + NVWLAKQNLRIKETPFIYMEEINLLEKGKSFLQAKFFGKKYGQSF" + gene 7708..8889 + /gene="wzy" + CDS 7708..8889 + /gene="wzy" + /inference="ab initio prediction:Prodigal:2.60" + /inference="similar to AA sequence:RefSeq:YP_004326646.1" + /note="lipid A core O-antigen ligase-related enzyme; + O-antigen ligase" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="QCO91994.1" + /translation="MKIVIQRRSLPEILALSALTIFLVMSIFDVTFYIQYLPKIVHRI + LIAILLILLVIKESYKRKLDYRTIISLFSTVLIYLLIGKMSTFSSNIAIGFIFIYVLR + DIPFKSVAKISLAVSVFMLLFVIASAKLGVIINYLEISGTRVRNYLGFRYALYPSILL + MNVIAITLYLKQNNIRYWQWLLLTLSVYWVYGQTDSRLTFYNSCILLAFNILIKWFPD + ILSKLGNVFKIFRLTFIINAIISFWISINYLGSNNSFVNSFLFKLNYTLGDRLFLANK + SLELFGFGLFGKQVDWNGNGLTIEGVRNYQTYLYVDNLYIQILQKFGLLVLVLMLALL + TLTLFKAIKKDQWVIAFILIVMSFQSMIDDLNMYLHYNIFWVLIGSLIYTQYHYSNEG + T" + gene 8946..10073 + /gene="wcrJ" + CDS 8946..10073 + /gene="wcrJ" + /EC_number="2.7.8.12" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF04464.8" + /inference="similar to AA sequence:RefSeq:YP_002510384.1" + /inference="similar to AA sequence:UniProtKB:P13485" + /note="CDP-glycerol:poly(glycerophosphate) + glycerophosphotransferase" + /codon_start=1 + /transl_table=11 + /product="glycerol phosphotransferase WchX" + /protein_id="QCO91995.1" + /translation="MNKRDRNYYVGLVMKIVTKPLKMLKVREERILFKSYDAENISCN + PKYIYNELKKNNRYELIWVLKNPEKTPEVKAIKYMSLKWLYYIATSKYVITNTGFNFW + LPKKKEQIYLNTWHGGGAYKDSDNLSNISKAQITQTQKSAELEDYFISSCAVFTKEYA + EKRLGFKGKILEVGTPRNDYLIHNHDNAFLKNSIRRRLNIADDHFIVIYAPTWRDDAS + TIEDLDYDSLLECLREKYSEVTILVRGHHLQKNLVCIKNSNIINVSDYDDMQELLLIS + DLLVTDYSSSIWDMIHGGKKVLLYTPDLDEYLKYREFHVDIKEWSIPYFKTNEELIHF + IFSNGFTNMDEVMKNHMNRFGSFEHGNATQKIVELIEKGNK" + gene 
10070..11050 + /gene="wcrM" + CDS 10070..11050 + /gene="wcrM" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3858" + /inference="protein motif:CLUSTERS:PRK10073" + /inference="protein motif:Pfam:PF00535.20" + /inference="protein motif:TIGRFAMs:TIGR03937" + /inference="similar to AA sequence:RefSeq:YP_006070839.1" + /inference="similar to AA sequence:UniProtKB:Q8L0V4" + /note="hyaluronan synthase; putative glycosyl transferase; + putative glycosyl hydrolase; poly-beta-1,6 + N-acetyl-D-glucosamine synthase; Glycosyl transferase + family 2" + /codon_start=1 + /transl_table=11 + /product="family 2 glycosyl transferase" + /protein_id="QCO91996.1" + /translation="MKVSVIIPIYNVEKYLRRCLESIVNQTYKDIEIILVNDGSPDNS + KEICEEYVVKYSNIQLINQNNAGLGAARNKGLQYVTGNAITFVDSDDWLELDAIEYYV + ESMKKSDADIVVTKMIRKKEYTPSEEIKKSPVTEEVLTQKQFAKKYFKIDGNNIEYYA + CAKLYKKEIACEVKYPVGLFAEDVPAAFSYIIRSQNIFYSTKVTYNYFFNDNSLTANF + TNKDFDLEKIWDLVTEEAEDFGNEDYILYSKINRYRIDFNLLCRIALSEDKTDIETYV + KKIEELLGKVKRNKKILLEYLPFSRKVILRLFLVNYKLGRNVLRMFKNIM" + gene 11074..12141 + /gene="wcrH" + CDS 11074..12141 + /gene="wcrH" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK09814" + /inference="similar to AA sequence:RefSeq:YP_005203542.1" + /note="beta-1,6-galactofuranosyltransferase" + /codon_start=1 + /transl_table=11 + /product="galactofuranose transferase" + /protein_id="QCO91997.1" + /translation="MGMYYFIKVEKDLKNTAGIKAPDDIERISKELGMQELLFPKFPF + EKNKVFQKLWLFSVIGYKWTSLLWKLKTNDVVIYQHPMYGVRVSNCLIPLLKKCKNIK + FIAVIHDLESLRKGIQGVIEDNETTNTIADTELLSKFDKIISHNSKMTNYLEGIGIKK + ENLVDLEIFDYLDPSEMKEKTEDGVVIAGNLAKGKSSYIYKLIEKKPGFKLNLFGPNF + NIEELPENVKYYGSLTPNELPQKLVGKFGLVWDGDSLDTCGGNTGNYLKFNNPHKTSL + YLASGIPVIIWKEAALAEFIENNNVGFTVNSLSEIEIVLKNISANDYSLMKANTMEVG + KKLREGYFYRQSIYKCKNDLK" + gene 12314..13729 + /gene="wzx" + CDS 12314..13729 + /gene="wzx" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF01943.11" + /inference="protein 
motif:TIGRFAMs:TIGR01695" + /inference="similar to AA sequence:RefSeq:YP_004326640.1" + /inference="similar to AA sequence:UniProtKB:P37746" + /note="polysaccharide biosynthesis protein" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="QCO91998.1" + /translation="MKVLKNYAYNLSYQLLIIILPIITTPYVTRVFSSNDLGTYGYFN + SIVTYFILLATLGVANYGTKVISGHRKEIEKNFWGIYSLQLGATVFSLTLYCLLCLTL + PFMQNPVAYILGLALVSKGLDISWLFQGLENFRKITVRNITVKFVGVISIFLFVKSAD + DLYLYVFLLTIFELLGQLSMWVPAREFIGRPHFDLEYARHHLKPVLLLFLPQVAISLY + VTLDRTMLGALASTKDVGIYDQALKLVNILLTLVTSLGSVMLPRVSNLLSSGDHKAVN + KMHEISFLIYNLVIFPIMAGMLIVNDDFVTFFLGQDFQEARYAIAIMIFRMFFIGWTN + IMGIQILIPHNQNKEFMLSTTIPAIVSVGLNLLLLPKFGYIGAAIVSVLTEALVWAIQ + LYYTRTYLKDVPIIRTMIKIILASAIMYSVLLVSKTYIHFSPTINVLVFVVLGGIIYL + FSVLSLKVVDVIELKQVIRKN" + gene 14053..14724 + /gene="wefK" + CDS 14053..14724 + /gene="wefK" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3274" + /inference="protein motif:Pfam:PF01757.16" + /inference="similar to AA sequence:RefSeq:YP_004326639.1" + /note="inner membrane protein YiaH; acyltransferase family + protein" + /codon_start=1 + /transl_table=11 + /product="O-acetyltransferase WefK" + /protein_id="QCO91999.1" + /translation="MQKGYFFQFWFFGALILIYICLPVLKQFLNSKRSYLYFLSVLLV + IGLIFELTNIVLQMPIQAYVIQTFRLWTWLFYYILGGFISQFDKNTVKNGFKRWMKVI + AVLLLLVSPFILFFIAKTTYHNFFAEYFYDILLVKVVSVGIFLTIFSLVLNENSNKWI + IFLSNQTMGIFIIHTYIMKVWEKLFGFSFMGSYLLFAIFTLSVSFIIVGMLMKIPYFN + RIVKL" + gene 14737..15840 + /gene="glf" + CDS 14737..15840 + /gene="glf" + /EC_number="5.4.99.9" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG1232" + /inference="protein motif:CLUSTERS:PRK07208" + /inference="protein motif:Pfam:PF03275.7" + /inference="protein motif:TIGRFAMs:TIGR00031" + /inference="similar to AA sequence:RefSeq:YP_001200164.1" + /inference="similar to AA sequence:UniProtKB:P37747" + /note="protoporphyrinogen oxidase" + /codon_start=1 + /transl_table=11 + 
/product="UDP-galactopyranose mutase" + /protein_id="QCO92000.1" + /translation="MYDYLVVGAGLFGAVFAHEAALKGKKVKVIEKRNHIAGNIYTRE + EEGIQVHQYGAHIFHTSDKEIWDYVNQFAEFNRYTNSPVANYKGEIYNLPFNMNTFNK + LWGVVTPAEAQAKIDEQRAILNGKTPENLEEQAISLVGTDIYEKLIKDYTEKQWGKPT + TELPSFIIRRLPVRLTYDNNYFNDTYQGIPIGGYTQIVEKMLDHENIDVETNVDFFVN + KEQYLKDFPKIVFTGMIDEFFDYKLGELEYRSLRFENETLDMENYQGNAVVNYTDAET + PYTRIIEHKHFEFGSQAKTIITKEHSKTWEKGDEPYYPVNNDRNNHLYKSYKKLADEQ + GNVIFGGRLGHYRYYDMHQVIGAALQCVRNELN" + gene complement(16521..16805) + /gene="tnpC" + CDS complement(16521..16805) + /gene="tnpC" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG2826" + /inference="similar to AA sequence:RefSeq:YP_003446957.1" + /note="IS30 family protein" + /codon_start=1 + /transl_table=11 + /product="ISSmi3 transposase" + /protein_id="QCO92001.1" + /translation="MTKHKHLTLSERNDIQLGLERGETFKAIGQSILKDTTTVSKEVK + RNKQVRESTCDNLPCPLLDKAPFVCNGCPKRRQNCGYKKTFYLRELPLTT" + gene 17009..18991 + /gene="aliA" + CDS 17009..18991 + /gene="aliA" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG4166" + /inference="protein motif:CLUSTERS:PRK15104" + /inference="protein motif:Pfam:PF00496.16" + /inference="protein motif:TIGRFAMs:TIGR02294" + /inference="similar to AA sequence:RefSeq:YP_001835080.1" + /inference="similar to AA sequence:UniProtKB:P31306" + /note="76 kDa cell surface lipoprotein; oligopeptide ABC + transporter substrate-binding protein OppA; ABC-type + oligopeptide transport system, periplasmic component; + nickel ABC transporter, nickel/metallophore periplasmic + binding protein; Bacterial extracellular solute-binding + proteins, family 5 Middle" + /codon_start=1 + /transl_table=11 + /product="oligopeptide ABC transporter + oligopeptide-binding protein AliA" + /protein_id="QCO92002.1" + /translation="MKSSKLFALVGVTLLAATTLAACSGSGSSTKGEKTFSYIYETDP + DNLNYLTTGKTATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKDA + 
KWYTSEGEEYAAVKAQDFVTGLKYAADKKSDALYLVQESIKGLDAYVKGEIKDFSQVG + IKALDDQTVQYTLNKPESFWNSKTTMGVLAPVNEEFLNSKGDDFAKATDPSSLLYNGP + YLLKSIVTKSSVEFAKNPNYWDKDNVHVDKVKLSFWDGQDTSKPAENFKDGSLTAARL + YPTSASFAELEKSMKDNIVYTQQDSITYLVGTNIDRQSYKYTSKTSDEQKASTKKALL + NKDFRQAIAFGFDRTAYASQLNGQTGASKILRNIFVPPTFVQADGKNFGDMVKEKLVT + YGDEWKDVNLADSQDGLYNPEKAKAEFAKAKSALQAEGVTFPIHLDMPVDQTATTKVQ + RVQSMKQSLEATLGADNVVIDIQQLQKDEVNNITYFAENAAGEDWDLSDNVGWGPDFA + DPSTYLDIIKPSVGESTKTYLGFDSGEDNVAAKKVGLYDYEKLVTEAGDEATDVAKRY + DKYAAAQAWLTDSALIIPTTSRTGRPILSKMVPFTIPFALSGNKGTSEPVLYKYLELQ + DKAVTVDEYQKAQEKWMKEKEESNKKAQEDLAKHVK" +ORIGIN + 1 atgcaagaaa aatggtggca taatgccgta gtctatcaag tctatccaaa gagttttatg + 61 gatagtaatg gagatggaat tggcgatttg ccaggaatta ccagtaagtt ggactatcta + 121 gccaagctag gaatcacagc aatttggctt tctcccgttt atgacagccc tatggatgat + 181 aatggctatg atattgctga ttatcaagcg attgcggcta tttttggaac catggaggac + 241 atggatgaac tgattgcaga agctaagaag cgtgatatcc gtatcatcat ggacttggtg + 301 gtcaatcata cctcggatga gcatgcctgg tttgtagagg cctgtgaaaa tcctaatagc + 361 cctgagcgag actactatat ctggcgggat gagcctaacg atttagattc tatttttagt + 421 ggatctgctt gggaatacga tgaaaaatct ggtcaatact atctccactt tttcagcaag + 481 aaacagccgg atctcaactg ggaaaatgaa aaacttcgcc agaaaattta tgagatgatg + 541 aacttctgga ttgataaagg tattggtggt ttccgtatgg atgttattga catgattggc + 601 aaaattcctg acgagaaggt agtcaataat ggtcctatgc tccatcccta tctcaaggaa + 661 atgaatcagg cgacctttgg agctaaggat ctcttgacag taggggagac ttggggagca + 721 acgccagaga ttgccaagct ttactctgat ccaaaggggc aagaattgtc tatggtcttc + 781 cagtttgaac atatcggtct tcagtatcag gaaggtcagc ctaaatggca ctatcaaaaa + 841 gagctgaata tcgctaagtt aaaagaaatc ttcaacaaat ggcagacaga gttaggagtt + 901 gaggacggct ggaattccct cttctggaac aaccatgacc tccctcgtat tgtctcaatc + 961 tggggaaatg accaagaata ccgcgaaaaa tctgccaaag cctttgcaat cttacttcat + 1021 ctcatgagag gaactcctta tatctaccaa ggtgaggaga ttgggatgac caactatccg + 1081 tttgaaacac tggatcaagt agaagatatt gaatctctca actatgcgcg tgaggctctt + 1141 gaaaaaggtg ttccgattga 
agaaatcatg gacagtatcc gtgttattgg acgtgacaat + 1201 gcccgtaccc ctatgcaatg ggacgagagc aaaaacgctg gtttctcaac aggtcaacct + 1261 tggttggcgg ttaatccaaa ttacgagatg attagtgtcc aagaagcgct ggcaaatcca + 1321 gattctattt tctataccta tcagaaactg gtccaaattc gcaaggagaa tagctggcta + 1381 gttcgagctg actttgaatt gcttgatacg gctgataagg tctttgctta tatacgtaag + 1441 gatggcgacc gtcgcttcct agttgtggct aacttgtcca atgaagagca agacttgaca + 1501 gtagaaggaa aagtcaaatc tgtcttgatt gaaaacactg cggctaaaga agtacttgaa + 1561 aaacaggtct tggctccatg ggatgctttc tgtgtggaat tactataaat attttttgca + 1621 gaaaaattta aaattgaaat catataaaaa caagggagga ctgtataaaa gacagaaatc + 1681 ctttgttttt ttataaccaa ggtttataaa ctttcattct cgaaattcaa ttaactttac + 1741 aaattcccac tattaaggag aaagaagata aacataaaga agcgtgtcct tagtgcaggt + 1801 ctgacttttg catctgcttt gcttttagct gcttgcggcc aatcaggttc agatacaaaa + 1861 acttactcat caacctttag tggaaatcca actacattta actatctatt agactattac + 1921 gctgataata cagtcaattg aaacaagaac aagacaaaag agcctcgtaa aaagtattgc + 1981 aacttggtaa tacctttttg aggtgctttt tgatatgagc ccatgttttc tcaataggat + 2041 tgtactcagg tgagtaggga ggaagaaggt aaaagtttat gcccaaactc ttcgcataaa + 2101 agttctagct tccccagtct atggaatctt acattatcca taataataac cgatagtgtg + 2161 gttaatgttg gtaagagaaa tttctgaaac caagcttcaa aaaagtcgct cgtcatcgtc + 2221 tcttcgtaag tcattggagc aattaactca ccatttgtta gacctgcaac caaagaaatc + 2281 ctctgatatc ttcttccaga tactttgcct cttattaact gaccttttaa tgagcgacca + 2341 tattctcgat aaaaataagt atcgaatctt gtttcgtcaa tctaaacagg tgctaggtgc + 2401 tttaaactat taaaattctt aagaaataag gctacttttt ctgggtcttg ttcataatta + 2461 gattgaaact agaatagtac acctctgctt ctaaaacgtt gttagaaatc gatttgactg + 2521 tcctgatcgt tttatcatgt tcttatttca ttttactata tttttggttc gcgggaagtc + 2581 tactaagata cttaaagatg cagatagtga aaataaaggt gtagacatta ccgtaaaaaa + 2641 gtgatataat cgtatgatgt tcaatgtata ggtgttaatc atgagtagac gttttaaaaa + 2701 atcacgttca cagaaagtga agcgaagtgt taatatagtt ttgttgacta tttatttatt + 2761 gttagtttgt tttttattgt tcttaatctt taagtacaat 
atccttgctt ttagatatct + 2821 taatctagtg gtaactgcgt tagtcctact agttgccttg gtagggctac tcttgattat + 2881 ctataaaaga gctgaaaaat ttactatttt tctgttggtg ttctctatcc ttgtcagctc + 2941 tgtgtcgctc tttgcagtac agcagtttgt tggactgacc aatcgtttaa atgcgacttc + 3001 taattactca gaatattcgg tcagtgtcgc tgttttagca gatagtgaga tcgaaaatgt + 3061 tacgcaactg acgagtgtga cagcaccgac tgggactgat aatgaaaata ttcaaaaact + 3121 actagctgat atcaagtcaa gtcagaatac cgatttgacg gtcaaccaga gttcgtctta + 3181 cttggcagct tacaagagtt tgattgcagg ggagactaag gccattgtcc taaatagtgt + 3241 ctttgaaaat atcatcgagt cagagtatcc agactacgca tcgaagataa aaaagattta + 3301 taccaaggga ttcactaaaa aagtagaagc tcctaagacg tctaagaatc agtctttcaa + 3361 tatctatgtt agtggaattg acacctatgg tcctattagt tcggtgtcgc gatcagatgt + 3421 caatatcctg atgactgtca atcgagatac caagaaaatc ctcttgacca caacgccgcg + 3481 tgatgcctat gtaccaatcg cagatggtgg aaataatcaa aaagataaat taactcatgc + 3541 gggcatttat ggagttgatt cgtccattca caccttagaa aatctctatg gagtggatat + 3601 caattactat gtgcgattga acttcacttc tttcttaaaa atgattgact tattgggagg + 3661 ggtagatgtt cataatgatc aagagttttc agctctacat gggaagttcc atttcccagt + 3721 agggaatgtc catcttgatt cagaacaggc tctcggtttt gttcgtgagc gctactccct + 3781 agcagatggc gatcgtgacc gcgggcgcaa tcaacaaaag gtgattgtgg ctatccttca + 3841 aaaattaatg tcaaccaaag cactgaaaaa ttatagtacg atcattaata gcttgcaaga + 3901 ttctatccaa acaaatatgc cacttgagac tatgataaat ttggtcaatg ctcagttaga + 3961 aagtggaggg aattataaag taaattctca agatttaaaa ggtacaggtc ggacggatct + 4021 tccttcttat gcaatgccag acagtaacct ctatgtgatg gaaatagatg atagtagttt + 4081 agctgtagtt aaagcagcta tacaggatgt gatggagggt agatgaaatg atagacatcc + 4141 attcgcatat cgtttttgat gtagatgacg gtcccaagtc aagagaggaa agcaaggctc + 4201 tcttggcaga atcctacagg cagggggtgc gaaccattgt ctctacctct caccgtcgca + 4261 agggcatgtt tgaaactccg gaagagaaga tagcagaaaa ctttcttcag gttcgggaaa + 4321 tagctaagga agtggcgagt gacttggcca ttgcttacgg ggctgaaatt tactacacac + 4381 cagatgttct ggataagctg gaaaaaaagc ggattccgac cctcaatgat agtcgttatg + 4441 
ccttgataga gtttagtatg aacactcctt atcgcgatat tcatagcgcc ttgagcaaga + 4501 tcttgatgtt gggaattact ccagtcattg cccacattga gcgctatgat gctcttgaaa + 4561 ataatgaaaa acgcgttcga gaactgatcg atatgggctg ttacacgcaa gtaaatagtt + 4621 cacatgtcct caaatccaaa ctttttggcg aacgttataa attcatgaaa aaaagagctc + 4681 agtatttttt agagcaggat ttggtccatg tcattgcaag tgatatgcac aatctagacg + 4741 gcagacctcc tcatatggca gaagcatatg accttgttac ccaaaaatac ggagaagcga + 4801 aggctcagga actttttata gacaatcctc gaaaaattgt aatggatcaa ctaatttagg + 4861 agaaatgatg aaagaacaaa acacgataga aatcgatgta tttcaattat ttaaaacctt + 4921 gtggaaacgc aagctaatga ttttattagt ggcacttgtg acaggtgcgg gggcttttgt + 4981 atatagcgct tttattgtta agccagaata tacgagtacc acgcgaattt acgtagtgaa + 5041 tcgcgatcaa ggagacaagt cggggctgac aaatcaggat ttgcaggcag gaacttatct + 5101 ggtaaaagac taccgtgaga ttatcctttc gcagaatgta ttggaaaaag tagcgacaaa + 5161 tttgaagttg gatataccag ccaaaacgtt agctagaaaa gttcaagtga ctgtaccagt + 5221 tgacactcgt atcgtctcaa tctctgtcaa ggataaacag ccagaggaag ccagtcgtat + 5281 cgctaattct ctacgagaag ttgctgcaga aaagatcatc gctgtaacgc gagtatctga + 5341 tgtaacgaca cttgaagaag cgcgaccagc tacgactccc tcttctccaa atgttcgacg + 5401 caattccttg tttggttttc ttggaggagc agtcgtaaca gtaattgctg ttcttttgat + 5461 tgagttgttc gacatccgtg tgaaacgtcc tgaagatgtc gaagatgtac tgcaaattcc + 5521 acttttaggg gtcgttccag atttgaacaa aatgaaatag gaggaagtta tgccaacatt + 5581 agaaatctca caggcaaaat tggattttgt aaaaaaggca gaggaaaatt ataacgcttt + 5641 gtgcacgaac ctacagttaa gtggagatga tttgaaagta ttttctatca cttctgtgaa + 5701 acaaggagaa ggaaaatcaa cgacttccac caatatcgct tgggcttttg cgcgtgcagg + 5761 ttacaaaacg ctgctgattg atggagatat tcgcaattct gttatgttag gtgtctttaa + 5821 agcaagagat aagattacag gcctgacaga atttttatca ggaactacag acctatcaca + 5881 agggctttgt gataccaata tcgaaaatct ctttgtaatt caggctggct ctgtgtcacc + 5941 gaatccgaca gctcttcttc aaagtaagaa tttcagtaca atgcttgaaa ccttgcgtaa + 6001 atattttgac tacatcattg tagatactgc tcctgtcggt gtcgtgattg atgcggctat + 6061 tattacgcaa aaatgcgatg 
cttctatttt agtgacgaag gcaggtgaaa taaatcgacg + 6121 ggatattcaa aaagcaaaag aacagttgga acacacagga gtaccttttt taggagttgt + 6181 tctaaataaa ttcaacacag aagttgaaaa atatggagct tatggtgtct atggaaatta + 6241 taagaaggga taattgataa aaagtgtatt ttgtttttaa aaatatttta gatagatttt + 6301 tggcattttt cctatttatc acactgataa tcataccgat tattccgata acaatcctgc + 6361 ttatttggat agaagatcca ggggatatat ttttctttca agatagaatt ggtttaaatg + 6421 ggaagagctt taaagtaata aagtttcgga gtatgtataa agatgccgat caaagaataa + 6481 agggaagtat tattagtggt gaaattgatc gtctaaattt taaagaacat tctcaaagta + 6541 tgactacaaa agtcggtaaa gtgatacgaa aactttcaat tgatgaattg cctcaattag + 6601 tgaatattat aaaaggtgat atggctatag tgggacctcg tccattacaa caatttgaaa + 6661 taaatcatca tattcttact cataaagaaa tggggactac tttaaagatg tctaaaagat + 6721 tgtctgtgaa acctggtttg ctttgttatt ggcaagttac gccgaataaa aatgacatgc + 6781 cttttagtga tagaatgaat ctagatttat tatacattga taatgtatct ttcaagactg + 6841 atttcttgct tattttgaag ggattttata cagttttaat gggtaataac aattaacatg + 6901 aaaaatataa aaatattagt agcaacacat aaaaaatata aaatacccag tgatacgagt + 6961 ttgtatctac caattcatgt aggatgtgaa ggaaagaaaa aaattggatt tcaaggtgac + 7021 aattcaggag aaaatatttc taatttaaat ccttattatt gtgaattgac tggcttgttt + 7081 tgggcttgga aaaacttaga ttatgattat cttggattag tacactatcg tagatatttt + 7141 acttcaagac gtcaatctta tcgtgaagat ctcaacatgg atagtatcat tttatctaaa + 7201 tcagaggttg aaaaaatgat gctggactat gatgttgttg ttccacgtaa aagaaaatat + 7261 tatattgaaa ctctctattc tcactatgca catactcatg atcgaagtca tttagatgtt + 7321 actcgccaaa tcattagtga gttaaatccg gattatattg atacgtttga taaagtgatg + 7381 aatcgtcgta gcggctatat gtttaacatg tttatcatgt caaaagataa tgtgaatgca + 7441 tattgtgagt ggttattccc aattattaat gagttatata aacggttgga tattacaggc + 7501 tattcggctt ttgatgcgag attgtttgga cgtgtcagtg aacgcttgtt taatgtttgg + 7561 ttagctaagc aaaatttgcg cataaaagag acacctttta tttatatgga ggaaatcaac + 7621 ttacttgaaa aagggaaatc cttccttcaa gcaaaattct ttggtaaaaa gtacggacag + 7681 agtttttagt taggaataaa aatagtgatg aaaatagtaa 
tacaaagaag gtctttgcca + 7741 gaaattttag ctcttagtgc actaactata tttttagtta tgtcaatttt tgatgtgact + 7801 ttttatattc agtatctgcc gaaaattgtt cataggatac tgatagctat tttgcttatt + 7861 ctgcttgtta taaaagagtc gtacaaaaga aagcttgatt atagaactat cataagtcta + 7921 ttttctactg ttttaattta tctccttata gggaagatga gtacttttag ttctaatatt + 7981 gcaataggtt tcatttttat ttatgtttta cgcgatatcc cttttaaaag tgtggcaaaa + 8041 atttctttag cggtaagtgt gttcatgtta ctctttgtta tagctagcgc aaagttggga + 8101 gttattataa attatttaga gatttctggg acccgagtcc gtaactatct aggtttcaga + 8161 tatgccttgt atccatcaat cctacttatg aatgtcattg ctattacact ttatttaaag + 8221 caaaacaata taaggtattg gcagtggtta ttactaacct tgtctgttta ctgggtatat + 8281 ggacaaactg attctcgctt aacattttac aattcttgta tattattagc cttcaatata + 8341 ctaataaagt ggttccctga tattttgtct aagttaggaa atgtgtttaa aatttttaga + 8401 ctaaccttta ttataaatgc aataattagc ttttggattt caataaatta tcttggatca + 8461 aacaattctt ttgtaaacag tttcttattc aagttaaatt acacgttagg tgatcgactt + 8521 ttcttagcta ataaatctct agaattattc ggttttggtt tgtttggaaa acaggttgac + 8581 tggaatggaa atggtctgac cattgaagga gtcaggaatt atcagaccta tctgtatgtc + 8641 gataatttgt atattcaaat tctacaaaaa tttggtttac tcgttctagt tttaatgtta + 8701 gcgttgttaa cgttaacact gtttaaagct ataaagaaag atcagtgggt cattgctttt + 8761 attttaatcg taatgagttt tcaatccatg atagacgatc taaacatgta ccttcattac + 8821 aatatctttt gggttttgat aggaagttta atatacactc agtatcacta ttctaatgag + 8881 ggtacttaaa agttttagaa taagtagttt gataaataaa gaggaaagtt ttaacaagaa + 8941 ttgaaatgaa taaaagagat aggaattact atgttggatt agtaatgaag attgttacta + 9001 aacctttaaa aatgttgaag gtaagggaag aacgcatttt atttaaaagc tatgatgcag + 9061 aaaatatatc gtgtaatcca aaatacattt ataatgaatt aaaaaaaaat aatcgttatg + 9121 aattgatttg ggttttgaaa aaccccgaaa aaacccctga ggtaaaagct ataaagtata + 9181 tgtcattgaa atggttgtat tatatagcaa catctaagta tgtaataaca aatacaggtt + 9241 ttaatttttg gttacctaaa aagaaagaac agatatatct gaacacatgg cacgggggtg + 9301 gagcgtataa agatagtgac aatctaagta atataagtaa agcgcaaata acccaaactc + 9361 
aaaaaagtgc tgaattggaa gattatttta tttcgagttg tgccgttttt acaaaggagt + 9421 acgcagagaa aagactagga ttcaaaggaa aaattttaga ggtgggtacg ccgagaaatg + 9481 attatctaat tcataaccat gataatgctt ttttaaaaaa tagtattaga agaagattaa + 9541 atattgcaga tgatcatttc atagtaatct atgctccaac atggcgtgat gacgcttcga + 9601 ctatagagga tttagattat gatagtttgc tagagtgttt aagagaaaaa tattcagaag + 9661 tgactatttt agtccgaggg catcaccttc aaaagaactt ggtatgtatt aagaattcaa + 9721 atattattaa tgtatcagat tatgatgata tgcaagaatt attacttata tcagatttgt + 9781 tagtaactga ttactcatca tcaatttggg atatgattca tggaggtaag aaagttttgt + 9841 tatatactcc agatttagat gaatacttaa aatatcgtga atttcatgta gatataaaag + 9901 aatggagtat tccatatttt aagactaatg aggagttgat tcattttata ttttcaaatg + 9961 gatttactaa catggacgaa gtaatgaaga atcatatgaa tagatttggt agttttgaac + 10021 atgggaacgc tacccaaaaa atagtagaat taatagaaaa gggaaataaa tgaaggttag + 10081 tgtaataata cctatctata atgtagaaaa gtatttaaga aggtgtctag aatccattgt + 10141 taatcagaca tataaggaca ttgaaataat tttagtaaat gatggttctc cagataattc + 10201 aaaagaaata tgtgaagaat atgtagttaa atattccaat attcaattaa taaatcaaaa + 10261 taatgcaggt ttaggtgcgg ctagaaataa aggtttgcag tatgtaacag gtaatgcgat + 10321 tactttcgta gattccgatg attggcttga attagacgca attgaatatt acgtggaatc + 10381 tatgaaaaag agtgatgcag atattgtagt tactaaaatg attaggaaaa aagagtatac + 10441 tcctagtgaa gaaattaaga agtcgccggt aacagaggaa gttctaactc agaaacagtt + 10501 tgcgaaaaaa tattttaaaa tagatggaaa taatatagaa tattatgctt gtgccaaact + 10561 ttataagaaa gaaattgctt gtgaggttaa atatccagtt ggtttatttg ctgaagatgt + 10621 acccgcagct ttcagctata ttatacgttc gcaaaatata ttctatagca caaaagtaac + 10681 ttataattat ttttttaacg ataatagttt aacagcgaat tttacaaata aagattttga + 10741 tttagagaag atttgggatt tagtaactga agaagctgag gattttggaa acgaggatta + 10801 tattttatat tctaagataa ataggtatag aatagacttt aatcttttgt gtaggatagc + 10861 actatcagaa gataaaacag atattgaaac atatgttaaa aaaatagagg aactacttgg + 10921 taaagttaaa agaaataaga aaatcttatt agagtattta ccgttttcta gaaaagtgat + 10981 attgagatta 
tttttggtta attacaaact aggaagaaat gttttgagaa tgtttaaaaa + 11041 tattatgtag ttaatgaatg gtaatatgag gggatgggaa tgtattattt tataaaagta + 11101 gaaaaagatt taaaaaatac tgccggaata aaagctccgg atgatataga gagaatttca + 11161 aaagaattag gaatgcaaga attactattc cctaaatttc catttgaaaa aaataaagta + 11221 tttcaaaaac tctggctttt tagtgtcata ggctacaagt ggacgagcct tttatggaaa + 11281 cttaaaacca atgatgtagt tatatatcaa catccaatgt acggagtgag agtgtccaat + 11341 tgtttgattc cattgttaaa aaaatgcaaa aacattaaat ttatagcagt aatacatgat + 11401 ttggaatcac taagaaaagg tattcaagga gttatcgaag ataatgaaac aacaaatact + 11461 attgcagata cagagttgct atcgaaattc gataaaataa tctctcataa ttcaaaaatg + 11521 acaaattatt tggaagggat tggaataaaa aaagaaaact tagttgattt agaaatattt + 11581 gattatctag acccatcgga aatgaaagaa aaaactgaag atggagtagt tatagctggc + 11641 aatctagcta aaggtaagag ctcctatatt tacaagctaa ttgaaaaaaa accaggattt + 11701 aaattgaacc tttttggtcc gaattttaat attgaagaac tgccagagaa tgttaaatac + 11761 tatggtagtt taacaccaaa tgaattgcct caaaaactag taggtaagtt tggattggtt + 11821 tgggatggtg atagtttaga tacctgtggc ggaaacactg gtaattatct gaaatttaat + 11881 aatcctcaca aaacatccct atatcttgct tctggaatac cagtgattat atggaaagaa + 11941 gctgccttag cggaatttat tgaaaataat aatgttggat ttactgtaaa tagtttatca + 12001 gaaatagaaa ttgtgttaaa aaatatatca gcaaatgatt attctttgat gaaagcaaat + 12061 acaatggaag tgggaaagaa attaagagag ggttattttt atcgtcaatc tatatataaa + 12121 tgcaaaaatg atttgaaata gtagtagaat tactaatcga aagcccataa gctcctagta + 12181 actaatgtat actactgtcc aaaaatatta tttacattaa ataaaaaatt gtgcgcaaat + 12241 agataatttg agtttttgca aacatagaac agagcactaa aaataataat ttatatagaa + 12301 actgtaaaca ctaatgaaag tattaaaaaa ctatgcctac aacctttctt atcagttgtt + 12361 gataattata ctccctatca ttacgacccc ctatgtgaca cgggtctttt cttcgaatga + 12421 tctagggaca tatggttatt ttaactccat cgttacttat tttatcctct tagcaacgct + 12481 aggggttgcc aactatggga ccaaggtcat ttcagggcat cgtaaagaaa ttgaaaaaaa + 12541 cttttgggga atctactctc tgcaattagg tgcaacagtt ttttctctaa ccttgtattg + 12601 tcttctttgt 
ctaactcttc cctttatgca aaatccagta gcctacattc taggattggc + 12661 tttggtttct aaaggattag atatatcctg gctttttcaa gggctagaga attttcgaaa + 12721 gattactgtt cgaaatatca cagtcaagtt cgttggtgta atctctatct tcctctttgt + 12781 caaatctgca gatgatctat atctctatgt ctttttgcta accatatttg aactcttggg + 12841 gcagctaagt atgtgggtgc ctgctcgtga gtttattggt agacctcatt ttgatttaga + 12901 atatgctaga catcatttga aaccagtcct attattgttc cttccgcaag tggcgatttc + 12961 cttgtatgtt acgctagatc gtactatgct tggagcgtta gcttctacaa aagatgtagg + 13021 gatttatgac caggctttaa agttggtaaa tatccttctg accttggtaa cttccttggg + 13081 aagtgtcatg ttgcctagag tttcaaatct tttatcctca ggggatcata aagcagttaa + 13141 caaaatgcat gagatatcat ttttaattta taatttggtt attttcccca ttatggcagg + 13201 aatgctcatt gtaaatgatg actttgttac ctttttcctc gggcaagatt ttcaagaggc + 13261 acgttatgcg atagcaatta tgatttttag aatgttcttt attggttgga ccaatattat + 13321 ggggattcaa attttgatac ctcataatca aaataaagaa tttatgctgt caacaacaat + 13381 tcctgccatt gttagtgttg gattaaatct tctcttgctt cccaagtttg gatatatagg + 13441 agcagcaatt gtttctgtct taacagaggc gctagtatgg gctattcaat tgtactatac + 13501 tcgtacatac ctaaaagatg ttccgattat tagaactatg ataaagatta ttctagcctc + 13561 agctatcatg tatagcgttt tgctagtttc taagacatac atacattttt ccccaactat + 13621 aaatgttttg gtatttgtgg tgttaggtgg aatcatttat cttttttcag ttttatctct + 13681 aaaagtggta gatgtgatag aattaaaaca agtaattagg aaaaattaga atgcataaat + 13741 ttaaagatat taacttggat ttactaaaag taattgcatg tgttggagtt gttttactcc + 13801 atacagagat ggggggattt aaagagacag cttcatggaa tttttcgaca tatttatact + 13861 acttaggaac atattctatc cctctatttt ttatagttaa tggttattta ttgttaggaa + 13921 agaaagagat tacctattcc tacatattac agaaagtaaa atggattcta ataacagtgc + 13981 tgtcatggac ccttatagtt tggctattta aacgggattt ttcagttaat ccaataaaaa + 14041 aacttatagg atgtgcaaaa aggttatttc tttcagtttt ggttttttgg tgcgctcata + 14101 cttatttata tatgtctccc cgttttgaaa caatttctta attcaaaaag aagttattta + 14161 tactttttat ctgtattgct agttattggt ttgatttttg agttaacaaa tattgtactt + 14221 caaatgccaa 
tacaagcata tgtaatacaa acttttagat tatggacttg gcttttctat + 14281 tatattttag ggggctttat atctcagttt gataaaaata ccgtcaaaaa tgggtttaag + 14341 agatggatga aagtaattgc agtactttta ttattagttt cgccatttat attatttttc + 14401 atagcaaaga ccacttacca taattttttt gctgaatatt tttatgatat tttattagta + 14461 aaagttgtaa gcgtagggat ttttctaact attttctcac ttgtattgaa tgaaaatagc + 14521 aacaaatgga ttatttttct ttctaatcaa actatgggta tctttataat acacacttat + 14581 attatgaagg tatgggaaaa actatttggt tttagtttta tgggttcata tttacttttt + 14641 gctatattta ctttaagtgt tagttttatc attgttggaa tgttaatgaa aattccgtat + 14701 tttaatcgaa tcgtcaaatt ataaaaagga gaaaaaatgt acgattatct tgttgttggt + 14761 gctggtctct ttggtgcagt ctttgcccat gaagcagcct taaaaggaaa aaaagtaaaa + 14821 gtcattgaaa aacgaaatca tatcgcgggt aatatctata ctcgtgaaga ggaaggaatt + 14881 caagttcatc aatatggtgc tcatatcttc catacttctg ataaggagat ttgggattat + 14941 gtaaatcagt ttgcagagtt taaccgttac acaaattctc ctgttgcaaa ctataaggga + 15001 gagatttata acttaccttt taatatgaat accttcaata aactctgggg agttgtaacg + 15061 ccagcagaag cacaagctaa gattgatgaa caacgtgcta ttttaaatgg taaaactcct + 15121 gaaaatttgg aagaacaggc gatttctctt gtaggtacag acatctacga aaaattaatc + 15181 aaagactata cagagaaaca gtggggcaaa ccaactactg aacttccatc ctttattatt + 15241 cgccgtttgc cagtacgcct gacctatgat aacaactatt ttaacgatac ctatcaaggg + 15301 attccaattg gtggatacac tcaaatagtt gaaaaaatgt tggatcatga aaatattgat + 15361 gtagaaacaa atgttgattt ctttgtgaat aaagagcaat atctgaaaga ttttcctaag + 15421 attgtcttta ctggtatgat tgatgaattc tttgactata agttgggcga actagagtac + 15481 cgtagtcttc gttttgaaaa tgagacattg gatatggaaa attaccaagg aaatgcagtt + 15541 gtgaactata cggatgcaga aaccccatat actcgcatta ttgaacacaa acattttgag + 15601 tttgggagtc aagccaagac tatcattact aaagaacatt ctaaaacatg ggaaaaaggt + 15661 gatgagcctt attatccagt taataatgat cgtaataatc atttgtataa atcatataaa + 15721 aaacttgctg atgagcaagg gaatgttatc tttggtggcc gcttaggaca ctatcgttat + 15781 tacgatatgc accaagtaat tggagcagct ttgcagtgcg tgagaaatga gttaaattaa + 15841 tactcaatga 
aaatcaaaga gcaaactagg aagctagtcg caggttgctt aaaacactgt + 15901 tttgaggttg cagatggaag ctgacgcggt ttgaagagat tttcgaagag tataaacaag + 15961 taaaactgac taccagttat tatttagaaa tagtattaaa aattccttga ctatgtgata + 16021 tagttgaggg atttttaaat gatattcata ttttttgcaa agatgttgtt taaaaaaatt + 16081 ggtaaattcc caaactaagt tccatcgcta gtagaagtgg aagttagtct gaaaaaaatc + 16141 ctaaaaacca gtggaaatcc gtgtcagggt aagttccact ggttttaatc atgcttgatt + 16201 ttattgcttt tgtaaccaaa atgaatagaa aaaaagagcg tacaaaatcc cctcgtctga + 16261 aagcgtttca gattaagttc cgctatggtg gaagttagtg tgagacgttt gaatggggtt + 16321 gaagattagt ttttagaact tatgttggag taatttagac gactgataga cgtcttctgc + 16381 agatatttta gaaatgccca gaagcttagg aatctcttct ccataggtaa atgcaaagag + 16441 ttcataggct gactttccat ttaaagcaga gcgtttgacg ctgttgacat gcgaacaaac + 16501 gagattgata tcctcttgag ttaagttgtc aaaggaagtt cccttaggta gaaagtcttc + 16561 ttatagccac agttttgtct tcttttagga cagccattac agacaaaggg ggctttatcg + 16621 agtagagggc aagggaggtt atcacaggta gactctctga cttgtttgtt tcgtttgact + 16681 tctttggaaa cagtagtcgt gtcttttaga atggattgtc caatagcttt gaaggtttca + 16741 ccgcgctcta agcctaattg gatatcatta cgttctgaaa gggtaaggtg tttatgtttt + 16801 gtcatagtag acctcatttc taactcaaac gtctcatact taattccacc ataaaaatcc + 16861 gttttagact aatttcaact tcggttgggc aagtggaagt tactttgaga agttacggtt + 16921 taaaaaaatt ttcaaaaatt ctgaaaattc tgttgacaac tttctgaaaa gagtctataa + 16981 tggagagaaa gttttaaagg agaaaatgat gaaaagttca aaactatttg cccttgtggg + 17041 cgtgacatta ttggcggcga ctactttagc tgcatgctct ggatcaggtt caagcactaa + 17101 aggtgagaag acattctcat acatttatga gacagaccct gataacctca actatttgac + 17161 aactggtaag actgcgacag caaatattac cagtaacgtg gttgatggtt tgctagaaaa + 17221 tgatcgctac gggaactttg tgccgtctat ggctgaggat tggtctgtat ccaaggatgg + 17281 attgacttac acttatacta tccgtaagga tgcaaaatgg tatacttctg aaggtgaaga + 17341 atacgcggca gtcaaagctc aagactttgt aacaggacta aaatatgctg ctgataaaaa + 17401 atcagatgct ctttaccttg ttcaagaatc aatcaaagga ttggatgcct atgtaaaagg + 17461 ggaaatcaaa 
gatttctcac aagtaggaat taaggctctg gatgatcaga cagttcagta + 17521 cactttgaac aaacctgaaa gtttttggaa ctcaaaaaca accatgggtg tgcttgctcc + 17581 agttaatgaa gagtttttga attcaaaagg ggatgatttt gccaaagcga cggacccaag + 17641 tagtctcttg tataatggac cttatttgtt gaaatccatt gtgacaaaat cctctgttga + 17701 atttgcgaaa aatccgaact actgggataa ggacaatgtg catgttgaca aagttaaatt + 17761 gtcattctgg gatggtcaag ataccagcaa acctgcagaa aactttaaag atggtagcct + 17821 tacagcagct cgtctctatc caacaagtgc aagtttcgca gagcttgaga agagtatgaa + 17881 ggataatatt gtctatactc aacaagactc tattacgtat ctagttggta caaatattga + 17941 ccgtcagtcc tataaataca catctaaaac cagcgacgaa caaaaggcat cgactaaaaa + 18001 ggctctctta aacaaggatt tccgtcaggc tattgccttt ggttttgatc gtacagccta + 18061 tgcctctcag ttgaatggac aaactggagc aagcaaaatc ttacgtaata tctttgttcc + 18121 accaacattt gttcaagcag atggtaaaaa ctttggcgat atggtcaaag agaaattggt + 18181 tacttatggg gatgaatgga aggatgttaa tcttgcagat tctcaggatg gtctttacaa + 18241 tccagaaaaa gccaaggctg aatttgctaa agctaaatca gccttacaag cagaaggtgt + 18301 gacattccca attcatttgg atatgccagt tgaccaaaca gcaactacaa aagttcagcg + 18361 cgtccaatct atgaaacaat ccttggaagc aactttagga gcggataatg tagtcattga + 18421 tattcaacaa ctacaaaaag acgaagtaaa caatattaca tattttgctg aaaatgctgc + 18481 tggcgaagac tgggatttat cagataatgt cggttggggt ccagactttg ccgatccatc + 18541 aacctacctt gatatcatca aaccatctgt aggagaaagt actaaaacat atttagggtt + 18601 tgactcaggg gaagataacg tagctgctaa aaaagtaggt ctatatgact atgaaaaatt + 18661 ggttactgag gctggtgatg aggctacaga tgttgctaaa cgctatgata aatacgctgc + 18721 agcccaagct tggttgacag atagtgcttt gattattcca actacatctc gtacagggcg + 18781 tccaatcttg tctaagatgg taccatttac aataccattt gcattgtcag gaaataaagg + 18841 tacaagtgaa ccagtcttgt ataaatactt ggaacttcaa gacaaggcag tcactgtaga + 18901 tgaataccaa aaagctcagg aaaaatggat gaaagaaaaa gaagagtcta ataaaaaggc + 18961 tcaagaagat ctcgcaaaac atgtgaaata a +// + diff --git a/public/res/serotype_genbank/serotype_3.gb b/public/res/serotype_genbank/serotype_3.gb new file mode 100644 
index 0000000..ec72f2a --- /dev/null +++ b/public/res/serotype_genbank/serotype_3.gb @@ -0,0 +1,479 @@ +LOCUS CR931634 10337 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 524/62 (serotype 3). +ACCESSION CR931634 +VERSION CR931634.2 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 10337) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 10337) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT On Mar 17, 2006 this sequence version replaced CR931634.1. + NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..10337 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="524/62" + /db_xref="taxon:1313" + gene <1..162 + /gene="dexB" + /locus_tag="SPC03_0001" + CDS <1..162 + /gene="dexB" + /locus_tag="SPC03_0001" + /codon_start=1 + /transl_table=11 + /protein_id="CAI32738.2" + /db_xref="GOA:Q4K2R1" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K2R1" + /translation="DRRFLVVANLSNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVP + WDAFCVELL" + gene 321..494 + /gene="aliB" + /locus_tag="SPC03_0002" + /pseudo + CDS 321..494 + /gene="aliB" + /locus_tag="SPC03_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + /db_xref="PSEUDO:CAI32739.2" + gene complement(order(487..813,827..1336)) + /gene="tnp" + /locus_tag="SPC03_0003" + /pseudo + CDS complement(join(487..813,827..1336)) + /gene="tnp" + /locus_tag="SPC03_0003" + /note="member of homology group 4; + old_tribe:0004 68" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(965..1336) + /gene="tnp" + /locus_tag="SPC03_0003" + /note="HMMPfam hit to PF01710, Transposase, score 7.2e-19" + /pseudo + misc_feature order(1523..1765,1766..1850) + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 9.5e-52" + gene 1524..2748 + /gene="wzg" + /locus_tag="SPC03_0004" + /pseudo + CDS join(1524..1766,1765..2748) + /gene="wzg" + /locus_tag="SPC03_0004" + /note="member of homology group 0; + old_tribe:0000 80" + /pseudo + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg + (pseudogene)" + misc_feature 2025..2468 + /gene="wzg" + /locus_tag="SPC03_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 6.4e-68" + /pseudo + gene 2750..3480 + /gene="wzh" + /locus_tag="SPC03_0005" + /pseudo + CDS join(2750..3028,3028..3480) + /gene="wzh" + /locus_tag="SPC03_0005" + 
/EC_number="3.1.3.48" + /note="member of homology group 1; + old_tribe:0001 80" + /pseudo + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh (pseudogene)" + /db_xref="PSEUDO:CAI32742.2" + misc_feature order(2753..3028,3028..3360) + /gene="wzh" + /locus_tag="SPC03_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 3.5e-35" + /pseudo + gene 3489..4181 + /gene="wzd" + /locus_tag="SPC03_0006" + CDS 3489..4181 + /gene="wzd" + /locus_tag="SPC03_0006" + /note="member of homology group 2; + old_tribe:0002 80" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI32743.2" + /db_xref="GOA:Q4K355" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K355" + /translation="MKEQNTLEIDVLQLFRALWKRKLVILLVAIITSSVAFAYSTFVI + KPEFTSTTRIYVVNRNQGEKSGLTNQDLQAGSYLVKDYREIILSQDVLEEVISDLKLD + LTPKGLANKIKVTVPVDTRIVSVSVNDRVPEEASRIANSLREVAAQKIISITRVSDVA + TLEEARPAISPSSPNIKRNTLIGFLAGGIGTSVIVLLLELLDTHVKRPEDIEDTLQMT + LLGVVPNLGKLK" + misc_feature 3507..3923 + /gene="wzd" + /locus_tag="SPC03_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 3e-53" + gene 4191..4604 + /gene="wze" + /locus_tag="SPC03_0007" + /pseudo + CDS 4191..4604 + /gene="wze" + /locus_tag="SPC03_0007" + /EC_number="2.7.1.112" + /note="member of homology group 3; + old_tribe:0003 80" + /pseudo + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze (pseudogene)" + gene 5173..5673 + /gene="tnp" + /locus_tag="SPC03_0008" + /pseudo + CDS 5173..5673 + /gene="tnp" + /locus_tag="SPC03_0008" + /pseudo + /codon_start=1 + /transl_table=11 + /product="IS1548 transposase" + /db_xref="PSEUDO:CAI32745.2" + gene 5752..6936 + /gene="ugd" + /locus_tag="SPC03_0009" + CDS 5752..6936 + /gene="ugd" + /locus_tag="SPC03_0009" + /note="member of homology group 20; + old_tribe:0020 15" + /codon_start=1 + /transl_table=11 + /product="UDP-glucose 6-dehydrogenase Ugd" 
+ /protein_id="CAI32746.2" + /db_xref="GOA:Q4K352" + /db_xref="InterPro:IPR001732" + /db_xref="InterPro:IPR008927" + /db_xref="InterPro:IPR013328" + /db_xref="InterPro:IPR014026" + /db_xref="InterPro:IPR014027" + /db_xref="InterPro:IPR014028" + /db_xref="InterPro:IPR016040" + /db_xref="InterPro:IPR017476" + /db_xref="UniProtKB/TrEMBL:Q4K352" + /translation="MKIAIAGSGYVGLSLAVLLAQHHEVKVIDVIKDKVESINNRKSP + IKDEAIEKYLVENELNLEASLDPAHVYKDVEYAIIATPTNYDVDLNQFDTSSVEAAIK + TCMEYNDTCTIVIKSTIPEGYTKEVREKFNTDRIIFSPEFLRESKALYDNLYPSRIVV + GTDLDDSELTKRAWQFADLLKGGAIKEEVPILVVAFNEAEVAKLFSNTYLATRVAYFN + EIDTYSEVKGLNPKTIIDIVCYDPRIGSYYNNPSFGYGGYCLPKDTKQLKASFRDVPE + NLITAVVQSNKTRKDYIAGAILAKQPSVVGIYRLIMKSDSDNFRSSAVKGVMERLDNY + GKEIVIYEPTIECDTFMGYRVIKSLDEFKNISDIVVANRMNDDLRDIQEKLYTRDLFG + RE" + misc_feature 5752..6288 + /gene="ugd" + /locus_tag="SPC03_0009" + /note="HMMPfam hit to PF03721, UDP-glucose/GDP-mannose + dehydrogenase, score 1.1e-42" + misc_feature 5752..6198 + /gene="ugd" + /locus_tag="SPC03_0009" + /note="HMMPfam hit to PF01210, NAD-dependent + glycerol-3-phosphate deh, score 0.00044" + misc_feature 6337..6618 + /gene="ugd" + /locus_tag="SPC03_0009" + /note="HMMPfam hit to PF00984, UDP-glucose/GDP-mannose + dehydrogenase, score 3.8e-33" + misc_feature 6679..6915 + /gene="ugd" + /locus_tag="SPC03_0009" + /note="HMMPfam hit to PF03720, UDP-glucose/GDP-mannose + dehydrogenase, score 0.00028" + gene 6952..8205 + /gene="wchE" + /locus_tag="SPC03_0010" + CDS 6952..8205 + /gene="wchE" + /locus_tag="SPC03_0010" + /codon_start=1 + /transl_table=11 + /product="serotype 3 capsule synthase" + /protein_id="CAI32747.2" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K351" + /translation="MYTFILMLLDFFQNHDFHFFMLFFVFILIRWAVIYFHAVRYKSY + SCSVSDEKLFSSVIIPVVDEPLNLFESVLNRISRHKPSEIIVVINGPKNERLVKLCHD + FNEKLENNMTPIQCYYTPVPGKRNAIRVGLEHVDSQSDITVLVDSDTVWTPRTLSELL + KPFVCDKKIGGVTTRQKILDPERNLVTMFANLLEEIRAEGTMKAMSVTGKVGCLPGRT + IAFRTEILRECIHEFMNETFMGFHKEVSDDRSLTNLTLKKGYKTVMQDTSVVYTDAPT + 
SWKKFIRQQLRWAEGSQYNNLKMTPWMIRNAPLMFFIYFTDMILPMLLISFGVNIFLL + KILNITAIVYTASWWEIILYVLLGMIFSFGGRHFKAMSRMKWYYVFLIPVFIIVLSII + MCPIRLLGLMRCSDDLGWGTRNLTE" + misc_feature 7117..7641 + /gene="wchE" + /locus_tag="SPC03_0010" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 7.8e-17" + gene 8503..9423 + /gene="galU" + /locus_tag="SPC03_0011" + CDS 8503..9423 + /gene="galU" + /locus_tag="SPC03_0011" + /codon_start=1 + /transl_table=11 + /product="glucosephosphate uridylyltransferase" + /protein_id="CAI32748.2" + /db_xref="GOA:Q4K350" + /db_xref="InterPro:IPR005771" + /db_xref="InterPro:IPR005835" + /db_xref="UniProtKB/TrEMBL:Q4K350" + /translation="MKKVKKAVIPAAGLGTRFLPATKALAKEMLPIVDRPTIHFVIEE + ALRSGIEDILVVTEKSKRSIEDYFDSTFELEYSLRKQGKMELLKSVNESTDIKVHFVR + QSSPRGLGDAVLQAKSFVGDDPFVVMLGDDLMDITDSTAVPLTRQLMDDYNATQASTI + AVMPVRYEDVSSYGVISPRLESSNGLYSVDAFVEKPKPEEAPSNLAIIGRYLLTPEIF + SILETQKPGAGNEIQLTDAIDTLNKTQSVFAREFVGKRYDVGDKFNFMKTSIDYALQH + PQIKESLKNYVIALGKQLEKLDDCSSSGHL" + misc_feature 8518..9327 + /gene="galU" + /locus_tag="SPC03_0011" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 2.8e-21" + gene 9420..>10337 + /gene="pgm" + /locus_tag="SPC03_0012" + CDS 9420..>10337 + /gene="pgm" + /locus_tag="SPC03_0012" + /codon_start=1 + /transl_table=11 + /product="phosphoglucomutase" + /protein_id="CAI32749.2" + /db_xref="GOA:Q4K349" + /db_xref="InterPro:IPR005844" + /db_xref="InterPro:IPR005845" + /db_xref="InterPro:IPR016055" + /db_xref="UniProtKB/TrEMBL:Q4K349" + /translation="MNCIESYQKWLNVPDLPAYLKDELLSMDDKTKEDAFYTNLEFGT + AGMRGYIGAGTNRINIYVVRQATEGLAKLVESKGETAKKAGVAIAYDSRHFSPEFAFE + SAQVLAAHGIKSYVFESLRPTPELSFAVRHLGAFAGIMVTASYTPAPFNGYKVYGSDG + GQMLPADADALTDYIRAIDNPFAVALADLEEAKSTGLIEVIGETLDAAYLEEVKSVNI + NQDLIDQYGRDMKIVYTPLHGTGEMLARRALAQAGFESVQVVEAQAKPAPDFSTVASP + NPESQAAFALAEELGRQVDADVLVATTLAA" + misc_feature 9534..9965 + /gene="pgm" + /locus_tag="SPC03_0012" + /note="HMMPfam hit to PF02878, + Phosphoglucomutase/phosphomannomutase, alph, score + 
4.8e-50" +ORIGIN + 1 gaccgtcgct tcctagttgt ggctaacttg tccaatgaag agcaagactt gacagtagaa + 61 ggaaaagtca aatctgtctt gattgaaaac accctagctc aagaagtctt tgaaaaacaa + 121 atcttagttc catgggatgc tttctgtgtg gaattactat aaatattttt tgcagaaaaa + 181 tttaaaattg aaatcgtata aaaacaaggg aggactgtat aaaagacaga aatcctttgt + 241 tttttataac aaaagtttat aaaccttcat tcttgaaatt caattaactt tacaaattcc + 301 cactattaag gagaaagaag atgaacataa agaagcgtgt ccttggtgca ggtctgactt + 361 ttgcatctgc tttgctttta gctgcttgcg gccaatcagg ttcagataca aaaacttact + 421 catcaacctt tagtggaaat ccaactacat ttaactatct attagactat tacgctgata + 481 atatagtcaa ttgaaacaag agcaggacaa aagagcctcg taaaaggtat tgcaacttgg + 541 taataccttt ttgatgtgtt ttttgatatg agcccatgtt ttctcaatag gattgtactc + 601 aggtgagtag ggaggaagag gtaaaagttt atgcccaaac tcttcgcata aaagttctag + 661 cttccccatt ctatggaatc ttgcattatc cataataata accgatggtg tggttaatgt + 721 tggtaagaaa aacttctgaa accatacttc aaaaaagtcg ctcgtcatca tctcttcgta + 781 agtcattgga gcgattaact caccattcat ttgttagacc tgcaaccaaa gaaatcctct + 841 gatatcttct tccagatact ttgcctcttc ttaactgacc ttttaaagag cgaccatgtt + 901 ctcgataaaa ataagtatcg aatcctgttt catcaatcta aacaggtgct aggtgcttta + 961 aactattaaa attcttaaga aataaggcta cttttctggg tcttgttcat agtaggtgtg + 1021 gttctttttt tcgagtgtag cccatagctt tgagcgcata gtggatggta gttggatgac + 1081 agccaaattc agaagctatt tcagtcaaat aagtatctgg attgtcagta agatagtttt + 1141 taagtctatc tctatcaact tttcttggtt ttgttccttt tacttggtgg tttagctctc + 1201 ctgttttttc ttttagcttt aaccagccat aaatggtatt acgtgagatt tggaaaacgt + 1261 gtgatgcttc tgttatacta cctattcgct cacaataaga gagaactttt ttacgaaaat + 1321 ctattgaata tgccataaga agattatacc acattgtgta ctatattaga ttgaaactag + 1381 agtagtacac ctctgcttct aaaatattgt tagaaatcga tttgactgtc ctgatcgatt + 1441 tgtcctgttc ttatttcatt ttgctatatt tttggttcgc gggaagtcta ctaagatact + 1501 taaagataca gatagtgaaa ataaaggtgt agacattacc gttggtgttc tctatccttg + 1561 tcagctctgt gtcgctcttt gcagtacagc agtttgttgg actgaccaat cgtttaaatg + 1621 cgacttctaa ttactcagaa 
tattcgatca gtgtcgctgt tttagcagat agtgagatcg + 1681 aaaatgttac gcaactgacg agtgtgacag caccgactgg gactgataat gaaaatattc + 1741 aaaaattact agctgatatc aagtcagaat accgatttga cggtcgacca gagttcgtct + 1801 tacttggctg cttacaagag tctgattgca ggtgacacca agaccattgt cctaaatagt + 1861 gtctttgaaa atatcatcga gtcagagtat ccagactacg catcgaagat aaaaaatatt + 1921 tataccaagg gatttactaa aaaagtagaa gctcctaaga cgtctaagaa tcagtctttc + 1981 aatatctaag ttagtggaat tgacacctat ggtcctatta gttcggtgtc gcgatcagat + 2041 gttaatatcc tgatgactgt caatcgagat accaagaaaa tcctcttgac cacaacgccg + 2101 cgtgatgcct atgtaccaat tgcagatggt ggaaataatc aaaaagataa attgactcat + 2161 gcgggcattt atggagttga ttcgtccatt cacaccttag aaaatctcta tggagtggat + 2221 atcaattact atgtacgatt gaacttcact tcgtttttga aattgattga tttgttggat + 2281 ggaattgatg tttataatga tcaagaattt actgcccata cgaatggaaa gtattaccct + 2341 gaaggcaatg ttcatcttga ttcagaacag gctctcggtt ttgttcgtga gcgctactcc + 2401 ctagcagatg gcgatcgtga ccgcgggcgc aatcaacaaa aggtgattgt ggctatcctt + 2461 caaaaattaa cgtcaaccga agaactgaaa aattatagta cgatcattga tagcttgcaa + 2521 gattctatcc aaacaaatat gccgattgag actatgatag atttagtgaa tactcagttg + 2581 gaaagtggag ggaattataa agtaaattct caagatttaa aagggacagg tcggatggat + 2641 cttccttctt atgcaatgcc agacagtaac ctctatgtga tggaaataga tgatagtagt + 2701 ttagctgtag ttaaagcagc tatacaggat gtgatgaaag gtagatgaaa tgatagacat + 2761 ccattcgcat atcgtttttg atgtagatga cggtccaaag tcaatagagg atagcaaggc + 2821 acttttaaga gaagcttata atcaaggagt tcgaatgatt gtgtctactt cgcatcgtcg + 2881 aaaagggatg tttgaaactc cagaagaaaa aattgtaaca aattttatta aggttcgtga + 2941 aattgcaaaa gaagtagcag atgatttagt cattgcttat ggcgcagaga tatactatac + 3001 tctggatgct ctagaaaagc tagaaaaaaa gaaattccta cccttaatga tagtcgttat + 3061 gctttgattg agtttagcat gcatacttcc tatcgtgaga ttcatacgag attgagcaat + 3121 attttgatgt tgggaatcac gccagtaatt gctcatattg aacgttatga tgctttagag + 3181 aataacgaaa aacgtgttcg tgaactgatt gatatggggt gctatactca gatagatagt + 3241 tatcatgttt caaaacctaa gttctttggt gaaaaatata 
aattcatgaa aaagagagct + 3301 cggtattttt tggaacgtga tttagttcat gtagttgcaa gtgacatgca caatttagac + 3361 agtagacctc catatatgca acaggcatat gatatcattg ctaagaaata tagagcgaaa + 3421 aaagcgaaag aactttttgt agataatccc agaaaaatta taatggatca attaatttag + 3481 gagaaaatat gaaggaacaa aacactttgg aaatcgatgt attgcaacta ttcagagctt + 3541 tatggaaaag aaagttggtc attttattag tggcaattat aacttcttca gttgcttttg + 3601 cctacagtac ttttgttatc aaacctgagt ttactagtac gactcggatt tatgtagtta + 3661 accgtaatca gggagagaag tctggtttaa ccaatcaaga cttgcaggca ggatcatact + 3721 tggttaaaga ctatcgtgaa attatcctat cgcaggatgt tttggaggaa gttatttctg + 3781 atttgaaact agatttgacg ccaaaaggtt tggctaataa aattaaagta acagtaccag + 3841 ttgatacccg tattgtctct gtttcagtta atgatcgagt tcctgaagag gcaagccgta + 3901 tcgctaactc tttgagagaa gtagctgctc aaaaaattat cagtattact cgtgtttctg + 3961 atgtggcaac actggaggag gcaagaccgg cgatatcacc gtcttcgcca aatattaaac + 4021 gcaatacact aattggtttt ttggcagggg ggattggaac tagtgttata gttcttcttc + 4081 ttgaactttt ggacactcat gtgaaacgtc cggaagatat cgaagataca ctgcagatga + 4141 cacttttggg agttgtacca aacttgggta agttgaaata ggagagagga atgccgacat + 4201 tagaaatagc acaaaaaaaa ctggagttca ttaagaaggc agaagaatat tacaatgcct + 4261 tgtgtacaaa tatacagttg agcggagata aactaaaagt aatttccgtt acttctgtta + 4321 accctgggga aggaaaaaca actacttccg taaatatagc aaggtcgttt gcgcgtgcag + 4381 gctataaaac tcttttgatc gatggtgata ctcgaaattc agttatgtca ggatttttta + 4441 aatctcgtga aaaaattaca gagctaacag aatttttatc tgggacagct gatttatctc + 4501 acggtttatg tgatacaaat attgaaaatt tatttgtagt tcaatcggga tctgtatcac + 4561 caaaccctac agccttgtta caaagtaaaa attttgtggt tatggtaaag attttttcaa + 4621 aagaggtcag tatattgagt tggtggaaac gataaaatac ataatatttt attcctttgg + 4681 ttatcaaatt agcccctcct gaagctcccc aattgacggc ttgagctcca atcaaagggt + 4741 gtttgtccgc tttttgacag agggtaatcg ctagaggaca gcaaacggcc atagtagtga + 4801 aaaatccagc acctaaagca gacaaaaggg ttgccatcag gtataaaatc atgtagaggg + 4861 cgttagggtg ggtgcgtgtg cggtagagaa tgtgttgagc caaaacatca agagtaccgt + 4921 
tagttgttgc aacgttataa aagagagaga cgctaaaaat ggtaaaaaag agtgaggttg + 4981 gccaaaaatg aagaagttct ttgggactta atcccatgag agtggttgcg atgaggtaag + 5041 aaaaagcaat agccagcagg ccaatattga ttttggtgcg gtaaccaatt ccaatggcta + 5101 gagcaatggc gctaatcatt attaaatgaa tcattgaatt gtcctttcag ttagaatata + 5161 gaaagaggat agattgaagt tcgagaatac tgggtgtctt ctgatgttaa gtggttgtgt + 5221 caaaaccatc ccaaatggca taaattgcgt ggaattggaa tgactcgtaa tactattgat + 5281 agagatggta ttacaagtca agacgttcgc tattttatct ttaactttaa gcttgatgtg + 5341 atgacctttt gccatagtgt tcgaggtcat tggtcagcag aaagtatgca ttggttattg + 5401 gatgtggttt atcgtgaaga ccatcatcag accctggata aacgagctgc ttttaacctt + 5461 aatcttatcc gaaaaatgtg tttatatttt ctaaaagtga tggtattttc taaaaaagac + 5521 ctcagctatc gatgcaaaca acggtatatc tctgtccatt tggaagatta tttggaaaca + 5581 gaggttagga aagtaattag tttaacggga tatcttttca aagctgatac taaggcacaa + 5641 aaaaagtttg atattcccct tgacaataga taaaattatt atataattaa actattgctt + 5701 tttaaataaa gtgagaatat taataataca gagaaagagg actgtagtaa aatgaaaatt + 5761 gccattgcag gaagtggtta tgtaggactg tctttagcgg tgctactagc tcagcatcat + 5821 gaagttaagg tcattgatgt tataaaggat aaggtagagt cgataaacaa tagaaaatct + 5881 ccaattaagg atgaggcgat tgagaaatac ttagttgaaa acgagttgaa tcttgaagcc + 5941 tccttagatc ctgcacacgt ttataaagac gtggagtatg ctattattgc tactccgact + 6001 aattatgatg tagacttaaa tcagtttgat acatcttcag ttgaagctgc tatcaagact + 6061 tgtatggaat ataatgatac ttgtacaatc gtaatcaaaa gtactattcc tgaagggtat + 6121 actaaagaag tgagggaaaa gtttaataca gatcgtatta tcttttctcc agagtttcta + 6181 cgtgaatcca aagctttata tgataatttg tatccatcta gaattgttgt aggaactgat + 6241 ttggatgatt ctgagttaac aaaaagagca tggcagtttg cagatctact taaaggtgga + 6301 gctattaagg aagaggttcc gatactggtt gttgctttta atgaagcaga ggttgcaaaa + 6361 ttgtttagta acacttactt ggcaactcgc gtagcttatt ttaatgagat agatacatat + 6421 agcgaggtaa aagggcttaa tcccaagaca attattgata ttgtttgtta tgatcctaga + 6481 attggatcat actataataa ccctagcttt ggttacggag ggtattgctt accaaaagac + 6541 acaaagcaat tgaaagcaag 
ttttagggat gttcctgaaa atctgattac agctgtggtg + 6601 caatctaata aaacaagaaa agattatata gctggagcta ttctagctaa acaacctagt + 6661 gttgtaggta tttatagatt aattatgaaa tctgattctg ataattttcg ttctagtgct + 6721 gttaagggag ttatggaacg tttggacaat tatggtaaag aaattgttat ttacgaacct + 6781 actattgagt gtgatacttt tatgggatac agagtaatta aatctttaga tgaatttaag + 6841 aatatttctg acattgttgt agcgaatcgt atgaacgatg atttaaggga tatacaagaa + 6901 aaactctata cacgcgattt atttggcaga gaataagggg aaataatttt tatgtataca + 6961 tttattttaa tgttattgga tttttttcag aatcatgatt ttcatttctt tatgttgttt + 7021 tttgtcttta ttcttattcg ttgggcggtt atatattttc atgctgtcag atataagtcc + 7081 tacagttgta gtgtaagtga tgagaagtta tttagttctg taattatccc tgtcgtggat + 7141 gaaccactta atctttttga aagtgtactg aatagaattt ccagacataa accatccgaa + 7201 attattgtgg ttattaacgg cccaaaaaac gagagacttg taaaactttg tcatgatttt + 7261 aatgaaaaat tagaaaataa tatgactcca attcaatgtt attacactcc tgttcctggc + 7321 aagagaaatg ctatccgcgt tgggctggag catgtggatt cgcagagtga tattacagtt + 7381 ctagtagata gtgatacagt atggacgcct agaaccttga gtgagttgct gaagcctttt + 7441 gtttgcgata aaaaaatagg tggggtaacg acaagacaaa aaattcttga ccctgagcgt + 7501 aatctcgtga caatgtttgc taacttgtta gaggaaatta gggcagaagg aactatgaaa + 7561 gcaatgagtg tgactggtaa agtagggtgc ttacctggtc gaacaattgc ttttagaaca + 7621 gagattctca gagagtgtat acatgagttt atgaatgaga ctttcatggg atttcataag + 7681 gaagtttctg atgatagaag tcttacaaat ttgactttaa aaaaaggcta taaaactgtt + 7741 atgcaggata cttctgttgt gtatacagat gctcctacaa gttggaaaaa gttcattaga + 7801 cagcaactaa ggtgggcaga aggttctcag tataacaatc taaagatgac tccttggatg + 7861 attagaaatg cccctcttat gttttttatt tattttacag atatgatttt acctatgcta + 7921 cttattagct ttggtgtgaa tatattcctg ttgaaaatat taaatataac tgcaattgtt + 7981 tatacagctt catggtggga aattatttta tatgttcttt tgggaatgat ttttagcttt + 8041 ggaggaagac actttaaagc tatgtctaga atgaagtggt attatgtatt tcttattcct + 8101 gtttttataa tcgttttgag tataattatg tgccctatta ggctattagg acttatgaga + 8161 tgttctgatg atttagggtg gggaactagg aatttaacag 
agtgagataa atagtagtgc + 8221 gtatatagag tatttactca gagtattaat tgatttttga aaaggaaaag tgtttttaaa + 8281 tgttaagaaa gaacttgaaa tatcagatta tgacacgagc tggaacaatt ttagctatct + 8341 tgtttttcat tatattaggg attattgttg aagttttgtt ttaaggctca ttgtcatctg + 8401 tagtggctca cttcagacgt aagggtcata ttttaatgtg aaaagagtgt taaaagatta + 8461 atcacttata ttattttaat agaaatagtg taaggaattg ttatgaaaaa agtaaaaaaa + 8521 gctgttattc ctgctgcagg gctgggcaca cgatttttgc ctgccactaa agctttggca + 8581 aaagaaatgc ttccaattgt agaccgcccc acaattcatt ttgtcattga agaagcttta + 8641 cgttcgggta ttgaagatat tctagtagtt actgaaaaga gtaaacgttc tattgaagat + 8701 tattttgatt caacttttga attggaatat agtcttagaa aacaaggaaa gatggaactt + 8761 cttaagtcag ttaatgaatc gactgatatt aaagtacatt tcgttcgtca aagttcacca + 8821 cgtggtcttg gtgacgctgt tctccaagcg aagtcttttg ttggtgacga tccctttgtt + 8881 gtaatgcttg gtgatgacct tatggatatc accgactcaa ctgctgtacc tttaacaaga + 8941 caattgatgg atgattacaa cgcaacacag gcttcaacta tcgcagtaat gcctgttaga + 9001 tatgaagatg tttcttctta tggtgtgatt tctcctagat tggaaagtag taatggcctc + 9061 tatagtgttg atgcttttgt agagaaacca aaaccagaag aagcgcctag caatttagct + 9121 attattggac gttatctact tactcctgag attttttcta tattagaaac ccaaaagcca + 9181 ggagcaggta atgaaattca attgacagat gctattgata cattgaataa gacacagagt + 9241 gtttttgcgc gtgaatttgt gggcaaacgt tatgatgttg gtgataagtt taattttatg + 9301 aaaacatcaa ttgattatgc tcttcaacat cctcagatta aagagagttt aaaaaattac + 9361 gttattgcac ttggtaagca attggagaag ctagatgact gttcgtcaag tggacaccta + 9421 tgaattgtat agaaagttat caaaaatggc taaatgtccc tgatcttcca gcttatttaa + 9481 aagatgaatt gctcagcatg gatgacaaaa caaaagaaga cgccttttac acaaaccttg + 9541 aattcggaac agctggtatg cgtggttata ttggtgctgg gacaaaccgt attaatatct + 9601 atgtggtgcg tcaagcaaca gaaggccttg ccaaattagt tgaatcaaaa ggcgaaacgg + 9661 ccaaaaaagc tggggttgct attgcctatg actcgcgaca tttttcacca gaattcgctt + 9721 ttgaatctgc ccaagtatta gcggcccatg gcattaaatc ttatgttttt gaaagcctac + 9781 gccctactcc tgagctgtct tttgctgttc gtcatctcgg agcatttgct ggtattatgg + 9841 
taaccgccag ttatacccct gctcctttta atggttataa agtttacggt tctgatggtg + 9901 ggcaaatgct tccagctgat gctgatgctt taactgacta tattcgtgcg attgataacc + 9961 catttgctgt agcccttgct gacttagaag aagctaaatc aactggtctt attgaagtaa + 10021 ttggtgaaac tctcgatgct gcctaccttg aagaggttaa aagcgttaat atcaatcaag + 10081 atttgattga ccaatacggt cgcgatatga aaattgtcta cacacctctt catggtactg + 10141 gagaaatgct agcacgtcga gctttagcac aagctggttt cgaatctgtt caagttgtcg + 10201 aagctcaagc aaaaccagcc ccagacttct caacagttgc atcaccaaac cctgaaagtc + 10261 aagccgcctt tgccttagct gaagaactag ggcgtcaagt cgatgctgat gtattagtgg + 10321 cgactacttt agctgca +// + diff --git a/public/res/serotype_genbank/serotype_31.gb b/public/res/serotype_genbank/serotype_31.gb new file mode 100644 index 0000000..c6fea6a --- /dev/null +++ b/public/res/serotype_genbank/serotype_31.gb @@ -0,0 +1,1043 @@ +LOCUS CR931695 22164 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain nr. 34374 (serotype 31). +ACCESSION CR931695 +VERSION CR931695.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 22164) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 22164) + AUTHORS Bentley,S.D. 
+ TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..22164 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="nr. 34374" + /db_xref="taxon:1313" + gene <1..163 + /gene="dexB" + /locus_tag="SPC31_0001" + CDS <1..163 + /gene="dexB" + /locus_tag="SPC31_0001" + /codon_start=2 + /transl_table=11 + /protein_id="CAI34088.1" + /db_xref="GOA:Q4JZX1" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4JZX1" + /translation="DRRFLVVANLSNEEQDLTVEGKVKSVLIENTLAQEVFEKQILIP + WDAFCVELL" + gene 322..474 + /gene="aliB" + /locus_tag="SPC31_0002" + /pseudo + CDS 322..474 + /gene="aliB" + /locus_tag="SPC31_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + /db_xref="PSEUDO:CAI34089.1" + gene complement(order(491..1025,1027..1353)) + /gene="tnp" + /locus_tag="SPC31_0003" + /pseudo + CDS complement(join(491..550,549..1025,1027..1353)) + /gene="tnp" + /locus_tag="SPC31_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(join(963..1025,1027..1335)) + /gene="tnp" + /locus_tag="SPC31_0003" + /note="HMMPfam hit to PF01710, Transposase, score 2.1e-22" + /pseudo + gene 1588..3033 + /gene="wzg" + /locus_tag="SPC31_0004" + CDS 1588..3033 + /gene="wzg" + /locus_tag="SPC31_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + 
/protein_id="CAI34091.1" + /db_xref="GOA:Q4JZX0" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4JZX0" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLLFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKSQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLTDGDRDRGRNQQKVIVAILQKLTST + EVLKNYSTIINSLQDSIQTNMPIETMIDLVNTQLESGGNYKVNSQDLKGTGRMDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1588..1704 + /gene="wzg" + /locus_tag="SPC31_0004" + /note="Signal peptide predicted for SPC1454 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 39 and 40" + misc_feature 1792..2139 + /gene="wzg" + /locus_tag="SPC31_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 1.3e-62" + misc_feature 2317..2760 + /gene="wzg" + /locus_tag="SPC31_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 4.4e-70" + gene 3035..3766 + /gene="wzh" + /locus_tag="SPC31_0005" + CDS 3035..3766 + /gene="wzh" + /locus_tag="SPC31_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34092.1" + /db_xref="GOA:Q4JZW9" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4JZW9" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTPDVLDKLGKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEQDLVHVIASDMHNLDGRPPHMAEAYDFVT + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 3038..3646 + /gene="wzh" + /locus_tag="SPC31_0005" + /note="HMMPfam hit to PF02811, 
PHP domain, score 1e-37" + gene 3772..4467 + /gene="wzd" + /locus_tag="SPC31_0006" + CDS 3772..4467 + /gene="wzd" + /locus_tag="SPC31_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34093.1" + /db_xref="GOA:Q4JZW8" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4JZW8" + /translation="MMKEQNTIEIDVFQLFKTLWKRKLMILLVALVTGAGAFAYSTFI + VKPEYTSTTRIYVVNRDQGDKSGLTNQDLQAGTYLVKDYREITLSQDVLEKVATNLKL + DMPAKTLASKVQVTVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDV + TTLEEARPVTTPSSPNVRRNSLFGFLGGAVVTVIAVLLIELIDTRVKRPEDVEDVLQI + PLLGVVPDLDKMK" + misc_feature 3772..3888 + /gene="wzd" + /locus_tag="SPC31_0006" + /note="Signal peptide predicted for SPC1456 by SignalP 2.0 + HMM (Signal peptide probability 0.721) with cleavage site + probability 0.467 between residues 39 and 40" + misc_feature 3793..4209 + /gene="wzd" + /locus_tag="SPC31_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 2.8e-54" + misc_feature 4315..4392 + /gene="wzd" + /locus_tag="SPC31_0006" + /note="PS00217 Sugar transport proteins signature 2." 
+ gene 4477..5151 + /gene="wze" + /locus_tag="SPC31_0007" + CDS 4477..5151 + /gene="wze" + /locus_tag="SPC31_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34094.1" + /db_xref="GOA:Q4JZW7" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4JZW7" + /translation="MPTLEISQAKLDFVKKAEENYNALCTNLQLSGDDLKVFSITSVK + LGEGKSTTSTNIAWAFAHAGYKTLLIDGDIRNSVMLGVFKARDKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRKCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGVVLNKFDTSVDKYGSY + GNYGKK" + gene 5250..5843 + /gene="wcjG" + /locus_tag="SPC31_0008" + CDS 5250..5843 + /gene="wcjG" + /locus_tag="SPC31_0008" + /note="member of homology group 50" + /codon_start=1 + /transl_table=11 + /product="putative initial sugar transferase" + /protein_id="CAI34095.1" + /db_xref="GOA:Q4JZW6" + /db_xref="InterPro:IPR003362" + /db_xref="UniProtKB/TrEMBL:Q4JZW6" + /translation="MDVFIGLFGTIFIVLPSSLMIYIIYKIKGYKGNIFFTQYRVGLK + GKKFKIIKFRSMVENAEEVLAANKALYEKYINNSYKLPPNEDPRLTNIGDFIRKTSID + EIPQFINLMLGDMSLIGPRPILENELEEYSKEEQQVLLSVRPGITGMWQVSGRSEVYY + PERCEMELYYPRNQSFLLDVKIFFLTIKKVLSGEGAH" + misc_feature 5259..5840 + /gene="wcjG" + /locus_tag="SPC31_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 2.4e-53" + gene 6060..6854 + /gene="wciB" + /locus_tag="SPC31_0009" + CDS 6060..6854 + /gene="wciB" + /locus_tag="SPC31_0009" + /note="member of homology group 16" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34096.1" + /db_xref="GOA:Q4JZW5" + /db_xref="UniProtKB/TrEMBL:Q4JZW5" + /translation="MSKKYKIIVATHKRFQMPEDKDLYVPVQVGSEGKENLGYQRDNQ + GNHISYLNPYYCELTGLYWAWKNLDCDYLGLVHYRRYFTDKNRPYHDKINMNEVILSA + DQVKELMSEVDVVVPKKRKYYIETLYSHYAHTHDSSHLDVTREIIKEVSPEYLATFDK + VMAYRSGYMFNMFIMSKENVSSYCEWLFPIIDELYRRLDITGYSAFDARLFGRVSERL + 
FNVWLDYQNLHVKELPFMYMEKVDLLEKGKSFLMAKFFGKKYGQSF" + gene 6838..7935 + /gene="wcrP" + /locus_tag="SPC31_0010" + CDS 6838..7935 + /gene="wcrP" + /locus_tag="SPC31_0010" + /note="member of homology group 89" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34097.1" + /db_xref="GOA:Q4JZW4" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JZW4" + /translation="MVRVFEMLEKKSPLFSVIVPTYKISESNLRQCIDSLLYDNQDVE + IILVDDNANSDICGEVIDEYAEKYNNISVIHQENQGVSVARNAAMSIAVGKYLVFVDP + DDWVAENFYSQMTFAVQKNPSSDVIILAAIVDYNGKRFTNHFWHTSRSFRGKVKDDLE + LQLIAKGATSYFPAEIGVGVPWAKIYRNEFVRANGLVFNPSLRRMQDNIFNMYAFEFA + NEIVYIDEPIYYYRKSMDSVTNKKNDKVIYYFDLVNDEVEKFILKFNKPKIFEDALHI + KRLIGINSYYKLYFQFASTSSEKKKMRQEFRELLEREEYANSLKQVNTAYLLPKEKIF + ISILKQKDLWIFSLLQKLEKLSVRLKSRQFS" + misc_feature 6883..7422 + /gene="wcrP" + /locus_tag="SPC31_0010" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 1.2e-30" + gene 8038..8931 + /gene="wcrR" + /locus_tag="SPC31_0011" + CDS 8038..8931 + /gene="wcrR" + /locus_tag="SPC31_0011" + /note="member of homology group 90" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34098.1" + /db_xref="GOA:Q4JZW3" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JZW3" + /translation="MENVLNKKIGIVILNYLNWEDTLECINSLRSQSDQDFEAVIVEN + GSPNESVSRIRDYIKNDKNIHICVVDNNLGYANGNNMGILYLKNRYSINRILLTNNDV + VFDDEDYIKKLEDIKYSNTIGAIGTKIIGSDGLDQNPAYFPISFKSSIKLLIINLLAF + SKAFTFIKRRYLSSWAKKVNDFSAPRYNNQKYCLHGSVIFLTENYLDKFMGLYGGTFL + YYEEVILGIIFEKAGLDMLYIPNFSIYHKEDQSSLQSFNNDDLVRRRYLLQSIWSSMR + IYRSSIDNLSNIIENSIKEKL" + misc_feature 8065..8565 + /gene="wcrR" + /locus_tag="SPC31_0011" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 2.3e-13" + gene 8928..10190 + /gene="wzy" + /locus_tag="SPC31_0012" + CDS 8928..10190 + /gene="wzy" + /locus_tag="SPC31_0012" + /note="member of homology group 121" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide 
repeat unit polymerase Wzy" + /protein_id="CAI34099.1" + /db_xref="UniProtKB/TrEMBL:Q4JZW2" + /translation="MINSSKYLKFVLYYQIISFYFLGIFYRLSTFNQYLYVIADIVFI + SVYLLIFERKIAYTNIKLFIIFILFYLFGSFQGYDSGGAFIIFLLIYLKYILFKFIII + NIPQSNLIRAFTNIGILNTVILLAEVLSHGHINLFVNHYTLAQKIETLNKVGTNLAVL + RGGFENPLVTSVMLSSTLLFFMTIEKALLRNILIMSNLFLIMATEKRTGILISIALLF + CYYFRKNLKTKSVSKFIIKFLGGLFFLGFALLAINMITISGRSISQMIIERFSSLSSG + SDFSAIHRSMAFKIGIEIIWSRNILNILFGNGFYFLPTFMYNNNITITKLGFLVIDNS + YLSFLADFGMMPLISIMFYLIGGIFKNLVSNETDNISEVVMFSLIALLLSASVFDILN + WYQSTLLTCFFVAYLSVYHDSSKRKGNK" + gene 10187..11431 + /gene="wcrW" + /locus_tag="SPC31_0013" + CDS 10187..11431 + /gene="wcrW" + /locus_tag="SPC31_0013" + /note="member of homology group 122" + /codon_start=1 + /transl_table=11 + /product="conserved hypothetical protein" + /protein_id="CAI34100.1" + /db_xref="UniProtKB/TrEMBL:Q4JZW1" + /translation="MTIKNEIKHLKRKIDKNFFQKDFTSISDIKNYQIAPSLNPRPRL + NLLITSMNSQDVYAGIKSAVDFFMKFKKFDIDLRIIVMGKKIDESSLYQVPGFEFIKD + YSIDNDSESRIICDLSKNRSPLFIRERDYFLSTMWYTAYNANNVLDEQKRIFGKRMPM + VYLVQDYEPGFYPWSSEYLLAESTYHLDNQLVVFNSKYLKEFFDANGYRFENSYYFDP + VLNEKLGEILNSAELSNIERKNRILFYGRPSKARNAFQLICMALEKWSLLDEHSSNWE + IFSAGEDLKDIKLNNNIVIKSLGKMSVEEYAKFMLESKIGISLMASPHPSYPPLEMAT + FGMKVITNSFVTKDISDFNENIISIEHININKLAKELHFLTTSDIEYKISKNDDYING + ISQLDTIVDKIGGHLQFQHSEV" + gene 11434..12876 + /gene="wzx" + /locus_tag="SPC31_0014" + CDS 11434..12876 + /gene="wzx" + /locus_tag="SPC31_0014" + /note="member of homology group 123" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI34101.1" + /db_xref="GOA:Q4JZW0" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4JZW0" + /translation="MKRKSIARNYLLNLIKTTLSILFPLISYPYVSRILSVDGLGAIN + FSASFVNYFVLIAIFGINVYAVREGAKYRDDKKLLGKFVTEMLLVSICTAMISFSLLT + VSLLLPALSEYRSLILIFSITIIFNVVGMEWFFQLMEDYQYITLRAIIFQILSLIFLF + IFVKDRNDIYVYALITVAANAGSQILNLFRLRKEVEIFRYKDYNIRNYFKPMFLIFLT + LLSMNIYRYLDVTFLGFFKNDRSVGYYSLATKITSAIISMVSSVTVILTPRLAYHYKK + 
EEFDKFYKIAYSSFDFILLLAIPVVIGVLSFSSILVDFLGGSTFVSSVLTVEILSLTI + LFSNLNALLITPILTVMNREKAVLKIFIIALIFNVITNMLLIPVMDFNGSALVTVLTE + GIICILSLISIKSVFNVRRLFKNLFQYLVASIFIIVVKIVISQYVSSNYIIFISTALL + SAILYFLTLILLRNELVPQLIIEVRKKIYR" + misc_feature 11449..12255 + /gene="wzx" + /locus_tag="SPC31_0014" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 7.1e-45" + gene 12892..13572 + /gene="wcrX" + /locus_tag="SPC31_0015" + CDS 12892..13572 + /gene="wcrX" + /locus_tag="SPC31_0015" + /note="member of homology group 124" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34102.1" + /db_xref="GOA:Q4JZV9" + /db_xref="InterPro:IPR011004" + /db_xref="UniProtKB/TrEMBL:Q4JZV9" + /translation="MFTIYRAMKKIIIIILSLPKIFYINFKCLPLNQAVKLPIYVHFN + TRLMIRGDIKIIDTHLSRFTIILGKDGSNHISPHESRLFIYDGGQLILGRNILLSSGF + NLCIEQGGTVKLGDNVSFNRNSSIFCKKQINIGKNSLFGWNCSLRDNNGHRIYYQGNC + IKSEGVIVIGENCWITADSIILKNSVLPFSTVVATGSLVNKEFNQSNILIAGRPARII + RDDIKWER" + gene 13640..14860 + /gene="ugd" + /locus_tag="SPC31_0016" + CDS 13640..14860 + /gene="ugd" + /locus_tag="SPC31_0016" + /note="member of homology group 20" + /codon_start=1 + /transl_table=11 + /product="UDP-glucose 6-dehydrogenase Ugd" + /protein_id="CAI34103.1" + /db_xref="GOA:Q4JZV8" + /db_xref="InterPro:IPR001732" + /db_xref="InterPro:IPR008927" + /db_xref="InterPro:IPR013328" + /db_xref="InterPro:IPR014026" + /db_xref="InterPro:IPR014027" + /db_xref="InterPro:IPR014028" + /db_xref="InterPro:IPR016040" + /db_xref="InterPro:IPR017476" + /db_xref="UniProtKB/TrEMBL:Q4JZV8" + /translation="MKIAVAGTGYVGLSIAVLMAQHHEVVAVDIISEKVNLINNGKSP + IKDDYIEEYLATKPLNLVATLDTNLAYQNADFVIIAAPTNYDSEKNFFDTSAVESVIE + TVLETNPNAVMVIKSTVPVGYTQSVRNKYKTSNILFSPEFLRESKALYDNLYPSRIIV + GLDMDDAYLKERAETFAELLQEGAIKEAIEILYMGFTEAEAVKLFANTYLALRVSYFN + ELDTYAEVKGLDTKAIIEGIGLDPRIGNQYNNPSFGYGGYCLPKDSKQLLANYKDVPQ + NMITAIVESNRTRKDFIAEQILKFAGVSNNGEIYPKDVIIGLYRLTMKSNSDNFRQSS + IQGVMKRLKAEGANVIIYEPTLSDNETFFGSKIVNDLEHFKSISNVIVANRYDDLLKD + 
VSDKVYSRDIFKRD" + misc_feature 13640..14194 + /gene="ugd" + /locus_tag="SPC31_0016" + /note="HMMPfam hit to PF03721, UDP-glucose/GDP-mannose + dehydrogenase, score 9.2e-51" + misc_feature 14225..14506 + /gene="ugd" + /locus_tag="SPC31_0016" + /note="HMMPfam hit to PF00984, UDP-glucose/GDP-mannose + dehydrogenase, score 2.4e-36" + misc_feature 14588..14839 + /gene="ugd" + /locus_tag="SPC31_0016" + /note="HMMPfam hit to PF03720, UDP-glucose/GDP-mannose + dehydrogenase, score 1.1e-06" + gene 14873..15973 + /gene="glf" + /locus_tag="SPC31_0017" + CDS 14873..15973 + /gene="glf" + /locus_tag="SPC31_0017" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI34104.1" + /db_xref="GOA:Q4JZV7" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR006076" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JZV7" + /translation="MYDYLIIGAGLSGAIFAHEATKRGKKVKVIDKRDHIGGNIYCEN + VEGINVHKYGAHIFHTSNKKVWDYINQFAEFNNYINSPVANYKGSLYNLPFNMNTFYT + MWGTKTPQEVKDKIAEQTAGMKDVEPKNLEEQAIKLIGPDIYEKLIKGYTEKQWGRSA + TELPPFIIKRLPVRLTFDNNYFNDRYQGIPIGGYNVIIENMLKDVEVELGVDFFAHRE + ELEASANKVVFTGMIDQYFDYKHGELEYRSLRFEHEILDEENYQGNAVVNYTEREIPY + TRIIEHKHFEYGMQPKTVITHEYPADWKRGDEPYYPINDEKNNAMFAKYQEEAAQNDK + VIFCGRLADYKYYDMHVVIERALEVVEKEFSN" + misc_feature 15308..15910 + /gene="glf" + /locus_tag="SPC31_0017" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 5.3e-139" + gene 16001..16870 + /gene="rmlA" + /locus_tag="SPC31_0018" + CDS 16001..16870 + /gene="rmlA" + /locus_tag="SPC31_0018" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI34105.1" + /db_xref="GOA:Q4JYY8" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q4JYY8" + 
/translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLT + GIKDILIISTPQDLPRFKDLLLDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFIGDDSV + ALILGDNIYHGPGLSTMLQKAAKKEKGATVFGYQVKDPERFGVVEFDTDMNAISIEEK + PEHPRSNYAVTGIYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLGRGDLSVEVMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLTLAQPLKKN + EYGQYLLRLIGEA" + misc_feature 16004..16720 + /gene="rmlA" + /locus_tag="SPC31_0018" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 6.4e-118" + gene 16871..17464 + /gene="rmlC" + /locus_tag="SPC31_0019" + CDS 16871..17464 + /gene="rmlC" + /locus_tag="SPC31_0019" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI34106.1" + /db_xref="GOA:Q7BTQ6" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:Q7BTQ6" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKHHPLLKDVKPLKKEDL" + misc_feature 16907..17437 + /gene="rmlC" + /locus_tag="SPC31_0019" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 8.8e-16" + gene 17477..18526 + /gene="rmlB" + /locus_tag="SPC31_0020" + CDS 17477..18526 + /gene="rmlB" + /locus_tag="SPC31_0020" + /EC_number="4.2.1.46" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI34107.1" + /db_xref="GOA:Q4K121" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K121" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPGVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + 
YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQATD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 17492..18448 + /gene="rmlB" + /locus_tag="SPC31_0020" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 7.1e-05" + misc_feature 17495..18331 + /gene="rmlB" + /locus_tag="SPC31_0020" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.0039" + misc_feature 17495..18235 + /gene="rmlB" + /locus_tag="SPC31_0020" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 2.7e-76" + misc_feature 17498..18310 + /gene="rmlB" + /locus_tag="SPC31_0020" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 1.6e-05" + gene 18592..19443 + /gene="rmlD" + /locus_tag="SPC31_0021" + CDS 18592..19443 + /gene="rmlD" + /locus_tag="SPC31_0021" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI34108.1" + /db_xref="GOA:Q4K1G6" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K1G6" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITNEEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 18592..19440 + /gene="rmlD" + /locus_tag="SPC31_0021" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 4e-147" + misc_feature 18595..19236 + /gene="rmlD" + /locus_tag="SPC31_0021" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.00013" + misc_feature 18595..19224 + /gene="rmlD" + /locus_tag="SPC31_0021" + /note="HMMPfam hit to PF01370, NAD dependent + 
epimerase/dehydratase f, score 9.9e-19" + misc_feature 18598..19326 + /gene="rmlD" + /locus_tag="SPC31_0021" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 2.9e-08" + gene 19506..20615 + /gene="glf" + /locus_tag="SPC31_0022" + CDS 19506..20615 + /gene="glf" + /locus_tag="SPC31_0022" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI34109.1" + /db_xref="GOA:Q4JZV2" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR006076" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JZV2" + /translation="MYDYIIVGAGLSGAIFAYEATKRGKKVKVIDKRNHIGGNIYCEN + VEGVNVHKYGAHIFHTSNKKVWDYVNQFAEFNNYVNSPVANYKGSLYNLPFNMNTFYA + MWGTKTPQEVKDKITEQTADMKDVEPKNLEEQAIKLIGPDVYEKLIKGYTEKQWGRSA + TELPPFIIKRLPVRLTFDNNYFNDRYQGIPIGGYNVIIENMLKDVEVELGVDFFAHRE + ELEASAEKVVFTGMIDQYFDYKHGELEYRSLRFEHEILDEENYQGNAVVNYTEREIPY + TRIIEHKHFEYGTQAKTVITREYPADWKRGDEPYYPINDEKNNAMFAKYQEEASKNDK + VIFCGRLADYKYYDMHVVIERALEVVEKEFGYDKK" + misc_feature 19941..20543 + /gene="glf" + /locus_tag="SPC31_0022" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 1e-138" + gene 20563..21630 + /gene="wcjE" + /locus_tag="SPC31_0023" + CDS 20563..21630 + /gene="wcjE" + /locus_tag="SPC31_0023" + /note="member of homology group 18" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI34110.1" + /db_xref="GOA:Q4JZV1" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q4JZV1" + /translation="MNGRLRLWRKSLDMTKSRINWIDFGKGFSIFLVLAGHVLLGLYQ + SEKFPTANNILSLLIAQVYIFHIPVFFALSGYFFKPVSDLKEFWQYAKKKTIVFGLPY + IFYSIIHFGLQKVAGASVRVPTTISDLLNIYKDPLGVSWYLYILWSILIIYGLLSILV + KNRRMLFLISVFAYCLTLFVQTDIYIIQRTLVWGICFFLGSVLSEIHFDKINLKKFLF + FFVLFDFIYMFAWFLFYEVGSKKDYVSYSNPGLWGIAFIVCVLVAFAIFPKMEKNFPK + TFLYFTKYGKDSLGIYILHAPICSMIRILMLKVGINSVFIHVVVGIVLGWYLSILATY + ILKKIPFLNIVLLPQKYIKLK" + gene 21805..>22164 + 
/gene="aliA" + /locus_tag="SPC31_0024" + CDS 21805..>22164 + /gene="aliA" + /locus_tag="SPC31_0024" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34111.1" + /db_xref="GOA:Q4JZV0" + /db_xref="InterPro:IPR000914" + /db_xref="UniProtKB/TrEMBL:Q4JZV0" + /translation="MMKSSKLFALAGVTLLAATTLAACSGSGSSAKGEKTFSYIYETD + PDNLNYLTTAKAATANITSNVVDGLLENDRYGNFVLSMAEDWSVSKDGLTYTYTIRKD + AKWYTSEGEEYAAVKAQD" + misc_feature 21805..21897 + /gene="aliA" + /locus_tag="SPC31_0024" + /note="Signal peptide predicted for SPC1474 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.782 between residues 31 and 32" + misc_feature 22051..22119 + /gene="aliA" + /locus_tag="SPC31_0024" + /note="PS01040 Bacterial extracellular solute-binding + proteins, family 5 signature." +ORIGIN + 1 cgaccgtcgc ttcctagttg tggctaactt gtccaatgaa gagcaagact tgacagtaga + 61 aggaaaagtc aaatctgtct tgattgaaaa caccctagct caagaagtct ttgaaaaaca + 121 aatcttaatt ccatgggatg ctttctgtgt ggaattacta taaatatttt ttacagaaaa + 181 atttaaaatt gaaatcgtat aaaaacaagg gaggactgta taaaagacag aaatcctttg + 241 ttttttataa ccaaggttta taaactttca ttctcgaaat tcaattaact ttacaaattc + 301 ccactattaa ggagaaagaa gatgaacata aagaagcgtg tccttagtgc aggtctgact + 361 tttgcatctg ctttgctttt agctgcttgc ggccaatcag gttcagatac aaaaacttac + 421 tcatcaacct ttagtggaaa tccaactaca tttaattacc tgttagacta ttaatctgat + 481 gatatattca atcgaaacaa gaacaagaca aaagagcctt gtaaaaggta ttgcaatttg + 541 gtaatacctt ttatgaggtg ctttttgata tgagcccatg ttttctcaat aggattgtac + 601 tcaggtgagt agggaggaag aggtaaaagt ttatgcccaa actcttcaca caagagctct + 661 aacttcccca ttctatggaa tcttgcatta tccataataa taaccgatgg tgtgtttaat + 721 gttggtaaga aaaacttctg aaaccaagct tcaaaaaagt cgctcgtcat cgtctcttcg + 781 taagtcattg gagcgattaa ctcaccattt gttagacctg caaccaaaga aatcctctga + 841 tatcttcttc cagatacttt tcctcttctt aactgacctt ttaatgagcg accatattct + 901 cgataaaaat aagtatcgaa tcctgtttcg tcaatctaaa caggtgctag gtgctttaaa + 961 ctattaaaat tcttaagaaa taaggctact 
ttttctgggt cttgttcata gtaggtgtgg + 1021 ttcttttttt cgagtgtagc ccatagcttt gagcgcatag tggatggtag ttggatgaca + 1081 gccaaattca gaagctattt cagtcaaata agcgtctgga ttgtcagtaa gatagttttt + 1141 aagtctatct ctatcaactt ttcttggttt tattcctttt acttggtggt ttagctctcc + 1201 tgttttctct tttagcttta accagccata aatggtatta cgtgagattt ggaaaacgta + 1261 tgatgcttct gttatactac ctgttcgctc acaataagag agaacttttt tacgaaaatc + 1321 tattgaatat gccataagaa gattatacca cattgtgtac tatattatat tgaaactaga + 1381 atagtacacc tttgcttcta aaacattgtt agaaatcgat tggactgtcc tgaacgattt + 1441 gttctgttct tatttcattt tactatattt ttgtttcgcg ggaagtctac taagatactt + 1501 aaagatgcag atagtaaaaa taaaggtgta gacattaccg taaaaaagtg atataatcgt + 1561 acagtgttca atgtataggt attaatcatg agtagacgtt ttaaaaaatc acgttcacag + 1621 aaagtgaagc gaagtgttaa tatagttttg ctgactattt atttattgtt agtttgtttt + 1681 ttattgttct taatctttaa gtacaatatc cttgctttta gatatcttaa tctagtggta + 1741 actgcgttag tcctactagt tgccttggta gggctactct tgattatcta taaaaaagct + 1801 gaaaaattta ctatttttct gttgctgttc tctatccttg tcagctctgt gtcgctcttt + 1861 gcagtacagc agtttgttgg actgaccaat cgtttaaatg cgacttctaa ttactcagaa + 1921 tattcaatca gtgtcgctgt tttagcagat agtgagatcg aaaatgttac gcaactgacg + 1981 agtgtgacag caccgactgg gactgataat gaaaatattc agaaattact agctgatatc + 2041 aagtcaagtc agaataccga tttgacggtc aaccagagtt cgtcttactt ggcagcttac + 2101 aagagtttga ttgcagggga gactaaggcc attgtcctaa atagtgtctt tgaaaacatc + 2161 atcgagtcag agtatccaga ctacgcatcg aagataaaaa agatttatac taagggattc + 2221 actaaaaaag tagaagctcc taagacgtct aagagtcagt ctttcaatat ctatgttagt + 2281 ggaattgaca cctatggtcc tattagttcg gtgtcgcgat cagatgtcaa catcctgatg + 2341 actgtcaatc gagataccaa gaaaatcctc ttgaccacaa cgccacgtga tgcctatgta + 2401 ccaatcgcag atggtggaaa taatcaaaaa gataaattaa cccatgcggg catttatgga + 2461 gttgattcgt ccattcacac cttagaaaat ctctatggag tggatatcaa ttactatgtg + 2521 cgattgaact tcacttcttt cttgaaaatg attgacttat tgggaggggt agatgttcat + 2581 aatgatcaag agttttcagc tctacatggg aagttccatt tcccagtagg 
gaatgtccat + 2641 ctagactctg agcaagcttt aggttttgta cgtgaacgct actcactaac cgatggagac + 2701 cgtgaccgtg gtcgcaacca acaaaaggtg attgtggcta tccttcaaaa attaacgtca + 2761 accgaagtac tgaaaaatta tagtacgatc attaatagct tgcaagattc tatccaaaca + 2821 aatatgccga ttgagactat gatagattta gtgaatactc agttggaaag tggagggaat + 2881 tataaagtaa attctcaaga tttaaaaggg acaggtcgga tggatcttcc ttcttatgca + 2941 atgccagaca gtaacctcta tgtgatggaa atagatgata gtagtttagc tgtagttaaa + 3001 gcagctatac aggatgtgat ggagggtaga tgaaatgata gacatccatt cgcatatcgt + 3061 ttttgatgta gatgacggtc ccaagtcaag agaggaaagc aaggctctct tggcagaatc + 3121 ctacaggcag ggggtgcgaa ctattgtctc tacctctcac cgtcgcaagg gtatgtttga + 3181 aactccggaa gagaagatag cagaaaactt tcttcaggtt cgggaaattg caaaagaagt + 3241 agcagatgat ttagtcattg cttacggggc tgaaatttac tacacaccag atgttctgga + 3301 taagctggga aaaaagcgga ttccgaccct caatgatagt cgttatgcct tgatagagtt + 3361 tagtatgaac actccttatc gcgatattca tagcgccttg agcaagatct tgatgttggg + 3421 aattactcca gtcattgccc acattgagcg ctatgatgct cttgaaaata atgaaaaacg + 3481 cgttcgagaa ctgatcgata tgggctgtta cacgcaagta aatagttcac atgtcctcaa + 3541 acccaaactt tttggcgaac gttataaatt catgaaaaaa agagctcagt attttttaga + 3601 gcaggatttg gtccatgtca ttgcaagtga tatgcacaat ctagacggta gacctcctca + 3661 tatggcagaa gcatatgact ttgttaccca aaaatacgga gaagcgaagg ctcaggaact + 3721 ttttatagac aatcctcgaa aaattgtaat ggatcaacta atttaggaga aatgatgaaa + 3781 gaacaaaaca cgatagaaat cgatgtattt caattattta aaaccttgtg gaaacgcaag + 3841 ttaatgattt tattagtggc acttgtgaca ggtgcggggg cttttgcata tagcactttt + 3901 attgttaagc cagaatatac gagtaccacg cgaatttacg tagtgaatcg cgatcaagga + 3961 gacaagtcgg ggctgacaaa tcaggatttg caggcaggaa cttatctggt aaaagactac + 4021 cgtgagatta ccctttcgca ggatgtattg gaaaaagtag cgacaaattt gaagttggat + 4081 atgccagcaa aaacattagc cagcaaagtt caagtgactg taccagctga cactcgtatc + 4141 gtctcaatct ctgtcaagga taaacagcca gaggaagcca gtcgtatcgc taattctcta + 4201 cgagaagttg ctgcagaaaa gatcgtcgct gtaacgcgag tatctgatgt aacgacactt + 4261 gaagaagcgc 
gaccagttac gactccctct tctccaaatg ttcgacgcaa ttccttgttt + 4321 ggttttcttg gaggagcagt cgtaacagta attgctgttc ttttgattga gttgatcgac + 4381 acccgtgtga aacgtcctga agatgtcgaa gatgtactgc aaattccact tttaggggtc + 4441 gttccagatt tggacaaaat gaaataggag gaaattatgc caacgttaga aatttcacag + 4501 gcaaaattgg attttgtaaa aaaggcagag gaaaattata acgctttgtg cacgaaccta + 4561 cagttaagtg gagatgattt gaaagtattt tctatcactt ctgtgaaact aggagaagga + 4621 aaatcaacga cttccaccaa tatcgcttgg gcttttgcgc atgcaggtta caaaacgctg + 4681 ctgattgatg gagatattcg caattctgtt atgttaggtg tctttaaagc aagggataag + 4741 attacaggcc tgacagaatt tttatcagga actacagacc tatcacaagg gctttgtgat + 4801 accaatatcg aaaatctctt tgtaattcag gctggctctg tgtcaccgaa tccgacagct + 4861 cttcttcaaa gtaagaattt cagtacaatg cttgaaacct tgcgtaaata ttttgactac + 4921 atcattgtag atactgctcc tgtcggtgtc gtgattgatg cggctattat tacgcgaaaa + 4981 tgcgatgctt ctattttagt gacggaggca ggtgaaataa atcgacggga tattcaaaaa + 5041 gcaaaagaac agttggaaca cacagggaag ccgtttttgg gagttgtgtt gaataaattc + 5101 gatacttcag tagacaaata cggttcttat gggaactatg gaaagaaata aataatcttg + 5161 tagtaccaag gttatttgag atgattacca tgagaggaga gtttaaggtg aaacagaatg + 5221 gcatcatcta tattggcttt aaaagaatta tggatgtttt tatcggctta tttgggacaa + 5281 tattcatagt cttgcctagt tctttaatga tttatattat ttataaaata aaaggttaca + 5341 aaggaaatat attcttcaca caatatagag tggggctaaa ggggaaaaaa tttaaaatta + 5401 ttaaatttag atcaatggtt gaaaatgctg aagaagtttt ggccgcaaat aaagcactct + 5461 atgaaaaata tataaataac agttataaat tacctccaaa tgaggatcct cgtcttacca + 5521 atatcggaga ttttataaga aaaacgagta ttgatgaaat tcctcaattt ataaatttaa + 5581 tgttaggtga tatgagtctt attggaccta gaccgatttt ggagaatgag ttagaggagt + 5641 attctaagga agaacagcaa gttttgttat ctgtacgacc aggtattaca gggatgtggc + 5701 aagtttctgg taggagtgag gtatattatc ctgaacgctg tgaaatggag ctgtactatc + 5761 ctcggaacca atcctttttg ttggatgtaa aaatcttctt tttgacaata aaaaaagttc + 5821 tatctggaga aggggctcat tgatgtatga gctaaatcat ctagcaaaaa atagatagaa + 5881 agaagaagtt gaatacggat agcgtttctt 
gggtattcgt attcattttt tcaagtgaag + 5941 gaagcattat gaataagtgg atttaatcta gtgtttttgc ttgaaaaaat ggatgggaat + 6001 tcaatctaaa gaattgtcca gtgaggcaag attttaggaa ttggagttag gatgtagaaa + 6061 tgtcaaaaaa gtataaaatt atagtagcga ctcataaaag atttcaaatg ccagaagata + 6121 aggacttata tgttcctgtt caggttggca gtgaaggaaa ggaaaattta ggctaccaac + 6181 gagataatca aggtaatcat atttcatatc ttaatcctta ttattgtgag ttgacaggat + 6241 tatactgggc ttggaaaaat ttagactgtg attatctagg attagttcat taccgacgtt + 6301 attttacaga taagaaccga ccttatcatg ataagattaa catgaatgaa gttatcctat + 6361 cggctgatca agttaaggag ctcatgtctg aagtagatgt cgttgttccc aaaaagagaa + 6421 aatattatat agaaactctc tattctcatt atgctcacac tcatgattcc agtcatttag + 6481 atgtaacacg agaaattata aaagaggttt cgccagaata tttagcaaca tttgacaagg + 6541 tgatggccta tcgtagcggc tacatgttca atatgtttat catgtccaaa gaaaatgtat + 6601 catcttattg tgagtggttg ttccctatca ttgatgagtt gtacagaaga ttggacataa + 6661 cagggtactc tgcttttgat gcaagactat ttggacgtgt tagtgaacgt ctctttaatg + 6721 tttggttaga ttaccaaaat ctacatgtta aagaacttcc gtttatgtat atggaaaagg + 6781 tggatttgct tgaaaaaggg aaatccttct taatggcaaa atttttcgga aagaagtatg + 6841 gtcagagttt ttgaaatgtt agaaaaaaaa tctccacttt ttagtgttat tgttccaacc + 6901 tataagatat cagaatctaa tctacgccag tgcatagact ctctgttata tgataatcaa + 6961 gatgttgaaa ttattttggt agatgataat gcaaactcag atatatgtgg tgaagtgata + 7021 gacgaatatg ctgaaaaata taataatatt tcagttattc atcaggaaaa ccaaggtgtg + 7081 tcagtcgcaa gaaatgctgc tatgtctatt gctgtaggaa agtatcttgt ttttgtagac + 7141 cctgatgatt gggttgctga aaatttttat agccaaatga cttttgcggt tcaaaaaaat + 7201 ccttcaagtg atgtgattat attagctgct attgtagact ataatggtaa acgatttacg + 7261 aatcattttt ggcacacttc tcgttctttt cgtggaaaag tcaaagatga tttggaactt + 7321 caattgattg ccaaaggagc aacgagttat tttccagctg agataggggt tggtgttcct + 7381 tgggcaaaaa tttatcgtaa tgagtttgtg cgagcaaatg gcttggtttt taatccttct + 7441 cttcgtcgaa tgcaagataa cattttcaat atgtatgcat ttgaatttgc gaatgagatc + 7501 gtctacattg atgagccgat ttactattat agaaagagca tggatagtgt 
aactaataag + 7561 aaaaatgata aagtaattta ttatttcgac ttagttaatg atgaggttga aaaatttatt + 7621 ctaaaattta ataagcctaa aatatttgaa gatgctctac atataaaaag acttatagga + 7681 atcaattcgt attataagtt gtattttcag tttgcgtcta cttcaagcga gaaaaagaaa + 7741 atgcgacaag aatttcgtga acttttagaa agggaagaat atgcaaattc gttaaaacaa + 7801 gtgaatacag cctatcttct cccaaaagaa aaaattttta taagcatttt aaagcagaaa + 7861 gacttatgga tattctcatt gttacaaaaa cttgaaaaat tgtctgtgag gttgaagagt + 7921 cgacagttta gttagaggga atatgagaca gttacagtag ggatttataa gccgatatat + 7981 aaatccaaat atattagaga aaaaatgtta ggaaacggtt tataaaaatt gtagaggatg + 8041 gagaatgtct tgaataaaaa aataggaatt gttattttaa attatcttaa ttgggaggac + 8101 actttagaat gcataaatag tttgcgctca caaagtgatc aagattttga agctgtcata + 8161 gtagaaaatg gttctccaaa tgaatctgtt tctaggatta gagattatat aaaaaacgac + 8221 aagaatattc atatttgtgt agtggataat aacttaggtt atgcaaatgg aaataatatg + 8281 ggcatcctct acttaaaaaa tagatactct ataaatagaa ttctattaac taataatgat + 8341 gttgtttttg atgatgaaga ctacataaaa aaattagaag atattaagta tagtaatact + 8401 attggagcga ttggaacaaa aattattggt tctgatggct tagatcaaaa tccagcctat + 8461 tttccaatat cttttaaatc aagtattaaa ttgttgatta tcaatttatt agctttttct + 8521 aaagctttta cttttattaa aagacgttat ctatcttcat gggcgaaaaa agttaatgat + 8581 ttttcggctc caagatacaa caatcaaaaa tattgtttac atggatcagt tatctttctt + 8641 accgagaatt atttagataa atttatggga ttgtatggtg gaacttttct ttactatgaa + 8701 gaagtgattt taggtattat atttgaaaaa gcaggtctcg atatgttgta tatacctaac + 8761 ttctcaatct atcataaaga agatcaatcg tcgctacaaa gttttaataa tgatgactta + 8821 gtgcgacgtc gttatttgtt gcaaagtatt tggtctagta tgcgaatata tagaagctca + 8881 atagataacc tatctaatat tatagaaaat tcaatcaagg aaaaattatg attaattcgt + 8941 ctaagtatct taaatttgtc ttatattatc agataatatc attttatttt ttaggtattt + 9001 tttataggct atctactttt aatcaatatt tatatgtaat agcagatata gtttttatat + 9061 cagtatactt attgatattt gagcgtaaaa tcgcttatac taatataaaa ctatttatta + 9121 tctttatttt attctatcta tttggaagtt ttcaaggata tgatagtggt ggtgcattta + 9181 ttatattttt 
actaatttat ttaaaatata ttttattcaa atttataatt ataaatatac + 9241 cgcaatccaa tttaataaga gcatttacaa acataggtat tttaaatacg gtcattttat + 9301 tagcagaagt tttaagtcac ggacatatta atttatttgt gaatcattat actttggcgc + 9361 agaaaataga aaccttaaat aaggttggga caaaccttgc ggttttacgt ggggggtttg + 9421 aaaatccctt agtgacatct gtaatgctat cttctacatt attatttttt atgactattg + 9481 agaaggctct cttacgtaat atactaatta tgtctaactt atttttgatt atggcaacag + 9541 aaaaaagaac aggaattcta attagtatcg cgttgttgtt ctgttactat ttcagaaaaa + 9601 atttaaaaac aaagagtgtt agtaagttta taataaaatt cttgggagga ttgtttttct + 9661 tgggatttgc tttattagcc ataaatatga taacaatttc tggtcgtagc atttctcaga + 9721 tgataataga gaggttttca tcattaagta gtggttcaga cttttctgct atacataggt + 9781 caatggcttt taaaataggc atagaaataa tttggagtag gaatatattg aatatattat + 9841 tcggtaatgg tttctacttt ttgccaactt ttatgtacaa taataatatt acgattacaa + 9901 agttgggttt tttagtaata gataattctt atttatcttt tttagccgat tttggcatga + 9961 tgcctttaat aagtataatg ttttatctta tagggggtat ctttaagaat cttgtttcga + 10021 atgagactga taatatttca gaagtagtta tgtttagctt aattgcattg cttttatcgg + 10081 cgagtgtgtt cgatatttta aactggtatc agagtactct tttaacatgc ttttttgttg + 10141 cttatttaag tgtatatcat gattctagca aaaggaaagg gaataaatga ctatcaaaaa + 10201 tgaaattaaa catttaaaac gaaaaataga taaaaatttt tttcaaaaag atttcacttc + 10261 catctctgat attaagaact atcagattgc accttctttg aatcctagac cacgtcttaa + 10321 tttattaatt acttcaatga attctcagga tgtatatgct ggcatcaaat cagccgtgga + 10381 tttttttatg aagttcaaaa aatttgatat agatttaaga atcattgtaa tggggaaaaa + 10441 aatcgatgaa tcgtctcttt atcaagttcc tggttttgaa tttattaaag actattcaat + 10501 tgataatgat agtgagtcta ggattatttg cgatttatct aagaatcgtt ctccattatt + 10561 tattagggag cgtgattatt ttctatcaac aatgtggtac accgcttata atgctaacaa + 10621 tgtgttggat gagcaaaaaa gaatttttgg gaaacggatg cccatggttt atctagttca + 10681 agactatgaa ccaggtttct atccatggtc ctcagagtat cttttggctg agagcacata + 10741 tcatctagat aaccagcttg ttgtctttaa ttctaagtat ttaaaagaat tttttgatgc + 10801 aaatggttat agatttgaaa 
atagttatta ttttgatcca gttttaaatg aaaaattggg + 10861 ggagattctt aattcagcag agctttctaa tattgaaagg aaaaatcgta ttttatttta + 10921 tggaaggcct agtaaagcta gaaatgcttt tcagttaatc tgtatggcat tggaaaaatg + 10981 gagcctttta gacgaacata gttcaaattg ggaaattttt tctgcaggag aagatttaaa + 11041 agatattaaa ttgaataata acatagtaat aaaatcgtta gggaagatgt cagttgaaga + 11101 atacgcaaaa tttatgttgg aatctaaaat cggaatctct ctaatggctt caccgcatcc + 11161 gagctatcct ccgttagaaa tggctacatt tggtatgaaa gtcataacga attctttcgt + 11221 tacaaaagat atttctgatt ttaatgaaaa cataatttct attgaacata ttaatattaa + 11281 taaattagcg aaagaattac attttttaac aacatctgat atagaatata aaatttcgaa + 11341 aaacgatgat tatataaatg gtattagcca gcttgataca attgtagata aaattggagg + 11401 acatttacaa tttcagcata gcgaggtgtg attgtgaaaa ggaaatccat tgcccgaaat + 11461 tatttactta atttgataaa aacgaccttg tctattctat ttcccctgat atcataccca + 11521 tatgtgtcgc gtattttatc tgtggatggg ctgggtgcaa tcaatttttc agcctcgttt + 11581 gttaattatt tcgtactaat tgcaatcttt ggaattaatg tctacgctgt tagagaaggt + 11641 gccaaatatc gagatgataa aaagttactt gggaagtttg taacggagat gttacttgtt + 11701 agtatttgca cggcaatgat ttcattctct ttattaactg tttccttact cctacctgct + 11761 ctatcagaat atagaagtct tattctaatt ttttcaatta ccattatatt taatgttgtg + 11821 gggatggagt ggttttttca attgatggaa gactatcaat atataacact tcgtgcaatt + 11881 atatttcaaa ttctatcttt gatattttta ttcatatttg tcaaagatag gaatgatatt + 11941 tatgtgtacg ctctaattac agttgcagca aatgcaggtt ctcaaatact gaatttattt + 12001 agacttagaa aagaagttga aatatttaga tataaagact ataatattag aaattatttt + 12061 aaaccgatgt ttctgatatt tttaacctta ttgtctatga atatatatag atatttagat + 12121 gttacttttc tgggcttctt taaaaatgat cgaagtgtgg gctactatag cttagctaca + 12181 aaaataacaa gtgctataat ttcgatggta tcttctgtta cagttatttt gacacctcgt + 12241 ctagcatatc attataagaa ggaggagttt gataaattct ataaaattgc ttatagttcc + 12301 tttgatttta ttttattact tgctatacca gttgttatag gtgtattgag ttttagttct + 12361 attttagtag attttttggg tgggagtact tttgtttctt ctgtgttaac ggtggagata + 12421 ttaagtttaa caattctatt 
ctctaatttg aatgctttat taattacacc tattttaacg + 12481 gttatgaatc gtgagaaagc ggttttaaaa atttttatta tcgcattgat tttcaatgtt + 12541 attacaaaca tgttacttat tccagtaatg gattttaatg gttcagcttt ggttacagtt + 12601 ttgacagaag gaattatttg catattatct ttaattagta taaaaagtgt gtttaatgtt + 12661 agaaggctat ttaagaatct ttttcaatat ctggtagcta gtatctttat aattgttgtc + 12721 aagattgtta tttctcagta cgtttcatca aattatatta tttttatttc aactgcttta + 12781 ctaagcgcaa ttttatattt ccttactttg atattattga gaaatgagtt agtaccacaa + 12841 ttaataatag aagttagaaa gaaaatatat agatagtgga gttaaatata aatgtttacc + 12901 atatatagag ccatgaaaaa aataattata attattttgt cgcttcccaa gattttttat + 12961 ataaatttta aatgccttcc gttgaatcag gcggttaaac ttcctatata tgttcatttt + 13021 aatactcgat taatgattag gggagacata aaaatcattg atactcattt atcacgtttt + 13081 actattattt tggggaaaga tggctctaat catatctctc ctcatgagag tagattattt + 13141 atttatgatg gggggcaatt aattctaggg agaaatattc tattatctag tggatttaat + 13201 ttgtgtatag agcaaggagg tacggttaaa ttaggagata atgtctcttt taacagaaat + 13261 tcttcgatct tttgtaaaaa acaaattaat attggtaaaa atagtttgtt tggttggaac + 13321 tgtagtttac gtgataataa tggacatagg atctattatc aggggaactg tattaagagt + 13381 gaaggagtta ttgtaatagg agagaattgc tggataacag cagactcaat cattcttaaa + 13441 aatagtgttc ttcctttttc tactgtagtt gctacaggta gtttagtaaa taaagagttt + 13501 aatcagagta acattttgat agctggaagg cctgctagaa ttattagaga tgatataaaa + 13561 tgggaaagat aagatagtaa ttgattaatt aggtcgtgta atttttaaca gagataacga + 13621 aaggtaatgg gtgaagtaaa tgaaaattgc agttgcaggt acaggctatg taggactatc + 13681 tattgcagtt ttaatggctc agcatcatga ggtggtagct gttgatatta tttctgaaaa + 13741 ggtcaatctg attaataatg gaaaatctcc aattaaggat gactatattg aagaatactt + 13801 agcaacaaag cccctcaact tagtggcaac attggataca aatctagcgt accaaaatgc + 13861 agattttgtt attatagcag ctccaacaaa ttatgattca gaaaagaact tttttgatac + 13921 atctgctgta gaatcagtta ttgaaacggt gttagagact aatcctaacg ctgtaatggt + 13981 aattaaaagt actgttcctg taggctatac tcaatcggtt cgtaataaat ataaaacaag + 14041 taatatttta tttagtccag 
aatttttacg tgagtcaaag gctttatatg ataatttata + 14101 tcctagccgt ataattgttg ggcttgatat ggacgatgca tatttaaagg agagagccga + 14161 aacttttgca gaactgctac aagaaggagc tattaaagag gctatagaaa ttctttacat + 14221 gggatttaca gaggcagaag cagtcaaact ttttgcaaat acatatttag ccttacgtgt + 14281 ttcttatttc aatgagttgg atacttatgc agaagttaaa gggctagata ccaaagctat + 14341 tattgaaggt attggcttag atccacgtat cggaaaccaa tataataatc cttcttttgg + 14401 atatggggga tattgccttc caaaagatag taaacaacta ttggcaaact ataaagatgt + 14461 tccacagaat atgataacag ctatcgttga gagcaatcgt actagaaaag attttattgc + 14521 agagcagatt ttgaaatttg caggagtttc aaataatggg gaaatttacc caaaagatgt + 14581 aataataggc ctttatcggt taactatgaa gagcaactcc gataattttc gtcaatcttc + 14641 tattcaaggt gttatgaaac gattgaaggc agaaggagca aatgtcataa tttatgagcc + 14701 aactcttagt gataacgaga cgttttttgg tagtaagatt gtaaatgatt tggaacactt + 14761 taaatcaatt agtaatgtta tcgtggcaaa tcgttatgat gatttgctta aagatgtgag + 14821 tgacaaggtt tatagtcgtg atatttttaa gagagattag gtagaagtta taatgtatga + 14881 ttatttaatc attggagctg gtttgtctgg tgcaatcttt gcgcacgaag ctacaaaacg + 14941 tggaaaaaaa gtaaaagtga ttgataaacg tgatcacatc ggtgggaaca tctattgtga + 15001 gaatgtagaa ggtatcaatg ttcataaata tggtgcccat attttccata cttctaataa + 15061 aaaagtttgg gactatatca atcaattcgc tgagtttaac aactatatca actcacctgt + 15121 cgcaaactat aagggaagtc tttataacct tcctttcaat atgaatacct tctatactat + 15181 gtggggcaca aaaactccac aagaagtgaa ggataagatt gctgagcaga cagctggtat + 15241 gaaggatgtt gagccgaaaa atctggaaga acaagctatc aagttgattg gtccggatat + 15301 ctatgaaaag ttgatcaagg gttatacaga aaagcaatgg ggacgctcag cgacagaact + 15361 tcctccattt atcataaaac gccttccagt tcgtttaacc tttgataata actattttaa + 15421 tgaccgttac caagggattc ctattggtgg ttacaatgtc atcatcgaaa atatgctgaa + 15481 agatgtagaa gttgaacttg gagtagactt ttttgctcat cgtgaagagt tggaagcatc + 15541 tgctaacaaa gttgtcttca caggaatgat cgaccaatat tttgactaca agcacggaga + 15601 gttagaatac cgtagccttc gttttgagca tgagatttta gacgaggaaa attatcaagg + 15661 gaatgctgta gtgaactata 
cagagcgtga gatcccttat actcgtatta tcgaacacaa + 15721 acattttgaa tatggaatgc agccaaagac agttatcacg catgaatatc cagctgactg + 15781 gaagcgtggg gacgagccct actatcctat taacgatgag aaaaataatg ctatgtttgc + 15841 taaataccaa gaagaagcag cgcagaatga taaagttatc ttttgtgggc gtttagcaga + 15901 ctataaatat tacgatatgc atgtggtgat tgaacgggcg cttgaggttg tggagaaaga + 15961 atttagtaat tgaaaaacaa cgaagaaagg ttgcttatat atgaaaggta ttattcttgc + 16021 aggtggttcg gggacacgat tatatccttt gactcgggct gcatcaaaac aacttatgcc + 16081 ggtttatgat aaacccatga tttactatcc tttgtcaacc ctgatgttga ctggaataaa + 16141 ggacattttg attatctcaa caccacagga tttgccccgt tttaaggact tgctcttgga + 16201 tggttccgaa tttgggatca agctttccta tgcggaacaa cctagtcccg atggacttgc + 16261 tcaggctttt attatcggtg aagagtttat cggtgacgat agcgttgcct tgattttagg + 16321 tgacaatatt taccatggtc ctggtctgag cacaatgctt caaaaagcag ccaagaaaga + 16381 gaaaggtgcg actgtttttg gctaccaagt gaaggatcca gagcgttttg gtgtggttga + 16441 gtttgataca gacatgaatg ctatttctat cgaagaaaag ccagagcacc ctcgttcaaa + 16501 ctatgcagtt acaggaatct atttctatga taatgatgta gtagagattg ccaaaagtat + 16561 aaaaccaagc cctcgtggtg aactggaaat tacagatgta aacaaggctt acctaggtcg + 16621 tggagattta tccgttgagg ttatgggacg aggctttgct tggctggata ctggaactca + 16681 tgaaagttta ttagaggctt cgcagtacat cgaaacagtc caacggatgc aaaatgttca + 16741 ggtagcaaac ttagaagaaa ttgcctatcg catgggttat atcagtcgtg aagatgtatt + 16801 gaccttagcc caaccactta agaaaaatga atacggacag tatctgctcc gtttgattgg + 16861 agaagcatag atgacagata attttttcgg taagacgctt gcggcacgca aggttgaagc + 16921 tattccaggc atgttggagt ttgatatccc cgttcatgga gataatcgtg gctggtttaa + 16981 agaaaatttc caaaaggaaa aaatgcttcc acttggattt ccagagtctt tctttgcaga + 17041 aggaaaattg caaaacaatg tatccttctc acgtaaaaat gtccttcgag ggctccacgc + 17101 agagccttgg gataagtaca tctctgtagc agatggaggg aaagttctgg gttcttgggt + 17161 tgatctacgc gagggtgaaa cctttgggaa tacctatcag acagtaattg atgcaagcaa + 17221 gggaatcttt gttcctcgag gcgtagctaa tggcttccaa gttctatcag atacagtgtc + 17281 atatagctat ctggtcaatg 
attactgggc tctcgagctc aaacccaagt atgcctttgt + 17341 gaactacgct gatccaagcc ttggtattga atgggaaaat attgcagaag cagaggtttc + 17401 agaagcagat aaacatcatc ccctacttaa ggatgtaaaa cctttgaaaa aagaagattt + 17461 gtaaaaagga aagaatatga ctgaatacaa aaatattatc gtgacaggtg gagctggctt + 17521 tatcggttct aactttgtcc attatgttta cgagaacttt ccaggtgttc acgtgacagt + 17581 cctagataag ttgacttatg ctggaaatcg cgcgaatatt gaggaaattt taggtaatcg + 17641 tgttgagtta gttgttggtg acattgctga tgcggagttg gtagacaagt tggctgctca + 17701 agcagatgct atcgttcatt atgcagcgga aagccacaat gataattcgc tcaatgatcc + 17761 atcgccattt attcatacta acttcatcgg aacctatact cttttagaag ctgctcgtaa + 17821 gtatgatatt cgcttccacc atgtatcgac agatgaagtt tatggggatc tccctttacg + 17881 cgaagatttg ccaggtcatg gtgaaggacc aggtgagaaa tttactgctg aaacaaaata + 17941 caacccaagc tctccgtact catcaaccaa ggcagcctca gatttgattg tcaaagcctg + 18001 ggtgcgttct tttggagtca aggcaacgat ttccaactgt tcaaataact acggtcctta + 18061 tcaacatatc gaaaaattca tcccacgtca gattactaac atcctaagtg gaattaagcc + 18121 aaaactttac ggtgaaggta agaatgttcg tgactggatt cataccaatg accattcttc + 18181 aggagtttgg acaatcttga caaaagggca aatcggtgaa acctacttga ttggggctga + 18241 tggtgagaag aacaataagg aagttttgga acttatcctt aaggaaatgg gacaagctac + 18301 ggatgcctat gatcatgtga ctgaccgtgc aggacatgac cttcgctatg cgattgatgc + 18361 cagcaagctc cgtgatgagt tggggtggaa acctgaattt accaactttg aagctgggct + 18421 caaggcaaca atcaagtggt atacagataa ccaagaatgg tggaaagcag aaaaagaagc + 18481 tgttgaagcc aattatgcta agactcagga gattattaca gtataaaaac caggaaatag + 18541 ctgcttttta ttgctatatt gggaagagtt acatattaga aaggtctaga gatgatttta + 18601 attacagggg caaatggcca attaggaacg gaacttcgct atttattgga tgaacgtaat + 18661 gaagaatacg tggcagtaga tgtggctgag atggacatta ccaatgaaga aatggttgag + 18721 aaagtttttg aagaggtgaa accgacttta gtctaccatt gtgcagccta caccgctgtt + 18781 gatgcagcag aggatgaagg aaaagagttg gacttcgcca tcaatgtgac ggggacaaaa + 18841 aatgtcgcaa aagcatctga aaagcatggt gcaactctag tttatatttc tacggactat + 18901 gtctttgacg gtaagaaacc 
agttggacaa gagtgggaag ttgatgaccg accagatcca + 18961 cagacagaat atggacgcac taagcgtatg ggggaagagt tagttgagaa gcatgtgtct + 19021 aatttctata ttatccgtac tgcctgggta tttggaaatt atggcaaaaa cttcgttttt + 19081 accatgcaaa atcttgcgaa aactcataag actttaacag ttgtaaatga ccagtacggt + 19141 cgtccgactt ggactcgtac cttggctgag ttcatgacct acctagctga aaatcgtaag + 19201 gaatttggtt attatcattt gtcaaatgat gcgacagaag acacaacatg gtatgatttt + 19261 gcagttgaaa ttttgaaaga tacagatgtc gaagtcaagc cagtagattc cagtcaattt + 19321 ccagccaaag ctaaacgtcc gctaaactca acgatgagcc tggccaaagc caaagctact + 19381 ggatttgtta ttccaacttg gcaagatgca ttgcaagaat tttacaaaca agaagtgaga + 19441 taagtagtag aatgattttc tagtctaata aaagaggcag agaatgaact ccaaaggagc + 19501 ttaagatgta cgattatatt attgtcggtg ctggtttgtc aggagcaatt tttgcttatg + 19561 aggcgaccaa gcgtggaaaa aaagtaaaag tgattgataa acgtaaccac attggtggga + 19621 atatctactg tgagaatgta gaaggagtta atgttcataa atatggtgcc catatctttc + 19681 atacttctaa taagaaagtt tgggattatg ttaatcaatt tgctgaattt aacaactacg + 19741 tcaactcgcc tgtagctaat tacaagggta gcctctataa tctacctttc aatatgaata + 19801 ccttctatgc tatgtggggg acaaaaactc ctcaagaagt caaagataag attactgagc + 19861 agacagctga tatgaaggat gttgagccga aaaatctgga agaacaggct atcaagttga + 19921 ttggtccaga tgtctatgaa aagttaatca agggttatac tgaaaagcag tggggacgct + 19981 cagcaacgga acttcctcca tttatcatta aacgtcttcc agttcgttta acatttgata + 20041 ataactattt taacgaccgt taccaaggaa ttcctattgg tggttacaat gtcatcatcg + 20101 aaaatatgct taaagacgtt gaagttgagc ttggtgttga tttctttgct catcgtgaag + 20161 agttagaagc atcagctgaa aaagttgtct ttacagggat gatcgaccag tattttgact + 20221 acaagcacgg agagttagaa taccgtagcc ttcgttttga gcatgagatt ttagacgagg + 20281 aaaattatca aggaaatgct gtagtgaact atacggagcg tgagattcct tatactcgta + 20341 ttatcgaaca caagcatttt gaatatggaa cgcaggcaaa gacagttatc acgcgtgaat + 20401 atccagctga ctggaagcgt ggggacgagc cttactatcc gatcaacgat gagaaaaata + 20461 atgctatgtt tgctaagtac caagaggaag cttcaaagaa tgataaggtt attttctgtg + 20521 gacgtttagc agattataaa 
tattatgata tgcatgtggt gattgaacgg gcgcttgagg + 20581 ttgtggagaa agagtttgga tatgacaaaa agtagaatca attggataga ttttggaaaa + 20641 ggcttttcca tatttttagt cttagcaggg catgtgttgc ttggactgta tcaatcggaa + 20701 aaatttccca cagcaaataa catactatcg ttgttgatag cacaagtcta catatttcat + 20761 ataccagtat tttttgcctt atcaggatac tttttcaaac ctgtgtcgga tttgaaggag + 20821 ttctggcaat atgctaaaaa gaagacaatt gtttttggtc tgccatatat tttctattcg + 20881 atcattcact ttggtcttca aaaagttgca ggggcatctg ttcgtgttcc tacaaccata + 20941 tctgatttgc taaatatcta taaagatcct cttggagttt cgtggtattt atatatactc + 21001 tggtcgattt tgataatcta tggattattg tctattttag tcaaaaatcg tagaatgtta + 21061 tttttgataa gtgttttcgc ttattgttta accctatttg ttcaaacaga tatttatatt + 21121 attcaaagaa cgctagtttg ggggatttgt ttctttcttg gcagtgtatt gagtgaaatt + 21181 cactttgata aaattaattt gaaaaaattt ctttttttct ttgtgttatt tgattttatt + 21241 tatatgttcg cttggttctt gttttatgaa gtagggtcta agaaggatta tgtaagctat + 21301 agtaacccag gtttgtgggg gattgctttt attgtctgtg tattagttgc ttttgcgatt + 21361 tttcctaaaa tggagaaaaa ttttcctaaa actttcctat atttcactaa atacgggaaa + 21421 gatagtttag ggatctatat tcttcatgca ccaatttgta gcatgattcg gattctaatg + 21481 ttgaaagtgg gaataaactc agtttttatt cacgttgttg ttgggattgt gctaggctgg + 21541 tatttatcca tactagcaac ttatatattg aaaaaaattc catttttgaa tattgtttta + 21601 ttaccacaaa agtatattaa attaaaataa attattttag atttataatg tggctctttg + 21661 tcaactaaca tctggagagg acaatcactg tcttctcttt ttttgtcttt tcagaatata + 21721 ccaaattaac acaaaaattc tgaaaattct attgacaact ttctgaaaag agtctataat + 21781 ggagagaaag ttttaaagga gaaaatgatg aaaagttcaa aactatttgc ccttgcgggc + 21841 gtgacattat tggcggcgac tactttagcc gcatgctctg gatcaggttc aagcgctaaa + 21901 ggtgagaaga cattctcata catttatgag acagaccctg ataacctcaa ctatttgaca + 21961 actgctaagg ctgcgacagc aaatattacc agtaacgtgg ttgatggttt gctagaaaat + 22021 gatcgctacg ggaactttgt gctgtctatg gctgaggatt ggtctgtatc taaggatgga + 22081 ttgacttaca cttatactat ccgtaaggat gcaaaatggt atacttctga aggtgaagaa + 22141 tacgcggcag tcaaagctca 
agac +// + diff --git a/public/res/serotype_genbank/serotype_32A.gb b/public/res/serotype_genbank/serotype_32A.gb new file mode 100644 index 0000000..a420c1e --- /dev/null +++ b/public/res/serotype_genbank/serotype_32A.gb @@ -0,0 +1,1143 @@ +LOCUS CR931696 25372 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 2813/41 (serotype 32a). +ACCESSION CR931696 +VERSION CR931696.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 25372) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 25372) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..25372 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="2813/41" + /db_xref="taxon:1313" + gene <1..33 + /gene="dexB" + /locus_tag="SPC32A_0001" + CDS <1..33 + /gene="dexB" + /locus_tag="SPC32A_0001" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34112.1" + /db_xref="UniProtKB/TrEMBL:Q4JZU9" + /translation="PWDAFCVELL" + gene 192..360 + /gene="aliB" + /locus_tag="SPC32A_0002" + /pseudo + CDS 192..360 + /gene="aliB" + /locus_tag="SPC32A_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(361..1165) + /gene="tnp" + /locus_tag="SPC32A_0003" + /pseudo + CDS complement(join(361..795,794..1165)) + /gene="tnp" + /locus_tag="SPC32A_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(join(793..795,794..1147)) + /gene="tnp" + /locus_tag="SPC32A_0003" + /note="HMMPfam hit to PF01710, Transposase, score 3.9e-19" + /pseudo + gene complement(1562..2955) + /gene="tnp" + /locus_tag="SPC32A_0004" + /pseudo + CDS complement(join(1562..1696,1696..2955)) + /gene="tnp" + /locus_tag="SPC32A_0004" + /note="member of homology group 17" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1202 transposase" + misc_feature complement(1969..2472) + /gene="tnp" + /locus_tag="SPC32A_0004" + /note="HMMPfam hit to PF00665, Integrase core domain, + score 3.6e-20" + /pseudo + gene complement(3061..4014) + /gene="tnp" + /locus_tag="SPC32A_0005" + CDS complement(3061..4014) + /gene="tnp" + /locus_tag="SPC32A_0005" + /note="member of homology group 39" + /codon_start=1 + /transl_table=11 + /product="putative IS1239 transposase" + /protein_id="CAI34116.1" + /db_xref="GOA:Q4K0X9" + /db_xref="InterPro:IPR001584" + /db_xref="InterPro:IPR012337" + /db_xref="UniProtKB/TrEMBL:Q4K0X9" + 
/translation="MQEHYTPKGKHLTIDNRRLIERWKNENKSNREIAGLLGKAPQTI + HNEVKRGTTLQQVRKGLYKKVYSADYAQTVYQFNRKRSVKKLILTKEIREKILHYHKQ + KFSPEMMVNKKQVKVGISTIYYWFHNGHLGLTKADMLYPRKRKGVKKQASPNFKPAGK + SIEERPDVINLRLENGHYEIDTVLLTKIKNYCLLVLTDRRSRHQIIRLIPNKTAESVN + QALTLLLGEHRILSITADNGSEFKRLSEVFPEEHIYYAHAYSSWERGSNENHNRLIRR + WLPKGTKKTTPKEVAFIENWINNYPKKCLDYKSPSEFLLGG" + misc_feature complement(3070..3507) + /gene="tnp" + /locus_tag="SPC32A_0005" + /note="HMMPfam hit to PF00665, Integrase core domain, + score 6.6e-23" + misc_feature complement(3868..3933) + /gene="tnp" + /locus_tag="SPC32A_0005" + /note="Predicted helix-turn-helix motif with score + 1087.000, SD 2.89 at aa 28-49, sequence + KSNREIAGLLGKAPQTIHNEVK" + gene 4368..5822 + /gene="wzg" + /locus_tag="SPC32A_0006" + CDS 4368..5822 + /gene="wzg" + /locus_tag="SPC32A_0006" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI34117.1" + /db_xref="GOA:Q4JZS6" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4JZS6" + /translation="MLIMSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNI + LAFRYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGL + TNRLNATSNYSEYSISVAVLADSEIENVTQLMSVTAPTGTDNENIQKLLADIKSSQNT + DLTVNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKV + EAPKTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPI + ADGGNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVH + NDQEFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKL + TSTEALKNYGTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRMGL + PSYAMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 4368..4493 + /gene="wzg" + /locus_tag="SPC32A_0006" + /note="Signal peptide predicted for SPC1480 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 42 and 43" + misc_feature 4581..4928 + /gene="wzg" + /locus_tag="SPC32A_0006" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, 
score 2.7e-63" + misc_feature 5106..5549 + /gene="wzg" + /locus_tag="SPC32A_0006" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 5.7e-70" + gene 5824..6555 + /gene="wzh" + /locus_tag="SPC32A_0007" + CDS 5824..6555 + /gene="wzh" + /locus_tag="SPC32A_0007" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34118.1" + /db_xref="GOA:Q4JZS5" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4JZS5" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEKDLVHIIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 5827..6435 + /gene="wzh" + /locus_tag="SPC32A_0007" + /note="HMMPfam hit to PF02811, PHP domain, score 1.5e-36" + gene 6561..7256 + /gene="wzd" + /locus_tag="SPC32A_0008" + CDS 6561..7256 + /gene="wzd" + /locus_tag="SPC32A_0008" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34119.1" + /db_xref="GOA:Q4JZS4" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4JZS4" + /translation="MMKEQNTIEIDVFQLFKTLWKRKLMILLVALVTGAGAFAYSAFI + VKPEYTSTTRIYVVNRNQGDKSGLTNQDLQAGSYLVKDYREIILSQDVLEKVATNLKL + DMPAKTLTRKVQVTVPVDTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIELLDIRVKRPEDVEDVLQI + PLLGVVPDFDKMK" + misc_feature 6561..6677 + /gene="wzd" + /locus_tag="SPC32A_0008" + /note="Signal peptide predicted for SPC1482 by SignalP 2.0 + HMM (Signal peptide probability 0.729) with cleavage site + probability 0.460 between residues 39 and 40" + misc_feature 6582..6998 + /gene="wzd" + /locus_tag="SPC32A_0008" + /note="HMMPfam hit to PF02706, Chain 
length determinant + protein, score 1.5e-56" + misc_feature 7104..7181 + /gene="wzd" + /locus_tag="SPC32A_0008" + /note="PS00217 Sugar transport proteins signature 2." + gene 7266..7955 + /gene="wze" + /locus_tag="SPC32A_0009" + CDS 7266..7955 + /gene="wze" + /locus_tag="SPC32A_0009" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34120.1" + /db_xref="GOA:Q4JZS3" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4JZS3" + /translation="MPTLEISQAKLDFVKKAEENYNALCTNLQLSGDDLKVFSITSVK + QGEGKSTTSTNIAWAFARAGYKTLLIDADIRNSVMLGVFKARDKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRKCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGVVLNKFDTSVDKYGSY + GNYGDYGKNKK" + gene 7970..9337 + /gene="wchA" + /locus_tag="SPC32A_0010" + CDS 7970..9337 + /gene="wchA" + /locus_tag="SPC32A_0010" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI34121.1" + /db_xref="GOA:Q4JZS2" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4JZS2" + /translation="MNGKIVKSSLAIIQSFLVILLTYLLSAVREAEIVSTTAIALYIL + HYFVFYISDYGQDFFKRRYLIELVQTLKYILFFALAISISNFFLEDQFSISRRGMIYF + LTLHALLVYVLNLFIKWYWKRAYPNFKGSKKILLLTATSRVEKVLDRLIESNEVVGEL + VAVSVLDKPDFQHDCLKIVAEGEIVNFATHEVVDEVFIDLPSEKYNIGELVSQFETMG + IDVTVNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHVIAKRIIDIMGALVGLIL + CGLVSIVLVPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKNGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVLM + KDGAK" + misc_feature 7970..8062 + /gene="wchA" + /locus_tag="SPC32A_0010" + /note="Signal peptide predicted for SPC1484 by SignalP 2.0 + HMM (Signal peptide probability 0.902) with cleavage site + probability 0.355 between residues 31 
and 32" + misc_feature 8753..9334 + /gene="wchA" + /locus_tag="SPC32A_0010" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 4.4e-156" + gene 9341..10555 + /gene="wchF" + /locus_tag="SPC32A_0011" + CDS 9341..10555 + /gene="wchF" + /locus_tag="SPC32A_0011" + /note="member of homology group 15" + /codon_start=1 + /transl_table=11 + /product="putative rhamnosyl transferase WchF" + /protein_id="CAI34122.1" + /db_xref="GOA:Q4JZS1" + /db_xref="InterPro:IPR001296" + /db_xref="InterPro:IPR015393" + /db_xref="UniProtKB/TrEMBL:Q4JZS1" + /translation="MPLSLVRREMKQSVYIIGSKGIPAKYGGFETFVEKLTEYQKDGN + IQYYVACMRENSAKSGFTADTFEYNGAICYNIDVPNIGPARAIAYDIAAVNKAIELAK + GNKDEAPIFYILACRIGPFISGLKKKIRSVGGRLLVNPDGHEWLRAKWSMPVRKYWKF + SEQLMVKHADLLVCDSKNIEKYIREDYKQYQPKTTYIAYGTDTTPSSLKSEDVKVRNW + YREKGVSENGYYLVVGRFVPENNYETMIREFIKSKSNKDFVLITNVEQNKFYDQLLKE + TGFDKDPRVKFVGTVYDQELLKYIRENAFAYFHGHEVGGTNPSLLEALASTKLNLLLD + VGFNREVGEDGAIYWKKDVGDLARLIDIVDRKDETFREKLGLMAKDRIETAYSWQFIE + KEYKEIWDEEAI" + misc_feature 9986..10483 + /gene="wchF" + /locus_tag="SPC32A_0011" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 0.00031" + gene 10485..11570 + /gene="wcyH" + /locus_tag="SPC32A_0012" + CDS 10485..11570 + /gene="wcyH" + /locus_tag="SPC32A_0012" + /note="member of homology group 178" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI34123.1" + /db_xref="GOA:Q4JZU1" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q4JZU1" + /translation="MKQHIVGNSLKKSIRRFGMRKRYDNLDGLRVISCLGIIAMHIKA + NADYQIYGWIFEVFVPSLTLLVYLFLLISGFGMFCGYYERFKEGKIDLNNFYKKRYKK + IIPFFAFLIFIDILVERSFSHLIEGFTEATLVFGLLPNNQPDVIGVSWTIGVIFLFYM + LFPFFVWLCWDKKRAFISFIISVILNIFCEIYYFTDKFVIDSFASRHSFLYCSPFFLG + GGLIYMYRKEIKDFVSQRKLFCLLGCLGITGFHYLFIQPWFKMDNLGSLLLLLYLPWL + CYAISVDSIVLSNKVMKYFSKISLELYLAHMVLFRVVEKMNFLYFFGKGWLSFILVFV + AVLIGLILLIEFLKKMTSFSRRLLIKE" + misc_feature 10485..10622 + /gene="wcyH" + /locus_tag="SPC32A_0012" + /note="Signal peptide 
predicted for SPC1486 by SignalP 2.0 + HMM (Signal peptide probability 0.823) with cleavage site + probability 0.803 between residues 46 and 47" + misc_feature 10551..11546 + /gene="wcyH" + /locus_tag="SPC32A_0012" + /note="HMMPfam hit to PF01757, Acyltransferase family, + score 7.2e-06" + gene 11751..12986 + /gene="wzy" + /locus_tag="SPC32A_0013" + CDS 11751..12986 + /gene="wzy" + /locus_tag="SPC32A_0013" + /note="member of homology group 179" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI34124.1" + /db_xref="UniProtKB/TrEMBL:Q4JZR9" + /translation="MDMNKITIRELIILFVLILFIFQNLLEKYFVYAQYIDEIVALLF + LIHYFLRVVLNKSISKKFSRLVLLLLTIILITLISNFWNNVQTNILIISIDLFSIFKF + IFIFLGAQSFLNDLTHKEIKRIILRVYFISNIYLSVLIVLAFLNIFIGLGMHQEYRYG + LPTFSFIFGTPGQVINLSIIFLLLYQLNKLYNSKNNLIHLVLIFLLLLSTLKTRAIVL + AIVFVYILYLFEIRNISSMKKRVLPVLGLGAVVGFEQFKTYFLTSDTPRLTLFKYGML + TMRRYFPLGSGFATYGSDIAAKNYSLLYYQYGFHNRYGMNPYDIRFLNDNFYPMIFAQ + FGFLGGILYVFLLLDYFRLLLRVASINDKVIKTSVFIYIFNVVLSSIQSSYPGTNSMV + ITTFLICLILRYSDKWRIL" + gene 12971..13681 + /gene="wcyI" + /locus_tag="SPC32A_0014" + CDS 12971..13681 + /gene="wcyI" + /locus_tag="SPC32A_0014" + /note="member of homology group 180" + /codon_start=1 + /transl_table=11 + /product="hypothetical protein" + /protein_id="CAI34125.1" + /db_xref="UniProtKB/TrEMBL:Q4JZR8" + /translation="MEDFMIIEAIGLPGSGKTFLFHELEKEFRSNSIRTYNFTELSRN + NISVKIVVKLLLKFVSLKYICKKWKKELYDILSEELPYESKFDLYENPDYCVNYALML + LFIYRLFQNSKIVLLLDEGMYHNIVKLCADFDFSIRLSNKLIEKCVLLSRLNDSKHIV + IYNIFPISETLLSIEKRNRHVSKFDELETTQLSKILDNYDKLNNAIYNNDKKQIISVF + RKDFIEKNISYIKQNLNI" + gene 13759..14637 + /gene="wchQ" + /locus_tag="SPC32A_0015" + CDS 13759..14637 + /gene="wchQ" + /locus_tag="SPC32A_0015" + /note="member of homology group 43" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34126.1" + /db_xref="GOA:Q4JZR7" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JZR7" + 
/translation="MVIFVVLHYMVFKETKQCVNSIKNNVKGEKKIIIVDNCSPNGSY + SSLVDAFGCDKDIIIMKSDSNLGFARGNNLGYKYAVENFNPDFIVVMNNDMEIFQEDF + IDKLYESYAKYGYYILGPDIYSTKQEYHQNPQTRKVLDRSDLKLLYRKLVIKDRLRFL + VPVKWWFKNILIKNKSVDNNSKDKNEYVQNIVKNPLLHGSCYVFSKKFTEKHQHTCFY + DKTFMYMEAEILHYMALKNNELMLYYPDLKVYHHEDVATDSTFVKQYKKSFFSIRCLL + QSTKAFIDLIDSDKKE" + misc_feature 13765..14259 + /gene="wchQ" + /locus_tag="SPC32A_0015" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 7.8e-15" + gene 14641..16101 + /gene="wzx" + /locus_tag="SPC32A_0016" + CDS 14641..16101 + /gene="wzx" + /locus_tag="SPC32A_0016" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI34127.1" + /db_xref="GOA:Q4JZR6" + /db_xref="InterPro:IPR002528" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4JZR6" + /translation="MESQKKSVEKNYIYNLIYQMLTVVIPIIITPYISRVLNADGIGI + FSYTTAVVGYFVLLGNLGIATYGQLQVAKYQEDRFKLSKIFFELLILRTILLLLVLLI + YLVFIQFQDIIYKSIYYVLIIQILCSLLDISWFLQGLEEFKSIVMRNTLIKVLSVISI + LIFVKKDTDLILYALIMNASTLLGNISIFAYVPKYVQRVKLAEINLLKHISHCLVYFI + PTIATTIYLTLDKTMIGWFSLNTFENGYYEQAQKIEQMVVTIVTSLSVVTMPRMTYLL + NNNQFQEFKVRLEQSIRFILFLSLPMSLGLVGIANNFIPLFLGVGFEKSISILKIFSL + LVIIIGLNNALGKQILMPSGQQRAYNISVVIGAVINIVFNLILIPQFFSLGAAISSVL + AEFAILIIFLYYSRNCIPPKWVIRTAVKYLGSSIVMFLIIRTIELLSPPSWTVVIIQV + IVGVAVYILSLYILKDQIVRKYYLRLRKLNVLARKV" + misc_feature 14662..15468 + /gene="wzx" + /locus_tag="SPC32A_0016" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 1.7e-44" + gene 16141..17097 + /gene="wcyS" + /locus_tag="SPC32A_0017" + CDS 16141..17097 + /gene="wcyS" + /locus_tag="SPC32A_0017" + /note="member of homology group 118" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34128.1" + /db_xref="GOA:Q4JZR5" + /db_xref="InterPro:IPR008441" + /db_xref="UniProtKB/TrEMBL:Q4JZR5" + /translation="MSIFSTLIKKKGAEIFKDLIQSRVLFRTIAILPLVGFSKKSLEI + 
VRLNNSNVVLSKLRRKYKQTIKNLDREKQYSLSYNQRHKDASNKIWICWFQGLDTAPH + VVQECIASVKKHLADREVVVLTDENYHQYVTFPDYIKEKATQGFISKAHFADLLRLEL + LTEYGGTWIDGTIFCSSSDIPAYMLDSDLFLFQNLKPGLDGQALAISNWFITASYSNH + PLLNMTKDLLYDYWKNHNGVVDYFIFHHFFQLSIEEFPEYWSKVVPFNNSTPHILQLR + LFEEFDEVMYGYILEQTPFHKLTYKFEEEKSRIPNTYYKHLF" + misc_feature 16276..17091 + /gene="wcyS" + /locus_tag="SPC32A_0017" + /note="HMMPfam hit to PF05704, Capsular polysaccharide + synthesis protein, score 3.3e-69" + gene 17173..17994 + /gene="wcrN" + /locus_tag="SPC32A_0018" + CDS 17173..17994 + /gene="wcrN" + /locus_tag="SPC32A_0018" + /note="member of homology group 119" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="CAI34129.1" + /db_xref="GOA:Q4JZR4" + /db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4JZR4" + /translation="MKELTTREMQEVSLEILHTIASICEKHHFRYALIYGTLIGAVRH + KGYIPWDDDVDIMMPRPDYDRLLEYLKENIADYPHLKVFNREECPEYPYMITRISDQR + YRIEMENEKPFDLGVFIDIYPYDGLGDTKEEAVDFGMKGDRLSSFCYQATREHFAIET + TTSTFRKLIKYPVYLFSKMIGKDYFQKQLAKLARVKDYDNSEYVGCVIWLSWGEKDIF + PREWFDETILVPFEKYEFRIPKEFDKVLRHEYGDYMILPPEKDRVGHHYFKAYKK" + misc_feature 17242..17925 + /gene="wcrN" + /locus_tag="SPC32A_0018" + /note="HMMPfam hit to PF04991, LICD Protein Family, score + 2.5e-45" + gene 18159..18428 + /gene="HG271" + /locus_tag="SPC32A_0019" + /pseudo + CDS 18159..18428 + /gene="HG271" + /locus_tag="SPC32A_0019" + /note="member of homology group 271" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative transferase (pseudogene)" + misc_feature 18162..18215 + /gene="HG271" + /locus_tag="SPC32A_0019" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 0.13" + /pseudo + misc_feature 18249..18302 + /gene="HG271" + /locus_tag="SPC32A_0019" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 0.26" + /pseudo + misc_feature 18303..18356 + /gene="HG271" + /locus_tag="SPC32A_0019" + /note="HMMPfam hit to PF00132, Bacterial 
transferase + hexapeptide (three rep, score 0.032" + /pseudo + gene 18898..19767 + /gene="rmlA" + /locus_tag="SPC32A_0020" + CDS 18898..19767 + /gene="rmlA" + /locus_tag="SPC32A_0020" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI34131.1" + /db_xref="GOA:Q4JZR3" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q4JZR3" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLHRFQELLQDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFISDDSV + ALILGDNIYHGSGLSKMLQKAASKESGATVFGYHVKDPERFGVVEFDQDMKAISIEEK + PEYPRSNYAVTGLYFYDNDVVEIAKSINPSPRGELEITDVNKAYLDRGGLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISKEQVHELAQPLKKN + EYGQYLLRLIGEV" + misc_feature 18901..19617 + /gene="rmlA" + /locus_tag="SPC32A_0020" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 3.3e-118" + gene 19768..20364 + /gene="rmlC" + /locus_tag="SPC32A_0021" + CDS 19768..20364 + /gene="rmlC" + /locus_tag="SPC32A_0021" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI34132.1" + /db_xref="GOA:Q4JZR2" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:Q4JZR2" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGKTYQTVIDASKGIFVPRGVANGFQVLSDTASYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENLEEADVSEADKHHPLLKDVKPLKKEDLE" + misc_feature 19804..20334 + /gene="rmlC" + /locus_tag="SPC32A_0021" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 3e-16" + gene 20374..21423 + /gene="rmlB" + /locus_tag="SPC32A_0022" + CDS 20374..21423 + /gene="rmlB" + /locus_tag="SPC32A_0022" + /EC_number="4.2.1.46" + /note="member of homology group 8" + 
/codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI34133.1" + /db_xref="GOA:O54546" + /db_xref="HSSP:1KEP" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:O54546" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPDVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAAD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 20389..21345 + /gene="rmlB" + /locus_tag="SPC32A_0022" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.00012" + misc_feature 20392..21132 + /gene="rmlB" + /locus_tag="SPC32A_0022" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 5.4e-77" + misc_feature 20395..21207 + /gene="rmlB" + /locus_tag="SPC32A_0022" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/iso, score 1.4e-05" + gene 21489..22340 + /gene="rmlD" + /locus_tag="SPC32A_0023" + CDS 21489..22340 + /gene="rmlD" + /locus_tag="SPC32A_0023" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI34134.1" + /db_xref="GOA:Q4K1G6" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K1G6" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITNEEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 21489..22337 + /gene="rmlD" + /locus_tag="SPC32A_0023" + /note="HMMPfam hit to PF04321, RmlD 
substrate binding + domain, score 4e-147" + misc_feature 21492..22133 + /gene="rmlD" + /locus_tag="SPC32A_0023" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.00013" + misc_feature 21492..22121 + /gene="rmlD" + /locus_tag="SPC32A_0023" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 9.9e-19" + misc_feature 21495..22223 + /gene="rmlD" + /locus_tag="SPC32A_0023" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 2.9e-08" + gene order(22416..23369,23380..23601) + /gene="tnp" + /locus_tag="SPC32A_0024" + /pseudo + CDS join(22416..23369,23380..23601) + /gene="tnp" + /locus_tag="SPC32A_0024" + /note="member of homology group 12" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1670 transposase" + misc_feature 22422..22865 + /gene="tnp" + /locus_tag="SPC32A_0024" + /note="HMMPfam hit to PF03050, Transposase IS66 family, + score 6e-05" + /pseudo + gene complement(23698..24954) + /gene="tnp" + /locus_tag="SPC32A_0025" + CDS complement(23698..24954) + /gene="tnp" + /locus_tag="SPC32A_0025" + /note="member of homology group 13" + /codon_start=1 + /transl_table=11 + /product="putative IS1167 transposase" + /protein_id="CAI34136.1" + /db_xref="GOA:Q4JZQ9" + /db_xref="InterPro:IPR002560" + /db_xref="InterPro:IPR012287" + /db_xref="UniProtKB/TrEMBL:Q4JZQ9" + /translation="MEQLHLITKLLDIKDPNIKILDIINMDTHKEIIAKLDYEAPSCP + DCGSLMKKYDFQKPSKIPYLETTGMPSRILLRKRRFKCYHCSKMMVAETPLVKKNHQI + PRIINQKIAQKLIEKISMTDIAHQLAISTSTVIRKLNDFHFEHDFSRLPKIMSWDEYA + FTKGKMSFIAQDFDNLNIITVLEGRTQAVIRNHFLRYDRAVRCQVKIITMDMFSPYYD + LAKQLFPCAKIVLDRFHIIQHLSRAMSRFRVQIMNQFERKSHEYKAIKRYWKLIQQDS + RKLSDKRFYRPTFRMHLTNKEILDKILSYSEDLKHHYQIYQLLLFHFQNKDPEKFFGL + IEDNLKQVHPLFQTVFKTFLKNKEKIVNALQLHYSNAKLEATNNLIKLIKRNAFGFRN + FENFKKRIFIALNIKKERTKFVLSQA" + misc_feature complement(24202..24498) + /gene="tnp" + /locus_tag="SPC32A_0025" + /note="HMMPfam hit to PF01610, Transposase, score 5e-48" + misc_feature 
complement(24538..24603) + /gene="tnp" + /locus_tag="SPC32A_0025" + /note="Predicted helix-turn-helix motif with score + 1691.000, SD 4.95 at aa 118-139, sequence + ISMTDIAHQLAISTSTVIRKLN" + gene 25220..>25372 + /gene="aliA" + /locus_tag="SPC32A_0026" + CDS 25220..>25372 + /gene="aliA" + /locus_tag="SPC32A_0026" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34137.1" + /db_xref="UniProtKB/TrEMBL:Q4K0S2" + /translation="MMKSSKLFALAGVTLLAATTLAACSGSGSSTKGEKTFSYIYETD + PDNLNYL" + misc_feature 25220..25306 + /gene="aliA" + /locus_tag="SPC32A_0026" + /note="Signal peptide predicted for SPC1500 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.277 between residues 29 and 30" +ORIGIN + 1 ccatgggatg ctttctgtgt ggaattacta taaatatttt ttgcagaaaa atttaaaatt + 61 gaaatcgtat aaaaacaagg gaggactgta taaaaggcag aaatcctttg ttttttataa + 121 ccaaggttta taaaccttca ttctcgaaat tcaattaact ttacaaattc ccactattaa + 181 ggagaaagaa gacgaacata aagaagcgta tccttagtgc aggcctgact tttacatctg + 241 ctttgctttt agctgcttgc gaccaatcag gttcagatac aaaaacttac tcatcaacct + 301 ttagtggaaa tccaactaca tttaactatc tattagacta ttacgctgat aatatagtca + 361 attgaaacaa gaacaagaca aaagagccca tgttttctca ataggattgt actcaggtga + 421 atagggagga agaggtaaaa gtttatgccc aaactcttca cacaagagtt ctagcttccc + 481 cattctatgg aatcttgcat tatccataat aataaccgat ggtgtggtta atgttggtaa + 541 gagaaatttc tgaaaccaag cttcaaaaaa gtcgctcgtc atcgtctctt cgtaagtcat + 601 tggagcgatt aactcaccat ttgttagacc tgcaaccaaa gaaatcctct gatatcttct + 661 tccagatact ttgcctcttc ttaactgacc ttttaaagag cgaccatgtt ctcgataaaa + 721 ataagtatcg aatcctgttt cgtcaatcta aacaggtgct aggtgcttta atctattaaa + 781 attcttaaga aataaggcta ctttttctgg gtcttgttca tagtaagtgt ggttcttttt + 841 ttcgagtgta gcccatagct ttgagcgcat agtggatggt agttggatga cagccaaatt + 901 cagaagctat ttcagtcaaa taagcgtctg gattgtcagt aagatagttt ttaagtctat + 961 ctctatcaac ttttcttggt tttgttcctt ttacttggtg gtttagctct cctgtttttt + 1021 cttttagctt taaccagcca taaatggtat 
tacgtgagat ttggaaaacg tgtgatgctt + 1081 ctgttatact acctattcgc tcacaataag agagaacttt tttacgaaaa tctattgaat + 1141 atgccataaa aagattatac cacattgtgt actatattat attgaaacta gaatagtaca + 1201 catctgcttc taaaatattg ttagaaaacg atttgactgt cctgatcaat ttgtcatgtt + 1261 cttatttcat tttactatat tttgctactc cccgtaaagt gtcaatcgaa agtgattatg + 1321 tcccaaaaaa atggagatat tgaggtcaat tattttgatt tcatttgaca cgaggaaccc + 1381 ttgaagctgt tttgccagct aaaccaaggc tagtcttagc cttggctcgc cagcctaaca + 1441 gctccaagcc tcgtgtcaaa tgaaatgctt gtcttacact ccttactttc tcgctcctaa + 1501 atgtaaggga tagagtgatt tcctttaagg aaaagcttcc catttagcga gaaatagatt + 1561 agacttgtag atgaggagaa tcaagctcct cactagtaaa ctcttcataa tcctttttat + 1621 ttttatgaag gtattgtttg aaagatgtga atttccacgg atgggtttgt ggagggatat + 1681 acttgcgtct ttcttttttt gttctggttc ttgttcaaag tttttcgaat agagttcatg + 1741 aactagtagc tcctttgtgt gatagatttt gtcagcgata ttgaggtaga tgtcaccatc + 1801 aaatgctttt ataactaatg ctttcgtctt tctgctgaaa tagacttctt ttccttgttc + 1861 ggtagggata tagcaacgat tttggaagcg gatatggtgt ccactatcga cgactctctc + 1921 cgccagtcta gccagaatga gatttcgttc agagggctta ggagccttct caaagacaga + 1981 gagttttgtc ttgtttccaa actgttcatt aaaggtttgg atgtaggaaa gcaggaaggt + 2041 attggcttct tccaaggtat gaatcttgtt tcgttccagt tcgataggca ggcgagattg + 2101 tagtgtctga ttgagtcttt cgactctccc tttagcttga gggatagagg ttgtctccag + 2161 aagaatcccc agttggtgac aggcgtatcc gaattgtgta tgggtatcgt cctccatttt + 2221 cttagagttg gagatttgat aggtaaagac tgttttttta tctgttttga tttgaagggg + 2281 aatgccgtgg ttgtctaaaa tttgttcgag gacatgatag taagcattca aggtctcttg + 2341 tttatcaaaa taagcgccta ggatattgcc agaagcatca tcaatggcta ggtgtaagtt + 2401 agaggtttgg gctccaaacc aggcatgagg gctggcatcc atttggatga gttctccagc + 2461 aaatttcttt ctgagtctac taggatgtac ttttttaggg tcttcaagga aattttcagc + 2521 tgtcggtaag attggcttgt ctaggggttg cttggggttc agtttagctt gttttcttag + 2581 tctcttcttt gtctttctat gggacttagg cgacaggata ttttccttat agagtatttt + 2641 tctaacagtt gtatcagaga gctgaattcc ttcttcttca gctagcaatt 
cacagaaatg + 2701 acggacattt ggtttatatg ttttatagga gaggtatttc tttaggatac gttctttgat + 2761 ttcatcaggg attgcatgtt ttggttttcg atttctgttt ccgtgtctga aggcttcttt + 2821 tcctttcagt tgatagacca gtagtagacg attgatttgc ctttcagaaa gattgagttc + 2881 ggcacaggct cgtttctttg ttttctttcc ttgggctata gcttttatca caagatattt + 2941 tttcatttca ttcatattta gttggatcct tttcatatga ctattctacc aaatgggaca + 3001 ttttcacgtt cgatttacta aagacattat cacattcgaa tcccaaattt caagttgaag + 3061 ttagccaccc aaaagaaatt cacttggcga cttgtagtcc aagcattttt tagggtagtt + 3121 gttaatccaa ttttcgataa aagctacttc tttcggagtc gttttcttgg ttcctttagg + 3181 taaccatctc cgaattaatc gattatgatt ttcatttgaa cctctctccc atgaagagta + 3241 agcatgtgcg tagtagatat gttcctcagg aaatacctca gacaatcgtt tgaactccga + 3301 accattatct gcagtaatgg acagaatacg atgctcccct aatagtaacg taagcgcctg + 3361 attgacagat tcagcagttt tatttggaat taaccttata atttggtgtc tgctccgccg + 3421 gtcggttaag actaacaggc aataattttt tatcttagtc agtaggacgg tatcaatttc + 3481 ataatgacca ttttccaagc gaagattaat aacgtcagga cgttcttcga tagatttacc + 3541 tgccggctta aagttcggac tagcttgctt cttgacacct ttcctttttc tgggataaag + 3601 catgtcggcc ttcgtcaatc ctaaatgacc attatgaaac cagtagtaga tggttgaaat + 3661 accaactttc acttgcttct tgttaaccat catttcaggc gaaaattttt gcttatgata + 3721 gtgtaagatc ttctctctga tttcctttgt taaaattaac tttttcaccg accgttttcg + 3781 attgaattgg taaacagttt gtgcgtaatc ggcagaatag acctttttgt atagcccttt + 3841 tctcacttgt tgtaaagttg tacctctttt gacttcatta tgaatcgttt gaggcgcctt + 3901 tcctaacaag cctgcaattt cacgattgga cttattttca ttcttccacc gctcaatcaa + 3961 gcgacggtta tctattgtca aatgtttccc ttttggggta taatgttctt gcatctctgt + 4021 gcctttcctt gtgtttgtgg tgaacaacaa gtatagcaca gaggtgtttt cttatacctt + 4081 aaatcacatt tcatttgaca acaggaaccc ttgaacctgt tttttcagct aaaccaaggc + 4141 tatgattagc cttggccacc tagcctaaca gtttcaaacc tgttatcaaa tgaaatcatc + 4201 aacttactca aacatagtga aacatctaat tcttgactaa ggtaaggtgg ctaacttcat + 4261 tatagaactt tcaatcacat tcgaatcaca taaagatgca gatagtaaaa aaagatgtag + 4321 acattaccgt 
aaaaaagtga tataattgta cgatgttcaa ggtataggtg ttaatcatga + 4381 gtagacgttt taaaaaatca cgttcacaga aagtgaagcg aagtgttaat atcgttttgc + 4441 tgactattta tttattgtta gtttgttttt tattgttctt aatctttaag tacaatatcc + 4501 ttgcttttag atatcttaat ctagtggtaa ctgcgttagt cctactagtt gccttggtag + 4561 ggctactctt gattatctat aaaaaagctg aaaagtttac tatttttctg ttggtgttct + 4621 ctatccttgt cagctctgtg tcgctctttg cagtacagca gtttgttgga ctgaccaatc + 4681 gtttaaatgc gacttctaat tactcagaat attcaatcag tgtcgctgtt ttagcagata + 4741 gtgagatcga aaatgttacg caactgatga gtgtgacagc accgactggg actgataatg + 4801 aaaatattca aaaactacta gctgatatca agtcaagtca gaataccgat ttgacggtta + 4861 accagagttc gtcttacttg gcagcttaca agagtttgat tgcaggggag actaaggcca + 4921 ttgtcctaaa tagtgtcttt gaaaacatca tcgagtcaga gtatccagac tacgcatcga + 4981 agataaaaaa gatttatacc aagggattca ctaaaaaagt agaagctcct aagacgtcta + 5041 agaatcagtc tttcaatatc tatgttagtg gaattgacac ctatggtcct attagttcgg + 5101 tgtcgcgatc agatgtcaat atcctgatga ctgtcaatcg agataccaag aaaatcctct + 5161 tgaccacaac gccacgtgat gcctatgtac caatcgcaga tggtggaaat aatcaaaaag + 5221 ataaattaac ccatgcgggc atttatggag ttgattcgtc cattcacacc ttagaaaatc + 5281 tctatggagt ggatatcaat tactatgtgc gattgaactt cacttctttc ttgaaaatga + 5341 ttgacttatt gggaggggta gatgttcata atgatcaaga gttttcagct ctacatggga + 5401 agttccattt cccagtaggg aatgtccatc tagactctga gcaggctcta ggttttgtac + 5461 gtgaacgcta ctcactagcc gatggagacc gtgaccgtgg tcgcaaccaa caaaaggtga + 5521 ttgtggctat ccttcaaaaa ttaacgtcaa ccgaagcact gaaaaattat ggtacgatca + 5581 ttaatagctt gcaagattct atccaaacaa atatgccact tgagaccatg ataaatttgg + 5641 tcaatgctca gttagaaagt ggagggaatt ataaagtaaa ttctcaagat ttaaaaggta + 5701 caggtcgaat gggtcttcct tcttatgcaa tgccagacag taacctctat gtgatggaaa + 5761 tagatgatag tagtttagct gtagttaaag cagctataca ggatgtgatg gagggtagat + 5821 gaaatgatag acatccattc gcatatcgtt tttgatgtag atgatggtcc caagtcaaga + 5881 gaggaaagca aggctctctt ggcagaatcc tacaggcagg gggtgagaac cattgtctct + 5941 acctctcacc gtcgcaaggg catgtttgaa 
actccggaag agaagatagc agaaaacttt + 6001 cttcaggttc gggaaatagc taaggaagtg gcgagtgact tggtcattgc ttacggggct + 6061 gaaatttact acacaccaga tgttctggat aagctagaaa aaaagcggat tccgaccctc + 6121 aatgatagtc gttatgcctt gatagagttt agtatgaaca ctccttatcg cgatattcat + 6181 agcgccttga gcaagatctt gatgttggga attactccag tcattgccca cattgagcgc + 6241 tatgatgctc ttgaaaataa tgaaaaacgc gttcgggagc tgattgatat gggctgttac + 6301 acgcaagtaa atagttcaca tgtcctcaaa cccaaacttt ttggcgaacg ttataaattc + 6361 atgaaaaaaa gagctcagta ttttttagag aaagatttgg ttcatatcat tgcaagtgat + 6421 atgcacaatc tagacggtag acctcctcat atggcagaag catatgacct tgttacccaa + 6481 aaatacggag aagcgaaggc tcaggaactt tttatagaca atcctcgaaa aattgtaatg + 6541 gatcaactaa tttaggagaa atgatgaaag aacaaaacac gatagaaatc gatgtatttc + 6601 aattatttaa aaccttgtgg aaacgcaagc taatgatttt attagtggca cttgtgacag + 6661 gtgcgggggc ttttgcatat agcgctttta ttgttaagcc agaatatacg agtaccacgc + 6721 gaatttacgt agtgaatcgc aatcaaggag acaagtcggg gctgacaaat caggatttgc + 6781 aggcaggatc ttatctggta aaagactacc gtgagattat cctttcgcag gatgtattgg + 6841 aaaaagtagc gacaaatttg aagttggata tgccagccaa aacgttaacc agaaaagttc + 6901 aagtgactgt accagttgac actcgtatcg tctcaatctc tgtcaaggat aaacagccag + 6961 aggaagccag tcgtatcgct aattctctac gagaagttgc tgcagaaaag atcgtcgctg + 7021 taacgcgagt atctgatgta acgacacttg aagaagcgcg accagctacg accccctctt + 7081 ctccaaatgt tcgacgcaat tccttgtttg gttttcttgg aggagcagtc gtaacagtaa + 7141 ttgctgttct tttgattgag ttgctcgaca tccgtgtgaa acgtcctgaa gatgtcgaag + 7201 acgtactgca aattccactt ttaggggtcg ttccagattt tgacaaaatg aaataggagg + 7261 aaattatgcc aacattagaa atctcacagg caaaattgga ttttgtaaaa aaggcagagg + 7321 aaaattataa cgctttgtgc acgaacctac agttaagtgg agatgatttg aaagtatttt + 7381 ctatcacttc tgtgaaacaa ggagaaggaa aatcaacgac ttccaccaat atcgcttggg + 7441 cttttgcgcg tgcaggttac aaaacgctgc tgattgatgc agatattcgc aattctgtta + 7501 tgttaggtgt ctttaaagca agggataaga ttacaggcct gacagaattt ttatcaggaa + 7561 ctacagacct atcacaaggg ctttgtgata ccaatatcga aaatctcttt 
gtaattcagg + 7621 ctggctctgt gtcaccgaat ccgacagctc ttcttcaaag taagaatttc agtacaatgc + 7681 ttgaaacctt gcgtaaatat tttgactaca tcattgtaga tactgctcct gtcggtgtcg + 7741 tgattgatgc ggctattatt acgcgaaaat gcgatgcttc tattttagtg acggaggcag + 7801 gtgaaataaa tcgacgggat attcaaaaag caaaagaaca gttggaacac acagggaagc + 7861 cgtttttggg agttgtgttg aataaattcg atacttcagt agacaaatac ggttcttatg + 7921 gaaattatgg agattacggg aaaaataaaa aataggtcgg gggatagaga tgaacggaaa + 7981 aatagtaaag tcttcattgg ccataatcca gagttttctt gttattttat tgacttatct + 8041 acttagtgct gtgagagaag cggagattgt ttcaacaaca gctattgcac tttatatcct + 8101 ccattatttt gtcttttata tcagtgatta tggacaggat ttctttaaaa ggagatattt + 8161 gattgaactt gtccagacat tgaaatatat cctattcttt gcactagcga ttagtatttc + 8221 taattttttc ttagaggatc aatttagtat ttccagacga ggcatgattt acttcctcac + 8281 attacatgct ctcttagtct atgtgctaaa cctatttatc aagtggtatt ggaagcgggc + 8341 ttatcccaac tttaaaggaa gtaagaagat tctcctactt acagcaactt ctcgtgtcga + 8401 aaaggtactg gatagattaa tagaatcaaa tgaggttgtt ggggagttgg tagccgtcag + 8461 tgtcttagat aaaccagatt ttcagcatga ttgtttaaag atagtagcag agggggagat + 8521 agtaaacttt gcgactcatg aggtggtcga tgaagtcttt atcgatcttc caagtgaaaa + 8581 atacaatatt ggagagcttg tctctcagtt tgaaacgatg ggaattgatg taacagttaa + 8641 tctaaatgct tttgatcgta gtttggcacg taacaagcaa attcgtgaga tggcaggatt + 8701 aaacgttgtg actttttcta caacatttta taagactagc catgtaattg ctaagcggat + 8761 tattgatatt atgggtgcat tggtagggct gatactatgt ggtttagtca gtattgtact + 8821 ggttcctttg attcgaaagg atgggggctc tgctattttt gctcagacgc gtataggaaa + 8881 aaatggtcgt cagtttactt tttataagtt tcgctctatg tgtgtagatg ccgaggcgaa + 8941 aaaaagagaa ctcatggaac aaaataccat gcagggtgga atgtttaagg tggacgatga + 9001 tcctcgtatc acgaaaaatg gtcgttttat acggaagact agcttggacg agctaccaca + 9061 gttttataat gttctaaagg gagatatgag tttggttggc acacggccac caacagtgga + 9121 cgagtatgaa cactataccc cagaacaaaa acgtcggcta agttttaaac ctggtataac + 9181 aggcttatgg caggtcagtg gacgaagtga gattaagaat tttgatgaag ttgtcaaatt + 9241 agatgtagcc 
tatatagacg attggacaat ttggaaagac attgaaattt tattgaagac + 9301 agttaaagtt gtattgatga aagatggagc gaagtgattt ttgcccctca gtcttgttag + 9361 gagagagatg aaacagtcag tttatatcat tggttcaaag gggattcctg ccaagtatgg + 9421 aggatttgaa acctttgttg agaaattaac agaatatcaa aaagatggta acatccaata + 9481 ctatgttgcc tgcatgcgcg aaaattctgc aaagtcagga tttacagcag atacatttga + 9541 gtacaacggt gctatttgtt acaacattga tgtgcctaat attggtcctg ctagagccat + 9601 cgcttacgat attgcagcgg tcaataaggc tattgaattg gctaagggaa acaaggacga + 9661 ggctcccatt ttttacattc tagcttgtcg tatcggacct tttatttctg gacttaagaa + 9721 aaaaattcgt tcggtcggag gccgtttact ggtaaatcca gatggccatg agtggcttcg + 9781 ggctaaatgg agcatgccag ttcggaagta ttggaaattt tcggaacagt tgatggtcaa + 9841 gcatgcagat ttattagtct gtgatagcaa aaatatcgaa aaatatatcc gagaggacta + 9901 taaacagtat cagcccaaga cgacctatat tgcttatggt acagatacta ccccttcaag + 9961 tctaaaatca gaagatgtca aagttcgaaa ctggtatcgt gaaaagggag taagcgaaaa + 10021 tggctattat ctagtggtgg gacgattcgt tcccgaaaac aactatgaaa ccatgattcg + 10081 tgaatttatc aagtctaagt ccaataagga ctttgtcctt attacaaatg tggagcaaaa + 10141 taaattttac gatcagttgc tgaaggaaac aggtttcgac aaggatccaa gagtcaaatt + 10201 tgtgggaaca gtctatgacc aagaattgct caaatacatc cgagagaatg cttttgctta + 10261 cttccatggc catgaagttg gtgggacaaa cccatcgctt ttagaagccc ttgcatcaac + 10321 aaaactaaat ttgttactag atgttggttt taaccgtgaa gttggtgagg atggagctat + 10381 ttattggaaa aaagatgttg gtgatttagc cagattaatt gacattgttg acagaaagga + 10441 tgagacgttt cgggaaaagc ttggcttaat ggcgaaagat agaattgaaa cagcatatag + 10501 ttggcaattc attgaaaaag agtataagga gatttgggat gaggaagcga tatgataatt + 10561 tggatggatt acgagtaatt tcttgtctgg gtataatagc gatgcatatt aaagctaatg + 10621 ctgactatca aatttatggt tggatatttg aagtgttcgt accgtcttta acgttgcttg + 10681 tctatttatt cttacttatt agtgggtttg gaatgttttg tggctattac gagcgattta + 10741 aagaaggaaa aattgatcta aataattttt ataaaaaaag gtataaaaag attatcccat + 10801 tttttgcttt tttgattttt atagatattt tagtagaacg aagtttttcg catttgattg + 10861 aaggatttac tgaagctaca 
cttgtcttcg gccttctgcc gaataatcaa ccggatgtta + 10921 ttggtgttag ctggacgatt ggggttattt tccttttcta tatgcttttt cctttttttg + 10981 tatggctatg ctgggataaa aagagggcgt ttattagttt tataatttca gttatattga + 11041 atatattttg tgagatatat tacttcactg ataagtttgt tatagattcg tttgcgtcgc + 11101 gtcatagttt tttatactgc tccccgttct ttcttggagg tggcctcatt tatatgtaca + 11161 gaaaggaaat aaaagatttt gtttcgcaac gtaaattgtt ctgcttactt ggttgtttag + 11221 gtattacagg tttccattat ctattcattc aaccttggtt taaaatggat aatttaggat + 11281 ctttattgtt acttctttac cttccatggc tttgctatgc tataagcgtt gatagtatag + 11341 ttcttagtaa caaagtaatg aaatatttta gtaaaattag cttagaactt tatttagcgc + 11401 atatggtact ttttcgagtt gttgagaaaa tgaatttctt atattttttt ggtaaaggct + 11461 ggcttagctt catattagtt tttgtagctg ttcttattgg attgatttta ttgattgaat + 11521 ttttgaaaaa gatgacaagt ttttctagga gattgctaat aaaggagtaa tttaagtggt + 11581 gtgatgtcat caagatttaa gttaaagaga atataggttg atagaaaaaa tatttccttt + 11641 ttctaaagtg tggattacaa atgctacttt ttgtaaacta attaataaat ttctatagca + 11701 ctaatatata ttacctctaa gaaaatgatg gaaagtgtgg aaaattaaac ttggatatga + 11761 acaaaattac aataagagaa ttgataatac tatttgtgtt aattcttttt atatttcaaa + 11821 atcttttaga aaagtatttt gtatatgctc agtatattga tgaaatagtt gcattattat + 11881 ttctcattca ttacttttta agagtagtgt taaataagag tatttcaaaa aaattttccc + 11941 gacttgttct tcttttatta actatcatat taattacttt aatttcaaat ttttggaata + 12001 atgtgcaaac taatatttta attatctcca ttgatttatt tagtattttt aaatttattt + 12061 ttatattttt gggggcacaa tcttttctca atgacttaac gcataaagaa ataaaaagaa + 12121 taattttacg agtttacttt attagtaata tatacttatc tgttttgatt gtcttagcat + 12181 ttttaaatat ttttataggc ttaggaatgc atcaagaata tcgctatggt ttaccaactt + 12241 tttcttttat ttttggtacg ccaggtcaag taattaatct ctcgattata ttcttacttc + 12301 tatatcagtt aaataaactt tataattcta aaaataatct cattcattta gtattaattt + 12361 ttttattact gctgtctaca ttaaaaacac gggcaattgt cttagcaatt gtgtttgtct + 12421 atattctcta tctatttgaa atacgaaata tttcatcaat gaaaaagaga gtacttcctg + 12481 ttctaggctt gggagcagtg 
gttgggtttg aacaatttaa aacttatttt ttgacttctg + 12541 atactccaag gctcacatta tttaaatacg gtatgcttac aatgagacgc tattttcctc + 12601 tgggaagtgg ttttgctaca tatggatccg atattgctgc taaaaactat tctctgttat + 12661 attatcaata tggatttcat aacagatatg gaatgaatcc atatgatatt agatttttaa + 12721 atgataattt ttatccaatg atttttgcac aatttggatt tttaggagga atactttatg + 12781 tatttctact attagattat tttagattat tattacgtgt tgcaagtata aatgataagg + 12841 ttattaaaac ttcagtattt atttatatct ttaatgttgt cttatcgtct attcaatcat + 12901 cttatccggg aacgaattca atggtaataa caacgtttct aatctgttta atattgagat + 12961 atagtgacaa gtggaggatt ttatgattat agaagctata ggtttacctg gaagcggaaa + 13021 aacgttttta ttccatgagc ttgaaaaaga atttcggagt aattcaatca gaacttataa + 13081 ttttactgaa ttatcacgga ataatatttc agtcaaaatt gttgtaaaat tattgctaaa + 13141 gtttgtatcg ttgaaatata tttgtaaaaa atggaaaaaa gaattatacg atattctttc + 13201 tgaagagctt ccgtatgaga gtaaatttga tttatatgaa aatccagatt attgtgtgaa + 13261 ttatgcgctt atgcttctct ttatctatag attatttcaa aatagtaaaa ttgtattatt + 13321 actagatgag ggaatgtatc ataatattgt gaaattatgt gctgactttg atttttcaat + 13381 cagactatca aataagttaa ttgaaaaatg tgtattgtta agtagattaa atgatagtaa + 13441 gcatatagtt atttacaata tttttccaat ttctgagaca ctattgtcta ttgaaaaacg + 13501 taatcgacat gtgtctaaat ttgatgaact agaaactacc cagttgagca agatattaga + 13561 taactacgat aaactaaata atgcaatcta taataatgac aaaaaacaga taatatcagt + 13621 ttttagaaag gattttattg aaaagaatat ttcttatata aaacaaaatt taaatattta + 13681 atgctctgct agttattatt ttggcaggta atataagcgt ttattctcta ataattgata + 13741 agtacgatga ggtataatat ggtaattttt gtggtgttgc attacatggt ttttaaagaa + 13801 actaaacaat gcgtcaattc aattaagaat aatgttaaag gagaaaagaa aattataatt + 13861 gttgataatt gttctcctaa tggctcatat agtagtttag tagatgcttt tggttgtgat + 13921 aaagatatta ttattatgaa gtcagatagt aatttaggct ttgctagggg aaataatctt + 13981 ggttataaat atgcagttga aaattttaat ccagatttta ttgttgtaat gaacaatgat + 14041 atggaaatat ttcaagaaga ttttattgat aaactgtatg aaagttacgc aaagtatggc + 14101 tactatatat taggtccaga 
tatatattca actaaacagg aatatcatca aaatcctcag + 14161 acaagaaagg ttctggatag gtctgatttg aagttattat atcgaaagct agttattaaa + 14221 gataggctaa ggttcttagt tcctgtaaaa tggtggttta aaaatatatt aattaaaaat + 14281 aaaagtgtag ataataattc aaaagataaa aatgaatatg ttcaaaatat agtaaaaaat + 14341 ccgttattac atggctcgtg ttatgttttt tctaagaagt ttactgaaaa acatcaacac + 14401 acatgttttt atgataaaac gtttatgtat atggaggcag aaattttaca ttatatggca + 14461 ttgaagaaca atgaattaat gctttattac ccagatttaa aagtttacca tcatgaagat + 14521 gtggcaacag attcaacgtt tgtaaagcaa tataagaaat cgttcttctc aatcaggtgt + 14581 ctactgcagt caacaaaagc gtttattgat ttaattgatt cagataaaaa agagtaacaa + 14641 atggaaagtc aaaaaaagag cgttgaaaag aattatattt ataatttgat ttatcaaatg + 14701 ctaactgtag ttattccaat tatcataaca ccctatattt cacgtgttct aaacgctgat + 14761 gggataggga tttttagcta cacaacagca gtggtaggtt attttgtttt attgggtaat + 14821 ttaggaattg caacttacgg acaactacaa gttgctaaat accaagaaga cagatttaaa + 14881 ttatccaaaa tattttttga gttattgatt ttacgaacta tattgctttt actagtttta + 14941 ctgatatatc ttgtatttat ccaatttcaa gatataattt ataaatctat ttattacgtt + 15001 ttaataattc aaatactttg tagtttgctg gatatttcat ggtttttgca gggtcttgaa + 15061 gaatttaaaa gtattgtgat gcgtaatacc ctaataaagg tgttaagtgt aatatctatc + 15121 ttgatttttg taaaaaaaga tacagatttg attttatatg ctttgattat gaacgcatca + 15181 acactgcttg gaaatatttc tatttttgca tatgtaccta aatatgttca aagagttaag + 15241 ttggctgaga ttaatttatt aaagcatatt tcacactgtt tagtttactt tataccaaca + 15301 atagcaacta caatatattt aactttggat aagacaatga taggttggtt ttccttaaat + 15361 acttttgaaa atggttatta tgagcaggct caaaaaattg agcagatggt tgtgacaata + 15421 gttacatctt taagtgtagt aacgatgcct agaatgactt atttattgaa taacaatcaa + 15481 tttcaagaat ttaaagtgcg acttgaacaa tcgataaggt ttatcctttt tttatcctta + 15541 cctatgagtt taggattagt agggatagca aataatttta tacctttgtt tttaggtgta + 15601 ggatttgaaa agtctatatc aatattaaag atttttagtc tactagttat cattataggt + 15661 ttaaataatg cattagggaa gcaaatactt atgccttcag ggcagcaaag ggcttataat + 15721 attagtgtgg taataggtgc 
tgttatcaat atagtcttca atttaatatt gataccgcaa + 15781 tttttttcac tgggtgctgc gatttcttcc gttcttgcag agtttgcaat tttaataata + 15841 tttctctatt attctagaaa ttgtattcct cctaaatggg ttattagaac agcagtgaaa + 15901 taccttggat ctagtatagt aatgtttctt attattagga caatagagct actatctcct + 15961 ccttcgtgga cagttgttat aatacaagtc attgttggag tcgcagtata tattctatcg + 16021 ttatatatat taaaagatca aattgtaaga aaatactatc taagattgag aaaactaaat + 16081 gttcttgcaa ggaaagtatg agagtcttat aataattatt cagaatatgg agagatttca + 16141 gtgagtattt tttcaacatt gattaaaaaa aagggcgcag agatttttaa agacttaatt + 16201 cagtcaagag tgctttttag aacgatagct attttacctc tggttggttt ttcaaaaaaa + 16261 tcattagaga tagtccgtct aaataatagt aatgtagttc tttcaaaatt gagaaggaag + 16321 tataagcaga ctattaaaaa cttggataga gagaaacagt attcacttag ctataatcag + 16381 cgacataaag atgcatcaaa taagatatgg atttgctggt ttcaaggctt agatactgcc + 16441 cctcatgtgg ttcaggagtg tatcgcttcg gtaaaaaaac acctagcaga cagagaagtg + 16501 gttgttttaa cagatgaaaa ttaccatcag tatgtgactt ttccagacta tatcaaagaa + 16561 aaagcaaccc agggttttat ttcaaaagcg cactttgcag atttattgcg cttggaatta + 16621 ctgaccgagt atggtggtac gtggattgat gggacgatat tttgttcgag ttcagatatt + 16681 cctgcctata tgttagattc tgatttattt ctatttcaaa atttaaaacc aggtcttgat + 16741 ggacaggcat tggcaatttc taattggttc attactgcta gctactctaa ccatcctctt + 16801 ttaaatatga cgaaagattt gctttatgat tattggaaga atcataatgg agtggttgat + 16861 tattttattt ttcatcactt ctttcagtta tcaatcgaag aatttcctga atactggagt + 16921 aaggtagttc ctttcaataa ttcaactcct catattttgc agttacgctt atttgaagag + 16981 tttgacgaag tgatgtatgg ttatattctc gaacagacac cattccataa gctaacatat + 17041 aaatttgaag aagaaaagtc gagaataccg aatacttact ataaacactt attttgataa + 17101 aaatgatagt agttgattga gagactgttg ttaggtatag aatgctattg agattttatc + 17161 gggagggatg atatgaaaga actaactact cgagagatgc aagaagtatc gttggagatt + 17221 ttacacacga ttgctagtat ttgtgaaaaa caccattttc gctatgcttt gatttacggg + 17281 actttaattg gtgcggttag gcataaaggg tatattcctt gggatgatga tgttgacatt + 17341 atgatgcctc gaccagatta 
tgaccgccta ttggagtatt tgaaggaaaa tatcgccgat + 17401 tatccacatt taaaagtatt caatcgagaa gagtgtccag aatatcctta tatgattact + 17461 cgaattagtg atcagagata ccggattgag atggaaaatg agaaaccttt tgatttgggg + 17521 gttttcattg atatctatcc ctatgatggt ttgggagata cgaaagaaga ggcggttgac + 17581 tttggtatga agggggatcg tttatcgtcg ttttgttatc aggcaactag agaacatttt + 17641 gcgattgaaa cgacaacatc aacttttagg aagttgatta agtatccagt ttatttattc + 17701 tctaaaatga ttgggaaaga ttacttccaa aagcaactag ccaagttagc cagagttaaa + 17761 gactacgata acagtgaata tgtaggttgc gttatttggt tgtcatgggg agaaaaagat + 17821 atttttccgc gtgaatggtt tgatgagact attttggttc cttttgagaa atatgaattt + 17881 aggattccta aagaatttga taaagttcta cggcatgaat atggagatta catgattttg + 17941 cctccagaga aggatagagt agggcatcac tattttaaag cttataaaaa atgataattt + 18001 gctaagcaaa gaaaaggaaa atcatgaaat tattttattt tatttacaat tggagtagaa + 18061 agtttaaggg tggagttttt ctgctcagag ttctatatgg ttttgagtgc ccacgtaaag + 18121 ctaaaattgg gaaaaacgtc aatttttcac atcgtgggat gggaacagtt gtaagtagta + 18181 atgctatcat tggggataat gtgactatac aacatcatgt aacattagga attaaaaacg + 18241 ataatgatag aattatcatc ggggagaact gttttatagg agcctatgca tttatcttag + 18301 gaaatgtaaa aattggtgca aattctaaga ttggagcagg tacgatggtt ttacatgatg + 18361 tcccagatgg aagcacagta gttaatcctg tggaactaaa agcacttgct tcaaaaaaag + 18421 acgttcagta agagagaaat gaatagaata ttgaaaacaa tgttatagga aagtcatggt + 18481 aacactttat aatactgaaa attttattca ctttttaaca cattagagtt aatgtttact + 18541 ccacaaattt aatttaatca ctcaataaag agattaagag acaagcaaaa aaaagattgt + 18601 ctttccgaat ggagaagcct tagattattg tctggttccg atgaatacaa agtaaaatat + 18661 aaaaattgca ataacaaaga attcgaattt tgttcaggtg ctttataaag cctatttgag + 18721 taattaaata gcaacttgac actgtgatta cataaaatta ttgataagcc taatttttat + 18781 ttaatcgtat ggattattta taaaaaatgt ataaaattga atataaatgt gaggtgtgat + 18841 tttggtttat aaacatggga aaataaaagt gcaaataaca aagaaaggta ccctactatg + 18901 aaaggtatta ttttagcagg tggttcgggg acacgtttat atcctttgac tcgcgctgca + 18961 tcaaaacaac ttatgccggt 
ttatgataag ccgatgattt actacccact ttcaacattg + 19021 atgttggctg ggattaggga tattttgatt atttccactc cacaggattt acatcgattc + 19081 caagagcttc ttcaagacgg atctgagttt gggatcaaac tttcttatgc agagcaacca + 19141 agtccagatg gtttggcaca agcctttatc attggggaag agtttatttc tgatgatagc + 19201 gttgcgctaa tcttaggtga taatatctac catggttctg ggctttccaa gatgctacaa + 19261 aaggcagcga gtaaggagtc gggagcaact gtttttggct accatgtcaa ggatccagag + 19321 cgctttggtg tggttgagtt tgatcaggat atgaaggcta tttctattga agaaaagcca + 19381 gagtaccctc gttcaaacta tgcagttaca ggtctctatt tctatgataa tgatgtagta + 19441 gagattgcca agagtattaa cccaagtcct cgtggtgaac tggaaattac agatgtaaac + 19501 aaggcttacc tagatcgtgg tggtttgtct gttgagctta tgggacgtgg ctttgcttgg + 19561 ctggatactg gaactcatga aagtttacta gaggcctcac agtacatcga aacagtgcaa + 19621 cggatgcaaa atgttcaggt agcaaactta gaagaaattg cttaccgtat gggctatatc + 19681 agtaaagagc aagtgcatga attggcgcag ccgttgaaga aaaatgaata cgggcagtac + 19741 ctgctccgtt tgattggaga agtatagatg acagataatt ttttcggtaa gacgcttgcg + 19801 gcacgcaagg ttgaagctat tccaggcatg ttagagtttg atatccccgt tcatggagat + 19861 aatcgtggct ggtttaaaga aaatttccaa aaggaaaaaa tgcttccact tggatttcca + 19921 gagtctttct ttgcagaagg aaaattgcaa aacaatgtat ccttctcacg taaaaatgtc + 19981 cttcgaggcc tccacgcaga gccttgggat aagtacatct ctgtagcaga tggagggaaa + 20041 gttctgggtt cttgggttga tctacgcgag ggtgaaacct ttgggaagac ctatcagaca + 20101 gtaattgatg caagcaaggg aatctttgtt cctcgaggcg tagctaatgg cttccaagtt + 20161 ttatcagata cagcttcata tagctatctg gtcaatgatt actgggctct tgaactcaaa + 20221 cccaagtatg cctttgtgaa ctacgctgat ccaagccttg gtattgaatg ggaaaatctg + 20281 gaagaagcag acgtatctga agcagacaaa catcatcccc tacttaagga cgtgaagcct + 20341 ttgaaaaaag aagatttgga ataaggaaag aatatgactg aatacaaaaa tattatcgtg + 20401 acaggtggag ctggctttat cggttctaac tttgtccatt atgtttacga gaactttcca + 20461 gatgttcatg tgacagtcct agataagttg acttatgctg gaaaccgcgc gaatattgag + 20521 gaaattttag gcaatcgtgt tgagttagtt gttggtgaca ttgctgatgc ggagttggta + 20581 gacaagttgg ctgctcaagc 
agatgctatc gttcattatg cagcggaaag ccacaatgat + 20641 aattcgctca atgatccatc gccatttatt catactaact tcattggaac ctatactctt + 20701 ttagaagctg ctcgtaagta cgatattcgc ttccaccatg tatcgacaga tgaagtttat + 20761 ggggatctcc ctttacgaga agatttgcca ggtcatggtg aaggcccagg tgagaaattt + 20821 actgctgaaa caaaatacaa ccctagctct ccgtactcat caaccaaggc agcctcagat + 20881 ttgattgtca aagcttgggt gcgttctttt ggagtcaagg caacgatttc caactgttca + 20941 aataactacg gtccttatca acatatcgaa aaattcatcc cacgtcagat tactaacatc + 21001 ctaagtggaa ttaagccaaa actttacggt gaaggtaaga acgttcgtga ctggattcat + 21061 accaatgacc attcttcagg agtttggaca atcttgacaa aagggcaaat cggtgaaacc + 21121 tacttgattg gggctgatgg tgagaagaac aataaggaag ttttggaact tatccttaag + 21181 gaaatgggac aagctgcgga tgcctatgat catgtgactg accgtgcagg acatgacctt + 21241 cgctatgcga ttgatgccag caagctccgt gatgagttgg ggtggaaacc tgaatttact + 21301 aactttgaag ctgggctcaa ggcaacaatc aagtggtata cagataacca agaatggtgg + 21361 aaagcagaaa aagaagctgt tgaagccaat tatgctaaga ctcaggagat tattacagta + 21421 taaaaagcag gaaatagctg ctttttattg ctatattggg aagagttaca tattagaaag + 21481 gtctagagat gattttaatt acaggggcaa atggccaatt aggaacggaa cttcgctatt + 21541 tattggatga acgtaatgaa gaatacgtgg cagtagatgt ggctgagatg gacattacca + 21601 atgaagaaat ggttgagaaa gtttttgaag aggtgaaacc gactttagtc taccattgtg + 21661 cagcctacac cgctgttgat gcagcagagg atgaaggaaa agagttggac ttcgccatca + 21721 atgtgacggg gacaaaaaat gtcgcaaaag catctgaaaa gcatggtgca actctagttt + 21781 atatttctac ggactatgtc tttgacggta agaaaccagt tggacaagag tgggaagttg + 21841 atgaccgacc agatccacag acagaatatg gacgcactaa gcgtatgggg gaagagttag + 21901 ttgagaagca tgtgtctaat ttctatatta tccgtactgc ctgggtattt ggaaattatg + 21961 gcaaaaactt cgtttttacc atgcaaaatc ttgcgaaaac tcataagact ttaacagttg + 22021 taaatgacca gtacggtcgt ccgacttgga ctcgtacctt ggctgagttc atgacctacc + 22081 tagctgaaaa tcgtaaggaa tttggttatt atcatttgtc aaatgatgcg acagaagaca + 22141 caacatggta tgattttgca gttgaaattt tgaaagatac agatgtcgaa gtcaagccag + 22201 tagattccag tcaatttcca 
gccaaagcta aacgtccgct aaactcaacg atgagcctgg + 22261 ccaaagccaa agctactgga tttgttattc caacttggca agatgcattg caagaatttt + 22321 acaaacaaga agtgagataa gtagtagaat gattttctag tctaataaaa gaggtagata + 22381 atgaactcca aaggagctta agatatacga ttatcttgtt gttggtgctg gtctctttgg + 22441 tgcatagcta tggctcagtt tctattatcg ctcacaccat ccatcagaag tttaatctga + 22501 aggtacccaa ttatcgccaa gaagaagatt gggctaagat gggtttacca atcacacgca + 22561 aggaaatctc taattggcat atcaagacga gtcaatacta tttggagccc ctctataacc + 22621 tcttgcgaga gagactattg actcagccct tacttcatgc ggatgaaact tcttataggg + 22681 tgctagagag tgatagtcag ctgacttact attggacttt tttgtcaggt aaatcagaga + 22741 aacaagggat tacgctttac caccatgatc agtgtcgaag tggttcagta gtacaagaat + 22801 tcctaggaga ttattctggc tatgtgcatt gtgatatgtt gcggcagtaa cttaggactt + 22861 tagtcctcta gttctgccta tgcgatagca gtccaaggtt taggagcaag gcgacgctaa + 22921 gcttggtaaa ctgcgaaccg ctagaagctt atcgtcaact ggaagaagct gaacttgttg + 22981 gatgttgggt acatgtgaga aggaagtttt ttgaagcgac ccccaagcaa gcggataaat + 23041 catccttagg agctaaaggt ttagcttatt gtaatcagtt attttccttg gaaagagact + 23101 gggaggcttt gccagctgat gaacgactac agaaacgtca agaagagctc caacccctac + 23161 tggaagactt ctttgcttgg tgccggcgtc agtcagtttt atcgggttca aaactaggaa + 23221 gggcaattga atacagcctc aagtataaag aaacctttaa gaccattttg aaagacggac + 23281 atctggtcct ttccaataat ctagctgaat gcgccattaa atcattggtt atgggacgga + 23341 gtaaaagagt ccagtggact cttttagcct aagctcagtt taaaaaagcg agggtggtta + 23401 ttttctcaaa gttttgaagg agctaaagca agagctatta ttatgagttt gttggaaaca + 23461 gctaaacgtc atcaattaaa tagcgagaaa tatctattct atcttctaga atgtcttcca + 23521 aacgaggaaa ctctcgtaaa caaagaggtt ttagaggttt atttatcatg gactaaagtt + 23581 gtacaagaaa agtgcaaata agaaatctcc agattaggaa ctatccgtga gttctctagt + 23641 ctggagattt ttcaatatac ttcggctctt tgtcaactgt agtgggttga agaaaagcta + 23701 agcttgagaa aggacaaatt tcgtcctttc ttttttgata ttcagggcga taaaaatccg + 23761 ttttttgaag ttttcaaagt tccgaaaacc aaaggcattg cgcttgataa gtttgatgag + 23821 attattggtc gcttccagtt 
tggcattaga atagtgtagt tgaagggcgt tgacgatttt + 23881 ctctttgttc tttagaaagg ttttaaagac agtctgaaaa agaggatgaa cctgcttcag + 23941 attgtcctca atgagtccga aaaatttctc agggtctttg ttctgaaagt gaaaaagtaa + 24001 gagttgatag atctgatagt ggtgtttcaa gtcttctgaa tagcttaaaa tcttgtcaag + 24061 aatttcttta tttgttaagt gcatgcgaaa agtagggcga taaaaacgtt tatcgctcaa + 24121 tttacgacta tcctgttgga tgagtttcca gtaacgcttg atagccttgt attcatgaga + 24181 ttttcgttca aactgattca taatttgaac acgaaaacga ctcatggcac ggctgagatg + 24241 ttggataata tggaaacgat ctagaacgat tttagcacac ggaaaaagct gtttagccaa + 24301 gtcatagtaa ggactaaaca tatccatcgt aatgattttc acttgacaac gaacggctct + 24361 atcgtagcga agaaagtgat ttcggatgac agcttgtgtt ctgccttcaa gaacagtgat + 24421 aatattaaga ttatcaaaat cttgcgcaat gaaactcatc tttcccttag tgaaggcata + 24481 ctcatcccaa gacataatct ttggaagccg agaaaaatca tgctcaaagt gaaagtcatt + 24541 gagcttgcga atgacagttg aagttgaaat ggccagctga tgggcaatat cagtcataga + 24601 aattttttca attaactttt gagcaatttt ttggttgatg atacgaggga tttggtgatt + 24661 tttctttacc aggggagtct cagcaaccat catttttgaa cagtgatagc acttgaaacg + 24721 gcgttttcta aggagaattc tagaaggcat accagttgtt tcgaggtaag ggatcttaga + 24781 cggtttttga aagtcatatt tcttcattag acttccacaa tcagggcaag atggagcctc + 24841 ataatccagc ttagcgataa tttctttgtg ggtatccata ttgatgatat ctagaatctt + 24901 gatgtttggg tctttaatat cgagcagttt tgtgataaga tgtaattgtt ccatatgatt + 24961 ctttctaatg agttgttttg tcgcttttca ttataggtca tatgggactt tttttctaca + 25021 caaaaataag ctccataata tccatagggg atttacccac tacaaatatt atagagccta + 25081 tacttcgtta ttgggcggtt acgatattca tattttttgc aaagatattg tttgaaaaat + 25141 aattttcaaa aattctgaaa attctgttga caactttctg aaaagagtct ataatggaga + 25201 gaaagtttta aaggagaaaa tgatgaaaag ttcaaaacta tttgcccttg cgggcgtgac + 25261 attattggcg gcgactactt tagctgcatg ctctggatca ggttcaagca ctaaaggtga + 25321 gaagacattc tcatacattt atgagacaga ccctgataac ctcaactatt tg +// + diff --git a/public/res/serotype_genbank/serotype_32F.gb b/public/res/serotype_genbank/serotype_32F.gb new 
file mode 100644 index 0000000..d1e989f --- /dev/null +++ b/public/res/serotype_genbank/serotype_32F.gb @@ -0,0 +1,1136 @@ +LOCUS CR931697 25363 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain nr. 34375 (serotype 32f). +ACCESSION CR931697 +VERSION CR931697.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 25363) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 25363) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..25363 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="nr. 
34375" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC32F_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC32F_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI34138.1" + /db_xref="UniProtKB/TrEMBL:Q4JZI8" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVELL" + gene 293..461 + /gene="aliB" + /locus_tag="SPC32F_0002" + /pseudo + CDS 293..461 + /gene="aliB" + /locus_tag="SPC32F_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(462..1266) + /gene="tnp" + /locus_tag="SPC32F_0003" + /pseudo + CDS complement(join(462..896,895..1266)) + /gene="tnp" + /locus_tag="SPC32F_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(join(894..896,895..1248)) + /gene="tnp" + /locus_tag="SPC32F_0003" + /note="HMMPfam hit to PF01710, Transposase, score 3.9e-19" + /pseudo + gene complement(1663..3056) + /gene="tnp" + /locus_tag="SPC32F_0004" + /pseudo + CDS complement(join(1663..1797,1797..3056)) + /gene="tnp" + /locus_tag="SPC32F_0004" + /note="member of homology group 17" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1202 transposase" + misc_feature complement(2070..2573) + /gene="tnp" + /locus_tag="SPC32F_0004" + /note="HMMPfam hit to PF00665, Integrase core domain, + score 3.6e-20" + /pseudo + gene complement(3162..4115) + /gene="tnp" + /locus_tag="SPC32F_0005" + CDS complement(3162..4115) + /gene="tnp" + /locus_tag="SPC32F_0005" + /note="member of homology group 39" + /codon_start=1 + /transl_table=11 + /product="putative IS1239 transposase" + /protein_id="CAI34142.1" + /db_xref="GOA:Q4K0X9" + /db_xref="InterPro:IPR001584" + /db_xref="InterPro:IPR012337" + /db_xref="UniProtKB/TrEMBL:Q4K0X9" + /translation="MQEHYTPKGKHLTIDNRRLIERWKNENKSNREIAGLLGKAPQTI + HNEVKRGTTLQQVRKGLYKKVYSADYAQTVYQFNRKRSVKKLILTKEIREKILHYHKQ + 
KFSPEMMVNKKQVKVGISTIYYWFHNGHLGLTKADMLYPRKRKGVKKQASPNFKPAGK + SIEERPDVINLRLENGHYEIDTVLLTKIKNYCLLVLTDRRSRHQIIRLIPNKTAESVN + QALTLLLGEHRILSITADNGSEFKRLSEVFPEEHIYYAHAYSSWERGSNENHNRLIRR + WLPKGTKKTTPKEVAFIENWINNYPKKCLDYKSPSEFLLGG" + misc_feature complement(3171..3608) + /gene="tnp" + /locus_tag="SPC32F_0005" + /note="HMMPfam hit to PF00665, Integrase core domain, + score 6.6e-23" + misc_feature complement(3969..4034) + /gene="tnp" + /locus_tag="SPC32F_0005" + /note="Predicted helix-turn-helix motif with score + 1087.000, SD 2.89 at aa 28-49, sequence + KSNREIAGLLGKAPQTIHNEVK" + gene 4469..5923 + /gene="wzg" + /locus_tag="SPC32F_0006" + CDS 4469..5923 + /gene="wzg" + /locus_tag="SPC32F_0006" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI34143.1" + /db_xref="GOA:Q4JZS6" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4JZS6" + /translation="MLIMSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNI + LAFRYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGL + TNRLNATSNYSEYSISVAVLADSEIENVTQLMSVTAPTGTDNENIQKLLADIKSSQNT + DLTVNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKV + EAPKTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPI + ADGGNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVH + NDQEFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKL + TSTEALKNYGTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRMGL + PSYAMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 4469..4594 + /gene="wzg" + /locus_tag="SPC32F_0006" + /note="Signal peptide predicted for SPC1506 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 42 and 43" + misc_feature 4682..5029 + /gene="wzg" + /locus_tag="SPC32F_0006" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 2.7e-63" + misc_feature 5207..5650 + /gene="wzg" + /locus_tag="SPC32F_0006" + /note="HMMPfam hit to PF03816, Cell 
envelope-related + transcriptional a, score 5.7e-70" + gene 5925..6656 + /gene="wzh" + /locus_tag="SPC32F_0007" + CDS 5925..6656 + /gene="wzh" + /locus_tag="SPC32F_0007" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34144.1" + /db_xref="GOA:Q4JZS5" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4JZS5" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEKDLVHIIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 5928..6536 + /gene="wzh" + /locus_tag="SPC32F_0007" + /note="HMMPfam hit to PF02811, PHP domain, score 1.5e-36" + gene 6662..7357 + /gene="wzd" + /locus_tag="SPC32F_0008" + CDS 6662..7357 + /gene="wzd" + /locus_tag="SPC32F_0008" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34145.1" + /db_xref="GOA:Q4JZS4" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4JZS4" + /translation="MMKEQNTIEIDVFQLFKTLWKRKLMILLVALVTGAGAFAYSAFI + VKPEYTSTTRIYVVNRNQGDKSGLTNQDLQAGSYLVKDYREIILSQDVLEKVATNLKL + DMPAKTLTRKVQVTVPVDTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIELLDIRVKRPEDVEDVLQI + PLLGVVPDFDKMK" + misc_feature 6662..6778 + /gene="wzd" + /locus_tag="SPC32F_0008" + /note="Signal peptide predicted for SPC1508 by SignalP 2.0 + HMM (Signal peptide probability 0.729) with cleavage site + probability 0.460 between residues 39 and 40" + misc_feature 6683..7099 + /gene="wzd" + /locus_tag="SPC32F_0008" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 1.5e-56" + misc_feature 7205..7282 + /gene="wzd" + /locus_tag="SPC32F_0008" + 
/note="PS00217 Sugar transport proteins signature 2." + gene 7367..8056 + /gene="wze" + /locus_tag="SPC32F_0009" + CDS 7367..8056 + /gene="wze" + /locus_tag="SPC32F_0009" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34146.1" + /db_xref="GOA:Q4JZS3" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4JZS3" + /translation="MPTLEISQAKLDFVKKAEENYNALCTNLQLSGDDLKVFSITSVK + QGEGKSTTSTNIAWAFARAGYKTLLIDADIRNSVMLGVFKARDKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRKCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGVVLNKFDTSVDKYGSY + GNYGDYGKNKK" + gene 8071..9438 + /gene="wchA" + /locus_tag="SPC32F_0010" + CDS 8071..9438 + /gene="wchA" + /locus_tag="SPC32F_0010" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI34147.1" + /db_xref="GOA:Q4JZS2" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4JZS2" + /translation="MNGKIVKSSLAIIQSFLVILLTYLLSAVREAEIVSTTAIALYIL + HYFVFYISDYGQDFFKRRYLIELVQTLKYILFFALAISISNFFLEDQFSISRRGMIYF + LTLHALLVYVLNLFIKWYWKRAYPNFKGSKKILLLTATSRVEKVLDRLIESNEVVGEL + VAVSVLDKPDFQHDCLKIVAEGEIVNFATHEVVDEVFIDLPSEKYNIGELVSQFETMG + IDVTVNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHVIAKRIIDIMGALVGLIL + CGLVSIVLVPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKNGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVLM + KDGAK" + misc_feature 8071..8163 + /gene="wchA" + /locus_tag="SPC32F_0010" + /note="Signal peptide predicted for SPC1510 by SignalP 2.0 + HMM (Signal peptide probability 0.902) with cleavage site + probability 0.355 between residues 31 and 32" + misc_feature 8854..9435 + /gene="wchA" + /locus_tag="SPC32F_0010" + /note="HMMPfam hit to PF02397, 
Bacterial sugar + transferase, score 4.4e-156" + gene 9442..10656 + /gene="wchF" + /locus_tag="SPC32F_0011" + CDS 9442..10656 + /gene="wchF" + /locus_tag="SPC32F_0011" + /note="member of homology group 15" + /codon_start=1 + /transl_table=11 + /product="putative rhamnosyl transferase WchF" + /protein_id="CAI34148.1" + /db_xref="GOA:Q4JZS1" + /db_xref="InterPro:IPR001296" + /db_xref="InterPro:IPR015393" + /db_xref="UniProtKB/TrEMBL:Q4JZS1" + /translation="MPLSLVRREMKQSVYIIGSKGIPAKYGGFETFVEKLTEYQKDGN + IQYYVACMRENSAKSGFTADTFEYNGAICYNIDVPNIGPARAIAYDIAAVNKAIELAK + GNKDEAPIFYILACRIGPFISGLKKKIRSVGGRLLVNPDGHEWLRAKWSMPVRKYWKF + SEQLMVKHADLLVCDSKNIEKYIREDYKQYQPKTTYIAYGTDTTPSSLKSEDVKVRNW + YREKGVSENGYYLVVGRFVPENNYETMIREFIKSKSNKDFVLITNVEQNKFYDQLLKE + TGFDKDPRVKFVGTVYDQELLKYIRENAFAYFHGHEVGGTNPSLLEALASTKLNLLLD + VGFNREVGEDGAIYWKKDVGDLARLIDIVDRKDETFREKLGLMAKDRIETAYSWQFIE + KEYKEIWDEEAI" + misc_feature 10087..10584 + /gene="wchF" + /locus_tag="SPC32F_0011" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 0.00031" + gene 10640..11671 + /gene="wcyH" + /locus_tag="SPC32F_0012" + CDS 10640..11671 + /gene="wcyH" + /locus_tag="SPC32F_0012" + /note="member of homology group 178" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI34149.1" + /db_xref="GOA:Q4JZS0" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q4JZS0" + /translation="MRKRYDNLDGLRVISCLGIIAMHIKANADYQIYGWIFEVFVPSL + TLLVYLFLLISGFGMFCGYYERFKEGKIDLNNFYKKRYKKIIPFFAFLIFIDILVERS + FSHLIEGFTEATLVFGLLPNNQPDVIGVSWTIGVIFLFYMLFPFFVWLCWDKKRAFIS + FIISVILNIFCEIYYFTDKFVIDSFASRHSFLYCSPFFLGGGLIYMYRKEIKDFVSQR + KLFCLLGCLGITGFHYLFIQPWFKMDNLGSLLLLLYLPWLCYAISVDSIVLSNKVMKY + FSKISLELYLAHMVLFRVVEKMNFLYFFGKGWLSFILVFVAVLIGLILLIEFLKKMTS + FSRRLLIKE" + misc_feature 10640..10723 + /gene="wcyH" + /locus_tag="SPC32F_0012" + /note="Signal peptide predicted for SPC1512 by SignalP 2.0 + HMM (Signal peptide probability 0.608) with cleavage site + probability 0.593 between 
residues 28 and 29" + misc_feature 10652..11647 + /gene="wcyH" + /locus_tag="SPC32F_0012" + /note="HMMPfam hit to PF01757, Acyltransferase family, + score 7.2e-06" + gene 11852..13087 + /gene="wzy" + /locus_tag="SPC32F_0013" + CDS 11852..13087 + /gene="wzy" + /locus_tag="SPC32F_0013" + /note="member of homology group 179" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI34150.1" + /db_xref="UniProtKB/TrEMBL:Q4JZR9" + /translation="MDMNKITIRELIILFVLILFIFQNLLEKYFVYAQYIDEIVALLF + LIHYFLRVVLNKSISKKFSRLVLLLLTIILITLISNFWNNVQTNILIISIDLFSIFKF + IFIFLGAQSFLNDLTHKEIKRIILRVYFISNIYLSVLIVLAFLNIFIGLGMHQEYRYG + LPTFSFIFGTPGQVINLSIIFLLLYQLNKLYNSKNNLIHLVLIFLLLLSTLKTRAIVL + AIVFVYILYLFEIRNISSMKKRVLPVLGLGAVVGFEQFKTYFLTSDTPRLTLFKYGML + TMRRYFPLGSGFATYGSDIAAKNYSLLYYQYGFHNRYGMNPYDIRFLNDNFYPMIFAQ + FGFLGGILYVFLLLDYFRLLLRVASINDKVIKTSVFIYIFNVVLSSIQSSYPGTNSMV + ITTFLICLILRYSDKWRIL" + gene 13072..13782 + /gene="wcyI" + /locus_tag="SPC32F_0014" + CDS 13072..13782 + /gene="wcyI" + /locus_tag="SPC32F_0014" + /note="member of homology group 180" + /codon_start=1 + /transl_table=11 + /product="hypothetical protein" + /protein_id="CAI34151.1" + /db_xref="UniProtKB/TrEMBL:Q4JZR8" + /translation="MEDFMIIEAIGLPGSGKTFLFHELEKEFRSNSIRTYNFTELSRN + NISVKIVVKLLLKFVSLKYICKKWKKELYDILSEELPYESKFDLYENPDYCVNYALML + LFIYRLFQNSKIVLLLDEGMYHNIVKLCADFDFSIRLSNKLIEKCVLLSRLNDSKHIV + IYNIFPISETLLSIEKRNRHVSKFDELETTQLSKILDNYDKLNNAIYNNDKKQIISVF + RKDFIEKNISYIKQNLNI" + gene 13860..14738 + /gene="wchQ" + /locus_tag="SPC32F_0015" + CDS 13860..14738 + /gene="wchQ" + /locus_tag="SPC32F_0015" + /note="member of homology group 43" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34152.1" + /db_xref="GOA:Q4JZR7" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JZR7" + /translation="MVIFVVLHYMVFKETKQCVNSIKNNVKGEKKIIIVDNCSPNGSY + SSLVDAFGCDKDIIIMKSDSNLGFARGNNLGYKYAVENFNPDFIVVMNNDMEIFQEDF + 
IDKLYESYAKYGYYILGPDIYSTKQEYHQNPQTRKVLDRSDLKLLYRKLVIKDRLRFL + VPVKWWFKNILIKNKSVDNNSKDKNEYVQNIVKNPLLHGSCYVFSKKFTEKHQHTCFY + DKTFMYMEAEILHYMALKNNELMLYYPDLKVYHHEDVATDSTFVKQYKKSFFSIRCLL + QSTKAFIDLIDSDKKE" + misc_feature 13866..14360 + /gene="wchQ" + /locus_tag="SPC32F_0015" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 7.8e-15" + gene 14742..16202 + /gene="wzx" + /locus_tag="SPC32F_0016" + CDS 14742..16202 + /gene="wzx" + /locus_tag="SPC32F_0016" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI34153.1" + /db_xref="GOA:Q4JZR6" + /db_xref="InterPro:IPR002528" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4JZR6" + /translation="MESQKKSVEKNYIYNLIYQMLTVVIPIIITPYISRVLNADGIGI + FSYTTAVVGYFVLLGNLGIATYGQLQVAKYQEDRFKLSKIFFELLILRTILLLLVLLI + YLVFIQFQDIIYKSIYYVLIIQILCSLLDISWFLQGLEEFKSIVMRNTLIKVLSVISI + LIFVKKDTDLILYALIMNASTLLGNISIFAYVPKYVQRVKLAEINLLKHISHCLVYFI + PTIATTIYLTLDKTMIGWFSLNTFENGYYEQAQKIEQMVVTIVTSLSVVTMPRMTYLL + NNNQFQEFKVRLEQSIRFILFLSLPMSLGLVGIANNFIPLFLGVGFEKSISILKIFSL + LVIIIGLNNALGKQILMPSGQQRAYNISVVIGAVINIVFNLILIPQFFSLGAAISSVL + AEFAILIIFLYYSRNCIPPKWVIRTAVKYLGSSIVMFLIIRTIELLSPPSWTVVIIQV + IVGVAVYILSLYILKDQIVRKYYLRLRKLNVLARKV" + misc_feature 14763..15569 + /gene="wzx" + /locus_tag="SPC32F_0016" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 1.7e-44" + gene 16242..17198 + /gene="wcyS" + /locus_tag="SPC32F_0017" + CDS 16242..17198 + /gene="wcyS" + /locus_tag="SPC32F_0017" + /note="member of homology group 118" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34154.1" + /db_xref="GOA:Q4JZR5" + /db_xref="InterPro:IPR008441" + /db_xref="UniProtKB/TrEMBL:Q4JZR5" + /translation="MSIFSTLIKKKGAEIFKDLIQSRVLFRTIAILPLVGFSKKSLEI + VRLNNSNVVLSKLRRKYKQTIKNLDREKQYSLSYNQRHKDASNKIWICWFQGLDTAPH + VVQECIASVKKHLADREVVVLTDENYHQYVTFPDYIKEKATQGFISKAHFADLLRLEL + 
LTEYGGTWIDGTIFCSSSDIPAYMLDSDLFLFQNLKPGLDGQALAISNWFITASYSNH + PLLNMTKDLLYDYWKNHNGVVDYFIFHHFFQLSIEEFPEYWSKVVPFNNSTPHILQLR + LFEEFDEVMYGYILEQTPFHKLTYKFEEEKSRIPNTYYKHLF" + misc_feature 16377..17192 + /gene="wcyS" + /locus_tag="SPC32F_0017" + /note="HMMPfam hit to PF05704, Capsular polysaccharide + synthesis protein, score 3.3e-69" + gene 17274..18095 + /gene="wcrN" + /locus_tag="SPC32F_0018" + CDS 17274..18095 + /gene="wcrN" + /locus_tag="SPC32F_0018" + /note="member of homology group 119" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="CAI34155.1" + /db_xref="GOA:Q4JZR4" + /db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4JZR4" + /translation="MKELTTREMQEVSLEILHTIASICEKHHFRYALIYGTLIGAVRH + KGYIPWDDDVDIMMPRPDYDRLLEYLKENIADYPHLKVFNREECPEYPYMITRISDQR + YRIEMENEKPFDLGVFIDIYPYDGLGDTKEEAVDFGMKGDRLSSFCYQATREHFAIET + TTSTFRKLIKYPVYLFSKMIGKDYFQKQLAKLARVKDYDNSEYVGCVIWLSWGEKDIF + PREWFDETILVPFEKYEFRIPKEFDKVLRHEYGDYMILPPEKDRVGHHYFKAYKK" + misc_feature 17343..18026 + /gene="wcrN" + /locus_tag="SPC32F_0018" + /note="HMMPfam hit to PF04991, LICD Protein Family, score + 2.5e-45" + gene 18255..18524 + /gene="HG272" + /locus_tag="SPC32F_0019" + /pseudo + CDS 18255..18524 + /gene="HG272" + /locus_tag="SPC32F_0019" + /note="member of homology group 272" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative transferase (pseudogene)" + misc_feature 18258..18311 + /gene="HG272" + /locus_tag="SPC32F_0019" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 0.13" + /pseudo + misc_feature 18345..18398 + /gene="HG272" + /locus_tag="SPC32F_0019" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 0.26" + /pseudo + misc_feature 18399..18452 + /gene="HG272" + /locus_tag="SPC32F_0019" + /note="HMMPfam hit to PF00132, Bacterial transferase + hexapeptide (three rep, score 0.032" + /pseudo + gene 18994..19863 + /gene="rmlA" + /locus_tag="SPC32F_0020" + 
CDS 18994..19863 + /gene="rmlA" + /locus_tag="SPC32F_0020" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI34157.1" + /db_xref="GOA:Q4JZR3" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q4JZR3" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLHRFQELLQDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFISDDSV + ALILGDNIYHGSGLSKMLQKAASKESGATVFGYHVKDPERFGVVEFDQDMKAISIEEK + PEYPRSNYAVTGLYFYDNDVVEIAKSINPSPRGELEITDVNKAYLDRGGLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISKEQVHELAQPLKKN + EYGQYLLRLIGEV" + misc_feature 18997..19713 + /gene="rmlA" + /locus_tag="SPC32F_0020" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 3.3e-118" + gene 19864..20460 + /gene="rmlC" + /locus_tag="SPC32F_0021" + CDS 19864..20460 + /gene="rmlC" + /locus_tag="SPC32F_0021" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI34158.1" + /db_xref="GOA:Q4JZR2" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:Q4JZR2" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGKTYQTVIDASKGIFVPRGVANGFQVLSDTASYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENLEEADVSEADKHHPLLKDVKPLKKEDLE" + misc_feature 19900..20430 + /gene="rmlC" + /locus_tag="SPC32F_0021" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 3e-16" + gene 20470..21519 + /gene="rmlB" + /locus_tag="SPC32F_0022" + CDS 20470..21519 + /gene="rmlB" + /locus_tag="SPC32F_0022" + /EC_number="4.2.1.46" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI34159.1" + 
/db_xref="GOA:O54546" + /db_xref="HSSP:1KEP" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:O54546" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPDVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAAD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 20485..21441 + /gene="rmlB" + /locus_tag="SPC32F_0022" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.00012" + misc_feature 20488..21228 + /gene="rmlB" + /locus_tag="SPC32F_0022" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 5.4e-77" + misc_feature 20491..21303 + /gene="rmlB" + /locus_tag="SPC32F_0022" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/iso, score 1.4e-05" + gene 21585..22436 + /gene="rmlD" + /locus_tag="SPC32F_0023" + CDS 21585..22436 + /gene="rmlD" + /locus_tag="SPC32F_0023" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI34160.1" + /db_xref="GOA:Q4K1G6" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K1G6" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITNEEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 21585..22433 + /gene="rmlD" + /locus_tag="SPC32F_0023" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 4e-147" + misc_feature 21588..22229 + /gene="rmlD" + /locus_tag="SPC32F_0023" + 
/note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.00013" + misc_feature 21588..22217 + /gene="rmlD" + /locus_tag="SPC32F_0023" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 9.9e-19" + misc_feature 21591..22319 + /gene="rmlD" + /locus_tag="SPC32F_0023" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 2.9e-08" + gene order(22512..23465,23476..23697) + /gene="tnp" + /locus_tag="SPC32F_0024" + /pseudo + CDS join(22512..23465,23476..23697) + /gene="tnp" + /locus_tag="SPC32F_0024" + /note="member of homology group 12" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1670 transposase" + misc_feature 22518..22961 + /gene="tnp" + /locus_tag="SPC32F_0024" + /note="HMMPfam hit to PF03050, Transposase IS66 family, + score 6e-05" + /pseudo + gene complement(23794..25050) + /gene="tnp" + /locus_tag="SPC32F_0025" + CDS complement(23794..25050) + /gene="tnp" + /locus_tag="SPC32F_0025" + /note="member of homology group 13" + /codon_start=1 + /transl_table=11 + /product="putative IS1167 transposase" + /protein_id="CAI34162.1" + /db_xref="GOA:Q4JZQ9" + /db_xref="InterPro:IPR002560" + /db_xref="InterPro:IPR012287" + /db_xref="UniProtKB/TrEMBL:Q4JZQ9" + /translation="MEQLHLITKLLDIKDPNIKILDIINMDTHKEIIAKLDYEAPSCP + DCGSLMKKYDFQKPSKIPYLETTGMPSRILLRKRRFKCYHCSKMMVAETPLVKKNHQI + PRIINQKIAQKLIEKISMTDIAHQLAISTSTVIRKLNDFHFEHDFSRLPKIMSWDEYA + FTKGKMSFIAQDFDNLNIITVLEGRTQAVIRNHFLRYDRAVRCQVKIITMDMFSPYYD + LAKQLFPCAKIVLDRFHIIQHLSRAMSRFRVQIMNQFERKSHEYKAIKRYWKLIQQDS + RKLSDKRFYRPTFRMHLTNKEILDKILSYSEDLKHHYQIYQLLLFHFQNKDPEKFFGL + IEDNLKQVHPLFQTVFKTFLKNKEKIVNALQLHYSNAKLEATNNLIKLIKRNAFGFRN + FENFKKRIFIALNIKKERTKFVLSQA" + misc_feature complement(24298..24594) + /gene="tnp" + /locus_tag="SPC32F_0025" + /note="HMMPfam hit to PF01610, Transposase, score 5e-48" + misc_feature complement(24634..24699) + /gene="tnp" + /locus_tag="SPC32F_0025" + /note="Predicted helix-turn-helix motif with score + 
1691.000, SD 4.95 at aa 118-139, sequence + ISMTDIAHQLAISTSTVIRKLN" + gene 25316..>25363 + /gene="aliA" + /locus_tag="SPC32F_0026" + CDS 25316..>25363 + /gene="aliA" + /locus_tag="SPC32F_0026" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34163.1" + /db_xref="UniProtKB/TrEMBL:Q4K1C2" + /translation="MMKSSKLFALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcgta taaaaacaag + 181 ggaggactgt ataaaaggca gaaatccttt gttttttata accaaggttt ataaaccttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga agacgaacat + 301 aaagaagcgt atccttagtg caggcctgac ttttacatct gctttgcttt tagctgcttg + 361 cgaccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaactat ctattagact attacgctga taatatagtc aattgaaaca agaacaagac + 481 aaaagagccc atgttttctc aataggattg tactcaggtg aatagggagg aagaggtaaa + 541 agtttatgcc caaactcttc acacaagagt tctagcttcc ccattctatg gaatcttgca + 601 ttatccataa taataaccga tggtgtggtt aatgttggta agagaaattt ctgaaaccaa + 661 gcttcaaaaa agtcgctcgt catcgtctct tcgtaagtca ttggagcgat taactcacca + 721 tttgttagac ctgcaaccaa agaaatcctc tgatatcttc ttccagatac tttgcctctt + 781 cttaactgac cttttaaaga gcgaccatgt tctcgataaa aataagtatc gaatcctgtt + 841 tcgtcaatct aaacaggtgc taggtgcttt aatctattaa aattcttaag aaataaggct + 901 actttttctg ggtcttgttc atagtaagtg tggttctttt tttcgagtgt agcccatagc + 961 tttgagcgca tagtggatgg tagttggatg acagccaaat tcagaagcta tttcagtcaa + 1021 ataagcgtct ggattgtcag taagatagtt tttaagtcta tctctatcaa cttttcttgg + 1081 ttttgttcct tttacttggt ggtttagctc tcctgttttt tcttttagct ttaaccagcc + 1141 ataaatggta ttacgtgaga tttggaaaac gtgtgatgct tctgttatac tacctattcg + 1201 ctcacaataa gagagaactt ttttacgaaa atctattgaa tatgccataa aaagattata + 1261 ccacattgtg tactatatta tattgaaact agaatagtac acatctgctt ctaaaatatt + 1321 gttagaaaac gatttgactg tcctgatcaa tttgtcatgt tcttatttca ttttactata + 
1381 ttttgctact ccccgtaaag tgtcaatcga aagtgattat gtcccaaaaa aatggagata + 1441 ttgaggtcaa ttattttgat ttcatttgac acgaggaacc cttgaagctg ttttgccagc + 1501 taaaccaagg ctagtcttag ccttggctcg ccagcctaac agctccaagc ctcgtgtcaa + 1561 atgaaatgct tgtcttacac tccttacttt ctcgctccta aatgtaaggg atagagtgat + 1621 ttcctttaag gaaaagcttc ccatttagcg agaaatagat tagacttgta gatgaggaga + 1681 atcaagctcc tcactagtaa actcttcata atccttttta tttttatgaa ggtattgttt + 1741 gaaagatgtg aatttccacg gatgggtttg tggagggata tacttgcgtc tttctttttt + 1801 tgttctggtt cttgttcaaa gtttttcgaa tagagttcat gaactagtag ctcctttgtg + 1861 tgatagattt tgtcagcgat attgaggtag atgtcaccat caaatgcttt tataactaat + 1921 gctttcgtct ttctgctgaa atagacttct tttccttgtt cggtagggat atagcaacga + 1981 ttttggaagc ggatatggtg tccactatcg acgactctct ccgccagtct agccagaatg + 2041 agatttcgtt cagagggctt aggagccttc tcaaagacag agagttttgt cttgtttcca + 2101 aactgttcat taaaggtttg gatgtaggaa agcaggaagg tattggcttc ttccaaggta + 2161 tgaatcttgt ttcgttccag ttcgataggc aggcgagatt gtagtgtctg attgagtctt + 2221 tcgactctcc ctttagcttg agggatagag gttgtctcca gaagaatccc cagttggtga + 2281 caggcgtatc cgaattgtgt atgggtatcg tcctccattt tcttagagtt ggagatttga + 2341 taggtaaaga ctgttttttt atctgttttg atttgaaggg gaatgccgtg gttgtctaaa + 2401 atttgttcga ggacatgata gtaagcattc aaggtctctt gtttatcaaa ataagcgcct + 2461 aggatattgc cagaagcatc atcaatggct aggtgtaagt tagaggtttg ggctccaaac + 2521 caggcatgag ggctggcatc catttggatg agttctccag caaatttctt tctgagtcta + 2581 ctaggatgta cttttttagg gtcttcaagg aaattttcag ctgtcggtaa gattggcttg + 2641 tctaggggtt gcttggggtt cagtttagct tgttttctta gtctcttctt tgtctttcta + 2701 tgggacttag gcgacaggat attttcctta tagagtattt ttctaacagt tgtatcagag + 2761 agctgaattc cttcttcttc agctagcaat tcacagaaat gacggacatt tggtttatat + 2821 gttttatagg agaggtattt ctttaggata cgttctttga tttcatcagg gattgcatgt + 2881 tttggttttc gatttctgtt tccgtgtctg aaggcttctt ttcctttcag ttgatagacc + 2941 agtagtagac gattgatttg cctttcagaa agattgagtt cggcacaggc tcgtttcttt + 3001 gttttctttc cttgggctat 
agcttttatc acaagatatt ttttcatttc attcatattt + 3061 agttggatcc ttttcatatg actattctac caaatgggac attttcacgt tcgatttact + 3121 aaagacatta tcacattcga atcccaaatt tcaagttgaa gttagccacc caaaagaaat + 3181 tcacttggcg acttgtagtc caagcatttt ttagggtagt tgttaatcca attttcgata + 3241 aaagctactt ctttcggagt cgttttcttg gttcctttag gtaaccatct ccgaattaat + 3301 cgattatgat tttcatttga acctctctcc catgaagagt aagcatgtgc gtagtagata + 3361 tgttcctcag gaaatacctc agacaatcgt ttgaactccg aaccattatc tgcagtaatg + 3421 gacagaatac gatgctcccc taatagtaac gtaagcgcct gattgacaga ttcagcagtt + 3481 ttatttggaa ttaaccttat aatttggtgt ctgctccgcc ggtcggttaa gactaacagg + 3541 caataatttt ttatcttagt cagtaggacg gtatcaattt cataatgacc attttccaag + 3601 cgaagattaa taacgtcagg acgttcttcg atagatttac ctgccggctt aaagttcgga + 3661 ctagcttgct tcttgacacc tttccttttt ctgggataaa gcatgtcggc cttcgtcaat + 3721 cctaaatgac cattatgaaa ccagtagtag atggttgaaa taccaacttt cacttgcttc + 3781 ttgttaacca tcatttcagg cgaaaatttt tgcttatgat agtgtaagat cttctctctg + 3841 atttcctttg ttaaaattaa ctttttcacc gaccgttttc gattgaattg gtaaacagtt + 3901 tgtgcgtaat cggcagaata gacctttttg tatagccctt ttctcacttg ttgtaaagtt + 3961 gtacctcttt tgacttcatt atgaatcgtt tgaggcgcct ttcctaacaa gcctgcaatt + 4021 tcacgattgg acttattttc attcttccac cgctcaatca agcgacggtt atctattgtc + 4081 aaatgtttcc cttttggggt ataatgttct tgcatctctg tgcctttcct tgtgtttgtg + 4141 gtgaacaaca agtatagcac agaggtgttt tcttatacct taaatcacat ttcatttgac + 4201 aacaggaacc cttgaacctg ttttttcagc taaaccaagg ctatgattag ccttggccac + 4261 ctagcctaac agtttcaaac ctgttatcaa atgaaatcat caacttactc aaacatagtg + 4321 aaacatctaa ttcttgacta aggtaaggtg gctaacttca ttatagaact ttcaatcaca + 4381 ttcgaatcac ataaagatgc agatagtaaa aaaagatgta gacattaccg taaaaaagtg + 4441 atataattgt acgatgttca aggtataggt gttaatcatg agtagacgtt ttaaaaaatc + 4501 acgttcacag aaagtgaagc gaagtgttaa tatcgttttg ctgactattt atttattgtt + 4561 agtttgtttt ttattgttct taatctttaa gtacaatatc cttgctttta gatatcttaa + 4621 tctagtggta actgcgttag tcctactagt tgccttggta 
gggctactct tgattatcta + 4681 taaaaaagct gaaaagttta ctatttttct gttggtgttc tctatccttg tcagctctgt + 4741 gtcgctcttt gcagtacagc agtttgttgg actgaccaat cgtttaaatg cgacttctaa + 4801 ttactcagaa tattcaatca gtgtcgctgt tttagcagat agtgagatcg aaaatgttac + 4861 gcaactgatg agtgtgacag caccgactgg gactgataat gaaaatattc aaaaactact + 4921 agctgatatc aagtcaagtc agaataccga tttgacggtt aaccagagtt cgtcttactt + 4981 ggcagcttac aagagtttga ttgcagggga gactaaggcc attgtcctaa atagtgtctt + 5041 tgaaaacatc atcgagtcag agtatccaga ctacgcatcg aagataaaaa agatttatac + 5101 caagggattc actaaaaaag tagaagctcc taagacgtct aagaatcagt ctttcaatat + 5161 ctatgttagt ggaattgaca cctatggtcc tattagttcg gtgtcgcgat cagatgtcaa + 5221 tatcctgatg actgtcaatc gagataccaa gaaaatcctc ttgaccacaa cgccacgtga + 5281 tgcctatgta ccaatcgcag atggtggaaa taatcaaaaa gataaattaa cccatgcggg + 5341 catttatgga gttgattcgt ccattcacac cttagaaaat ctctatggag tggatatcaa + 5401 ttactatgtg cgattgaact tcacttcttt cttgaaaatg attgacttat tgggaggggt + 5461 agatgttcat aatgatcaag agttttcagc tctacatggg aagttccatt tcccagtagg + 5521 gaatgtccat ctagactctg agcaggctct aggttttgta cgtgaacgct actcactagc + 5581 cgatggagac cgtgaccgtg gtcgcaacca acaaaaggtg attgtggcta tccttcaaaa + 5641 attaacgtca accgaagcac tgaaaaatta tggtacgatc attaatagct tgcaagattc + 5701 tatccaaaca aatatgccac ttgagaccat gataaatttg gtcaatgctc agttagaaag + 5761 tggagggaat tataaagtaa attctcaaga tttaaaaggt acaggtcgaa tgggtcttcc + 5821 ttcttatgca atgccagaca gtaacctcta tgtgatggaa atagatgata gtagtttagc + 5881 tgtagttaaa gcagctatac aggatgtgat ggagggtaga tgaaatgata gacatccatt + 5941 cgcatatcgt ttttgatgta gatgatggtc ccaagtcaag agaggaaagc aaggctctct + 6001 tggcagaatc ctacaggcag ggggtgagaa ccattgtctc tacctctcac cgtcgcaagg + 6061 gcatgtttga aactccggaa gagaagatag cagaaaactt tcttcaggtt cgggaaatag + 6121 ctaaggaagt ggcgagtgac ttggtcattg cttacggggc tgaaatttac tacacaccag + 6181 atgttctgga taagctagaa aaaaagcgga ttccgaccct caatgatagt cgttatgcct + 6241 tgatagagtt tagtatgaac actccttatc gcgatattca tagcgccttg agcaagatct + 6301 
tgatgttggg aattactcca gtcattgccc acattgagcg ctatgatgct cttgaaaata + 6361 atgaaaaacg cgttcgggag ctgattgata tgggctgtta cacgcaagta aatagttcac + 6421 atgtcctcaa acccaaactt tttggcgaac gttataaatt catgaaaaaa agagctcagt + 6481 attttttaga gaaagatttg gttcatatca ttgcaagtga tatgcacaat ctagacggta + 6541 gacctcctca tatggcagaa gcatatgacc ttgttaccca aaaatacgga gaagcgaagg + 6601 ctcaggaact ttttatagac aatcctcgaa aaattgtaat ggatcaacta atttaggaga + 6661 aatgatgaaa gaacaaaaca cgatagaaat cgatgtattt caattattta aaaccttgtg + 6721 gaaacgcaag ctaatgattt tattagtggc acttgtgaca ggtgcggggg cttttgcata + 6781 tagcgctttt attgttaagc cagaatatac gagtaccacg cgaatttacg tagtgaatcg + 6841 caatcaagga gacaagtcgg ggctgacaaa tcaggatttg caggcaggat cttatctggt + 6901 aaaagactac cgtgagatta tcctttcgca ggatgtattg gaaaaagtag cgacaaattt + 6961 gaagttggat atgccagcca aaacgttaac cagaaaagtt caagtgactg taccagttga + 7021 cactcgtatc gtctcaatct ctgtcaagga taaacagcca gaggaagcca gtcgtatcgc + 7081 taattctcta cgagaagttg ctgcagaaaa gatcgtcgct gtaacgcgag tatctgatgt + 7141 aacgacactt gaagaagcgc gaccagctac gaccccctct tctccaaatg ttcgacgcaa + 7201 ttccttgttt ggttttcttg gaggagcagt cgtaacagta attgctgttc ttttgattga + 7261 gttgctcgac atccgtgtga aacgtcctga agatgtcgaa gacgtactgc aaattccact + 7321 tttaggggtc gttccagatt ttgacaaaat gaaataggag gaaattatgc caacattaga + 7381 aatctcacag gcaaaattgg attttgtaaa aaaggcagag gaaaattata acgctttgtg + 7441 cacgaaccta cagttaagtg gagatgattt gaaagtattt tctatcactt ctgtgaaaca + 7501 aggagaagga aaatcaacga cttccaccaa tatcgcttgg gcttttgcgc gtgcaggtta + 7561 caaaacgctg ctgattgatg cagatattcg caattctgtt atgttaggtg tctttaaagc + 7621 aagggataag attacaggcc tgacagaatt tttatcagga actacagacc tatcacaagg + 7681 gctttgtgat accaatatcg aaaatctctt tgtaattcag gctggctctg tgtcaccgaa + 7741 tccgacagct cttcttcaaa gtaagaattt cagtacaatg cttgaaacct tgcgtaaata + 7801 ttttgactac atcattgtag atactgctcc tgtcggtgtc gtgattgatg cggctattat + 7861 tacgcgaaaa tgcgatgctt ctattttagt gacggaggca ggtgaaataa atcgacggga + 7921 tattcaaaaa gcaaaagaac 
agttggaaca cacagggaag ccgtttttgg gagttgtgtt + 7981 gaataaattc gatacttcag tagacaaata cggttcttat ggaaattatg gagattacgg + 8041 gaaaaataaa aaataggtcg ggggatagag atgaacggaa aaatagtaaa gtcttcattg + 8101 gccataatcc agagttttct tgttatttta ttgacttatc tacttagtgc tgtgagagaa + 8161 gcggagattg tttcaacaac agctattgca ctttatatcc tccattattt tgtcttttat + 8221 atcagtgatt atggacagga tttctttaaa aggagatatt tgattgaact tgtccagaca + 8281 ttgaaatata tcctattctt tgcactagcg attagtattt ctaatttttt cttagaggat + 8341 caatttagta tttccagacg aggcatgatt tacttcctca cattacatgc tctcttagtc + 8401 tatgtgctaa acctatttat caagtggtat tggaagcggg cttatcccaa ctttaaagga + 8461 agtaagaaga ttctcctact tacagcaact tctcgtgtcg aaaaggtact ggatagatta + 8521 atagaatcaa atgaggttgt tggggagttg gtagccgtca gtgtcttaga taaaccagat + 8581 tttcagcatg attgtttaaa gatagtagca gagggggaga tagtaaactt tgcgactcat + 8641 gaggtggtcg atgaagtctt tatcgatctt ccaagtgaaa aatacaatat tggagagctt + 8701 gtctctcagt ttgaaacgat gggaattgat gtaacagtta atctaaatgc ttttgatcgt + 8761 agtttggcac gtaacaagca aattcgtgag atggcaggat taaacgttgt gactttttct + 8821 acaacatttt ataagactag ccatgtaatt gctaagcgga ttattgatat tatgggtgca + 8881 ttggtagggc tgatactatg tggtttagtc agtattgtac tggttccttt gattcgaaag + 8941 gatgggggct ctgctatttt tgctcagacg cgtataggaa aaaatggtcg tcagtttact + 9001 ttttataagt ttcgctctat gtgtgtagat gccgaggcga aaaaaagaga actcatggaa + 9061 caaaatacca tgcagggtgg aatgtttaag gtggacgatg atcctcgtat cacgaaaaat + 9121 ggtcgtttta tacggaagac tagcttggac gagctaccac agttttataa tgttctaaag + 9181 ggagatatga gtttggttgg cacacggcca ccaacagtgg acgagtatga acactatacc + 9241 ccagaacaaa aacgtcggct aagttttaaa cctggtataa caggcttatg gcaggtcagt + 9301 ggacgaagtg agattaagaa ttttgatgaa gttgtcaaat tagatgtagc ctatatagac + 9361 gattggacaa tttggaaaga cattgaaatt ttattgaaga cagttaaagt tgtattgatg + 9421 aaagatggag cgaagtgatt tttgcccctc agtcttgtta ggagagagat gaaacagtca + 9481 gtttatatca ttggttcaaa ggggattcct gccaagtatg gaggatttga aacctttgtt + 9541 gagaaattaa cagaatatca aaaagatggt aacatccaat 
actatgttgc ctgcatgcgc + 9601 gaaaattctg caaagtcagg atttacagca gatacatttg agtacaacgg tgctatttgt + 9661 tacaacattg atgtgcctaa tattggtcct gctagagcca tcgcttacga tattgcagcg + 9721 gtcaataagg ctattgaatt ggctaaggga aacaaggacg aggctcccat tttttacatt + 9781 ctagcttgtc gtatcggacc ttttatttct ggacttaaga aaaaaattcg ttcggtcgga + 9841 ggccgtttac tggtaaatcc agatggccat gagtggcttc gggctaaatg gagcatgcca + 9901 gttcggaagt attggaaatt ttcggaacag ttgatggtca agcatgcaga tttattagtc + 9961 tgtgatagca aaaatatcga aaaatatatc cgagaggact ataaacagta tcagcccaag + 10021 acgacctata ttgcttatgg tacagatact accccttcaa gtctaaaatc agaagatgtc + 10081 aaagttcgaa actggtatcg tgaaaaggga gtaagcgaaa atggctatta tctagtggtg + 10141 ggacgattcg ttcccgaaaa caactatgaa accatgattc gtgaatttat caagtctaag + 10201 tccaataagg actttgtcct tattacaaat gtggagcaaa ataaatttta cgatcagttg + 10261 ctgaaggaaa caggtttcga caaggatcca agagtcaaat ttgtgggaac agtctatgac + 10321 caagaattgc tcaaatacat ccgagagaat gcttttgctt acttccatgg ccatgaagtt + 10381 ggtgggacaa acccatcgct tttagaagcc cttgcatcaa caaaactaaa tttgttacta + 10441 gatgttggtt ttaaccgtga agttggtgag gatggagcta tttattggaa aaaagatgtt + 10501 ggtgatttag ccagattaat tgacattgtt gacagaaagg atgagacgtt tcgggaaaag + 10561 cttggcttaa tggcgaaaga tagaattgaa acagcatata gttggcaatt cattgaaaaa + 10621 gagtataagg agatttggga tgaggaagcg atatgataat ttggatggat tacgagtaat + 10681 ttcttgtctg ggtataatag cgatgcatat taaagctaat gctgactatc aaatttatgg + 10741 ttggatattt gaagtgttcg taccgtcttt aacgttgctt gtctatttat tcttacttat + 10801 tagtgggttt ggaatgtttt gtggctatta cgagcgattt aaagaaggaa aaattgatct + 10861 aaataatttt tataaaaaaa ggtataaaaa gattatccca ttttttgctt ttttgatttt + 10921 tatagatatt ttagtagaac gaagtttttc gcatttgatt gaaggattta ctgaagctac + 10981 acttgtcttc ggccttctgc cgaataatca accggatgtt attggtgtta gctggacgat + 11041 tggggttatt ttccttttct atatgctttt tccttttttt gtatggctat gctgggataa + 11101 aaagagggcg tttattagtt ttataatttc agttatattg aatatatttt gtgagatata + 11161 ttacttcact gataagtttg ttatagattc gtttgcgtcg 
cgtcatagtt ttttatactg + 11221 ctccccgttc tttcttggag gtggcctcat ttatatgtac agaaaggaaa taaaagattt + 11281 tgtttcgcaa cgtaaattgt tctgcttact tggttgttta ggtattacag gtttccatta + 11341 tctattcatt caaccttggt ttaaaatgga taatttagga tctttattgt tacttcttta + 11401 ccttccatgg ctttgctatg ctataagcgt tgatagtata gttcttagta acaaagtaat + 11461 gaaatatttt agtaaaatta gcttagaact ttatttagcg catatggtac tttttcgagt + 11521 tgttgagaaa atgaatttct tatatttttt tggtaaaggc tggcttagct tcatattagt + 11581 ttttgtagct gttcttattg gattgatttt attgattgaa tttttgaaaa agatgacaag + 11641 tttttctagg agattgctaa taaaggagta atttaagtgg tgtgatgtca tcaagattta + 11701 agttaaagag aatataggtt gatagaaaaa atatttcctt tttctaaagt gtggattaca + 11761 aatgctactt tttgtaaact aattaataaa tttctatagc actaatatat attacctcta + 11821 agaaaatgat ggaaagtgtg gaaaattaaa cttggatatg aacaaaatta caataagaga + 11881 attgataata ctatttgtgt taattctttt tatatttcaa aatcttttag aaaagtattt + 11941 tgtatatgct cagtatattg atgaaatagt tgcattatta tttctcattc attacttttt + 12001 aagagtagtg ttaaataaga gtatttcaaa aaaattttcc cgacttgttc ttcttttatt + 12061 aactatcata ttaattactt taatttcaaa tttttggaat aatgtgcaaa ctaatatttt + 12121 aattatctcc attgatttat ttagtatttt taaatttatt tttatatttt tgggggcaca + 12181 atcttttctc aatgacttaa cgcataaaga aataaaaaga ataattttac gagtttactt + 12241 tattagtaat atatacttat ctgttttgat tgtcttagca tttttaaata tttttatagg + 12301 cttaggaatg catcaagaat atcgctatgg tttaccaact ttttctttta tttttggtac + 12361 gccaggtcaa gtaattaatc tctcgattat attcttactt ctatatcagt taaataaact + 12421 ttataattct aaaaataatc tcattcattt agtattaatt tttttattac tgctgtctac + 12481 attaaaaaca cgggcaattg tcttagcaat tgtgtttgtc tatattctct atctatttga + 12541 aatacgaaat atttcatcaa tgaaaaagag agtacttcct gttctaggct tgggagcagt + 12601 ggttgggttt gaacaattta aaacttattt tttgacttct gatactccaa ggctcacatt + 12661 atttaaatac ggtatgctta caatgagacg ctattttcct ctgggaagtg gttttgctac + 12721 atatggatcc gatattgctg ctaaaaacta ttctctgtta tattatcaat atggatttca + 12781 taacagatat ggaatgaatc catatgatat tagattttta 
aatgataatt tttatccaat + 12841 gatttttgca caatttggat ttttaggagg aatactttat gtatttctac tattagatta + 12901 ttttagatta ttattacgtg ttgcaagtat aaatgataag gttattaaaa cttcagtatt + 12961 tatttatatc tttaatgttg tcttatcgtc tattcaatca tcttatccgg gaacgaattc + 13021 aatggtaata acaacgtttc taatctgttt aatattgaga tatagtgaca agtggaggat + 13081 tttatgatta tagaagctat aggtttacct ggaagcggaa aaacgttttt attccatgag + 13141 cttgaaaaag aatttcggag taattcaatc agaacttata attttactga attatcacgg + 13201 aataatattt cagtcaaaat tgttgtaaaa ttattgctaa agtttgtatc gttgaaatat + 13261 atttgtaaaa aatggaaaaa agaattatac gatattcttt ctgaagagct tccgtatgag + 13321 agtaaatttg atttatatga aaatccagat tattgtgtga attatgcgct tatgcttctc + 13381 tttatctata gattatttca aaatagtaaa attgtattat tactagatga gggaatgtat + 13441 cataatattg tgaaattatg tgctgacttt gatttttcaa tcagactatc aaataagtta + 13501 attgaaaaat gtgtattgtt aagtagatta aatgatagta agcatatagt tatttacaat + 13561 atttttccaa tttctgagac actattgtct attgaaaaac gtaatcgaca tgtgtctaaa + 13621 tttgatgaac tagaaactac ccagttgagc aagatattag ataactacga taaactaaat + 13681 aatgcaatct ataataatga caaaaaacag ataatatcag tttttagaaa ggattttatt + 13741 gaaaagaata tttcttatat aaaacaaaat ttaaatattt aatgctctgc tagttattat + 13801 tttggcaggt aatataagcg tttattctct aataattgat aagtacgatg aggtataata + 13861 tggtaatttt tgtggtgttg cattacatgg tttttaaaga aactaaacaa tgcgtcaatt + 13921 caattaagaa taatgttaaa ggagaaaaga aaattataat tgttgataat tgttctccta + 13981 atggctcata tagtagttta gtagatgctt ttggttgtga taaagatatt attattatga + 14041 agtcagatag taatttaggc tttgctaggg gaaataatct tggttataaa tatgcagttg + 14101 aaaattttaa tccagatttt attgttgtaa tgaacaatga tatggaaata tttcaagaag + 14161 attttattga taaactgtat gaaagttacg caaagtatgg ctactatata ttaggtccag + 14221 atatatattc aactaaacag gaatatcatc aaaatcctca gacaagaaag gttctggata + 14281 ggtctgattt gaagttatta tatcgaaagc tagttattaa agataggcta aggttcttag + 14341 ttcctgtaaa atggtggttt aaaaatatat taattaaaaa taaaagtgta gataataatt + 14401 caaaagataa aaatgaatat gttcaaaata tagtaaaaaa 
tccgttatta catggctcgt + 14461 gttatgtttt ttctaagaag tttactgaaa aacatcaaca cacatgtttt tatgataaaa + 14521 cgtttatgta tatggaggca gaaattttac attatatggc attgaagaac aatgaattaa + 14581 tgctttatta cccagattta aaagtttacc atcatgaaga tgtggcaaca gattcaacgt + 14641 ttgtaaagca atataagaaa tcgttcttct caatcaggtg tctactgcag tcaacaaaag + 14701 cgtttattga tttaattgat tcagataaaa aagagtaaca aatggaaagt caaaaaaaga + 14761 gcgttgaaaa gaattatatt tataatttga tttatcaaat gctaactgta gttattccaa + 14821 ttatcataac accctatatt tcacgtgttc taaacgctga tgggataggg atttttagct + 14881 acacaacagc agtggtaggt tattttgttt tattgggtaa tttaggaatt gcaacttacg + 14941 gacaactaca agttgctaaa taccaagaag acagatttaa attatccaaa atattttttg + 15001 agttattgat tttacgaact atattgcttt tactagtttt actgatatat cttgtattta + 15061 tccaatttca agatataatt tataaatcta tttattacgt tttaataatt caaatacttt + 15121 gtagtttgct ggatatttca tggtttttgc agggtcttga agaatttaaa agtattgtga + 15181 tgcgtaatac cctaataaag gtgttaagtg taatatctat cttgattttt gtaaaaaaag + 15241 atacagattt gattttatat gctttgatta tgaacgcatc aacactgctt ggaaatattt + 15301 ctatttttgc atatgtacct aaatatgttc aaagagttaa gttggctgag attaatttat + 15361 taaagcatat ttcacactgt ttagtttact ttataccaac aatagcaact acaatatatt + 15421 taactttgga taagacaatg ataggttggt tttccttaaa tacttttgaa aatggttatt + 15481 atgagcaggc tcaaaaaatt gagcagatgg ttgtgacaat agttacatct ttaagtgtag + 15541 taacgatgcc tagaatgact tatttattga ataacaatca atttcaagaa tttaaagtgc + 15601 gacttgaaca atcgataagg tttatccttt ttttatcctt acctatgagt ttaggattag + 15661 tagggatagc aaataatttt atacctttgt ttttaggtgt aggatttgaa aagtctatat + 15721 caatattaaa gatttttagt ctactagtta tcattatagg tttaaataat gcattaggga + 15781 agcaaatact tatgccttca gggcagcaaa gggcttataa tattagtgtg gtaataggtg + 15841 ctgttatcaa tatagtcttc aatttaatat tgataccgca atttttttca ctgggtgctg + 15901 cgatttcttc cgttcttgca gagtttgcaa ttttaataat atttctctat tattctagaa + 15961 attgtattcc tcctaaatgg gttattagaa cagcagtgaa ataccttgga tctagtatag + 16021 taatgtttct tattattagg acaatagagc tactatctcc 
tccttcgtgg acagttgtta + 16081 taatacaagt cattgttgga gtcgcagtat atattctatc gttatatata ttaaaagatc + 16141 aaattgtaag aaaatactat ctaagattga gaaaactaaa tgttcttgca aggaaagtat + 16201 gagagtctta taataattat tcagaatatg gagagatttc agtgagtatt ttttcaacat + 16261 tgattaaaaa aaagggcgca gagattttta aagacttaat tcagtcaaga gtgcttttta + 16321 gaacgatagc tattttacct ctggttggtt tttcaaaaaa atcattagag atagtccgtc + 16381 taaataatag taatgtagtt ctttcaaaat tgagaaggaa gtataagcag actattaaaa + 16441 acttggatag agagaaacag tattcactta gctataatca gcgacataaa gatgcatcaa + 16501 ataagatatg gatttgctgg tttcaaggct tagatactgc ccctcatgtg gttcaggagt + 16561 gtatcgcttc ggtaaaaaaa cacctagcag acagagaagt ggttgtttta acagatgaaa + 16621 attaccatca gtatgtgact tttccagact atatcaaaga aaaagcaacc cagggtttta + 16681 tttcaaaagc gcactttgca gatttattgc gcttggaatt actgaccgag tatggtggta + 16741 cgtggattga tgggacgata ttttgttcga gttcagatat tcctgcctat atgttagatt + 16801 ctgatttatt tctatttcaa aatttaaaac caggtcttga tggacaggca ttggcaattt + 16861 ctaattggtt cattactgct agctactcta accatcctct tttaaatatg acgaaagatt + 16921 tgctttatga ttattggaag aatcataatg gagtggttga ttattttatt tttcatcact + 16981 tctttcagtt atcaatcgaa gaatttcctg aatactggag taaggtagtt cctttcaata + 17041 attcaactcc tcatattttg cagttacgct tatttgaaga gtttgacgaa gtgatgtatg + 17101 gttatattct cgaacagaca ccattccata agctaacata taaatttgaa gaagaaaagt + 17161 cgagaatacc gaatacttac tataaacact tattttgata aaaatgatag tagttgattg + 17221 agagactgtt gttaggtata gaatgctatt gagattttat cgggagggat gatatgaaag + 17281 aactaactac tcgagagatg caagaagtat cgttggagat tttacacacg attgctagta + 17341 tttgtgaaaa acaccatttt cgctatgctt tgatttacgg gactttaatt ggtgcggtta + 17401 ggcataaagg gtatattcct tgggatgatg atgttgacat tatgatgcct cgaccagatt + 17461 atgaccgcct attggagtat ttgaaggaaa atatcgccga ttatccacat ttaaaagtat + 17521 tcaatcgaga agagtgtcca gaatatcctt atatgattac tcgaattagt gatcagagat + 17581 accggattga gatggaaaat gagaaacctt ttgatttggg ggttttcatt gatatctatc + 17641 cctatgatgg tttgggagat acgaaagaag aggcggttga 
ctttggtatg aagggggatc + 17701 gtttatcgtc gttttgttat caggcaacta gagaacattt tgcgattgaa acgacaacat + 17761 caacttttag gaagttgatt aagtatccag tttatttatt ctctaaaatg attgggaaag + 17821 attacttcca aaagcaacta gccaagttag ccagagttaa agactacgat aacagtgaat + 17881 atgtaggttg cgttatttgg ttgtcatggg gagaaaaaga tatttttccg cgtgaatggt + 17941 ttgatgagac tattttggtt ccttttgaga aatatgaatt taggattcct aaagaatttg + 18001 ataaagttct acggcatgaa tatggagatt acatgatttt gcctccagag aaggatagag + 18061 tagggcatca ctattttaaa gcttataaaa aatgataatt tgctaagcaa agaaaaggaa + 18121 aatcatgaaa ttattttatt tacaattgga gtagaaagtt taagggtgga gtttttctgc + 18181 tcagagttct atatggtttt gagtgcccac gtaaagctaa aattgggaaa aacgtcaatt + 18241 tttcacatcg tgggatggga acagttgtaa gtagtaatgc tatcattggg gataatgtga + 18301 ctatacaaca tcatgtaaca ttaggaatta aaaacgataa tgatagaatt atcatcgggg + 18361 agaactgttt tataggagcc tatgcattta tcttaggaaa tgtaaaaatt ggtgcaaatt + 18421 ctaagattgg agcaggtacg atggttttac atgatgtccc agatggaagc acagtagtta + 18481 atcctgtgga actaaaagca cttgcttcaa aaaaagacgt tcagtaagag agaaatgaat + 18541 agaatattga aaacaatgtt ataggaaagt catggtaaca ctttataata ctgaaaattt + 18601 tattcacttt ttaacacatt agagttaatg tttactccac aaatttaatt taatcactca + 18661 ataaagagat taagagacaa gcaaaaaaaa gattgtcttt ccgaatggag aagccttaga + 18721 ttattgtctg gttccgatga atacaaagta aaatataaaa attgcaataa caaagaattc + 18781 gaattttgtt caggtgcttt ataaagccta tttgagtaat taaatagcaa cttgacactg + 18841 tgattacata aaattattga taagcctaat ttttatttaa tcgtatggat tatttataaa + 18901 aaatgtataa aattgaatat aaatgtgagg tgtgattttg gtttataaac atgggaaaat + 18961 aaaagtgcaa ataacaaaga aaggtaccct actatgaaag gtattatttt agcaggtggt + 19021 tcggggacac gtttatatcc tttgactcgc gctgcatcaa aacaacttat gccggtttat + 19081 gataagccga tgatttacta cccactttca acattgatgt tggctgggat tagggatatt + 19141 ttgattattt ccactccaca ggatttacat cgattccaag agcttcttca agacggatct + 19201 gagtttggga tcaaactttc ttatgcagag caaccaagtc cagatggttt ggcacaagcc + 19261 tttatcattg gggaagagtt tatttctgat gatagcgttg 
cgctaatctt aggtgataat + 19321 atctaccatg gttctgggct ttccaagatg ctacaaaagg cagcgagtaa ggagtcggga + 19381 gcaactgttt ttggctacca tgtcaaggat ccagagcgct ttggtgtggt tgagtttgat + 19441 caggatatga aggctatttc tattgaagaa aagccagagt accctcgttc aaactatgca + 19501 gttacaggtc tctatttcta tgataatgat gtagtagaga ttgccaagag tattaaccca + 19561 agtcctcgtg gtgaactgga aattacagat gtaaacaagg cttacctaga tcgtggtggt + 19621 ttgtctgttg agcttatggg acgtggcttt gcttggctgg atactggaac tcatgaaagt + 19681 ttactagagg cctcacagta catcgaaaca gtgcaacgga tgcaaaatgt tcaggtagca + 19741 aacttagaag aaattgctta ccgtatgggc tatatcagta aagagcaagt gcatgaattg + 19801 gcgcagccgt tgaagaaaaa tgaatacggg cagtacctgc tccgtttgat tggagaagta + 19861 tagatgacag ataatttttt cggtaagacg cttgcggcac gcaaggttga agctattcca + 19921 ggcatgttag agtttgatat ccccgttcat ggagataatc gtggctggtt taaagaaaat + 19981 ttccaaaagg aaaaaatgct tccacttgga tttccagagt ctttctttgc agaaggaaaa + 20041 ttgcaaaaca atgtatcctt ctcacgtaaa aatgtccttc gaggcctcca cgcagagcct + 20101 tgggataagt acatctctgt agcagatgga gggaaagttc tgggttcttg ggttgatcta + 20161 cgcgagggtg aaacctttgg gaagacctat cagacagtaa ttgatgcaag caagggaatc + 20221 tttgttcctc gaggcgtagc taatggcttc caagttttat cagatacagc ttcatatagc + 20281 tatctggtca atgattactg ggctcttgaa ctcaaaccca agtatgcctt tgtgaactac + 20341 gctgatccaa gccttggtat tgaatgggaa aatctggaag aagcagacgt atctgaagca + 20401 gacaaacatc atcccctact taaggacgtg aagcctttga aaaaagaaga tttggaataa + 20461 ggaaagaata tgactgaata caaaaatatt atcgtgacag gtggagctgg ctttatcggt + 20521 tctaactttg tccattatgt ttacgagaac tttccagatg ttcatgtgac agtcctagat + 20581 aagttgactt atgctggaaa ccgcgcgaat attgaggaaa ttttaggcaa tcgtgttgag + 20641 ttagttgttg gtgacattgc tgatgcggag ttggtagaca agttggctgc tcaagcagat + 20701 gctatcgttc attatgcagc ggaaagccac aatgataatt cgctcaatga tccatcgcca + 20761 tttattcata ctaacttcat tggaacctat actcttttag aagctgctcg taagtacgat + 20821 attcgcttcc accatgtatc gacagatgaa gtttatgggg atctcccttt acgagaagat + 20881 ttgccaggtc atggtgaagg cccaggtgag aaatttactg 
ctgaaacaaa atacaaccct + 20941 agctctccgt actcatcaac caaggcagcc tcagatttga ttgtcaaagc ttgggtgcgt + 21001 tcttttggag tcaaggcaac gatttccaac tgttcaaata actacggtcc ttatcaacat + 21061 atcgaaaaat tcatcccacg tcagattact aacatcctaa gtggaattaa gccaaaactt + 21121 tacggtgaag gtaagaacgt tcgtgactgg attcatacca atgaccattc ttcaggagtt + 21181 tggacaatct tgacaaaagg gcaaatcggt gaaacctact tgattggggc tgatggtgag + 21241 aagaacaata aggaagtttt ggaacttatc cttaaggaaa tgggacaagc tgcggatgcc + 21301 tatgatcatg tgactgaccg tgcaggacat gaccttcgct atgcgattga tgccagcaag + 21361 ctccgtgatg agttggggtg gaaacctgaa tttactaact ttgaagctgg gctcaaggca + 21421 acaatcaagt ggtatacaga taaccaagaa tggtggaaag cagaaaaaga agctgttgaa + 21481 gccaattatg ctaagactca ggagattatt acagtataaa aagcaggaaa tagctgcttt + 21541 ttattgctat attgggaaga gttacatatt agaaaggtct agagatgatt ttaattacag + 21601 gggcaaatgg ccaattagga acggaacttc gctatttatt ggatgaacgt aatgaagaat + 21661 acgtggcagt agatgtggct gagatggaca ttaccaatga agaaatggtt gagaaagttt + 21721 ttgaagaggt gaaaccgact ttagtctacc attgtgcagc ctacaccgct gttgatgcag + 21781 cagaggatga aggaaaagag ttggacttcg ccatcaatgt gacggggaca aaaaatgtcg + 21841 caaaagcatc tgaaaagcat ggtgcaactc tagtttatat ttctacggac tatgtctttg + 21901 acggtaagaa accagttgga caagagtggg aagttgatga ccgaccagat ccacagacag + 21961 aatatggacg cactaagcgt atgggggaag agttagttga gaagcatgtg tctaatttct + 22021 atattatccg tactgcctgg gtatttggaa attatggcaa aaacttcgtt tttaccatgc + 22081 aaaatcttgc gaaaactcat aagactttaa cagttgtaaa tgaccagtac ggtcgtccga + 22141 cttggactcg taccttggct gagttcatga cctacctagc tgaaaatcgt aaggaatttg + 22201 gttattatca tttgtcaaat gatgcgacag aagacacaac atggtatgat tttgcagttg + 22261 aaattttgaa agatacagat gtcgaagtca agccagtaga ttccagtcaa tttccagcca + 22321 aagctaaacg tccgctaaac tcaacgatga gcctggccaa agccaaagct actggatttg + 22381 ttattccaac ttggcaagat gcattgcaag aattttacaa acaagaagtg agataagtag + 22441 tagaatgatt ttctagtcta ataaaagagg tagataatga actccaaagg agcttaagat + 22501 atacgattat cttgttgttg gtgctggtct ctttggtgca 
tagctatggc tcagtttcta + 22561 ttatcgctca caccatccat cagaagttta atctgaaggt acccaattat cgccaagaag + 22621 aagattgggc taagatgggt ttaccaatca cacgcaagga aatctctaat tggcatatca + 22681 agacgagtca atactatttg gagcccctct ataacctctt gcgagagaga ctattgactc + 22741 agcccttact tcatgcggat gaaacttctt atagggtgct ggagagtgat agtcagctga + 22801 cttactattg gacttttttg tcaggtaaat cagagaaaca agggattacg ctttaccacc + 22861 atgatcagtg tcgaagtggt tcagtagtac aagaattcct aggagattat tctggctatg + 22921 tgcattgtga tatgttgcgg cagtaactta ggactttagt cctctagttc tgcctatgcg + 22981 atagcagtcc aaggtttagg agcaaggcga cgctaagctt ggtaaactgc gaaccgctag + 23041 aagcttatcg tcaactggaa gaagctgaac ttgttggatg ttgggtacat gtgagaagga + 23101 agttttttga agcgaccccc aagcaagcgg ataaatcatc cttaggagct aaaggtttag + 23161 cttattgtaa tcagttattt tccttggaaa gagactggga ggctttgcca gctgatgaac + 23221 gactacagaa acgtcaagaa gagctccaac ccctactgga agacttcttt gcttggtgcc + 23281 ggcgtcagtc agttttatcg ggttcaaaac taggaagggc aattgaatac agcctcaagt + 23341 ataaagaaac ctttaagacc attttgaaag acggacatct ggtcctttcc aataatctag + 23401 ctgaatgcgc cattaaatca ttggttatgg gacggagtaa aagagtccag tggactcttt + 23461 tagcctaagc tcagtttaaa aaagcgaggg tggttatttt ctcaaagttt tgaaggagct + 23521 aaagcaagag ctattattat gagtttgttg gaaacagcta aacgtcatca attaaatagc + 23581 gagaaatatc tattctatct tctagaatgt cttccaaacg aggaaactct cgtaaacaaa + 23641 gaggttttag aggtttattt atcatggact aaagttgtac aagaaaagtg caaataagaa + 23701 atctccagat taggaactat ccgtgagttc tctagtctgg agatttttca atatacttcg + 23761 gctctttgtc aactgtagtg ggttgaagaa aagctaagct tgagaaagga caaatttcgt + 23821 cctttctttt ttgatattca gggcgataaa aatccgtttt ttgaagtttt caaagttccg + 23881 aaaaccaaag gcattgcgct tgataagttt gatgagatta ttggtcgctt ccagtttggc + 23941 attagaatag tgtagttgaa gggcgttgac gattttctct ttgttcttta gaaaggtttt + 24001 aaagacagtc tgaaaaagag gatgaacctg cttcagattg tcctcaatga gtccgaaaaa + 24061 tttctcaggg tctttgttct gaaagtgaaa aagtaagagt tgatagatct gatagtggtg + 24121 tttcaagtct tctgaatagc ttaaaatctt gtcaagaatt 
tctttatttg ttaagtgcat + 24181 gcgaaaagta gggcgataaa aacgtttatc gctcaattta cgactatcct gttggatgag + 24241 tttccagtaa cgcttgatag ccttgtattc atgagatttt cgttcaaact gattcataat + 24301 ttgaacacga aaacgactca tggcacggct gagatgttgg ataatatgga aacgatctag + 24361 aacgatttta gcacacggaa aaagctgttt agccaagtca tagtaaggac taaacatatc + 24421 catcgtaatg attttcactt gacaacgaac ggctctatcg tagcgaagaa agtgatttcg + 24481 gatgacagct tgtgttctgc cttcaagaac agtgataata ttaagattat caaaatcttg + 24541 cgcaatgaaa ctcatctttc ccttagtgaa ggcatactca tcccaagaca taatctttgg + 24601 aagccgagaa aaatcatgct caaagtgaaa gtcattgagc ttgcgaatga cagttgaagt + 24661 tgaaatggcc agctgatggg caatatcagt catagaaatt ttttcaatta acttttgagc + 24721 aattttttgg ttgatgatac gagggatttg gtgatttttc tttaccaggg gagtctcagc + 24781 aaccatcatt tttgaacagt gatagcactt gaaacggcgt tttctaagga gaattctaga + 24841 aggcatacca gttgtttcga ggtaagggat cttagacggt ttttgaaagt catatttctt + 24901 cattagactt ccacaatcag ggcaagatgg agcctcataa tccagcttag cgataatttc + 24961 tttgtgggta tccatattga tgatatctag aatcttgatg tttgggtctt taatatcgag + 25021 cagttttgtg ataagatgta attgttccat atgattcttt ctaatgagtt gttttgtcgc + 25081 ttttcattat aggtcatatg ggactttttt tctacacaaa aataagctcc ataatatcca + 25141 taggggattt acccactaca aatattatag agcctatact tcgttattgg gcggttacga + 25201 tattcatatt ttttgcaaag atattgtttg aaaaataatt ttcaaaaatt ctgaaaattc + 25261 tgttgacaac tttctgaaaa gagtctataa tggagagaaa gttttaaagg agaaaatgat + 25321 gaaaagttca aaactatttg cccttgcggg cgtgacatta ttg +// + diff --git a/public/res/serotype_genbank/serotype_33A.gb b/public/res/serotype_genbank/serotype_33A.gb new file mode 100644 index 0000000..3ae9a89 --- /dev/null +++ b/public/res/serotype_genbank/serotype_33A.gb @@ -0,0 +1,820 @@ +LOCUS CR931698 18409 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain Biehl (serotype 33a). +ACCESSION CR931698 +VERSION CR931698.1 +KEYWORDS . 
+SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 18409) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 18409) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..18409 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="Biehl" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC33A_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC33A_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI34164.1" + /db_xref="UniProtKB/TrEMBL:Q4JZI8" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVELL" + gene 293..461 + /gene="aliB" + /locus_tag="SPC33A_0002" + /pseudo + CDS 293..461 + /gene="aliB" + /locus_tag="SPC33A_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(462..984) + /gene="tnp" + /locus_tag="SPC33A_0003" + /pseudo + CDS complement(join(462..779,781..984)) + /gene="tnp" + /locus_tag="SPC33A_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase (fragment)" + gene 1205..2650 + /gene="wzg" + /locus_tag="SPC33A_0004" + CDS 1205..2650 + /gene="wzg" + /locus_tag="SPC33A_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI34167.1" + /db_xref="GOA:O86885" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:O86885" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLLFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGIDVYNDQ + EFTAHTNGKYYPAGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1205..1321 + /gene="wzg" + /locus_tag="SPC33A_0004" + /note="Signal peptide predicted for 
SPC1530 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 39 and 40" + misc_feature 1409..1756 + /gene="wzg" + /locus_tag="SPC33A_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 1.3e-62" + misc_feature 1934..2377 + /gene="wzg" + /locus_tag="SPC33A_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 2.5e-69" + gene 2652..3383 + /gene="wzh" + /locus_tag="SPC33A_0005" + CDS 2652..3383 + /gene="wzh" + /locus_tag="SPC33A_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34168.1" + /db_xref="GOA:O86886" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:O86886" + /translation="MIDIHSHIVFDVDDGPKSREESKALLTESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDRGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEQDLVHIIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 2655..3263 + /gene="wzh" + /locus_tag="SPC33A_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 4.6e-36" + gene 3389..4084 + /gene="wzd" + /locus_tag="SPC33A_0006" + CDS 3389..4084 + /gene="wzd" + /locus_tag="SPC33A_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34169.1" + /db_xref="GOA:O86887" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:O86887" + /translation="MMKEQNTIEIDVFQLFKTLWKRKLMILIVALVTGAGAFAYSTFI + VKPEYTSTTRIYVVNRNQGDKPGLTNQDLQAGSYLVKDYREIILSQDALEKVATNLKL + DMPAKTLASKVQVTVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIELLDTRVKRPEDVEDVLKI + PLLGLVPDFDKIK" + misc_feature 3389..3505 + /gene="wzd" + /locus_tag="SPC33A_0006" + 
/note="Signal peptide predicted for SPC1532 by SignalP 2.0 + HMM (Signal peptide probability 0.625) with cleavage site + probability 0.411 between residues 39 and 40" + misc_feature 3410..3826 + /gene="wzd" + /locus_tag="SPC33A_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 3.1e-55" + misc_feature 3932..4009 + /gene="wzd" + /locus_tag="SPC33A_0006" + /note="PS00217 Sugar transport proteins signature 2." + gene 4094..4783 + /gene="wze" + /locus_tag="SPC33A_0007" + CDS 4094..4783 + /gene="wze" + /locus_tag="SPC33A_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34170.1" + /db_xref="GOA:Q4JZQ3" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4JZQ3" + /translation="MSTLEISQAKLDSVKKAEEYYNALCTNLQLSGDGLKVFSITSVK + IGEGKSTTSANIAWAFARAGYKTLLIDGDIRNSVMLGVFKARNKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFTTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRNCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGIVLNKFDTSVDKYGSY + GNYGDYGKNKK" + gene 4798..6165 + /gene="wchA" + /locus_tag="SPC33A_0008" + CDS 4798..6165 + /gene="wchA" + /locus_tag="SPC33A_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI34171.1" + /db_xref="GOA:O86888" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:O86888" + /translation="MNGKIVKPSLAIIQSFLVILLTYLLSAVREAEIVSTTAIALYIL + HYFVFYISVYGQDFFKRGYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYF + LTLHALLVYVLNLFIKWYWKRTYPNFKGSKKILLLTATFRVEKVLDRLIESNEVVGEL + VAVSVLDKPDFQHDCLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + IDVTVNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHVIAKRIIDIMGALVGLIL + CGLVSIVLVPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + 
QKRRLSFKPGVTGLWQVSGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVLM + KDGAK" + misc_feature 4798..4890 + /gene="wchA" + /locus_tag="SPC33A_0008" + /note="Signal peptide predicted for SPC1534 by SignalP 2.0 + HMM (Signal peptide probability 0.845) with cleavage site + probability 0.335 between residues 31 and 32" + misc_feature 5581..6162 + /gene="wchA" + /locus_tag="SPC33A_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 2.7e-157" + gene 6152..6958 + /gene="wciB" + /locus_tag="SPC33A_0009" + CDS 6152..6958 + /gene="wciB" + /locus_tag="SPC33A_0009" + /note="member of homology group 16" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34172.1" + /db_xref="GOA:O86889" + /db_xref="UniProtKB/TrEMBL:O86889" + /translation="MERSRLIDVKIIVATHKEVKMPQDNSLYLPIHVGRDGKSDIGFI + GDNTGDNISSLNPYYCELTGLYWAWKNLDYNYLGLVHYRRYFTNKSQGYNENVNMDDL + ILSRANVEILLEKSDIIVPKKRKYYIETLYSHYAHTLNGEHLDLARKIIEQNSSEYLS + SFDKVMKQRSGYMFNMFIMKKELLDDYLPWLFSILDTMYEQMDLTDYTLFESRLFGRV + SELLFNVWLCQKGITPKEVPFMYMERVDLFEKGKSFLMAKFFGKKYGQSF" + gene 6962..8002 + /gene="wciC" + /locus_tag="SPC33A_0010" + CDS 6962..8002 + /gene="wciC" + /locus_tag="SPC33A_0010" + /note="member of homology group 125" + /codon_start=1 + /transl_table=11 + /product="putative galactosyl transferase" + /protein_id="CAI34173.1" + /db_xref="GOA:O86890" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:O86890" + /translation="MKVTIIGQIKNKRTGLGKAINDFRDYCCNRATRVTEIDITNNFN + FLSSLFQILISDTDVYYFTPAGSVAGNIRDSLFLFFMIMKRKKIVTHFHNSAFGNVMR + QHPTLMIINRILYSKVDLIILLGEKSKIMFQQLRILDEKFKIIRNGVDGYLFIEKNEL + NKKMSDLPINIIFFSNMIREKGYEILLEVAKKMVGDEKYHFYFSGKFQDNNLKTRFIN + EIYSMNNVTYLDGVYGSDKKKLLQKMHYFVLPSYYKDETLPISMLEAMANGLYIIVSD + VGVVSEVINKETASLIEMINEETADSIIEIINQTSNKLNELDFNVSKYKQELLNENIQ + ASIYQQLERIAN" + misc_feature 7421..7933 + /gene="wciC" + /locus_tag="SPC33A_0010" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 2e-14" + gene 8080..8997 + /gene="wciD" + 
/locus_tag="SPC33A_0011" + CDS 8080..8997 + /gene="wciD" + /locus_tag="SPC33A_0011" + /note="member of homology group 60" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34174.1" + /db_xref="GOA:O86891" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:O86891" + /translation="MPTILSAKNIERVELLIVNDGSTDRTEEIARQFEREYEGIVRVI + SKENCGHGSAVNAGIENAVGNYFKVVDADDWVNTNNLEDLIVFLSEVDVDQVLSPYDK + IFVNYRGDIEREEECNEFSQVENEVIYSAEEFYTRIKQTVGMHSITVKTSLLQENNIR + LSEKMFYVDMEYIVYMLPYVKKVVLFDKSIYRYRLGTETQSISMASYIKNRDMHKQVI + YHLVDFYNQMRSSAVLRRITWKLILNLIRQQWIIYFNLSKKEGKNSECFEFDNWLIKE + GRIKKIPLYFFKAVKYIRFKVKYFLGIRK" + gene 8999..9967 + /gene="wciE" + /locus_tag="SPC33A_0012" + CDS 8999..9967 + /gene="wciE" + /locus_tag="SPC33A_0012" + /note="member of homology group 44" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34175.1" + /db_xref="GOA:O86892" + /db_xref="InterPro:IPR008441" + /db_xref="UniProtKB/TrEMBL:O86892" + /translation="MRKIGKVINEYFVLRKSFTPAIARNKLFEKFWGRIGNYKIFNNI + ASNFYQYKHETIINFLEKDFSQFLKSYNFKEVSHKEIEQRKIFSMWIQGYESAPKLVQ + KTIDSQRKYAEKYGYKFVFLDENNIREYVTLPSEIVEKYENGTIDFIKYSDVVRGTLL + SKYGGVWLDSTIYVDSSRELNYLKKDFYTIRAKTHERVPKYIANGRWSAFCLSGEKQN + IVFDFLEKFHVAYFMKYDIVLDYFLIDYIIELGYRTNDLIRNYIDKVEENNQELFFLA + DNFSNQYDEKEWAGVLSTTALFKCSYKCPINEATGTYFDRLMKGEL" + misc_feature 9098..9949 + /gene="wciE" + /locus_tag="SPC33A_0012" + /note="HMMPfam hit to PF05704, Capsular polysaccharide + synthesis protein, score 1.1e-144" + gene 9987..10958 + /gene="wciF" + /locus_tag="SPC33A_0013" + CDS 9987..10958 + /gene="wciF" + /locus_tag="SPC33A_0013" + /note="member of homology group 25" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34176.1" + /db_xref="GOA:O86893" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:O86893" + /translation="MISVIVPVYNVADYLRFALDSLLEQTYKDFEVILVNDGSTDNSG + 
EICDEYGKLYDNIHVFHKKNGGLSDARNFGLEKSRGEFITFLDSDDYFEPYALELLIT + IQKKYDVDIVSTKGGITYSHDIYSKKLMAEDYLTVKILTNKEFLAAVYYNDEMTVSAW + GKLYKRDLFKTIFPKGKIYEDLYVVAERLLNIKTVAHTDLPIYHYYQRQGSIVNSTFS + DRQYDFFDAIDHNEAIIKKFYCGDKELLAALNAKRVIGSFILSNSAFYNSKNDITKII + RIIKPYYWEVIKNKKIPMKRKVQCVLFLLSPNYYYKIKDKMLQRGRI" + misc_feature 9993..10505 + /gene="wciF" + /locus_tag="SPC33A_0013" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 6.8e-50" + gene 10959..12182 + /gene="wzy" + /locus_tag="SPC33A_0014" + CDS 10959..12182 + /gene="wzy" + /locus_tag="SPC33A_0014" + /note="member of homology group 126" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI34177.1" + /db_xref="UniProtKB/TrEMBL:O86894" + /translation="MHVRLDGLLDYIFLFSVIITCNTMYSTSQGFDGLGKWATLLLVV + SVFLKLLISRISMKAINVIVSRSLIFILIILLIVILNGFKISETSFVYYFVLFPIFMM + ILQMYYDVNEIANLIRKFVRIIFLLAIGSLLFWLIGSVFHIISPTVYVLNYWNGGGIV + EGYYNLHFEAQKIEILGAILIRNTGIFAEAPMWSLVLSLALIFQTLHIKKWNFTTWTL + IITIMTTTSTTGVYIIGLIFLYVLFSKTSGVKRYVSSLFILAIICCFSILWDNKSGTG + SATIRFDDYKAGFLAWQKSPIWGLGISDGLRTIEQHMDRTVRYNLGYSNSFFVVLAQG + GIMLASYYFYPVIKIILNKFSSNDLKFSALLIIFLMITTIFIETYMFLFVISLYYSLD + FGDDRDCHEKQYITN" + misc_feature 11781..11978 + /gene="wzy" + /locus_tag="SPC33A_0014" + /note="HMMPfam hit to PF04932, O-Antigen Polymerase, score + 1e-11" + gene 12213..13628 + /gene="wzx" + /locus_tag="SPC33A_0015" + CDS 12213..13628 + /gene="wzx" + /locus_tag="SPC33A_0015" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI34178.1" + /db_xref="GOA:O86895" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:O86895" + /translation="MKILKNYAYNLSYQLLVIILPIITTPYVTRVFSSDDLGTYGYFS + SIVTYFTLLATLGVANYGTKEISAHRKEIGKNFWGIYSLQFGATWLSILLYLALCFLF + TSMQNPVAYILGLSLVSKGLDISWLFQGLEDFRKITVRNITVKLVGAISIFLFVKSAN + DLYLYVFLLTIFELLGQLSMWLPARQFIGKSYFDWKYAKKHLKPVILLFLPQIAISLY + VTLDRTMLGVLASTKDVGIYDQALKLVNILLTLVTSLGSVMLPRVSSLLSSGDYKAVN + 
KMHEMSFLIYNLVIFPIIAGMLIVNDDFVRFFLGQNFQDARYAIAIMTFRMFFIGWTN + IMGIQILIPHNKNKEFMVSTTVPAILSVGLNLLLLPQFGYIGAAIVSVLTEAFVWGIQ + LFYTRFYLKEVPIIGSMTKTALASAVMYGLLLGSKTSIHFSPTINVLIFSVLGGIIYL + FAILSLKVVDVKELKQIIRKN" + misc_feature 12219..13013 + /gene="wzx" + /locus_tag="SPC33A_0015" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 4.4e-79" + gene 13630..14628 + /gene="wciG" + /locus_tag="SPC33A_0016" + CDS 13630..14628 + /gene="wciG" + /locus_tag="SPC33A_0016" + /note="member of homology group 21" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI34179.1" + /db_xref="GOA:O86896" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:O86896" + /translation="MSKFRNINLDLLKVLACVGVVLLHTTMGGFKETGAWNFLTYLYY + LGTYSIPLFFMVNGYLLLGKREITYSYILQKIKWLLITVSSWTFIVWLFKRDFTENLI + KKIIGSLIQKGYFFQFWFFGALILIYLCLPILRQFLNSKRSYLYSLSLLMTIGLIFEL + SNILLQMPIQTYVIQTFRLWTWFFYYLLGGYIAQFTIEEIESRFKNWMKIVSILLLLI + SPIILFFIAKTIYHNLFAEYFYDTLFVKVSTLGIFLTILMLTLNENRRESIVSLSNQT + MGVFIIHTYIMKVWEKVLGFNFVGAYLLFALFTLSVSFIIVGMLMKIPYFNRIVKL" + gene 14642..15751 + /gene="glf" + /locus_tag="SPC33A_0017" + CDS 14642..15751 + /gene="glf" + /locus_tag="SPC33A_0017" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI34180.1" + /db_xref="GOA:O86897" + /db_xref="HSSP:1I8T" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR006076" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:O86897" + /translation="MYDYLIVGAGLSGAIFAYEATKRGKKVKVIDKRNHIGGNIYCEN + VEGVNVHKYGAHIFHTSNKKVWDYVNQFAEFNNYVNSPVANYKGSLYNLPFNMNTFYA + MWGTKTPQEVKDKITEQTADMKDVEPKNLEEQAIKLIGPDVYEKLIKGYTEKQWGRSA + TELPPFIIKRLPVRLTFDNNYFNDRYQGIPIGGYNVIIENMLKDVEVELGVDFFAHRE + ELEASAEKVVFTGMIDQYFGYKHGELEYRSLRFDHEILDEENYQGNAVVNYTEREIPY + TRIIEHKHFEYGTQAKTVITREYPADWKRGDEPYYPINDEKNNAMFAKYQEEASKNDK + VIFCGRLADYKYYDMHVVIERALEVVEKEFGYDKK" + 
misc_feature 15077..15679 + /gene="glf" + /locus_tag="SPC33A_0017" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 2.3e-137" + gene 15732..16838 + /gene="wcjE" + /locus_tag="SPC33A_0018" + CDS 15732..16838 + /gene="wcjE" + /locus_tag="SPC33A_0018" + /note="member of homology group 18" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI34181.1" + /db_xref="GOA:Q4JZP2" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q4JZP2" + /translation="MDMTKSRINWIDFGKGFSIFLVLAGHVLLGLYQSEKFPTANNIL + SLLIAQVYIFHIPVFFALSGYFFKPVSDLKEFWQYAKKKTIVFGLPYIFYSIIHFGLQ + KVAGATVRVPTTIFDLINIYKNPIGVSWYLYILWSILIMYGLVSILIKNRRILFLISV + FAYCLTLFVQTDIYIIQRTLVWGICFFLGSVLNEIHFNKISLKKFLVFFVIFDFIYML + VWFLFYEVESKRDSVSYSNPGVWGIAFIVCILVAFVIFPKISEKFPKTFLYFTKYGKD + SLGIYILHAPICSMIRILMLKVGINSVFLHVVVGIVLGWYLSILATYILKKIPFLNIV + LLPQKYIKLKWLFVNCSGLKSAKLEKGQNSSFLF" + gene complement(16798..18090) + /gene="tnp" + /locus_tag="SPC33A_0019" + CDS complement(16798..18090) + /gene="tnp" + /locus_tag="SPC33A_0019" + /note="member of homology group 13" + /codon_start=1 + /transl_table=11 + /product="putative IS1167 transposase" + /protein_id="CAI34182.1" + /db_xref="GOA:Q4JZP1" + /db_xref="InterPro:IPR002560" + /db_xref="InterPro:IPR012287" + /db_xref="UniProtKB/TrEMBL:Q4JZP1" + /translation="MKSDKTIIRKIHMEQLHFITKLLDIKDPNIKILDIINMDTHKEI + IAKLDYEAPSCPDCGSLMKKYDFQKPSKIPYLETTGMPSRILLRKRRFKCYHCSKMMV + AETPLVKKNHQIPRIINQKIAQKLIEKISMTDIAHQLAISTSTVIRKLNDFHFEHDFS + RLPKIMSWDEYAFTKGKMSFIAQDFDNLNIITVLEGRTQAVIRNHFLRYDRAVRCQVK + IITMDMFSPYYDLAKQLFPCAKIVLDRFHIIQHLSRAMSRFRVQIMNQFERKSHEYKA + IKRYWKLIQQDSRKLSDKRFYRPTFRMHLTNKEILDKILSYSEDLKHHYQIYQLLLFH + FQNKDPEKFFGLIEDNLKQVHPIFQTVFKTFLKNKEKIVNALQLPYSNAKLEATNNLI + KLIKRNAFGFRNFENFKKRIFIALNIKKERTNFVLSRA" + misc_feature complement(17302..17598) + /gene="tnp" + /locus_tag="SPC33A_0019" + /note="HMMPfam hit to PF01610, Transposase, score 5e-48" + misc_feature complement(17638..17703) + /gene="tnp" + 
/locus_tag="SPC33A_0019" + /note="Predicted helix-turn-helix motif with score + 1691.000, SD 4.95 at aa 130-151, sequence + ISMTDIAHQLAISTSTVIRKLN" + gene 18362..>18409 + /gene="aliA" + /locus_tag="SPC33A_0020" + CDS 18362..>18409 + /gene="aliA" + /locus_tag="SPC33A_0020" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34183.1" + /db_xref="UniProtKB/TrEMBL:Q4K2C2" + /translation="MMKSSRLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcgta taaaaacaag + 181 ggaggactgt ataaaaggca gaaatccttt gttttttata accaaggttt ataaaccttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga agacgaacat + 301 aaagaagcgt atccttagtg caggcctgac ttttacatct gctttgcttt tagctgcttg + 361 cgaccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaactat ctattagact attacgctga taatatagtt aattgaaaca agaacaagac + 481 aaaagagcct cataaaaggt attgcaactt ggtaatacct ttttgaggtg ctttttgata + 541 tgagcccatg ttttctcaat aggattgtac tcaggtgagt agggaggaag aggtaaaagt + 601 ttatgcccaa actcttcgca taaaagttct agcttcccca ttctatggaa tcttgcatta + 661 tccataataa taaccgatgg tgtggttaat gttggtaaga gaaatttctg aaaccaagct + 721 tcaaaaaagt cgctcgtcat cgtctcttcg taagtcattg gagcgattaa ctcaccattc + 781 atttgttaga cctgcaatca aagaaatcct ctgatatctt cttccagata ctttgcctct + 841 tcttaactga ccttttaatg agcgaccata ttctcgatga aaataagtat cgaatcctgt + 901 ttcatcaatc taaacaggtg ctaggtgctt taaactatta aaattcttaa gaaataaggc + 961 tactttttct gggtcttgtt cataattaga ttgaaactag agtagtacac ctctgcttct + 1021 aaaaaatttt tagaaatcga tttaactgtc ctgatcgatt tgtcatgttc ttatttcatt + 1081 ttactatatt tttgtttcgc gggaagtcta ctaagatact taaagatgca gatagtaaaa + 1141 aaatgtagac attaccgtaa aaaagtgata taatcgtatg atgttcaatg tataggtgtt + 1201 aatcatgagt agacgtttta aaaaatcacg ttcacagaaa gtgaagcgaa gtgttaatat + 1261 agttttgctg actatttatt tattgttagt ttgtttttta ttgttcttaa 
tctttaagta + 1321 caatatcctt gcttttagat atcttaatct agtggtaact gcgttagtcc tactagttgc + 1381 cttggtaggg ctactcttga ttatctataa aaaagctgaa aaatttacta tttttctgtt + 1441 gctgttctct atccttgtca gctctgtgtc gctctttgca gtacagcagt ttgttggact + 1501 gaccaatcgt ttaaatgcga cttctaatta ctcagaatat tcaatcagtg tcgctgtttt + 1561 agcagatagt gagatcgaaa atgttacgca actgacgagt gtgacagcac cgactgggac + 1621 tgataatgaa aatattcaaa aactactagc tgatatcaag tcaagtcaga ataccgattt + 1681 gacggtcaac cagagttcgt cttacttggc agcttacaag agtttgattg caggggagac + 1741 taaggccatt gtcctaaata gtgtctttga aaatatcatc gagtcagagt atccagacta + 1801 cgcatcgaag ataaaaaaga tttataccaa gggattcact aaaaaagtag aagctcctaa + 1861 gacgtctaag aatcagtctt tcaatatcta tgttagtgga attgacacct atggccctat + 1921 tagttcagtg tcgcgatcag atgtcaatat cctgatgact gtcaatcgag ataccaagaa + 1981 aatcctcttg accacaacgc cacgtgatgc ctatgtacca atcgcagatg gtggaaataa + 2041 tcaaaaagat aaattaaccc atgcgggcat ttatggagtt gattcgtcca ttcacacctt + 2101 agaaaatctc tatggagtgg atatcaatta ctatgtgcga ttgaacttca cttcgttttt + 2161 gaaattgatt gatttgttgg gtggaattga tgtttataat gatcaagaat ttactgccca + 2221 tacgaatgga aagtattacc ctgcaggcaa tgttcatctt gattcagaac aggctctcgg + 2281 ttttgttcgt gagcgctact cactagcaga tggcgatcgt gaccgcgggc gcaatcaaca + 2341 aaaggtgatt gtggctatcc ttcaaaaatt aacgtcaacc gaagcactga aaaattatag + 2401 cacgatcatt aatagcttgc aagattctat ccaaacaaat atgccacttg agactatgat + 2461 aaatttggtc aatgctcagt tagaaagtgg agggaattat aaagtaaatt ctcaagattt + 2521 aaaaggtaca ggtcggacgg atcttccttc ttatgcaatg ccagacagta acctctatgt + 2581 gatggaaata gatgatagta gtttagctgt agttaaagca gctatacagg atgtgatgga + 2641 gggtagatga aatgatagac atccattcgc atatcgtttt tgatgtagat gacggtccca + 2701 agtcaagaga ggaaagcaag gctctcttga cagaatccta caggcagggg gtgagaacca + 2761 ttgtctctac ctctcaccgt cgcaagggca tgtttgaaac tccggaagag aagatagcag + 2821 aaaactttct tcaggttcgg gaaatagcta aggaagtggc gagtgacttg gtcattgctt + 2881 atggggctga aatttactac acaccagatg ttctggataa gctggaaaaa aagcggattc + 2941 cgaccctcaa 
tgatagtcgt tatgccttga tagagttcag tatgaacact ccttatcgcg + 3001 atattcatag cgccttgagc aagatcttga tgttgggaat tactccagtc attgcccaca + 3061 ttgagcgcta tgatgctctt gaaaataatg aaaaacgcgt tcgagaactg attgataggg + 3121 gctgttacac gcaagtaaat agttcacatg tcctcaaacc caaacttttt ggcgaacgtt + 3181 ataaattcat gaaaaaaaga gctcagtatt ttttagagca ggatttggtt catatcattg + 3241 caagtgatat gcacaatcta gacggtagac ctcctcatat ggcagaagca tatgaccttg + 3301 ttacccaaaa atacggagaa gcgaaggctc aggaactttt tatagacaat cctcgaaaaa + 3361 ttgtaatgga tcaactaatt taggagaaat gatgaaagaa caaaacacga tagaaatcga + 3421 tgtatttcaa ttatttaaaa ccttgtggaa acgcaagcta atgattttaa tagtggcact + 3481 tgtgacaggt gcgggggctt ttgcatatag cacttttatt gttaagccag aatatacgag + 3541 taccacgcga atttacgtag tgaatcgcaa tcaaggagac aagccggggc tgacaaatca + 3601 ggatttgcag gcaggatctt atctggtaaa agactaccgt gagattatcc tttcgcagga + 3661 tgcattggaa aaagtagcga caaatttgaa gttggatatg ccagcaaaaa cgttagccag + 3721 caaagttcaa gtgactgtac cagctgacac tcgtatcgtc tcaatctctg tcaaggataa + 3781 acagccagag gaagccagtc gtatcgctaa ttctctacga gaagttgctg cagaaaagat + 3841 cgtcgctgta acgcgagtat ctgatgtaac gacacttgaa gaagcgcgac cagctacgac + 3901 tccctcttct ccaaatgttc gacgcaattc cttgtttggt tttcttggag gagcagtcgt + 3961 aacagtaatt gctgttcttt tgattgagtt gctggacacc cgtgtgaaac gtcctgaaga + 4021 tgttgaagat gtactgaaaa ttccactttt agggctcgtt ccagattttg acaaaataaa + 4081 ataggaggaa gttatgtcaa cattagaaat ctcacaggca aaattggatt ctgtaaaaaa + 4141 ggcagaggaa tattataacg ctttgtgcac gaacctacag ttaagtggag atggtttgaa + 4201 agtattttct atcacttctg tgaaaatagg agaaggaaaa tcaacgactt ccgccaatat + 4261 cgcttgggct tttgcgcgtg caggttacaa aacgctgctg attgatggag atattcgcaa + 4321 ttctgttatg ttaggtgtct ttaaagcaag gaataagatt acaggcctga cagaattttt + 4381 atcaggaact acagacttat cacaagggct ttgtgatacc aatatcgaaa atctctttgt + 4441 aattcaggct ggctctgtgt caccgaatcc gacagctctt cttcaaagta agaatttcac + 4501 tacaatgctt gaaaccttgc gtaaatattt tgactacatc attgtagata ctgctcctgt + 4561 tggtgtcgtg attgatgcgg ctattattac 
gcgaaactgc gatgcttcta ttttagtgac + 4621 ggaggcaggt gaaataaatc gtcgggatat tcaaaaagca aaagaacagt tggaacacac + 4681 aggaaagccg tttttgggaa ttgtgttgaa taaattcgat acttcagtag acaaatacgg + 4741 ttcttatgga aattatggag attacgggaa aaataaaaaa taggtcgggg gatagagatg + 4801 aatggaaaaa tagtaaagcc ttcattggcc ataatccaga gttttcttgt tattttattg + 4861 acttatctac ttagtgctgt gagagaagcg gagattgttt caacaacagc tattgcactt + 4921 tatatcctcc attattttgt cttttatatc agtgtttatg ggcaggattt ctttaaaagg + 4981 ggatatttga ttgaacttgt ccagacattg aaatatatcc tattctttgc actagcgatt + 5041 agtatttcta attttttctt agaggatcga tttagtattt ccagacgagg catgatttac + 5101 ttcctcacat tacatgctct cttagtctat gtgctaaacc tatttatcaa gtggtattgg + 5161 aagcggactt atcccaactt taaaggaagt aagaagatcc tcttgcttac agcaactttt + 5221 cgtgtcgaaa aggtactgga tagattaata gaatcaaatg aggttgttgg ggagttggta + 5281 gccgtcagtg tcttagataa accagatttt cagcatgatt gtttaaaggt agtagcagag + 5341 ggggagatag taaactttgc gactcatgag gtggtcgatg aagtctttat caatcttccg + 5401 agtgaaaaat acaatattgg agagcttgtc tctcagtttg aaacgatggg aattgatgta + 5461 acagttaatc taaatgcttt tgatcgtagt ttggcacgta acaagcaaat tcgtgagatg + 5521 gcaggattaa acgttgtgac tttttctaca acattttata agactagtca tgtaattgct + 5581 aagcggatta ttgatatcat gggtgcattg gtcgggttga tattatgtgg tttagtcagt + 5641 attgtactgg ttcctttgat tcgaaaggat gggggctctg ctatttttgc tcagacgcgt + 5701 ataggaaaaa atggtcgtca gttcaccttt tataagtttc gctctatgtg tgtagatgcc + 5761 gaggcgaaaa aaagagaact catggaacaa aataccatgc agggtggaat gtttaaggtg + 5821 gacgatgatc ctcgtatcac gaaaattggt cgttttatac ggaagactag cttggacgag + 5881 ctaccacagt tttataatgt tctaaaggga gatatgagtt tggttggcac acggccacca + 5941 acagtggatg agtatgaaca ctatacccca gaacaaaaac gtcggctaag ttttaaacct + 6001 ggtgtaacag gcttatggca ggtcagtgga cgaagtgaaa tcaaaaattt cgatgaagtt + 6061 gtcaaattag atgtggctta tatagatgat tggacaatct ggaaagatat tgaaatttta + 6121 ttgaagacag ttaaggtagt attgatgaag gatggagcga agtagattga tagatgtaaa + 6181 aatcattgtg gcaacgcata aagaggttaa aatgcctcaa gacaatagtc 
tttaccttcc + 6241 aatacatgtt gggagagacg gtaaatcaga tattggtttt atcggtgata atactggcga + 6301 taatatatcc tctctaaatc catattattg tgagttaacg ggactttatt gggcatggaa + 6361 gaatcttgat tataattact taggtttagt tcattaccgt cgttatttta caaataaatc + 6421 tcaagggtat aatgaaaatg tcaatatgga tgacctcatt ttgtctcgag ctaatgttga + 6481 aatattatta gagaaatctg acataatagt tccaaagaag cgaaagtatt atattgaaac + 6541 tctttattca cattatgccc atacccttaa cggagaacat ctggatcttg ctaggaaaat + 6601 tattgagcaa aatagttcag agtatctttc atcctttgat aaagtgatga aacaaagaag + 6661 cggttatatg ttcaatatgt ttatcatgaa aaaagaacta ttagatgatt atttaccgtg + 6721 gcttttttct attctggata ctatgtacga acagatggac ttgactgact atactttatt + 6781 tgagtcacgt ttattcgggc gagttagtga gttgttgttt aatgtttggt tatgtcaaaa + 6841 aggaataacg cctaaagagg taccatttat gtacatggag agagtggatt tgtttgaaaa + 6901 aggaaaatct tttttaatgg ctaaattttt tggaaagaag tatggacaga gtttctagga + 6961 tatgaaagta actattattg gacaaataaa aaataagaga acaggtcttg gaaaggcgat + 7021 taatgatttt agggattatt gttgcaatcg tgctacaaga gtaacggaaa tagatataac + 7081 aaataatttt aattttttaa gctctctttt tcaaatttta atatctgata cagatgttta + 7141 ttattttact ccagctggtt cagtagctgg taatattagg gattcactgt ttttgttctt + 7201 tatgataatg aaaaggaaaa aaatagtgac ccattttcat aatagtgctt ttggaaatgt + 7261 gatgagacaa catccgactc taatgataat aaatagaata ttgtattcta aagttgattt + 7321 gattatatta ttgggagaga aatcgaaaat aatgtttcaa caactaagaa ttttagacga + 7381 aaaatttaaa ataattagga atggtgtgga tggatattta tttattgaaa aaaatgaatt + 7441 aaataaaaaa atgagcgatc tacccataaa tattattttt tttagtaata tgattagaga + 7501 aaaaggttac gaaattttat tagaagttgc taagaagatg gtgggggatg agaaatatca + 7561 cttttatttt tctggaaaat ttcaggataa taatttaaag actaggttta ttaatgaaat + 7621 ttatagtatg aataatgtaa catatttaga tggtgtatat ggtagtgata agaaaaagtt + 7681 attgcaaaaa atgcattact ttgttttacc atcgtattat aaagatgaaa ctttacctat + 7741 cagtatgtta gaagcaatgg caaatggtct ctatattatt gtaagcgatg tgggagttgt + 7801 gtcagaggtg attaataaag aaactgctag tcttattgaa atgataaacg aagaaacagc + 7861 agacagtatc 
atagaaatta ttaatcagac ttcaaataaa cttaatgagt tagattttaa + 7921 tgtatcaaaa tataagcaag agttgttaaa tgaaaatata caagcatcaa tttatcagca + 7981 attagagagg atagcaaatt gacgaagaaa aaaaatactg gaaaaatatt aacagtagtt + 8041 gtaccatcat ataatgcaga aaattattta caagagacga tgccgacgat actttctgct + 8101 aagaatatag agagggtaga attactgatt gtaaacgatg gttctacaga cagaaccgaa + 8161 gaaatagcaa gacaattcga gagagaatat gagggaattg ttagagttat aagtaaggaa + 8221 aactgtggtc acggttcggc agtaaatgcg gggattgaga atgctgttgg taattacttt + 8281 aaagtggtag atgcagatga ttgggtgaac accaataatt tagaagattt gatagtgttt + 8341 ctatctgagg tggatgtgga tcaagtttta tcaccatatg ataaaatttt tgtgaattat + 8401 cgaggtgata tagagcgtga agaagagtgc aacgagtttt cgcaagttga gaacgaggtg + 8461 atctattctg cagaagaatt ctatacacga attaaacaaa cggtaggaat gcattccatt + 8521 actgtgaaaa cgagtctttt gcaagagaac aatattcggc tgtctgaaaa aatgttctat + 8581 gtagatatgg aatatattgt ttatatgctt ccatatgtaa aaaaggttgt tttatttgat + 8641 aaaagtatct atagatatcg tctaggaaca gagacacaaa gcattagtat ggcgagttat + 8701 attaaaaatc gtgatatgca taaacaagtg atctatcatt tggttgattt ttataatcaa + 8761 atgagatcta gcgctgtttt aaggagaata acatggaaat tgattttaaa tttaataaga + 8821 cagcaatgga taatttattt taatttatct aaaaaagagg ggaaaaacag cgagtgtttt + 8881 gaatttgata attggctaat aaaagaagga cggataaaaa aaataccact atactttttt + 8941 aaagctgtga aatatatcag atttaaggtg aaatattttc tggggataag aaaataatat + 9001 gagaaaaata ggaaaagtaa taaacgagta ttttgtatta agaaaatcat ttactcctgc + 9061 tattgctcgg aataaattat ttgaaaagtt ttggggacgg atagggaatt ataaaatttt + 9121 caataatata gctagtaatt tttatcaata caaacatgaa acaatcataa attttttgga + 9181 aaaagatttt agccaatttt taaaatccta taactttaaa gaggtatcgc acaaggagat + 9241 agaacaaaga aaaatcttct ctatgtggat acaaggatac gaaagtgctc ctaagttggt + 9301 tcagaagacg attgatagcc aaaggaaata tgcagaaaaa tacggatata aatttgtttt + 9361 tttggatgaa aacaatatcc gtgaatatgt gacacttcca tcagagatag tagaaaaata + 9421 tgagaatgga actatagatt ttataaaata ttcggatgtt gtaaggggaa cattgctttc + 9481 aaaatatgga ggagtgtggt tagattcgac 
tatttatgtt gattcttcac gagaactgaa + 9541 ttatttaaaa aaagattttt atactattcg agcaaagaca catgagagag tgcccaaata + 9601 tatcgcaaat ggtaggtggt ctgcattttg tttgtcaggg gaaaagcaaa acatagtatt + 9661 tgatttttta gagaaatttc atgtagcata ttttatgaaa tacgatatag tgctagatta + 9721 ttttttaatt gactatatta tagaattagg ttataggaca aatgacttga ttagaaacta + 9781 tattgataaa gtcgaagaaa ataatcagga gttgttcttt ttggcagaca atttttctaa + 9841 ccagtatgat gaaaaagagt gggcaggagt tttatcaaca actgcattgt ttaagtgtag + 9901 ttataagtgt ccgataaatg aagcgacagg aacctatttt gatagattga tgaagggtga + 9961 actgtagcat aaagagaggg aatggtatga tttcagttat tgttccagta tacaatgtcg + 10021 cggattatct gcgctttgcg ttggatagtc ttttggaaca gacgtataaa gattttgagg + 10081 ttattctagt aaatgatgga tccactgata attctgggga aatatgtgat gaatatggga + 10141 aactgtatga taatattcat gttttccata agaagaatgg cggactttcg gatgctagaa + 10201 attttggttt ggagaagagt cgaggagagt ttataacttt tcttgattca gatgattatt + 10261 ttgaaccgta tgcattagaa ttgttaatta ctattcaaaa aaaatatgat gtagatatcg + 10321 tatcaactaa agggggaata acctattctc atgatattta tagcaaaaaa ctgatggctg + 10381 aggactacct aactgtaaaa atattgacaa ataaagaatt tttggcagct gtatattata + 10441 acgatgaaat gacggtatct gcttggggaa aattgtataa aagagattta tttaaaacga + 10501 tttttccaaa aggaaagatc tacgaggatt tgtatgttgt tgcagagcgt ttgttgaata + 10561 ttaaaacagt tgctcatacc gatttgccta tatatcatta ttatcagaga cagggaagta + 10621 ttgttaattc aacattttcg gatagacagt atgatttttt tgatgcgatt gatcataatg + 10681 aagccataat aaaaaaattc tattgtggag ataaggaatt gttagcagcc ttaaatgcta + 10741 aaagagtaat tggctccttt attttgagta atagcgcatt ttataatagt aaaaacgata + 10801 ttactaaaat aataagaata attaaaccgt attattggga agtaataaaa aataaaaaaa + 10861 ttccaatgaa aaggaaagtt caatgtgttt tgtttctgct ttccccaaat tactactata + 10921 aaataaaaga taagatgtta cagagaggca ggatatagat gcatgttaga ttagatggtt + 10981 tgctggacta tatatttcta tttagtgtga ttattacttg taatactatg tattcaacta + 11041 gtcaaggatt tgatggacta gggaaatggg cgactctgtt acttgtggta tcagtttttc + 11101 tgaaattgct tatctctaga atatctatga 
aggcaatcaa tgtgattgtg tcgcgttctt + 11161 taatatttat attaattatt ctactcatag taatattaaa tggttttaag atttctgaga + 11221 caagtttcgt ctattatttt gtattatttc cgatttttat gatgattttg cagatgtact + 11281 atgatgttaa tgaaatcgca aatctgatac ggaaatttgt tcgtataata tttcttttag + 11341 caattggctc tctcctattt tggcttattg gtagtgtatt tcatattata tccccaacgg + 11401 tttatgtgtt gaattattgg aatggtgggg gaatagtaga agggtactat aatcttcatt + 11461 ttgaagcaca aaaaatagag attttggggg cgatactgat aagaaatacg gggatttttg + 11521 ctgaagcacc tatgtggagt ttggtattga gccttgcatt gatatttcaa acgcttcata + 11581 taaaaaaatg gaatttcaca acttggactc ttattattac aattatgaca actacgtcaa + 11641 caacaggggt ttatataata ggtttgattt tcctatatgt tttattttca aaaacaagtg + 11701 gtgtgaagag atatgtttct agtttattta ttttagcgat tatatgttgt ttttcaatat + 11761 tatgggataa taaatctgga actggttcag caactatacg ctttgatgat tataaggctg + 11821 gttttttggc atggcagaaa agtcctattt ggggattagg tatttcagac ggtcttagaa + 11881 ccattgaaca acatatggat agaactgtta gatataatct tgggtatagc aatagctttt + 11941 ttgttgtttt agctcaagga gggataatgt tggcttcgta ttacttttat ccagtaatta + 12001 aaattatttt gaataaattt agttcgaatg atttgaagtt ttctgcgcta ttaataattt + 12061 tccttatgat aactactata tttatagaga cctatatgtt tttatttgtc atttctttat + 12121 actattctct tgattttggg gacgatagag attgtcatga gaaacagtac attactaatt + 12181 aataataaag gtgtgaacag aaataagaag aaatgaaaat actaaaaaac tatgcctaca + 12241 atctttctta tcaattgttg gtgatcatac tccctatcat tacgactccc tatgtaacga + 12301 gggtttttag ttctgacgat ttaggaacgt atggctactt tagctccatt gttacctatt + 12361 ttaccttgct tgcaactctt ggtgttgcca actacggtac caaagagatt tcagcacatc + 12421 gtaaggaaat tgggaagaat ttctggggaa tttattctct ccagtttggt gcaacttggc + 12481 tatccatttt gctttatctt gccctttgtt tcttatttac ttcaatgcaa aatccggtag + 12541 cttatatatt gggattaagt ttagtgtcaa aaggtttgga tatttcttgg ttatttcaag + 12601 gtttggagga ttttagaaag attacagttc ggaacatcac tgttaagtta gttggtgcaa + 12661 tctctatttt cctatttgta aaatcagcta atgacttata cttatatgta tttcttctta + 12721 ccattttcga attgttaggg caattaagca 
tgtggttacc cgcaagacaa tttattggta + 12781 aatcatattt tgattggaaa tacgctaaga agcatttgaa accagttatc ttgttattct + 12841 tgccacagat tgccatctcg ctttatgtga ctttggaccg tacgatgctg ggggtgttgg + 12901 cttcgacaaa ggatgttgga atttatgatc aagctttgaa gcttgttaat attttactga + 12961 ctttggttac ctcactgggg agtgttatgt tgccacgagt atctagcctt ttatcgtctg + 13021 gggattacaa agccgttaat aagatgcacg agatgtcttt tttaatctat aacttggtga + 13081 ttttcccaat catagcagga atgttgattg tcaacgatga ttttgttcgt ttcttccttg + 13141 ggcaaaattt tcaagatgct cgctatgcga ttgctattat gaccttccgt atgttcttta + 13201 ttggttggac caatataatg ggaattcaaa tcttgattcc gcacaataaa aataaggaat + 13261 ttatggtttc aacgacagtt cccgctattc tgagtgtggg attgaatttg ttgcttcttc + 13321 cccaatttgg ttatataggt gctgcgattg tttcagtttt gactgaggcg tttgtatggg + 13381 ggattcagtt attctataca cgtttttatt taaaagaagt tcctattatc ggttcaatga + 13441 caaaaactgc acttgcatct gctgttatgt atggtctctt gctaggttca aaaacatcta + 13501 tacatttttc gccaaccata aatgttttaa tattttcggt gctaggcgga attatctatc + 13561 tttttgcaat tctatctctg aaagtggtag atgtgaaaga attaaaacaa ataatcagga + 13621 aaaattagaa tgagcaaatt tcgaaatatt aacttagatt tactaaaagt gcttgcatgt + 13681 gttggagtcg ttctacttca tacaactatg ggtgggttta aagagacagg tgcatggaat + 13741 tttttgacat atttatatta cttaggaacc tattctatcc ctctattttt tatggtcaat + 13801 ggttatttat tgttggggaa gagagaaatt acctattcct acatattgca aaaaataaaa + 13861 tggctcctaa taacagtgtc gtcatggact tttatcgttt ggctgtttaa aagagacttt + 13921 acagagaact taattaaaaa aattataggt tctttgatac aaaaggggta tttcttccag + 13981 ttttggtttt tcggtgcact catacttatc tatttatgtt tgccaatttt gagacaattt + 14041 ctaaattcaa aaagaagcta tttatacagt ttatctttat tgatgactat tggtttgatt + 14101 tttgagttat caaatatcct acttcaaatg ccaatacaaa catatgtaat acaaactttt + 14161 agattatgga cgtggttttt ttactatctt ttaggtggtt atatagcgca attcactata + 14221 gaagaaatcg aatcaaggtt taagaattgg atgaaaatag ttagcatact tttgttattg + 14281 atttcaccaa taatattatt tttcatagcg aagactatat accataatct atttgctgaa + 14341 tacttttatg atactttatt tgtaaaagtc 
agtactttag gaatttttct aactatcctc + 14401 atgcttactt tgaatgaaaa ccgaagagaa tcgattgttt ccctttctaa tcaaacaatg + 14461 ggggttttca taatacatac ttatattatg aaagtgtggg aaaaagtgct tggttttaat + 14521 tttgtaggag catatttact ttttgctcta tttactttaa gtgttagttt tattattgtt + 14581 gggatgttaa tgaagattcc ttacttcaat cgaatcgtca aattataaaa aggagaacaa + 14641 gatgtacgat tatcttattg tcggtgctgg tttgtcagga gcaatttttg cttatgaggc + 14701 gaccaagcgt ggaaaaaaag taaaagtgat tgataaacgt aaccacattg gtgggaatat + 14761 ctactgtgag aatgtagaag gagttaatgt tcataaatat ggtgcccata tctttcatac + 14821 ttctaataag aaagtttggg attatgttaa tcaatttgct gaatttaaca actacgtcaa + 14881 ctcgcctgta gctaattaca agggtagcct ctataatcta cctttcaata tgaatacctt + 14941 ctatgctatg tgggggacaa aaactcctca agaagtcaaa gataagatta ctgagcagac + 15001 agctgatatg aaggatgttg agccgaaaaa tctggaagaa caggctatca agttgattgg + 15061 tccagatgtc tatgaaaagt taatcaaggg ttatactgaa aagcagtggg gacgctcagc + 15121 aacggaactt cctccattta tcattaaacg tcttccagtt cgtttaacat ttgataataa + 15181 ctattttaac gaccgttacc aaggaattcc tattggtggt tacaatgtca tcatcgaaaa + 15241 tatgcttaaa gacgttgaag ttgagcttgg tgttgatttc tttgctcatc gtgaagagtt + 15301 agaagcatca gctgaaaaag ttgtctttac agggatgatc gaccagtatt ttggctacaa + 15361 gcacggagag ttagaatacc gtagccttcg ctttgatcat gaaattttgg acgaggaaaa + 15421 ttatcaagga aatgctgtag tgaactatac ggagcgtgag attccttata ctcgtattat + 15481 cgaacacaag cattttgaat atggaacaca ggcaaagaca gttatcacgc gtgaatatcc + 15541 agctgactgg aagcgtgggg acgagcctta ctatccgatc aacgatgaga aaaataatgc + 15601 tatgtttgct aagtaccaag aggaagcttc aaagaatgat aaggttattt tctgtggacg + 15661 tttagcagat tataaatatt acgatatgca tgtggtgatt gaacgggcgc ttgaggttgt + 15721 ggagaaagag tttggatatg acaaaaagta gaatcaattg gatagatttt ggaaaaggct + 15781 tttccatatt tttagtctta gcaggacatg tgttgcttgg actgtatcaa tcggaaaaat + 15841 ttcccacagc aaataacata ctatcgttgt tgatagcaca agtctacata tttcatatac + 15901 cagtattttt tgccttatca ggatactttt tcaaacctgt gtcggatttg aaggagttct + 15961 ggcaatatgc taaaaagaag acaattgttt 
ttggtctgcc atatattttc tattcgatca + 16021 ttcactttgg tcttcaaaaa gttgcagggg cgactgttag agtcccgacg actatatttg + 16081 atttaataaa tatctataaa aatcctattg gagtctcatg gtatttatac atactctggt + 16141 cgattttgat aatgtatgga ttagtatcta ttttaatcaa aaatcgtaga atattatttt + 16201 tgataagtgt ttttgcttat tgtttaaccc tatttgttca aacagatatt tatattattc + 16261 aaagaacgct agtttggggt atttgtttct ttcttggaag tgtattgaac gaaattcact + 16321 ttaataaaat tagtttgaaa aaatttcttg ttttctttgt gatatttgac tttatttata + 16381 tgcttgtatg gttcttattt tatgaagtag agtctaaaag ggatagtgta agctatagta + 16441 acccaggggt gtgggggatt gcttttattg tctgtatatt agttgcgttt gtaatcttcc + 16501 ctaaaatatc ggaaaaattt cctaaaactt tcctatattt cactaaatat ggtaaagata + 16561 gtttaggtat ctatatcctc catgcaccaa tttgtagcat gattcggatt ctaatgttga + 16621 aagtgggaat aaactcagtt tttcttcacg ttgttgttgg gattgtcttg ggttggtatt + 16681 tatccatact ggcaacttat atattgaaaa aaattccatt tttgaatatt gttttattac + 16741 cacaaaagta tattaaatta aaatggctct ttgtcaactg tagtgggttg aagtcagcta + 16801 agctcgagaa aggacaaaat tcgtcctttc ttttttgatg ttcagagcga taaaaatcct + 16861 ttttttgaag ttttcaaagt tccgaaatcc aaaggcgttt cgtttgataa gtttgatgag + 16921 attattggtc gcttccaatt ttgcgttgga ataaggtaat tgaagagcgt tgacgatttt + 16981 ttctttgttc tttagaaagg ttttaaagac agtctgaaaa ataggatgaa cctgcttcag + 17041 attgtcctca atgagtccga aaaatttctc agggtctttg ttctgaaagt gaaaaagtaa + 17101 gagttgatag atctgatagt ggtgtttcaa gtcttctgaa tagcttaaaa tcttgtcaag + 17161 aatttcttta tttgttaagt gcatgcgaaa agtagggcga taaaaacgtt tatcgctcaa + 17221 tttacgacta tcctgttgga taagtttcca gtaacgtttg atagccttgt attcatgaga + 17281 ttttcgttca aactgattca taatttgaac acgaaaacga ctcatggcac ggctgagatg + 17341 ttggataata tggaaacgat ctagaacgat tttagcacac ggaaaaagct gtttagccaa + 17401 gtcatagtaa ggactaaaca tatccatcgt aatgattttc acttgacaac gaacggctct + 17461 atcgtagcga agaaagtgat ttcggatgac agcttgtgtt ctgccttcaa gaacagtgat + 17521 aatattaaga ttatcaaaat cttgcgcaat gaaactcatc tttcccttag tgaaggcata + 17581 ctcatcccaa gacataatct ttggaagccg 
agaaaaatca tgctcaaagt gaaagtcatt + 17641 gagcttgcga atgacagttg aagttgaaat ggccagctga tgggcaatat cagtcataga + 17701 aattttttca attaactttt gagcaatttt ttggttgatg atacgaggga tttggtgatt + 17761 tttctttacc aggggagtct cagcaaccat catttttgaa cagtgatagc acttgaaacg + 17821 gcgttttcta aggagaattc tagaaggcat accagttgtt tcgaggtaag ggatcttaga + 17881 cggtttttga aagtcatatt tcttcattag acttccacaa tcagggcaag atggagcctc + 17941 ataatccagc ttagcgataa tttctttgtg ggtatccata ttgatgatat ctagaatctt + 18001 gatgtttggg tctttaatat cgagcagttt tgtgataaaa tgtaattgtt ccatatgaat + 18061 ctttctaatg atggttttgt cgcttttcat tataggtcat atgggacttt ttttctacaa + 18121 taaaataggc tccataatat ctatagtgga tttacccact atagatatta tagagccatt + 18181 aaaataaatt attttagatt tataatgtgg ctctttgtca actaacatct ggagaggaca + 18241 atcactgtct tctccttttt tgtcttttca gaatatacca aattaacaca aaaattctga + 18301 aaattctgtt gacaactttc tgaaaagagt ctataatgga gagaaagttt taaaggagaa + 18361 aatgatgaaa agttcaagac tacttgccct tgcgggcgtg acattattg +// + diff --git a/public/res/serotype_genbank/serotype_33B.gb b/public/res/serotype_genbank/serotype_33B.gb new file mode 100644 index 0000000..0c499c0 --- /dev/null +++ b/public/res/serotype_genbank/serotype_33B.gb @@ -0,0 +1,850 @@ +LOCUS CR931699 19039 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain E294 (serotype 33b). +ACCESSION CR931699 +VERSION CR931699.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 19039) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 
2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 19039) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..19039 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="E294" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC33B_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC33B_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI34184.1" + /db_xref="UniProtKB/TrEMBL:Q4JZI8" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVELL" + gene 293..461 + /gene="aliB" + /locus_tag="SPC33B_0002" + /pseudo + CDS 293..461 + /gene="aliB" + /locus_tag="SPC33B_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(order(462..992,994..1323)) + /gene="tnp" + /locus_tag="SPC33B_0003" + /pseudo + CDS complement(join(462..992,994..1323)) + /gene="tnp" + /locus_tag="SPC33B_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(join(933..992,994..1305)) + /gene="tnp" + /locus_tag="SPC33B_0003" + /note="HMMPfam hit to PF01710, Transposase, score 7.9e-23" + /pseudo + gene 1558..3003 + /gene="wzg" + /locus_tag="SPC33B_0004" + CDS 1558..3003 + /gene="wzg" + /locus_tag="SPC33B_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI34187.1" + 
/db_xref="GOA:Q4JZN8" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4JZN8" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVGFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLM + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRMDLPSY + AMPDSNLYVMEIDDRSLAVVKAAIQDVMEGR" + misc_feature 1558..1674 + /gene="wzg" + /locus_tag="SPC33B_0004" + /note="Signal peptide predicted for SPC1550 by SignalP 2.0 + HMM (Signal peptide probability 0.998) with cleavage site + probability 0.539 between residues 39 and 40" + misc_feature 1762..2109 + /gene="wzg" + /locus_tag="SPC33B_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 1.8e-63" + misc_feature 2287..2730 + /gene="wzg" + /locus_tag="SPC33B_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 5.7e-70" + gene 3005..3736 + /gene="wzh" + /locus_tag="SPC33B_0005" + CDS 3005..3736 + /gene="wzh" + /locus_tag="SPC33B_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34188.1" + /db_xref="GOA:Q4JZK3" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4JZK3" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLIIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKSKLFGERYKFMKKRAQYFLEQDLVHVIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIIMDQLI" + misc_feature 3008..3616 + /gene="wzh" + /locus_tag="SPC33B_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 
6.2e-37" + gene 3742..4437 + /gene="wzd" + /locus_tag="SPC33B_0006" + CDS 3742..4437 + /gene="wzd" + /locus_tag="SPC33B_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34189.1" + /db_xref="GOA:Q4JZK2" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4JZK2" + /translation="MMKEQNMIEIDVFQLFKTLWKRKLIILIVALVTGAGAFAYSTFI + VKPEYTSTTRIYVVNRDQGDKPGLTNQDLQAGSYLVKDYREIILSQDVLEKVATNLKL + DMPAKTLASKVQVTVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIEVLDTRVKRPEDVEDVLKI + PLLGLVPDFDKIK" + misc_feature 3742..3858 + /gene="wzd" + /locus_tag="SPC33B_0006" + /note="Signal peptide predicted for SPC1552 by SignalP 2.0 + HMM (Signal peptide probability 0.649) with cleavage site + probability 0.422 between residues 39 and 40" + misc_feature 3763..4179 + /gene="wzd" + /locus_tag="SPC33B_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 3.5e-56" + misc_feature 4285..4362 + /gene="wzd" + /locus_tag="SPC33B_0006" + /note="PS00217 Sugar transport proteins signature 2." 
+ gene 4447..5136 + /gene="wze" + /locus_tag="SPC33B_0007" + CDS 4447..5136 + /gene="wze" + /locus_tag="SPC33B_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34190.1" + /db_xref="GOA:Q4JZN5" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4JZN5" + /translation="MPTLEISQAKLDSVKKAEEYYNALCTNLQLSGDGLKVLSITSVK + IGEGKSTTSANIAWAFARAGYKTLLIDGDIRNSVMLGVFKARNKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFTTMLETLRKYFDYIIVDTAPVGVVI + DAVIITRNCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGIVLNKFDTSVDKYGSY + GNYGDYGKNKK" + gene 5151..6518 + /gene="wchA" + /locus_tag="SPC33B_0008" + CDS 5151..6518 + /gene="wchA" + /locus_tag="SPC33B_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI34191.1" + /db_xref="GOA:Q4JZN4" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4JZN4" + /translation="MNGKILRSSLVIIQSFLVILLTYLLSTVREAEIVSTTAIALYIL + HYFVFYISDYGQDFFKRGYLIELLQTLKYILFFALAISISNFFLEDRFSISRRGMIYF + LTLHALLVYVLNLFIKWYWKRAYPNFKGSKKILLLTATSRVEKVLDRLIESNEVVGKL + VAVSVLDKPDFQHDCLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + IDVTVNLNAFDRSLARNKQIREMAGLNVVTFSTAFYKTSHVIAKRIIDIVGALVGLIL + CGLVSIVLVPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVFM + RDGAK" + misc_feature 5151..5243 + /gene="wchA" + /locus_tag="SPC33B_0008" + /note="Signal peptide predicted for SPC1554 by SignalP 2.0 + HMM (Signal peptide probability 0.936) with cleavage site + probability 0.432 between residues 31 and 32" + misc_feature 5934..6515 + /gene="wchA" + /locus_tag="SPC33B_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 4.8e-160" + gene 
6646..7590 + /gene="wciN" + /locus_tag="SPC33B_0009" + CDS 6646..7590 + /gene="wciN" + /locus_tag="SPC33B_0009" + /note="member of homology group 62" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34192.1" + /db_xref="GOA:Q4JZN3" + /db_xref="InterPro:IPR002495" + /db_xref="UniProtKB/TrEMBL:Q4JZN3" + /translation="MDIVYTTDNNFVEVLYASISSLYETNALLYPNVWIIADKVSAKN + RDKINELASKNNQNTINWIENIEKPFKLTSDRGSISSYSRLFLGEVLPKKVRKVLYLD + CDIIIMDSLSDLFDEEFDGKIIQGVSDVLNKEYKKILNIPVSAPVFNSGVLYIDLDKW + REQRIEEKLVYIINKFKGNVIQGDEGVLNAVLFDSYKELSPRYNYMTIFEDMSYEDMI + AFKQPVNYYSKEVLEESRKNIIIRHFTTCFLSLRPWQESSEVTHVEIFKKYYRGAYKQ + ASPSKLLNIYKILPKKMSLYLLGFIQSKVRPKLYRITK" + misc_feature 6649..7419 + /gene="wciN" + /locus_tag="SPC33B_0009" + /note="HMMPfam hit to PF01501, Glycosyl transferase + family, score 1.2e-58" + gene 7600..8310 + /gene="wciO" + /locus_tag="SPC33B_0010" + CDS 7600..8310 + /gene="wciO" + /locus_tag="SPC33B_0010" + /note="member of homology group 81" + /codon_start=1 + /transl_table=11 + /product="putative ribitol phophotransferase" + /protein_id="CAI34193.1" + /db_xref="GOA:Q4JZJ8" + /db_xref="InterPro:IPR000462" + /db_xref="UniProtKB/TrEMBL:Q4JZJ8" + /translation="MVSVKSIEQKTMTEEKKREAKKDIFAFYVGRPLSYILTIPFLKT + KMTPNQISILSIVPLIIGTALVTVSSNQFVLLLNWLCFFLWNLLDGVDGNVARFKGIT + SPMGSVIDAMAGYAAMYLSFLTMGIIASDYSQTLFFTQKTYLILGSLSGVFVLFPRLI + MHKAINTVGSKNSEQYKGRKNFGVIEMIALNVTSITGFAQLFMLIAILLKLSDLFTLV + YFLINLLVMVISIKKIVK" + misc_feature 7834..8298 + /gene="wciO" + /locus_tag="SPC33B_0010" + /note="HMMPfam hit to PF01066, CDP-alcohol + phosphatidyltransferase, score 0.0078" + gene 8325..9419 + /gene="wcrC" + /locus_tag="SPC33B_0011" + CDS 8325..9419 + /gene="wcrC" + /locus_tag="SPC33B_0011" + /note="member of homology group 24" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34194.1" + /db_xref="GOA:Q4JZJ7" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4JZJ7" + 
/translation="MKKIAIVRYNLSKIGGAEKVAINMANEFSQNHKTYLISILLNED + KNINYDISSDVEVESFFYGDLRVRKVIIPAMLKLRKHLIKNEIDVVFSIAPATNIIIF + LATLGLNIKTVFCDHHSLEFQDTFSREIQRYIGAKFFDKIVTLTEEDKNRYRKDFSLR + NEKVTSIYNWMEDINNIPAYTNKSKSIITVGRIEYQKGYDYLAKAIVNVLSKYKDWEW + DIYGSGNEQIKQDLITELDKGGVLSRVHFKGNVNGTENIYPGHSIYVMTSRYEGLPLV + LLEAKQYGLPIVSFKCPTGPSEIVLDEENGYLVDNYDVDYMSRKISDLIENENLRLKF + SDESMKDTEKFSKKKIIKQWEDLIEEMTGE" + misc_feature 8835..9347 + /gene="wcrC" + /locus_tag="SPC33B_0011" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 1.8e-31" + gene 9421..10428 + /gene="wciD" + /locus_tag="SPC33B_0012" + CDS 9421..10428 + /gene="wciD" + /locus_tag="SPC33B_0012" + /note="member of homology group 60" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34195.1" + /db_xref="GOA:Q4JZN0" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JZN0" + /translation="MGKKLLTIAVPSYNAEKYLPDTIPTILSAKNVHLIDLLIVNDGS + SDGTGEIAEEFERNYPDIIRVLNKPNGGHGSAVNAGIKNAYGTYFKIVDADDWVDTEN + LDDLIEYLKETDVDEILSPYYRVYVNQAGDVVSIENYNEFSMIQTDKVYQVDSFYEQI + GRTVGMHTMTLKTKLLKENQVELSENMYYVDMEYITYVLPYIETVFLFNKPIYKYRLG + TSTQSISIESYIKNRSMHKQVTFNLIDFYNQTKLGFGRSKAVKNLIINLINQQWNIYF + NLNNVTEAKKELIEFEKSIAIKNKSFLKNSTGLKMNFVRKSRYHLFNIAKYYSNWRVK + S" + misc_feature 9439..9948 + /gene="wciD" + /locus_tag="SPC33B_0012" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 2.9e-29" + gene 10425..11393 + /gene="wciE" + /locus_tag="SPC33B_0013" + CDS 10425..11393 + /gene="wciE" + /locus_tag="SPC33B_0013" + /note="member of homology group 44" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34196.1" + /db_xref="GOA:Q4JZM9" + /db_xref="InterPro:IPR008441" + /db_xref="UniProtKB/TrEMBL:Q4JZM9" + /translation="MNKIKKMTREYMKLKKIFSTQIANNMLLEKIAARLSRYNFLHGL + VVFIYSKKHKDILDFLKKDFDIFLSTYSYDFEKSNEQNGKKIFSLWLQGYENAPEIVQ + KSIQTQKEYAERFGYEYILLDKSNLETFVKIPENIARKFEDGKIDAIKYSDIIRTFLL + 
FKYGGIWFDATIYIKTDSKLSYLDDEFYTIRAKGDETYPKYVADGRWALFCIAGYRNG + IVFDFLRKFQVEYFSKYDLPINYFLIDYLMELGYEYNPIIRKQVDKVITNNQDLYFLV + NNFSNMYRDEDWKKVLETTNIFKCSYKIYVSDKLDTYFYKLKNQTL" + misc_feature 10518..11375 + /gene="wciE" + /locus_tag="SPC33B_0013" + /note="HMMPfam hit to PF05704, Capsular polysaccharide + synthesis protein, score 1.7e-58" + gene 11406..12374 + /gene="wciF" + /locus_tag="SPC33B_0014" + CDS 11406..12374 + /gene="wciF" + /locus_tag="SPC33B_0014" + /note="member of homology group 25" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34197.1" + /db_xref="GOA:Q4JZJ4" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JZJ4" + /translation="MISIIVPVYNVKDYLHYAMESLFRQTYTDFEVILVNDGSTDSSG + ELCNRYAENHENVYVFHKKNGGLSDARNFGVTKASSDWIVFLDPDDYFEVDALELLVK + IQQRYDADLISTKVKSTSTYEDYNSDYMGESVYSNLEVLSKEEALELMLQDKVATVSA + CAKLYHKSILERAPFPIGKVYEDFYVVGEHLALANRIVISPYKTYNYFCRPGSIVRSK + FTVKRFNFFEAAEHNRSIIKKYYNSKNLENVLNIKIVQGSFSIASSAAESDVESLLAI + RKKLSSLYWSVFTSPKASYRLKLKYTLFLLFPKGYYKLKKMIKRVD" + misc_feature 11412..11927 + /gene="wciF" + /locus_tag="SPC33B_0014" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 7.4e-42" + gene 12375..13583 + /gene="wzy" + /locus_tag="SPC33B_0015" + CDS 12375..13583 + /gene="wzy" + /locus_tag="SPC33B_0015" + /note="member of homology group 127" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI34198.1" + /db_xref="UniProtKB/TrEMBL:Q4JZM7" + /translation="MSVRKLSLIDILDYMWIILIIVQCHSIYTVKSEPLNLIVPFLVT + TAMLLLLNLLRFTLSIKYIYILGLYFIAMATFFLTNIGANVTPLNITKYFIMLPLFFL + INSIYVNKEIFSALLSKFVNVVVILAIFSLFFWIFGTLLNVVHPTSTVINQWSGGQLI + NSYYNLYFETQQMIFFGFRIIRNSGIFAESPIWGLILSIAYVIDFLILKFDKNSKRNI + IILTMLSTISTTGIIIVGLAILYKIMTTSRWMTKLLLLPVTLSLGLSLLLLLAEKSET + VSANLRVDDYNIGFIVWKTSLWIGHGLNNGILAIQSHISTFTRNLGYSNTLFVILAQG + GLLLFLIYFSPMILLLFKKNINLDFKFAIILFFILVTTIIFEGTFLFLWILTLSYSYF + SFVTLDKTGT" + misc_feature 13200..13394 + /gene="wzy" + 
/locus_tag="SPC33B_0015" + /note="HMMPfam hit to PF04932, O-Antigen Polymerase, score + 0.00012" + gene 13720..15135 + /gene="wzx" + /locus_tag="SPC33B_0016" + CDS 13720..15135 + /gene="wzx" + /locus_tag="SPC33B_0016" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI34199.1" + /db_xref="GOA:Q4JZM6" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4JZM6" + /translation="MKVLKNYAYNLSYQLLVIILPIITTPYVTRVFSSDDLGTYGYFN + SIVTYFILLATLGVANYGTKVISGHRKQIQKNFLGIYSLQLGATVLSLSLYALLCLTL + PFMQNPVAYILGLSLVSKGLDISWLFQGLEDFRKITVRNITVKLVGVISIFLFVKSSN + DLYLYVFLLTIFELFGQFSMWIPAREFIGRPHFDIEYARHHLKPVILLFLPQVAISLY + VTLDRTMLGALASTKDVGIYDQALKLVNILLTLVTSLGSVMLPRVAHLLATDDHKAVN + RMHEMSFFIYNLVIFPMMAGILIVNDDFVQFFLGQDFQDARYAIAIMIFRMFFIGWTN + IMGIQMLIPHNQNKEFMISTTAPAIISVGLNLLFLPKLGYIGAAIVSVLTEALVWAIQ + LFYTRRYLKEVPIIGSMSKIILASAIMYGLLLSSKTVIHFSPTLNVLAFAALGGIIYL + FAILSLKVVDVKELKQIIRKN" + misc_feature 13726..14520 + /gene="wzx" + /locus_tag="SPC33B_0016" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 1.8e-68" + gene 15137..16135 + /gene="wciG" + /locus_tag="SPC33B_0017" + CDS 15137..16135 + /gene="wciG" + /locus_tag="SPC33B_0017" + /note="member of homology group 21" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI34200.1" + /db_xref="GOA:Q4JZM5" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q4JZM5" + /translation="MRKIRNINLDLLKVLACVGVVLLHTTMGGFKETGSWNLLAYLYY + LGTYSIPLFFMINGYLLLGKREITYLYILQKVKWILITVSSWTFIVWFFYRDFTTNPI + KKIVGSLIQRGYFSQFWFFGALILIYLCLPIVRQFLNSKRSYLYSLSLLMTIGLIFEL + LNILLQMPIQTYVIQTFRLWTWFFYYLLGGYIAQFTKEEIESRFKNWMKIASILLLLI + SPIILFFIAKTTYHNFFAEYFYDILLVKVVSVGIFLTIFSLVLNENSNKWIIFLSNQT + MGIFIIHTYIMKVWEKLFGFSFIGSYLLFAIFTLSVSFIIVGMLMKIPYFNRIVKL" + gene 16148..17251 + /gene="glf" + /locus_tag="SPC33B_0018" + CDS 16148..17251 + /gene="glf" + /locus_tag="SPC33B_0018" + /EC_number="5.4.99.9" + /note="member of 
homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI34201.1" + /db_xref="GOA:Q4JZC4" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JZC4" + /translation="MYDYLVVGAGLFGAVFAHEAALKGKKVKVIEKRNHIAGNIYTRE + EEGIQVHQYGAHIFHTSDKEIWDYVNQFAEFNRYTNSPVANYKGEIYNLPFNMNTFNK + LWGVVTPAEAQAKIEEQRAILNGKTPENLEEQAISLVGTDIYEKLIKDYTEKQWGKPT + TELPSFIIRRLPVRLTYDNNYFNDTYQGIPIGGYTQIVEKMLDHENIDVETNVDFFVN + KEQYLKDFPKIVFTGMIDEFFDYKLGELEYRSLRFENETLDMENYQGNAVVNYTDAET + PYTRIIEHKHFEFGSQAKTIITKEHSKTWEKGDEPYYPVNNDRNNHLYKSYKKLADEQ + GNVIFGGRLGHYRYYDMHQVIGVALQCVRNELN" + misc_feature 16583..17191 + /gene="glf" + /locus_tag="SPC33B_0018" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 1.7e-113" + gene complement(17452..18708) + /gene="tnp" + /locus_tag="SPC33B_0019" + CDS complement(17452..18708) + /gene="tnp" + /locus_tag="SPC33B_0019" + /note="member of homology group 13" + /codon_start=1 + /transl_table=11 + /product="putative IS1167 transposase" + /protein_id="CAI34202.1" + /db_xref="GOA:Q4JZM3" + /db_xref="InterPro:IPR002560" + /db_xref="InterPro:IPR012287" + /db_xref="UniProtKB/TrEMBL:Q4JZM3" + /translation="MGQLHFITKLLDIKDTNIQIIDVVNRDSHKEIIAKLDYDAPSCP + DCGSLMKKYDFQKPSKIPYLETTGMPSRILLRKRRFKCYHSSKMMVAETPLVKKNHQI + PRIINQKIAQKLIEKISMTDIAHQLAISTSTVIRKLNDFHFEHDFSRLPKIMSWDEYA + FTKGKMSFIAQDFDNLNIITVLEGRTQAVIRNHFLRYDRAVRCQVKIITMDMFSPYYD + LAKQLFPCAKIVLDRFHIIQHLSRAMSRFRVQIMNQFERKSHEYKAIKRYWKLIQQDS + RKLSDKRFYRPTFRMHLTNKEILDKILSYSEDLKHHYQIYQLLLFHFQNKDPEKFFGL + IEDNLKQVHPIFQTVFKTFLKNKEKIVNALQLPYSNAKLEATNNLIKLIKRNAFGFRN + FENFKKRIFIALNIKKERTKFVLSQA" + misc_feature complement(17956..18252) + /gene="tnp" + /locus_tag="SPC33B_0019" + /note="HMMPfam hit to PF01610, Transposase, score 5e-48" + misc_feature complement(18292..18357) + /gene="tnp" + /locus_tag="SPC33B_0019" + /note="Predicted helix-turn-helix motif with score + 1691.000, SD 4.95 at 
aa 118-139, sequence + ISMTDIAHQLAISTSTVIRKLN" + gene 18992..>19039 + /gene="aliA" + /locus_tag="SPC33B_0020" + CDS 18992..>19039 + /gene="aliA" + /locus_tag="SPC33B_0020" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34203.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ89" + /translation="MMKSSKLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcgta taaaaacaag + 181 ggaggactgt ataaaagaca gaaatccttt gttttttata accaaggttt ataaactttc + 241 attctcgaaa ttcaattaac tttacaaatt ctcactatta aggagaaaga agatgaacat + 301 aaagaagcgt gtccttagtg caggtctgac ttttgcatct gctttgcttt tagctgcttg + 361 cggccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaattac ctgttagact attacgctga taatatagtc aattgaaaca agaacaagac + 481 aaaagagcct tgtaaaaggt attgcaactt ggtaatacct ttttgaggtt ctttttgata + 541 tgagcccatg ttttctcaat aggattgtac tcaggtgagt agggaggaag aggtaaaagt + 601 ttatgaccaa actcttcaca caagagttct agcttaccca ttctatggaa tcttgcatta + 661 tccataataa taaccgatgg tgtggttaat gttggtaaga gaaatttttg aaaccaagct + 721 tcaaaaaagt cgctcgtcat cgtctcttcg taagtcattg gagcgattaa ctcaccattt + 781 gttagacctg caaccaaaga aatcctctga tatcttcttc cagatacttt gcctcttctt + 841 aactgacctt ttaatgagcg accatattct cgataaaaat aagtatcgaa tcctgtttcg + 901 tcaatctaaa caggtgctag gtgctttaaa ctattaaaat tcttaagaaa taaggctact + 961 ttttctgggt cttgttcata gtaggtgtgg ttcttttttt cgagtgtagc ccatagcttt + 1021 gagcgcatag tggatggtag ttggatgaca gccaaagtca gaagctattt cagtcaaata + 1081 agcgtctgga ttgtcagtaa gatagttttt aagtctatct ctatcaacct ttcttggttt + 1141 tattcctttt acttggtggt ttagctctcc tgttttctct tttagcttta accagccata + 1201 aatggtatta cgtgagattt ggaaaacgtg tgatgcttct gttatactac ctgttcgctc + 1261 acaataagag agaacttttt tacgaaaatc tattgaatat gccataggaa gattatacca + 1321 cattgtgtac tacagtagat tgaaactaga acagtacacc tctacttcta aaacattgtt + 1381 agaaatcgat 
tttactgtcc cgatcgattt gtcatcttct tatttcattt tactatattt + 1441 ttggttcgcg ggaagtctac taagatactt aaagatgcag atagtggaaa taaaggtgta + 1501 gacattaccg taaaaaagtg atacaattgt aagatattga atgtataggt attaatcatg + 1561 agtagacgtt ttaaaaaatc acgttcacag aaagtgaagc gaagtgttaa tatagttttg + 1621 ctgactattt atttattgtt agttggtttt ttattgttct taatctttaa gtacaatatc + 1681 cttgctttta gatatcttaa cctagtggta actgcgttag tcctactagt tgccttggta + 1741 gggctactct tgattatcta taaaaaagct gaaaagttta ctatttttct gttggtgttc + 1801 tctatccttg tcagctctgt gtcgctcttt gcagtacagc agtttgttgg actgaccaat + 1861 cgtttaaatg cgacttctaa ttactcagaa tattcaatca gtgtcgctgt tttagcagat + 1921 agtgagatcg aaaatgttac gcaactgacg agtgtgacag caccgactgg gactgataat + 1981 gaaaatattc agaaactact agctgatatc aagtcaagtc agaataccga tttgatggtc + 2041 aaccagagtt cgtcttactt ggcagcttac aagagtttga ttgcagggga gactaaggcc + 2101 attgtcctaa atagtgtctt tgaaaacatc atcgagtcag agtatccaga ctacgcatcg + 2161 aagataaaaa agatttatac caagggattc actaaaaaag tagaagctcc taagacgtct + 2221 aagaatcagt ctttcaatat ctatgttagt ggaattgaca cctatggtcc tattagttcg + 2281 gtgtcgcgat cagatgtcaa tatcctgatg actgtcaatc gagataccaa gaaaatcctc + 2341 ttgaccacaa cgccacgtga tgcctatgta ccaatcgcag atggtggaaa taatcaaaaa + 2401 gataaattaa cccatgcagg catttatgga gttgattcgt ccattcacac cttagaaaat + 2461 ctctatggag tggatatcaa ttactatgtg cgattgaact tcacttcttt cttgaaaatg + 2521 attgacttat tgggaggggt agatgttcat aatgatcaag agttttcagc tctacatggg + 2581 aagttccatt tcccagtagg gaatgtccat ctagactctg agcaggctct aggttttgta + 2641 cgtgaacgct actcactagc cgatggagac cgtgatcgcg ggcgcaatca acaaaaggtg + 2701 attgtggcta tccttcaaaa attaacgtca accgaagcac tgaaaaatta tagtacgatc + 2761 attaatagct tgcaagattc tatccaaaca aatatgccac ttgagactat gataaatttg + 2821 gtcaatgctc agttagaaag tggagggaat tataaagtaa attctcaaga tttaaaaggg + 2881 acaggtcgga tggatcttcc ttcttatgca atgccagaca gtaacctcta tgtgatggaa + 2941 atagatgatc gtagtttagc tgtagttaaa gcagctatac aggatgtgat ggagggtaga + 3001 tgaaatgata gacatccatt cgcacatcgt 
ctttgatgta gatgatggtc ccaagtcaag + 3061 agaggaaagc aaggctctct tggcagaatc ctacagacag ggggtgcgaa ccattgtctc + 3121 tacctctcac cgtcgcaagg gcatgtttga aactccggaa gagaagatag cagaaaactt + 3181 tcttcaggtt cgggaaatag ctaaggaagt ggcgagtgac ttgatcattg cttacggggc + 3241 tgaaatttac tacacaccag atgttctgga taagctggaa aaaaagcgga ttccgaccct + 3301 caatgatagt cgttatgcct tgatagagtt tagtatgaac actccttatc gcgatattca + 3361 tagcgccttg agcaagatct tgatgttggg aattactcca gtcattgccc acattgagcg + 3421 ctatgatgct cttgaaaata atgaaaaacg cgttcgagaa ctgattgata tgggctgtta + 3481 cacgcaagta aatagttcac atgtcctcaa atccaaactt tttggcgaac gttataaatt + 3541 catgaaaaaa agagctcagt attttttaga gcaggatttg gtccatgtca ttgcaagtga + 3601 tatgcacaat ctagacggca gacctcctca tatggcagaa gcatatgacc ttgttaccca + 3661 aaaatacgga gaagcgaagg ctcaggaact ttttatagac aatcctcgaa aaattataat + 3721 ggatcaacta atttaggaga aatgatgaaa gaacaaaaca tgatagaaat cgatgtattt + 3781 caattattta aaaccttgtg gaaacgcaag ctaataattt taatagtggc acttgtgaca + 3841 ggtgcggggg cttttgcata tagcactttt attgttaagc cagaatatac gagtaccacg + 3901 cgaatttacg tagtgaatcg cgatcaagga gacaagccgg ggctgacaaa tcaggatttg + 3961 caggcaggat cttatctggt aaaagactac cgtgagatta tcctttcgca ggatgtattg + 4021 gaaaaagtag cgacaaattt gaagttggat atgccagcaa aaacgttagc cagcaaagtt + 4081 caagtgactg taccagctga cactcgtatc gtctcaatct ctgtcaagga taaacagcca + 4141 gaggaagcca gtcgtatcgc taattctcta cgagaagttg ctgcagaaaa gatcgtcgct + 4201 gtaacgcgag tatctgatgt aacgacactt gaagaagcgc gaccagctac gactccttct + 4261 tctccaaatg ttcgacgcaa ttccttgttt ggttttcttg gaggagcagt cgtaacagta + 4321 attgctgttc ttttgattga ggtgctggac acccgtgtga aacgtcctga agatgttgaa + 4381 gatgtactga aaattccact tttagggctc gttccagatt ttgacaaaat aaaataggag + 4441 gaagttatgc caacattaga aatctcacag gcaaaattgg attctgtaaa aaaggcagag + 4501 gaatattata acgctttgtg cacgaaccta cagttaagtg gagatggttt gaaagtattg + 4561 tctatcactt ctgtgaaaat aggagaagga aaatcaacga cttccgccaa tatcgcttgg + 4621 gcttttgcgc gtgcaggtta caaaacgctg ctgattgatg gagatattcg 
caattctgtt + 4681 atgttaggtg tctttaaagc aaggaataag attacaggcc tgacagaatt tttatcagga + 4741 actacagacc tatcacaagg gctttgtgat accaatatcg aaaatctctt tgtaattcag + 4801 gctggctctg tgtcaccgaa tccgacagct cttcttcaaa gtaagaattt cactacaatg + 4861 cttgaaacct tgcgtaaata ttttgactac atcattgtag atactgctcc tgttggtgtc + 4921 gtgattgatg cggttattat tacgcgaaac tgcgatgctt ctattttagt gacggaggca + 4981 ggtgaaataa atcgacggga tattcaaaaa gcaaaagaac agttggaaca cacagggaag + 5041 ccgtttttgg gaattgtgtt gaataaattc gatacttcag tagacaaata cggttcttat + 5101 ggaaattatg gagattacgg gaaaaataaa aaataggtcg ggggatagag atgaatggaa + 5161 aaatattaag gtcttcattg gtcataatcc agagttttct tgttatttta ttgacttatc + 5221 tacttagtac tgtgagagaa gcggagattg tttcaacaac agctattgca ctttatatcc + 5281 tccattattt tgtcttttat atcagtgatt atggacagga tttctttaaa aggggatatt + 5341 tgattgaact tctccagaca ttgaaatata tcctattctt tgcactagcg attagtattt + 5401 ctaatttttt cttagaggat cgatttagta tttccagacg aggcatgatt tacttcctca + 5461 cattacatgc tctcttagtc tatgtgctaa acctatttat caagtggtat tggaagcggg + 5521 cttatcccaa ctttaaagga agtaagaaga ttctcctact tacagcaact tctcgtgtcg + 5581 aaaaggtact ggatagatta atagaatcaa atgaggttgt tgggaagttg gtagccgtca + 5641 gtgtcttaga taaaccagat tttcagcatg attgtttaaa ggtagtagca gagggggaga + 5701 tagtaaactt tgcgactcat gaggtggtag atgaagtctt tatcaatctt ccaagtgaaa + 5761 aatacaatat tggagagctg gtctctcagt ttgaaacgat gggaattgat gtaacagtta + 5821 atctaaatgc ttttgatcgt agtttggcac gtaacaagca aattcgtgag atggcaggat + 5881 taaacgttgt gactttttct acagcatttt ataagactag tcatgtaatt gctaagagga + 5941 ttattgatat cgtgggtgca ttggtagggc tgatactatg tggtttagtc agtattgtat + 6001 tggttccttt gattcgaaag gatgggggct ctgctatttt tgctcagacg cgtataggaa + 6061 aaaatggtcg tcagttcact ttttataagt ttcgctctat gtgtgtagat gccgaggcga + 6121 aaaaaagaga actcatggaa caaaatacca tgcagggtgg aatgtttaag gtggacgatg + 6181 atcctcgtat cacgaaaatt ggtcgtttta tacggaagac tagcttggac gagctaccac + 6241 agttttataa tgttctaaag ggagatatga gtttggttgg cacacggcca ccaacagtgg + 6301 acgagtatga 
acactatacc ccagaacaaa aacgtcggct aagttttaaa cctggtataa + 6361 caggcttatg gcaggtcagt ggacgaagtg aaattaagaa ttttgatgaa gttgttaaat + 6421 tagatgtggc ttatatagat gattggacaa tctggaaaga tattgaaatt ttattgaaga + 6481 cagttaaagt agtatttatg agagatggag cgaagtgaaa gttatctttt ccgataaaag + 6541 tgcacgatta gagaagggaa attacaactc tatatgacta ttaaatcgta tcaaaatatt + 6601 taaatgattt taaacgataa aatattagaa aagttgaggt aaaaaatgga tatagtatat + 6661 acgacagaca ataactttgt tgaggtactt tatgcatcaa tttcatcttt atatgaaacg + 6721 aatgcattat tatatcccaa cgtttggata attgctgata aggtatcagc taaaaataga + 6781 gataaaatca atgagttagc tagtaaaaat aatcaaaata cgataaactg gatagaaaat + 6841 atagaaaaac cttttaaatt gacatcagat agaggttcta taagttctta tagtagatta + 6901 tttttaggag aagttcttcc caaaaaagtt aggaaagtac tttatcttga ttgtgacatt + 6961 attatcatgg atagtttatc agatttattt gatgaagaat ttgatggaaa aataatccaa + 7021 ggtgtgtccg atgttttaaa taaggagtat aaaaaaatat tgaatattcc tgttagtgca + 7081 cctgtattta actcaggtgt attatatatt gatttagata aatggcgtga acaacgaatc + 7141 gaggaaaaat tagtttatat aataaataaa tttaaaggaa atgtaattca aggagatgaa + 7201 ggagttttga atgctgttct gtttgattct tataaagaat tatctccaag atacaattat + 7261 atgaccattt ttgaggatat gtcttatgag gatatgattg cttttaagca acctgtaaac + 7321 tattatagta aggaagtttt agaagaatca agaaagaata taataatccg ccatttcaca + 7381 acgtgttttc tatcactcag accttggcaa gaaagtagtg aggtaacgca tgtggaaata + 7441 tttaaaaaat actatagagg agcatacaaa caagcatctc catctaagtt attaaatatt + 7501 tataaaattt tacctaaaaa aatgtcgctc tatctactag gttttattca atcaaaagtg + 7561 cgtccaaaac tgtatagaat tacaaaatag aggtgtaaaa tggtaagtgt taaaagtata + 7621 gaacaaaaaa cgatgacgga agaaaagaaa agggaagcaa aaaaagacat ttttgctttc + 7681 tatgtaggta gacctctatc atacatattg acaattcctt ttcttaaaac aaaaatgaca + 7741 ccgaatcaga tttctatatt gtctattgta cctttaatta tcggaacagc tttggtaaca + 7801 gtaagttcta atcagtttgt actattgcta aattggcttt gttttttctt atggaattta + 7861 cttgacggtg ttgacggaaa tgttgctcgt ttcaagggaa ttacctctcc tatgggaagt + 7921 gttatagatg caatggcagg ctatgctgca 
atgtatttat cattcctcac tatgggaatt + 7981 attgcaagtg actatagtca aacactattc tttacacaaa aaacatattt aattttaggg + 8041 tcactatctg gtgtttttgt tttgtttcct agattaatta tgcacaaagc tataaatact + 8101 gtaggaagta agaatagtga gcagtacaaa ggtagaaaaa attttggtgt tatagaaatg + 8161 attgcactta atgtaacctc tataacagga tttgctcaat tgtttatgct tattgcaata + 8221 ttattaaaat tgagcgactt atttacacta gtttatttcc tcattaattt attagttatg + 8281 gtgatctcta ttaaaaagat agtaaaataa gaataaggcg agttatgaaa aaaattgcga + 8341 tagtaaggta taatttaagt aaaattggtg gagctgaaaa agttgctata aatatggcta + 8401 atgaattttc tcaaaaccac aaaacatact taatttctat tttactaaat gaagacaaga + 8461 acataaatta tgacatatca tctgatgttg aagttgagtc ctttttttat ggtgatttaa + 8521 gagttcgcaa agtgataatt ccagctatgc tgaagttaag aaaacacttg ataaagaatg + 8581 aaattgatgt agtgttttct attgctccgg ctacaaatat tattatcttt ttagcaacgt + 8641 taggattaaa tataaaaact gtcttttgtg accaccatag tttagagttt caagacactt + 8701 tcagtcgcga gatacaaaga tatattgggg caaagttttt tgacaaaatt gtaactttga + 8761 ctgaggaaga taaaaataga tatcgaaaag acttttcatt aagaaatgaa aaggttactt + 8821 caatctataa ttggatggaa gacattaata acattcccgc atatactaat aaaagcaaga + 8881 gcattataac agttggaaga atagaatatc aaaaaggata tgactattta gctaaagcta + 8941 ttgttaacgt tctgtcaaaa tataaagact gggaatggga catatacggt tcgggaaacg + 9001 agcaaataaa acaagatctg attactgaat tggataaagg tggcgtttta tcgcgggttc + 9061 attttaaagg gaatgttaat ggtacagaaa atatttatcc tggtcattct atttatgtaa + 9121 tgacttctcg ttatgaaggt cttcccttag ttcttttaga agctaaacag tatggactac + 9181 cgattgttag ttttaaatgt ccaacgggtc catcagaaat agttttagat gaggaaaatg + 9241 gatatttagt tgataattac gatgttgatt acatgagtag aaaaatttct gatttaattg + 9301 aaaacgagaa tttgagatta aaattttcag atgaatcaat gaaagatact gaaaaattta + 9361 gcaagaaaaa gattataaag cagtgggaag acttaattga agaaatgaca ggggaataga + 9421 atgggaaaga aattattaac aatagcagtg ccatcataca atgcggaaaa atatttacca + 9481 gatactatac caacaatatt atctgcaaag aatgtacatt taattgattt acttatagta + 9541 aatgatggtt cgagtgatgg tacgggggaa atcgctgaag aattcgagcg 
aaattaccct + 9601 gatattattc gtgttttaaa taaaccaaat ggtgggcatg gatcagctgt aaatgcaggt + 9661 ataaaaaatg cttatggaac gtattttaag attgttgatg cagatgattg ggttgataca + 9721 gaaaatttag atgatttgat agaatattta aaagaaacag atgtggatga aattctttca + 9781 ccgtattatc gagtttatgt taatcaagct ggagatgtag tatctattga aaattataac + 9841 gaattttcga tgattcagac agataaagtg taccaggtcg attctttcta tgaacaaata + 9901 ggtagaaccg taggaatgca cactatgaca ttaaaaacca agctgttaaa agaaaatcaa + 9961 gtagaattat ctgaaaatat gtactatgta gatatggaat atatcaccta tgttctacca + 10021 tatatagaaa cggtttttct ttttaataaa ccgatttata aataccgttt aggaacatct + 10081 acgcaaagta ttagtataga aagttatata aaaaatagat ctatgcataa acaagttact + 10141 tttaatctta ttgattttta caatcaaacg aaacttggat ttggtcgctc caaagcagta + 10201 aagaatctaa taataaatct tataaatcag cagtggaata tctatttcaa tttaaataat + 10261 gtaactgaag ctaaaaaaga attaatagaa tttgaaaaat ctatagctat taaaaataaa + 10321 agcttcttga aaaattctac gggcttaaag atgaattttg tcagaaaaag tcgttaccat + 10381 ttatttaaca ttgctaaata ttatagtaat tggagagtga aatcttgaat aaaatcaaaa + 10441 aaatgacaag agaatacatg aaattgaaaa aaattttctc tacccaaatt gcaaataata + 10501 tgctcttaga aaagatagct gcacgactat caagatataa ttttttgcat ggtttagtag + 10561 tatttattta ctctaaaaaa cataaggata ttttagattt tctaaaaaag gattttgata + 10621 tatttttatc tacctattct tatgatttcg aaaaatctaa tgagcaaaat ggaaaaaaga + 10681 ttttttcatt atggcttcaa ggatatgaaa atgctccaga aattgttcaa aaatccatac + 10741 aaacccaaaa agaatatgct gaaagatttg gttatgaata catattgtta gataagtcaa + 10801 atttagagac atttgttaaa attcctgaaa atattgctag aaaatttgaa gatgggaaaa + 10861 tagatgcaat aaaatattca gatatcatta gaactttctt gttatttaaa tacggtggta + 10921 tctggttcga tgcaactatt tatataaaaa cagattcaaa gttaagttat ttagatgatg + 10981 agttttatac tattcgtgcg aagggagatg aaacctatcc taagtatgtt gcggatggac + 11041 gttgggcctt gttttgtata gctggatatc gtaatgggat tgtattcgat tttttaagaa + 11101 aatttcaagt tgaatatttc tctaaatatg acttaccaat aaattacttt ttgatagact + 11161 atttaatgga gttaggctat gagtataatc caataattcg aaaacaggtt 
gataaggtaa + 11221 ttaccaacaa ccaagatctc tattttttag taaataattt ttctaatatg tacagggatg + 11281 aggattggaa aaaagtatta gaaacaacaa atatttttaa atgcagctat aaaatatatg + 11341 taagcgataa attggacaca tacttttata aattgaaaaa tcaaactcta tagtgaggaa + 11401 atgtaatgat ttcgattatt gttccagtat ataatgtgaa agactatcta cattatgcaa + 11461 tggaaagttt atttagacaa acatacacag actttgaagt tattttagtt aatgatggtt + 11521 caacagatag ttctggtgaa ttatgtaatc ggtacgctga aaatcatgag aatgtttatg + 11581 tttttcataa aaaaaatggt ggactttcgg atgctagaaa ttttggtgtc acgaaggctt + 11641 cttcggattg gatagttttt ctggatccag atgactattt tgaagtagat gctttagaac + 11701 tattagttaa gattcagcaa agatatgacg cagatttgat atcaactaaa gtaaaatcta + 11761 cttcgacata tgaagattat aattctgact atatgggaga atctgtttat agtaatcttg + 11821 aagtactttc aaaagaggaa gcattagaac tgatgcttca agataaagtt gcaacagtat + 11881 cggcctgtgc taaactatat cataagagta ttttagaaag agctcccttc cctattggaa + 11941 aagtctatga agatttttat gttgttggtg aacatttggc attagcaaat agaattgtaa + 12001 taagtcctta taaaacctac aattattttt gtagaccggg tagtatcgtt cgttctaaat + 12061 ttactgttaa gaggtttaac ttttttgaag ctgctgaaca taatcgtagt attattaaaa + 12121 aatattataa ttcaaaaaat cttgaaaatg ttttaaatat caaaatagtg cagggttcct + 12181 tttctattgc ttcatcagct gctgaatcag atgtagaatc cttactagca attaggaaga + 12241 aactgtcctc attgtattgg agtgttttca catcaccaaa agcttcttat agactaaaat + 12301 taaaatatac gttattttta cttttcccta aaggatatta caaattaaaa aaaatgataa + 12361 agagagtgga ttaaatgtca gttagaaaac tatctttaat agatatactg gactatatgt + 12421 ggataatatt aattattgta cagtgtcatt caatatatac agtaaaatct gaacctctta + 12481 atttaattgt gccattttta gttacaacag caatgttgtt gttactcaat ttattacgat + 12541 tcactttgtc aataaaatat atatatatat taggtctata ttttatagca atggctacat + 12601 tttttttaac taacataggt gctaatgtta ctcccttaaa tattacgaag tattttataa + 12661 tgcttccttt atttttttta ataaatagta tttatgtgaa taaagaaatt ttttcagcgt + 12721 tactatcaaa atttgtaaac gtagtagtaa ttttagcaat tttttcctta ttcttttgga + 12781 tatttggaac acttctgaat gttgtacacc ctacctcaac agtaattaat 
caatggtctg + 12841 gtggtcaatt aataaatagc tactataatc tatattttga aactcaacag atgatttttt + 12901 ttgggttccg tataatacgg aattcaggaa tatttgctga atctcctatt tgggggctaa + 12961 tactaagtat tgcttatgtt attgattttc ttattttgaa atttgataaa aatagcaagc + 13021 gtaatataat tattctaact atgttaagta caatttcaac gacaggtatt attattgtcg + 13081 ggttagctat attatataaa ataatgacta ctagtcgttg gatgacaaaa ctcttacttc + 13141 tccctgtcac attgagctta ggactctctt tattgctcct attggctgag aaatcagaga + 13201 cagtttcagc taatcttaga gttgatgatt ataatattgg ttttatagta tggaagacaa + 13261 gtttgtggat aggacacgga ttgaataatg gtatattagc aattcaatca catatctcaa + 13321 cgtttacaag aaatttaggc tatagtaaca cattatttgt tattttggct cagggaggtt + 13381 tattattatt cttgatttat ttttctccaa tgatactatt attgtttaag aaaaatatca + 13441 atcttgattt taagtttgcc attatcttat tctttatctt agtaacaaca attatttttg + 13501 aagggacatt tttatttctc tggattttaa cattatcgta tagctacttt tcctttgtaa + 13561 cattagataa aactggaacg taaagtagat aatatataat gtcatatata aattttgata + 13621 tttgtttaat caacttattc ttattattgt gacattctta cttttacagt tgatgataga + 13681 aacaaatctt ttaaagcaag tgaaataaat taataaaaca tgaaagtact aaaaaattac + 13741 gcctacaatc tttcttacca attgttggtg attatactcc ctatcattac gacgccctat + 13801 gtaacaaggg tcttttcttc ggatgattta gggacgtatg gttattttaa ttccatcgtt + 13861 acttatttta tcctcttagc gacgctagga gttgctaact atgggaccaa ggtcatttca + 13921 gggcatcgaa agcaaattca aaaaaacttt ttgggaatct attctctgca attaggtgca + 13981 acagttcttt ctctgtcctt gtatgctctt ctttgtctaa ctcttccctt tatgcaaaat + 14041 ccggtagcct atattctagg cttgagttta gtttctaaag gtttagacat ctcctggctc + 14101 tttcaagggt tggaggattt tcgaaagatt actgtccgaa atataacagt taaactagtt + 14161 ggggtcattt ccatcttcct ctttgttaaa tcatcaaatg acctttacct ctatgtcttt + 14221 ttgctaacca tttttgaact ctttggtcaa ttcagtatgt ggataccagc tcgagaattt + 14281 attggtagac ctcattttga catagaatat gctagacatc atttgaaacc agtcatatta + 14341 ttgttccttc cgcaagtggc gatttccttg tatgttacgc tagatcgtac tatgcttgga + 14401 gcgttagctt ctacaaaaga tgtagggatt tatgaccagg ctttaaagtt 
ggtaaatatc + 14461 cttctgacct tggtaacttc cttgggaagc gttatgttac ctcgagtcgc tcatttgtta + 14521 gcgacagatg atcataaggc agtcaatagg atgcatgaaa tgtctttctt catttataat + 14581 ttagtgattt ttccaatgat ggcaggaatc ttgattgtca atgatgattt tgttcagttt + 14641 ttccttggtc aagattttca agatgcgcgt tatgcaatcg ccattatgat cttccgtatg + 14701 ttctttatcg gttggaccaa tatcatggga attcagatgc tgatacctca taatcaaaat + 14761 aaagaattca tgatttcaac aacagctccc gcaattatca gtgtaggttt gaacttacta + 14821 ttccttccta aactgggata tatcggggca gccattgtct ctgttttaac agaggcactt + 14881 gtatgggcaa tccaattatt ctatactcgc agatatttaa aagaagttcc tataatcgga + 14941 tcaatgtcaa aaattatact agcatctgcc attatgtatg gccttttact aagttcaaaa + 15001 acagttatac atttttcacc gaccttaaat gttctagcat ttgcagcgct tggtggaatc + 15061 atttatcttt ttgcaattct atctctgaaa gtggtagatg tgaaagaatt aaaacaaatt + 15121 attaggaaaa actaaaatga gaaaaattcg aaatatcaac ctagatttac taaaagtgct + 15181 tgcatgtgtt ggagttgttt tacttcatac aacaatgggc ggatttaaag agacaggctc + 15241 atggaatctt ttggcatatt tatattattt aggtacttac tctattcccc tgttttttat + 15301 gatcaatggt tatttattgt taggcaagag ggaaataact tatctttaca tactccagaa + 15361 agtaaaatgg attttaataa cagtgtcatc atggacattt atcgtatggt ttttttatcg + 15421 tgattttaca actaatccta ttaaaaaaat tgtaggttct ttgatacaaa gaggttattt + 15481 ctctcagttt tggtttttcg gtgcactaat acttatctat ttatgtctgc caattgtgag + 15541 acaatttcta aattcaaaaa gaagctattt atacagttta tctttattga tgactattgg + 15601 tttgattttt gagttattaa atatcctact tcagatgcca atacaaacat atgtaataca + 15661 gacttttaga ttatggacgt ggttttttta ctatctttta ggtggttata tagcgcaatt + 15721 cactaaagaa gaaatcgaat caagatttaa gaattggatg aaaatagcta gcatactttt + 15781 gttattgatt tcaccaataa tattattttt catagcaaag accacttacc ataatttttt + 15841 tgctgaatat ttttatgata ttttattagt aaaagttgta agcgtaggga tttttctaac + 15901 tattttctca cttgtattga atgaaaatag caacaaatgg attatttttc tttctaatca + 15961 aactatgggt atctttataa tacacactta tattatgaag gtatgggaaa aactatttgg + 16021 ttttagtttt ataggttcat atttactttt tgctatattt actttaagtg 
ttagttttat + 16081 cattgttgga atgttaatga aaattccgta ttttaatcga atcgtcaaat tataaaaagg + 16141 agaaaaaatg tacgattatc ttgttgttgg tgctggtctc tttggtgcag tctttgccca + 16201 tgaagcagcc ttaaaaggaa aaaaagtaaa agttattgaa aaacgaaatc atatcgcggg + 16261 taatatctat actcgtgaag aggaaggaat tcaagttcat caatatggtg ctcatatctt + 16321 ccatacttct gataaggaga tctgggatta tgtaaatcag tttgcagagt ttaaccgtta + 16381 taccaattct cctgttgcaa actataaggg tgagatttat aaccttcctt ttaatatgaa + 16441 tactttcaat aaactctggg gagttgtaac gccagcagaa gcacaagcta agattgagga + 16501 acaacgtgct attttaaatg gtaaaactcc tgaaaatttg gaagaacagg cgatttctct + 16561 tgtaggtaca gacatctacg aaaaattaat caaagactat acagagaaac agtggggcaa + 16621 accaactact gaacttccat cctttattat tcgccgtttg ccagtacgcc tgacctatga + 16681 taacaactat tttaacgata cctatcaagg gattccaatt ggtggataca ctcaaatagt + 16741 tgaaaaaatg ttggatcatg aaaatattga tgtagaaaca aatgttgatt tctttgtgaa + 16801 taaagagcaa tatctgaaag attttcctaa gattgtcttt actggtatga ttgatgaatt + 16861 ctttgactat aagttgggcg aactagagta ccgtagtctt cgttttgaaa atgagacctt + 16921 ggatatggaa aattaccaag gaaatgcagt tgtgaactat acggatgcag aaactccata + 16981 tactcgcatt attgaacaca aacattttga gtttgggagt caagcaaaga ctatcattac + 17041 taaagaacat tctaaaacat gggaaaaagg tgatgagcct tattatccag ttaataatga + 17101 tcgtaataat catttgtata aatcatataa aaaacttgct gatgagcaag ggaatgttat + 17161 ctttggtggc cgcttaggac actatcgtta ttacgatatg caccaagtaa ttggagtagc + 17221 tttgcagtgc gtgagaaatg agttaaatta atactcaatg aaaattaaag agcaaactag + 17281 gaagctagcc acaggttgct caaaacactg ttttgaggtt gcagatggac gctgacgcgg + 17341 tttgaagaga ttttcgaaga gtataaacaa gtaaaactga ctaccagtta ttatttagaa + 17401 atagtattaa aaattccggc tctttgtcaa ctgtagtggg ttgaaaaaaa gctaagcttg + 17461 agaaaggaca aatttcgtcc tttctttttt gatgttcaga gcgataaaaa tccgtttttt + 17521 gaagttttca aagtttcgaa aaccaaaggc attgcgtttg ataagtttga tgagattatt + 17581 ggtcgcttcc aatttggcgt ttgaataggg tagttgaagg gcgttgacga ttttctcttt + 17641 gttctttaga aaggttttaa agacagtctg aaaaatagga tgaacctgct 
tcagattgtc + 17701 ctcaatgagt ccgaaaaatt tctcagggtc tttgttctga aagtgaaaaa gtaagagttg + 17761 atagatctga tagtggtgtt tcaagtcttc tgaatagctt aaaatcttgt caagaatttc + 17821 tttatttgtt aagtgcatgc gaaaagtagg gcgataaaaa cgtttatcgc tcaatttacg + 17881 actatcctgt tggatgagtt tccagtaacg cttgatagcc ttgtattcat gagattttcg + 17941 ttcaaactga ttcataattt gaacacgaaa acgactcatg gcacggctga gatgttggat + 18001 aatatggaaa cgatctagaa cgattttagc acacggaaaa agctgtttag ccaagtcata + 18061 gtaaggacta aacatatcca tcgtaatgat tttcacttga caacgaacgg ctctatcgta + 18121 gcgaagaaag tgatttcgga tgacagcttg tgttctgcct tcaagaacag tgataatatt + 18181 aagattatca aaatcttgcg caatgaaact catctttccc ttagtgaagg catactcatc + 18241 ccaagacata atctttggaa gccgagaaaa atcatgctca aagtgaaagt cattgagctt + 18301 gcgaatgaca gttgaagttg aaatggccag ctgatgggca atatcagtca tagaaatttt + 18361 ttcaattaac ttttgagcaa ttttttggtt gatgatacga gggatttggt gatttttctt + 18421 taccagggga gtctcagcaa ccatcatttt tgaagagtga tagcacttga aacggcgttt + 18481 tctaaggaga attctagaag gcataccagt tgtttcgagg taagggatct tagacggttt + 18541 ttgaaagtca tatttcttca ttagacttcc acaatcaggg caagatgggg cgtcgtagtc + 18601 cagtttggcg atgatttctt tgtgtgaatc cctattgacg acatctataa tttggatatt + 18661 tgtgtctttg atatcgagta gttttgtgat aaaatgtaat tgtcccatat gaatctttct + 18721 aatgagttgt ttgatcgctt ttcattatag atcttatggg actttttttc tacaataaaa + 18781 taggctccat aatatctata gtggatttac ccactacaaa tattatagag ccaaaattcc + 18841 ttgactatgt gatatagttg agggattttt aaatgatatt catatttttt gcaaagatgt + 18901 tgtttgaaaa ataattttca aaaattctga aaattctgtt gacaactttc tgaaaagagt + 18961 ctataatgga gagaaagttt taaaggagaa aatgatgaaa agttcaaaac tacttgccct + 19021 tgcgggcgtg acattattg +// + diff --git a/public/res/serotype_genbank/serotype_33C.gb b/public/res/serotype_genbank/serotype_33C.gb new file mode 100644 index 0000000..75e3e53 --- /dev/null +++ b/public/res/serotype_genbank/serotype_33C.gb @@ -0,0 +1,725 @@ +LOCUS CR931700 15918 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 
7098/41 (serotype 33c). +ACCESSION CR931700 +VERSION CR931700.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 15918) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 15918) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..15918 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="7098/41" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC33C_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC33C_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI34204.1" + /db_xref="UniProtKB/TrEMBL:Q4JZI8" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVELL" + gene 293..445 + /gene="aliB" + /locus_tag="SPC33C_0002" + /pseudo + CDS 293..445 + /gene="aliB" + /locus_tag="SPC33C_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + /db_xref="PSEUDO:CAI34205.1" + gene complement(459..980) + /gene="tnp" + /locus_tag="SPC33C_0003" + /pseudo + CDS complement(459..980) + /gene="tnp" + /locus_tag="SPC33C_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase (fragment)" + gene 1205..2650 + /gene="wzg" + /locus_tag="SPC33C_0004" + CDS 1205..2650 + /gene="wzg" + /locus_tag="SPC33C_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI34207.1" + /db_xref="GOA:Q4JZM0" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4JZM0" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLLFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGIDVYNDQ + EFTAHTNGKYYPAGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIINSLQDSIQTNMPLETMISLVNAQLESGGNYKVNSQDLKGTGRTDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1205..1321 + /gene="wzg" + /locus_tag="SPC33C_0004" + /note="Signal peptide 
predicted for SPC1570 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 39 and 40" + misc_feature 1409..1756 + /gene="wzg" + /locus_tag="SPC33C_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 8.6e-63" + misc_feature 1934..2377 + /gene="wzg" + /locus_tag="SPC33C_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 2.5e-69" + gene 2652..3383 + /gene="wzh" + /locus_tag="SPC33C_0005" + CDS 2652..3383 + /gene="wzh" + /locus_tag="SPC33C_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34208.1" + /db_xref="GOA:O86886" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:O86886" + /translation="MIDIHSHIVFDVDDGPKSREESKALLTESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDRGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEQDLVHIIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 2655..3263 + /gene="wzh" + /locus_tag="SPC33C_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 4.6e-36" + gene 3389..4084 + /gene="wzd" + /locus_tag="SPC33C_0006" + CDS 3389..4084 + /gene="wzd" + /locus_tag="SPC33C_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34209.1" + /db_xref="GOA:Q4JZL8" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4JZL8" + /translation="MMKEQNTIEIDVFQLFKTLWKRKLMILIVALVTGAGAFAYSTFI + VKPEYTSTTRIYVVNRNQGDKPGLTNQDLQAGSYLVKDYREIILSQDALEKVATNLKL + DIPAKTLASKVQVTVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIEVLDTRVKRPEDVEDVLKI + PLLGLVPDFDKIK" + misc_feature 3389..3505 + /gene="wzd" + 
/locus_tag="SPC33C_0006" + /note="Signal peptide predicted for SPC1572 by SignalP 2.0 + HMM (Signal peptide probability 0.625) with cleavage site + probability 0.411 between residues 39 and 40" + misc_feature 3410..3826 + /gene="wzd" + /locus_tag="SPC33C_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 8.7e-55" + misc_feature 3932..4009 + /gene="wzd" + /locus_tag="SPC33C_0006" + /note="PS00217 Sugar transport proteins signature 2." + gene 4094..4777 + /gene="wze" + /locus_tag="SPC33C_0007" + CDS 4094..4777 + /gene="wze" + /locus_tag="SPC33C_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34210.1" + /db_xref="GOA:Q4JZL7" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4JZL7" + /translation="MPTLEISHAKLDSVKKAEEYYNALCTNLQLSGDGLKVFSITSVK + IGEGKSTTSANIAWAFARAGYKTLLIDGDIRNSVMLGVFKARNKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSENFTTMLETLRKYFDYIIVDTAPIGVVI + DAAIITRNCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGIVLNKFDTSVDKYGSY + GGYGNYGNK" + gene 4831..5466 + /gene="wcjG" + /locus_tag="SPC33C_0008" + CDS 4831..5466 + /gene="wcjG" + /locus_tag="SPC33C_0008" + /note="member of homology group 50" + /codon_start=1 + /transl_table=11 + /product="putative initial sugar transferase" + /protein_id="CAI34211.1" + /db_xref="GOA:Q4JZL6" + /db_xref="InterPro:IPR003362" + /db_xref="UniProtKB/TrEMBL:Q4JZL6" + /translation="MKQNGIIYICFKRVMDVFIGLFGTIFIVLPSSLIIYIIYKIKGY + KGSIFFTQYRVGLKGKKFKIIKFRSMVENAEEVLAANKALYEKYINNSYKLPPNEDPR + LTNIGDFIRKTSIDEIPQFINLMLGDMSLIGPRPILENELEEYSKEEQPVLLSVRPGI + TGMWQVSGRSEVYYPERCEMELYYPRNQSFLLDVKIFFLTIKKVLSGEGAH" + misc_feature 4864..5463 + /gene="wcjG" + /locus_tag="SPC33C_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 1.3e-56" + gene 5638..6582 + /gene="wciN" + /locus_tag="SPC33C_0009" + CDS 5638..6582 + /gene="wciN" + /locus_tag="SPC33C_0009" + 
/note="member of homology group 62" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34212.1" + /db_xref="GOA:Q4JZL5" + /db_xref="InterPro:IPR002495" + /db_xref="UniProtKB/TrEMBL:Q4JZL5" + /translation="MDIVYATDNNFIEVLYASISSLYETNASLYLNIWIIADKVSAKN + KERINELASKNNQNTINWIENIEIPFKLKLDRGSISSYSRLFLGEVLPKKVKKVLYLD + CDIIIMDSLSGLFDEEFDGKIIQGVSDVLNKDYKKVLNIPVSAPVFNAGVLYIDLEKW + REERIEEKLIYIINKFKGAVIQGDEGVLNAVLFNSYKELSPRYNYMTIFEDMSYEDMI + TFKQPVNYYSKEVLEEAGKHIIIRHFTTCFLSLRPWQESSEVAHVEIFKKYYRGTYKQ + VSPSKLLSIYKILPKKMSLHLLGFIQSKIRPKLYRILK" + misc_feature 5641..6411 + /gene="wciN" + /locus_tag="SPC33C_0009" + /note="HMMPfam hit to PF01501, Glycosyl transferase + family, score 4.3e-57" + gene 6597..7394 + /gene="wcrO" + /locus_tag="SPC33C_0010" + CDS 6597..7394 + /gene="wcrO" + /locus_tag="SPC33C_0010" + /note="member of homology group 46" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="CAI34213.1" + /db_xref="GOA:Q4JZL4" + /db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4JZL4" + /translation="MKKKEKILLKIQEEELKLLKEFIRICSQNKIRYFALGGSLLGAV + RHKGFIPWDDDMDLGIPRNDFDKFTNGIDFNKYNKNYILENSEVNLGVFQYKLKSGVQ + VFGEKYEVCLDIFPLDGVPVNRFKKLYFERKILFYRMLYKFSVIDQVVDKDRGTFENL + LFKIAKFLKLNKFISTSLMNCKLKRLIKSYDYSSSRYVGNILGRYRSKEIVEKDFFGE + GVLLPFEDIYINCPVNYDCYLKNIYCDYMQLPPVKDRIPHFEELKNQ" + misc_feature 6672..7328 + /gene="wcrO" + /locus_tag="SPC33C_0010" + /note="HMMPfam hit to PF04991, LICD Protein Family, score + 7.2e-33" + gene 7391..8482 + /gene="wcrC" + /locus_tag="SPC33C_0011" + CDS 7391..8482 + /gene="wcrC" + /locus_tag="SPC33C_0011" + /note="member of homology group 24" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34214.1" + /db_xref="GOA:Q4JZL3" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4JZL3" + /translation="MKKIGIVRWQMHTAGGGEKVAINLASELSQKYEVHLVSMFSNAE + 
VFFSLNNSFRFINLFSKKLSMSKNFLEAVKKLRTYIIEHDIDIVLGIGVSMNCIGTAS + TLGMKAKFVSCDHTNSIVDLDTRVKRIQRYVASRFADKIITLTTSDRENYIKKYKLNP + LKIDYIYNWMDPLVVDKLFDRNSKKLITVGRFDKQKGYDLLSKVAIQVLLNNPDWEWD + IYGSGNDQIKQNLITALDKGGVLSRVHFKGNVKGTENIYPGHAIYVMTSRYEGLPLVL + LEAKQYGLPIVSFDCPTGPSEIILDGENGYLIENFDVKQMSQKIIELIRNDELRLRFS + RNAMLDTDKFNKKRIIEQWIELIEEMTGE" + misc_feature 7898..8410 + /gene="wcrC" + /locus_tag="SPC33C_0011" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 8.6e-35" + gene 8484..9488 + /gene="wcrD" + /locus_tag="SPC33C_0012" + CDS 8484..9488 + /gene="wcrD" + /locus_tag="SPC33C_0012" + /note="member of homology group 32" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34215.1" + /db_xref="GOA:Q4JZL2" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JZL2" + /translation="MYDKLVTIIVPMYNIEQYITKCIESFKQVDKKYYADFEVIVVND + GSTDNSLQVVEDLIINSCLNIRVVNKENGGHGSTINVGIRESKGKFFKVIDGDDWIDV + PSFEKLLEELKGIDVDMIITNYTEQHTYNQTEKEIGFSDILDCNKIYEGIPFKRIPMH + ALTYKTSILKESGINISEKTFYVDMEYTLLPLQYVKNYVYIDLNVYQYFLGRKDQSMN + LNVMKQKADHHNRVTKKILDYYEEIRFDKNIEPVVKDVLTYLINKQCQLFIMNNNIEE + ASRLFSYAHKCHYRWKYDHSKKTVSLIYINYRFKNIFNLILKTLINKQQKEWSEMDEY + " + misc_feature 8502..9002 + /gene="wcrD" + /locus_tag="SPC33C_0012" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 1.2e-31" + gene 9478..10440 + /gene="wciF" + /locus_tag="SPC33C_0013" + CDS 9478..10440 + /gene="wciF" + /locus_tag="SPC33C_0013" + /note="member of homology group 25" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34216.1" + /db_xref="GOA:Q4JZL1" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JZL1" + /translation="MNISVVIPVYNVEAYLHYAIESLVNQTHKNFEVLLINDGSTDNS + GKLCDKYAQEYDWIRVFHKENGGLSDARNYGVLKATNEWIFFLDPDDYIEPFTFELLS + LIQEKYQADLISTKVQTTNEYEKFSKKQFNLETAKKVTKEEALELMLQDKVATVSACA + KLYHKSILEKAPFPIGKIYEDFYVVAEHLALANRIVISPYKTYNYYCRPGSIVRSKFT + 
VKRFNFFEAAENNRSIIKEHYNSKELEELLNIKIVQGSFSISSSAAESDVESLLSIRR + KLSSFYWSVFFSPKASFKLKVQYTLFLLFPKQYFKLKNIIKRVD" + misc_feature 9487..9993 + /gene="wciF" + /locus_tag="SPC33C_0013" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 3.3e-39" + gene 10441..11673 + /gene="wzy" + /locus_tag="SPC33C_0014" + CDS 10441..11673 + /gene="wzy" + /locus_tag="SPC33C_0014" + /note="member of homology group 127" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI34217.1" + /db_xref="UniProtKB/TrEMBL:Q4JZL0" + /translation="MAVRKLSLVNILDYVWLTLIILQCYSIYTVKSEPLTLIVPLLIT + TVTLLLFNLLRFTLSLNFIHKFIYMLGLYFTAIVTFFLTNIGANVTILNITKYFILFP + LFFLINSMYMNRKILPALLSKFVNVVVILAMFSLFFWIFGTLLNVVHPTSTVINQWSG + GRLINSYYNLYFETQQMTFFGIHIIRNSGIFAESPIWGLILSIAYVIDLLILKSDKNN + KRNIIILTMLSTISTAGISIIGLAILYKIATNRHKAKLLLFPVTVGLGFSLLLLLTEK + SETVSANLRVDDYNIGFIVWKTSLWIGHGLNNGILAIQSHIPTFIRGVGYSNTLFVIL + AQGGLFLFLIYFSPMILLLFKKKINFDFKFAIILFLILVTTIIFEGTYLFFWILALSY + SYLFFMILDKNSIQNRQL" + gene 11849..13261 + /gene="wzx" + /locus_tag="SPC33C_0015" + CDS 11849..13261 + /gene="wzx" + /locus_tag="SPC33C_0015" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI34218.1" + /db_xref="GOA:Q4JZK9" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4JZK9" + /translation="MKVLKNYAYNLSYQLLVIILPIITTPYVTRVFSSDDLGTYGYFN + SIVTYFILLATLGVANYGTRVISGYRKEIEKNFWGIYSLQLGATVLSLSLYSVFCLTL + PFMQNPVAYILGLSLVSKGLDISWLFQGLEDFRKITVRNITVKLVGVFSIFLFVKSAN + DLYLYVFLLTIFELLGQLSTWLPAREFIGRPHFDLEYAKHHLKPVILLFLPQVAISLY + VTLDRTMLGALASTKDVGIYDQALKLVNILLTLVTSLGSVMLPRVAHLLATGNHKAVN + KMHEMSFLIYNLVIFPMMAGILIVNDDFVSFFLGQNFQDARYAIAIMIFRMFFIGWTN + IMGIQILIPHNQNKEFMISTTVPAIISVGLNLLFLPKLGYIGAAIVSVLTEALVWAIQ + LYFTRRYLKEVPIIGFLTKIILASAIMYGILLGLKTVIHFLPIINVIVFAVLGGIIYL + FAILSLKVVDVKELKQIIKK" + misc_feature 11855..12649 + /gene="wzx" + /locus_tag="SPC33C_0015" + /note="HMMPfam hit to PF01943, Polysaccharide 
biosynthesis + protein, score 1.3e-67" + gene 13261..14373 + /gene="glf" + /locus_tag="SPC33C_0016" + CDS 13261..14373 + /gene="glf" + /locus_tag="SPC33C_0016" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI34219.1" + /db_xref="GOA:Q4JZK8" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR006076" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JZK8" + /translation="MELTMYDYLIVGAGLSGAIFAHEATKRGKKVKVIDKRDHIGGNI + YCENVEGINVHKYGAHIFHTSNKKVWDYVNQFTEFNNYINSPVANYKGSLYNLPFNMN + TFYAMWGTKTPQEVKNKIAQQTANMKDVEPKNLEEQAIKLIGPDIYEKLIKGYTEKQW + GRSATDLPPFIIKRLPVRLTFDNNYFNDRYQGIPIGGYNVIIENMLGDVEVELGVDFF + ANREELEASAEKVVFTGMIDQYFDYKHGELEYRSLRFEHEALDEENYQGNAVVNYTER + EIPYTRIIEHKHFEYGTQPKTVITREYPADWKRGDEPYYPINDERNNAMFAKYQEEAA + KNDKVIFCGRLADYKYYDMHVVIERALEVVLSELGK" + misc_feature 13708..14310 + /gene="glf" + /locus_tag="SPC33C_0016" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 7.9e-136" + gene 14454..15512 + /gene="wcyO" + /locus_tag="SPC33C_0017" + CDS 14454..15512 + /gene="wcyO" + /locus_tag="SPC33C_0017" + /note="member of homology group 80" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI34220.1" + /db_xref="GOA:Q4JZF8" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q4JZF8" + /translation="MKKIKEYDILKIMAIILVVLSHSAYYKISSNYGGMDYQQYLNSH + SAFTLYKILGKFMEIIYYFHMPLFMAISGVFFSIQIKKDRWNKIEKLLTSKFKRLILP + FFVFTLLYSLPLKYISNYYNGVSFWRAITGQFLLLGNSHLWYLYALFIIFIISFYCLR + RDTSIFVYLSLYIIHVLSFLIHITLVSAPLQFLFWFSMGFLFESKRRKYNIFLENHKW + ISLLFFVLFIFLVVLNFLFKSDFKVLSRFFVDLLAILGSLICYNISYFLSNKTKILDS + KLLNLILINGLGIYIFSDTLNYFILSISYFVSDRFMFTSFGIIIIFLIRFVFTLFLGL + VFTLLFKKVFPKYSWLVN" + misc_feature 14463..15494 + /gene="wcyO" + /locus_tag="SPC33C_0017" + /note="HMMPfam hit to PF01757, Acyltransferase family, + score 6.5e-06" + gene 15871..>15918 + /gene="aliA" + 
/locus_tag="SPC33C_0018" + CDS 15871..>15918 + /gene="aliA" + /locus_tag="SPC33C_0018" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34221.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ89" + /translation="MMKSSKLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcgta taaaaacaag + 181 ggaggactgt ataaaagaca gaaatccttt gttttttata accaaggttt ataaactttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga agatgaacat + 301 aaagaagcgt gtccttagtg caggcctgac ttttgcatct gctttgcttt tagctgcttg + 361 cggccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaattac ctgttagact attaagttga taatatagtc aatcgaaaca agaacaagac + 481 aaaagagcct tgtaaaaggt attgcaactt ggtaatacct ttttgaggtg ctttttgata + 541 tgagcccatg ttttctcaat aggattgtac tcaggtgagt agggaggaag aggtaacagt + 601 ttatgcccaa actcctcgca taaaagttct agcttcccca ttctatggaa tcttgcatta + 661 tccataataa taaccgatgg tgtggttaat gttggtaaga gaaacttctg aaaccaagct + 721 tcaaaaaagt cgctcgtcat cgtctcttcg taagtcattg gagcaattaa ctcaccattt + 781 gttagccctg caaccaaaga aatcctctga tatcttcttc cagatacttt gcctcttatt + 841 aactgacctt ttaatgagcg accatattct cgataaaaat aagtatcgaa tcctgtttcg + 901 tcaatctaaa caggtgctag gtgctttaaa ctattaaaat tcttaagaaa taaggctact + 961 ttttctgggt cttgttcata attagattga aactagaata gtacacctct gcttctaaaa + 1021 cattgttaga aatcgatttg actgtcctga ttgatttatc ctgttcttat ttcattttac + 1081 tatatttttg gttcgcggga agtctactaa gatacttaaa gatacagata gtgaaaataa + 1141 aggtgtagac attaccgtaa aaaagtgata taatcgtgta atgttcaatg tataggtgtt + 1201 aatcatgagt agacgtttta aaaaatcacg ttcacagaaa gtgaagcgaa gtgttaatat + 1261 agttttgctg actatttatt tattgttagt ttgtttttta ttgttcttaa tctttaagta + 1321 caatatcctt gcttttagat atcttaatct agtggtaact gcgttagtcc tactagttgc + 1381 cttggtaggg ctactcttga ttatctataa aaaagctgaa aaatttacta tttttctgtt + 1441 gctgttctct atccttgtca 
gctctgtgtc gctctttgca gtacagcagt ttgttggact + 1501 gaccaatcgt ttaaatgcga cttctaatta ctcagaatat tcaatcagtg tcgctgtttt + 1561 agcagatagt gatatcgaaa atgttacgca actgacgagt gtgacagcac cgactgggac + 1621 tgataatgaa aatattcaaa aactactagc tgatatcaag tcaagtcaga ataccgattt + 1681 gacggtcaac cagagttcgt cttacttggc agcttacaag agtttgattg caggggagac + 1741 taaggccatt gtcctaaata gtgtctttga aaatatcatc gagtcagagt atccagacta + 1801 cgcatcgaag ataaaaaaga tttataccaa gggattcact aaaaaagtag aagctcctaa + 1861 gacgtctaag aatcagtctt tcaatatcta tgttagtgga attgacacct atggccctat + 1921 tagttcggtg tcgcgatcag atgtcaatat cctgatgact gtcaatcgag ataccaagaa + 1981 aatcctcttg accacaacgc cacgtgatgc ctatgtacca atcgcagatg gtggaaataa + 2041 tcaaaaagat aaattaaccc atgcgggcat ttatggagtt gattcgtcca ttcacacctt + 2101 agaaaatctc tatggagtgg atatcaatta ctatgtgcga ttgaacttca cttcgttttt + 2161 gaaattgatt gatttgttgg gtggaattga tgtttataat gatcaagaat ttactgccca + 2221 tacgaatgga aagtattacc ctgcaggcaa tgttcatctt gattcagaac aggctctcgg + 2281 ttttgttcgt gagcgctact cactagcaga tggcgatcgt gaccgcgggc gcaatcaaca + 2341 aaaggtgatt gtggctatcc ttcaaaaatt aacgtcaacc gaagcactga aaaattatag + 2401 cacgatcatt aatagcttgc aagattctat ccaaacaaat atgccacttg agactatgat + 2461 aagtttggtc aatgctcagt tagaaagtgg agggaattat aaagtaaatt ctcaagattt + 2521 aaaaggtaca ggtcggacgg atcttccttc ttatgcaatg ccagacagta acctctatgt + 2581 gatggaaata gatgatagta gtttagctgt agttaaagca gctatacagg atgtgatgga + 2641 gggtagatga aatgatagac atccattcgc atatcgtttt tgatgtagat gacggtccca + 2701 agtcaagaga ggaaagcaag gctctcttga cagaatccta caggcagggg gtgcgaacca + 2761 ttgtctctac ctctcaccgt cgcaagggca tgtttgaaac tccggaagag aagatagcag + 2821 aaaactttct tcaggttcgg gaaatagcta aggaagtggc gagtgacttg gtcattgctt + 2881 acggggctga aatttactac acaccagatg ttctggataa gctggaaaaa aagcggattc + 2941 cgaccctcaa tgatagtcgt tatgccttga tagagttcag tatgaacact ccttatcgcg + 3001 atattcatag cgccttgagc aagatcttga tgttgggaat tactccagtc attgcccaca + 3061 ttgagcgcta tgatgctctt gaaaataatg aaaaacgcgt 
tcgagaactg attgataggg + 3121 gctgttacac gcaagtaaat agttcacatg tcctcaaacc caaacttttt ggcgaacgtt + 3181 ataaattcat gaaaaaaaga gctcagtatt ttttagagca ggatttggtt catatcattg + 3241 caagtgatat gcacaatcta gacggtagac ctcctcatat ggcagaagca tatgaccttg + 3301 ttacccaaaa atacggagaa gcgaaggctc aggaactttt tatagacaat cctcgaaaaa + 3361 ttgtaatgga tcaactaatt taggagaaat gatgaaagaa caaaacacga tagaaatcga + 3421 tgtatttcaa ttatttaaaa ccttgtggaa acgcaagcta atgattttaa tagtggcact + 3481 tgtgacaggt gcgggggctt ttgcatatag cacttttatt gttaagccag aatatacgag + 3541 taccacgcga atttacgtag tgaatcgcaa tcaaggagac aagccggggc tgacaaatca + 3601 ggatttgcag gcaggatctt atctggtaaa agactaccgt gagattatcc tttcgcagga + 3661 tgcattggaa aaagtagcga caaatttgaa gttggatata ccagcaaaaa cgttagccag + 3721 caaagttcaa gtgactgtac cagctgacac tcgtatcgtc tcaatctctg tcaaggataa + 3781 acagccagag gaagccagtc gtatcgctaa ttctctacga gaagttgctg cagaaaagat + 3841 cgtcgctgta acgcgagtat ctgatgtaac gacacttgaa gaagcgcgac cagctacgac + 3901 tccttcttct ccaaatgttc gacgcaattc cttgtttggt tttcttggag gagcagtcgt + 3961 aacagtaatt gctgttcttt tgattgaggt gctggacacc cgtgtgaaac gtcctgaaga + 4021 tgttgaagat gtactgaaaa ttccactttt agggctcgtt ccagattttg acaaaataaa + 4081 ataggaggaa gttatgccaa cattagaaat ctcacatgca aaattggatt ctgtaaaaaa + 4141 ggcagaggaa tattataacg ctttgtgcac gaacctacag ttaagtggag atggtttgaa + 4201 agtattttct atcacttctg tgaaaatagg agaaggaaaa tcaacgactt ccgccaatat + 4261 cgcttgggct tttgcgcgtg caggttacaa aacgctgctg attgatggag atattcgcaa + 4321 ttctgttatg ttaggtgtct ttaaagcaag gaataagatt acaggcctga cagaattttt + 4381 atcaggaact acagacctat cacaagggct ttgtgatacc aatatcgaaa atctctttgt + 4441 aattcaggct ggctctgtgt caccgaatcc gacagctctt cttcaaagtg agaatttcac + 4501 tacaatgctt gaaaccttgc gtaaatattt tgactacatc attgtagata ctgctcctat + 4561 tggtgtcgtg attgatgcgg ctattattac gcgaaactgc gatgcttcta ttttagtgac + 4621 ggaggcaggt gaaataaatc gacgggatat tcaaaaagca aaagaacagt tggaacacac + 4681 agggaagccg tttttgggaa ttgtgttgaa taaattcgat acttcagtag acaaatacgg + 4741 
ttcttatggg ggctatggga actatggaaa taaatagtct tgtagtacca agattatttg + 4801 agatgattat tatgggaggg ggagtttaag gtgaaacaga atggcatcat ttatatttgc + 4861 tttaaaagag ttatggatgt ttttattggc ttatttggaa caatattcat agtcttgcct + 4921 agttctttaa taatttatat tatctataaa ataaaaggtt acaaaggaag tatattcttc + 4981 acacaatata gagtggggct aaaggggaaa aaatttaaaa ttattaaatt tagatcaatg + 5041 gttgaaaatg ctgaagaagt tttggccgca aataaggcac tctatgaaaa atatataaat + 5101 aacagttata aattacctcc aaatgaggat cctcgtctta ccaatatcgg agattttata + 5161 agaaaaacga gtattgatga aattcctcaa tttataaatt taatgttagg tgatatgagt + 5221 cttattggac ctagaccgat tttggagaat gagttagagg agtattctaa ggaagaacag + 5281 ccagttttac tatctgtacg accaggtatt acggggatgt ggcaagtttc tggtaggagt + 5341 gaggtatatt atcctgaacg ctgtgaaatg gagctgtatt accctcgaaa ccaatccttt + 5401 ttgttggatg ttaaaatctt ctttttgaca ataaaaaaag ttctgtctgg agaaggggct + 5461 cattaaaggt gaaaggctaa aaatagccaa aaagatgaag cgaagtgaat ggttatctcc + 5521 tgtaaagaat agaacagagt tggggaagag gatttataag gttatattac tattaagctg + 5581 aactctaaca tttagttgat tttaaacgga gaattagaag aaaaagtgag gtaaaaaatg + 5641 gatatagtat atgcgacaga caataacttt attgaggtgc tttatgcttc aatttcatct + 5701 ttatatgaaa cgaatgcatc attatatctc aatatttgga ttattgctga caaggtatca + 5761 gctaagaata aagagagaat caatgagtta gctagtaaaa ataatcaaaa cacgataaac + 5821 tggatagaaa atatagaaat accttttaaa ttgaaattag atagaggttc tataagttct + 5881 tatagtagat tatttttagg agaagttctc cccaaaaaag ttaagaaagt actttatctt + 5941 gattgtgata ttattatcat ggatagttta tcaggtttat ttgatgaaga atttgatgga + 6001 aaaataatcc aaggtgtgtc cgatgtttta aataaggatt ataaaaaagt attgaatatt + 6061 cctgttagcg cacctgtatt taacgcaggt gtattatata ttgatttaga gaaatggcgt + 6121 gaagaacgaa tcgaagaaaa gttgatttat ataatcaata aatttaaagg agccgttatt + 6181 caaggtgatg aaggagtttt gaatgctgtt ttgtttaatt cttataaaga attatctcca + 6241 agatacaatt atatgaccat ttttgaggat atgtcttatg aggatatgat cacttttaag + 6301 caacctgtaa actattatag taaggaagtt ttagaagaag caggaaagca tataataatc + 6361 cgccatttta caacgtgttt 
tctatcacta agaccttggc aagaaagtag tgaggtagcg + 6421 catgtggaaa tatttaaaaa atactataga gggacataca aacaagtatc tccatctaag + 6481 ttgttaagta tttataagat tttaccgaaa aaaatgtcac tccatctact aggatttatt + 6541 caatcaaaaa ttagaccaaa gttgtataga attttgaaat aaggtagata ttagcaatga + 6601 agaaaaaaga aaaaatttta ttaaaaattc aagaagaaga attgaaatta ttaaaagagt + 6661 tcataagaat atgttctcaa aataaaatca gatattttgc tctgggaggg agcctgttag + 6721 gagcagtaag gcataaaggt ttcattccgt gggatgatga tatggattta ggaattccaa + 6781 gaaatgattt tgataagttt accaatggaa tagattttaa caaatataat aaaaattata + 6841 ttttagaaaa ttctgaagta aatttaggtg tttttcaata taaattaaaa tcaggtgttc + 6901 aagtatttgg ggaaaaatat gaagtatgtt tagatatatt tccgttagat ggagtaccag + 6961 taaatagatt taaaaaatta tattttgaaa gaaaaattct tttttataga atgctttata + 7021 aattttcagt tatagatcaa gtagttgata aagatagagg aacttttgaa aatttattat + 7081 ttaaaattgc caaatttctc aagcttaata aatttatttc aacttcattg atgaattgca + 7141 aacttaagag attaataaaa tcttatgatt atagtagttc aagatatgta ggtaacattt + 7201 taggtcgtta ccgtagtaaa gaaattgtag aaaaggattt ttttggagag ggagttttat + 7261 taccctttga agatatatat attaattgtc cagtaaatta tgactgttat ttaaaaaata + 7321 tttattgtga ttacatgcag ttaccaccgg ttaaagatag aattccacat tttgaggagc + 7381 tgaaaaatca atgaaaaaaa taggtatagt gagatggcaa atgcatactg ctggtggtgg + 7441 agaaaaagta gcaataaatt tagcaagtga gttgtcacaa aaatatgagg tccatctagt + 7501 gtcaatgttt tcaaatgctg aagttttttt ttcgttgaat aattcttttc gttttataaa + 7561 tttattttca aaaaagctat caatgagtaa gaatttttta gaagccgtga aaaaattgag + 7621 aacatacatt attgaacatg atattgatat cgttttgggc attggagtaa gtatgaattg + 7681 tattggaact gcaagtacat taggaatgaa ggcgaaattt gtttcatgtg atcatacaaa + 7741 ttcgatcgtt gatttagata ctagagtaaa aagaattcaa aggtatgtgg catccagatt + 7801 tgcagataag ataattacac ttactacatc ggatagagag aattatataa aaaaatataa + 7861 attaaatccc ctaaaaatag actatattta taactggatg gatccacttg tagtagataa + 7921 attatttgat agaaactcta agaaacttat tactgttgga cgctttgata aacaaaaagg + 7981 ctatgatttg ttatctaagg tagcaattca agtattatta 
aataatccag attgggaatg + 8041 ggacatatat ggttcgggta atgatcaaat aaaacaaaat ttgatcactg cattggataa + 8101 aggtggtgtt ttatcacgag ttcattttaa agggaatgta aaaggtacag aaaatattta + 8161 tccaggacat gctatttatg taatgacttc tcgttatgaa ggattaccct tagtactttt + 8221 agaggcaaaa caatatggat taccaattgt tagctttgac tgtccaacag gtccatctga + 8281 gataatatta gatggtgaaa atggttattt aattgagaat tttgatgtaa agcaaatgag + 8341 tcaaaaaata atagaattaa ttagaaatga tgaattgaga ttaagatttt cacgaaatgc + 8401 gatgttagat actgataaat ttaataaaaa gagaattatt gaacaatgga ttgaattgat + 8461 agaagaaatg acgggagaat gaaatgtacg ataaattagt gacaatcata gtaccaatgt + 8521 ataatattga acaatatatt actaagtgca tagaatcatt taaacaagta gataaaaaat + 8581 attatgcgga ttttgaagtg attgttgtta atgacggtag tacggataac tcacttcaag + 8641 ttgtagaaga tttaattatt aatagttgtc taaatattag agttgttaat aaagaaaatg + 8701 gtggacatgg gtcaacgatt aatgttggta taagagaatc taaaggaaaa ttttttaaag + 8761 ttattgatgg ggatgattgg attgatgtac caagttttga aaaattatta gaagaactta + 8821 agggtataga tgtcgatatg attattacaa attatacgga acaacatacc tataatcaga + 8881 ctgaaaaaga gattggtttt tccgatatat tagattgtaa taaaatatat gagggaatac + 8941 ctttcaaacg tattccaatg catgctctga catacaaaac atctatattg aaagaatctg + 9001 gaattaatat aagtgaaaaa accttttatg ttgatatgga gtatactttg ttaccgttac + 9061 aatacgtaaa aaattatgtt tatattgatt tgaatgttta ccagtatttc ttaggtagaa + 9121 aagatcagag tatgaattta aatgtgatga aacaaaaagc agaccatcac aatagagtaa + 9181 caaaaaaaat tctcgattat tatgaggaaa ttcgctttga taagaacata gaaccagtag + 9241 tcaaagacgt attgacatac ttaatcaaca agcaatgtca gttgtttata atgaataata + 9301 atatcgagga agcgagccga ttatttagtt atgctcataa atgccattat agatggaaat + 9361 atgatcattc gaaaaaaaca gtctcactaa tttatataaa ttatagattt aaaaatatat + 9421 ttaatctcat cttaaaaacg ctaatcaata agcaacaaaa agaatggagt gagatggatg + 9481 aatattagtg tagttattcc tgtgtataat gttgaggctt accttcatta tgctatagaa + 9541 agtttagtaa atcaaactca taaaaatttt gaggtcttac taatcaatga tggttcaact + 9601 gataactcag gaaaattatg tgataaatac gctcaagaat atgattggat tagagtattt + 9661 
cacaaagaga atggtggctt atctgatgcg cgtaattatg gagtgctaaa agcaactaat + 9721 gagtggatat tctttttgga tccggatgat tacatagagc cttttacatt tgaattattg + 9781 tctcttattc aagagaaata tcaagctgat ttgatatcaa caaaggttca aactacaaat + 9841 gaatatgaaa agtttagcaa gaaacaattt aatttagaaa ctgctaaaaa agttacaaaa + 9901 gaagaagcac ttgagctaat gctccaagat aaagttgcaa cagtatcagc ttgcgcaaaa + 9961 ctatatcata agagtatttt agagaaagcc cccttcccta ttggaaaaat ttatgaggat + 10021 ttttatgttg tcgctgaaca tttagcacta gcaaatagaa ttgtgattag tccttataaa + 10081 acttacaatt actattgtcg accaggaagt attgttcgat ctaagtttac tgtaaagaga + 10141 tttaactttt ttgaagctgc tgaaaataat cgtagtatta ttaaagaaca ttacaattca + 10201 aaagaacttg aagaactttt gaatatcaaa atagttcaag gttccttttc aatttcttca + 10261 tcagctgctg aatcagatgt ggagtcctta ctctcaatta ggagaaaatt gagctcattt + 10321 tattggagtg tttttttctc tccaaaagct tcttttaaat tgaaagtgca atatacgtta + 10381 tttttacttt ttcctaagca atatttcaaa ttgaaaaata taataaagag agtagattaa + 10441 atggcagtta gaaaactatc tttagtaaat atactagatt atgtatggtt aacattaatt + 10501 attttacagt gttattctat atacaccgta aagtctgaac ctcttacttt aatcgtgcca + 10561 ttattaatta caaccgtaac gttgttgtta ttcaatttat tacgttttac tttatcatta + 10621 aattttatac ataaatttat ctatatgtta gggctgtatt ttacagcaat agttacattt + 10681 tttttaacta acattggtgc taatgttact atcttaaata ttacgaagta ctttatattg + 10741 ttccctttat tttttttaat aaatagcatg tatatgaata gaaagattct tccagcatta + 10801 ctttctaaat ttgtaaatgt ggtagtaatt ttagcaatgt tttccttatt tttttggata + 10861 tttgggacac ttctgaatgt tgtacatcct acctcgacag taattaatca gtggtctggt + 10921 ggtcgattaa taaatagcta ctataaccta tattttgaaa cccaacagat gacttttttt + 10981 gggatccata taatacgaaa ttcaggaata tttgctgaat ctcctatttg ggggttaata + 11041 ctaagtatcg cttatgttat tgatttactt attttaaaat ctgataaaaa taataagcgt + 11101 aatataatta ttctaacaat gttaagcacg atttcaacgg caggtataag tattatcggg + 11161 ttagctatat tatataaaat agctacgaat cgtcataagg caaaactttt actattccct + 11221 gtcacagtag gtttaggctt ctctttgtta ctcctattga ctgagaaatc agagacagtt + 11281 
tcagcaaatc ttagagttga tgattataat attggtttta tagtatggaa gacaagtttg + 11341 tggataggac acggattgaa taatggtata ttagcaattc aatcacatat tccaacgttt + 11401 ataagaggtg taggctatag taacacatta tttgttattt tggctcaggg aggattattt + 11461 ctatttctaa tctatttttc tcctatgatc ctattattat ttaagaaaaa aattaatttt + 11521 gattttaaat ttgcgattat cctattttta attttagtaa caacaattat ttttgaggga + 11581 acgtacttat ttttctggat tttagcatta tcttatagct atttgttctt tatgatttta + 11641 gataaaaaca gtattcaaaa tagacaatta taatctataa gttcatattc gaaaaatttt + 11701 tgtattagtg gaaatcaatc tttttaaata aattgcattt cccttattct tctaaattaa + 11761 ttatttttta taattgtagg attattactt ttgcagttga tactataaag taattttttt + 11821 gagatgaatg gaataagata aataaaacat gaaagtacta aaaaactacg cttataatct + 11881 ttcttatcaa ttgttggtga ttatactccc tatcattacg actccctatg tgacacgggt + 11941 cttttcttcg gatgacctag ggacatatgg ttattttaac tccatcgtga cttattttat + 12001 cctcttagca acgctaggag ttgccaacta tgggaccagg gtcatttcag gatataggaa + 12061 agaaattgaa aaaaattttt ggggaattta ttctttgcaa ctaggtgcaa ccgttctttc + 12121 tctatccttg tatagtgttt tttgcctaac tcttcccttt atgcaaaatc ctgtagccta + 12181 cattttaggc ttgagtttgg tttctaaagg attagatata tcatggcttt ttcaagggtt + 12241 ggaggatttt cgtaagatta cggttcgaaa tattacagta aaattagttg gagtgttctc + 12301 catcttcctc tttgtcaaat ctgcaaatga cctctatctc tatgtctttt tacttactat + 12361 atttgaactc ttggggcagc taagtacgtg gttgcctgct cgtgagttta ttggtagacc + 12421 tcattttgat ttagaatatg ctaagcatca tttgaaaccc gttatattat tattccttcc + 12481 tcaagtagct atctctttgt atgttactct agatcgtacc atgcttggag ccttagcttc + 12541 tacaaaagat gtaggaattt atgaccaggc cctaaaatta gtaaatatcc ttctgacctt + 12601 ggtaacttcc ttgggaagcg ttatgttgcc tcgtgtcgcg catttgttag cgacaggtaa + 12661 tcacaaagcg gttaacaaaa tgcatgagat gtccttcctc atttataatc tagtgatttt + 12721 cccaatgatg gcaggaattt taatcgtcaa tgatgatttt gttagctttt tccttgggca + 12781 gaattttcag gatgcacgtt atgcaattgc cattatgatc ttccgtatgt tctttatcgg + 12841 ttggaccaat atcatgggaa ttcagatact gatacctcac aatcaaaata aagaattcat + 12901 
gatttcaaca acagttcccg caattatcag tgtaggtttg aacttactat tccttcctaa + 12961 acttggatat atcggagcag ccattgtttc tgttttgaca gaggcgttgg tatgggcgat + 13021 acaattatac tttacccgta gatacctaaa agaagttccg attatcggat ttttgacaaa + 13081 aattattcta gcttcagcta tcatgtatgg tatcttgcta ggtttaaaaa cagttataca + 13141 ttttttacca atcataaatg ttatagtatt tgcagtgctt ggtggaatca tttatctttt + 13201 tgcaattcta tctttgaaag tggtagatgt aaaagaatta aaacaaatca ttaagaaata + 13261 atggagttaa ctatgtacga ttatcttatc gtcggtgctg gtttgtctgg agcaatcttt + 13321 gcacacgaag ctacaaaacg cggtaaaaaa gtaaaagtga ttgacaagcg tgatcacatc + 13381 ggtggaaata tctactgtga aaatgttgag ggcatcaatg tccacaagta tggtgcccac + 13441 attttccata cttccaataa aaaagtatgg gactatgtta accaattcac tgagtttaac + 13501 aactatatca actcgccagt ggctaactac aaggggagtc tttacaatct tcctttcaat + 13561 atgaatacct tctacgctat gtggggaact aagacaccac aagaagtcaa gaacaagatt + 13621 gcccagcaaa cggctaatat gaaagatgtt gagcccaaga acttggaaga acaagccatc + 13681 aagttgattg gtccagatat ctatgaaaag ttgatcaagg gctatactga aaaacaatgg + 13741 ggacgttctg caacagacct tccgccattt attatcaagc gcctcccagt gcgtttgacc + 13801 tttgataaca actactttaa cgaccgttac caaggtattc caatcggtgg ctataacgtc + 13861 atcattgaaa acatgcttgg cgatgtagaa gtagagcttg gtgttgattt ctttgccaat + 13921 cgtgaagagc tagaagcatc agctgaaaaa gttgtcttta cagggatgat tgaccagtac + 13981 tttgactaca aacacgggga gttagaatac cgtagccttc gttttgaaca tgaagccttg + 14041 gatgaagaaa attatcaagg gaatgctgtg gtcaactata cagaacgtga gattccttat + 14101 actcgtatca ttgagcacaa gcatttcgag tatggtactc aaccaaagac ggttatcact + 14161 cgtgagtatc cagctgattg gaaacgtgga gatgagccat attatccaat caatgatgag + 14221 agaaacaatg ccatgtttgc taagtatcaa gaagaagcag ccaaaaatga caaggttatc + 14281 ttctgtggac gcctagctga ctataaatac tacgacatgc atgtggtcat tgaacgtgcc + 14341 ttagaagtcg tattaagtga gttaggaaag tagtcaatta cattaaggtc aagtttaatg + 14401 accttatatc ttttctataa agaaaaacta caattagagg agcgagattt aatgtgaaaa + 14461 agataaaaga atatgatatt ttaaaaatta tggctattat tttagttgtg ttaagtcata + 14521 
gtgcgtatta taaaatatcg agcaattatg gtggaatgga ttatcaacaa tatttaaata + 14581 gtcattcagc atttactcta tataagatac ttggtaaatt tatggaaatt atctattatt + 14641 ttcatatgcc attatttatg gctatatcgg gtgtattttt ctctattcaa ataaaaaaag + 14701 atcgatggaa taagattgag aaattattaa ctagtaagtt taaaagatta atattgccat + 14761 tttttgtttt tactttatta tatagtttgc cattaaaata tatatcaaac tactacaatg + 14821 gtgtttcatt ttggagagct ataactggtc aattcttgtt attaggaaat tctcacttat + 14881 ggtatttgta tgcattattt attatcttta taattagttt ttattgttta agaagagata + 14941 cttctatatt tgtatacttg tccttatata ttatacatgt actgagtttc ttgattcata + 15001 taacgttagt aagtgcacca ttgcagtttc ttttttggtt ttccatggga tttttgttcg + 15061 aatctaaaag aaggaagtat aatatttttt tggaaaatca caaatggatt agccttttat + 15121 tctttgtgtt atttatattt ttggtggttt taaattttct atttaaaagc gattttaaag + 15181 tattgagtcg attttttgtt gacttattag ctattttagg atcacttatt tgttacaata + 15241 tttcgtactt tttaagtaat aaaactaaaa ttttagatag taaactactt aatctcattt + 15301 tgattaatgg tttagggata tatatttttt ctgatacttt aaactatttt atattaagta + 15361 tttcttattt tgtaagtgat agatttatgt ttacttcatt tggtataatt attatatttt + 15421 taattagatt tgttttcact ttatttttgg gattagtctt tacattgcta tttaaaaaag + 15481 tatttccaaa atattcttgg ttagttaact agaaaataca atatcagtga ttatgcacta + 15541 taagctatcc tgtaattctt acagttaaat attttatctt atatactgag gagacaaata + 15601 aaataactta tagtattttg caccttatct agtttaattg taatataaaa gaaaatatcc + 15661 aggaagtggt atagtactct ctcattgttt aacttcgctt aaatatatag gttaattcct + 15721 tgactatgtg atatagttga gggattttta aatgatattc atattttttg caaagatgtt + 15781 gtttgaaaaa taattttcaa aaattctgaa aattctgttg acaactttct gaaaagagtc + 15841 tataatggag agaaagtttt aaaggagaaa atgatgaaaa gttcaaaact acttgccctt + 15901 gcgggcgtga cattattg +// + diff --git a/public/res/serotype_genbank/serotype_33D.gb b/public/res/serotype_genbank/serotype_33D.gb new file mode 100644 index 0000000..e443c77 --- /dev/null +++ b/public/res/serotype_genbank/serotype_33D.gb @@ -0,0 +1,787 @@ +LOCUS CR931701 17583 bp DNA linear BCT 
26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain CSF/79 (serotype 33d). +ACCESSION CR931701 +VERSION CR931701.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 17583) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 17583) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..17583 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="CSF/79" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC33D_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC33D_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI34222.1" + /db_xref="UniProtKB/TrEMBL:Q4JZI8" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVELL" + gene 293..461 + /gene="aliB" + /locus_tag="SPC33D_0002" + /pseudo + CDS 293..461 + /gene="aliB" + /locus_tag="SPC33D_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(order(462..992,994..1323)) + /gene="tnp" + /locus_tag="SPC33D_0003" + /pseudo + CDS complement(join(462..992,994..1323)) + /gene="tnp" + /locus_tag="SPC33D_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(join(933..992,994..1305)) + /gene="tnp" + /locus_tag="SPC33D_0003" + /note="HMMPfam hit to PF01710, Transposase, score 7.3e-22" + /pseudo + gene 1558..3003 + /gene="wzg" + /locus_tag="SPC33D_0004" + CDS 1558..3003 + /gene="wzg" + /locus_tag="SPC33D_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI34225.1" + /db_xref="GOA:Q4JZK4" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4JZK4" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVGFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + 
EALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRMDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1558..1674 + /gene="wzg" + /locus_tag="SPC33D_0004" + /note="Signal peptide predicted for SPC1588 by SignalP 2.0 + HMM (Signal peptide probability 0.998) with cleavage site + probability 0.539 between residues 39 and 40" + misc_feature 1762..2109 + /gene="wzg" + /locus_tag="SPC33D_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 2.3e-64" + misc_feature 2287..2730 + /gene="wzg" + /locus_tag="SPC33D_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 5.7e-70" + gene 3005..3736 + /gene="wzh" + /locus_tag="SPC33D_0005" + CDS 3005..3736 + /gene="wzh" + /locus_tag="SPC33D_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34226.1" + /db_xref="GOA:Q4JZK3" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4JZK3" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLIIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKSKLFGERYKFMKKRAQYFLEQDLVHVIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIIMDQLI" + misc_feature 3008..3616 + /gene="wzh" + /locus_tag="SPC33D_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 6.2e-37" + gene 3742..4437 + /gene="wzd" + /locus_tag="SPC33D_0006" + CDS 3742..4437 + /gene="wzd" + /locus_tag="SPC33D_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34227.1" + /db_xref="GOA:Q4JZK2" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4JZK2" + /translation="MMKEQNMIEIDVFQLFKTLWKRKLIILIVALVTGAGAFAYSTFI + VKPEYTSTTRIYVVNRDQGDKPGLTNQDLQAGSYLVKDYREIILSQDVLEKVATNLKL + 
DMPAKTLASKVQVTVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIEVLDTRVKRPEDVEDVLKI + PLLGLVPDFDKIK" + misc_feature 3742..3858 + /gene="wzd" + /locus_tag="SPC33D_0006" + /note="Signal peptide predicted for SPC1590 by SignalP 2.0 + HMM (Signal peptide probability 0.649) with cleavage site + probability 0.422 between residues 39 and 40" + misc_feature 3763..4179 + /gene="wzd" + /locus_tag="SPC33D_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 3.5e-56" + misc_feature 4285..4362 + /gene="wzd" + /locus_tag="SPC33D_0006" + /note="PS00217 Sugar transport proteins signature 2." + gene 4447..5136 + /gene="wze" + /locus_tag="SPC33D_0007" + CDS 4447..5136 + /gene="wze" + /locus_tag="SPC33D_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34228.1" + /db_xref="GOA:Q4JZK1" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4JZK1" + /translation="MPTLEISQAKLDSVKKAEEYYNALCTNLQLSGDGLKVFSITSVK + IGEGKSTTSANIAWAFARAGYKTLLIDGDIRNSVMLGVFKARNKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFTTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRNCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGIVLNKFDTSVDKYGSY + GNYGDYGKNKK" + gene 5211..6518 + /gene="wchA" + /locus_tag="SPC33D_0008" + CDS 5211..6518 + /gene="wchA" + /locus_tag="SPC33D_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI34229.1" + /db_xref="GOA:Q4JZK0" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4JZK0" + /translation="MTYLLSAVREAEIVSTTAIALYILHYFVFYISDYGQDFFKRGYL + IELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYFLTLHTLLVYVLNLFIKWYWK + RAYPNFKGSKKILLLTATSRIEKVLDRLIESNEVVGELVAVSVLDKPDFQHDYLKVVA + EGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMGIDVTVNLNAFDRSLARNKQI + 
REMAGLNVVTFSTTFYKTSHVIAKRIIDIVGALVGLILCGLVSIVLVPLIRKDGGSAI + FAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTMQGGMFKVDDDPRITKIGRFI + RKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPEQKRRLSFKPGITGLWQVSGR + SEIKNFDEVVKLDVAYINGWTIWKDIEILLKTVKVVFMRDGAK" + misc_feature 5934..6515 + /gene="wchA" + /locus_tag="SPC33D_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 1.7e-160" + gene 6524..7558 + /gene="wciN" + /locus_tag="SPC33D_0009" + CDS 6524..7558 + /gene="wciN" + /locus_tag="SPC33D_0009" + /note="member of homology group 62" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34230.1" + /db_xref="GOA:Q4JZJ9" + /db_xref="InterPro:IPR002495" + /db_xref="UniProtKB/TrEMBL:Q4JZJ9" + /translation="MCRIFVEVKVSNISHSIFFISENKFRSRNFMNIVYATDNNFVDV + LSASIKSLYTTNSDLDLNLWIIADKVSDRNKEKINRLSKQFAQREINWIENVEIPFKL + HLDRGSISSFSRLFLGSVLPSSMSKVLYLDSDIIVMDSLRSIFDIDFKGKILYGVNDT + FNKEYKQVLGIPIDKPMFNAGVMLINLELWRNNNVEERFLQVIQKFNGTILQGDLGVL + NAVLYNSFGVLPPEYNYMTIFEDLTYEEMIVFKKPINYYSKEEIKNARERIVLRHFTT + SFLSKRPWQESSEVTHVEIFKKYYRGAYKQASPSKLLNIYKILPKKMSLYLLGFIQSK + VRPKLYRITK" + misc_feature 6617..7387 + /gene="wciN" + /locus_tag="SPC33D_0009" + /note="HMMPfam hit to PF01501, Glycosyl transferase + family, score 3.5e-72" + gene 7568..8278 + /gene="wciO" + /locus_tag="SPC33D_0010" + CDS 7568..8278 + /gene="wciO" + /locus_tag="SPC33D_0010" + /note="member of homology group 81" + /codon_start=1 + /transl_table=11 + /product="putative ribitol phophotransferase" + /protein_id="CAI34231.1" + /db_xref="GOA:Q4JZJ8" + /db_xref="InterPro:IPR000462" + /db_xref="UniProtKB/TrEMBL:Q4JZJ8" + /translation="MVSVKSIEQKTMTEEKKREAKKDIFAFYVGRPLSYILTIPFLKT + KMTPNQISILSIVPLIIGTALVTVSSNQFVLLLNWLCFFLWNLLDGVDGNVARFKGIT + SPMGSVIDAMAGYAAMYLSFLTMGIIASDYSQTLFFTQKTYLILGSLSGVFVLFPRLI + MHKAINTVGSKNSEQYKGRKNFGVIEMIALNVTSITGFAQLFMLIAILLKLSDLFTLV + YFLINLLVMVISIKKIVK" + misc_feature 7802..8266 + /gene="wciO" + /locus_tag="SPC33D_0010" + /note="HMMPfam hit to PF01066, CDP-alcohol 
+ phosphatidyltransferase, score 0.0078" + gene 8293..9387 + /gene="wcrC" + /locus_tag="SPC33D_0011" + CDS 8293..9387 + /gene="wcrC" + /locus_tag="SPC33D_0011" + /note="member of homology group 24" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34232.1" + /db_xref="GOA:Q4JZJ7" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4JZJ7" + /translation="MKKIAIVRYNLSKIGGAEKVAINMANEFSQNHKTYLISILLNED + KNINYDISSDVEVESFFYGDLRVRKVIIPAMLKLRKHLIKNEIDVVFSIAPATNIIIF + LATLGLNIKTVFCDHHSLEFQDTFSREIQRYIGAKFFDKIVTLTEEDKNRYRKDFSLR + NEKVTSIYNWMEDINNIPAYTNKSKSIITVGRIEYQKGYDYLAKAIVNVLSKYKDWEW + DIYGSGNEQIKQDLITELDKGGVLSRVHFKGNVNGTENIYPGHSIYVMTSRYEGLPLV + LLEAKQYGLPIVSFKCPTGPSEIVLDEENGYLVDNYDVDYMSRKISDLIENENLRLKF + SDESMKDTEKFSKKKIIKQWEDLIEEMTGE" + misc_feature 8803..9315 + /gene="wcrC" + /locus_tag="SPC33D_0011" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 1.8e-31" + gene 9389..10396 + /gene="wciD" + /locus_tag="SPC33D_0012" + CDS 9389..10396 + /gene="wciD" + /locus_tag="SPC33D_0012" + /note="member of homology group 60" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34233.1" + /db_xref="GOA:Q4JZJ6" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JZJ6" + /translation="MGKKLLTIAVPSYNAEKYLPDTIPTILSAKNVHLIDLLIVNDGS + SDGTGEIAEEFERNYPDIIRVLNKPNGGHGSAVNAGIKNAYGTYFKVVDADDWVDTEN + LDDLIEYLKETDVDEILSPYYRVYVNQAGDVVSIENYNEFSMIQTDKVYQVDAFYEQI + GRTVGMHTMTLKTKLLKENQVELSENMYYVDMEYITYVLPYIETVFLFNKPIYKYRLG + TSTQSISIESYIKNRSMHKQVIFNLIDFYNQTKLGFGRSKAVKNLIINLINQQWNIYF + NLNNVTEAKKELIEFEKSIAIKNKSFLKNSTGLKMNFVRKSRYHLFNIAKYYSNWRVK + S" + misc_feature 9407..9916 + /gene="wciD" + /locus_tag="SPC33D_0012" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 3.8e-29" + gene 10378..11361 + /gene="wciE" + /locus_tag="SPC33D_0013" + CDS 10378..11361 + /gene="wciE" + /locus_tag="SPC33D_0013" + /note="member of homology group 44" + /codon_start=1 + 
/transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34234.1" + /db_xref="GOA:Q4JZJ5" + /db_xref="InterPro:IPR008441" + /db_xref="UniProtKB/TrEMBL:Q4JZJ5" + /translation="MESEILNKIKKMTREYMKLKKIFSTQIANNMLLEKIAARLSRYN + FLHGLVVFIYSKKHKDILDFLKKDFDIFLSTYSYDFEKSNEQNGKKIFSLWLQGYENA + PEIVQKSIQTQKEYAERFGYEYILLDKSNLETFVKIPENIARKFEDGKIDAIKYSDII + RTFLLFKYGGIWFDATIYIKTDSKLSYLDDEFYTIRAKGDETYPKYVADGRWALFCIA + GYRNGIVFDFLRKFQVEYFSKYDLPINYFLIDYLMELGYEYNPIIRKQVDKVITNNQD + LYFLVNNFSNMYRDEDWKKVLETTNIFKCSYKIYVSDKLDTYFYKLKNQTL" + misc_feature 10486..11343 + /gene="wciE" + /locus_tag="SPC33D_0013" + /note="HMMPfam hit to PF05704, Capsular polysaccharide + synthesis protein, score 1.7e-58" + gene 11374..12342 + /gene="wciF" + /locus_tag="SPC33D_0014" + CDS 11374..12342 + /gene="wciF" + /locus_tag="SPC33D_0014" + /note="member of homology group 25" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34235.1" + /db_xref="GOA:Q4JZJ4" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JZJ4" + /translation="MISIIVPVYNVKDYLHYAMESLFRQTYTDFEVILVNDGSTDSSG + ELCNRYAENHENVYVFHKKNGGLSDARNFGVTKASSDWIVFLDPDDYFEVDALELLVK + IQQRYDADLISTKVKSTSTYEDYNSDYMGESVYSNLEVLSKEEALELMLQDKVATVSA + CAKLYHKSILERAPFPIGKVYEDFYVVGEHLALANRIVISPYKTYNYFCRPGSIVRSK + FTVKRFNFFEAAEHNRSIIKKYYNSKNLENVLNIKIVQGSFSIASSAAESDVESLLAI + RKKLSSLYWSVFTSPKASYRLKLKYTLFLLFPKGYYKLKKMIKRVD" + misc_feature 11380..11895 + /gene="wciF" + /locus_tag="SPC33D_0014" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 7.4e-42" + gene 12343..13551 + /gene="wzy" + /locus_tag="SPC33D_0015" + CDS 12343..13551 + /gene="wzy" + /locus_tag="SPC33D_0015" + /note="member of homology group 127" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI34236.1" + /db_xref="UniProtKB/TrEMBL:Q4JZJ3" + /translation="MSVRKLSLIDILDYMWIILIIVQCHSIYTVKSEPLNLIVPFLVT + 
TAMLLLLNLLRFTLSIKYIYMLGLYFIAMATFFLTNIGANVTPLNITKYFIMLPLFFL + INSIYVNKEIFSALLSKFVNVVVILAIFSLFFWIFGTLLNVVHPTSTVINQWSGGQLI + NSYYNLYFETQQMIFFGFRIIRNSGIFAESPIWGLILSIAYVIDFLILKFDKNSKRNI + IILTMLSTISTTGIIIVGLAILYKIMTTSRWMTKLLLLPVTLSLGLSLLLLLAEKSET + VSANLRVDDYNIGFIVWKASLWIGHGLNNGILAIQSHISTFTRNLGYSNTLFVILAQG + GLLLFLIYFSPMILLLFKKNINLDFKFAIILFFILVTTIIFEGTFLFLWILTLSYSYF + SFVTLDKTGT" + misc_feature 13168..13362 + /gene="wzy" + /locus_tag="SPC33D_0015" + /note="HMMPfam hit to PF04932, O-Antigen Polymerase, score + 7.4e-05" + gene 13688..15103 + /gene="wzx" + /locus_tag="SPC33D_0016" + CDS 13688..15103 + /gene="wzx" + /locus_tag="SPC33D_0016" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI34237.1" + /db_xref="GOA:Q4JZJ2" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4JZJ2" + /translation="MKVLKNYAYNLSYQLLVIILPIITTPYVTRVFSSDDLGTYGYFN + SIVTYFILLATLGVANYGTKVISGHRKQIQKNFLGIYSLQLGATVLSLSLYALLCLTL + PFMQNPVAYILGLSLVSKGLDISWLFQGLEDFRKITVRNITVKLVGVSAIFLFVKSAS + DLYLYVFLLTAFELLGQLSMWFPAREYIGKPHFDIEYARHHLKPVILLFLPQIAISLY + VTLDRTMLGALASTKDVGIYDQALKLVNILLTLVTSLGSVMLPRVAHLLATGDHKVVN + KMHEVSFLIYNLVIFPIMAGMLIVNDDFVQFFLGQDFQDARYAISIMIFRMFFIGWTN + IMGIQMLIPYNQNKEFMISTTAPAIISVGLNLLFLPKLGYIGAAIVSVLTEALVWAIQ + LFYTRRYLKEVPIIGSMSKIILASAIMYGLLLSSKTVIHFSPTLNVLAFAALGGIIYL + FAILSLKVVDVKELKQIIRKN" + misc_feature 13694..14488 + /gene="wzx" + /locus_tag="SPC33D_0016" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 4.2e-68" + gene 15105..16103 + /gene="wciG" + /locus_tag="SPC33D_0017" + CDS 15105..16103 + /gene="wciG" + /locus_tag="SPC33D_0017" + /note="member of homology group 21" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI34238.1" + /db_xref="GOA:Q4JZJ1" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q4JZJ1" + /translation="MRKIRNINLDLLKVLACVGVVLLHTTMGGFKETGSWNLLAYLYY + 
LGTYSIPLFFMINGYLLLGKREITYLYILQKVKWILITVSSWTFIVWLFHRDFTTNPI + KKIVGSLIQRGYFSQFWFFGALILIYLCLPIVRQFLNSKRSYLYSLSLLMTIGLIFEL + LNILLQMPIQTYVIQTFRLWTWFFYYLLGGYIAQFTKEEIKSRFKNWMKIASILLLLI + SPIILFFIAKTTYHNFFAEYFYDILLVKVVSVGIFLTIFSLVLNENSNKWIIFLSNQT + MGIFIIHTYIMKVWEKLFGFNFIGSYLLFAIFTLSVSFIIVGMLMKIPYFNRIVKL" + gene 16116..17219 + /gene="glf" + /locus_tag="SPC33D_0018" + CDS 16116..17219 + /gene="glf" + /locus_tag="SPC33D_0018" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI34239.1" + /db_xref="GOA:Q4JZJ0" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JZJ0" + /translation="MYDYLVVGAGLFGAVFAHEAALKGKKVKVIEKRNHIAGNIYTRE + QEGIQVHQYGAHIFHTSDKEIWEYVNQFAEFNRYTNSPVANYKGEIYNLPFNMNTFNK + LWGVVTPAEAQAKIDEQRAILNGKTPENLEEQAISLVGTDIYEKLIKDYTEKQWGKPT + TELPAFIIRRLPVRLTYDNNYFNDTYQGIPIGGYTQIVEKMLDHENIDVETNVDFFVN + KEQYLKDFPKIVFTGMIDEFFDYKLGELEYRSLRFENETLDMENYQGNAVVNYTDAET + PYTRIIEHKHFEFGSQAKTIITKEHSKTWEKGDEPYYPVNNDRNNHLYKSYKKLADEQ + GNVIFGGRLGHYRYYDMHQVIGAALQCVRNELN" + misc_feature 16551..17159 + /gene="glf" + /locus_tag="SPC33D_0018" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 9.6e-115" + gene 17536..>17583 + /gene="aliA" + /locus_tag="SPC33D_0019" + CDS 17536..>17583 + /gene="aliA" + /locus_tag="SPC33D_0019" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34240.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ89" + /translation="MMKSSKLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcata taaaaacaag + 181 ggaggactgt ataaaaagca gaaatccttt gttttttata accaaggttt ataaactttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga agatgaacat + 301 aaagaagcgt gtccttagtg caggcctgac ttttgcatct gctttgcttt tagctgcttg + 
361 cggccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaactat ctattagact attacgctga taatatagtc aattgaaaca agaacaagac + 481 aaaagagcct cataaaaggt attgcaactt ggtaatacct ttttgaggtg ctttttgata + 541 tgaacccatg ttttctcaat aggattgtac tcaggtgaat agggaggaag aggtaaaagt + 601 ttatgcccaa actcttcaca caagagttct agcttcccca ttctatggaa tcttgcatta + 661 tccataataa taaccgatgg tgtggttaat gttggtaaga gaaacttctg aaactaagct + 721 tcaaaaaagt cgctcgtcat cgtctcttcg taagtcattg gagcgattaa ctcaccattt + 781 gttagacctg caaccaaaga aatcctctga tatcttcttc cagatacttt gcctcttatt + 841 aactgacctt ttaatgagcg accatattct cgataaaaat aagtatcgaa tcctgtttcg + 901 tcaatctaaa caggtgctag gtgctttaaa ctattaaaat tcttaagaaa tatggctact + 961 ttttctgggt cttgttcata gtaggtgtgg ttcttttttt cgagtgtagc ccatagcttt + 1021 gagcgcatag tggatggtag ttggatgaca gccaaattca gaagctattt cagtcaaata + 1081 agcatctgga ttgtcagtaa gatagttttt aagtctatct ctatcaactt ttcttggttt + 1141 tgttcctttt acttggtggt ttagctctcc tgttttctct tttagcttta accagccata + 1201 aatggtatta cgtgagattt ggaaaacgtg tgatgcttct gttatactac ctgttcgctc + 1261 acaataagag agaacttttt tacgaaaatc tattgaatat cccataagaa gattatacca + 1321 cattgtgtac tacagtagat tgaaactaga acagtacacc tctacttcta aaacattgtt + 1381 agaaatcgat ttgactgtcc cgatcgattt gtcatcttct tatttcattt tactatattt + 1441 ttggttcgcg ggaagtctac taagatactt aaagatgcag atagtggaaa taaaggtgta + 1501 gacattaccg taaaaaagtg atacaattgt aagatattga atgtataggt attaatcatg + 1561 agtagacgtt ttaaaaaatc acgttcacag aaagtgaagc gaagtgttaa tatagttttg + 1621 ctgactattt atttattgtt agttggtttt ttattgttct taatctttaa gtacaatatc + 1681 cttgctttta gatatcttaa cctagtggta actgcgttag tcctactagt tgccttggta + 1741 gggctactct tgattatcta taaaaaagct gaaaaattta ctatttttct gttggtgttc + 1801 tctatccttg tcagctctgt gtcgctcttt gcagtacagc agtttgttgg actgaccaat + 1861 cgtttaaatg cgacttctaa ttactcagaa tattcaatca gtgtcgctgt tttagcagat + 1921 agtgagatcg aaaatgttac gcaactgacg agtgtgacag caccgactgg gactgataat + 1981 gaaaatattc aaaaactact agctgatatt 
aagtcaagtc agaataccga tttgacggtc + 2041 aaccagagtt cgtcttactt ggcagcttac aagagtttga ttgcagggga gactaaggcc + 2101 attgtcctaa atagtgtctt tgaaaacatc atcgagtcag agtatccaga ctacgcatcg + 2161 aagataaaaa agatttatac caagggattc actaaaaaag tagaagctcc taagacgtct + 2221 aagaatcagt ctttcaatat ctatgttagt ggaattgaca cctatggtcc tattagttcg + 2281 gtgtcgcgat cagatgtcaa tatcctgatg actgtcaatc gagataccaa gaaaatcctc + 2341 ttgaccacaa cgccacgtga tgcctatgta ccaatagcag atggtggaaa taatcaaaaa + 2401 gataaattaa cccatgcagg catttatgga gttgattcgt ccattcacac cttagaaaat + 2461 ctctatggag tggatatcaa ttactatgtg cgattgaact tcacttcttt cttgaaaatg + 2521 attgacttat tgggaggggt agatgttcat aatgatcaag agttttcagc tctacatggg + 2581 aagttccatt tcccagtagg gaatgtccat ctagactctg agcaggctct aggttttgta + 2641 cgtgaacgct actcactagc cgatggagac cgtgatcgcg ggcgcaatca acaaaaggtg + 2701 attgtggcta tccttcaaaa attaacgtca accgaagcac tgaaaaatta tagtacgatc + 2761 attaatagct tgcaagattc tatccaaaca aatatgccac ttgagactat gataaatttg + 2821 gtcaatgctc agttagaaag tggagggaat tataaagtaa attctcaaga tttaaaaggg + 2881 acaggtcgga tggatcttcc ttcttatgca atgccagaca gtaacctcta tgtgatggaa + 2941 atagatgata gtagtttagc tgtagttaaa gcagctatac aggatgtgat ggagggtaga + 3001 tgaaatgata gacatccatt cgcacatcgt ctttgatgta gatgatggtc ccaagtcaag + 3061 agaggaaagc aaggctctct tggcagaatc ctacagacag ggggtgcgaa ccattgtctc + 3121 tacctctcac cgtcgcaagg gcatgtttga aactccggaa gagaagatag cagaaaactt + 3181 tcttcaggtt cgggaaatag ctaaagaagt ggcgagtgac ttgatcattg cttacggggc + 3241 tgaaatttac tacacaccag atgttctgga taagctggaa aaaaagcgga ttccgaccct + 3301 caatgatagt cgttatgcct tgatagagtt tagtatgaac actccttatc gcgatattca + 3361 tagcgccttg agcaagatct tgatgttggg aattactcca gtcattgccc acattgagcg + 3421 ctatgatgct cttgaaaata atgaaaaacg cgttcgagaa ttgatcgata tgggctgtta + 3481 cacgcaagta aatagttcac atgtcctcaa atccaaactt tttggcgaac gttataaatt + 3541 catgaaaaaa agagctcagt attttttaga gcaggatttg gtccatgtca ttgcaagtga + 3601 tatgcacaat ctagacggca gacctcctca tatggcagaa gcatatgacc 
ttgttaccca + 3661 aaaatacgga gaagcgaagg ctcaggaact ttttatagac aatcctcgaa aaattataat + 3721 ggatcaacta atttaggaga aatgatgaaa gaacaaaaca tgatagaaat cgatgtattt + 3781 caattattta aaaccttgtg gaaacgcaag ctaataattt taatagtggc acttgtgaca + 3841 ggtgcggggg cttttgcata tagcactttt attgttaagc cagaatatac gagtaccacg + 3901 cgaatttacg tagtgaatcg cgatcaagga gacaagccgg ggctgacaaa tcaggatttg + 3961 caggcaggat cttatctggt aaaagactac cgtgagatta tcctttcgca ggatgtattg + 4021 gaaaaagtag cgacaaattt gaagttggat atgccagcaa aaacgttagc cagcaaagtt + 4081 caagtgactg taccagctga cactcgtatc gtctcaatct ctgtcaagga taaacagcca + 4141 gaggaagcca gtcgtatcgc taattctcta cgagaagttg ctgcagaaaa gatcgtcgct + 4201 gtaacgcgag tatctgatgt aacgacactt gaagaagcgc gaccagctac gactccttct + 4261 tctccaaatg ttcgacgcaa ttccttgttt ggttttcttg gaggagcagt cgtaacagta + 4321 attgctgttc ttttgattga ggtgctggac acccgtgtga aacgtcctga agatgttgaa + 4381 gatgtactga aaattccact tttagggctc gttccagatt ttgacaaaat aaaataggag + 4441 gaagttatgc caacattaga aatctcacag gcaaaattgg attctgtaaa aaaggcagag + 4501 gaatattata acgctttgtg cacgaaccta cagttaagtg gagatggttt gaaagtattt + 4561 tctatcactt ctgtgaaaat aggagaagga aaatcaacga cttccgccaa tatcgcttgg + 4621 gcttttgcgc gtgcaggtta caaaacgctg ctgattgatg gagatattcg caattctgtt + 4681 atgttaggtg tctttaaagc aaggaataag attacaggcc tgacagaatt tttatcagga + 4741 actacagacc tatcacaagg gctttgtgat accaatatcg aaaatctctt tgtaattcag + 4801 gctggctctg tgtcaccgaa tccgacagct cttcttcaaa gtaagaattt cactacaatg + 4861 cttgaaacct tgcgtaaata ttttgactac atcattgtag atactgctcc tgttggtgtc + 4921 gtgattgatg cggctattat tacgcgaaac tgcgatgctt ctattttagt gacggaggca + 4981 ggtgaaataa atcgacggga tattcaaaaa gcaaaagaac agttggaaca cacagggaag + 5041 ccgtttttgg gaattgtgtt gaataaattc gatacttcag tagacaaata cggttcttat + 5101 ggaaattatg gagattacgg gaaaaataaa aaataggtcg ggggatagag atgaatggaa + 5161 aaatattaag gtcttcattg gtcataatcc agagttttct tgttatttta ttgacttatc + 5221 tacttagtgc tgtgagagaa gcggagattg tttcaacaac agctattgca ctttatatcc + 5281 tccattattt 
tgttttttat atcagtgatt atggacagga tttctttaaa aggggatatt + 5341 tgattgaact tgtccagaca ttgaaatata tcctattctt tgcactagcg attagtattt + 5401 ctaatttttt cttagaggat cgatttagta tttccagacg aggcatgatt tacttcctca + 5461 cattacatac tctcttagtc tatgtgctaa acctatttat caagtggtat tggaagcggg + 5521 cttatcccaa ttttaaagga agtaagaaga ttctcctact tacagcaact tctcgtatcg + 5581 aaaaggtact ggatagatta atagaatcaa atgaggttgt tggggagttg gtagccgtca + 5641 gtgtcttaga taaaccagat tttcagcatg attatttaaa ggtagtagca gagggggaga + 5701 tagtaaactt tgcgactcat gaggtggtcg atgaagtctt tatcaatctt ccaagtgaaa + 5761 aatacaatat tggagagctt gtctctcagt ttgaaacgat gggaattgat gtaacagtca + 5821 atctaaatgc ttttgatcgt agtttggcac gtaacaagca aattcgtgag atggcaggat + 5881 taaacgttgt gactttttct acaacatttt ataagactag tcatgtaatt gctaagcgaa + 5941 ttattgatat cgtgggtgca ttggtagggc tgatattatg tggtttagtc agtattgtac + 6001 tggttccttt gattcgaaag gatgggggct ctgctatttt tgctcagacg cgtataggaa + 6061 aaaatggtcg tcagttcact ttttataagt ttcgctctat gtgtgtagat gccgaggcga + 6121 aaaaaagaga actcatggaa caaaatacca tgcagggtgg aatgtttaag gtggacgatg + 6181 atcctcgtat cacgaaaatt ggtcgtttta tacggaagac tagcttggac gagctaccac + 6241 agttttacaa tgttctaaag ggagatatga gcttggtagg tacacgacca ccaacagtgg + 6301 acgagtatga gcactatacc ccagaacaaa aacgccgact aagctttaaa cctggcataa + 6361 caggtttatg gcaggtcagc ggacgaagtg aaatcaagaa tttcgatgaa gttgtcaaat + 6421 tagatgtggc ctatattaat ggttggacaa tctggaaaga tattgaaatt ttattgaaaa + 6481 cggttaaagt tgtatttatg agagatggag cgaaatagtt tggttgtgta ggatatttgt + 6541 agaggtaaaa gtttcgaata tatctcactc aatctttttt ataagtgaaa ataaatttag + 6601 aagtaggaat tttatgaata tagtttatgc cacagataat aattttgtag atgtattgag + 6661 tgcttccatc aaatcacttt acactactaa ttcagatttg gatttaaatt tatggattat + 6721 tgctgataaa gtttcggata gaaataaaga aaagataaat agattatcaa aacaatttgc + 6781 gcagagagaa attaattgga tagagaacgt tgagatccca tttaaattac atttagatag + 6841 gggatcaatt agttcattta gcagattatt tctgggaagt gttcttccat cttcaatgag + 6901 taaagttctt tatcttgaca gtgatattat 
tgttatggat tctttacgaa gtatttttga + 6961 tattgatttt aagggtaaaa ttctctatgg ggtgaatgat acttttaata aagaatacaa + 7021 gcaggtgttg ggtataccaa ttgacaagcc aatgtttaat gctggagtta tgcttattaa + 7081 tttagagtta tggagaaata ataacgtcga agaaagattt ttgcaagtaa ttcaaaagtt + 7141 taatggtact atattacaag gagatttagg ggttttaaat gcagttttat ataactcatt + 7201 tggtgtactt cctccagaat ataattatat gaccatattt gaagatttga cttatgaaga + 7261 aatgatagtt tttaaaaaac caattaatta ttattcaaaa gaggaaatta aaaatgccag + 7321 agaacgtata gtcttgcgac atttcacaac tagtttttta tcaaaaagac cttggcaaga + 7381 aagtagtgag gtaacgcatg tggaaatatt taaaaaatac tatagaggag catacaaaca + 7441 agcatctcca tctaagttat taaatattta taaaatttta cctaaaaaaa tgtcgctcta + 7501 tctactaggt tttattcaat caaaagtgcg tccaaaactg tatagaatta caaaatagag + 7561 gtataaaatg gtaagtgtta aaagtataga acaaaaaacg atgacggaag aaaagaaaag + 7621 ggaagcaaaa aaagacattt ttgctttcta tgtaggtaga cctctatcat acatattgac + 7681 aattcctttt cttaaaacaa aaatgacacc gaatcagatt tctatattgt ctattgtacc + 7741 tttaattatc ggaacagctt tggtaacagt aagttctaat cagtttgtac tattgctaaa + 7801 ttggctttgt tttttcttat ggaatttact tgacggtgtt gacggaaatg ttgctcgttt + 7861 caagggaatt acctctccta tgggaagtgt tatagatgca atggcaggct atgctgcaat + 7921 gtatttatca ttcctcacga tgggaattat tgcaagtgac tatagtcaaa cactattctt + 7981 tacacaaaaa acatatttaa ttttagggtc actatctggt gtttttgttt tgtttcctag + 8041 attaattatg cacaaagcta taaatactgt aggaagtaag aatagtgagc agtacaaagg + 8101 tagaaaaaat tttggtgtta tagaaatgat tgcacttaat gtaacctcta taacaggatt + 8161 tgctcaattg tttatgctta ttgcaatatt attaaaattg agcgacttat ttacactagt + 8221 ttatttcctc attaatttat tagttatggt gatctctatt aaaaagatag taaaataaga + 8281 ataaggcgag ttatgaaaaa aattgcgata gtaaggtata atttaagtaa aattggtgga + 8341 gctgaaaaag ttgctataaa tatggctaat gaattttctc aaaaccacaa aacatactta + 8401 atttctattt tactaaatga agacaagaac ataaattatg acatatcatc tgatgttgaa + 8461 gttgagtcct ttttttatgg tgatttaaga gttcgtaaag tgataattcc agctatgctg + 8521 aagttaagaa aacacttgat aaagaatgaa attgatgtag tgttttctat 
tgctccggct + 8581 acaaatatta ttatcttttt agcaacgtta ggattaaata taaaaactgt cttttgtgac + 8641 caccatagtt tagagtttca agacactttc agtcgcgaga tacaaagata tattggggca + 8701 aagttttttg acaaaattgt aactttgact gaggaagata aaaatagata tcgaaaagac + 8761 ttttcattaa gaaatgaaaa ggttacttca atctataatt ggatggaaga cattaataac + 8821 attcccgcat atactaataa aagcaagagc attataacag ttggaagaat agaatatcaa + 8881 aaaggatatg actatttagc taaagctatt gttaacgttt tgtcaaaata taaagactgg + 8941 gaatgggaca tatacggttc gggaaacgag caaataaaac aagatctgat tactgaattg + 9001 gataaaggtg gcgttttatc gcgggttcat tttaaaggga atgttaatgg tacagaaaat + 9061 atttatcccg gtcattctat ttatgtaatg acttctcgtt atgaaggtct tcccttagtt + 9121 cttttagaag ctaaacagta tggactaccg attgttagtt ttaaatgtcc aacgggtcca + 9181 tcagaaatag ttttagatga ggaaaatgga tatttagttg ataattacga tgttgattac + 9241 atgagtagaa aaatttctga tttaattgaa aacgagaatt tgagattaaa attttcagat + 9301 gaatcaatga aagatactga aaaatttagc aagaaaaaga ttataaagca gtgggaagac + 9361 ttaattgaag aaatgacagg ggaatagaat gggaaagaaa ttattaacaa tagcagtgcc + 9421 atcatacaat gcggaaaaat atttaccaga tactatacca acaatattat ctgcaaagaa + 9481 tgtacattta attgatttac ttatagtaaa tgatggttcg agtgatggta cgggggaaat + 9541 cgctgaagaa ttcgagcgaa attaccctga tattattcgt gttttaaata aaccaaatgg + 9601 tgggcatgga tcagctgtaa atgcaggtat aaaaaatgct tatggaacgt attttaaggt + 9661 tgttgatgca gatgattggg ttgatacaga aaatttagat gatttgatag aatatttaaa + 9721 agaaacagat gtggatgaaa ttctttcacc gtattatcga gtttatgtta atcaagctgg + 9781 agatgtagta tctattgaaa attataacga attttcgatg attcagacag ataaagtgta + 9841 ccaggtagat gctttctatg aacaaatagg tagaaccgta ggaatgcaca ctatgacatt + 9901 aaaaaccaag ctgttaaaag aaaatcaagt agaattatct gaaaatatgt actatgtaga + 9961 tatggaatat atcacctatg ttctaccata tatagaaacg gtttttcttt ttaataaacc + 10021 gatttataaa taccgtttag gaacatctac gcaaagtatt agtatagaaa gttatataaa + 10081 aaatagatct atgcataaac aagttatttt taatcttatt gatttttaca atcaaacgaa + 10141 acttggattt ggtcgctcca aagcagtaaa gaatctaata ataaatctta taaatcagca + 10201 
gtggaatatc tatttcaatt taaataatgt aactgaagct aaaaaagaat taatagaatt + 10261 tgaaaaatct atagctatta aaaataaaag cttcttgaaa aattctacgg gcttaaagat + 10321 gaattttgtc agaaaaagtc gttaccattt atttaacatt gctaaatatt atagtaattg + 10381 gagagtgaaa tcttgaataa aatcaaaaaa atgacaagag aatacatgaa attgaaaaaa + 10441 attttctcta cccaaattgc aaataatatg ctcttagaaa agatagctgc acgactatca + 10501 agatataatt ttttgcatgg tttagtagta tttatttact ctaaaaaaca taaggatatt + 10561 ttagattttc taaaaaagga ttttgatata tttttatcta cctattctta tgatttcgaa + 10621 aaatctaatg agcaaaatgg aaaaaagatt ttttcattat ggcttcaagg atatgaaaat + 10681 gctccagaaa ttgttcaaaa atccatacaa acccaaaaag aatatgctga aagatttggt + 10741 tatgaataca tattgttaga taagtcaaat ttagagacat ttgttaaaat tcctgaaaat + 10801 attgctagaa aatttgaaga tgggaaaata gatgcaataa aatattcaga tatcattaga + 10861 actttcttgt tatttaaata cggtggtatc tggttcgatg caactattta tataaaaaca + 10921 gattcaaagt taagttattt agatgatgag ttttatacta ttcgtgcgaa gggagatgaa + 10981 acctatccta agtatgttgc ggatggacgt tgggccttgt tttgtatagc tggatatcgt + 11041 aatgggattg tattcgattt tttaagaaaa tttcaagttg aatatttctc taaatatgac + 11101 ttaccaataa attacttttt gatagactat ttaatggagt taggctatga gtataatcca + 11161 ataattcgaa aacaggttga taaggtaatt accaacaacc aagatctcta ttttttagta + 11221 aataattttt ctaatatgta cagggatgag gattggaaaa aagtattaga aacaacaaat + 11281 atttttaaat gtagctataa aatatatgta agcgataaat tggacacata cttttataaa + 11341 ttgaaaaatc aaactctata gtgaggaaat gtaatgattt cgattattgt tccagtatat + 11401 aatgtgaaag actatctaca ttatgcaatg gaaagtttat ttagacaaac atacacagac + 11461 tttgaagtta ttttagttaa tgatggttca acagatagtt ctggtgaatt atgtaatcgg + 11521 tacgctgaaa atcatgagaa tgtttatgtt tttcataaaa aaaatggtgg actttcggat + 11581 gctagaaatt ttggtgtcac gaaggcttct tcggattgga tagtttttct agatccagat + 11641 gactattttg aagtagatgc tttagaacta ttagttaaga ttcagcaaag atatgacgca + 11701 gatttgatat caactaaagt aaaatctact tcgacatatg aagattataa ttctgactat + 11761 atgggagaat ctgtttatag taatcttgaa gtactttcaa aagaggaagc attagaactg + 11821 
atgcttcaag ataaagttgc aacagtatcg gcctgtgcta aactatatca taagagtatt + 11881 ttagaaagag ctcccttccc tattggaaaa gtctatgaag atttttatgt tgttggtgaa + 11941 catttggcat tagcaaatag aattgtaata agtccttata aaacctacaa ttatttttgt + 12001 agaccgggta gtatcgttcg ttctaaattt actgttaaga ggtttaactt ttttgaagct + 12061 gctgaacata atcgtagtat tattaaaaaa tattataatt caaaaaatct tgaaaatgtt + 12121 ttaaatatca aaatagtgca gggttccttt tctattgctt catcagctgc tgaatcagat + 12181 gtagaatcct tactagcaat taggaagaaa ctgtcctcat tgtattggag tgttttcaca + 12241 tcaccaaaag cttcttatag actaaaatta aaatatacgt tatttttact tttccctaaa + 12301 ggatattaca aattaaaaaa aatgataaag agagtggatt aaatgtcagt tagaaaacta + 12361 tctttaatag atatactgga ctatatgtgg ataatattaa ttattgtaca gtgtcattca + 12421 atatatacag taaaatctga acctcttaat ttaattgtgc catttttagt tacaacagca + 12481 atgttgttgt tactcaattt attacgattc actttgtcaa taaaatatat atatatgtta + 12541 gggctatatt ttatagcaat ggctacattt tttttaacta acataggtgc taatgttact + 12601 cccttaaata ttacgaagta ttttataatg cttcctttat tttttttaat aaatagtatt + 12661 tatgtgaata aagaaatttt ttcagcgtta ctatcaaaat ttgtaaacgt agtagtaatt + 12721 ttagcaattt tttccttatt cttttggata tttggaacac ttctgaatgt tgtacaccct + 12781 acctcaacag taattaatca atggtctggt ggtcaattaa taaatagcta ctataatcta + 12841 tattttgaaa ctcaacagat gatttttttt gggttccgta taatacggaa ttcaggaata + 12901 tttgctgaat ctcctatttg ggggctaata ctaagtattg cttatgttat tgattttctt + 12961 attttgaaat ttgataaaaa tagcaagcgt aatataatta ttctaactat gttaagtaca + 13021 atttcaacga caggtattat tattgtcggg ttagctatat tatataaaat aatgactact + 13081 agtcgttgga tgacaaaact cttacttctc cctgtcacat tgagcttagg actctcttta + 13141 ttgctcctat tggctgagaa atcagagaca gtttcagcta atcttagagt tgatgattat + 13201 aatattggtt ttatagtatg gaaggcaagt ttgtggatag gacacggatt gaataatggt + 13261 atattagcaa ttcaatcaca tatctcaacg tttacaagaa atttaggcta tagtaacaca + 13321 ttatttgtta ttttggctca gggaggttta ttattattct tgatttattt ttctccaatg + 13381 atactattat tgtttaagaa aaatatcaat cttgatttta agtttgctat tatcttattc + 13441 
tttatcttag taacaacaat tatttttgaa gggacatttt tatttctctg gattttaaca + 13501 ttatcgtata gctacttttc ctttgtaaca ttagataaaa ctggaacgta aagtagataa + 13561 tatataatgt catatataaa ttttgatatt tgtttaatca acttattctt attattgtga + 13621 cattcttact tttacagttg atgatagaaa caaatctttt aaagcaagtg aaataaatta + 13681 ataaaacatg aaagtactaa aaaattacgc ctacaatctt tcttaccaat tgttggtgat + 13741 tatactccct atcattacga cgccctatgt aacaagggtc ttttcttcgg atgatttagg + 13801 gacgtatggt tattttaatt ccatcgttac ttattttatc ctcttagcga cgctaggagt + 13861 tgctaactat gggaccaagg tcatttcagg gcatcgaaag caaattcaaa aaaacttttt + 13921 gggaatctat tctctgcaat taggtgcaac agttctttct ctgtccttgt atgctcttct + 13981 ttgtctaact cttcccttta tgcaaaatcc ggtagcctat attctaggct tgagtttagt + 14041 ttctaaaggt ttagacatct cctggctctt tcaagggtta gaagattttc gtaaaattac + 14101 ggtcagaaat atcacagtga agcttgttgg tgtaagtgcc attttcttgt ttgtaaaatc + 14161 agcgagtgat ctatacttgt atgtttttct tctaacagca tttgaattgt tgggtcagtt + 14221 aagtatgtgg tttccagccc gtgaatatat tggaaaacca cattttgata tagaatatgc + 14281 taggcatcat ctgaagccag ttatcttgct attcttacca caaattgcta tctcgcttta + 14341 tgtgacttta gatcgtacaa tgttaggggc gctagcttct acaaaagatg tcggcattta + 14401 tgatcaggct ttgaagctgg ttaatatttt actgaccttg gtaacttcct tgggaagtgt + 14461 tatgctgcca cgcgttgcgc atttgttagc gacaggtgat cataaggtag tcaataagat + 14521 gcatgaggta tccttcttaa tttataattt ggttattttt ccgattatgg cagggatgtt + 14581 gattgtgaat gatgattttg ttcaattttt ccttgggcaa gactttcaag atgcacgcta + 14641 tgcaatttcc attatgatct tccgtatgtt ctttatcggt tggaccaata tcatgggaat + 14701 tcagatgctg ataccttata atcaaaataa agaattcatg atttcaacaa cagctcccgc + 14761 aattatcagt gtaggtttga acttactatt ccttcctaaa ctgggatata tcggggcagc + 14821 cattgtctct gttttaacag aggcacttgt atgggcaatc caattattct atactcgcag + 14881 atatttaaaa gaagttccta taatcggatc aatgtcaaaa attatactag catctgccat + 14941 tatgtatggc cttttactaa gttcaaaaac agttatacat ttttcaccga ccttaaatgt + 15001 tctagcattt gcagcgcttg gtggaatcat ttatcttttt gcaattctat ctctgaaagt + 15061 
ggtagatgtg aaagaattaa aacaaattat taggaaaaac taaaatgaga aaaattcgaa + 15121 atatcaacct agatttacta aaagtgcttg catgtgttgg agttgtttta cttcatacaa + 15181 caatgggcgg atttaaagag acaggctcat ggaatctttt ggcatattta tattatttag + 15241 gtacttactc tattcccctg ttttttatga tcaatggtta tttattgtta ggcaagaggg + 15301 aaataactta tctttacata ctccagaaag taaaatggat tttaataaca gtgtcatcat + 15361 ggacatttat cgtatggctt tttcatcgtg attttacaac taatcctatt aaaaaaattg + 15421 taggttcttt gatacaaaga ggttatttct ctcagttttg gtttttcggt gcactaatac + 15481 ttatctattt atgtctgcca attgtgagac aatttctaaa ttcaaaaaga agctatttat + 15541 acagtttatc tttattgatg actattggtt tgatttttga gttattaaat atcctacttc + 15601 agatgccaat acaaacatat gtaatacaga cttttagatt atggacgtgg tttttttact + 15661 atcttttagg tggttatata gcgcaattca ctaaagaaga aatcaaatca agatttaaga + 15721 attggatgaa aatagctagc atacttttgt tattgatttc accaataata ttatttttca + 15781 tagcaaagac cacttaccat aatttttttg ctgaatattt ttatgatatt ttattagtaa + 15841 aagttgtaag cgtagggatt tttctaacta ttttctcact tgtattgaat gaaaatagca + 15901 acaaatggat tatttttctt tctaatcaaa ctatgggtat ctttataata cacacttata + 15961 ttatgaaggt atgggaaaaa ctatttggtt ttaattttat aggttcatat ttactttttg + 16021 ctatatttac tttaagtgtt agttttatca ttgttggaat gttaatgaaa attccgtatt + 16081 ttaatcgaat cgtcaaatta taaaaaggag aaaaaatgta cgattatctt gttgttggtg + 16141 ctggtctctt tggtgcagtc tttgcccatg aagcagcctt aaaaggaaaa aaagtaaaag + 16201 ttattgaaaa acgaaatcat atcgcgggta atatctatac tcgtgaacag gaaggaattc + 16261 aagttcatca atatggtgct catatcttcc atacttctga taaggagatc tgggagtatg + 16321 taaatcagtt tgcagagttt aaccgttata ccaattctcc tgttgcaaac tataagggag + 16381 agatttataa cttacctttt aatatgaata ccttcaataa actctgggga gttgtaacgc + 16441 cagcagaagc acaagctaag attgatgaac aacgtgctat tttaaatggt aaaactcctg + 16501 aaaatttgga agaacaggcg atttctcttg taggtacaga catctacgaa aaattaatca + 16561 aagactatac agagaaacag tggggcaaac caactactga acttccagcc tttattattc + 16621 gccgtttgcc agtacgcctg acctatgata acaactattt taacgatacc tatcaaggga + 16681 
ttccaattgg tggatacact caaatagttg aaaaaatgtt ggatcatgaa aatattgatg + 16741 tagaaacaaa tgttgatttc tttgtgaata aagagcaata tctgaaagat tttcctaaga + 16801 ttgtctttac tggtatgatt gatgaattct ttgactataa gttgggcgaa ctagagtacc + 16861 gtagtcttcg ttttgaaaat gagaccttgg atatggaaaa ttaccaagga aatgcagttg + 16921 tgaactatac ggatgcagaa accccatata ctcgcattat tgaacacaaa cattttgagt + 16981 ttgggagtca agcaaagact atcattacta aagaacattc taaaacatgg gaaaaaggtg + 17041 atgagcctta ttatccagtt aataatgatc gtaataatca tttgtataaa tcatataaaa + 17101 aacttgctga tgagcaaggg aatgttatct ttggtggccg cttaggacac tatcgttatt + 17161 acgatatgca ccaagtaatt ggagcagctt tgcagtgcgt gagaaatgag ttaaattaat + 17221 actcaatgaa aattaaagag caaactagga agctagccac aggttgctca aaacactgtt + 17281 ttgaggttgc agatggaagc tgacgcggtt tgaagagatt ttcgaagagt ataaacaagt + 17341 aaaactgact accagttatt atttagaaat agtattaaaa attccttgac tatgtgatgt + 17401 agttgaggga tttttgataa tattcatatt ttttgcaaag atgttgtttg aaaaataatt + 17461 ttcaaaaatt ctgaaaattc tgttgacaac tttctgaaaa gagtctataa tggagagaaa + 17521 gttttaaagg agaaaatgat gaaaagttca aaactacttg cccttgcggg cgtgacatta + 17581 ttg +// + diff --git a/public/res/serotype_genbank/serotype_33E.gb b/public/res/serotype_genbank/serotype_33E.gb new file mode 100644 index 0000000..2f28de6 --- /dev/null +++ b/public/res/serotype_genbank/serotype_33E.gb @@ -0,0 +1,814 @@ +LOCUS contig_1 18603 bp DNA linear UNK 11-JUN-2024 +DEFINITION contig_1, whole genome shotgun sequence. +ACCESSION contig_1 +VERSION contig_1 +KEYWORDS . +SOURCE None + ORGANISM . + . 
+COMMENT Annotated with Bakta + Software: v1.9.3 + Database: v5.1, full + DOI: 10.1099/mgen.0.000685 + URL: github.com/oschwengers/bakta + + ##Genome Annotation Summary:## + Annotation Date :: 06/11/2024, 01:43:57 + CDSs :: 19 + tRNAs :: 0 + tmRNAs :: 0 + rRNAs :: 0 + ncRNAs :: 0 + regulatory ncRNAs :: 0 + CRISPR Arrays :: 0 + oriCs/oriVs :: 0 + oriTs :: 0 + gaps :: 0 + pseudogenes :: 1 +FEATURES Location/Qualifiers + source 1..18603 + /mol_type="genomic DNA" + gene complement(1..348) + /locus_tag="PKOAIA_00005" + CDS complement(1..348) + /db_xref="SO:0001217" + /db_xref="UniRef:UniRef50_A0A7G1IQ53" + /db_xref="UniRef:UniRef90_A0A0H2ZRF4" + /product="IS630-Spn1, transposase Orf1" + /locus_tag="PKOAIA_00005" + /protein_id="gnl|Bakta|PKOAIA_00005" + /translation="MWYNLPMAYSIDFRKKVLSYCERTGSITEASHVFQISRNTIYGWL + KLKEKTGELNHQVKGTKPRKVDRDRLKNYLTDNPDAYLTEIASEFGCHPTTIHYALKAM + GYTRKKEPHLL" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA + sequence:UniRef:UniRef90_A0A0H2ZRF4" + gene 583..2028 + /locus_tag="PKOAIA_00010" + /gene="wzg" + CDS 583..2028 + /db_xref="BlastRules:WP_000091082" + /db_xref="COG:COG1316" + /db_xref="COG:M" + /db_xref="RefSeq:WP_061647449.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0007652D0D" + /db_xref="UniRef:UniRef100_A0A3G5AX38" + /db_xref="UniRef:UniRef50_G3G7D5" + /db_xref="UniRef:UniRef90_O54604" + /db_xref="UniprotKB:O86885" + /db_xref="UserProtein:wzg" + /product="""integral membrane regulatory protein Wzg""" + /locus_tag="PKOAIA_00010" + /protein_id="gnl|Bakta|PKOAIA_00010" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVGFLLFLIFKYNILAFR + YLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNRLN + ATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLMVNQ + SSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAPKTSK + NQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADGGNNQK + DKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQEFSALH + 
GKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTSTEALKNYS + TIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRMDLPSYAMPDSNLY + VMEIDDSSLAVVKAAIQDVMEGR" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_061647449.1" + /gene="wzg" + gene 2030..2761 + /locus_tag="PKOAIA_00015" + /gene="wzh" + CDS 2030..2761 + /db_xref="BlastRules:WP_000565352" + /db_xref="RefSeq:WP_050096433.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI00005400C7" + /db_xref="UniRef:UniRef100_Q4JZK3" + /db_xref="UniRef:UniRef90_Q9AHD4" + /db_xref="UniprotKB:O86886" + /db_xref="UserProtein:wzh" + /product="""protein-tyrosine phosphatase Wzh""" + /locus_tag="PKOAIA_00015" + /protein_id="gnl|Bakta|PKOAIA_00015" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRRK + GMFETPEEKIAENFLQVREIAKEVASDLIIAYGAEIYYTPDVLDKLEKKRIPTLNDSRY + ALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYTQVN + SSHVLKSKLFGERYKFMKKRAQYFLEQDLVHVIASDMHNLDGRPPHMAEAYDLVTQKYG + EAKAQELFIDNPRKIIMDQLI" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050096433.1" + /gene="wzh" + gene 2770..3462 + /locus_tag="PKOAIA_00020" + /gene="wzd" + CDS 2770..3462 + /db_xref="RefSeq:WP_050096434.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0005E84C14" + /db_xref="UniRef:UniRef100_Q4JZK2" + /db_xref="UniRef:UniRef50_Q54519" + /db_xref="UniRef:UniRef90_A0A139PG18" + /db_xref="UniprotKB:O86887" + /db_xref="UserProtein:wzd" + /product="""capsular polysaccharide biosynthesis protein + Wzd""" + /locus_tag="PKOAIA_00020" + /protein_id="gnl|Bakta|PKOAIA_00020" + /translation="MKEQNMIEIDVFQLFKTLWKRKLIILIVALVTGAGAFAYSTFIVK + PEYTSTTRIYVVNRDQGDKPGLTNQDLQAGSYLVKDYREIILSQDVLEKVATNLKLDMP + AKTLASKVQVTVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDVTTLE + EARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIEVLDTRVKRPEDVEDVLKIPLLGL + VPDFDKIK" + /codon_start=1 + /transl_table=11 + /inference="ab initio 
prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050096434.1" + /gene="wzd" + gene 3472..4161 + /locus_tag="PKOAIA_00025" + /gene="wze" + CDS 3472..4161 + /db_xref="RefSeq:WP_061647448.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0007654C9E" + /db_xref="UniRef:UniRef100_A0A3G5AX80" + /db_xref="UniRef:UniRef50_Q54520" + /db_xref="UniRef:UniRef90_O84996" + /db_xref="UniprotKB:Q4JZK1" + /db_xref="UserProtein:wze" + /product="""tyrosine-protein kinase Wze""" + /locus_tag="PKOAIA_00025" + /protein_id="gnl|Bakta|PKOAIA_00025" + /translation="MPTLEISQAKLDSVKKAEEYYNALCTNLQLSGDGLKVLSITSVKI + GEGKSTTSANIAWAFARAGYKTLLIDGDIRNSVMLGVFKARNKITGLTEFLSGTTDLSQ + GLCDTNIENLFVIQAGSVSPNPTALLQSKNFTTMLETLRKYFDYIIVDTAPVGVVIDAA + IITRNCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGIVLNKFDTSVNKYGSYGNYG + DYGKNKK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_061647448.1" + /gene="wze" + gene 4176..5543 + /locus_tag="PKOAIA_00030" + /gene="wchA" + CDS 4176..5543 + /db_xref="RefSeq:WP_061647447.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI00076569C6" + /db_xref="UniRef:UniRef100_A0A3G5AX28" + /db_xref="UniRef:UniRef50_Q8VU30" + /db_xref="UniRef:UniRef90_Q8VU30" + /db_xref="UniprotKB:O86888" + /db_xref="UserProtein:wchA" + /product="""undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)""" + /locus_tag="PKOAIA_00030" + /protein_id="gnl|Bakta|PKOAIA_00030" + /translation="MNGKILRSSLVIIQSFLVILLTYLLSTVREAEIVSTTAIALYILH + YFVFYISDYGQDFFKRGYLIELLQTLKYILFFALAISISNFFLEDRFSISRRGMIYFLT + LHALLVYVLNLFIKWYWKRAYPNFKGSKKILLLTATSRVEKVLDRLIESNEVVGKLVAV + SVLDKPDFQHDCLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMGIDVT + VNLNAFDRSLARNKQIREMAGLNVVTFSTAFYKTSHVIAKRIIDIVGALVGLILCGLVS + IVLVPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTMQGGMFK + VDDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPEQKRRLSF + KPGITGLWQVSGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVLMKDGAK" + /codon_start=1 + 
/transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_061647447.1" + /gene="wchA" + gene 5530..6336 + /locus_tag="PKOAIA_00035" + /gene="wciB" + CDS 5530..6336 + /db_xref="RefSeq:WP_180681146.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000F6F00E1" + /db_xref="UniRef:UniRef100_A0A3G5AX39" + /db_xref="UniRef:UniRef50_O86889" + /db_xref="UniRef:UniRef90_O86889" + /db_xref="UniprotKB:O86889" + /db_xref="UserProtein:wciB" + /product="""putative glycosyl transferase""" + /locus_tag="PKOAIA_00035" + /protein_id="gnl|Bakta|PKOAIA_00035" + /translation="MERSRLIDVKIIVATHKEVKMPQDNSLYLPIHVGRDGKSDIGFIG + DNTGDNISSLNPYYCELTGLYWAWKNLDYNYLGLVHYRRYFTNKSQGYNENVNMDDVIL + SRANVEILLEKSDIIVPKKRKYYIETLYSHYAHTLNGEHLDLARKIIEQNSSEYLSSFD + KVMKQRSGYMFNMFIMKKELLDDYLPWLFSILDTMYEQMDLTDYTLFESRLFGRVSELL + FNVWLCKKGITPKEVPFMYMERVDLFEKGKSFLMAKFFGKKYGQSF" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_180681146.1" + /gene="wciB" + gene 6340..7380 + /locus_tag="PKOAIA_00040" + /gene="wciC" + CDS 6340..7380 + /db_xref="RefSeq:WP_061647446.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0007654110" + /db_xref="UniRef:UniRef100_A0A3G5AX60" + /db_xref="UniRef:UniRef50_O86890" + /db_xref="UniRef:UniRef90_O86890" + /db_xref="UniprotKB:O86890" + /db_xref="UserProtein:wciC" + /product="""putative galactosyl transferase""" + /locus_tag="PKOAIA_00040" + /protein_id="gnl|Bakta|PKOAIA_00040" + /translation="MKVTIIGQIKNKRTGLGKAINDFRDYCCNRATRVTEIDITNNFNF + LSSLFQILISDTDVYYFTPAGSVAGNIRDSLFLFFMIMKRKKIVTHFHNSAFGNVMRQH + PTLMIINRILYSKVDLIILLGEKSKIMFQQLRILDEKFKIIRNGVDGYLFIEKNELNKK + MSDLPINIIFFSNMIREKGYEILLEVAKKMREDEKYHFYFSGKFQDNNLKTRFINEIYS + MNNVTYLDGVYGSDKKKLLQKMHYFVLPSYYKDETLPISMLEAMANGLYIIVSDVGVVS + EVINKETASLIEMINEETADSIIEIIDQTSNKLNELDFNVSKYKQELLNENIQASIYQQ + LERIAN" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + 
/inference="similar to AA sequence:RefSeq:WP_061647446.1" + /gene="wciC" + gene 7377..8375 + /locus_tag="PKOAIA_00045" + /gene="wciD" + CDS 7377..8375 + /db_xref="RefSeq:WP_061647445.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000765536D" + /db_xref="UniRef:UniRef100_A0A3G5AX27" + /db_xref="UniRef:UniRef50_Q4JZ65" + /db_xref="UniRef:UniRef90_Q4JZ65" + /db_xref="UniprotKB:Q4JZI0" + /db_xref="UserProtein:wciD" + /product="""putative glycosyl transferase""" + /locus_tag="PKOAIA_00045" + /protein_id="gnl|Bakta|PKOAIA_00045" + /translation="MTEKKNTGKILTVVVPSYNAENYLQETMPTILSAKNIERVELLIV + NDGSTDKTEEIARQFEREYEGIVRVISKENGGHGSAVNAGIENAVGNYFKVVDADDWVN + TNNLEDLIVFLSEVDVDQVLSPYDKIFVNYRGDIEREEECNEFSQVENEVIYSAEEFYT + RIKQTVGMHSITVKTSLLQENNIRLSEKMFYVDMEYIVYILPYVKRVVLFDKSIYRYRL + GTETQSVSMASYIKNRDMHKQVIYHLVDFYNQMRSSAVLKRITWKLILNLIRQQWIIYF + NLSKKEGKNSECFEFDNWLIKEGRIKKIPLYFFKAVKYIRFKVKYFLGIRK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_061647445.1" + /gene="wciD" + gene 8377..8652 + /locus_tag="PKOAIA_00050" + CDS 8377..8652 + /product="hypothetical protein" + /locus_tag="PKOAIA_00050" + /protein_id="gnl|Bakta|PKOAIA_00050" + /translation="MRKIGKVINEYFALRKSFTPAIARNKLFEKFWGRIGNYKIFNNIA + SDFYQYKHETIINFLEKDFSQFLKSYNFKEVSHKEIEQRKIFSMWI" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + gene <8674..9345 + /locus_tag="PKOAIA_00055" + /pseudogene="unitary" + CDS <8674..9345 + /note="Internal stop codon at 8650. Nonsense mutation + around 8650. 
Truncated wciE" + /db_xref="SO:0001217" + /db_xref="UniRef:UniRef50_O86892" + /db_xref="UniRef:UniRef90_O86892" + /product="Capp33fI protein" + /locus_tag="PKOAIA_00055" + /pseudogene="unitary" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + gene 9365..10336 + /locus_tag="PKOAIA_00060" + /gene="wciF" + CDS 9365..10336 + /db_xref="RefSeq:WP_061647443.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0007656FDB" + /db_xref="UniRef:UniRef100_A0A3G5AX49" + /db_xref="UniRef:UniRef50_O86893" + /db_xref="UniRef:UniRef90_O86893" + /db_xref="UniprotKB:O86893" + /db_xref="UserProtein:wciF" + /product="""putative glycosyl transferase""" + /locus_tag="PKOAIA_00060" + /protein_id="gnl|Bakta|PKOAIA_00060" + /translation="MISVIVPVYNVADYLRFALDSLLEQTYKDFEIILVNDGSTDNSGE + ICDEYGKLYDNIYVFHKKNGGLSDARNFGLEKSRGEFITFLDSDDYFEPYALELLITIQ + KKYDVDIVSTKGVITYSHDIYSKKLMDEDYLTVKILTNKEFLAAAYYNDEMTVSAWGKL + YKRDLFKTIFPKGKIYEDLYVVAERLLNIKTVAHTDLPIYHYYQRQGSIVNSTFSDRQY + DFFDAIDHNEAIIKKFYCGDKELLAALNAKRVIGSFILSNSAFYNSKNDITKIIRIIKP + YYWEVIKNKKIPMKRKVQCVLFLLSPNYYYKIKDKMLQRGRI" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_061647443.1" + /gene="wciF" + gene 10337..11560 + /locus_tag="PKOAIA_00065" + /gene="wzy" + CDS 10337..11560 + /db_xref="RefSeq:WP_061647442.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0007655091" + /db_xref="UniRef:UniRef100_A0A3G5AXF6" + /db_xref="UniRef:UniRef50_O86894" + /db_xref="UniRef:UniRef90_O86894" + /db_xref="UniprotKB:O86894" + /db_xref="UserProtein:wzy" + /product="""oligosaccharide repeat unit polymerase Wzy""" + /locus_tag="PKOAIA_00065" + /protein_id="gnl|Bakta|PKOAIA_00065" + /translation="MHVRLDGLLDYIFLFSVIITCNTMYSTSQGFDGLGKWATLLLVVS + VILKLLISRISMKAINVIVSRSLIFILIILLIVILNGFKISETSFVYYFVLFPIFMMIL + QMYYDVNEIANLIRKFVRIIFLLAIGSLLFWLIGSVFHIISPTVYVLNYWNGGGIVEGY + YNLHFEAQKIEILGAILIRNTGIFAEAPMWSLVLSLALIFQTLHIKKWNFTTWTLIITI + 
MTTTSTTGVYIIGLIFLYVLFSKTSGVKRYVSSLFILAIICCFSILWDNKSGTGSATIR + FDDYKAGFLAWQKSPIWGLGISDGLRTIEQHMDRTVRYNLGYSNSFFVVLAQGGIMLAS + YYFYPVIKIILNKFSSNDLKFSALLIIFLMITTIFIETYMFLFVISLYYSLDFGDDRDC + HEKQYITN" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_061647442.1" + /gene="wzy" + gene 11591..13006 + /locus_tag="PKOAIA_00070" + /gene="wzx" + CDS 11591..13006 + /db_xref="RefSeq:WP_000698078.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI00000B7DD2" + /db_xref="UniRef:UniRef100_O86895" + /db_xref="UniRef:UniRef50_K8MPI1" + /db_xref="UniRef:UniRef90_O86895" + /db_xref="UniprotKB:O86895" + /db_xref="UserProtein:wzx" + /product="""flippase Wzx""" + /locus_tag="PKOAIA_00070" + /protein_id="gnl|Bakta|PKOAIA_00070" + /translation="MKILKNYAYNLSYQLLVIILPIITTPYVTRVFSSDDLGTYGYFSS + IVTYFTLLATLGVANYGTKEISAHRKEIGKNFWGIYSLQFGATWLSILLYLALCFLFTS + MQNPVAYILGLSLVSKGLDISWLFQGLEDFRKITVRNITVKLVGAISIFLFVKSANDLY + LYVFLLTIFELLGQLSMWLPARQFIGKSYFDWKYAKKHLKPVILLFLPQIAISLYVTLD + RTMLGVLASTKDVGIYDQALKLVNILLTLVTSLGSVMLPRVSSLLSSGDYKAVNKMHEM + SFLIYNLVIFPIIAGMLIVNDDFVRFFLGQNFQDARYAIAIMTFRMFFIGWTNIMGIQI + LIPHNKNKEFMVSTTVPAILSVGLNLLLLPQFGYIGAAIVSVLTEAFVWGIQLFYTRFY + LKEVPIIGSMTKTALASAVMYGLLLGSKTSIHFSPTINVLIFSVLGGIIYLFAILSLKV + VDVKELKQIIRKN" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000698078.1" + /gene="wzx" + gene 13008..14006 + /locus_tag="PKOAIA_00075" + /gene="wefK" + CDS 13008..14006 + /db_xref="RefSeq:WP_061647440.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000765607B" + /db_xref="UniRef:UniRef100_A0A3G5AXE3" + /db_xref="UniRef:UniRef50_K8MVE5" + /db_xref="UniRef:UniRef90_A0A0T7ZMW5" + /product="Repeating unit O-acetyltransferase WefK" + /locus_tag="PKOAIA_00075" + /protein_id="gnl|Bakta|PKOAIA_00075" + /translation="MSKFRNINLDLLKVLACVGVVLLHTTMGGFKETGAWNFLTYLYYL + 
GTYSIPLFFMVNGYLLLGKREITYSYILQKIKWLLITVSSWTFIVWLFKRDFTENLIKK + IIGSLIQKGYFFQFWFFGALILIYICLPVLKNFLNLKRNYLYILSVLLVIGLIFELANI + VFQMPAQTYVIQTFRLWTWFFYYLLGGFIAQFNKDIIRNRFKIWMKVATVLLLLISPLI + LFFLAKTTYHNLFAEYFYDILFVKVVSLGIFLTIFSLALNQDINKWIIFLSNQTMGVFI + IHTYIMKVWEKLFGFSFVGAYLLFAIFTLSISFIIAGMLMKIPYFNRIVKL" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_061647440.1" + /gene="wefK" + gene 14020..15120 + /locus_tag="PKOAIA_00080" + /gene="glf" + CDS 14020..15120 + /db_xref="COG:COG0562" + /db_xref="COG:M" + /db_xref="EC:5.4.99.9" + /db_xref="GO:0008767" + /db_xref="GO:0009273" + /db_xref="RefSeq:WP_061647439.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0007650464" + /db_xref="UniRef:UniRef100_A0A3G5AX90" + /db_xref="UniRef:UniRef50_A0A4S2G265" + /db_xref="UniRef:UniRef90_F8WRM7" + /db_xref="UniprotKB:O86897" + /db_xref="UserProtein:glf" + /product="""UDP-galactopyranose mutase Glf""" + /locus_tag="PKOAIA_00080" + /protein_id="gnl|Bakta|PKOAIA_00080" + /translation="MYDYLIVGAGLSGAIFAHEATKRGKKVKVIDKRDHIGGNIYCENV + EGINVHKYGAHIFHTSNKKVWDYVNQFAEFNNYINSPVANYKGSLYNLPFNMNTFYAMW + GTKTPQEVKDKIAEQTAHMKDIEPKNLEEQAIKLIGPDVYEKLIKGYTEKQWGRSATEL + PPFIIKRLPVRLTFDNNYFNDRYQGIPIGGYNVIIENMLKDVEVELGVDFFTHREELEA + SAEKVVFTGMIDQYFDYKHGELEYRSLRFDHEILAEENYQGNAVVNYTEREIPYTRIIE + HKHFEYGTQAKTVITREYPADWKRGDEPYYPINDERNNAMFAKYQEEAAQNDKVIFCGR + LADYKYYDMHVVIERALEVVLSELGK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_061647439.1" + /gene="glf" + gene 15201..15437 + /locus_tag="PKOAIA_00085" + CDS 15201..15437 + /db_xref="SO:0001217" + /db_xref="UniRef:UniRef50_A0A4P8GD58" + /db_xref="UniRef:UniRef90_A0A4P8GD58" + /product="Fucose 4-O-acetylase-related acetyltransferase" + /locus_tag="PKOAIA_00085" + /protein_id="gnl|Bakta|PKOAIA_00085" + /translation="MKKIKEYDILKIMAIILVVLSHSAYYKISSNYGGMDYQQYLNSHS + 
AFTLYEILGKFMEIIYYFHIPLFMAISGVFFSI" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA + sequence:UniRef:UniRef90_A0A4P8GD58" + gene 15501..16259 + /locus_tag="PKOAIA_00090" + CDS 15501..16259 + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000766BF55" + /db_xref="UniRef:UniRef100_A0A4P8GC94" + /db_xref="UniRef:UniRef50_A0A4P8GC94" + /db_xref="UniRef:UniRef90_A0A4P8GC94" + /product="Acyltransferase family" + /locus_tag="PKOAIA_00090" + /protein_id="gnl|Bakta|PKOAIA_00090" + /translation="MPFFVFTLLYSLPLKYISNYYNGVSFWRAITGQFLLLGNSHLWYL + YALFIIFIISFYCLRRDTSIFVYLSLYIIHVLSFLIHITLVSAPLQFLFWFSMGFLFES + KRRKYNIFLENHKWISLLFFVLFIFLVVLNFLFKSDFKVLSRFFVDLLAILGSLICYNI + SYFLSNKTKILDSKLLNLILINALGIYIFSDTLNYFILSISYFVSDRFMFTSFGIIIIF + LIRFVFTLFLGLVFTLLFKKVFPKYSWLVN" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA + sequence:UniRef:UniRef100_A0A4P8GC94" + gene 16621..18603 + /locus_tag="PKOAIA_00095" + /gene="aliA" + CDS 16621..18603 + /db_xref="COG:COG4166" + /db_xref="COG:E" + /db_xref="GO:0015031" + /db_xref="GO:0015833" + /db_xref="GO:0042597" + /db_xref="GO:0043190" + /db_xref="GO:0055085" + /db_xref="RefSeq:WP_061647437.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0007656D72" + /db_xref="UniRef:UniRef100_UPI0007656D72" + /db_xref="UniRef:UniRef50_P35592" + /db_xref="UniRef:UniRef90_P35592" + /product="Oligopeptide-binding protein AliA" + /locus_tag="PKOAIA_00095" + /protein_id="gnl|Bakta|PKOAIA_00095" + /translation="MKSSKLFALAGVTLLAATTLAACSGSGSSAKGEKTFSYIYETDPD + NLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKDAKW + YTSEGEEYAAVKAQDFVTGLKYAADKKSDALYLVQESIKGLDAYVKGGIKDFSQVGIKA + LDDQTVQYTLNKPESFWNSKTTMGVLAPVNEEFLNSKGDDFAKATDPSSLLYNGPYLLK + SIVTKSSVEFAKNPNYWDKDNVHVDKVKLSFWDGQDTSKPAENFKDGSLTAARLYPTSA + SFAELEKSMKDNIVYTQQDSITYLVGTNIDRQSYKYTSKTSDEQKASTKKALLNKDFRQ + AIAFGFDRTAYASQLNGQTGASKILRNLFVPPTFVQADGKNFGDMVKERLVTYGDEWKD + 
VNLADSQDGLYNPEKAKAEFAKAKSALQAEGVTFPIHLDMPVDQTATTKVQRVQSMKQS + LEATLGADNVVIDIQQLQKDEVNNITYFAENAAGEDWDLSDNVGWGPDFADPSTYLDII + KPSVGESTKTYLGFDSGEDNVAAKKVGLYDYEKLVTEAGDEATDVAKRYDKYAAAQAWL + TDSALIIPTTSRTGRPILSKMVPFTIPFALSGNKGTSEPVLYKYLELQDKAVTVDEYQK + AQEKWMKEKEESNKKAQEDLAKHVK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_061647437.1" + /gene="aliA" +ORIGIN + 1 tcatagtagg tgtggttctt tttttcgagt gtagcccata gctttgagcg catagtggat + 61 ggtagttgga tgacagccaa attcagaagc tatttcagtc aaataagcgt ctggattgtc + 121 agtaagatag tttttaagtc tatctctatc aacctttctt ggttttgttc cttttacttg + 181 gtggtttagc tctcctgttt tctcttttag ctttaaccag ccataaatgg tattacgtga + 241 gatttggaaa acgtgtgatg cttctgttat actacctgtt cgctcacaat aagagagaac + 301 ttttttacga aaatctattg aatatgccat aggaagatta taccacattg tgtactacag + 361 tagattgaaa ctagaacagt acacctctac ttctaaaaca ttgttagaaa tcgattttac + 421 tgtcccgatc gatttgtcat cttcttattt cattttacta tatttttggt tcgcgggaag + 481 tctactaaga tacttaaaga tgcagatagt ggaaataaag gtgtagacat taccgtaaaa + 541 aagtgataca attgtaagat attgaatgta taggtattaa tcatgagtag acgttttaaa + 601 aaatcacgtt cacagaaagt gaagcgaagt gttaatatag ttttgctgac tatttattta + 661 ttgttagttg gttttttatt gttcttaatc tttaagtaca atatccttgc ttttagatat + 721 cttaacctag tggtaactgc gttagtccta ctagttgcct tggtagggct actcttgatt + 781 atctataaaa aagctgaaaa gtttactatt tttctgttgg tgttctctat ccttgtcagc + 841 tctgtgtcgc tctttgcagt acagcagttt gttggactga ccaatcgttt aaatgcgact + 901 tctaattact cagaatattc aatcagtgtc gctgttttag cagatagtga gatcgaaaat + 961 gttacgcaac tgacgagtgt gacagcaccg actgggactg ataatgaaaa tattcagaaa + 1021 ctactagctg atatcaagtc aagtcagaat accgatttga tggtcaacca gagttcgtct + 1081 tacttggcag cttacaagag tttgattgca ggggagacta aggccattgt cctaaatagt + 1141 gtctttgaaa acatcatcga gtcagagtat ccagactacg catcgaagat aaaaaagatt + 1201 tataccaagg gattcactaa aaaagtagaa gctcctaaga cgtctaagaa tcagtctttc + 1261 aatatctatg ttagtggaat tgacacctat 
ggtcctatta gttcggtgtc gcgatcagat + 1321 gtcaatatcc tgatgactgt caatcgagat accaagaaaa tcctcttgac cacaacgcca + 1381 cgtgatgcct atgtaccaat cgcagatggt ggaaataatc aaaaagataa attaacccat + 1441 gcaggcattt atggagttga ttcgtccatt cacaccttag aaaatctcta tggagtggat + 1501 atcaattact atgtgcgatt gaacttcact tctttcttga aaatgattga cttattggga + 1561 ggggtagatg ttcataatga tcaagagttt tcagctctac atgggaagtt ccatttccca + 1621 gtagggaatg tccatctaga ctctgagcag gctctaggtt ttgtacgtga acgctactca + 1681 ctagccgatg gagaccgtga tcgcgggcgc aatcaacaaa aggtgattgt ggctatcctt + 1741 caaaaattaa cgtcaaccga agcactgaaa aattatagta cgatcattaa tagcttgcaa + 1801 gattctatcc aaacaaatat gccacttgag actatgataa atttggtcaa tgctcagtta + 1861 gaaagtggag ggaattataa agtaaattct caagatttaa aagggacagg tcggatggat + 1921 cttccttctt atgcaatgcc agacagtaac ctctatgtga tggaaataga tgatagtagt + 1981 ttagctgtag ttaaagcagc tatacaggat gtgatggagg gtagatgaaa tgatagacat + 2041 ccattcgcac atcgtctttg atgtagatga tggtcccaag tcaagagagg aaagcaaggc + 2101 tctcttggca gaatcctaca gacagggggt gcgaaccatt gtctctacct ctcaccgtcg + 2161 caagggcatg tttgaaactc cggaagagaa gatagcagaa aactttcttc aggttcggga + 2221 aatagctaag gaagtggcga gtgacttgat cattgcttac ggggctgaaa tttactacac + 2281 accagatgtt ctggataagc tggaaaaaaa gcggattccg accctcaatg atagtcgtta + 2341 tgccttgata gagtttagta tgaacactcc ttatcgcgat attcatagcg ccttgagcaa + 2401 gatcttgatg ttgggaatta ctccagtcat tgcccacatt gagcgctatg atgctcttga + 2461 aaataatgaa aaacgcgttc gagaactgat tgatatgggc tgttacacgc aagtaaatag + 2521 ttcacatgtc ctcaaatcca aactttttgg cgaacgttat aaattcatga aaaaaagagc + 2581 tcagtatttt ttagagcagg atttggtcca tgtcattgca agtgatatgc acaatctaga + 2641 cggcagacct cctcatatgg cagaagcata tgaccttgtt acccaaaaat acggagaagc + 2701 gaaggctcag gaacttttta tagacaatcc tcgaaaaatt ataatggatc aactaattta + 2761 ggagaaatga tgaaagaaca aaacatgata gaaatcgatg tatttcaatt atttaaaacc + 2821 ttgtggaaac gcaagctaat aattttaata gtggcacttg tgacaggtgc gggggctttt + 2881 gcatatagca cttttattgt taagccagaa tatacgagta ccacgcgaat 
ttacgtagtg + 2941 aatcgcgatc aaggagacaa gccggggctg acaaatcagg atttgcaggc aggatcttat + 3001 ctggtaaaag actaccgtga gattatcctt tcgcaggatg tattggaaaa agtagcgaca + 3061 aatttgaagt tggatatgcc agcaaaaacg ttagccagca aagttcaagt gactgtacca + 3121 gctgacactc gtatcgtctc aatctctgtc aaggataaac agccagagga agccagtcgt + 3181 atcgctaatt ctctacgaga agttgctgca gaaaagatcg tcgctgtaac gcgagtatct + 3241 gatgtaacga cacttgaaga agcgcgacca gctacgactc cttcttctcc aaatgttcga + 3301 cgcaattcct tgtttggttt tcttggagga gcagtcgtaa cagtaattgc tgttcttttg + 3361 attgaggtgc tggacacccg tgtgaaacgt cctgaagatg ttgaagatgt actgaaaatt + 3421 ccacttttag ggctcgttcc agattttgac aaaataaaat aggaggaagt tatgccaaca + 3481 ttagaaatct cacaggcaaa attggattct gtaaaaaagg cagaggaata ttataacgct + 3541 ttgtgcacga acctacagtt aagtggagat ggtttgaaag tattgtctat cacttctgtg + 3601 aaaataggag aaggaaaatc aacgacttcc gccaatatcg cttgggcttt tgcgcgtgca + 3661 ggttacaaaa cgctgctgat tgatggagat attcgcaatt ctgttatgtt aggtgtcttt + 3721 aaagcaagga ataagattac aggcctgaca gaatttttat caggaactac agacctatca + 3781 caagggcttt gtgataccaa tatcgaaaat ctctttgtaa ttcaggctgg ctctgtgtca + 3841 ccgaatccga cagctcttct tcaaagtaag aatttcacta caatgcttga aaccttgcgt + 3901 aaatattttg actacatcat tgtagatact gctcctgttg gtgtcgtgat tgatgcggct + 3961 attattacgc gaaactgcga tgcttctatt ttagtgacgg aggcaggtga aataaatcga + 4021 cgggatattc aaaaagcaaa agaacagttg gaacacacag ggaagccgtt tttgggaatt + 4081 gtgttgaata aattcgatac ttcagtaaac aaatacggtt cttatggaaa ttatggagat + 4141 tacgggaaaa ataaaaaata ggtcggggga tagagatgaa tggaaaaata ttaaggtctt + 4201 cattggtcat aatccagagt tttcttgtta ttttattgac ttatctactt agtactgtga + 4261 gagaagcgga gattgtttca acaacagcta ttgcacttta tatcctccat tattttgtct + 4321 tttatatcag tgattatgga caggatttct ttaaaagggg atatttgatt gaacttctcc + 4381 agacattgaa atatatccta ttctttgcac tagcgattag tatttctaat tttttcttag + 4441 aggatcgatt tagtatttcc agacgaggca tgatttactt cctcacatta catgctctct + 4501 tagtctatgt gctaaaccta tttatcaagt ggtattggaa gcgggcttat cccaacttta + 4561 aaggaagtaa 
gaagattctc ctacttacag caacttctcg tgtcgaaaag gtactggata + 4621 gattaataga atcaaatgag gttgttggga agttggtagc cgtcagtgtc ttagataaac + 4681 cagattttca gcatgattgt ttaaaggtag tagcagaggg ggagatagta aactttgcga + 4741 ctcatgaggt ggtagatgaa gtctttatca atcttccaag tgaaaaatac aatattggag + 4801 agctggtctc tcagtttgaa acgatgggaa ttgatgtaac agttaatcta aatgcttttg + 4861 atcgtagttt ggcacgtaac aagcaaattc gtgagatggc aggattaaac gttgtgactt + 4921 tttctacagc attttataag actagtcatg taattgctaa gaggattatt gatatcgtgg + 4981 gtgcattggt agggctgata ctatgtggtt tagtcagtat tgtattggtt cctttgattc + 5041 gaaaggatgg gggctctgct atttttgctc agacgcgtat aggaaaaaat ggtcgtcagt + 5101 tcacttttta taagtttcgc tctatgtgtg tagatgccga ggcgaaaaaa agagaactca + 5161 tggaacaaaa taccatgcag ggtggaatgt ttaaggtgga cgatgatcct cgtatcacga + 5221 aaattggtcg ttttatacgg aagactagct tggacgagct accacagttt tataatgttc + 5281 taaagggaga tatgagtttg gttggcacac ggccaccaac agtggacgag tatgaacact + 5341 ataccccaga acaaaaacgt cggctaagtt ttaaacctgg tataacaggc ttatggcagg + 5401 tcagtggacg aagtgaaatc aaaaatttcg atgaagttgt caaattagat gtggcttata + 5461 tagatgattg gacaatctgg aaagatattg aaattttatt gaagacagtt aaggtagtat + 5521 tgatgaagga tggagcgaag tagattgata gatgtaaaaa tcattgtggc aacgcataaa + 5581 gaggttaaaa tgcctcaaga caatagtctt taccttccaa tacatgttgg gagagacggt + 5641 aaatcagata ttggttttat cggtgataat actggcgata atatatcctc tctaaatcca + 5701 tattattgtg agttaacggg actttattgg gcatggaaga atcttgatta taattactta + 5761 ggtttagttc attaccgtcg ttattttaca aataaatctc aagggtataa tgaaaatgtc + 5821 aatatggatg acgtcatttt gtctcgagct aatgttgaaa tattattaga gaaatctgac + 5881 ataatagttc caaagaagcg aaagtattat attgaaactc tttattcaca ttatgcccat + 5941 acccttaacg gagaacatct ggatcttgct aggaaaatta ttgagcaaaa tagttcagag + 6001 tatctttcat cctttgataa agtgatgaaa caaagaagcg gttatatgtt caatatgttt + 6061 atcatgaaaa aagaactatt agatgattat ttaccgtggc ttttttctat tctggatact + 6121 atgtacgaac agatggactt gactgactat actttatttg agtcacgttt attcgggcga + 6181 gttagtgagt tgttgtttaa tgtttggtta 
tgtaaaaaag gaataacgcc taaagaggta + 6241 ccatttatgt acatggagag agtggatttg tttgaaaaag gaaaatcttt tttaatggct + 6301 aaattttttg gaaagaagta tggacagagt ttctaggata tgaaagtaac tattattgga + 6361 caaataaaaa ataagagaac aggtcttgga aaggcgatta atgattttag ggattattgt + 6421 tgcaatcgtg ctacaagagt aacggaaata gatataacaa ataattttaa ttttttaagc + 6481 tctctttttc aaattttaat atctgataca gatgtttatt attttactcc agctggttca + 6541 gtagctggta atattaggga ttcactgttt ttgttcttta tgataatgaa aaggaaaaaa + 6601 atagtgaccc attttcataa tagtgctttt ggaaatgtga tgagacaaca tccgactcta + 6661 atgataataa atagaatatt gtattctaaa gttgatttga ttatattatt gggagagaaa + 6721 tcgaaaataa tgtttcaaca actaagaatt ttagacgaaa aatttaaaat aattaggaat + 6781 ggtgtggatg gatatttatt tattgaaaaa aatgaattaa ataaaaaaat gagcgatcta + 6841 cccataaata ttattttttt tagtaatatg attagagaaa aaggttatga aattttatta + 6901 gaagttgcta aaaagatgag ggaagatgag aaatatcact tttatttttc tggaaaattt + 6961 caggataata atttaaagac taggtttatt aatgaaattt atagtatgaa taatgtaaca + 7021 tatttagatg gcgtatatgg tagtgataag aaaaagttat tgcaaaaaat gcattacttt + 7081 gttttaccat cgtattataa agacgaaact ttacctatca gtatgttaga agcaatggca + 7141 aatggtctct atattattgt aagcgatgtg ggagttgtgt ctgaggtgat taataaagaa + 7201 actgctagtc ttattgaaat gataaacgaa gaaacagcag acagtattat agaaattatt + 7261 gatcagactt caaataaact taatgagtta gattttaatg tatcaaaata taagcaagag + 7321 ttgttaaatg aaaatataca agcatcaatt tatcagcaat tagagaggat agcaaattga + 7381 cggagaaaaa aaatactgga aaaatattaa cagtagttgt accatcatat aatgcagaaa + 7441 attatttaca agagacgatg ccgacgatac tttctgctaa gaatatagag agggtagaat + 7501 tactgattgt aaacgatggt tctacagaca aaaccgaaga aatagcaaga caattcgaga + 7561 gagaatatga gggaattgtc agagttataa gtaaggaaaa cggtggtcac ggttcggcag + 7621 taaatgcggg aattgaaaat gctgttggta attactttaa agtggtagat gcagatgatt + 7681 gggtgaacac caataattta gaagatttga tagtgtttct atctgaggtg gatgtggatc + 7741 aagttttatc accgtatgat aaaatttttg tgaattatcg aggtgatata gagcgtgaag + 7801 aagagtgcaa cgagttttcg caagttgaga acgaggtgat ctattctgca 
gaagaattct + 7861 atacacgaat taaacaaacg gtaggaatgc attccattac tgtgaaaacg agtcttttgc + 7921 aagagaacaa tattcggctg tctgaaaaaa tgttctatgt agatatggaa tatattgttt + 7981 atatacttcc atatgtaaaa agggttgttt tatttgataa aagtatttat agatatcgtc + 8041 taggaacaga gacacaaagc gttagtatgg cgagttatat taaaaatcgt gatatgcata + 8101 aacaagtgat ctatcatttg gttgattttt ataatcaaat gagatctagc gctgttttaa + 8161 agagaataac atggaaattg attttaaatt taataagaca gcaatggata atttatttta + 8221 atttatctaa aaaagagggg aaaaacagcg agtgttttga atttgataat tggctaataa + 8281 aagaaggacg gataaaaaaa ataccactat acttttttaa agctgtgaaa tatatcagat + 8341 ttaaggtgaa atattttctg gggataagga aataatatga ggaaaatagg aaaagtaata + 8401 aacgagtatt ttgcattaag aaaatcattt actcctgcta ttgctcggaa taaattattt + 8461 gaaaagtttt ggggacggat agggaattat aaaattttca ataatatagc tagtgatttt + 8521 tatcaataca aacatgaaac aatcataaat tttttggaaa aagattttag ccaattttta + 8581 aaatcctata actttaaaga ggtatcgcac aaggagatag aacaaagaaa aatcttctct + 8641 atgtggatat aaggatacga aagtgctcct aagttggttc agaagacgat tgatagccaa + 8701 aggaaatatg cagaaaaata cggatataaa tttgtttttt tggataaaaa caatatccgt + 8761 gaatatgtga cacttccatc agagatagta gaaaaatatg agaatggaac tatagatttt + 8821 ataaaatatt cggatgttgt aaggggaaca ttgctttcaa aatatggagg agtgtggtta + 8881 gattcgacta tttatgttga ttcttcacga gaactgaatt atttaaaaaa agatttttat + 8941 actattcgag caaagacaca tgagagagtg cccaaatata tcgcaaatgg taggtggtct + 9001 gcattttgtt tgtcagggga aaagcaaaac atagtatttg attttttaga gaaatttcat + 9061 gtagcatatt ttatgaaata cgatatagtg ctagattatt ttttgattga ctatattata + 9121 gaattaggtt ataggacaaa tgacttgatt agaaactata ttgataaagt cgaagaaaat + 9181 aatcaggagt tgttcttttt ggcagacaat ttttctaacc agtatgatga aaaagagtgg + 9241 gcaggagttt tatcaacaac tgcattgttt aagtgtagtt ataagtgtcc gataaatgaa + 9301 gcgacaggaa cctattttga tagattgatg aagggtgaac tgtagcataa agagagggaa + 9361 tggtatgatt tcagttattg ttccagtata caatgtcgcg gattatctgc gctttgcgtt + 9421 ggatagtctt ttggaacaga cgtataaaga ttttgagatt attctagtaa atgatggatc + 9481 cactgataat 
tctggagaaa tatgtgatga atatgggaaa ctatatgata atatttatgt + 9541 tttccataag aagaatggcg gactttcgga tgctagaaat tttggtttgg agaagagtcg + 9601 aggagagttt ataacctttc ttgattcaga tgattatttt gaaccgtatg cattagaatt + 9661 gttaattact attcaaaaaa aatatgatgt agatatcgta tcaactaaag gggtaataac + 9721 ctattctcat gatatttata gcaaaaaact gatggatgag gactacctaa ctgtaaaaat + 9781 attgacaaat aaagaatttt tggcagctgc atattataac gatgaaatga cggtatctgc + 9841 ttggggaaaa ttgtataaaa gagatttatt taaaacgatt tttccaaaag gaaagatcta + 9901 cgaggatttg tatgttgttg cagagcgttt gttgaatatt aaaacagttg ctcataccga + 9961 tttgcctata tatcattatt atcagagaca gggaagtatt gttaattcaa cattttcgga + 10021 tagacagtat gatttttttg atgcgattga tcataatgaa gccataataa aaaagttcta + 10081 ttgtggagat aaggaattgc tagcagcctt aaatgctaaa agagtaattg gctcctttat + 10141 tttgagtaat agcgcatttt ataatagtaa aaacgatatt actaaaataa taagaataat + 10201 taaaccgtat tattgggaag taataaaaaa taaaaaaatt ccaatgaaaa ggaaagttca + 10261 atgtgttttg tttctgcttt ccccaaatta ctactataaa ataaaagata agatgttaca + 10321 gagaggcagg atatagatgc atgttagatt agatggtttg ctggactata tatttctatt + 10381 tagtgtgatt attacttgta atactatgta ttcaactagt caaggatttg atggactagg + 10441 gaaatgggcg actctgttac ttgtggtatc agttattctg aaattgctta tctctagaat + 10501 atctatgaag gcaatcaatg tgattgtgtc gcgttcttta atatttatat taattattct + 10561 actcatagta atattaaatg gttttaagat ttctgagaca agtttcgtct attattttgt + 10621 attatttccg atttttatga tgattttgca gatgtactat gatgttaatg aaatcgcaaa + 10681 tctgatacgg aaatttgttc gtataatatt tcttttagca attggctctc tcctattttg + 10741 gcttattggt agtgtatttc atattatatc cccaacggtt tatgtgttga attattggaa + 10801 tggtggggga atagtagaag ggtactataa tcttcatttt gaagcacaaa aaatagagat + 10861 tttgggggcg atactgataa gaaatacggg gatttttgct gaagcaccta tgtggagttt + 10921 ggtattgagc cttgcattga tatttcaaac gcttcatata aaaaaatgga atttcacaac + 10981 ttggactctt attattacaa ttatgacaac tacgtcaaca acaggggttt atataatagg + 11041 tttgattttc ctatatgttt tattttcaaa aacaagtggt gtgaagagat atgtttctag + 11101 tttatttatt 
ttagcgatta tatgttgttt ttcaatatta tgggataata aatctggaac + 11161 tggttcagca actatacgct ttgatgatta taaggctggt tttttggcat ggcagaaaag + 11221 tcctatttgg ggattaggta tttcagacgg tcttagaacc attgaacaac atatggatag + 11281 aactgttaga tataatcttg ggtatagcaa tagctttttt gttgttttag ctcaaggagg + 11341 gataatgttg gcttcgtatt acttttatcc agtaattaaa attattttga ataaatttag + 11401 ttcgaatgat ttgaagtttt ctgcgctatt aataattttc cttatgataa ctactatatt + 11461 tatagagacc tatatgtttt tatttgtcat ttctttatac tattctcttg attttgggga + 11521 cgatagagat tgtcatgaga aacagtacat tactaattaa taataaaggt gtgaacagaa + 11581 ataagaagaa atgaaaatac taaaaaatta tgcctacaat ctttcttatc aattgttggt + 11641 gatcatactc cctatcatta cgactcccta tgtaacgagg gtttttagtt ctgacgattt + 11701 aggaacgtat ggctacttta gctccattgt tacctatttt accttgcttg caactcttgg + 11761 tgttgccaac tacggtacca aagagatttc agcacatcgt aaggaaattg ggaagaattt + 11821 ctggggaatt tattctctcc agtttggtgc aacttggcta tccattttgc tttatcttgc + 11881 cctttgtttc ttatttactt caatgcaaaa tccggtagct tatatattgg gattaagttt + 11941 agtgtcaaaa ggtttggata tttcttggtt atttcaaggt ttggaggatt ttagaaagat + 12001 tacagttcgg aacatcactg ttaagttagt tggtgcaatc tctattttcc tatttgtaaa + 12061 atcagctaat gacttatact tatatgtatt tcttcttacc attttcgaat tgttagggca + 12121 attaagcatg tggttacccg caagacaatt tattggtaaa tcatattttg attggaaata + 12181 cgctaagaag catttgaaac cagttatctt gttattcttg ccacagattg ccatctcgct + 12241 ttatgtgact ttggaccgta cgatgctggg ggtgttggct tcgacaaagg atgttggaat + 12301 ttatgatcaa gctttgaagc ttgttaatat tttactgact ttggttacct cactggggag + 12361 tgttatgttg ccacgagtat ctagcctttt atcgtctggg gattataaag ccgttaataa + 12421 gatgcacgag atgtcttttt taatctataa cttggtgatt ttcccaatca tagcaggaat + 12481 gttgattgtc aacgatgatt ttgttcgttt cttccttggg caaaattttc aagatgctcg + 12541 ctatgcgatt gctattatga ccttccgtat gttctttatt ggttggacca atataatggg + 12601 aattcaaatc ttgattccgc acaataaaaa taaggaattt atggtttcaa cgacagttcc + 12661 cgctattctg agtgtgggat tgaatttgtt gcttcttccc caatttggtt atataggtgc + 12721 tgcgattgtt 
tcagttttga ctgaggcgtt tgtatggggg attcagttat tctatacacg + 12781 tttttattta aaagaagttc ctattatcgg ttcaatgaca aaaactgcac ttgcatctgc + 12841 tgttatgtat ggtctcttgc taggttcaaa aacatctata catttttcgc caaccataaa + 12901 tgttttaata ttttcggtgc taggcggaat tatctatctt tttgcaattc tatctctgaa + 12961 agtggtagat gtgaaagaat taaaacaaat aatcaggaaa aattagaatg agcaaatttc + 13021 gaaatattaa cttagattta ctaaaagtgc ttgcatgtgt tggagtcgtt ctacttcata + 13081 caactatggg tgggtttaaa gagacaggtg catggaattt tttgacatat ttatattact + 13141 taggaaccta ttctatccct ctatttttta tggtcaatgg ttatttattg ttggggaaga + 13201 gagaaattac ctattcctac atattgcaaa aaataaaatg gctcctaata acagtgtcgt + 13261 catggacttt tatcgtttgg ctgtttaaaa gagactttac agagaactta attaaaaaaa + 13321 ttataggttc tttgatacaa aaggggtatt tcttccagtt ttggtttttt ggtgcactca + 13381 tacttattta tatatgtttg cctgttttga aaaatttcct taatttaaaa agaaattatt + 13441 tatacattct atctgtattg ctggttattg gtttgatttt tgagttagcg aatattgtat + 13501 ttcaaatgcc agcacaaaca tatgttatac aaacctttag attatggact tggttttttt + 13561 actacctttt aggtggtttt atagcgcaat ttaacaagga tattattaga aataggttta + 13621 agatatggat gaaagtagct actgtactct tattattaat ttcaccatta atattatttt + 13681 tcttagcgaa gaccacttac cataatcttt ttgctgaata tttttatgat attttatttg + 13741 taaaagttgt aagtttagga atttttctaa ctatattctc acttgcattg aatcaagata + 13801 tcaacaaatg gattattttt ctttctaacc aaactatggg tgtctttata atacacactt + 13861 atattatgaa agtgtgggaa aaactatttg gttttagttt tgtaggagca tatttacttt + 13921 ttgctatatt tactttaagt attagtttta ttattgctgg aatgttaatg aaaattcctt + 13981 atttcaatcg aattgtcaaa ttataaaaag gagaacaaaa tgtacgacta tctaatcgtc + 14041 ggtgcgggtt tgtctggagc tatttttgct cacgaagcta caaaacgtgg aaaaaaagta + 14101 aaagtgattg ataaacgcga tcacattgga gggaacatct actgtgaaaa tgtagaaggt + 14161 atcaatgtcc ataaatatgg tgcccatatc ttccatacct caaacaaaaa agtttgggac + 14221 tatgtcaatc aattcgctga atttaacaac tatatcaatt cacctgtcgc gaactataaa + 14281 ggaagtcttt ataatcttcc tttcaatatg aatactttct atgctatgtg ggggacaaaa + 14341 actcctcaag 
aggtcaaaga taagattgct gagcaaacgg ctcacatgaa ggacattgaa + 14401 cctaaaaact tggaagaaca ggctatcaag ttgatcggtc cagatgtcta tgaaaaatta + 14461 atcaagggtt atactgaaaa gcagtgggga cgctcagcaa cggaacttcc tccatttatc + 14521 attaaacgtc ttccagttcg tttaacattt gataataact attttaacga ccgttaccaa + 14581 ggaattccta ttggtggtta caatgtcatc atcgaaaata tgcttaaaga cgttgaagtt + 14641 gagcttggtg ttgatttctt tactcatcgt gaagagttag aagcatcagc tgaaaaagtt + 14701 gtcttcacag ggatgatcga ccagtatttt gactacaagc atggagagtt agaataccgt + 14761 agccttcgct ttgatcatga aattttggcc gaggaaaatt atcaaggaaa tgctgtagtg + 14821 aactatacgg agcgtgagat tccttatact cgtattattg agcataaaca ctttgagtat + 14881 ggtacgcaag ctaaaacggt cattactcgt gaatacccag ctgattggaa acgcggagat + 14941 gaaccttatt atccaatcaa tgatgagaga aacaatgcta tgtttgctaa atatcaagaa + 15001 gaagcagcac agaatgataa ggtgattttc tgcggacgtt tggccgatta taaatactac + 15061 gacatgcatg tggtcattga acgtgcctta gaagtcgtat taagtgagtt aggaaagtag + 15121 tcaattacat taaggtcaag tttaatggcc ttatatcttt tctataaaga aaaactacaa + 15181 ttagaggagc gagatttaat gtgaaaaaga taaaagaata tgacatttta aaaattatgg + 15241 ctattatttt agttgtgtta agtcatagtg cgtattataa aatatcgagc aattatggtg + 15301 gaatggatta tcaacaatat ttaaatagtc attcagcatt tactctatat gagatacttg + 15361 gtaaatttat ggaaattatc tattattttc atataccatt atttatggct atatcgggtg + 15421 tatttttctc tatttaaata aaaaaagatc gatggaataa gattgagaaa ttattaacta + 15481 gtaagtttaa aagattaata ttgccatttt ttgtttttac tttattatat agtttgccat + 15541 taaaatatat atcaaactac tacaatggtg tttcattttg gagagctata actggtcaat + 15601 tcttgttatt aggaaattct cacttatggt atttgtatgc attatttatt atctttataa + 15661 ttagttttta ttgtttaaga agagatactt ctatatttgt atacttgtcc ttatatatta + 15721 tacatgtact gagtttcttg attcatataa cgttagtaag tgcaccattg cagtttcttt + 15781 tttggttttc catgggattt ttgttcgaat ctaaaagaag gaagtataat atttttttgg + 15841 aaaatcacaa atggattagc cttttattct ttgtgttatt tatatttttg gtggttttaa + 15901 attttctatt taaaagcgat tttaaagtat tgagtcgatt ttttgttgac ttattagcta + 15961 ttttaggatc 
acttatttgt tacaatattt cgtacttttt aagtaataaa actaaaattt + 16021 tagatagtaa actacttaat ctcattttga ttaatgcttt agggatatat attttttctg + 16081 atactttaaa ctattttata ttaagtattt cttattttgt aagtgataga tttatgttta + 16141 cttcatttgg tataattatt atatttttaa ttagatttgt tttcacttta tttttgggat + 16201 tagtctttac attgctattt aaaaaagtat ttccaaaata ttcttggtta gttaactaga + 16261 aaatacaata tcagtgatta tgcactataa gctatcctgt aattcttaca gttaaatatt + 16321 ttatcctata tactgaggag acaaataaaa taacttatag tattttgcac cttatctagt + 16381 ttaattgtaa tataaaagaa aatatccagg aagtggtata gtactctctc attgtttaac + 16441 ttcgcttaaa tatataggtt aattccttga ctatgtgata tagttgaggg atttttaaat + 16501 gatattcata ttttttgcaa agatgttgtt tgaaaaataa ttttcaaaaa ttctgaaaat + 16561 tctgttgaca actttctgaa aagagtctat aatggagaga aagttttaaa ggagaaaatg + 16621 atgaaaagtt caaaactatt tgcccttgcg ggcgtgacat tattggcggc gactacttta + 16681 gctgcatgct ctggatcagg ttcaagcgct aaaggtgaga agacattctc atacatttat + 16741 gagacagacc ctgataacct caactatttg acaactgcta aggctgcgac agcaaatatt + 16801 accagtaacg tggttgatgg tttgctagaa aatgatcgct acgggaactt tgtgccgtct + 16861 atggctgagg attggtctgt atccaaggat ggattgactt acacttatac tatccgtaag + 16921 gatgcaaaat ggtatacttc tgaaggtgaa gaatacgcgg cagtcaaagc tcaagacttt + 16981 gtaacaggac taaaatatgc tgctgataaa aaatcagatg ctctttacct tgttcaagaa + 17041 tcaatcaaag ggttggatgc ctatgtaaaa gggggaatca aagatttctc acaagtagga + 17101 attaaggctt tggatgatca gacagttcag tacactttga acaaaccaga aagcttctgg + 17161 aattctaaga caaccatggg tgtgcttgcg ccagttaatg aagagttttt gaactcaaaa + 17221 ggggatgatt ttgccaaagc gacggatcca agtagtctct tgtataacgg tccttatttg + 17281 ttgaaatcca ttgtgacaaa atcctctgtt gaatttgcga aaaatccgaa ctactgggat + 17341 aaggacaatg tgcatgttga caaagttaaa ttgtcattct gggatggtca agataccagc + 17401 aaacctgcag aaaactttaa agatggtagc cttacagcag ctcgtcttta tccaacaagt + 17461 gcaagtttcg cagagcttga gaagagtatg aaggacaata ttgtctatac tcaacaagac + 17521 tctattacgt atctagttgg tacaaatatt gaccgtcagt cctataaata cacatctaag + 17581 accagcgacg 
aacaaaaggc atcgactaaa aaggctctct taaacaagga tttccgtcag + 17641 gctattgcat ttggatttga ccgtacagcc tatgcctctc agttgaatgg acaaactgga + 17701 gcaagtaaaa tcttgcgtaa tctctttgtg ccaccaacat ttgttcaagc agatggtaaa + 17761 aactttggcg atatggtcaa agagagattg gtcacttatg gggatgaatg gaaggatgtt + 17821 aatcttgcag attctcagga tggtctttac aatccagaaa aagccaaggc tgaatttgct + 17881 aaagctaaat cagccttaca agcagaaggt gtgacattcc caattcattt ggatatgcca + 17941 gttgaccaaa cagcaactac aaaagttcag cgcgtccaat ctatgaaaca atccttggaa + 18001 gcaactttag gagcggataa tgtagtcatt gatattcaac aactacaaaa agacgaagta + 18061 aacaatatta catattttgc tgaaaatgct gctggcgaag actgggattt atcagataat + 18121 gtcggttggg gtccagactt tgccgatcca tcaacctacc ttgatatcat caaaccatct + 18181 gtaggagaaa gtactaaaac atatttaggg tttgactcag gggaagataa tgtagctgct + 18241 aaaaaagtag gtctatatga ctacgaaaaa ttggttactg aggctggtga tgaggctaca + 18301 gatgttgcta aacgctatga taaatacgct gcagcccaag cttggttgac agatagtgct + 18361 ttgattattc caactacatc tcgtacaggg cgtccaatct tgtctaagat ggtaccattt + 18421 acaataccat ttgcattgtc aggaaataaa ggtacaagtg aaccagtctt gtataaatac + 18481 ttggaacttc aagacaaggc agtcactgta gatgaatacc aaaaagctca ggaaaaatgg + 18541 atgaaagaaa aagaagagtc taataaaaag gctcaagaag atctcgcaaa acatgtgaaa + 18601 taa +// diff --git a/public/res/serotype_genbank/serotype_33F.gb b/public/res/serotype_genbank/serotype_33F.gb new file mode 100644 index 0000000..64474eb --- /dev/null +++ b/public/res/serotype_genbank/serotype_33F.gb @@ -0,0 +1,769 @@ +LOCUS CR931702 16989 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 3084/37 (serotype 33f). +ACCESSION CR931702 +VERSION CR931702.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. 
+REFERENCE 1 (bases 1 to 16989) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 16989) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..16989 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="3084/37" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC33F_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC33F_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI34241.1" + /db_xref="UniProtKB/TrEMBL:Q4JZI8" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVELL" + gene 293..461 + /gene="aliB" + /locus_tag="SPC33F_0002" + /pseudo + CDS 293..461 + /gene="aliB" + /locus_tag="SPC33F_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(462..984) + /gene="tnp" + /locus_tag="SPC33F_0003" + /pseudo + CDS complement(join(462..779,781..984)) + /gene="tnp" + /locus_tag="SPC33F_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase (fragment)" + gene 1205..2650 + /gene="wzg" + 
/locus_tag="SPC33F_0004" + CDS 1205..2650 + /gene="wzg" + /locus_tag="SPC33F_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI34244.1" + /db_xref="GOA:O86885" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:O86885" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLLFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGIDVYNDQ + EFTAHTNGKYYPAGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1205..1321 + /gene="wzg" + /locus_tag="SPC33F_0004" + /note="Signal peptide predicted for SPC1607 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 39 and 40" + misc_feature 1409..1756 + /gene="wzg" + /locus_tag="SPC33F_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 1.3e-62" + misc_feature 1934..2377 + /gene="wzg" + /locus_tag="SPC33F_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 2.5e-69" + gene 2652..3383 + /gene="wzh" + /locus_tag="SPC33F_0005" + CDS 2652..3383 + /gene="wzh" + /locus_tag="SPC33F_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34245.1" + /db_xref="GOA:O86886" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:O86886" + /translation="MIDIHSHIVFDVDDGPKSREESKALLTESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + 
RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDRGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEQDLVHIIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 2655..3263 + /gene="wzh" + /locus_tag="SPC33F_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 4.6e-36" + gene 3389..4084 + /gene="wzd" + /locus_tag="SPC33F_0006" + CDS 3389..4084 + /gene="wzd" + /locus_tag="SPC33F_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34246.1" + /db_xref="GOA:O86887" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:O86887" + /translation="MMKEQNTIEIDVFQLFKTLWKRKLMILIVALVTGAGAFAYSTFI + VKPEYTSTTRIYVVNRNQGDKPGLTNQDLQAGSYLVKDYREIILSQDALEKVATNLKL + DMPAKTLASKVQVTVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIELLDTRVKRPEDVEDVLKI + PLLGLVPDFDKIK" + misc_feature 3389..3505 + /gene="wzd" + /locus_tag="SPC33F_0006" + /note="Signal peptide predicted for SPC1609 by SignalP 2.0 + HMM (Signal peptide probability 0.625) with cleavage site + probability 0.411 between residues 39 and 40" + misc_feature 3410..3826 + /gene="wzd" + /locus_tag="SPC33F_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 3.1e-55" + misc_feature 3932..4009 + /gene="wzd" + /locus_tag="SPC33F_0006" + /note="PS00217 Sugar transport proteins signature 2." 
+ gene 4094..4783 + /gene="wze" + /locus_tag="SPC33F_0007" + CDS 4094..4783 + /gene="wze" + /locus_tag="SPC33F_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34247.1" + /db_xref="GOA:Q4JZK1" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4JZK1" + /translation="MPTLEISQAKLDSVKKAEEYYNALCTNLQLSGDGLKVFSITSVK + IGEGKSTTSANIAWAFARAGYKTLLIDGDIRNSVMLGVFKARNKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFTTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRNCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGIVLNKFDTSVDKYGSY + GNYGDYGKNKK" + gene 4798..6165 + /gene="wchA" + /locus_tag="SPC33F_0008" + CDS 4798..6165 + /gene="wchA" + /locus_tag="SPC33F_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI34248.1" + /db_xref="GOA:O86888" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:O86888" + /translation="MNGKIVKPSLAIIQSFLVILLTYLLSAVREAEIVSTTAIALYIL + HYFVFYISVYGQDFFKRGYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYF + LTLHALLVYVLNLFIKWYWKRTYPNFKGSKKILLLTATFRVEKVLDRLIESNEVVGEL + VAVSVLDKPDFQHDCLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + IDVTVNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHVIAKRIIDIMGALVGLIL + CGLVSIVLVPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGVTGLWQVSGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVLM + KDGAK" + misc_feature 4798..4890 + /gene="wchA" + /locus_tag="SPC33F_0008" + /note="Signal peptide predicted for SPC1611 by SignalP 2.0 + HMM (Signal peptide probability 0.845) with cleavage site + probability 0.335 between residues 31 and 32" + misc_feature 5581..6162 + /gene="wchA" + /locus_tag="SPC33F_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 2.7e-157" + gene 
6152..6958 + /gene="wciB" + /locus_tag="SPC33F_0009" + CDS 6152..6958 + /gene="wciB" + /locus_tag="SPC33F_0009" + /note="member of homology group 16" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34249.1" + /db_xref="GOA:O86889" + /db_xref="UniProtKB/TrEMBL:O86889" + /translation="MERSRLIDVKIIVATHKEVKMPQDNSLYLPIHVGRDGKSDIGFI + GDNTGDNISSLNPYYCELTGLYWAWKNLDYNYLGLVHYRRYFTNKSQGYNENVNMDDL + ILSRANVEILLEKSDIIVPKKRKYYIETLYSHYAHTLNGEHLDLARKIIEQNSSEYLS + SFDKVMKQRSGYMFNMFIMKKELLDDYLPWLFSILDTMYEQMDLTDYTLFESRLFGRV + SELLFNVWLCQKGITPKEVPFMYMERVDLFEKGKSFLMAKFFGKKYGQSF" + gene 6962..8002 + /gene="wciC" + /locus_tag="SPC33F_0010" + CDS 6962..8002 + /gene="wciC" + /locus_tag="SPC33F_0010" + /note="member of homology group 125" + /codon_start=1 + /transl_table=11 + /product="putative galactosyl transferase" + /protein_id="CAI34250.1" + /db_xref="GOA:O86890" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:O86890" + /translation="MKVTIIGQIKNKRTGLGKAINDFRDYCCNRATRVTEIDITNNFN + FLSSLFQILISDTDVYYFTPAGSVAGNIRDSLFLFFMIMKRKKIVTHFHNSAFGNVMR + QHPTLMIINRILYSKVDLIILLGEKSKIMFQQLRILDEKFKIIRNGVDGYLFIEKNEL + NKKMSDLPINIIFFSNMIREKGYEILLEVAKKMVGDEKYHFYFSGKFQDNNLKTRFIN + EIYSMNNVTYLDGVYGSDKKKLLQKMHYFVLPSYYKDETLPISMLEAMANGLYIIVSD + VGVVSEVINKETASLIEMINEETADSIIEIINQTSNKLNELDFNVSKYKQELLNENIQ + ASIYQQLERIAN" + misc_feature 7421..7933 + /gene="wciC" + /locus_tag="SPC33F_0010" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 2e-14" + gene 7999..8997 + /gene="wciD" + /locus_tag="SPC33F_0011" + CDS 7999..8997 + /gene="wciD" + /locus_tag="SPC33F_0011" + /note="member of homology group 60" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34251.1" + /db_xref="GOA:Q4JZI0" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JZI0" + /translation="MTKKKNTGKILTVVVPSYNAENYLQETMPTILSAKNIERVELLI + VNDGSTDRTEEIARQFEREYEGIVRVISKENCGHGSAVNAGIENAVGNYFKVVDADDW + 
VNTNNLEDLIVFLSEVDVDQVLSPYDKIFVNYRGDIEREEECNEFSQVENEVIYSAEE + FYTRIKQTVGMHSITVKTSLLQENNIRLSEKMFYVDMEYIVYMLPYVKKVVLFDKSIY + RYRLGTETQSISMASYIKNRDMHKQVIYHLVDFYNQMRSSAVLRRITWKLILNLIRQQ + WIIYFNLSKKEGKNSECFEFDNWLIKEGRIKKIPLYFFKAVKYIRFKVKYFLGIRK" + misc_feature 8032..8577 + /gene="wciD" + /locus_tag="SPC33F_0011" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 4.1e-31" + gene 8999..9967 + /gene="wciE" + /locus_tag="SPC33F_0012" + CDS 8999..9967 + /gene="wciE" + /locus_tag="SPC33F_0012" + /note="member of homology group 44" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34252.1" + /db_xref="GOA:O86892" + /db_xref="InterPro:IPR008441" + /db_xref="UniProtKB/TrEMBL:O86892" + /translation="MRKIGKVINEYFVLRKSFTPAIARNKLFEKFWGRIGNYKIFNNI + ASNFYQYKHETIINFLEKDFSQFLKSYNFKEVSHKEIEQRKIFSMWIQGYESAPKLVQ + KTIDSQRKYAEKYGYKFVFLDENNIREYVTLPSEIVEKYENGTIDFIKYSDVVRGTLL + SKYGGVWLDSTIYVDSSRELNYLKKDFYTIRAKTHERVPKYIANGRWSAFCLSGEKQN + IVFDFLEKFHVAYFMKYDIVLDYFLIDYIIELGYRTNDLIRNYIDKVEENNQELFFLA + DNFSNQYDEKEWAGVLSTTALFKCSYKCPINEATGTYFDRLMKGEL" + misc_feature 9098..9949 + /gene="wciE" + /locus_tag="SPC33F_0012" + /note="HMMPfam hit to PF05704, Capsular polysaccharide + synthesis protein, score 1.1e-144" + gene 9987..10958 + /gene="wciF" + /locus_tag="SPC33F_0013" + CDS 9987..10958 + /gene="wciF" + /locus_tag="SPC33F_0013" + /note="member of homology group 25" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34253.1" + /db_xref="GOA:O86893" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:O86893" + /translation="MISVIVPVYNVADYLRFALDSLLEQTYKDFEVILVNDGSTDNSG + EICDEYGKLYDNIHVFHKKNGGLSDARNFGLEKSRGEFITFLDSDDYFEPYALELLIT + IQKKYDVDIVSTKGGITYSHDIYSKKLMAEDYLTVKILTNKEFLAAVYYNDEMTVSAW + GKLYKRDLFKTIFPKGKIYEDLYVVAERLLNIKTVAHTDLPIYHYYQRQGSIVNSTFS + DRQYDFFDAIDHNEAIIKKFYCGDKELLAALNAKRVIGSFILSNSAFYNSKNDITKII + RIIKPYYWEVIKNKKIPMKRKVQCVLFLLSPNYYYKIKDKMLQRGRI" + misc_feature 
9993..10505 + /gene="wciF" + /locus_tag="SPC33F_0013" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 6.8e-50" + gene 10959..12182 + /gene="wzy" + /locus_tag="SPC33F_0014" + CDS 10959..12182 + /gene="wzy" + /locus_tag="SPC33F_0014" + /note="member of homology group 126" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI34254.1" + /db_xref="UniProtKB/TrEMBL:O86894" + /translation="MHVRLDGLLDYIFLFSVIITCNTMYSTSQGFDGLGKWATLLLVV + SVFLKLLISRISMKAINVIVSRSLIFILIILLIVILNGFKISETSFVYYFVLFPIFMM + ILQMYYDVNEIANLIRKFVRIIFLLAIGSLLFWLIGSVFHIISPTVYVLNYWNGGGIV + EGYYNLHFEAQKIEILGAILIRNTGIFAEAPMWSLVLSLALIFQTLHIKKWNFTTWTL + IITIMTTTSTTGVYIIGLIFLYVLFSKTSGVKRYVSSLFILAIICCFSILWDNKSGTG + SATIRFDDYKAGFLAWQKSPIWGLGISDGLRTIEQHMDRTVRYNLGYSNSFFVVLAQG + GIMLASYYFYPVIKIILNKFSSNDLKFSALLIIFLMITTIFIETYMFLFVISLYYSLD + FGDDRDCHEKQYITN" + misc_feature 11781..11978 + /gene="wzy" + /locus_tag="SPC33F_0014" + /note="HMMPfam hit to PF04932, O-Antigen Polymerase, score + 1e-11" + gene 12213..13628 + /gene="wzx" + /locus_tag="SPC33F_0015" + CDS 12213..13628 + /gene="wzx" + /locus_tag="SPC33F_0015" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI34255.1" + /db_xref="GOA:O86895" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:O86895" + /translation="MKILKNYAYNLSYQLLVIILPIITTPYVTRVFSSDDLGTYGYFS + SIVTYFTLLATLGVANYGTKEISAHRKEIGKNFWGIYSLQFGATWLSILLYLALCFLF + TSMQNPVAYILGLSLVSKGLDISWLFQGLEDFRKITVRNITVKLVGAISIFLFVKSAN + DLYLYVFLLTIFELLGQLSMWLPARQFIGKSYFDWKYAKKHLKPVILLFLPQIAISLY + VTLDRTMLGVLASTKDVGIYDQALKLVNILLTLVTSLGSVMLPRVSSLLSSGDYKAVN + KMHEMSFLIYNLVIFPIIAGMLIVNDDFVRFFLGQNFQDARYAIAIMTFRMFFIGWTN + IMGIQILIPHNKNKEFMVSTTVPAILSVGLNLLLLPQFGYIGAAIVSVLTEAFVWGIQ + LFYTRFYLKEVPIIGSMTKTALASAVMYGLLLGSKTSIHFSPTINVLIFSVLGGIIYL + FAILSLKVVDVKELKQIIRKN" + misc_feature 12219..13013 + /gene="wzx" + /locus_tag="SPC33F_0015" + /note="HMMPfam hit to PF01943, 
Polysaccharide biosynthesis + protein, score 4.4e-79" + gene 13630..14628 + /gene="wciG" + /locus_tag="SPC33F_0016" + CDS 13630..14628 + /gene="wciG" + /locus_tag="SPC33F_0016" + /note="member of homology group 21" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI34256.1" + /db_xref="GOA:O86896" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:O86896" + /translation="MSKFRNINLDLLKVLACVGVVLLHTTMGGFKETGAWNFLTYLYY + LGTYSIPLFFMVNGYLLLGKREITYSYILQKIKWLLITVSSWTFIVWLFKRDFTENLI + KKIIGSLIQKGYFFQFWFFGALILIYLCLPILRQFLNSKRSYLYSLSLLMTIGLIFEL + SNILLQMPIQTYVIQTFRLWTWFFYYLLGGYIAQFTIEEIESRFKNWMKIVSILLLLI + SPIILFFIAKTIYHNLFAEYFYDTLFVKVSTLGIFLTILMLTLNENRRESIVSLSNQT + MGVFIIHTYIMKVWEKVLGFNFVGAYLLFALFTLSVSFIIVGMLMKIPYFNRIVKL" + gene 14642..15751 + /gene="glf" + /locus_tag="SPC33F_0017" + CDS 14642..15751 + /gene="glf" + /locus_tag="SPC33F_0017" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI34257.1" + /db_xref="GOA:O86897" + /db_xref="HSSP:1I8T" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR006076" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:O86897" + /translation="MYDYLIVGAGLSGAIFAYEATKRGKKVKVIDKRNHIGGNIYCEN + VEGVNVHKYGAHIFHTSNKKVWDYVNQFAEFNNYVNSPVANYKGSLYNLPFNMNTFYA + MWGTKTPQEVKDKITEQTADMKDVEPKNLEEQAIKLIGPDVYEKLIKGYTEKQWGRSA + TELPPFIIKRLPVRLTFDNNYFNDRYQGIPIGGYNVIIENMLKDVEVELGVDFFAHRE + ELEASAEKVVFTGMIDQYFGYKHGELEYRSLRFDHEILDEENYQGNAVVNYTEREIPY + TRIIEHKHFEYGTQAKTVITREYPADWKRGDEPYYPINDEKNNAMFAKYQEEASKNDK + VIFCGRLADYKYYDMHVVIERALEVVEKEFGYDKK" + misc_feature 15077..15679 + /gene="glf" + /locus_tag="SPC33F_0017" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 2.3e-137" + gene order(15738..16187,16201..16767) + /gene="wcjE" + /locus_tag="SPC33F_0018" + CDS join(15738..16187,16201..16767) + /gene="wcjE" + /locus_tag="SPC33F_0018" + 
/note="member of homology group 18" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI34258.1" + /db_xref="GOA:Q4JZH3" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q4JZH3" + /translation="MTKSRINWIDFGKGFSIFLVLAGHVLLGLYQSEKFPTANNILSL + LIAQVYIFHIPVFFALSGYFFKPVSDLKEFWQYAKKKTIVFGLPYIFYSIIHFGLQKV + AGATVRVPTTIFDLINIYKNPIGVSWYLYILWSILIMYGLVSIFNQKSLISVFAYCLT + LFVQTDIYIIQRTLVWGICFFLGSVLNEIHFNKISLKKFLVFFVIFDFIYMLVWFLFY + EVESKRDSVSYSNPGVWGIAFIVCILVAFVIFPKISEKFPKTFLYFTKYGKDSLGIYI + LHAPICSMIRILMLKVGINSVFLHVVVGIVLGWYLSILATYILKKIPFLNIVLLPQKY + IKLK" + gene 16942..>16989 + /gene="aliA" + /locus_tag="SPC33F_0019" + CDS 16942..>16989 + /gene="aliA" + /locus_tag="SPC33F_0019" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34259.1" + /db_xref="UniProtKB/TrEMBL:Q4K2C2" + /translation="MMKSSRLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcgta taaaaacaag + 181 ggaggactgt ataaaaggca gaaatccttt gttttttata accaaggttt ataaaccttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga agacgaacat + 301 aaagaagcgt atccttagtg caggcctgac ttttacatct gctttgcttt tagctgcttg + 361 cgaccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaactat ctattagact attacgctga taatatagtc aattgaaaca agaacaagac + 481 aaaagagcct cataaaaggt attgcaactt ggtaatacct ttttgaggtg ctttttgata + 541 tgagcccatg ttttctcaat aggattgtac tcaggtgagt agggaggaag aggtaaaagt + 601 ttatgcccaa actcttcgca taaaagttct agcttcccca ttctatggaa tcttgcatta + 661 tccataataa taaccgatgg tgtggttaat gttggtaaga gaaatttctg aaaccaagct + 721 tcaaaaaagt cgctcgtcat cgtctcttcg taagtcattg gagcgattaa ctcaccattc + 781 atttgttaga cctgcaatca aagaaatcct ctgatatctt cttccagata ctttgcctct + 841 tcttaactga ccttttaatg agcgaccata ttctcgatga aaataagtat cgaatcctgt + 901 ttcatcaatc taaacaggtg ctaggtgctt 
taaactatta aaattcttaa gaaataaggc + 961 tactttttct gggtcttgtt cataattaga ttgaaactag agtagtacac ctctgcttct + 1021 aaaaaatttt tagaaatcga tttaactgtc ctgatcgatt tgtcatgttc ttatttcatt + 1081 ttactatatt tttgtttcgc gggaagtcta ctaagatact taaagatgca gatagtaaaa + 1141 aaatgtagac attaccgtaa aaaagtgata taatcgtatg atgttcaatg tataggtgtt + 1201 aatcatgagt agacgtttta aaaaatcacg ttcacagaaa gtgaagcgaa gtgttaatat + 1261 agttttgctg actatttatt tattgttagt ttgtttttta ttgttcttaa tctttaagta + 1321 caatatcctt gcttttagat atcttaatct agtggtaact gcgttagtcc tactagttgc + 1381 cttggtaggg ctactcttga ttatctataa aaaagctgaa aaatttacta tttttctgtt + 1441 gctgttctct atccttgtca gctctgtgtc gctctttgca gtacagcagt ttgttggact + 1501 gaccaatcgt ttaaatgcga cttctaatta ctcagaatat tcaatcagtg tcgctgtttt + 1561 agcagatagt gagatcgaaa atgttacgca actgacgagt gtgacagcac cgactgggac + 1621 tgataatgaa aatattcaaa aactactagc tgatatcaag tcaagtcaga ataccgattt + 1681 gacggtcaac cagagttcgt cttacttggc agcttacaag agtttgattg caggggagac + 1741 taaggccatt gtcctaaata gtgtctttga aaatatcatc gagtcagagt atccagacta + 1801 cgcatcgaag ataaaaaaga tttataccaa gggattcact aaaaaagtag aagctcctaa + 1861 gacgtctaag aatcagtctt tcaatatcta tgttagtgga attgacacct atggccctat + 1921 tagttcagtg tcgcgatcag atgtcaatat cctgatgact gtcaatcgag ataccaagaa + 1981 aatcctcttg accacaacgc cacgtgatgc ctatgtacca atcgcagatg gtggaaataa + 2041 tcaaaaagat aaattaaccc atgcgggcat ttatggagtt gattcgtcca ttcacacctt + 2101 agaaaatctc tatggagtgg atatcaatta ctatgtgcga ttgaacttca cttcgttttt + 2161 gaaattgatt gatttgttgg gtggaattga tgtttataat gatcaagaat ttactgccca + 2221 tacgaatgga aagtattacc ctgcaggcaa tgttcatctt gattcagaac aggctctcgg + 2281 ttttgttcgt gagcgctact cactagcaga tggcgatcgt gaccgcgggc gcaatcaaca + 2341 aaaggtgatt gtggctatcc ttcaaaaatt aacgtcaacc gaagcactga aaaattatag + 2401 cacgatcatt aatagcttgc aagattctat ccaaacaaat atgccacttg agactatgat + 2461 aaatttggtc aatgctcagt tagaaagtgg agggaattat aaagtaaatt ctcaagattt + 2521 aaaaggtaca ggtcggacgg atcttccttc ttatgcaatg ccagacagta 
acctctatgt + 2581 gatggaaata gatgatagta gtttagctgt agttaaagca gctatacagg atgtgatgga + 2641 gggtagatga aatgatagac atccattcgc atatcgtttt tgatgtagat gacggtccca + 2701 agtcaagaga ggaaagcaag gctctcttga cagaatccta caggcagggg gtgagaacca + 2761 ttgtctctac ctctcaccgt cgcaagggca tgtttgaaac tccggaagag aagatagcag + 2821 aaaactttct tcaggttcgg gaaatagcta aggaagtggc gagtgacttg gtcattgctt + 2881 atggggctga aatttactac acaccagatg ttctggataa gctggaaaaa aagcggattc + 2941 cgaccctcaa tgatagtcgt tatgccttga tagagttcag tatgaacact ccttatcgcg + 3001 atattcatag cgccttgagc aagatcttga tgttgggaat tactccagtc attgcccaca + 3061 ttgagcgcta tgatgctctt gaaaataatg aaaaacgcgt tcgagaactg attgataggg + 3121 gctgttacac gcaagtaaat agttcacatg tcctcaaacc caaacttttt ggcgaacgtt + 3181 ataaattcat gaaaaaaaga gctcagtatt ttttagagca ggatttggtt catatcattg + 3241 caagtgatat gcacaatcta gacggtagac ctcctcatat ggcagaagca tatgaccttg + 3301 ttacccaaaa atacggagaa gcgaaggctc aggaactttt tatagacaat cctcgaaaaa + 3361 ttgtaatgga tcaactaatt taggagaaat gatgaaagaa caaaacacga tagaaatcga + 3421 tgtatttcaa ttatttaaaa ccttgtggaa acgcaagcta atgattttaa tagtggcact + 3481 tgtgacaggt gcgggggctt ttgcatatag cacttttatt gttaagccag aatatacgag + 3541 taccacgcga atttacgtag tgaatcgcaa tcaaggagac aagccggggc tgacaaatca + 3601 ggatttgcag gcaggatctt atctggtaaa agactaccgt gagattatcc tttcgcagga + 3661 tgcattggaa aaagtagcga caaatttgaa gttggatatg ccagcaaaaa cgttagccag + 3721 caaagttcaa gtgactgtac cagctgacac tcgtatcgtc tcaatctctg tcaaggataa + 3781 acagccagag gaagccagtc gtatcgctaa ttctctacga gaagttgctg cagaaaagat + 3841 cgtcgctgta acgcgagtat ctgatgtaac gacacttgaa gaagcgcgac cagctacgac + 3901 tccctcttct ccaaatgttc gacgcaattc cttgtttggt tttcttggag gagcagtcgt + 3961 aacagtaatt gctgttcttt tgattgagtt gctggacacc cgtgtgaaac gtcctgaaga + 4021 tgttgaagat gtactgaaaa ttccactttt agggctcgtt ccagattttg acaaaataaa + 4081 ataggaggaa gttatgccaa cattagaaat ctcacaggca aaattggatt ctgtaaaaaa + 4141 ggcagaggaa tattataacg ctttgtgcac gaacctacag ttaagtggag atggtttgaa + 4201 agtattttct 
atcacttctg tgaaaatagg agaaggaaaa tcaacgactt ccgccaatat + 4261 cgcttgggct tttgcgcgtg caggttacaa aacgctgctg attgatggag atattcgcaa + 4321 ttctgttatg ttaggtgtct ttaaagcaag gaataagatt acaggcctga cagaattttt + 4381 atcaggaact acagacttat cacaagggct ttgtgatacc aatatcgaaa atctctttgt + 4441 aattcaggct ggctctgtgt caccgaatcc gacagctctt cttcaaagta agaatttcac + 4501 tacaatgctt gaaaccttgc gtaaatattt tgactacatc attgtagata ctgctcctgt + 4561 tggtgtcgtg attgatgcgg ctattattac gcgaaactgc gatgcttcta ttttagtgac + 4621 ggaggcaggt gaaataaatc gtcgggatat tcaaaaagca aaagaacagt tggaacacac + 4681 aggaaagccg tttttgggaa ttgtgttgaa taaattcgat acttcagtag acaaatacgg + 4741 ttcttatgga aattatggag attacgggaa aaataaaaaa taggtcgggg gatagagatg + 4801 aatggaaaaa tagtaaagcc ttcattggcc ataatccaga gttttcttgt tattttattg + 4861 acttatctac ttagtgctgt gagagaagcg gagattgttt caacaacagc tattgcactt + 4921 tatatcctcc attattttgt cttttatatc agtgtttatg ggcaggattt ctttaaaagg + 4981 ggatatttga ttgaacttgt ccagacattg aaatatatcc tattctttgc actagcgatt + 5041 agtatttcta attttttctt agaggatcga tttagtattt ccagacgagg catgatttac + 5101 ttcctcacat tacatgctct cttagtctat gtgctaaacc tatttatcaa gtggtattgg + 5161 aagcggactt atcccaactt taaaggaagt aagaagatcc tcttgcttac agcaactttt + 5221 cgtgtcgaaa aggtactgga tagattaata gaatcaaatg aggttgttgg ggagttggta + 5281 gccgtcagtg tcttagataa accagatttt cagcatgatt gtttaaaggt agtagcagag + 5341 ggggagatag taaactttgc gactcatgag gtggtcgatg aagtctttat caatcttccg + 5401 agtgaaaaat acaatattgg agagcttgtc tctcagtttg aaacgatggg aattgatgta + 5461 acagttaatc taaatgcttt tgatcgtagt ttggcacgta acaagcaaat tcgtgagatg + 5521 gcaggattaa acgttgtgac tttttctaca acattttata agactagtca tgtaattgct + 5581 aagcggatta ttgatatcat gggtgcattg gtcgggttga tattatgtgg tttagtcagt + 5641 attgtactgg ttcctttgat tcgaaaggat gggggctctg ctatttttgc tcagacgcgt + 5701 ataggaaaaa atggtcgtca gttcaccttt tataagtttc gctctatgtg tgtagatgcc + 5761 gaggcgaaaa aaagagaact catggaacaa aataccatgc agggtggaat gtttaaggtg + 5821 gacgatgatc ctcgtatcac gaaaattggt 
cgttttatac ggaagactag cttggacgag + 5881 ctaccacagt tttataatgt tctaaaggga gatatgagtt tggttggcac acggccacca + 5941 acagtggatg agtatgaaca ctatacccca gaacaaaaac gtcggctaag ttttaaacct + 6001 ggtgtaacag gcttatggca ggtcagtgga cgaagtgaaa tcaaaaattt cgatgaagtt + 6061 gtcaaattag atgtggctta tatagatgat tggacaatct ggaaagatat tgaaatttta + 6121 ttgaagacag ttaaggtagt attgatgaag gatggagcga agtagattga tagatgtaaa + 6181 aatcattgtg gcaacgcata aagaggttaa aatgcctcaa gacaatagtc tttaccttcc + 6241 aatacatgtt gggagagacg gtaaatcaga tattggtttt atcggtgata atactggcga + 6301 taatatatcc tctctaaatc catattattg tgagttaacg ggactttatt gggcatggaa + 6361 gaatcttgat tataattact taggtttagt tcattaccgt cgttatttta caaataaatc + 6421 tcaagggtat aatgaaaatg tcaatatgga tgacctcatt ttgtctcgag ctaatgttga + 6481 aatattatta gagaaatctg acataatagt tccaaagaag cgaaagtatt atattgaaac + 6541 tctttattca cattatgccc atacccttaa cggagaacat ctggatcttg ctaggaaaat + 6601 tattgagcaa aatagttcag agtatctttc atcctttgat aaagtgatga aacaaagaag + 6661 cggttatatg ttcaatatgt ttatcatgaa aaaagaacta ttagatgatt atttaccgtg + 6721 gcttttttct attctggata ctatgtacga acagatggac ttgactgact atactttatt + 6781 tgagtcacgt ttattcgggc gagttagtga gttgttgttt aatgtttggt tatgtcaaaa + 6841 aggaataacg cctaaagagg taccatttat gtacatggag agagtggatt tgtttgaaaa + 6901 aggaaaatct tttttaatgg ctaaattttt tggaaagaag tatggacaga gtttctagga + 6961 tatgaaagta actattattg gacaaataaa aaataagaga acaggtcttg gaaaggcgat + 7021 taatgatttt agggattatt gttgcaatcg tgctacaaga gtaacggaaa tagatataac + 7081 aaataatttt aattttttaa gctctctttt tcaaatttta atatctgata cagatgttta + 7141 ttattttact ccagctggtt cagtagctgg taatattagg gattcactgt ttttgttctt + 7201 tatgataatg aaaaggaaaa aaatagtgac ccattttcat aatagtgctt ttggaaatgt + 7261 gatgagacaa catccgactc taatgataat aaatagaata ttgtattcta aagttgattt + 7321 gattatatta ttgggagaga aatcgaaaat aatgtttcaa caactaagaa ttttagacga + 7381 aaaatttaaa ataattagga atggtgtgga tggatattta tttattgaaa aaaatgaatt + 7441 aaataaaaaa atgagcgatc tacccataaa tattattttt tttagtaata 
tgattagaga + 7501 aaaaggttac gaaattttat tagaagttgc taagaagatg gtgggggatg agaaatatca + 7561 cttttatttt tctggaaaat ttcaggataa taatttaaag actaggttta ttaatgaaat + 7621 ttatagtatg aataatgtaa catatttaga tggtgtatat ggtagtgata agaaaaagtt + 7681 attgcaaaaa atgcattact ttgttttacc atcgtattat aaagatgaaa ctttacctat + 7741 cagtatgtta gaagcaatgg caaatggtct ctatattatt gtaagcgatg tgggagttgt + 7801 gtcagaggtg attaataaag aaactgctag tcttattgaa atgataaacg aagaaacagc + 7861 agacagtatc atagaaatta ttaatcagac ttcaaataaa cttaatgagt tagattttaa + 7921 tgtatcaaaa tataagcaag agttgttaaa tgaaaatata caagcatcaa tttatcagca + 7981 attagagagg atagcaaatt gacgaagaaa aaaaatactg gaaaaatatt aacagtagtt + 8041 gtaccatcat ataatgcaga aaattattta caagagacga tgccgacgat actttctgct + 8101 aagaatatag agagggtaga attactgatt gtaaacgatg gttctacaga cagaaccgaa + 8161 gaaatagcaa gacaattcga gagagaatat gagggaattg ttagagttat aagtaaggaa + 8221 aactgtggtc acggttcggc agtaaatgcg gggattgaga atgctgttgg taattacttt + 8281 aaagtggtag atgcagatga ttgggtgaac accaataatt tagaagattt gatagtgttt + 8341 ctatctgagg tggatgtgga tcaagtttta tcaccatatg ataaaatttt tgtgaattat + 8401 cgaggtgata tagagcgtga agaagagtgc aacgagtttt cgcaagttga gaacgaggtg + 8461 atctattctg cagaagaatt ctatacacga attaaacaaa cggtaggaat gcattccatt + 8521 actgtgaaaa cgagtctttt gcaagagaac aatattcggc tgtctgaaaa aatgttctat + 8581 gtagatatgg aatatattgt ttatatgctt ccatatgtaa aaaaggttgt tttatttgat + 8641 aaaagtatct atagatatcg tctaggaaca gagacacaaa gcattagtat ggcgagttat + 8701 attaaaaatc gtgatatgca taaacaagtg atctatcatt tggttgattt ttataatcaa + 8761 atgagatcta gcgctgtttt aaggagaata acatggaaat tgattttaaa tttaataaga + 8821 cagcaatgga taatttattt taatttatct aaaaaagagg ggaaaaacag cgagtgtttt + 8881 gaatttgata attggctaat aaaagaagga cggataaaaa aaataccact atactttttt + 8941 aaagctgtga aatatatcag atttaaggtg aaatattttc tggggataag aaaataatat + 9001 gagaaaaata ggaaaagtaa taaacgagta ttttgtatta agaaaatcat ttactcctgc + 9061 tattgctcgg aataaattat ttgaaaagtt ttggggacgg atagggaatt ataaaatttt + 9121 caataatata 
gctagtaatt tttatcaata caaacatgaa acaatcataa attttttgga + 9181 aaaagatttt agccaatttt taaaatccta taactttaaa gaggtatcgc acaaggagat + 9241 agaacaaaga aaaatcttct ctatgtggat acaaggatac gaaagtgctc ctaagttggt + 9301 tcagaagacg attgatagcc aaaggaaata tgcagaaaaa tacggatata aatttgtttt + 9361 tttggatgaa aacaatatcc gtgaatatgt gacacttcca tcagagatag tagaaaaata + 9421 tgagaatgga actatagatt ttataaaata ttcggatgtt gtaaggggaa cattgctttc + 9481 aaaatatgga ggagtgtggt tagattcgac tatttatgtt gattcttcac gagaactgaa + 9541 ttatttaaaa aaagattttt atactattcg agcaaagaca catgagagag tgcccaaata + 9601 tatcgcaaat ggtaggtggt ctgcattttg tttgtcaggg gaaaagcaaa acatagtatt + 9661 tgatttttta gagaaatttc atgtagcata ttttatgaaa tacgatatag tgctagatta + 9721 ttttttaatt gactatatta tagaattagg ttataggaca aatgacttga ttagaaacta + 9781 tattgataaa gtcgaagaaa ataatcagga gttgttcttt ttggcagaca atttttctaa + 9841 ccagtatgat gaaaaagagt gggcaggagt tttatcaaca actgcattgt ttaagtgtag + 9901 ttataagtgt ccgataaatg aagcgacagg aacctatttt gatagattga tgaagggtga + 9961 actgtagcat aaagagaggg aatggtatga tttcagttat tgttccagta tacaatgtcg + 10021 cggattatct gcgctttgcg ttggatagtc ttttggaaca gacgtataaa gattttgagg + 10081 ttattctagt aaatgatgga tccactgata attctgggga aatatgtgat gaatatggga + 10141 aactgtatga taatattcat gttttccata agaagaatgg cggactttcg gatgctagaa + 10201 attttggttt ggagaagagt cgaggagagt ttataacttt tcttgattca gatgattatt + 10261 ttgaaccgta tgcattagaa ttgttaatta ctattcaaaa aaaatatgat gtagatatcg + 10321 tatcaactaa agggggaata acctattctc atgatattta tagcaaaaaa ctgatggctg + 10381 aggactacct aactgtaaaa atattgacaa ataaagaatt tttggcagct gtatattata + 10441 acgatgaaat gacggtatct gcttggggaa aattgtataa aagagattta tttaaaacga + 10501 tttttccaaa aggaaagatc tacgaggatt tgtatgttgt tgcagagcgt ttgttgaata + 10561 ttaaaacagt tgctcatacc gatttgccta tatatcatta ttatcagaga cagggaagta + 10621 ttgttaattc aacattttcg gatagacagt atgatttttt tgatgcgatt gatcataatg + 10681 aagccataat aaaaaaattc tattgtggag ataaggaatt gttagcagcc ttaaatgcta + 10741 aaagagtaat tggctccttt 
attttgagta atagcgcatt ttataatagt aaaaacgata + 10801 ttactaaaat aataagaata attaaaccgt attattggga agtaataaaa aataaaaaaa + 10861 ttccaatgaa aaggaaagtt caatgtgttt tgtttctgct ttccccaaat tactactata + 10921 aaataaaaga taagatgtta cagagaggca ggatatagat gcatgttaga ttagatggtt + 10981 tgctggacta tatatttcta tttagtgtga ttattacttg taatactatg tattcaacta + 11041 gtcaaggatt tgatggacta gggaaatggg cgactctgtt acttgtggta tcagtttttc + 11101 tgaaattgct tatctctaga atatctatga aggcaatcaa tgtgattgtg tcgcgttctt + 11161 taatatttat attaattatt ctactcatag taatattaaa tggttttaag atttctgaga + 11221 caagtttcgt ctattatttt gtattatttc cgatttttat gatgattttg cagatgtact + 11281 atgatgttaa tgaaatcgca aatctgatac ggaaatttgt tcgtataata tttcttttag + 11341 caattggctc tctcctattt tggcttattg gtagtgtatt tcatattata tccccaacgg + 11401 tttatgtgtt gaattattgg aatggtgggg gaatagtaga agggtactat aatcttcatt + 11461 ttgaagcaca aaaaatagag attttggggg cgatactgat aagaaatacg gggatttttg + 11521 ctgaagcacc tatgtggagt ttggtattga gccttgcatt gatatttcaa acgcttcata + 11581 taaaaaaatg gaatttcaca acttggactc ttattattac aattatgaca actacgtcaa + 11641 caacaggggt ttatataata ggtttgattt tcctatatgt tttattttca aaaacaagtg + 11701 gtgtgaagag atatgtttct agtttattta ttttagcgat tatatgttgt ttttcaatat + 11761 tatgggataa taaatctgga actggttcag caactatacg ctttgatgat tataaggctg + 11821 gttttttggc atggcagaaa agtcctattt ggggattagg tatttcagac ggtcttagaa + 11881 ccattgaaca acatatggat agaactgtta gatataatct tgggtatagc aatagctttt + 11941 ttgttgtttt agctcaagga gggataatgt tggcttcgta ttacttttat ccagtaatta + 12001 aaattatttt gaataaattt agttcgaatg atttgaagtt ttctgcgcta ttaataattt + 12061 tccttatgat aactactata tttatagaga cctatatgtt tttatttgtc atttctttat + 12121 actattctct tgattttggg gacgatagag attgtcatga gaaacagtac attactaatt + 12181 aataataaag gtgtgaacag aaataagaag aaatgaaaat actaaaaaac tatgcctaca + 12241 atctttctta tcaattgttg gtgatcatac tccctatcat tacgactccc tatgtaacga + 12301 gggtttttag ttctgacgat ttaggaacgt atggctactt tagctccatt gttacctatt + 12361 ttaccttgct tgcaactctt 
ggtgttgcca actacggtac caaagagatt tcagcacatc + 12421 gtaaggaaat tgggaagaat ttctggggaa tttattctct ccagtttggt gcaacttggc + 12481 tatccatttt gctttatctt gccctttgtt tcttatttac ttcaatgcaa aatccggtag + 12541 cttatatatt gggattaagt ttagtgtcaa aaggtttgga tatttcttgg ttatttcaag + 12601 gtttggagga ttttagaaag attacagttc ggaacatcac tgttaagtta gttggtgcaa + 12661 tctctatttt cctatttgta aaatcagcta atgacttata cttatatgta tttcttctta + 12721 ccattttcga attgttaggg caattaagca tgtggttacc cgcaagacaa tttattggta + 12781 aatcatattt tgattggaaa tacgctaaga agcatttgaa accagttatc ttgttattct + 12841 tgccacagat tgccatctcg ctttatgtga ctttggaccg tacgatgctg ggggtgttgg + 12901 cttcgacaaa ggatgttgga atttatgatc aagctttgaa gcttgttaat attttactga + 12961 ctttggttac ctcactgggg agtgttatgt tgccacgagt atctagcctt ttatcgtctg + 13021 gggattacaa agccgttaat aagatgcacg agatgtcttt tttaatctat aacttggtga + 13081 ttttcccaat catagcagga atgttgattg tcaacgatga ttttgttcgt ttcttccttg + 13141 ggcaaaattt tcaagatgct cgctatgcga ttgctattat gaccttccgt atgttcttta + 13201 ttggttggac caatataatg ggaattcaaa tcttgattcc gcacaataaa aataaggaat + 13261 ttatggtttc aacgacagtt cccgctattc tgagtgtggg attgaatttg ttgcttcttc + 13321 cccaatttgg ttatataggt gctgcgattg tttcagtttt gactgaggcg tttgtatggg + 13381 ggattcagtt attctataca cgtttttatt taaaagaagt tcctattatc ggttcaatga + 13441 caaaaactgc acttgcatct gctgttatgt atggtctctt gctaggttca aaaacatcta + 13501 tacatttttc gccaaccata aatgttttaa tattttcggt gctaggcgga attatctatc + 13561 tttttgcaat tctatctctg aaagtggtag atgtgaaaga attaaaacaa ataatcagga + 13621 aaaattagaa tgagcaaatt tcgaaatatt aacttagatt tactaaaagt gcttgcatgt + 13681 gttggagtcg ttctacttca tacaactatg ggtgggttta aagagacagg tgcatggaat + 13741 tttttgacat atttatatta cttaggaacc tattctatcc ctctattttt tatggtcaat + 13801 ggttatttat tgttggggaa gagagaaatt acctattcct acatattgca aaaaataaaa + 13861 tggctcctaa taacagtgtc gtcatggact tttatcgttt ggctgtttaa aagagacttt + 13921 acagagaact taattaaaaa aattataggt tctttgatac aaaaggggta tttcttccag + 13981 ttttggtttt tcggtgcact 
catacttatc tatttatgtt tgccaatttt gagacaattt + 14041 ctaaattcaa aaagaagcta tttatacagt ttatctttat tgatgactat tggtttgatt + 14101 tttgagttat caaatatcct acttcaaatg ccaatacaaa catatgtaat acaaactttt + 14161 agattatgga cgtggttttt ttactatctt ttaggtggtt atatagcgca attcactata + 14221 gaagaaatcg aatcaaggtt taagaattgg atgaaaatag ttagcatact tttgttattg + 14281 atttcaccaa taatattatt tttcatagcg aagactatat accataatct atttgctgaa + 14341 tacttttatg atactttatt tgtaaaagtc agtactttag gaatttttct aactatcctc + 14401 atgcttactt tgaatgaaaa ccgaagagaa tcgattgttt ccctttctaa tcaaacaatg + 14461 ggggttttca taatacatac ttatattatg aaagtgtggg aaaaagtgct tggttttaat + 14521 tttgtaggag catatttact ttttgctcta tttactttaa gtgttagttt tattattgtt + 14581 gggatgttaa tgaagattcc ttacttcaat cgaatcgtca aattataaaa aggagaacaa + 14641 gatgtacgat tatcttattg tcggtgctgg tttgtcagga gcaatttttg cttatgaggc + 14701 gaccaagcgt ggaaaaaaag taaaagtgat tgataaacgt aaccacattg gtgggaatat + 14761 ctactgtgag aatgtagaag gagttaatgt tcataaatat ggtgcccata tctttcatac + 14821 ttctaataag aaagtttggg attatgttaa tcaatttgct gaatttaaca actacgtcaa + 14881 ctcgcctgta gctaattaca agggtagcct ctataatcta cctttcaata tgaatacctt + 14941 ctatgctatg tgggggacaa aaactcctca agaagtcaaa gataagatta ctgagcagac + 15001 agctgatatg aaggatgttg agccgaaaaa tctggaagaa caggctatca agttgattgg + 15061 tccagatgtc tatgaaaagt taatcaaggg ttatactgaa aagcagtggg gacgctcagc + 15121 aacggaactt cctccattta tcattaaacg tcttccagtt cgtttaacat ttgataataa + 15181 ctattttaac gaccgttacc aaggaattcc tattggtggt tacaatgtca tcatcgaaaa + 15241 tatgcttaaa gacgttgaag ttgagcttgg tgttgatttc tttgctcatc gtgaagagtt + 15301 agaagcatca gctgaaaaag ttgtctttac agggatgatc gaccagtatt ttggctacaa + 15361 gcacggagag ttagaatacc gtagccttcg ctttgatcat gaaattttgg acgaggaaaa + 15421 ttatcaagga aatgctgtag tgaactatac ggagcgtgag attccttata ctcgtattat + 15481 cgaacacaag cattttgaat atggaacaca ggcaaagaca gttatcacgc gtgaatatcc + 15541 agctgactgg aagcgtgggg acgagcctta ctatccgatc aacgatgaga aaaataatgc + 15601 tatgtttgct aagtaccaag 
aggaagcttc aaagaatgat aaggttattt tctgtggacg + 15661 tttagcagat tataaatatt acgatatgca tgtggtgatt gaacgggcgc ttgaggttgt + 15721 ggagaaagag tttggatatg acaaaaagta gaatcaattg gatagatttt ggaaaaggct + 15781 tttccatatt tttagtctta gcaggacatg tgttgcttgg actgtatcaa tcggaaaaat + 15841 ttcccacagc aaataacata ctatcgttgt tgatagcaca agtctacata tttcatatac + 15901 cagtattttt tgccttatca ggatactttt tcaaacctgt gtcggatttg aaggagttct + 15961 ggcaatatgc taaaaagaag acaattgttt ttggtctgcc atatattttc tattcgatca + 16021 ttcactttgg tcttcaaaaa gttgcagggg cgactgttag agtcccgacg actatatttg + 16081 atttaataaa tatctataaa aatcctattg gagtctcatg gtatttatac atactctggt + 16141 cgattttgat aatgtatgga ttagtatcta tatttaatca aaaatcgtag aatattattt + 16201 ttgataagtg tttttgctta ttgtttaacc ctatttgttc aaacagatat ttatattatt + 16261 caaagaacgc tagtttgggg tatttgtttc tttcttggaa gtgtattgaa cgaaattcac + 16321 tttaataaaa ttagtttgaa aaaatttctt gttttctttg tgatatttga ctttatttat + 16381 atgcttgtat ggttcttatt ttatgaagta gagtctaaaa gggatagtgt aagctatagt + 16441 aacccagggg tgtgggggat tgcttttatt gtctgtatat tagttgcgtt tgtaatcttc + 16501 cctaaaatat cggaaaaatt tcctaaaact ttcctatatt tcactaaata tggtaaagat + 16561 agtttaggta tctatatcct ccatgcacca atttgtagca tgattcggat tctaatgttg + 16621 aaagtgggaa taaactcagt ttttcttcac gttgttgttg ggattgtctt gggttggtat + 16681 ttatccatac tggcaactta tatattgaaa aaaattccat ttttgaatat tgttttatta + 16741 ccacaaaagt atattaaatt aaaataaatt attttagatt tataatgtgg ctctttgtca + 16801 actaacatct ggagaggaca atcactgtct tctccttttt tttcttttca gaatatacca + 16861 aattaacaca aaaattctga aaattctgtt gacaactttc tgaaaagagt ctataatgga + 16921 gagaaagttt taaaggagaa aatgatgaaa agttcaagac tacttgccct tgcgggcgtg + 16981 acattattg +// + diff --git a/public/res/serotype_genbank/serotype_33G.gb b/public/res/serotype_genbank/serotype_33G.gb new file mode 100644 index 0000000..40e4f06 --- /dev/null +++ b/public/res/serotype_genbank/serotype_33G.gb @@ -0,0 +1,676 @@ +LOCUS OR509570 22028 bp DNA linear BCT 09-OCT-2023 +DEFINITION 
Streptococcus pneumoniae strain PMP1486 capsular polysaccharide + gene locus, complete sequence. +ACCESSION OR509570 +VERSION OR509570.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 22028) + AUTHORS Manna,S., Werren,J.P., Ortika,B.D., Bellich,B., Pell,C.L., + Nikolaou,E., Gjuroski,I., Lo,S., Hinds,J., Tundev,O., Dunne,E.M., + Gessner,B.D., Bentley,S.D., Russell,F.M., Mulholland,E.K., + Mungun,T., von Mollendorf,C., Licciardi,P.V., Cescutti,P., + Ravenscroft,N., Hilty,M. and Satzke,C. + TITLE Streptococcus pneumoniae serotype 33G: genetic, serological and + structural analysis of a new capsule type + JOURNAL Unpublished +REFERENCE 2 (bases 1 to 22028) + AUTHORS Manna,S., Werren,J.P., Ortika,B.D., Bellich,B., Pell,C.L., + Nikolaou,E., Gjuroski,I., Lo,S., Hinds,J., Tundev,O., Dunne,E.M., + Gessner,B.D., Bentley,S.D., Russell,F.M., Mulholland,E.K., + Mungun,T., von Mollendorf,C., Licciardi,P.V., Cescutti,P., + Ravenscroft,N., Hilty,M. and Satzke,C. + TITLE Direct Submission + JOURNAL Submitted (31-AUG-2023) Infection and Immunity, Murdoch Children's + Research Institute, 50 Flemington Road, Melbourne, VIC 3052, + Australia +COMMENT ##Assembly-Data-START## + Assembly Method :: Spades v. 
3.15.4 + Sequencing Technology :: Illumina + ##Assembly-Data-END## +FEATURES Location/Qualifiers + source 1..22028 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="PMP1486" + /serotype="33G" + /isolation_source="nasopharynx" + /db_xref="taxon:1313" + /geo_loc_name="Mongolia" + misc_feature 1..22028 + /note="capsular polysaccharide gene locus" + gene 1..1608 + /gene="dexB" + CDS 1..1608 + /gene="dexB" + /codon_start=1 + /transl_table=11 + /product="glucan 1,6-alpha-glucosidase" + /protein_id="WNT95315.1" + /translation="MQEKWWHNAVVYQVYPKSFMDSNGDGVGDLPGITSKLDYLAKLG + ITAIWLSPVYDSPMDDNGYDIADYQAIATIFGTMEDMDQLIAEAKKRDIRIIMDLVVN + HTSDEHAWFVEACENTDSPERDYYIWRDEPNDLDSIFSGSAWEYDEKSGQYYLHFFSK + KQPDLNWENEKLRQKIYEMMNFWIDKGIGGFRMDVIDMIGKIPDEKVVNNGPMLHPYL + KEMNQATFGAKDLLTVGETWGATPEIAKLYSDPKGQELSMVFQFEHIGLQYQEGQPKW + HYQKELNIAKLKEIFNKWQTELGVEDGWNSLFWNNHDLPRIVSIWGNDQEYREKSAKA + FAILLHLMRGTPYIYQGEEIGMTNYPFETLDQVEDIESLNYAREALEKGVPIEEIMDS + IRVIGRDNARTPMQWDESKNAGFSTGQPWLAVNPNYEMINVQEALANPDSIFYTYQKL + VQIRKENSWLIRADFELLDTADKVFAYIRKDGDRRFLVVANLSNEEQDLTVEGKVKSV + LIENTLAQEVFEKQILVPWDAFCVELL" + CDS complement(1916..2272) + /codon_start=1 + /transl_table=11 + /product="transposase" + /protein_id="WNT95316.1" + /translation="MVAGLTNGELIAPMTYEETMTSDFFEAWFQKFLLPTLTTPSVII + MDNARFHRMGKLELLCEEFGHKLLPLPPYSPEYNPIEKTWAHIKKHLIKGITKLQYLL + RGSFVLFLFQLTILSV" + CDS complement(2451..2780) + /codon_start=1 + /transl_table=11 + /product="IS630 family transposase IS630-Spn1" + /protein_id="WNT95317.1" + /translation="MAYSIDFRKKVLSYCERTGSITEASHVFQISRNTIYGWLKLKEK + TGELNHQVKGTKPRKVDRDRLKNYLTDNPDAYLTEIASEFGCHPTTIHYALKAMGYTR + KKEPHLL" + gene 3014..4459 + /gene="wzg" + CDS 3014..4459 + /gene="wzg" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="WNT95318.1" + /translation="MSRRFKKSGSQKVKRSVNIVLLTIYLLLVGFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLVIYKKAEKFTIFLLLFSILVSSVSLFAVQQFVGLTNR + 
LNATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGIDVYNDQ + EFTAHTNGKYYPAGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIIDSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRMDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + gene 4461..5192 + /gene="wzh" + CDS 4461..5192 + /gene="wzh" + /codon_start=1 + /transl_table=11 + /product="tyrosine phosphatase Wzh" + /protein_id="WNT95319.1" + /translation="MIDIHSHIVFDVDDGPKSREESKTLLAEAYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDILDKLEKKRIPTLNDS + RYALIEFSVNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEQDLVHVIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + gene 5201..5893 + /gene="wzd" + CDS 5201..5893 + /gene="wzd" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="WNT95320.1" + /translation="MKEQNTIEIDVFQLVKTLWKRKLMILIVALVTGAGAFAYSTFIV + KPEYTSTTRIYVVNRNQGDKPGLTNQDLQAGTYLVKDYREIILSQDALEKVATNLKLD + MSAKTLASKVQVAVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDVT + TLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIELLDTRVKRPEDVEDVLQIP + LLGLVPDLDKMK" + gene 5903..6592 + /gene="wze" + CDS 5903..6592 + /gene="wze" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="WNT95321.1" + /translation="MPTLEISQAKLDFVKKAEEYYNALCTNLQLSGDGLKVFSITSVK + IGEGKSTTSTNIAWAFARAGYKTLLIDGDIRNSVMLGVFKARDKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRKCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGVVLNKFDTSVDKYGSY + GNYGDYGKNKK" + gene 6607..7974 + /gene="wchA" + CDS 6607..7974 + /gene="wchA" + /codon_start=1 + /transl_table=11 + /product="initial transferase WchA" + /protein_id="WNT95322.1" + /translation="MNGKIVKSSLAIIQSFLVILLTYLLSAVREVEIVSTTAIALYIL + HYFVFYISDYGQDFFKRGYLIELVQTLKYILFFALAINISNFFLEDRFSISRRGMIYF 
+ LTLHALLVYVLNLFIKWYWKRAYPNFKGSKKILLLTATSRVEKVLDRLIESNEVVGEL + VAVSVLDKPDFQHDYLKVVAEREIVNFATYEVVDEVFINLPSEKYNIGELVSQFETMG + IDVTVNLNAFDRSLARNKQIRKMAGLNVVTFSTTFYKTSHVIAKRIIDIMGALVGLIL + CGLVSIVLVPLIRKDGGSAIFAQMRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQISGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVLM + KDGAK" + gene 7976..8767 + /gene="wciB" + CDS 7976..8767 + /gene="wciB" + /codon_start=1 + /transl_table=11 + /product="glycosyltransferase WciB" + /protein_id="WNT95323.1" + /translation="MIDVKIIVATHKEVKMPQDNSLYLPIHVGRDGKSDIGFIGDNTG + DNISSLNPYYCELTGLYWAWKNLDYNYLGLVHYRRYFTNKSQGYNENVNMDDVILSRS + NVEILLEKSDIIVPKKRKYYIETLYSHYAHTLNGEHLDLARKIIEQNSSEYLSSFDKV + MKQRSGYMFNMFIMKKELLDDYLPWLFSILDTMYEQMDLTDYTPFESRLFGRVSELLF + NVWLCKQGITPKEVPFMYMERVDLFEKGKSFLMAKFFGKKYGQSF" + gene 9415..10320 + /gene="wcrB" + CDS 9415..10320 + /gene="wcrB" + /codon_start=1 + /transl_table=11 + /product="glycosyltransferase WcrB" + /protein_id="WNT95324.1" + /translation="MGLSTVTLFKNLKFSDSKFIKLEGELLLKYQEYLLKIMEDIVTV + CEEEGLYYSLSGGSALGAYRHKGFIPWDDDMDIFMLGSEREIFFQKFSQKFSDKYWIH + NSQTPNYGMPIGRIRQKGTVLRGREDVGVEECGFFIDIFWLENVPNSKILRQLHGFLC + MAIGLLLSCRNFYKNRQLMLEIMKEHKEVRLVFRIKLVLGFLISFISLRQFTRLTERI + YSLCKNNESRYLSVPSGRKHYFGEMFIREDMQLTRKLNFEGHKWNVPNNIEHYLTVMY + GDYMKIPAVEDRESHIILEISFPNE" + gene 10359..11447 + /gene="wcrC" + CDS 10359..11447 + /gene="wcrC" + /codon_start=1 + /transl_table=11 + /product="glycosyltransferase WcrC" + /protein_id="WNT95325.1" + /translation="MKKIAIVRYNLSKIGGAEKVAINMANELSQYYDVKLLSILLDED + GFINYDINPNVTLINFHKGDLRIRTATLKLTGKLRNYIKREKIEVIFSITPLTNTMVR + LATLGLNVKIVFCDHHSLEFRDFRGREVQRFVGAKFFDKIVTLTEEDRIKYSDKYNIP + INKVNAIYNWIDEEDSENTPFDNETNKIITVGRFHSQKGYDYLAEVAIKVLSQHPDWQ + WDIYGSGDKLIEQDLKRKLEEGCVSSQVNFKGNVKGTENIYPNHSIYVMTSRHEGLPL + VLLEAQQYNLPIVSFRCPTGPSEIVEDGVNGFLIDCYDVYQMSEKLLELMKNDDLRQS + FSEHAKDNIDKFDKNEILNQWIELIDTI" + gene 11456..12460 + /gene="wcrD" + CDS 11456..12460 + /gene="wcrD" + /codon_start=1 + 
/transl_table=11 + /product="glycosyltransferase WcrD" + /protein_id="WNT95326.1" + /translation="MQECLLTIIMPSYNIQDYISKGIESFQQVHLDYKQKFEILIVND + GSTDDTAKVAEETLRKDLLLNGRIITKENGGHGSTINRGIQEAKGKFFKVIDGDDWVI + PSEFEKFLDDLTVTEVDMILTDFTEQHVYNNTTVRNDFVEKYEVGKEYSGIPEKRIPM + HSVTYRTSILVENEIRLSEKTFYVDIQYTLFPLEYVHSFCYWNYDVYQYYIGRPEQSM + NIESMKRNVRHHLTVTNSVLTYFSKIADDPVLKKVVADTLVYLISLQIDLSWMVEDSK + TLSEELYRQIEQSSYEYIPTKKFDRLSYLNYKFHYFLDFVFNPVLKKYSKKKEKERGI + " + gene 12462..13415 + /gene="wciF" + CDS 12462..13415 + /gene="wciF" + /codon_start=1 + /transl_table=11 + /product="glycosyltransferase WciF" + /protein_id="WNT95327.1" + /translation="MFISVVVPVYNVFDYLHFAMDSLIKQTYQNFEVILVNDGSTDNS + PQLCEEYAKQYENVSVFHKENGGLSDARNFGVSKASSDWIFFLDPDDYLEDYTLELIV + KIQQEYQANLISTKVKATSKYNDYSLYQLEESDYKDLFVVTKEKALELMLDDKIATVS + ACAKLYHKNILEKVPFSVGKIYEDFYVVADHLALADKIVISPLETYNYYRREGSIVRS + TFTEKRYDFFDAVSKNEEVINKEYTQSLELQQSLQAKKLRGGFVVIGAKADSGLTDFS + KDRDLLKVDFKNMLLNKKISWKLKLKYTIFMLSSKMYLRLR" + gene 13922..15115 + /gene="wzy" + CDS 13922..15115 + /gene="wzy" + /codon_start=1 + /transl_table=11 + /product="polymerase" + /protein_id="WNT95328.1" + /translation="MKINLMNIVDTLLLLLIIIKTNSIYLYIGVENKLNFYLIVVITI + AVLLEVISGRLSLQYLKKMLLVIVLYFFAIIINILVSASVISSNILTYYFIVVPLMLI + LVMYKYYKNTLTNFLVIFVRIVLILAVISLLFWCFGSVLNIIKPTNYVVSSWSGGQVT + TSYYNLYFETQNALFLGYKMIRNSGIFAEAPMWSLLLSVALIFQELLLKHSTRIFVLL + MLTIFTTASTTGFFIVGSLLIYKVINQKRSWFKYINLTSIPVLIFTLVKVWGEKSDSA + SASIRYDDYVAGFLAWKNHFIFGSGLSSGIRAIESYMDTTIRSNLGYSNSFFVILAQG + GIILGVLHFYPVVSVLLKRFSSNSKMLALLFIILIFTAIFTDTPLFILFVGIFYALIL + NRENT" + gene 16194..17609 + /gene="wzx" + CDS 16194..17609 + /gene="wzx" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="WNT95329.1" + /translation="MKVLKNYAYNLSYQLLVILLPIITTPYVTRVFSSDDLGTYGYFN + SIVTYFILLATLGVANYGTKVISGHRKQIQKNFLGIYSLQLGATVLSLSLYALLCLTL + PFMQNPVVYILGLSLVSKGLDISWLFQGLEDFRKITVRNITVKLVGVISIFLFVKSSN + DLYLYVFLLTIFELLGQFSMWIPAREFIGRPHFDIEYARHHLKPVILLFLPQVAISLY + 
VTLNRTMLGALASTKDVGIYDQALKLVTILLTLVTSLGSVMLPRVAHLLATDDHKAVN + RMHEMSFLIYNLVIFPMMAGILIVNDDFVQFFLGQDFQDARYAIAIMIFRMFFIGWTN + IMGIQMLIPHNQNKEFMISTTAPAIISVGLNLLFLPKLGYIGAAIVSVLTEALVWAIQ + LFYTRRYLKEVPIIGSMSKIILASAIMYGLLLSSKTVIHFSPTLNVLAFAALGGIIYL + FAILSLKVVDVKELKQIIRKN" + gene 17611..18609 + /gene="wciG" + CDS 17611..18609 + /gene="wciG" + /codon_start=1 + /transl_table=11 + /product="O-acetyltransferase WciG" + /protein_id="WNT95330.1" + /translation="MRKIRNINLDLLKVLACVGVVLLHTTMGGFKETGSYNLLAYLYY + LGTYSIPLFFMINGYLLLGKREITYLYILQKVKWILITVSSWTFIVWLFYRDFTTNPI + KKIVGSLIQRGYFSQFWFFGALILIYLCLPIVRQFLNSKRSYLYSLSLLMTIGLIFEL + LNILLQMPIQTYVIQTFRLWTWFFYYLLGGYIAQFTKEEIESRFKNWMKIASILLLLI + SPIILFFIAKTTYHNFFAEYFYDILLVKVVSVGIFLTIFSLVLNENSNKWIIFLSNQT + MGIFIIHTYIMKVWEKLFGFSFIGSYLLFAIFTLSVSFIIVGMLMKIPYFNRIVKL" + gene 18622..19725 + /gene="glf" + CDS 18622..19725 + /gene="glf" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase" + /protein_id="WNT95331.1" + /translation="MYDYLVVGAGLFGAVFAHEAALKGKKVKVIEKRNHIAGNIYTRE + EEGIQVHQYGAHIFHTSDKEIWDYVNQFAEFNRYTNSPVANYKGEIYNLPFNMNTFNK + LWGVVTPAEAQAKIEEQRAILNGKTPENLEEQAISLVGTDIYEKLIKDYTEKQWGKPT + TELPSFIIRRLPVRLTYDNNYFNDTYQGIPIGGYTQIVEKMLDHENIDVETNVDFFVN + KEQYLKDFPKIVFTGMIDEFFDYKLGELEYRSLRFENETLDMENYQGNAVVNYTDAET + PYTRIIEHKHFEFGSQAKTIITKEHSKTWEKGDEPYYPVNNDRNNHLYKSYKKLADEQ + GNVIFGGRLGHYRYYDMHQVIGVALQCVRNELN" + gene 20046..22028 + /gene="aliA" + CDS 20046..22028 + /gene="aliA" + /codon_start=1 + /transl_table=11 + /product="oligopeptide-binding protein AliA" + /protein_id="WNT95332.1" + /translation="MKSSKLFALAGVTLLAATTLAACSGSGSSTKGEKTFSYIYETDP + DNLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKDA + KWYTSEGEEYAAVKAQDFVTGLKYAADKKSDALYLVQESIKGLDAYVKGEINDFSQVG + IKALDEQTVQYTLNKPESFWNSKTTMGVLAPVNEEFLNSKGDDFAKATDPSSLLYNGP + YLLKSIVTKSSVEFAKNPNYWDKDNVHIDKVKLSFWDGQDTSKPAENFKDGSLTAARL + YPTSASFAELEKSMKDNIVYTQQDSITYLVGTNIDRQSYKYTSKTSDEQKASTKKALL + NKDFRQAIAFGFDRTAYASQLNGQTGASKILRNIFVPPTFVQADGKNFGDMVKEKLVT + 
YGDEWKDVNLADSQDGLYNPEKAKAEFAKAKSALQAEGVTFPIHLDMPVDQTATTKVQ + RVQSMKQSLEATLGADNVVIDIQQLQKDEVNNITYFAENAAGEDWDLSDNVGWGPDFA + DPSTYLDIIKPSVGESTKTYLGFDSGEDNVAAKKVGLYDYEKLVTEAGDEATDVAKRY + DKYAAAQAWLTDSALIIPTTSRTGRPILSKMVPFTIPFALSGNKGTSEPVLYKYLELQ + DKAVTVDEYQKAQEKWMKEKEESNKKAQEDLAKHVK" +ORIGIN + 1 atgcaagaaa aatggtggca taatgccgta gtctatcaag tctatccaaa gagttttatg + 61 gatagtaatg gagatggagt tggtgatttg ccaggtatta ccagtaagtt ggactatcta + 121 gctaagttag gaatcacagc gatttggctt tctcccgttt atgacagccc tatggatgat + 181 aatggctacg atattgctga ttatcaagcg attgcaacga tttttggaac catggaggat + 241 atggatcaac tgattgcgga agctaagaag cgtgacattc gtatcatcat ggacttggtg + 301 gttaatcata cctcagatga acatgcttgg tttgtcgaag cctgtgaaaa tactgatagc + 361 cctgagcgag actactatat ctggcgcgat gaacccaatg acctagattc tatctttagt + 421 gggtctgctt gggaatacga tgaaaagtca ggtcaatact atctccactt tttcagcaag + 481 aaacagccgg atctcaactg ggaaaatgaa aaacttcgcc agaaaattta tgagatgatg + 541 aacttctgga ttgataaagg tattggtggt ttccgtatgg atgttattga catgattggc + 601 aaaattcctg acgagaaggt agtcaataat ggtcctatgc tccatcccta tctcaaggaa + 661 atgaatcagg cgacctttgg agctaaggat ctcttgacag taggggagac ttggggagca + 721 acgccagaga ttgccaagct ctactctgat ccaaaggggc aagaattgtc tatggtcttc + 781 cagtttgaac atatcggtct tcagtatcag gaaggtcaac ctaaatggca ctatcaaaaa + 841 gagctgaata tcgctaagtt aaaagaaatc ttcaacaaat ggcagacaga gttaggagtt + 901 gaggacggct ggaattccct cttctggaac aaccatgacc tccctcgtat tgtctcaatc + 961 tggggaaatg accaagaata ccgcgaaaaa tctgccaaag cctttgcaat cttacttcat + 1021 ctcatgagag gaactcctta tatctaccaa ggtgaggaga ttgggatgac caactatccg + 1081 tttgaaacac tggatcaagt agaagatatt gaatccctca actatgcgcg tgaggctctt + 1141 gaaaaaggtg ttccgattga agaaatcatg gacagtatcc gtgttattgg acgtgacaat + 1201 gcccgtaccc ctatgcaatg ggacgagagc aaaaacgctg gtttctcaac aggtcaacct + 1261 tggttggcgg ttaatccaaa ttacgagatg atcaatgtcc aagaagcgct ggcaaatcca + 1321 gattctattt tctataccta tcagaaactg gtccaaattc gcaaggagaa tagctggcta + 1381 attcgagctg actttgaatt gcttgatacg gctgataagg 
tctttgctta tatacgtaag + 1441 gatggcgacc gtcgcttcct agttgtggct aacttgtcca atgaagagca agacttgaca + 1501 gtagaaggaa aagtcaaatc tgtcttgatt gaaaacaccc tagctcaaga agtctttgaa + 1561 aaacaaatct tagttccatg ggatgctttc tgtgtggaat tactataaat attttttgca + 1621 gaaaaattta aaattgaaat cgtataaaaa caagggagga ctgtataaaa gtcagaaatc + 1681 ctttgttttt tataaccaag gtttataaac tttcattctc gaaattcaat taactttaca + 1741 aattcccact attaaggaga aagaagatga acataaagaa gcgtgtcctt agtgcaggcc + 1801 tggcttttgc atctgctttg cttttagctg cttgcggcca atcagattca gatacaaaaa + 1861 cttactcatc aacctttagt ggaaatccaa ctacatttaa ctatctatta gactattaca + 1921 ctgataatat agtcaattga aacaagaaca agacaaaaga gcctcgtaaa aggtattgca + 1981 acttggtaat accttttatg aggtgctttt tgatatgagc ccatgttttc tcaataggat + 2041 tgtactcagg tgagtaggga ggaagaggta aaagtttatg accaaactcc tcgcataaaa + 2101 gttctaactt acccattcta tggaatcttg cattatccat aataataacc gatggtgtgg + 2161 ttaatgttgg taagagaaat ttctgaaacc aagcttcaaa aaagtcgctc gtcatcgtct + 2221 cttcgtaagt cattggagcg attaactcac catttgttag acctgcaacc aaagaaatcc + 2281 tctgatatct tcttccagat actttacctc ttcttaactg accttttaat gagcgaccat + 2341 attctcgata aaaataagta ttgaatcctg tttcatcaat ctaaacaggt gctaagtgct + 2401 ttaaactatt aaaattctta agaaataagg ctactttttc tgggtcttgt tcatagtagg + 2461 tgtggttctt tttttcgagt gtagcccata gctttgagcg catagtggat ggtagttgga + 2521 tgacagccaa attcagaagc tatttcagtc aaataagcgt ctggattgtc agtaagatag + 2581 tttttaagtc tatctctatc aacttttctt ggttttgttc cttttacttg gtggtttagc + 2641 tctcctgttt tctcttttag ctttaaccag ccataaatgg tattacgtga gatttggaaa + 2701 acgtgtgatg cttctgttat actacctgtt cgctcacaat aagagagaac ttttttacga + 2761 aaatctattg aatatgccat aaaaagatta taccacattg tgtactatat tagattgaaa + 2821 ctagaatagt acacatctgc ttctaaaaca ttgttagaaa tcgatttgac tgtccttatt + 2881 tcattttatt atatttttgg ttcgcgggaa gtctactaag atacttaaag atgcagatag + 2941 tgaaaataaa ggtgtagaca ttaccgtaaa aaagtgatat aattgtatga tgttcaatgt + 3001 ataggtgtta atcatgagta gacgttttaa aaaatcaggt tcacagaaag tgaagcgaag + 3061 
tgttaatatc gttttactga ctatttattt attgttagtt ggttttttat tgttcttaat + 3121 ctttaagtac aatatccttg cttttagata tcttaaccta gtggtaactg cgttagtcct + 3181 actagttgcc ttggtagggc tactcttggt tatctataaa aaagctgaaa aatttactat + 3241 ttttctgttg ctgttctcta tccttgtcag ctctgtgtcg ctctttgcag tacagcagtt + 3301 tgttggactg accaatcgtt taaatgcgac ttctaattac tcagaatatt caatcagtgt + 3361 cgctgtttta gcagatagtg atatcgaaaa tgttacgcaa ctgacgagtg tgacagcacc + 3421 gactgggact gataatgaaa atattcaaaa actactagct gatatcaagt caagtcagaa + 3481 taccgatttg acggtcaacc agagttcgtc ttacttggca gcttacaaga gtttgattgc + 3541 aggggagact aaggccattg tcctaaatag tgtctttgaa aatatcatcg agtcagagta + 3601 tccagactac gcatcgaaga taaaaaagat ttataccaag ggattcacta aaaaagtaga + 3661 agctcctaag acgtctaaga atcagtcttt caatatctat gttagtggaa ttgacaccta + 3721 tggccctatt agttcggtgt cgcgatcaga tgtcaatatc ctgatgactg tcaatcgaga + 3781 taccaagaaa atcctcttga ccacaacgcc acgtgatgcc tatgtaccaa tcgcagatgg + 3841 tggaaataat caaaaagata aattaaccca tgcgggcatt tatggagttg attcgtccat + 3901 tcacacctta gaaaatctct atggagtgga tatcaattac tatgtgcgat tgaacttcac + 3961 ttcgtttttg aaattgattg atttgttggg tggaattgat gtttataatg atcaagaatt + 4021 tactgcccat acgaatggaa agtattaccc tgcaggcaat gttcatcttg attcagaaca + 4081 ggctctcggt tttgttcgtg agcgctactc cctagcagat ggcgatcgtg accgcgggcg + 4141 caatcaacaa aaggtgattg tggctatcct tcaaaaatta acgtcaaccg aagcactgaa + 4201 aaattatagt acgatcattg atagcttgca agattctatc caaacaaata tgccacttga + 4261 gacaatgata aatttggtca atgctcagtt ggaaagtgga gggaattata aagtaaattc + 4321 tcaagattta aaagggacag gtcggatgga tcttccttct tatgcaatgc cagacagtaa + 4381 cctctatgtg atggaaatag atgatagtag tttagctgta gttaaagcag ctatacagga + 4441 tgtgatggag ggtagatgaa atgatagaca tccattcgca catcgtcttt gatgtagatg + 4501 atggtcccaa gtcaagggag gaaagcaaga ctctcttggc agaagcctat agacaggggg + 4561 tgcgaaccat tgtctctacc tctcaccgtc gcaagggcat gtttgaaact ccggaagaga + 4621 agatagcaga aaactttctt caggttcggg aaatagctaa ggaagtggcg agtgacttgg + 4681 tcattgctta cggggctgaa 
atttactaca caccagatat tctggataag ctggaaaaaa + 4741 agcggattcc gaccctcaat gatagtcgtt atgccttgat agagtttagt gtgaacactc + 4801 cttatcgcga tattcatagc gccttgagca agatcttgat gttgggaatt actccagtca + 4861 ttgcccacat tgagcgctat gatgctcttg aaaataatga aaaacgcgtt cgagaactga + 4921 tcgatatggg ctgttacacg caagtaaata gttcacatgt cctcaaaccc aaactttttg + 4981 gcgaacgtta taaattcatg aaaaaaagag ctcagtattt tttagagcag gatttggttc + 5041 atgtcattgc aagtgatatg cacaatctag acggtagacc tcctcatatg gcagaagcat + 5101 atgaccttgt tacccaaaaa tacggagaag cgaaggctca ggaacttttt atagacaatc + 5161 ctcgaaaaat tgtaatggat caactaattt aggagaaatg atgaaagaac aaaacacgat + 5221 agaaatcgat gtatttcaat tagttaaaac cttgtggaaa cgcaagctaa tgattttaat + 5281 agtggcactt gtgacaggtg cgggggcttt tgcatatagc acttttattg ttaagccaga + 5341 atatacgagt accacgcgaa tttacgtagt gaatcgcaat caaggagaca agccggggct + 5401 gacaaatcag gatttgcagg caggaactta tctggtaaaa gactaccgtg agattatcct + 5461 ttcgcaggat gcattggaaa aagtagcgac aaatttgaag ttggatatgt cagcaaaaac + 5521 gttagccagc aaagttcaag tggctgtacc agctgacact cgtatcgtct caatctctgt + 5581 caaggataaa cagccagagg aagccagtcg tatcgctaat tctctacgag aagttgctgc + 5641 agaaaagatc gtcgctgtaa cgcgagtatc tgatgtaacg acacttgaag aagcgcgacc + 5701 agctacgact ccctcttctc caaatgttcg acgcaattcc ttgtttggtt ttcttggagg + 5761 agcagtcgta acagtaattg ctgttctttt gattgagttg ctcgacaccc gtgtgaaacg + 5821 tcctgaagat gttgaagatg tactgcaaat tccactttta gggctcgttc cagatttgga + 5881 caaaatgaaa taggaggaag ttatgccaac gttagaaatc tcacaggcaa aattggattt + 5941 tgtaaaaaag gcagaggaat attataacgc tttgtgcacg aacctacagt taagtggaga + 6001 tggtttgaaa gtattttcta tcacttctgt gaaaatagga gaaggaaaat caacgacttc + 6061 taccaatatc gcttgggctt ttgcgcgtgc aggttacaaa acgctgctga ttgatggaga + 6121 tattcgcaat tctgttatgt taggtgtctt taaagcaagg gataagatta cgggcctgac + 6181 agaattttta tcaggaacta cagacctatc acaagggctt tgtgatacca atatcgaaaa + 6241 tctctttgta attcaggctg gctctgtgtc accgaatccg acagctcttc ttcaaagtaa + 6301 gaatttcagt acaatgcttg aaaccttgcg taaatatttt 
gactacatca ttgtagatac + 6361 tgctcctgtc ggtgtcgtga ttgatgctgc tattattacg cgaaaatgcg atgcttctat + 6421 tttagtgacg gaggcaggtg aaataaatcg acgggatatt caaaaagcaa aagaacagtt + 6481 agaacacaca gggaagccgt ttttgggagt tgtgttgaat aaattcgata cttcagtaga + 6541 caaatacggt tcttatggaa attatggaga ttacgggaaa aataaaaaat aggtcggggg + 6601 atagagatga atggaaaaat agtaaagtct tcattggcta taatccagag ttttcttgtt + 6661 attttattga cttatctact tagtgctgtg agagaagtgg agattgtttc aacaacagct + 6721 attgcacttt atatcctcca ttattttgtc ttttatatca gtgattatgg acaggatttc + 6781 tttaaaaggg gatatttgat tgaacttgtc cagacattga aatatatcct attctttgca + 6841 ctagcgatta atatttctaa ttttttctta gaggatcgat ttagtatttc cagacgaggc + 6901 atgatttact tcctcacatt acatgctctc ttagtctatg tgctaaacct atttatcaag + 6961 tggtattgga agcgggctta tcccaacttt aaaggaagta agaagattct cctacttaca + 7021 gcaacttctc gtgtcgaaaa ggtactggat agattaatag aatcaaatga ggttgttggg + 7081 gagttggtag ccgtcagtgt cttagataaa ccagattttc agcatgatta tttaaaggta + 7141 gtagcagaga gggagatagt aaactttgcg acttatgagg tggtcgatga agtctttatc + 7201 aatcttccaa gtgaaaaata caatattgga gagcttgttt ctcagtttga aacgatggga + 7261 attgatgtaa cagttaatct aaatgctttt gatcgtagtt tggcacgtaa caagcaaatt + 7321 cgtaagatgg caggattaaa cgttgtgact ttttctacaa cattttataa gactagtcat + 7381 gtaattgcta agcggattat tgatatcatg ggtgcattgg tagggctgat actatgtggt + 7441 ttagtcagta ttgtactggt tcctttgatt cgaaaggatg ggggctctgc tatttttgct + 7501 cagatgcgta taggaaaaaa tggtcgtcag ttcacttttt ataagtttcg ctctatgtgt + 7561 gtagatgccg aggcgaaaaa aagagaactc atggaacaaa atactatgca gggtggaatg + 7621 tttaaggtgg acgatgatcc tcgtatcacg aaaattggtc gttttatacg gaagactagc + 7681 ttggacgagc taccacagtt ttataatgtt ctaaagggag atatgagttt ggttggcaca + 7741 cggccaccaa cagtggacga gtatgaacac tataccccag aacaaaaacg tcggctaagt + 7801 tttaaacctg gtataacagg cttatggcag atcagtggac gaagtgagat taagaatttt + 7861 gatgaagttg tcaaattaga tgtagcctat atagacgatt ggacaatttg gaaagatatt + 7921 gagattttat tgaagacagt taaagttgta ttgatgaagg atggagcgaa gtagattgat + 7981 
agatgtaaaa atcattgtgg caacgcataa agaggttaaa atgcctcaag acaatagtct + 8041 ttaccttcca atacatgttg ggagagacgg taaatcagat attggtttta tcggtgataa + 8101 tactggcgat aatatatcct ctctaaatcc atattattgt gagttgacgg gactttattg + 8161 ggcatggaag aatcttgatt ataattactt aggtttagtt cattaccgtc gttattttac + 8221 aaataaatct caagggtata atgaaaatgt caatatggat gacgtcattt tgtctcgatc + 8281 taatgttgaa atattattag agaaatctga cataatagtt ccaaagaagc gaaagtatta + 8341 tattgaaact ctttattcac attatgccca tacccttaac ggagaacatc tggatcttgc + 8401 taggaaaatt attgagcaaa atagttcaga gtatctttca tcctttgata aagtgatgaa + 8461 acaaagaagc ggttatatgt tcaatatgtt tatcatgaaa aaagaactat tagatgatta + 8521 tttaccgtgg cttttttcta ttctggatac tatgtacgaa cagatggact tgaccgacta + 8581 tactccattt gagtcacgtt tattcgggcg agttagtgag ttgttgttta atgtttggtt + 8641 atgtaaacaa ggaataacgc ctaaagaggt accatttatg tacatggaga gagtggattt + 8701 gtttgaaaaa ggaaaatctt ttttaatggc taaatttttt ggaaagaagt atggacagag + 8761 tttttaaatt atggttttgt tattacttac ttttgcattc tttttagttt tctctgtgct + 8821 gtcaataagt ttaagtgtta tagggctagt aaatgacaaa aagcgttcaa aaatctattt + 8881 actactaatt agttttgcag tatcaattgt tgcgctgcgt tatattcctc atcatatggc + 8941 tgatggcgct tttcattttc gtgcgactac ggcccttatt cgctatgata gtattttcga + 9001 aatgttttaa gaattttcta gtggatggaa tgtgggaaga tatgattatg gttctatgcc + 9061 agtttttact tcattaatgt atcttattcg aaacactcat cactatagtt tactgagttt + 9121 tatttcagct tttataactt actttagttt tggttacgta gtcgttgatc tatttaaaga + 9181 cttggacaag gtttctaaac tatcgtatgc tacagtatta attgctgtac tatgtttaaa + 9241 taattataga tatacaactg gtggaatgag attttgtatt gtagttgcct tgatgatgct + 9301 tttattgatt ttagtaagac ggacttactc ataaaaaata tttttcaatt cttttcaagt + 9361 ttgccattta cataataaga ctatgtgctt ttattttatt ttttggagga ttatatggga + 9421 ctatctaccg tgacattgtt taaaaattta aagttctcag atagtaaatt tattaaattg + 9481 gaaggagagc tccttcttaa atatcaagag tatttattaa aaatcatgga agatattgta + 9541 acagtgtgtg aggaagaagg gttatattat tcactttctg gtgggagtgc attaggggct + 9601 taccgacaca aagggtttat 
tccatgggat gatgatatgg acatatttat gctaggaagt + 9661 gagcgggaga ttttctttca aaaattttct cagaaatttt ctgataaata ttggatacat + 9721 aattcacaaa caccaaacta tggcatgccc attggtcgta tcagacaaaa aggaacagtt + 9781 ttacgtggtc gagaggatgt tggagttgaa gaatgtggat tttttattga tattttttgg + 9841 cttgaaaatg ttcctaattc aaaaatattg agacaactcc acggttttct ctgcatggcg + 9901 attggattgc tactatcatg tagaaatttt tataaaaatc gtcagctgat gctggagatt + 9961 atgaaggaac ataaagaagt aaggcttgtt tttcgaataa aactagtttt agggtttcta + 10021 attagtttta tatctttgag acaatttaca agacttacgg aaaggatcta ctcattgtgc + 10081 aagaataatg aatcaagata ccttagtgtt ccttcaggaa gaaaacatta ttttggcgag + 10141 atgtttataa gagaagatat gcagttaact aggaaactca attttgaagg acataagtgg + 10201 aatgttccaa ataatattga gcattattta actgtaatgt acggtgatta tatgaaaata + 10261 cctgcagttg aagataggga atcacatatc attttagaaa tctccttccc taacgagtaa + 10321 acagtacttt cattttttat atgtaaggaa ttaatttaat gaaaaaaata gcaattgtta + 10381 gatataatct aagtaaaatt ggtggagcag aaaaagtagc tattaatatg gctaatgaat + 10441 tgtcacaata ctatgatgta aaactgttat ctattctatt ggatgaggat ggctttataa + 10501 attatgatat taaccctaat gtgacattaa taaattttca caagggtgat cttagaatta + 10561 gaactgctac attaaaatta acaggtaaat taaggaacta tattaaaaga gaaaaaattg + 10621 aagtgatttt ttctataacc ccattaacaa atactatggt tagattagct actctaggat + 10681 taaatgtgaa aatagttttc tgtgatcatc atagcttaga atttcgtgat tttagaggta + 10741 gggaagtgca gagatttgta ggagctaaat tttttgacaa gattgtcact ttaacagaag + 10801 aagatagaat aaaatactcc gataaatata atatacctat aaataaagta aatgctattt + 10861 ataattggat tgatgaagaa gattctgaaa ataccccatt tgataatgag acaaataaaa + 10921 taataacggt aggtcgattt cacagtcaaa agggatatga ttatcttgcc gaagtagcta + 10981 taaaagtatt atcacaacat ccagactggc agtgggatat atatggttca ggggataaac + 11041 ttattgaaca ggatctaaaa agaaaactag aagaaggttg tgtttcttca caagttaatt + 11101 ttaaagggaa tgtaaaggga actgaaaata tttatcccaa tcatagtatc tatgtcatga + 11161 cttctcgcca tgagggctta cctttagtcc tattagaagc acaacaatac aatcttccta + 11221 ttgttagctt cagatgtcca 
acgggaccta gtgagattgt tgaagatgga gtcaatggat + 11281 ttttgattga ttgctatgac gtgtatcaga tgagtgagaa attgcttgaa ttgatgaaaa + 11341 atgatgattt gcgacaatct ttctcagaac atgccaaaga caatatagat aaatttgata + 11401 aaaatgaaat tcttaatcag tggatagaat tgattgatac aatttaggag gtaagatgca + 11461 agagtgttta ttgacaatta taatgcctag ttataatatt caggactata tttccaaagg + 11521 aatcgagtca ttccagcaag tacacctaga ttacaaacaa aaatttgaga tcttaattgt + 11581 gaatgatgga agtacggacg acacagccaa agtagcagaa gagaccctaa gaaaagattt + 11641 attgctgaat ggtcgtatta tcacaaagga aaatggaggc catggctcaa caatcaatcg + 11701 tggtatccag gaagcaaagg gaaaattctt taaagttatt gatggggatg actgggttat + 11761 tccatcagaa tttgaaaagt ttttagatga ccttacagtt actgaagtgg atatgatctt + 11821 gacagatttt acagaacaac atgtttacaa caatactact gttcgaaatg attttgttga + 11881 aaagtatgag gttggtaagg aatattctgg aattccagag aaacggattc caatgcactc + 11941 ggtaacttat agaacatcta tcctagttga gaatgaaatt cgtttaagtg aaaagacatt + 12001 ttatgttgat attcagtaca ctctttttcc tttagagtat gttcatagtt tctgttattg + 12061 gaattatgat gtataccaat actatatcgg acgacccgag cagagtatga atattgagag + 12121 tatgaaacga aatgttcgtc accatttgac tgtaacaaat tctgtgctga cttatttctc + 12181 aaaaattgcg gatgatcctg tcttaaagaa agtggttgca gatactttag tttatcttat + 12241 cagtttgcag atagatttgt catggatggt tgaggactca aagacactat cagaagagtt + 12301 atacagacaa attgagcaga gttcttatga gtatatccct acgaaaaaat ttgatagatt + 12361 gtcttatttg aactataagt ttcactattt tctagacttt gttttcaatc cagtattgaa + 12421 aaaatattct aaaaagaaag aaaaagagag aggaatttag aatgttcatt agtgttgttg + 12481 ttccggttta taatgttttt gactatttac actttgccat ggatagtctg ataaagcaaa + 12541 cgtatcaaaa ttttgaagta atccttgtaa atgatggttc aacagataac tctcctcagt + 12601 tatgtgaaga gtatgctaag caatatgaaa acgtctctgt ttttcataaa gaaaatggag + 12661 ggttgtctga tgctcgtaat tttggagttt caaaagcatc atcagattgg attttctttc + 12721 tagatccaga cgattatttg gaagattata ctctagaatt gatagtgaaa attcaacagg + 12781 aatatcaagc aaacttgatt tcaaccaaag taaaggcaac ttctaaatat aatgattata + 12841 gtctttatca acttgaggag 
tcagattata aagatttgtt tgtcgttaca aaagagaagg + 12901 ctcttgagct aatgctagac gacaaaattg cgacagtttc tgcttgtgct aagctttatc + 12961 acaagaatat cttggaaaaa gttccatttt cagttggaaa aatctatgaa gatttttatg + 13021 tggtcgcgga tcatcttgcc ttagcagata aaattgtaat tagtccactt gaaacgtata + 13081 actattaccg cagagaaggt agtattgttc gttcgacttt tactgagaaa agatatgatt + 13141 tttttgatgc tgtttcgaaa aacgaagaag ttataaataa agaatacaca caaagtttag + 13201 aattacaaca atctctgcaa gcgaaaaaat tacgaggagg ttttgttgta attggtgcga + 13261 aagctgactc tggtttaaca gatttttcga aagatagaga cctattaaaa gttgatttta + 13321 aaaacatgtt attaaataaa aaaatatcat ggaaactaaa attaaaatat acaatattta + 13381 tgctatcatc taaaatgtat ttaagattaa ggtgactgtt tcaagaatca agcatctcta + 13441 ttagttttta aaattataaa tagctgttcg gatgtaagtg ttgtaatagt gtttagtatt + 13501 tctagttcat tattataatc gggaaagaat ttaatacagc tacttatttg aaagggaaat + 13561 tcatgagaca agcatatcta ataatagcac ataataagtt tgaatagttg aaatttttaa + 13621 tttctctgtt ggattataag gaacataata tttttattat tgtggacagc aaagttaatg + 13681 ctgaggagtc tacgattaat cactatactt cccatcatta taacttccta tgtgacatgg + 13741 atattttaac tctattgtta cctattttgt tagtcacttt aggagttgct agttatggca + 13801 ttaaggaaat ttaagctaat cgaaaaaaga gccacagaat ttttggggta tctgtaaaac + 13861 ttaaaatgaa gtatagttta ttttgagttt aataagcgat taaaaggtag ggggaatatt + 13921 attgaagatt aacttaatga atattgttga tacgttactg cttttgctaa taattataaa + 13981 aacaaactct atttatttgt atataggtgt agagaacaaa ttaaattttt atctgattgt + 14041 tgtgattaca attgcagttt tattggaagt aattagcggt agattatctc tccaatattt + 14101 aaaaaaaatg ctattagtta ttgttcttta tttttttgca attattatta atattttagt + 14161 ttcggcttct gtcatatcgt caaatatact aacatactat tttattgttg tgccattaat + 14221 gctaatacta gtaatgtata aatattataa aaatacatta acaaattttt tagttatctt + 14281 tgtgaggatt gttttaattt tagctgttat ttctctgctc ttttggtgtt ttggtagtgt + 14341 tttaaatata ataaaaccga caaactatgt ggtgagtagc tggagtggtg gtcaggtaac + 14401 tactagttat tataatctgt attttgaaac gcaaaacgct ttatttttgg gttataaaat + 14461 gattaggaat agcggtattt 
ttgcagaagc gccaatgtgg agtttattgc taagtgttgc + 14521 tttaatattt caagagttat tgcttaaaca tagcactaga atatttgttt tattaatgtt + 14581 gacaattttt acaacagcat caacaacagg tttttttata gttggttcat tacttattta + 14641 taaagtgata aatcaaaaaa gaagttggtt taaatatatc aacttgacat ctatccctgt + 14701 attaatcttt actttggtta aagtgtgggg ggaaaaatcc gattccgctt cagcaagtat + 14761 tcgatatgat gattatgtag caggtttttt ggcatggaaa aatcacttta tttttggttc + 14821 aggtttatca tctgggatta gagcgattga gtcctatatg gataccacta tacgaagtaa + 14881 tttaggatac agtaatagtt tttttgtcat cttagctcaa gggggaataa ttttgggcgt + 14941 gctacacttt tatcctgttg ttagtgtact attgaagaga ttttcatcaa actctaagat + 15001 gttagcttta ttgtttataa ttctaatatt tacagcaata tttacagata caccgttatt + 15061 tatcctgttt gttgggatat tttatgcctt gattctgaat agagagaata catgaagaag + 15121 gaatatgata ttttaaaagt aattgccatt ttaatggttg tattaagcca cagtacatac + 15181 tatgtgattt cgactaagta cggggggatt atcaacaata tataaatcaa aatttatcgt + 15241 tggtattgta taaagttttt gataaagtaa gagaagtatt atattacttc catatgccac + 15301 tttttatggc attatcagga gctttctact atcttcaggt tcaaagagat aaatggttta + 15361 ctttaaaatt aattgtgcaa aataaaataa ggtaaagaga ttgctttttc ctttcattat + 15421 atttactgtc ctttattcaa taccaataaa atatatttca aattattttg attttacagc + 15481 tccttttaaa gcatttgtag gagaattttt cttaattgga aatagtcatt tatggtattt + 15541 atatgcttta tttattattt ttatatttgc attctatacg ctaaaaaaga aacaaatctt + 15601 gctacttatg ttgtttttta tgttctgtat attttgagtt acaaaataga actcacacta + 15661 tttaaagtac ctcttcaatt tttattttac tttagtttag gcttcttgtt tgaatcaaat + 15721 agagaaaaat ataatcaatt tattaatagg aaaaaaatta tattttgtta ttatctacgg + 15781 tatttgtctt aatggttttg ttaaatttac tcaggtattt tttagtaaag tattagttga + 15841 gctattggct gtcttgggtt cattattaac gtatagcatc gcatatcaat tatctcaaaa + 15901 gaaaagtgtt ggtgatgcta gtatttttaa gatgattcta attaatggat taggtatata + 15961 tattttttct gatccattaa attatttaat cttgaagtta agttattccc taaattcgta + 16021 ttttatgttt acaccagtag gaataattgt tttagtagta ttacgatttt ttctcacgtt + 16081 attcatatca ttgataggaa 
caatcatatt taaaaaaata caaatggcta gtcaactagg + 16141 tagagacaat agctatttaa aaagttaaat ctatatataa tggagaaaaa gtaatgaaag + 16201 tacttaaaaa ctacgcctac aatctttctt atcaattgtt ggtgatttta ctcccgatta + 16261 ttacgactcc ctatgtaaca cgggtctttt cttcggatga tttagggacg tatggttatt + 16321 ttaattccat cgttacttat tttatcctct tagcgacgct aggagttgct aactatggga + 16381 ccaaggtcat ttcagggcat cgaaagcaaa ttcaaaaaaa ctttttggga atctattctc + 16441 tgcaattagg tgcaacagtt ctttctctgt ccttgtatgc tcttctttgt ctaactcttc + 16501 cctttatgca aaatccggta gtctatattc taggcttgag tttagtttct aaaggtttag + 16561 acatctcctg gctctttcaa gggttggagg attttcgaaa gattactgtc cgaaatataa + 16621 cagttaaact agttggggtc atttccatct tcctctttgt taaatcatca aatgaccttt + 16681 acctctatgt ctttttgcta accatttttg aactcttggg tcaattcagt atgtggatac + 16741 cagctcgaga gtttattggt agacctcatt ttgacataga atatgctaga catcatttga + 16801 aaccagtcat attattgttc cttccgcaag tggcgatttc cttgtatgtt acgctaaatc + 16861 gtactatgct tggagcgtta gcttctacaa aagatgtagg gatttatgac caggctttaa + 16921 agttggtaac tatccttctg accttggtaa cttccttggg aagcgttatg ttacctcgag + 16981 tcgctcattt gttagcgaca gatgatcata aggcagtcaa taggatgcat gaaatgtctt + 17041 tcttaattta taatttagta atttttccaa tgatggcagg aatcttgatt gtcaatgatg + 17101 attttgttca gtttttcctt ggtcaagatt ttcaggatgc gcgttatgca atcgccatta + 17161 tgatcttccg tatgttcttt atcggttgga ccaatatcat gggaattcag atgctgatac + 17221 ctcataatca aaataaagaa ttcatgattt caacaacagc tcccgcaatt atcagtgtag + 17281 gtttgaactt actattcctt cctaaactgg gatatatcgg agcagccatt gtctctgttt + 17341 taacagaggc acttgtatgg gcaatccaat tattctatac tcgcagatat ttaaaagaag + 17401 ttcctataat cggatcaatg tcaaaaatta tactagcatc tgccattatg tatggccttt + 17461 tactaagttc aaaaacagtt atacattttt caccgacctt aaatgttcta gcatttgcag + 17521 cgcttggtgg aatcatttat ctttttgcaa ttctatctct gaaagtggta gatgtgaaag + 17581 aattaaaaca aattattagg aaaaactaaa atgagaaaaa ttcgaaatat caacctagat + 17641 ttactaaaag tgcttgcatg tgttggagtt gttttacttc atacaacaat gggcggattt + 17701 aaagagacag gctcatataa 
tcttttggca tatttatatt atttaggtac ttactctatt + 17761 cccctgtttt ttatgatcaa tggttattta ttgttaggca agagggaaat aacttatctt + 17821 tacatactcc agaaagtaaa atggatttta ataacagtgt catcatggac atttatcgta + 17881 tggctttttt atcgtgattt tacaactaat cctattaaaa aaattgtagg ttctttgata + 17941 caaagaggtt atttctctca gttttggttt ttcggtgcac taatacttat ctatttatgt + 18001 ttgccaattg tgagacaatt tctaaattca aaaagaagct atttatacag tttatcttta + 18061 ttgatgacta ttggtttgat ttttgagtta ttaaatatcc tacttcagat gccaatacaa + 18121 acatatgtaa tacagacttt tagattatgg acgtggtttt tttactatct tttaggtggt + 18181 tatatagcgc aattcactaa agaagaaatc gaatcaagat ttaagaattg gatgaaaata + 18241 gctagcatac ttttgttatt gatttcacca ataatattat ttttcatagc aaagaccact + 18301 taccataatt tttttgctga atatttttat gatattttat tagtaaaagt ggtaagcgta + 18361 gggatttttc taactatttt ctcacttgta ttgaatgaaa atagcaacaa atggattatt + 18421 tttctttcta atcaaactat gggtatcttt ataatacaca cttatattat gaaggtatgg + 18481 gaaaaactat ttggttttag ttttataggt tcatatttac tttttgctat atttacttta + 18541 agtgttagtt ttatcattgt tggaatgtta atgaaaattc cgtattttaa tcgaatcgtc + 18601 aaattataaa aaggagaaaa aatgtacgat tatcttgttg ttggtgctgg tctctttggt + 18661 gcagtctttg cccatgaagc agccttaaaa ggaaaaaaag taaaagttat tgaaaaacga + 18721 aatcatatcg cgggtaatat ctatactcgt gaagaggaag gaattcaagt tcatcaatat + 18781 ggtgctcata tcttccatac ttctgataag gagatctggg attatgtaaa tcagtttgca + 18841 gagtttaacc gttataccaa ttctcctgtt gcaaactata agggtgagat ttataacctt + 18901 ccttttaata tgaatacttt caataaactc tggggagttg taacgccagc agaagcacaa + 18961 gctaagattg aggaacaacg tgctatttta aatggtaaaa ctcctgaaaa tttggaagaa + 19021 caggcgattt ctcttgtagg tacagacatc tacgaaaaat taatcaaaga ctatacagag + 19081 aaacagtggg gcaaaccaac tactgaactt ccatccttta ttattcgccg tttgccagta + 19141 cgcctgacct atgataacaa ctattttaac gatacctatc aagggattcc aattggtgga + 19201 tacactcaaa tagttgaaaa aatgttggat catgaaaata ttgatgtaga aacaaatgtt + 19261 gatttctttg tgaataaaga gcaatatctg aaagattttc ctaagattgt ctttactggt + 19321 atgattgatg aattctttga 
ctataagttg ggtgaactag agtaccgtag tcttcgtttt + 19381 gaaaatgaga ccttggatat ggaaaattac caaggaaatg cagttgtgaa ctatacggat + 19441 gcagaaactc catatactcg cattattgaa cacaaacatt ttgagtttgg gagtcaagca + 19501 aagactatca ttactaaaga acattctaaa acatgggaaa aaggtgatga gccttattat + 19561 ccagttaata atgatcgtaa taatcatttg tataaatcat ataaaaaact tgctgatgag + 19621 caagggaatg ttatctttgg tggccgctta ggacactatc gttattacga tatgcaccaa + 19681 gtaattggag tagctttgca gtgcgtgaga aatgagttaa attaatactc aatgaaaatt + 19741 aaagagcaaa ctaggaagct agccacaggt tgctcaaaac actgttttga ggttgcagat + 19801 ggacgctgac gcggtttgaa gagattttcg aagagtataa acaagtaaaa ctgactacca + 19861 gttattattt agaaatagta ttaaaaattc cttgactatg tgatatagtt gagggatttt + 19921 taaatgatat tcatattttt tgcaaagatg ttgtttgaaa aataattttc aaaaattctg + 19981 aaaattctgt tgacaacttt ctgaaaagag tctataatgg agagaaagtt ttaaaggaga + 20041 aaatgatgaa aagttcaaaa ctatttgccc ttgcgggcgt gacattattg gcggcgacta + 20101 ctttagctgc atgctctgga tcaggttcaa gcactaaagg tgagaagaca ttctcataca + 20161 tttatgagac agaccctgat aacctcaact atttgacaac tgctaaggct gcgacagcaa + 20221 atattaccag taacgtggtt gatggtttgc tagaaaatga tcgctacggg aactttgtgc + 20281 cgtctatggc tgaggattgg tctgtatcca aggatggatt gacttacact tatactatcc + 20341 gtaaggatgc aaaatggtat acttctgaag gtgaagaata cgcagcagtc aaagctcaag + 20401 actttgtaac aggactaaaa tatgctgctg ataaaaaatc agatgctctt taccttgttc + 20461 aagaatcaat caaagggttg gatgcctatg taaaagggga aatcaacgat ttctcacaag + 20521 taggaattaa ggctctggat gaacagacag ttcagtacac tttgaacaaa ccagaaagct + 20581 tctggaattc taagacaacc atgggtgtgc ttgcgccagt taatgaagag tttttgaatt + 20641 caaaagggga tgattttgcc aaagctacgg atccaagtag tctcttgtat aacggtcctt + 20701 atttgttgaa atccattgtg accaaatctt ctgttgaatt tgcgaaaaat ccgaactact + 20761 gggataagga caatgtgcat attgacaaag ttaaattgtc attctgggat ggtcaagata + 20821 ccagcaaacc tgcagaaaac tttaaagatg gtagccttac agcagctcgt ctctatccaa + 20881 caagtgcaag tttcgcagag cttgagaaga gtatgaagga caatattgtc tatactcaac + 20941 aagactctat tacgtatcta 
gttggtacaa atattgaccg tcagtcctat aaatacacat + 21001 ctaagaccag cgacgaacaa aaggcatcga ctaaaaaggc tctcttaaac aaggatttcc + 21061 gtcaggctat tgcctttggt tttgatcgta cagcctatgc ctctcagttg aatggacaaa + 21121 ctggagcaag caaaatctta cgtaatatct ttgttccacc aacatttgtt caagcagatg + 21181 gtaaaaactt tggcgatatg gtcaaagaga aattggttac ttatggggat gaatggaagg + 21241 atgttaatct tgcagattct caggatggtc tttacaatcc agaaaaagcc aaggctgaat + 21301 ttgctaaagc taaatcagcc ttacaagcag aaggtgtgac attcccaatt catttggata + 21361 tgccagttga ccaaacagca actacaaaag ttcagcgcgt ccaatctatg aaacaatcct + 21421 tggaagcaac tttaggagcg gataatgtag tcattgatat tcaacaacta caaaaagacg + 21481 aagtaaacaa tattacatat tttgctgaaa atgctgctgg cgaagactgg gatttatcag + 21541 ataatgtcgg ttggggtcca gactttgccg atccatcaac ctaccttgat atcatcaaac + 21601 catctgtagg agaaagtact aaaacatatt tagggtttga ctcaggggaa gataatgtag + 21661 ctgctaaaaa agtaggtcta tatgactacg aaaaattggt tactgaggct ggtgatgagg + 21721 ctacagatgt tgctaaacgc tatgataaat acgctgcagc ccaagcttgg ttgacagata + 21781 gtgctttgat tattccaact acatctcgta cagggcgtcc aattttgtct aagatggtac + 21841 catttacaat accatttgca ttgtcaggaa ataaaggtac aagtgaacca gtcttgtata + 21901 aatacttgga acttcaagac aaggcagtca ctgtagatga ataccaaaaa gctcaggaaa + 21961 aatggatgaa agaaaaagaa gagtctaata aaaaggctca agaagatctc gcaaaacatg + 22021 tgaaataa +// + diff --git a/public/res/serotype_genbank/serotype_34.gb b/public/res/serotype_genbank/serotype_34.gb new file mode 100644 index 0000000..afd9483 --- /dev/null +++ b/public/res/serotype_genbank/serotype_34.gb @@ -0,0 +1,718 @@ +LOCUS CR931703 15938 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 676/74 (serotype 34). +ACCESSION CR931703 +VERSION CR931703.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. 
+REFERENCE 1 (bases 1 to 15938) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 15938) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..15938 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="676/74" + /db_xref="taxon:1313" + gene <1..33 + /gene="dexB" + /locus_tag="SPC34_0001" + CDS <1..33 + /gene="dexB" + /locus_tag="SPC34_0001" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34260.1" + /db_xref="UniProtKB/TrEMBL:Q4JZU9" + /translation="PWDAFCVELL" + gene 192..360 + /gene="aliB" + /locus_tag="SPC34_0002" + /pseudo + CDS 192..360 + /gene="aliB" + /locus_tag="SPC34_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(order(361..891,893..1222)) + /gene="tnp" + /locus_tag="SPC34_0003" + /pseudo + CDS complement(join(361..891,893..1222)) + /gene="tnp" + /locus_tag="SPC34_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(join(832..891,893..1204)) + /gene="tnp" + 
/locus_tag="SPC34_0003" + /note="HMMPfam hit to PF01710, Transposase, score 2e-23" + /pseudo + gene 1455..2900 + /gene="wzg" + /locus_tag="SPC34_0004" + CDS 1455..2900 + /gene="wzg" + /locus_tag="SPC34_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI34263.1" + /db_xref="GOA:Q4JZH0" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4JZH0" + /translation="MSRRFKKSGSQKVKRSVSIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILASSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGIDVYNDQ + EFTAHTNGKYYPAGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1455..1571 + /gene="wzg" + /locus_tag="SPC34_0004" + /note="Signal peptide predicted for SPC1626 by SignalP 2.0 + HMM (Signal peptide probability 0.995) with cleavage site + probability 0.529 between residues 39 and 40" + misc_feature 1659..2006 + /gene="wzg" + /locus_tag="SPC34_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 1.5e-63" + misc_feature 2184..2627 + /gene="wzg" + /locus_tag="SPC34_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 2.5e-69" + gene 2902..3633 + /gene="wzh" + /locus_tag="SPC34_0005" + CDS 2902..3633 + /gene="wzh" + /locus_tag="SPC34_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34264.1" + /db_xref="GOA:Q4JZG9" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4JZG9" + 
/translation="MIDIHSHIVFDVDDGPKSREESKTLLAEAYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMHTSYREIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRVQYFLEQDLVHVIASDMHNLDSRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRRIVMDQLI" + misc_feature 2905..3513 + /gene="wzh" + /locus_tag="SPC34_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 1.4e-38" + gene 3639..4334 + /gene="wzd" + /locus_tag="SPC34_0006" + CDS 3639..4334 + /gene="wzd" + /locus_tag="SPC34_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34265.1" + /db_xref="GOA:Q4JZG8" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4JZG8" + /translation="MMKEQNTTEIDVFQLVKTLWKRKLMILLVALVTGAGAFAYSTFI + VKPEYTSTTRIYVVNRNQGDKPGLTNQDLQAGSYLVKDYREIVLSQDVLEKVVTNLKL + DMPAKTLASKVQVTVPADTRIVSISVKDKQPEEASRIANFLREVAAEKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIELLDTRVKRPEDVEDVLKI + PLLGLVPDFNKIK" + misc_feature 3639..3755 + /gene="wzd" + /locus_tag="SPC34_0006" + /note="Signal peptide predicted for SPC1628 by SignalP 2.0 + HMM (Signal peptide probability 0.614) with cleavage site + probability 0.407 between residues 39 and 40" + misc_feature 3660..4076 + /gene="wzd" + /locus_tag="SPC34_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 5.5e-54" + misc_feature 4182..4259 + /gene="wzd" + /locus_tag="SPC34_0006" + /note="PS00217 Sugar transport proteins signature 2." 
+ gene 4344..5033 + /gene="wze" + /locus_tag="SPC34_0007" + CDS 4344..5033 + /gene="wze" + /locus_tag="SPC34_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34266.1" + /db_xref="GOA:Q4JZG7" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4JZG7" + /translation="MPTLEISQAKLDSVKKAEEYYNALCTNLQLSGDGLKVFSITSVK + IGEGKSTTSANIAWAFARAGYKTLLIDGDIRNSVMLGVFKARNKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFTTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRNCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGIVLNKFDTSVDKYGSY + GDYGDYGKNKK" + gene 5048..6415 + /gene="wchA" + /locus_tag="SPC34_0008" + CDS 5048..6415 + /gene="wchA" + /locus_tag="SPC34_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI34267.1" + /db_xref="GOA:Q4JZG6" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4JZG6" + /translation="MNGKIVKPSLAIIQSFLVILLTYLLSAVRETEIVSTTAIALYIL + HYFVFYISDYGQDFFKRRYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYF + LTLHALLVYVLNLFIKWYWKRAYPNFKGSKKILLLTATSRVEKVLDRLIESNEVVGKL + VAVSVLDKPDFQHDCLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + IDVIVNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHVIAKRIIDIVGALVGLIL + CGLVSIVLVPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKIGCFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVLM + KDGAK" + misc_feature 5048..5134 + /gene="wchA" + /locus_tag="SPC34_0008" + /note="Signal peptide predicted for SPC1630 by SignalP 2.0 + HMM (Signal peptide probability 0.660) with cleavage site + probability 0.345 between residues 29 and 30" + misc_feature 5831..6412 + /gene="wchA" + /locus_tag="SPC34_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 2.8e-160" + gene 6402..7208 
+ /gene="wciB" + /locus_tag="SPC34_0009" + CDS 6402..7208 + /gene="wciB" + /locus_tag="SPC34_0009" + /note="member of homology group 16" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34268.1" + /db_xref="GOA:Q4JZG5" + /db_xref="UniProtKB/TrEMBL:Q4JZG5" + /translation="MERSRLIDVKIIVATHKEVKMPQDSSLYLPIHVGRDGKSDIGFI + GDNTGDNISSLNPYYCELTGLYWAWKNLDYNYLGLVHYRRYFTNKSQGYNENVNMDDV + ILSRSNVEILLEKSDIIVPKKRKYYIETLYSHYAHTLNGEHLDLARKIIEQNSSEYLS + SFDKVMKQRRGYMFNMFIMKKELLDDYLPWLFSILDTMYEQMDLTDYTPFESRLFGRV + SELLFNVWLCKKGITPKEVPFMYMERVHLFEKGKSFLMAKFFGKKYGQSF" + gene 7299..8669 + /gene="wzy" + /locus_tag="SPC34_0010" + CDS 7299..8669 + /gene="wzy" + /locus_tag="SPC34_0010" + /note="member of homology group 252" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI34269.1" + /db_xref="UniProtKB/TrEMBL:Q4JZG4" + /translation="MLYILFYLLLLFFIINYAFVRGDYFHPTIIFNFTFLIATLFCIL + NAQEYAIEFNGGTVFIVTISMLVFTIITVLSKKIFKTNTFTFKNKLKYLYVSKSLIFT + IIIIQILNLIFFYRYEQALFSAYVGGRGSFSQIINNYDQLVKFFTEDLVGLGVRSPFF + YRVFNSFISPISYVIIYIICHNYVATRRIDKFQLLVPCLFAIQIFMTGSRGSLFKILT + FILVVFYILLLRNKGLSKLSSRFAFKVLIVVVAVAPLFVLYLNATGRSGGVGQDGIIE + ALNRELFKYIGAPLLNFNNFIAGYDPYRSDSVYWGEQTFYGFYKFLYSKLHLIDFNIK + SIIGSDSFVKSTNGLPTGNVFTTFYTFFYDFTYFGIIPLVSVIALYFVPTYSRILGTE + YCAKKYLFDYKLFIYAYLFNDVIMLIFSNRFFESILTVGFLRFLITSAILVWIIKQNI + VFKYKK" + gene 8721..9530 + /gene="wcrO" + /locus_tag="SPC34_0011" + CDS 8721..9530 + /gene="wcrO" + /locus_tag="SPC34_0011" + /note="member of homology group 46" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="CAI34270.1" + /db_xref="GOA:Q4JZG3" + /db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4JZG3" + /translation="MEEDTKLYKIQSKELELLKVLTNICEENNLTYYALGGTLLGAVR + HKGFIPWDDDIDIGMPREDYEKFKILAPNLLPSNLKIVNNPLNLDITQLVDKNVIVKI + ANSESNVFIDIFPLDGYTEKGFFAAKLHSFRLLFQRMLCKISVLDQLEDKDRGTVENL + 
IVKISKMLRIQKVLPKDTLVENLHKVIQKYDFKTSRYVGNVLGRYREREIVPREYFKE + PVSLIFEDTMINCPTKYKEYLNEIYGDYMKLPSVEDRVAHNIELISVGDAE" + misc_feature 8793..9452 + /gene="wcrO" + /locus_tag="SPC34_0011" + /note="HMMPfam hit to PF04991, LICD Protein Family, score + 6.8e-49" + gene 9527..10651 + /gene="wcrC" + /locus_tag="SPC34_0012" + CDS 9527..10651 + /gene="wcrC" + /locus_tag="SPC34_0012" + /note="member of homology group 24" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34271.1" + /db_xref="GOA:Q4JZG2" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4JZG2" + /translation="MKGRIEIGKKICIVKWILDDSGGGERVAVSLANELTKKYEVHLI + GITTKQSDLFFKINSQVRYSNFFDHRVRLSKNILKISKMLRKYFIDNEIEVGFGIGIS + ANVFLSLAGIGTQTKVVLCDHTNSITDNREFSQKFQRYVGTKLADKIITLTQEDRENY + IKKYGVPEERICYIYNWKEAALSDVSYNKKSTKIVTVGRFDYQKGYDYLIQVAKKVLE + KRADWTWEIYGSGNQDEVDKIRDLINENDLQDRLVIKGLEKNQDLIYGDKGIYVMTSR + YEGLPLVLLEAQQYNLPIASFSCPTGPNEIVEDGVNGYLVECYDVEAMSNRLLELMND + KELRNRFSSHAKDNIKKFNKDRIIHQWIDLIEEVSGGENV" + misc_feature 10058..10570 + /gene="wcrC" + /locus_tag="SPC34_0012" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 2e-39" + gene 10644..11660 + /gene="wcrD" + /locus_tag="SPC34_0013" + CDS 10644..11660 + /gene="wcrD" + /locus_tag="SPC34_0013" + /note="member of homology group 32" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34272.1" + /db_xref="GOA:Q4JZG1" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JZG1" + /translation="MSNKILTITVPTYNIENYIGKCIESFKAVNPAYYSDFEVLIIND + GSTDNSVQVVKDLMEGSTLDLRIITKENGGHGSTINRGIKEANGKYFKVIDGDDWINV + QEFESLLDKLREINTDLVISDYTEQHVYNNSTIFKEFSSYLIPNQETRGIPSKWTPMH + ALVYKTSILKDNAITISENTFYVDQEYTMLPLQFVENYIYFKLDIYQYLLGRADQSMN + IDIMRKRADHHERVTKRILDLYKESYTQKPELEKVVSDSLQYLVNKQNILYVMNEELD + KVYELFSYSEKSGFKFKFETKTKTSNLLYVNYKTKYLFNLVIKNLVKRKANSLEKEFQ + EKGF" + misc_feature 10662..11162 + /gene="wcrD" + /locus_tag="SPC34_0013" + /note="HMMPfam hit to PF00535, 
Glycosyl transferase + family, score 2.9e-32" + gene 11765..13177 + /gene="wzx" + /locus_tag="SPC34_0014" + CDS 11765..13177 + /gene="wzx" + /locus_tag="SPC34_0014" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI34273.1" + /db_xref="GOA:Q4JZG0" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4JZG0" + /translation="MKVLKNYAYNLSYQLLVIILPIITTPYVTRVFSSDDLGTYGYFN + SIVTYFILLATLGVANYGTKVISGHREEIQKNFWGIYSLQLGATVLSLALYVLLCLIL + PFMQNPVAYILGLSLVSKGLDISWLFQGLEDFRKITVRNITVKLVGVISIFLFVKSAN + DLYLYVFLLTIFELLGQLSMWLPAREFIDRPHFDLEYAKPHLKPVILLFLPQVAISLY + VTLDRTMLGALASTKDVGIYDQALKLVNILLTLVTSLGSVMLPRVANLLATGNHRAVN + KMHEISFLIYNLVIFPMMAGILIVNDDFVQFFLGQDFQDARYAIAIMSFRMFFIGWTN + IMGTQILIPHNQNKEFMISTTAPAIVSVGLNLLFLPKLGYIGAAIVSVSTEALVWAIQ + LYFTRRYLKEVPIIGSLTKIVLASAIMYGILLGSKTLIQFSPTINVIVFAVLGGIIYL + FAILSLKVVDIKELKHIIKK" + misc_feature 11771..12565 + /gene="wzx" + /locus_tag="SPC34_0014" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 1.2e-71" + gene 13189..14289 + /gene="glf" + /locus_tag="SPC34_0015" + CDS 13189..14289 + /gene="glf" + /locus_tag="SPC34_0015" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI34274.1" + /db_xref="GOA:Q4JZF9" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR006076" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JZF9" + /translation="MYDYLIVGAGLSGAIFAHEATKRGKKVKVIDKRDHIGGNIYCEN + VEGVNVHKYGAHIFHTSNKKVWDYVNQFAEFNNYINSPVANYKGSLYNLPFNMNTFYA + MWGTKTPQEVKDKIAEQTAHMKDIEPKNLEEQAIKLIGPDVYEKLIKGYTEKQWGRSA + TELPPFIIKRLPVRLTFDNNYFNDRYQGIPIGGYNVIIENMLKDVEVELGVDFFTHRE + ELEASAEKVVFTGMIDQYFDYKHGELEYRSLRFDHEILDEENYQGNAVVNYTEREIPY + TRIIEHKHFEYGTQAKTVITREYPADWKRGDEPYYPINDERNNAMFAKYQEEAAQNDK + VIFCGRLADYKYYDMHVVIERALEVVLSELGK" + misc_feature 13624..14226 + /gene="glf" + /locus_tag="SPC34_0015" + 
/note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 6e-136" + gene 14370..15428 + /gene="wcyO" + /locus_tag="SPC34_0016" + CDS 14370..15428 + /gene="wcyO" + /locus_tag="SPC34_0016" + /note="member of homology group 80" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI34275.1" + /db_xref="GOA:Q4JZF8" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q4JZF8" + /translation="MKKIKEYDILKIMAIILVVLSHSAYYKISSNYGGMDYQQYLNSH + SAFTLYKILGKFMEIIYYFHMPLFMAISGVFFSIQIKKDRWNKIEKLLTSKFKRLILP + FFVFTLLYSLPLKYISNYYNGVSFWRAITGQFLLLGNSHLWYLYALFIIFIISFYCLR + RDTSIFVYLSLYIIHVLSFLIHITLVSAPLQFLFWFSMGFLFESKRRKYNIFLENHKW + ISLLFFVLFIFLVVLNFLFKSDFKVLSRFFVDLLAILGSLICYNISYFLSNKTKILDS + KLLNLILINGLGIYIFSDTLNYFILSISYFVSDRFMFTSFGIIIIFLIRFVFTLFLGL + VFTLLFKKVFPKYSWLVN" + misc_feature 14379..15410 + /gene="wcyO" + /locus_tag="SPC34_0016" + /note="HMMPfam hit to PF01757, Acyltransferase family, + score 6.5e-06" + gene 15786..>15938 + /gene="aliA" + /locus_tag="SPC34_0017" + CDS 15786..>15938 + /gene="aliA" + /locus_tag="SPC34_0017" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34276.1" + /db_xref="UniProtKB/TrEMBL:Q4JZF7" + /translation="MMKSSKLLALAGVTLLAATTLAACSGSGSSAKGEKTFSYIYETD + PDNLNYL" + misc_feature 15786..15878 + /gene="aliA" + /locus_tag="SPC34_0017" + /note="Signal peptide predicted for SPC1639 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.804 between residues 31 and 32" +ORIGIN + 1 ccatgggatg ctttctgtgt ggaattacta taaatatttt ttgcagaaaa atttaaaatt + 61 gaaatcgtat aaaaacaagg gaggactgta taaaagacag aaatcctttg ttttttataa + 121 ccaaggttta taagctttca ttctcgaaat tcaattaact ttacaaattc ccactattaa + 181 ggagaaagaa aatgaacata aagaagcgtg tccttagtgc aggcctgact tttgcatctg + 241 ctttgctttt agctgcttgc ggccaatcag gttcagatac aaaaacttac tcatcaacct + 301 ttggtggaaa tccaactaca tttaactatc tattagacta ttacgctgat aacatagtca + 361 attgaaacaa gaacaggaca aaagagcctc gtaaaaggta ttgcaactgg 
gtaatacctt + 421 tttgaggtgc tttttgatat gagcccatgt tttctcaata ggattgtact caggtgagta + 481 gggaggaaga ggtaaaagtt tacgcccaaa ctcctcgcat aaaagttcta gcttccccat + 541 tctatggaat cttacattat ccataataat aaccgatggt gtgtttaatg ttggtaagag + 601 aaaattctga aaccaagctt caaaaaagtc gctcgtcatc gtctcttcgt aagtcattgg + 661 agcgattaat tcaccatttg ttagacctgc aaccaaagaa atcctctgat atcttcttcc + 721 agatactttg cctcttctta actgaccttt taatgagcga ccatattctc gataaaaata + 781 agtatcgaat cctgtttcat caatctaaac aggtgctagg tgctttaaac tattaaaatt + 841 cttaagaaat aaggctgctt tttctgggtc ttgttcatag taggtgtggt tctttttttc + 901 gagtgtagcc catagctttg agcgcatagt ggatggtagt tggatgacag ccaaattcag + 961 aagctatttc agtcaaataa gcgtctggat tgtcagtaag atagttttta agtctatctc + 1021 tatcaacttt tcttggtttt gttcctttta cttggtggtt tagctctcct gttttctctt + 1081 ttagctttaa ccagccataa atggtattac gtgagatttg gaaaacgtgt gatgcttctg + 1141 ttatactacc tgttcgctca caataagaga gaactttttt acgaaaatct attgaatatg + 1201 ccataaaaag attataccac attgtgtact atagtagatt gaaactagaa tagtccacct + 1261 ctgcttctaa aacattgtta gaaatcgatt tgactgtcct gatcgatttg tcctgttctt + 1321 atttcatttt actatatttt tggtttgcgg gaagtctact aagatattta aagatgcaga + 1381 tagtaaaaaa agatgtagac attaccgtaa aaaagtgata taatcgtatg atgttcaatg + 1441 tataggtgtt aatcatgagt agacgtttta aaaaatcagg ttcacagaaa gtgaagcgaa + 1501 gtgttagtat cgttttgctg actatttatt tattgttagt ttgtttttta ttgttcttaa + 1561 tctttaagta caatatcctt gcttttagat atcttaatct agtggtaact gcgttagtcc + 1621 tactagttgc cttggtaggg ctactcttga ttatctataa aaaagctgaa aagtttacta + 1681 tttttctgtt ggtgttctct atccttgcca gctctgtgtc gctctttgca gtacagcagt + 1741 ttgttggact gaccaatcgt ttaaatgcga cttcgaatta ctcagaatat tcaatcagtg + 1801 tcgctgtttt agcagatagt gagatcgaaa atgttacgca actgacgagt gtgacagcac + 1861 cgactgggac tgataacgaa aatattcaaa aactactagc tgatatcaag tcaagtcaga + 1921 ataccgattt gacggtcaac cagagttcgt cttacttggc agcttacaag agtttgattg + 1981 caggggagac taaggccatt gtcctaaata gtgtctttga aaatatcatc gagtcagagt + 2041 atccagacta 
cgcatcgaag ataaagaaga tttataccaa gggattcact aaaaaagtag + 2101 aagctcctaa gacgtctaag aatcagtctt tcaatatcta tgttagtgga attgacacct + 2161 atggtcctat tagttcggtg tcgcgatcag atgtcaatat cctgatgact gtcaatcgag + 2221 ataccaagaa aatcctcttg accacaacgc cacgtgatgc ctatgtacca atcgcagatg + 2281 gtggaaataa tcaaaaagat aaattaaccc atgcgggcat ttatggagtt gattcgtcca + 2341 ttcataccct agagaacctt tatggtgtag atattaatta ttatgttcgt ttgaatttta + 2401 cttcattttt gaaattgatt gatttgttgg gtggaattga tgtttataat gatcaagaat + 2461 ttactgccca tacgaatgga aagtattatc ctgcaggcaa tgttcatctt gattcagaac + 2521 aggctctcgg ttttgttcgt gagcgctact ccctagcaga tggcgatcgt gaccgtggtc + 2581 gcaaccaaca aaaggtgatt gtggctatcc ttcaaaaatt aacgtcaacc gaagcactga + 2641 aaaattatag tacgatcatt aatagcttgc aagattctat ccaaacaaat atgccacttg + 2701 agactatgat aaatttggtc aatgctcagt tagaaagtgg agggaattat aaagtaaatt + 2761 ctcaagattt aaaaggtaca ggtcggacgg atcttccttc ttatgcaatg ccagacagta + 2821 acctctatgt gatggaaata gatgatagta gtttagctgt agttaaagca gctatacagg + 2881 atgtgatgga gggtagatga aatgatagac atccattcgc acatcgtctt tgatgtagat + 2941 gatggtccca agtcaaggga ggaaagcaag actctcttgg cagaagccta cagacagggg + 3001 gtgcgaacca ttgtctctac ctctcaccgt cgcaagggca tgtttgaaac tccggaagag + 3061 aagatagcag aaaactttct tcaggttcgg gaaatagcta aggaagtggc gagtgacttg + 3121 gtcattgctt acggggctga aatttactac acaccagatg ttctggataa gctggaaaaa + 3181 aagcggattc cgaccctcaa tgatagtcgt tatgctttga ttgagtttag catgcatact + 3241 tcctatcgtg agattcatag cgccttgagc aagatcttga tgttgggaat tactccagtc + 3301 attgcccaca ttgagcgcta tgatgctctt gaaaataatg aaaaacgcgt tcgggaactg + 3361 atcgatatgg gctgttacac gcaagtaaat agttcacatg tcctcaaacc caaacttttt + 3421 ggcgaacgtt ataaattcat gaaaaaaaga gttcagtatt ttttagagca ggatttggtt + 3481 catgtcattg caagtgatat gcacaatcta gacagtagac ctcctcatat ggcagaagca + 3541 tatgaccttg ttacccaaaa atacggagaa gcgaaggctc aggaactttt tatagacaat + 3601 cctcgaagaa ttgtaatgga tcaactaatt taggagaaat gatgaaagaa caaaacacga + 3661 cagaaatcga tgtatttcaa ttagttaaaa 
ccttgtggaa acgcaagcta atgattttat + 3721 tagtggcact tgtgacaggt gcgggggctt ttgcatatag cacttttatt gttaagccag + 3781 aatatacgag taccacgcga atttacgtag tgaatcgaaa tcaaggagac aagccggggc + 3841 tgacaaatca ggatttgcag gcaggatctt atctggtaaa agactaccgt gagattgtcc + 3901 tttcgcagga tgtattggaa aaagtagtga caaatttgaa gttggatatg ccagcaaaaa + 3961 cgttagccag caaagttcaa gtgactgtac cagctgacac tcgtatcgtc tcaatctctg + 4021 tcaaggataa acagccagag gaagccagtc gtatcgctaa ttttctacga gaagttgctg + 4081 cagaaaagat cgtcgctgta acgcgagtat ctgatgtaac gacacttgaa gaagcgcgac + 4141 cagctacaac tccctcttct ccaaatgttc gacgcaattc cttgtttggt tttcttggag + 4201 gagcagtcgt aacagtaatt gctgttcttt tgattgagtt gctcgacacc cgtgtgaaac + 4261 gtcctgaaga tgttgaagat gtactgaaaa ttccactttt agggctcgtt ccagatttta + 4321 acaaaataaa ataggaggaa gttatgccaa cattagaaat ctcacaggca aaattggatt + 4381 ctgtaaaaaa ggcagaggaa tattataacg ctttgtgcac gaacctacag ttaagtggag + 4441 atggtttgaa agtattttct atcacttctg tgaaaatagg agaaggaaaa tcaacgactt + 4501 ccgccaatat cgcttgggct tttgcgcgtg caggttacaa aacgctgctg attgatggag + 4561 atattcgcaa ttctgttatg ttaggtgtct ttaaagcaag gaataagatt acaggcctga + 4621 cagaattttt atcaggaact acagacctat cacaagggct ttgtgatacc aatatcgaaa + 4681 atctctttgt aattcaggct ggctctgtgt caccgaatcc gacagctctt cttcaaagta + 4741 agaatttcac tacaatgctt gaaaccttgc gtaaatattt tgactacatc attgtagata + 4801 ctgctcctgt tggtgtcgtg attgatgcgg ctattattac gcgaaactgc gatgcttcta + 4861 ttttagtgac ggaggcaggt gaaataaatc gtcgggatat tcaaaaagca aaagaacagt + 4921 tggaacacac aggaaagccg tttttgggaa ttgtgttgaa taaattcgat acttcagtag + 4981 acaaatacgg ttcttatgga gattatggag attacgggaa aaataaaaaa taggtcgggg + 5041 gatagagatg aatggaaaaa tagtaaagcc ttcattggcc ataatccaga gttttcttgt + 5101 tattttattg acttatctac ttagtgctgt gagagaaacg gagattgttt caacaacagc + 5161 tattgcactt tatatcctcc attattttgt cttttatatc agtgattatg gacaggattt + 5221 ctttaaaagg agatatttga ttgaacttgt ccagacattg aaatatatcc tattctttgc + 5281 actagcgatt agtatttcta attttttctt agaggatcga tttagtattt 
ccagacgagg + 5341 catgatttac ttcctcacat tacatgctct cttagtctat gtgctaaacc tatttatcaa + 5401 gtggtattgg aagcgggctt atcccaactt taaaggaagt aagaagattc tcctacttac + 5461 agcaacttct cgtgtcgaaa aggtactgga tagattaata gaatcaaatg aggttgttgg + 5521 gaagttggta gccgtcagtg tcttagataa accagatttt cagcatgatt gtttaaaggt + 5581 agtagcagag ggggagatag taaactttgc gactcatgag gtggtcgatg aagtctttat + 5641 caatcttcca agtgaaaaat acaatattgg agagcttgtc tctcagtttg aaacgatggg + 5701 aattgatgta atagtcaatc taaatgcttt tgatcgtagt ttggcacgta acaagcaaat + 5761 tcgtgagatg gcagggttaa acgttgtgac tttttctaca acattttata agactagtca + 5821 tgtaattgct aagcggatta ttgatatcgt gggtgcattg gtagggctga tactatgtgg + 5881 tttagtcagt attgtactgg ttcctttgat tcgaaaggat gggggatctg ctatttttgc + 5941 tcagacgcgt ataggaaaaa atggtcgtca gttcactttt tataagtttc gctctatgtg + 6001 tgtagatgcc gaggcgaaaa aaagagaact catggaacaa aataccatgc aaggtggaat + 6061 gtttaaggtg gacgatgatc ctcgtatcac gaaaattggt tgttttatac ggaagactag + 6121 cttggacgag ctaccacagt tttataatgt tctaaaggga gatatgagtt tggttggcac + 6181 acggccacca acagtggacg agtatgaaca ctatacccca gaacaaaaac gtcggctaag + 6241 ttttaaacct ggtataacag gcttatggca ggtcagtgga cgaagtgaga ttaagaattt + 6301 tgatgaagtt gtcaaattag atgtagccta tatagacgat tggacaattt ggaaagatat + 6361 tgagatttta ttgaagacag ttaaagttgt attgatgaag gatggagcga agtagattga + 6421 tagatgtaaa aatcattgtg gcaacacata aagaggttaa aatgcctcaa gacagtagtc + 6481 tttaccttcc aatacatgtt gggagagacg gtaaatcaga tattggtttt atcggtgata + 6541 atactggcga taatatatcc tctctaaatc catattattg tgagttgacg ggactttatt + 6601 gggcatggaa gaatcttgat tataattact taggtttagt tcattaccgt cgttatttta + 6661 caaataaatc tcaagggtat aatgaaaatg tcaatatgga tgacgtcatt ttgtctcgat + 6721 ctaatgttga aatattatta gagaaatctg acataatagt tccaaagaag cgaaagtatt + 6781 atattgaaac tctttattca cattatgccc atacccttaa tggagaacat ctggatcttg + 6841 ctaggaaaat tattgagcaa aatagttcag agtatctttc atcctttgat aaagtgatga + 6901 aacaaagaag aggttatatg ttcaatatgt ttatcatgaa aaaagaacta ttagatgatt + 6961 atttaccgtg 
gcttttttct attctggata ctatgtacga acagatggac ttgaccgact + 7021 atactccatt tgagtcacgt ttattcgggc gagttagtga gttgttgttt aatgtttggt + 7081 tatgtaaaaa aggaataacg cctaaagagg taccatttat gtacatggag agagtgcatt + 7141 tgtttgaaaa aggaaaatct tttttaatgg ctaaattttt tggaaagaag tatggacaga + 7201 gtttttaaga gcacttatta aattatatac tccgaattct atatgtttag taaataaaca + 7261 ttttgtagtt aagagtatta atacttgaag gaatgtagat gctttatata ttattttatt + 7321 tattattatt attttttatt ataaattatg cttttgtaag aggagattat tttcacccaa + 7381 caattatctt taactttact tttttgatag caacactgtt ttgcatttta aatgctcaag + 7441 agtatgctat tgagttcaat ggaggtacag tttttattgt gacgatttca atgctcgttt + 7501 ttacaataat aacagtatta tcaaagaaaa tatttaagac taatactttc acctttaaga + 7561 ataaattaaa atatctatat gtcagtaaaa gtctaatttt tacaataatt attattcaga + 7621 ttttaaatct tattttcttt tatcgatacg aacaagcttt attcagcgct tatgttggcg + 7681 gtcgtggaag tttctcgcaa ataattaata actatgacca attagtaaag ttttttactg + 7741 aagacttagt cggattgggg gtcaggtctc cgttttttta tagagtgttt aatagcttca + 7801 tatctcctat ttcttacgtg attatataca ttatttgtca caattatgtg gcaacaagaa + 7861 gaatagataa atttcaactc ctagttcctt gtttatttgc aattcaaatt tttatgactg + 7921 gtagtagagg gtccttgttt aaaattttga cttttatatt agttgttttt tatattttac + 7981 tactgcgtaa taaaggactt agtaaattga gttctcgctt tgcttttaag gtccttattg + 8041 ttgtagtggc agttgctcct ctatttgtac tttatttaaa tgcaacgggg cgttccggtg + 8101 gagtaggtca agatgggatt attgaagctc ttaatcgaga actattcaag tacattggcg + 8161 ctccgttatt aaattttaac aattttattg ctggatatga tccgtataga agtgactcag + 8221 tatattgggg agaacagact ttttatggct tttataaatt cttgtatagt aaactacact + 8281 tgatagattt taatattaaa agtattattg gtagtgattc ttttgtgaag agtaccaatg + 8341 gattgcctac agggaatgtc tttacaactt tttatacgtt tttttatgac ttcacttatt + 8401 tcggcattat tccattagta tctgtaattg cattatattt tgttccaact tatagtagga + 8461 tattgggtac agaatattgt gcaaaaaaat atttatttga ttataagtta tttatctatg + 8521 cttatttgtt taatgatgtt ataatgttga ttttttcaaa tcgatttttt gaaagtatat + 8581 taacagttgg ttttttacgt tttttaataa 
ctagtgccat tttagtctgg ataataaaac + 8641 aaaatattgt ttttaagtat aaaaaatagt tgaaagctat gcaaattggt aatttatcta + 8701 aaaaaggtgg agaatagtaa atggaagaag atacaaagtt atataagatt caatctaaag + 8761 aattagaatt acttaaggtt ttgactaata tttgtgaaga aaataacctg acctactatg + 8821 ctctaggtgg gaccttgttg ggcgcggtac gtcataaagg attcatacct tgggatgacg + 8881 atattgatat cggtatgcca agagaagatt atgaaaagtt taaaatacta gctccaaacc + 8941 tgttaccaag taatttaaaa atagttaata atccacttaa tcttgatata actcagttag + 9001 tagataaaaa tgttattgtt aaaattgcga attcggaaag caatgtgttt attgacattt + 9061 ttcctctaga tggttataca gaaaaaggat tttttgcagc taaattgcat agttttaggc + 9121 tattgtttca aagaatgctt tgtaaaatat cagttttaga ccagcttgaa gataaagacc + 9181 gtggcactgt ggagaatctt atagttaaaa tatcgaaaat gctaagaatc caaaaagtac + 9241 ttcctaagga tacattggta gaaaatctgc ataaagttat tcaaaaatat gattttaaaa + 9301 cttctcgtta cgtcggtaat gttctaggta gatataggga gagagaaata gttccgagag + 9361 agtattttaa agaacctgtt tctcttattt ttgaggatac gatgataaac tgtccgacaa + 9421 agtacaagga atatttaaac gaaatctacg gtgattacat gaaattacca tcagtagaag + 9481 atagagtagc acataatata gaacttatat cagtaggtga tgcagagtga agggtaggat + 9541 agaaattggg aaaaaaatat gtattgtgaa atggattttg gatgattctg gtggcggtga + 9601 gcgagttgct gtatctttgg caaacgaact tacaaaaaag tatgaagttc atttaattgg + 9661 aattacaaca aagcaatcgg acctgttctt taaaatcaat tctcaagtaa gatactccaa + 9721 tttttttgac catagagtac gcttgtctaa gaatattcta aaaatctcaa aaatgttaag + 9781 aaaatatttc atagataatg aaatagaggt tggttttggg atagggatat ctgctaatgt + 9841 atttttatct ttggcaggaa taggaactca aactaaagta gttttgtgtg atcataccaa + 9901 ttcgattacg gataatagag aattttctca gaaattccaa agatatgttg ggacaaagtt + 9961 ggcagacaag attatcactc tcactcaaga agaccgtgaa aattatataa aaaaatacgg + 10021 tgttcctgag gaaagaattt gctacatcta taattggaaa gaggctgctc tttcagatgt + 10081 atcttataat aaaaaatcaa ctaaaattgt gactgttggc cgttttgatt atcaaaaagg + 10141 ctatgattat ctcattcaag tcgcgaaaaa agtgttagag aaaagggctg actggacttg + 10201 ggaaatctac ggttccggca atcaagatga agtagataaa atcagagatt 
taatcaacga + 10261 aaatgattta caggataggt tagtcataaa aggactcgaa aaaaatcaag atttgattta + 10321 tggagataaa gggatttatg tcatgacttc tcgctatgaa ggtctacctt tagtcctgct + 10381 ggaagcacaa caatacaatc ttcctatagc tagctttagt tgtccgacag gaccgaacga + 10441 aattgttgaa gatggagtta atggctatct ggttgagtgt tatgatgtag aagcgatgtc + 10501 taatagatta ttagaactaa tgaatgataa ggagctaaga aatcgttttt catctcatgc + 10561 aaaagataac attaaaaaat ttaataaaga ccgaattata catcagtgga tagatttgat + 10621 agaagaagta tctggggggg aaaatgtcta ataaaatact gacgattact gtgccaacct + 10681 ataatattga aaactatatt ggtaaatgca tagaatcatt taaagctgta aatcctgctt + 10741 attacagtga ttttgaagtg ttaatcatta atgacggaag tactgataat tctgtacaag + 10801 ttgttaagga tttaatggaa ggtagcactt tagatttaag aattatcaca aaagaaaatg + 10861 ggggccatgg ctcaactatt aatcgcggga ttaaagaagc taatggaaaa tattttaagg + 10921 tcattgatgg ggatgattgg atcaatgttc aagaatttga aagcttattg gataagttaa + 10981 gagagattaa cactgattta gtgatttctg actatacaga gcagcatgta tataataata + 11041 gcactatttt taaagaattc tcttcttatc taattccaaa tcaagagaca agaggtattc + 11101 ctagcaagtg gacacctatg catgccctgg tctataaaac aagtatcttg aaggataatg + 11161 ctattacgat tagtgaaaat acattttatg tcgaccaaga gtatacaatg ctccccctcc + 11221 aatttgtaga aaattatatt tattttaagt tggatattta tcagtactta ttgggaagag + 11281 ctgatcagag tatgaatatt gatataatga gaaagagagc agatcatcat gagagagtaa + 11341 cgaaacgaat cttagactta tataaagaga gttatacaca aaagccagaa ttagaaaagg + 11401 ttgtcagtga ctctttgcag tatctggtta ataagcaaaa tattttgtat gttatgaatg + 11461 aggaacttga caaggtatat gaactgtttt catattctga aaaaagtgga ttcaaattta + 11521 aatttgaaac aaaaacaaag acttcaaatt tactttatgt caattataaa acgaagtatc + 11581 tttttaacct tgttattaaa aatctagtta aaagaaaagc aaacagtcta gaaaaagaat + 11641 ttcaagagaa gggattttga tgaaatatgc cagagagcaa aataaagcat caatttcttc + 11701 tgagggtatt tatgaatcga ttaagtattc tgcttaagat gatgttcaat aggagagtgc + 11761 aggtatgaaa gtactaaaaa actacgccta taatctttct tatcagttat tagtgattat + 11821 actcccaatc attacgactc cctatgtaac acgggtcttt tcttcggatg 
atttagggac + 11881 gtatggatac tttaattcca ttgtcaccta ctttatcctc ttagcgacgc tgggagttgc + 11941 taactatggg actaaggtca tttcagggca tcgcgaggaa attcaaaaaa acttttgggg + 12001 aatctactct ctacaattag gggcaacagt tctttctctg gccttatatg ttcttctttg + 12061 tctgatcctt ccctttatgc aaaatccggt agcctacatt ctaggcttga gtttagtttc + 12121 aaaaggttta gacatttcct ggctctttca agggttggaa gattttcgaa agattactgt + 12181 tcgaaatatc acggtcaagc ttgttggagt catttcaatc ttcctctttg tcaaatctgc + 12241 aaatgaccta tatctctatg tttttttgct aaccatattt gaactcttgg ggcaactaag + 12301 tatgtggttg cctgctcgtg agtttattga tagacctcat tttgatttag aatatgctaa + 12361 gcctcatttg aagcccgtca tattattatt tcttcctcaa gtagcaatct ctttgtatgt + 12421 taccttagat cgtaccatgc ttggagcatt ggcttctaca aaagatgtag ggatttatga + 12481 tcaggctcta aagttggtaa atatactttt gaccttggta acttccttgg gaagtgttat + 12541 gttgcctcga gtagctaact tattagcaac aggaaatcat agagcagtca ataagatgca + 12601 tgaaatatcc ttcctcattt ataatttagt gattttccca atgatggcag gaattttaat + 12661 cgtcaatgat gattttgttc agtttttcct tgggcaggat tttcaggatg cacgttatgc + 12721 aattgccatt atgagcttcc gtatgttctt tatcggttgg accaatatca tgggaactca + 12781 gatactgata cctcacaatc aaaataaaga gttcatgatt tcaacaacag ctcccgcaat + 12841 tgtcagtgta ggtttgaact tactattcct tcctaaactt ggatatatag gagcagccat + 12901 tgtttctgtt tcgacagagg cgttagtatg ggcgatacaa ttatacttta cccgtagata + 12961 cctaaaagaa gttccaatta tcggatcttt gacaaaaata gtcctagcat cagctatcat + 13021 gtatggcatt ctgctaggtt caaaaacact tatacaattt tcgccaacta taaatgttat + 13081 agtatttgca gtgcttggtg gaatcattta tctttttgca attctatctc taaaagtggt + 13141 agatatcaaa gaattaaaac atattattaa aaaataatgg agttaactat gtatgattat + 13201 cttatcgtcg gtgctggttt gtctggagca atcttcgcac acgaagctac aaaacgcggt + 13261 aaaaaagtaa aagttattga taaacgtgac cacattggtg ggaatatcta ttgtgagaat + 13321 gtagaaggtg ttaatgttca taaatatggt gcacatatct tccatacttc taataaaaaa + 13381 gtctgggatt atgttaatca atttgctgaa tttaacaact acatcaactc gcctgtagca + 13441 aattacaagg gtagccttta taatctgcct ttcaatatga atactttcta 
tgctatgtgg + 13501 gggacaaaaa ctcctcaaga ggtcaaagat aagattgctg agcaaacggc tcacatgaag + 13561 gacattgaac ctaaaaactt ggaagaacag gctatcaagt tgatcggtcc agatgtctat + 13621 gaaaaattaa tcaagggtta tactgaaaag cagtggggac gctcagcaac ggaacttcct + 13681 ccatttatca ttaaacgtct tccagttcgt ttaacatttg ataataacta ttttaacgac + 13741 cgttaccaag gaattcctat tggtggttac aatgtcatca tcgaaaatat gcttaaagac + 13801 gttgaagttg agcttggtgt tgatttcttt actcatcgtg aggagttaga agcatcagct + 13861 gaaaaagttg tcttcacagg gatgatcgac cagtattttg actacaagca tggagagtta + 13921 gaataccgta gccttcgctt tgatcatgaa attttggacg aggaaaatta tcaaggaaat + 13981 gctgtagtga actatacgga gcgtgagatt ccttatactc gtattattga gcataaacac + 14041 tttgagtatg gtacgcaagc taaaacggtc attactcgtg aatacccagc tgattggaaa + 14101 cgcggagatg aaccttatta tccaatcaat gatgagagaa acaatgctat gtttgctaaa + 14161 tatcaagaag aagcagcaca gaatgataag gtgattttct gcggacgttt ggccgattat + 14221 aaatactacg acatgcatgt ggtcattgaa cgtgccttag aagtcgtatt aagtgagtta + 14281 ggaaagtagt caattacatt aaggtcaagt ttaatgacct tatatctttt ctataaagaa + 14341 aaactacaat tagaggagcg agatttaatg tgaaaaagat aaaagaatat gatattttaa + 14401 aaattatggc tattatttta gttgtgttaa gtcatagtgc gtattataaa atatcgagca + 14461 attatggtgg aatggattat caacaatatt taaatagtca ttcagcattt actctatata + 14521 agatacttgg taaatttatg gaaattatct attattttca tatgccatta tttatggcta + 14581 tatcgggtgt atttttctct attcaaataa aaaaagatcg atggaataag attgagaaat + 14641 tattaactag taagtttaaa agattaatat tgccattttt tgtttttact ttattatata + 14701 gtttgccatt aaaatatata tcaaactact acaatggtgt ttcgttttgg agagctataa + 14761 ctggtcaatt cttgttatta ggaaattctc acttatggta tttgtatgca ttatttatta + 14821 tctttataat tagtttttat tgtttaagaa gagatacttc tatatttgta tacttgtcct + 14881 tatatattat acatgtactg agtttcttga ttcatataac gttagtaagt gcaccattgc + 14941 agtttctttt ttggttttcc atgggatttt tgttcgaatc taaaagaagg aagtataata + 15001 tttttttgga aaatcacaaa tggattagcc ttttattctt tgtgttattt atatttttgg + 15061 tggttttaaa ttttctattt aaaagcgatt ttaaagtatt gagtcgattt 
tttgttgact + 15121 tattagctat tttaggatca cttatttgtt acaatatttc gtacttttta agtaataaaa + 15181 ctaaaatttt agatagtaaa ctacttaatc tcattttgat taatggttta gggatatata + 15241 ttttttctga tactttaaac tattttatat taagtatttc ttattttgta agtgatagat + 15301 ttatgtttac ttcatttggt ataattatta tatttttaat tagatttgtt ttcactttat + 15361 ttttgggatt agtctttaca ttgctattta aaaaagtatt tccaaaatat tcttggttag + 15421 ttaactagaa aatacaatat cagtgattat gcactataag ctatcctgta attcttacag + 15481 ttaaatattt tatcctatat actgaggaga caaataaaat aacttatagt attttgcacc + 15541 ttatctagtt taattgtaat ataaaagaaa atatccagga agtggtatag tactctctca + 15601 ttgtttaact tcgcttaaat atataggtta attccttgac tatgtgatgt agttgaggga + 15661 tttttgataa tattcatatt ttttgcaaag atgttgtttg aaaaataatt ttcaaaaatt + 15721 ctgaaaattc tgttgacaac tttctgaaaa gagtctataa tggagagaaa gttttaaagg + 15781 agaaaatgat gaaaagttca aaactacttg cccttgcggg cgtgacatta ttggcggcga + 15841 ctactttagc tgcatgctct ggatcaggtt caagcgctaa aggtgagaag acattctcat + 15901 acatttatga gacagaccct gataacctca actatttg +// + diff --git a/public/res/serotype_genbank/serotype_35A.gb b/public/res/serotype_genbank/serotype_35A.gb new file mode 100644 index 0000000..ecbaf53 --- /dev/null +++ b/public/res/serotype_genbank/serotype_35A.gb @@ -0,0 +1,955 @@ +LOCUS CR931704 21463 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 1936/39 (serotype 35a). +ACCESSION CR931704 +VERSION CR931704.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 21463) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 
2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 21463) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..21463 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="1936/39" + /db_xref="taxon:1313" + gene <1..163 + /gene="dexB" + /locus_tag="SPC35A_0001" + CDS <1..163 + /gene="dexB" + /locus_tag="SPC35A_0001" + /codon_start=2 + /transl_table=11 + /protein_id="CAI34277.1" + /db_xref="GOA:Q4K2R1" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K2R1" + /translation="DRRFLVVANLSNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVP + WDAFCVELL" + gene 322..490 + /gene="aliB" + /locus_tag="SPC35A_0002" + /pseudo + CDS 322..490 + /gene="aliB" + /locus_tag="SPC35A_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(508..1008) + /gene="tnp" + /locus_tag="SPC35A_0003" + /pseudo + CDS complement(508..1008) + /gene="tnp" + /locus_tag="SPC35A_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase (fragment)" + gene 1230..2675 + /gene="wzg" + /locus_tag="SPC35A_0004" + CDS 1230..2675 + /gene="wzg" + /locus_tag="SPC35A_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI34280.1" + /db_xref="GOA:Q4JZF5" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + 
/db_xref="UniProtKB/TrEMBL:Q4JZF5" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLLFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYSDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGIDVYNDQ + EFTAHTNGKYYPAGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1230..1346 + /gene="wzg" + /locus_tag="SPC35A_0004" + /note="Signal peptide predicted for SPC1643 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 39 and 40" + misc_feature 1434..1781 + /gene="wzg" + /locus_tag="SPC35A_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 1.3e-62" + misc_feature 1959..2402 + /gene="wzg" + /locus_tag="SPC35A_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 2.5e-69" + gene 2677..3408 + /gene="wzh" + /locus_tag="SPC35A_0005" + CDS 2677..3408 + /gene="wzh" + /locus_tag="SPC35A_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34281.1" + /db_xref="GOA:O86886" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:O86886" + /translation="MIDIHSHIVFDVDDGPKSREESKALLTESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDRGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEQDLVHIIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 2680..3288 + /gene="wzh" + /locus_tag="SPC35A_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 4.6e-36" + gene 3414..4109 + /gene="wzd" + /locus_tag="SPC35A_0006" + CDS 3414..4109 + 
/gene="wzd" + /locus_tag="SPC35A_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34282.1" + /db_xref="GOA:O86887" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:O86887" + /translation="MMKEQNTIEIDVFQLFKTLWKRKLMILIVALVTGAGAFAYSTFI + VKPEYTSTTRIYVVNRNQGDKPGLTNQDLQAGSYLVKDYREIILSQDALEKVATNLKL + DMPAKTLASKVQVTVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIELLDTRVKRPEDVEDVLKI + PLLGLVPDFDKIK" + misc_feature 3414..3530 + /gene="wzd" + /locus_tag="SPC35A_0006" + /note="Signal peptide predicted for SPC1645 by SignalP 2.0 + HMM (Signal peptide probability 0.625) with cleavage site + probability 0.411 between residues 39 and 40" + misc_feature 3435..3851 + /gene="wzd" + /locus_tag="SPC35A_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 3.1e-55" + misc_feature 3957..4034 + /gene="wzd" + /locus_tag="SPC35A_0006" + /note="PS00217 Sugar transport proteins signature 2." 
+ gene 4119..4808 + /gene="wze" + /locus_tag="SPC35A_0007" + CDS 4119..4808 + /gene="wze" + /locus_tag="SPC35A_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34283.1" + /db_xref="GOA:Q4JZK1" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4JZK1" + /translation="MPTLEISQAKLDSVKKAEEYYNALCTNLQLSGDGLKVFSITSVK + IGEGKSTTSANIAWAFARAGYKTLLIDGDIRNSVMLGVFKARNKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFTTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRNCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGIVLNKFDTSVDKYGSY + GNYGDYGKNKK" + gene 4823..6190 + /gene="wchA" + /locus_tag="SPC35A_0008" + CDS 4823..6190 + /gene="wchA" + /locus_tag="SPC35A_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI34284.1" + /db_xref="GOA:Q4JZF1" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4JZF1" + /translation="MNGKILRSSLAIIQSFLVILLTYLLSAVRETEIVSTTAIALYIL + HYFVFYISDYGQDFFKRRYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYF + LTLHAPLVYVLNLFIKWYWKRAYPNFKGGKKILLLTATSRVEKVLDRLIESNEVVGKL + VAVSVLDKPDFQHDCLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + IDVTVNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHIMAKRIIDIMGALVGLIL + CGLVSIVLVPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVLM + KDGAK" + misc_feature 4823..4909 + /gene="wchA" + /locus_tag="SPC35A_0008" + /note="Signal peptide predicted for SPC1647 by SignalP 2.0 + HMM (Signal peptide probability 0.844) with cleavage site + probability 0.429 between residues 29 and 30" + misc_feature 5606..6187 + /gene="wchA" + /locus_tag="SPC35A_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 4.8e-158" + gene 
6177..6983 + /gene="wciB" + /locus_tag="SPC35A_0009" + CDS 6177..6983 + /gene="wciB" + /locus_tag="SPC35A_0009" + /note="member of homology group 16" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34285.1" + /db_xref="GOA:Q4JZF0" + /db_xref="UniProtKB/TrEMBL:Q4JZF0" + /translation="MERSRLIDVKIIVATHKEVKMPQDNSLYLPIHVGRDGKSDIGFI + GDNTGDNISSLNPYYCELTGLYWAWKNLDYNYLGLVHYRRYFTNKSQGYNENVNMDDV + ILSRSNVEILLEKSDVIVPKKRKYYIETLYSHYAHTLNGEHLDLARKIIEQNSSEYLS + SFDKVMKQRSGYMFNMFIMKKELLDDYLPWLFSILDTMYEQMDLTDYTSFESRLFGRV + SELLFNVWLCKKGITPKEVPFMYMERVDLFEKGKSFLMAKFFGKKYGQSF" + gene 6992..8185 + /gene="wzy" + /locus_tag="SPC35A_0010" + CDS 6992..8185 + /gene="wzy" + /locus_tag="SPC35A_0010" + /note="member of homology group 45" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI34286.1" + /db_xref="UniProtKB/TrEMBL:Q4JZE9" + /translation="MKITIKRYSLPEILGLAALAIFLLFSLLSITLYAQYISIKVYFI + ALFGIILLIFLKELISESYNLKSVIGLFVIFTLCFIIGTVTNYAYFFILGLFLIYSLR + NLPFSDVAKVSFIISISVLLLVVLSSKLGIIPDYVEIWPTRVRHYLGFRYSLLPSTLM + MNIIAISFFLKQENASYPRLLVLFLLSGWLYVETDSRLTFINSCLFLLVNLIMKLSPS + IIEKVGRLLKLFSFTYFINACLSYWIAKTYLNTSNVVLNQFFYQVDQFLGGRIYYSNR + SLSLYGYKLLGQKIDWIGNGLSIQGERSTETYLYVDNLYIQILQHFGLIVSVIILSLL + TITLVKLLKKGQMVLGIILVILSFHALIDDLILNLYYNIFWVLIGMLIYKKYQFYDKK + QLTIE" + misc_feature 6992..7093 + /gene="wzy" + /locus_tag="SPC35A_0010" + /note="Signal peptide predicted for SPC1649 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.778 between residues 34 and 35" + gene 8340..9335 + /gene="wcrI" + /locus_tag="SPC35A_0011" + CDS 8340..9335 + /gene="wcrI" + /locus_tag="SPC35A_0011" + /note="member of homology group 128" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34287.1" + /db_xref="GOA:Q4JZE8" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JZE8" + 
/translation="MNKISLTDNLPLISVVLPVYNVENYLEKCLNSVVRQTYKNIEII + IVNDGSLDSSIDICNKYANKDSRIKVFTKPNGGLSDARNFGIKKSMGEFITFVDSDDY + VTDDYVEYLYSLVKKYNCKMSMCSIFVHYISNDKMINNGTGRELMMTAEQCIEKMCYH + DEVDTCAYAKLYHRSLFSEICFPKGRIFEDIGTIYRFFDTAGQIACGFNAKYYYEIRE + NSIVTSSFSEKKFDLLFMTDQMRNFVDQRYPSLKAATKRRAVYARFSTLNQLLDVQGY + NEEKKEIIRFIQDNKEALLENPKTPKRDRLAVRALSLGFCIYKLLWKQYLKIQRG" + misc_feature 8379..8882 + /gene="wcrI" + /locus_tag="SPC35A_0011" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 5.4e-48" + gene 9337..10479 + /gene="wcrJ" + /locus_tag="SPC35A_0012" + CDS 9337..10479 + /gene="wcrJ" + /locus_tag="SPC35A_0012" + /note="member of homology group 129" + /codon_start=1 + /transl_table=11 + /product="putative glycerol phosphotransferase" + /protein_id="CAI34288.1" + /db_xref="GOA:Q4JZE7" + /db_xref="InterPro:IPR007554" + /db_xref="UniProtKB/TrEMBL:Q4JZE7" + /translation="MNKEFLKYIYIRLLRNLRRIFFIIPIIRNRVVFESFSGDAYSCN + PKYISEELRKQYGDSVEIIWAFNDPNKFKKELPKEIVTCRYRSFNHLIYRITSKVYIC + NFLQAIEIPKRKGQLEIQTWHGGGCYKKVGVAEKGRQAAYVKRQRMHVEETDLFITSS + KYFENEVVKKQFGYKGEILSIGMPRNDILINLPISSQVEKLKEKLGLPNNKLIALYAP + TWRSGTKQYETLDIKKLTQAVDKKFGKKCIVLFRSHLYGNQSYDDVVDVSQYSDMQEL + LLLSDILITDYSSSMWDFSLSFKPCFLYTPDLKDYLDERGFDEDIHSWGFSVSESNKE + LVENILQFNNEEYRQKMKNHHQFLESYEQGDAVKRVVAKIAEYCNL" + misc_feature 9937..10464 + /gene="wcrJ" + /locus_tag="SPC35A_0012" + /note="HMMPfam hit to PF04464, + CDP-Glycerol:Poly(glycerophosphate) gl, score 1.5e-35" + gene order(10492..10611,10636..11399) + /gene="wcrK" + /locus_tag="SPC35A_0013" + /pseudo + CDS join(10492..10611,10636..10749,10742..11125,11112..11399) + /gene="wcrK" + /locus_tag="SPC35A_0013" + /note="member of homology group 130" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + misc_feature join(10540..10611,10636..10742,10749..11112,11125..11381) + /gene="wcrK" + /locus_tag="SPC35A_0013" + /note="HMMPfam hit to PF05704, Capsular polysaccharide + synthesis protein, score 1.6e-33" + /pseudo + 
gene 11419..12135 + /gene="mnp1" + /locus_tag="SPC35A_0014" + CDS 11419..12135 + /gene="mnp1" + /locus_tag="SPC35A_0014" + /note="member of homology group 131" + /codon_start=1 + /transl_table=11 + /product="putative IspD-family transferase (mannitol)" + /protein_id="CAI34290.1" + /db_xref="GOA:Q4JZE6" + /db_xref="InterPro:IPR001228" + /db_xref="InterPro:IPR018294" + /db_xref="UniProtKB/TrEMBL:Q4JZE6" + /translation="MNLAVIFAGGSGTRMNAKDRPKQFLLVHGKPIIVHTIELFENHP + EIDGIIVVCIEDWIPYMEEMKYRYRLDKIAKIVPGGATGQLSIYNGLVAAEQVYGIED + NVVLIHDGVRPLITADTISDNIQSVKEKGNAITCTVAKETVILVDDENKVGEVPSREH + SRFAKAPQSFWLKDILGAHRDSVDNGRNDFIDSCTMMRHYGHDLHVVVGPYENIKITT + PDDFYIFRALYDLRENEQLK" + misc_feature 11425..12117 + /gene="mnp1" + /locus_tag="SPC35A_0014" + /note="HMMPfam hit to PF01128, Uncharacterized protein + family UPF000, score 2.4e-23" + misc_feature 11425..12114 + /gene="mnp1" + /locus_tag="SPC35A_0014" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 7e-05" + gene 12154..13224 + /gene="wcrH" + /locus_tag="SPC35A_0015" + CDS 12154..13224 + /gene="wcrH" + /locus_tag="SPC35A_0015" + /note="member of homology group 51" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34291.1" + /db_xref="GOA:Q4JZE5" + /db_xref="InterPro:IPR016503" + /db_xref="UniProtKB/TrEMBL:Q4JZE5" + /translation="MKYFVEETLLDEQDKKNAGGKARQDVTDILESIGYQKLIAESGM + NERQELNAVQRLVHHYKVKKMWKKTLSVVGKGDEVIIQFPLLNHSLFFNQVIKQLSKN + GVKVYFLIHDLESLRWSQSKSISLKSRIRLNIEERSVLRLSEGIIAHNKKMKSYIKTY + SVESSKIIPLEIFDYIIPSYHERKNLDNFQLNAPIVIAGNLKQHKAGYVYHLPSNVEF + NLYGIGYEQTDDKSVHYCGSFMPEELPFVLKGSFGLVWDGPSSESCIETYGEYLRVNN + PHKTSLYLASGIPVVVWSEAAIASFIKENNCGILVSNLSELPELLSMITVDEYELMKK + NTEIIGERLRQGFYTKQAVKGF" + gene 13240..14319 + /gene="mnp2" + /locus_tag="SPC35A_0016" + CDS 13240..14319 + /gene="mnp2" + /locus_tag="SPC35A_0016" + /note="member of homology group 132" + /codon_start=1 + /transl_table=11 + /product="putative dehydratase/epimerase (mannitol)" + 
/protein_id="CAI34292.1" + /db_xref="GOA:Q4JZA9" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JZA9" + /translation="MIESFNDKVLQEDLEIIAKEELPFRKFRNSTVFITGVTGLVGLQ + LFKALACINRVHQLNMKIIGLVRNLDKAEKIFGDLLKRKDIQIVLGDVSEDFHSYIPD + GLVIDYIIHGASVTTSKLMIEFPVDTIRVAFNGTYQMLELAKEKKVKSFVYLSSMEVY + GSFQSDRTTVVNENMLGYLDLTSVRTNYPECKRICENMCIAFLSQYQVPAKIARLSQT + FGAGTLPGENRVFAQFARSVMQGKDIVLHTLGQSEGNYCYTADTVVALLTILLRGENG + EAYNIANEESHTTIADMAKMVTSQFSQTSQVVFDIPKKNIFGYAVDTKMKLSTHKIQQ + LGWKPRVSLVDAYDRMMRSMNETGV" + misc_feature 13333..14085 + /gene="mnp2" + /locus_tag="SPC35A_0016" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 9.2e-23" + misc_feature 13336..14178 + /gene="mnp2" + /locus_tag="SPC35A_0016" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/iso, score 0.00013" + gene 14328..15743 + /gene="wzx" + /locus_tag="SPC35A_0017" + CDS 14328..15743 + /gene="wzx" + /locus_tag="SPC35A_0017" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI34293.1" + /db_xref="GOA:Q4JZA8" + /db_xref="InterPro:IPR002528" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4JZA8" + /translation="MKVLKNYLYNLSYQLLVIILPIITTPYVTRIFSSDDLGTYGYFN + SIVTYFILLATLGIANYGTKEISGNRKSIQKNFWGIYTLQFGATTFSIFLYILACLFI + PGMKNLVAYILGLGLVSKGLDISWLFQGLEDFRKITVRNITVKLVGVSAIFLFVKSAS + DLYLYVFLLTAFELLGQLSMWFPAREYIGKPHFDIEYARHHLKPVILLFLPQIAISLY + VTLDRTMLGALASTKDVGIYDQALKLVNILLTLVTSLGSVMLPRVAHLLATGDHKVVN + KMHEVSFLIYNLVIFPIMAGMLIVNDDFVQFFLGQDFQDARYAISIMIFRMFFIGWTN + IMGIQILIPHNQNKEFMISTTTPAIISVGLNLLFLPKLGYIGAAIVSVLTEALVWAIQ + LFYTRRYLKEVPIIGSMSKIILASAIMYGLLLSSKTVIHFSPTLNVLAFVALGGIIYL + FAILSLKVVDVKELKQIIRKN" + misc_feature 14334..15128 + /gene="wzx" + /locus_tag="SPC35A_0017" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 1.5e-65" + gene 15745..16743 + /gene="wciG" + /locus_tag="SPC35A_0018" + CDS 15745..16743 + 
/gene="wciG" + /locus_tag="SPC35A_0018" + /note="member of homology group 21" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI34294.1" + /db_xref="GOA:Q4JZE2" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q4JZE2" + /translation="MRKNRNINLDLLKVLACVGVVLLHTTMGGFKETGSWNLLAYLYY + LGTYSIPLFFMINGYLLLGKREITYLYILPKVKWILITVSSWSFIVWLFKRDFTTNPI + KKIVGSLIQRGYFFQFWFFGALILIYLCLPILRQFLNSKRSYLYSLSLLMTIGLIFEL + SNILLQMPIQTYVIQTFRLWTWFFYYLLGGYIAQFTIEEIESRFKNWMKIVSILLLLI + SPIILFFIAKTIYHNLFAEYFYDTLFVKVSTLGIFLTILMLTLNENRRESIVSLSNQT + MGVFIIHTYIMKVWEKVLGFNFVGAYLFFALFTLSVSFIIVGMLMKIPYFNRIVKL" + gene 16757..17866 + /gene="glf" + /locus_tag="SPC35A_0019" + CDS 16757..17866 + /gene="glf" + /locus_tag="SPC35A_0019" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI34295.1" + /db_xref="GOA:Q4JZE1" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR006076" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JZE1" + /translation="MYDYLIVGAGLSGAIFAYEATKRGKKVKVIDKRDHIGGNIYCEN + VEGVNVHKYGAHIFHTSNKKVWDYVNQFAEFNNYVNSPVANYKGSLYNLPFNMNTFYA + MWGTKTPQEVKDKIAEQTADMKDVEPKNLEEQAIKLIGPDIYEKLIKGYTEKQWGRSA + TELPPFIIKRLPVRLTFDNNYFNDRYQGIPIGGYNVIIENMLKDVEVELEVDFFAHRE + GLEASAEKVVFTGMIDQYFDYKHGELEYRSLRFEHEILDEENYQGNAVVNYTEREIPY + TRIIEHKHFEYGTQAKTVITREYPADWKRGDEPYYPINDEKNNAMFAKYQEEASKNDK + VIFCGRLADYKYYDMHVVIERALEVVEKEFGYDKK" + misc_feature 17192..17794 + /gene="glf" + /locus_tag="SPC35A_0019" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 1.1e-136" + gene 17814..18881 + /gene="wcjE" + /locus_tag="SPC35A_0020" + CDS 17814..18881 + /gene="wcjE" + /locus_tag="SPC35A_0020" + /note="member of homology group 18" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI34296.1" + /db_xref="GOA:Q4JZE0" + /db_xref="InterPro:IPR002656" + 
/db_xref="UniProtKB/TrEMBL:Q4JZE0" + /translation="MNGRLRLWRKSLDMTKSRINWIDFGKGFSIFLVLAGHVLLGLYQ + SEKFPTANNILSLLIAQVYIFHIPVFFALSGYFFKPVSDLKEFWQYAKKKTIVFGLPY + IFYSIIHFGLQKVAGSSVRVPTTISDLLNIYKDPLGVSWYLYILWSILIIYGLLSILV + KNRRMLFLISVFAYCLTLFVQTDIYIIQRTLVWGLCFFLGSVLNEIHFDKINLKKFLF + FFVLFDFIYMFAWFLFYEVGSKKDYVSYSNPGLWGIAFVVCVLVAFAIFPKMEKNFPK + TFLYFTKYGKDSLGIYILHAPICSMIRILMLKVGINSVFLHVVVGIVLGWYLSILATY + ILKKIPFLNIVLLPQKYIKLK" + gene order(18923..19222,19248..19454) + /gene="tnp" + /locus_tag="SPC35A_0021" + /pseudo + CDS join(18923..19222,19248..19454) + /gene="tnp" + /locus_tag="SPC35A_0021" + /note="member of homology group 31" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1671 transposase" + misc_feature 19263..19448 + /gene="tnp" + /locus_tag="SPC35A_0021" + /note="HMMPfam hit to PF05717, IS66 Orf2 like protein, + score 4.2e-14" + /pseudo + gene complement(19676..19861) + /gene="tnp" + /locus_tag="SPC35A_0022" + /pseudo + CDS complement(19676..19861) + /gene="tnp" + /locus_tag="SPC35A_0022" + /note="member of homology group 0047 7" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase (fragment)" + gene 19946..20924 + /gene="tnp" + /locus_tag="SPC35A_0023" + /pseudo + CDS join(19946..20677,20688..20924) + /gene="tnp" + /locus_tag="SPC35A_0023" + /note="member of homology group 12" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1670 transposase" + gene 21104..>21463 + /gene="aliA" + /locus_tag="SPC35A_0024" + CDS 21104..>21463 + /gene="aliA" + /locus_tag="SPC35A_0024" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34300.1" + /db_xref="GOA:Q4K2T2" + /db_xref="InterPro:IPR000914" + /db_xref="UniProtKB/TrEMBL:Q4K2T2" + /translation="MMKSSKLFALAGVTLLAATTLAACSGSGSSTKGEKTFSYIYETD + PDNLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKD + AKWYTSEGEEYAAVKAQD" + misc_feature 21104..21190 + /gene="aliA" + /locus_tag="SPC35A_0024" + /note="Signal peptide predicted for SPC1664 by SignalP 
2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.277 between residues 29 and 30" + misc_feature 21350..21418 + /gene="aliA" + /locus_tag="SPC35A_0024" + /note="PS01040 Bacterial extracellular solute-binding + proteins, family 5 signature." +ORIGIN + 1 cgaccgtcgc ttcctagttg tggctaactt gtccaatgaa gagcaagact tgacagtaga + 61 aggaaaagtc aaatctgtct tgattgaaaa caccctagct caagaagtct ttgaaaaaca + 121 aatcttagtt ccatgggatg ctttctgtgt ggaattacta taaatatttt ttgcagaaaa + 181 atttaaaatt gaaatcgtat aaaaacaagg gaggactgta taaaagacag aaatcctttg + 241 ttttttataa ccaaagttta taaactttca ttctcgaaat tcaattaact ttacaaattc + 301 ccactattaa ggagaaagaa gatgaacata aagaagcgtg tccttagtgc aggcctgact + 361 tttgcatctg ctttgctttt agctgcttgc ggccaatcag gttcagatac aaaaacttac + 421 tcatcaacct ttagtggaaa tccaactaca tttaactatc tattagacta ttacgctgat + 481 aatatagtca attgaaacaa gaacaagaca aaagcagctc aaaaaggtat tgcaacttgg + 541 taataccttt ttgaggtgct ttttgatatg agcccatgtt ttctcaatag gattgtactc + 601 aggtgagtag ggaggaagag gtaaaagttt atacccaaac tcttcacaca agagttctaa + 661 cttacccatt ctatggaatc ttgcattatc cataataata accgatggtg tggttaatgt + 721 tggtaagaaa aacttctgaa accaagcttc aaaaaagtcg ctcgtcatcg tctcttcgta + 781 agtcattgga acgattaatt caccatttgt tagacctgca accaaagaaa tcctctgata + 841 tcttcttcca gatactttgc ctcttcttaa ctgacctttt aatgagcgac catattctcg + 901 atgaaaataa gtatcgaatc ctgtttcatc aatctaaaca ggtgctaggt gctttaaact + 961 attaaaattc ttaagaaata aggctacttt ttctgggtct tgttcataat tagattgaaa + 1021 ctagagtagt acacctctgc ttctaaaaaa atttttagaa atcgatttaa ctgtcctgat + 1081 cgatttgtca tgttcttatt tcattttact atatttttgt ttcgcgggaa gtctactaag + 1141 atacttaaag atgcagatag taaaaaaatg tagacattac cgtaaaaaag tgatataatc + 1201 gtatgatgtt caatgtatag gtgttaatca tgagtagacg ttttaaaaaa tcacgttcac + 1261 agaaagtgaa gcgaagtgtt aatatagttt tgctgactat ttatttattg ttagtttgtt + 1321 ttttattgtt cttaatcttt aagtacaata tccttgcttt tagatatctt aatctagtgg + 1381 taactgcgtt agtcctacta gttgccttgg tagggctact cttgattatc 
tataaaaaag + 1441 ctgaaaaatt tactattttt ctgttgctgt tctctatcct tgtcagctct gtgtcgctct + 1501 ttgcagtaca gcagtttgtt ggactgacca atcgtttaaa tgcgacttct aattactcag + 1561 aatattcaat cagtgtcgct gttttagcag atagtgagat cgaaaatgtt acgcaactga + 1621 cgagtgtgac agcaccgact gggactgata atgaaaatat tcaaaaacta ctagctgata + 1681 tcaagtcaag tcagaatacc gatttgacgg tcaaccagag ttcgtcttac ttggcagctt + 1741 acaagagttt gattgcaggg gagactaagg ccattgtcct aaatagtgtc tttgaaaata + 1801 tcatcgagtc agagtattca gactacgcat cgaagataaa aaagatttat accaagggat + 1861 tcactaaaaa agtagaagct cctaagacgt ctaagaatca gtctttcaat atctatgtta + 1921 gtggaattga cacctatggc cctattagtt cagtgtcgcg atcagatgtc aatatcctga + 1981 tgactgtcaa tcgagatacc aagaaaatcc tcttgaccac aacgccacgt gatgcctatg + 2041 taccaatcgc agatggtgga aataatcaaa aagataaatt aacccatgcg ggcatttatg + 2101 gagttgattc gtccattcac accttagaaa atctctatgg agtggatatc aattactatg + 2161 tgcgattgaa cttcacttcg tttttgaaat tgattgattt gttgggtgga attgatgttt + 2221 ataatgatca agaatttact gcccatacga atggaaagta ttaccctgca ggcaatgttc + 2281 atcttgattc agaacaggct ctcggttttg ttcgtgagcg ctactcacta gcagatggcg + 2341 atcgtgaccg cgggcgcaat caacaaaagg tgattgtggc tatccttcaa aaattaacgt + 2401 caaccgaagc actgaaaaat tatagcacga tcattaatag cttgcaagat tctatccaaa + 2461 caaatatgcc acttgagact atgataaatt tggtcaatgc tcagttagaa agtggaggga + 2521 attataaagt aaattctcaa gatttaaaag gtacaggtcg gacggatctt ccttcttatg + 2581 caatgccaga cagtaacctc tatgtgatgg aaatagatga tagtagttta gctgtagtta + 2641 aagcagctat acaggatgtg atggagggta gatgaaatga tagacatcca ttcgcatatc + 2701 gtttttgatg tagatgacgg tcccaagtca agagaggaaa gcaaggctct cttgacagaa + 2761 tcctacaggc agggggtgag aaccattgtc tctacctctc accgtcgcaa gggcatgttt + 2821 gaaactccgg aagagaagat agcagaaaac tttcttcagg ttcgggaaat agctaaggaa + 2881 gtggcgagtg acttggtcat tgcttatggg gctgaaattt actacacacc agatgttctg + 2941 gataagctgg aaaaaaagcg gattccgacc ctcaatgata gtcgttatgc cttgatagag + 3001 ttcagtatga acactcctta tcgcgatatt catagcgcct tgagcaagat cttgatgttg + 3061 ggaattactc 
cagtcattgc ccacattgag cgctatgatg ctcttgaaaa taatgaaaaa + 3121 cgcgttcgag aactgattga taggggctgt tacacgcaag taaatagttc acatgtcctc + 3181 aaacccaaac tttttggcga acgttataaa ttcatgaaaa aaagagctca gtatttttta + 3241 gagcaggatt tggttcatat cattgcaagt gatatgcaca atctagacgg tagacctcct + 3301 catatggcag aagcatatga ccttgttacc caaaaatacg gagaagcgaa ggctcaggaa + 3361 ctttttatag acaatcctcg aaaaattgta atggatcaac taatttagga gaaatgatga + 3421 aagaacaaaa cacgatagaa atcgatgtat ttcaattatt taaaaccttg tggaaacgca + 3481 agctaatgat tttaatagtg gcacttgtga caggtgcggg ggcttttgca tatagcactt + 3541 ttattgttaa gccagaatat acgagtacca cgcgaattta cgtagtgaat cgcaatcaag + 3601 gagacaagcc ggggctgaca aatcaggatt tgcaggcagg atcttatctg gtaaaagact + 3661 accgtgagat tatcctttcg caggatgcat tggaaaaagt agcgacaaat ttgaagttgg + 3721 atatgccagc aaaaacgtta gccagcaaag ttcaagtgac tgtaccagct gacactcgta + 3781 tcgtctcaat ctctgtcaag gataaacagc cagaggaagc cagtcgtatc gctaattctc + 3841 tacgagaagt tgctgcagaa aagatcgtcg ctgtaacgcg agtatctgat gtaacgacac + 3901 ttgaagaagc gcgaccagct acgactccct cttctccaaa tgttcgacgc aattccttgt + 3961 ttggttttct tggaggagca gtcgtaacag taattgctgt tcttttgatt gagttgctgg + 4021 acacccgtgt gaaacgtcct gaagatgttg aagatgtact gaaaattcca cttttagggc + 4081 tcgttccaga ttttgacaaa ataaaatagg aggaagttat gccaacatta gaaatctcac + 4141 aggcaaaatt ggattctgta aaaaaggcag aggaatatta taacgctttg tgcacgaacc + 4201 tacagttaag tggagatggt ttgaaagtat tttctatcac ttctgtgaaa ataggagaag + 4261 gaaaatcaac gacttccgcc aatatcgctt gggcttttgc gcgtgcaggt tacaaaacgc + 4321 tgctgattga tggagatatt cgcaattctg ttatgttagg tgtctttaaa gcaaggaata + 4381 agattacagg cctgacagaa tttttatcag gaactacaga cttatcacaa gggctttgtg + 4441 ataccaatat cgaaaatctc tttgtaattc aggctggctc tgtgtcaccg aatccgacag + 4501 ctcttcttca aagtaagaat ttcactacaa tgcttgaaac cttgcgtaaa tattttgact + 4561 acatcattgt agatactgct cctgttggtg tcgtgattga tgcggctatt attacgcgaa + 4621 actgcgatgc ttctatttta gtgacggagg caggtgaaat aaatcgtcgg gatattcaaa + 4681 aagcaaaaga acagttggaa cacacaggaa 
agccgttttt gggaattgtg ttgaataaat + 4741 tcgatacttc agtagacaaa tacggttctt atggaaatta tggagattac gggaaaaata + 4801 aaaaataggt cgggggatag agatgaatgg aaaaatatta aggtcttcat tggccataat + 4861 ccagagtttt cttgttattt tattgactta tctacttagt gctgtgagag aaacggagat + 4921 tgtttcaaca acagctattg cactttatat cctccattat tttgtctttt atatcagtga + 4981 ttatggacag gatttcttta aaaggagata tttgattgaa cttgtccaga cattgaaata + 5041 tatcctattc tttgcactag cgattagtat ttctaatttt ttcttagagg atcgatttag + 5101 tatttccaga cgaggcatga tttacttcct cacattacat gctcccttag tctatgtgct + 5161 aaacctattt atcaagtggt attggaagcg ggcttatccc aactttaaag gaggtaagaa + 5221 gattctccta cttacagcaa cttctcgtgt cgaaaaggta ctggatagat taatagaatc + 5281 aaatgaggtt gttgggaagt tggtagccgt cagtgtctta gataaaccag attttcagca + 5341 tgattgttta aaggtagtag cagaggggga gatagtaaac tttgcgactc atgaggtggt + 5401 cgatgaagtc tttatcaatc ttccaagtga aaaatacaat attggagagc ttgtctctca + 5461 gtttgaaacg atgggaattg atgtaacagt taatctaaat gcttttgatc gtagtttggc + 5521 acgtaacaag caaattcgtg agatggcagg attaaacgtt gtgacttttt ctacaacatt + 5581 ttataagact agtcatataa tggctaagcg gattattgat attatgggtg cattggtagg + 5641 gctgatacta tgtggtttag tcagtattgt actggttcct ttgattcgaa aggatggggg + 5701 ttctgctatt tttgctcaga cgcgtatagg aaaaaatggt cgtcagttca ctttttataa + 5761 gtttcgctct atgtgtgtag atgccgaggc gaaaaaaaga gaactcatgg aacaaaatac + 5821 catgcagggt ggaatgttta aggtggacga tgatcctcgt atcacgaaaa ttggtcgttt + 5881 tatacggaag actagcttgg acgagctacc acagttttat aatgttctaa agggagatat + 5941 gagtttggtt ggcacacggc caccaacagt ggacgagtat gaacactata ccccagaaca + 6001 aaaacgtcgg ctaagtttta aacctggtat aacaggctta tggcaggtca gtggacgaag + 6061 tgagattaag aattttgatg aagttgtcaa attagatgta gcctatatag acgattggac + 6121 aatttggaaa gatattgaga ttttattgaa gacagttaaa gttgtattga tgaaggatgg + 6181 agcgaagtag attgatagat gtaaaaatca ttgtggcaac acataaagag gttaaaatgc + 6241 ctcaagacaa tagtctttac cttccaatac atgttgggag agacggtaaa tcagatattg + 6301 gttttatcgg tgataatact ggcgataata tatcctctct aaatccatat 
tattgtgagt + 6361 tgacgggact ttattgggca tggaagaatc ttgattataa ttacttaggt ctagttcatt + 6421 accgtcgtta ttttacaaat aaatctcaag ggtataatga aaatgtcaat atggatgacg + 6481 tcattttgtc tcgatctaat gttgaaatat tattagagaa atctgacgta atagttccaa + 6541 agaagcgaaa gtattatatt gaaactcttt attcacatta tgcccatacc cttaacggag + 6601 aacatctgga tcttgctagg aaaattattg agcaaaatag ttcagagtat ctttcatcct + 6661 ttgataaagt gatgaaacaa agaagcggtt atatgttcaa tatgtttatc atgaaaaaag + 6721 aactattaga tgattattta ccgtggcttt tttctattct ggatactatg tacgaacaga + 6781 tggacttgac cgactatact tcatttgagt cacgtttatt cgggcgagtt agtgagttgt + 6841 tgtttaatgt ttggttatgt aaaaaaggaa taacgcctaa agaggtacca tttatgtaca + 6901 tggagagagt ggatttgttt gaaaaaggaa aatctttttt aatggctaaa ttttttggaa + 6961 agaagtatgg acagagtttc taggagggaa tatgaaaatc accatcaaaa ggtattcact + 7021 gccagaaatt ttaggactag cagcattagc tatattccta ctattttcgt tattaagtat + 7081 aactctttat gcccaatata tatctattaa agtatatttt attgcacttt ttggcattat + 7141 tttattaata tttctgaagg aacttatatc tgagagttat aatcttaaat ctgtgattgg + 7201 attattcgtg atttttactc tctgcttcat cataggtacc gtcacaaatt acgcatactt + 7261 ttttatttta ggtctgtttt tgatttatag tcttagaaat ctcccttttt cagacgtagc + 7321 caaagtctcc tttatcatta gtattagtgt attgctccta gtagtattga gtagtaagct + 7381 tggtattatt cctgattatg ttgagatttg gcctaccaga gttagacact atcttggttt + 7441 ccgatattca ttacttccat caacgcttat gatgaatatc atagctatat catttttttt + 7501 aaagcaagaa aatgcttcat atccgcgtct tcttgtattg tttttacttt caggatggtt + 7561 atacgtagaa acagattcac gtttgacttt tattaattcg tgtttgtttc tactggttaa + 7621 tttaataatg aaattgtcac cttccatcat tgaaaaggta gggagactat taaaactttt + 7681 ttcgttcacc tactttatta atgcctgttt gagttactgg attgcgaaga cttacttaaa + 7741 cacctcaaat gttgttttga atcaattctt ttaccaagtg gatcaatttc ttggaggacg + 7801 tatttattat tctaatcgtt cgttatcttt atatggatat aagttgttag gtcaaaagat + 7861 tgattggatt ggaaatggct tgagcataca aggggagcgt agcacagaaa catatttgta + 7921 tgtggataat ttatatatcc agattcttca acattttggt ttgatagttt cggtaattat + 7981 tttaagccta 
ttaactataa ctttagtaaa gcttttgaaa aaggggcaga tggtattagg + 8041 aattatttta gttattttga gttttcatgc tttaattgat gatttgatac taaatctata + 8101 ttataatata ttttgggttt tgataggaat gttgatatat aaaaagtatc aattttatga + 8161 caaaaagcag ttgacaatag aataagaagc aagcattgga aatagacatt cagatatgta + 8221 caagaaaact cgatttaagt tttttggtaa aatttttaaa attaagttgt aaaatggata + 8281 tcaaaatctc accttttttt gtaggtgtga ttaaacagag ggatttagat aggaaaataa + 8341 tgaataagat tagcttaact gataatttac cgttaatttc agttgtttta ccagtataca + 8401 acgtagagaa ttatttagaa aaatgtttga attctgttgt gagacagacg tataaaaaca + 8461 tagaaattat aatagtaaat gatggtagct tagattcttc aatagatatt tgtaataagt + 8521 atgcaaataa agatagtcga attaaagtat ttacaaaacc taatggaggt ttgtctgatg + 8581 ctagaaattt cggtatcaaa aaatctatgg gtgagtttat aacattcgtt gattcagatg + 8641 actatgttac agatgattat gtagaatatt tgtatagctt agtcaaaaaa tataattgta + 8701 aaatgtcaat gtgttcaata tttgtccatt atatttctaa tgataaaatg atcaataatg + 8761 ggacaggaag agaattgatg atgacagcag agcagtgtat tgaaaaaatg tgctatcatg + 8821 atgaggtgga tacatgtgct tatgcaaaat tatatcatag aagtctattt agtgaaatat + 8881 gcttccctaa aggaaggata ttcgaagata ttggaacaat ttatcgcttt tttgatactg + 8941 ctgggcagat tgcctgtggt tttaacgcaa aatattatta tgagattcgg gaaaattcga + 9001 ttgttacatc atcatttagt gaaaaaaaat ttgatttgtt atttatgaca gatcaaatgc + 9061 gaaattttgt tgatcaacgc tatccatctt tgaaagctgc aacaaaacgt cgagctgtct + 9121 atgcaagatt tagtaccctt aaccaattat tggatgtaca aggatataat gaagaaaaaa + 9181 aagaaataat tcgttttatc caagacaaca aggaagcgtt acttgaaaat cctaagactc + 9241 ctaagcggga tagattagct gttagagctc tctcccttgg attttgcatt tataaattgt + 9301 tatggaagca atatttaaaa attcaaagag gttagtatga ataaagaatt tttgaagtat + 9361 atttatattc gattattaag aaatttaagg agaattttct ttattatccc gataataaga + 9421 aatagagttg tttttgaatc tttctcagga gatgcttata gttgcaatcc taaatatatt + 9481 tctgaagaat taagaaaaca gtatggtgat tctgttgaaa ttatctgggc ttttaatgat + 9541 ccaaacaaat tcaaaaaaga attaccaaag gagattgtga cttgtcgtta ccgtagtttc + 9601 aatcatctga tatatagaat cacttcaaaa 
gtttatattt gtaatttcct gcaagcaatc + 9661 gaaattccaa agcgtaaagg acaactagag attcaaactt ggcatggagg aggttgctat + 9721 aaaaaagttg gggtggctga aaaaggacgc caggctgctt atgttaaacg acaacggatg + 9781 cacgttgaag aaacagatct ctttattaca agtagtaaat attttgaaaa tgaggtagta + 9841 aaaaaacaat ttgggtataa gggagaaatt ttatctattg gtatgcctcg aaatgatatt + 9901 ttaataaatt taccaatttc aagtcaagtt gagaaattaa aggagaaatt gggattacca + 9961 aacaataaat tgatagcact ttatgctccg acctggagat caggtactaa acagtatgaa + 10021 acacttgata taaaaaaact tactcaagcc gttgataaaa aatttggtaa aaaatgtatt + 10081 gttcttttca gatcgcatct atatggaaat caatcttatg atgatgttgt ggatgtctct + 10141 cagtatagtg atatgcaaga attattgttg ctttcagata tactgattac tgactattct + 10201 tcgtctatgt gggatttctc tctctctttt aaaccgtgtt ttttatatac ccccgatttg + 10261 aaggattatc tagatgaaag aggttttgat gaagacatac attcatgggg attttcagtt + 10321 tctgaatcaa ataaggaact agttgaaaat attttacagt ttaataatga agaatataga + 10381 caaaaaatga agaatcatca tcagttttta gaatcttatg aacaaggaga tgcagtgaaa + 10441 agagttgtgg cgaagattgc tgaatattgt aatttataga gaggatagat aatgaaaaaa + 10501 attggtgatt tggtcaaaag atatggtgtg aaaaatgtgg ttttacgtgc tattaatgat + 10561 gttctaccag tcaatctcat ctttcctagt caacaactca gacgtttgaa ttgacaagaa + 10621 aaagtcaaaa agaagttgaa aaaatatgta gttgtttcgg attcaatcaa gagtgaggag + 10681 gagtgcgata ttatctggtg gctatggttt caaggacttg ataatgcact agctattgtg + 10741 aaaaaaatgt agagagtcgg tagataaata tgctaaacgc agtggcaaaa gggttattga + 10801 gttaacatct caaaatttat ttgaatatat tgaggtacct aacgaactct atgtaaaata + 10861 taagtcaggt agtttgccat tagctttgtt ttcagatttt tgtcgaatta gccttctttc + 10921 taactatgga ggattatggg ttgattcaac tgttctaatt acggggaaaa ttgaagatga + 10981 gatattgaac caagatattt ttatgtttca agcttcccct ttagactatt cggttactaa + 11041 aatcagtaat tggatgttat attcaaaata cccaggacac ccgttcatat tatcgatacg + 11101 tgatactttg atttcatttt ataaataata agaataatac gattccggat tgttttttat + 11161 ttcatttact tgtttcctgt ttaatagatg ataataggat aaatcaaagt ttttataata + 11221 tggattatta tactaatacc tatcctcact 
tattagggag agttttgagc gaaccatatg + 11281 atcctttgaa atttgaaaat attttaagga aaacgtctat ttataaatta tcatataaaa + 11341 atttaaatta tgttgctgag gatagatttt ataatgcaat tttagattta gattttagtt + 11401 agaataaaga ggagagaaat gaatttagca gttatttttg ctggaggatc cggtacgcga + 11461 atgaatgcaa aggatagacc taagcagttt cttttggtac atggtaagcc aattattgtt + 11521 cacactattg agctatttga gaaccatcca gagattgatg gaattatcgt tgtttgtatt + 11581 gaggattgga ttccgtatat ggaggagatg aaatatcgct atagattaga taagattgct + 11641 aagattgttc cagggggggc aactggtcaa ttatctattt ataatggttt agtcgcggct + 11701 gaacaagttt atggaataga ggataatgtt gtgttaatcc atgatggagt ccgtccttta + 11761 attacagcag acactatttc agataacatc caatccgtaa aagaaaaggg aaatgctatt + 11821 acttgtacag tggccaaaga aacagttatc ttagtagatg atgaaaataa ggtaggcgaa + 11881 gtgcctagtc gtgaacattc gcgatttgcc aaggctcctc agagtttttg gctaaaagat + 11941 attctaggtg cacatcgaga ctctgtagat aacggtagaa atgattttat tgattcatgc + 12001 accatgatga gacactatgg tcatgattta catgttgttg ttggtccgta tgagaatatt + 12061 aagattacaa cgcctgatga tttttatata tttagggctt tgtacgatct tcgtgagaat + 12121 gagcaactaa aataatgaag aaaagagaaa aagatgaagt attttgttga agaaacgtta + 12181 cttgatgaac aggataaaaa aaatgcgggt ggaaaggcta gacaagacgt cactgatatt + 12241 ttggaatcca taggttatca gaagttaata gctgagtccg gaatgaatga acgtcaggaa + 12301 ttaaatgctg ttcaaagatt ggttcatcat tataaagtta agaaaatgtg gaagaaaact + 12361 ctttcagttg ttggtaaggg tgatgaagtt attattcaat ttcctttact aaatcatagt + 12421 ttattcttta atcaggttat taagcaactt agtaagaatg gagttaaagt ttattttttg + 12481 attcatgatt tagaatcgtt gcgatggtcg cagtcaaaat cgatatcatt aaaaagtagg + 12541 attcgattaa acattgaaga acgtagtgtt ttaaggttat cagaaggcat tattgctcat + 12601 aataaaaaaa tgaaatctta tattaagacc tactctgttg aaagttctaa aattattcct + 12661 cttgaaattt ttgattatat tattccatct tatcatgaaa gaaaaaatct ggataacttt + 12721 cagttaaatg ctccaattgt tattgctgga aatttaaagc aacataaagc tggatatgtc + 12781 tatcatttac caagcaatgt ggagtttaat ctttatggaa ttggatatga acagacagat + 12841 gacaaaagtg tgcactactg tggttctttt 
atgccagaag aattaccatt cgttttaaaa + 12901 ggaagttttg gattggtatg ggatggtccg tcatcagagt cttgtataga aacttatgga + 12961 gagtatcttc gtgtaaacaa ccctcacaag acttcactat atttagcttc aggcatacca + 13021 gtagttgtat ggtcagaggc agcaatagct agtttcatta aggagaataa ttgtggtatt + 13081 cttgtatcca atctgagtga actacctgag ttactttcta tgattaccgt tgatgaatat + 13141 gaattgatga aaaagaatac tgagattatt ggagaaaggc ttcgacaagg tttttatact + 13201 aaacaagcag ttaaaggttt ctagactgga ggaagtgtaa tgattgaaag ttttaatgat + 13261 aaagtgttgc aggaagattt agagataatt gcaaaagaag agcttccatt tcgaaaattt + 13321 agaaattcaa ctgtttttat cacgggagta acaggtttag taggccttca attatttaag + 13381 gctttggctt gtatcaatag agtccatcag ttgaatatga aaattattgg tctagtcaga + 13441 aatttggata aagcagaaaa aatttttgga gatttattga aacggaagga tatacaaata + 13501 gttttaggag atgtttcgga agatttccac tcgtatatcc ctgatggttt agttattgac + 13561 tatatcattc acggagcaag cgtgactacc tctaaactca tgattgaatt tccagtagat + 13621 acaattcgag tagcttttaa tggaacgtat caaatgttag aattggcaaa agaaaaaaaa + 13681 gtgaaaagtt ttgtatatct ttcttcaatg gaggtatatg gtagctttca gtcagataga + 13741 acaactgttg taaacgagaa tatgttaggg tatcttgatt tgacatctgt tcgaacaaat + 13801 tacccagaat gcaaaagaat ttgtgaaaat atgtgcattg catttctaag tcagtatcaa + 13861 gtcccggcta agattgctcg tctatcccag acctttggtg caggcactct accgggtgaa + 13921 aatagagtat ttgctcaatt tgctcgtagt gttatgcaag ggaaagatat tgttttacat + 13981 acgttagggc aatcagaagg aaattactgc tacacagctg atactgttgt tgcattatta + 14041 acaattctat tgagaggaga aaatggggag gcttataata ttgctaatga agagagtcat + 14101 acaacaatag cagatatggc aaaaatggta acttcgcaat tctctcaaac gagtcaagtg + 14161 gtttttgata ttccgaagaa aaatatattt ggttatgctg tagatactaa aatgaagtta + 14221 tcaacacaca aaattcaaca attgggttgg aagccgaggg tctctcttgt agatgcttat + 14281 gatcgaatga tgagaagtat gaatgaaact ggggtatagg taactatatg aaggtattaa + 14341 aaaactactt atataatctc tcttatcaac tattagttat tattcttcct atcattacga + 14401 ctccttatgt gacgcgcata ttttcttcag atgatttagg gacatacggt tacttcaact + 14461 ccattgttac ctacttcatt ttacttgcta 
ctctgggtat tgctaactat ggaacgaagg + 14521 agatatctgg gaataggaag agtattcaga aaaatttctg gggaatatat actttacagt + 14581 ttggagcgac tactttttcc atttttctct atatactagc ctgtcttttc atcccaggga + 14641 tgaaaaacct agttgcatat atcttgggat tgggtttagt ctctaaagga ctagatattt + 14701 catggttgtt tcaagggtta gaagattttc gtaaaattac ggtcagaaat atcacagtga + 14761 agcttgttgg tgtaagtgcc attttcttgt ttgtaaaatc agcgagtgat ctatacttgt + 14821 atgtttttct tctaacagca tttgaattgt tgggtcagtt aagtatgtgg tttccagccc + 14881 gtgaatatat tggaaaacca cattttgata tagaatatgc taggcatcat ctgaagccag + 14941 ttatcttgct attcttacca caaattgcta tctcgcttta tgtgacttta gatcgtacaa + 15001 tgttaggggc gctagcttct acaaaagatg tcggcattta tgatcaggct ttgaagctgg + 15061 ttaatatttt actgaccttg gtaacttcct tgggaagtgt tatgctgcca cgcgttgcgc + 15121 atttgttagc gacaggtgat cataaggtag tcaataagat gcatgaggta tccttcttaa + 15181 tttataattt ggttattttt ccgattatgg cagggatgtt gattgtgaat gatgattttg + 15241 ttcaattttt ccttgggcaa gactttcaag atgcacgcta tgcaatttcc attatgatct + 15301 tccgtatgtt ctttatcggt tggactaata taatgggaat tcagatactg atacctcata + 15361 atcaaaataa agaattcatg atttcaacaa caactcccgc aattatcagt gtaggtttga + 15421 acttactatt ccttcctaaa ctgggatata tcggggcagc cattgtctct gttttaacag + 15481 aggcacttgt atgggcaatc caattattct atactcgcag atatttaaaa gaagttccta + 15541 taatcggatc aatgtcaaaa attatactag catctgccat tatgtatggc cttttactaa + 15601 gttcaaaaac agttatacat ttttcaccga ccttaaatgt gctagcattt gtagcgcttg + 15661 gtggaatcat ttatcttttt gcaattctat ctctgaaagt ggtagatgtg aaagaattaa + 15721 aacaaattat taggaaaaac tagaatgaga aaaaatcgaa atatcaacct agatttacta + 15781 aaagtgcttg catgtgttgg agttgtttta cttcatacaa caatgggcgg atttaaagag + 15841 acaggttcat ggaatctttt ggcatattta tattatttag gtacttactc tattcccttg + 15901 ttttttatga tcaatggtta tttgttgtta ggcaagaggg agataactta tctttacata + 15961 ctcccgaaag taaaatggat tttaataaca gtgtcatcat ggtcatttat cgtatggctt + 16021 tttaagcgtg attttacaac taatcctatt aaaaaaattg taggttcttt gatacaaaga + 16081 ggttatttct ttcagttttg gtttttcggt 
gcactcatac ttatctattt atgtttgcca + 16141 attttgagac aatttctaaa ttcaaaaaga agctatttat acagtttatc tttattgatg + 16201 actattggtt tgatttttga gttatcaaat atcctacttc aaatgccaat acaaacatat + 16261 gtaatacaaa cttttagatt atggacgtgg tttttttact atcttttagg tggttatata + 16321 gcgcaattca ctatagaaga aatcgaatca aggtttaaga attggatgaa aatagttagc + 16381 atacttttgt tattgatttc accaataata ttatttttca tagcgaagac tatataccat + 16441 aatctatttg ctgaatactt ttatgatact ttatttgtaa aagtcagtac tttaggaatt + 16501 tttctaacta tcctcatgct tactttgaat gaaaaccgaa gagaatcgat tgtttccctt + 16561 tctaatcaaa caatgggggt tttcataata catacttata ttatgaaagt gtgggaaaaa + 16621 gtgcttggtt ttaattttgt aggagcatat ttattttttg ctctatttac tttaagtgtt + 16681 agttttatta ttgttgggat gttaatgaag attccttact tcaatcgaat cgtcaaatta + 16741 taaaaaggag aacaagatgt acgattatct tattgtcggt gctggtttgt caggagcaat + 16801 ttttgcttat gaggcgacca agcgtggaaa aaaagtaaaa gtgattgata aacgtgacca + 16861 cattggtggg aatatctact gtgagaatgt agaaggagtt aatgttcaca aatatggtgc + 16921 ccatatcttt catacttcta ataagaaagt ttgggattat gttaatcaat ttgctgaatt + 16981 taacaactac gtcaactcgc ctgtagctaa ttacaagggt agcctctata atctaccttt + 17041 caatatgaat accttctatg ctatgtgggg gacaaaaact cctcaagaag tcaaagataa + 17101 gattgctgag cagacagctg atatgaagga tgttgagccg aaaaatctgg aagaacaagc + 17161 tatcaagctg attggtccag atatctacga aaaattgatc aagggttata ctgaaaagca + 17221 gtgggggcgc tcagcaacag aacttcctcc atttatcatt aaacgacttc cagttcgtct + 17281 aacatttgat aataactatt ttaatgaccg ttatcaagga attcctattg gtggttataa + 17341 tgtgattatt gaaaatatgc ttaaagacgt agaagttgaa cttgaagtag atttctttgc + 17401 tcaccgtgaa gggttggaag catctgctga aaaagttgtc ttcacaggaa tgatcgacca + 17461 atattttgac tacaaacacg gagagttaga ataccgtagc cttcgttttg agcatgagat + 17521 tttagacgag gaaaattatc aaggaaatgc tgtagtgaac tatacggagc gtgagattcc + 17581 ttatactcgt attatcgaac acaagcattt tgaatatgga acgcaggcaa agacagttat + 17641 cacgcgtgaa tatccagctg actggaagcg tggggacgag ccttactatc cgatcaacga + 17701 tgagaaaaat aatgctatgt ttgctaagta 
ccaagaggaa gcttcaaaga atgataaggt + 17761 tattttctgt ggacgtttag cagattataa atattatgat atgcatgtgg tgattgaacg + 17821 ggcgcttgag gttgtggaga aagagtttgg atatgacaaa aagtagaatc aattggatag + 17881 attttggaaa aggcttttcc atatttttag tcttagcagg gcatgtgttg cttggactgt + 17941 atcaatcgga aaaatttccc acagcaaata acatactatc gttgttgata gcacaagtct + 18001 acatatttca tataccagta ttttttgcct tatcaggata ctttttcaaa cctgtgtcgg + 18061 atttgaagga gttctggcaa tatgctaaaa agaagacaat tgtttttggt ctgccatata + 18121 ttttctattc gatcattcac tttggtcttc aaaaagttgc agggtcatct gttcgtgttc + 18181 ctacaaccat atctgatttg ctaaatatct ataaagatcc tcttggagtt tcgtggtatt + 18241 tatatatact ctggtcgatt ttgataatct atggattatt gtctatttta gtcaaaaatc + 18301 gtagaatgtt atttttgata agtgttttcg cttattgttt aaccctattt gttcaaacag + 18361 atatttatat tattcaaaga acgctagttt gggggctttg tttctttctt ggcagtgtat + 18421 tgaatgaaat tcactttgat aaaattaatt tgaaaaaatt tctttttttc tttgtgctat + 18481 ttgattttat ttatatgttc gcttggttct tgttttatga agtagggtct aagaaggatt + 18541 atgtaagcta tagtaaccca ggtttgtggg ggattgcttt tgttgtctgt gtattagttg + 18601 cttttgcgat ttttccgaaa atggagaaaa attttcctaa aactttccta tatttcacta + 18661 aatacgggaa agatagttta gggatttata ttcttcatgc accaatttgt agcatgattc + 18721 ggattctaat gttgaaagtg ggaataaact cagtttttct tcacgttgtt gttgggattg + 18781 tgctaggctg gtatttatcc atactagcaa cttatatatt gaaaaaaatt ccatttttga + 18841 atattgtttt attaccacaa aagtatatta aattaaaatg actctttgtc aactgtagtg + 18901 ggttgaagaa aagctaagct cgagaaagga caaattttgt cctttctttt ttgatattca + 18961 gggcgataaa aatccgtttt ttgaagtttt caaaggtaag cgcgtcataa caaggtatct + 19021 atcattcatg gaagacctcc tgtatactat tagtaaagta aaactattgg aggatattgt + 19081 aatgccacaa cctattgttc ctgtagagat tccacaatct cgtcgttttg attctaaaaa + 19141 gagaaatgat attctgctta aaattcgtat tggcaagctt gaagtaagtt tttttcaatc + 19201 tctcaatctc gaaatgatat aacagctttt ggataaggtg ttgctttatg acaattcatc + 19261 tatctagcct agggcaggtc tatctcgtat gtgggaaaac ggatatgagg caaggcattg + 19321 attcactggc ttatctggtt aaaacccgct 
ttgaattgga tcctttctca ggtcaagttt + 19381 ttctcttttg tggtggacgt aaagaccgct ttaaagccct ttactgggat ggtcaaggat + 19441 tttggctatt atagtggatt taaactagaa tagtacacct ctgcttctaa aacattgtta + 19501 gaaatcgatt tgactgtcct gttcttattt cattttacta taaattcatc agaaagtcgt + 19561 gatttctatt gaaatgagga ctttcttttt atactcatct gctttcaaaa agcattctag + 19621 tccatctccg attaacgatg gactttatca cctccttctc cagtccttgt atgacatctt + 19681 ggagttgatt catgacatct tccaaagttc gaaaggcctt attcttaaat ccacgtttac + 19741 gaatctcttt ccacacttgt tcaatggggt tcatctctgg tgtgtatgga agaataaagg + 19801 taaaaccaat attagtcgga atctttaagg tacttgattt ataccatata gcattgtcca + 19861 taacgagtaa aagataatca tctggataag cttgtgaaag ctcctattcc taaagcccct + 19921 ttataacctc ttgcgagaga gactattgac tcagccctta cttcatgcgg atgaaacctc + 19981 ctatcgggtt ctagagaatg atagccatct gacctactat tggacctttt tgtctgggaa + 20041 agctgagaat caagcaatca cgctgtacca ccatgatcag cgtcggagtg gttcggtagt + 20101 gcaagaattc ctaggagatt attctggcta tgttcattgt gatatgttgc ggcagtaact + 20161 taggacttta gtcctctagt tctgcctatg cgatagcagt ccaaggttta ggagcaaggc + 20221 gacgctaagc ttggtaaact gcgaaccgct agaagcttat cgtcaactgg aagaagctga + 20281 acttgttgga tgttgggcgc atgtgagaag gaagtttttt gaagcgcccc gcaagcaagc + 20341 ggataaatca tcgttaggag ctaaaggttt agcttattgt gatcagttat tttccttgga + 20401 aagagactgg gaggctttac cagctgatga acgactacgg aaacgtcaag aacatctcca + 20461 gcccctaatg gaagacttct ttgcttggtg ccgccgtcag tcagttttat cgggttcaaa + 20521 actaggaagg gcaattgaat acagcctcaa gtatgaagaa acctttaaga ccattttgaa + 20581 agacggacat ctggtccttt ccaataatct agctgaacgc gccattaaat cattggttat + 20641 gggacggagt aaaagagtcc agtggactct tttagcctga gctcagttta aaaaagcgag + 20701 ggtggttgtt ttctcaaagt tttgaaggag ctaaagcaag agctattatt atgagcttat + 20761 tggaaacagc taaacgtcat caattaaata gcgagaaata tctattctat cttctagaat + 20821 gtcttccaaa cgaggaaact ctcgtaaaca aagaggtttt agagcctatt taccatggac + 20881 taaagttgta caagaaaagt gcaaataaga aatctccaga ttaggaacta tccgtgagtt + 20941 ctctagtctg gagatttttc aatatatttc 
gttattggac ggttacgata ttcatatttt + 21001 ttgcaaagat gttgtttgaa aaataatttt caaaaattct gaaaattctg ttgacatctt + 21061 tctgaaaaga gtctataatg gagagaaagt tttaaaggag aaaatgatga aaagttcgaa + 21121 actatttgcc cttgcgggcg tgacattatt ggcggcgact actttagctg catgctctgg + 21181 atcaggttca agcactaaag gtgagaagac attctcatac atttatgaga cagaccctga + 21241 taacctcaac tatttgacaa ctgctaaggc tgcgacagca aatattacca gtaacgtggt + 21301 tgatggtttg ctagaaaatg atcgctacgg gaactttgtg ccgtctatgg ctgaggattg + 21361 gtctgtatcc aaggatggat tgacttacac ttatactatc cgtaaggatg caaaatggta + 21421 tacttctgaa ggtgaagaat acgcggcagt caaagctcaa gac +// + diff --git a/public/res/serotype_genbank/serotype_35B.gb b/public/res/serotype_genbank/serotype_35B.gb new file mode 100644 index 0000000..56ef215 --- /dev/null +++ b/public/res/serotype_genbank/serotype_35B.gb @@ -0,0 +1,761 @@ +LOCUS CR931705 16658 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 4356/39 (serotype 35b). +ACCESSION CR931705 +VERSION CR931705.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 16658) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 16658) + AUTHORS Bentley,S.D. 
+ TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..16658 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="4356/39" + /db_xref="taxon:1313" + gene <1..163 + /gene="dexB" + /locus_tag="SPC35B_0001" + CDS <1..163 + /gene="dexB" + /locus_tag="SPC35B_0001" + /codon_start=2 + /transl_table=11 + /protein_id="CAI34301.1" + /db_xref="GOA:Q4JZD8" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4JZD8" + /translation="DRRFLVVANLSNEEQDLTVEGKVKSVLIENTAAKEVLEKQVLAP + WDAFCVELL" + gene 323..491 + /gene="aliB" + /locus_tag="SPC35B_0002" + /pseudo + CDS 323..491 + /gene="aliB" + /locus_tag="SPC35B_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(492..1011) + /gene="tnp" + /locus_tag="SPC35B_0003" + /pseudo + CDS complement(join(492..638,637..1011)) + /gene="tnp" + /locus_tag="SPC35B_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase (fragment)" + gene 1227..2681 + /gene="wzg" + /locus_tag="SPC35B_0004" + CDS 1227..2681 + /gene="wzg" + /locus_tag="SPC35B_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI34304.1" + /db_xref="GOA:Q4JZD7" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4JZD7" + /translation="MLIMSRRFKKSGSQKVKRSVNIVLLTIYLLLVGFLLFLIFKYNI + 
LAFRYLNLVVTALVLLVALVGLLLVIYKKAEKFTIFLLLFSILVSSVSLFAVQQFVGL + TNRLNATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNT + DLTVNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKV + EAPKTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPI + ADGGNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGIDVY + NDQEFTAHTNGKYYPAGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKL + TSTEALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDL + PSYAMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1227..1352 + /gene="wzg" + /locus_tag="SPC35B_0004" + /note="Signal peptide predicted for SPC1668 by SignalP 2.0 + HMM (Signal peptide probability 0.979) with cleavage site + probability 0.532 between residues 42 and 43" + misc_feature 1440..1787 + /gene="wzg" + /locus_tag="SPC35B_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 8.6e-63" + misc_feature 1965..2408 + /gene="wzg" + /locus_tag="SPC35B_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 2.5e-69" + gene 2683..3414 + /gene="wzh" + /locus_tag="SPC35B_0005" + CDS 2683..3414 + /gene="wzh" + /locus_tag="SPC35B_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34305.1" + /db_xref="GOA:O86886" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:O86886" + /translation="MIDIHSHIVFDVDDGPKSREESKALLTESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDRGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEQDLVHIIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 2686..3294 + /gene="wzh" + /locus_tag="SPC35B_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 4.6e-36" + gene 3420..4115 + /gene="wzd" + /locus_tag="SPC35B_0006" + CDS 3420..4115 + /gene="wzd" + /locus_tag="SPC35B_0006" + /note="member of homology group 2" + /codon_start=1 + 
/transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34306.1" + /db_xref="GOA:O86887" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:O86887" + /translation="MMKEQNTIEIDVFQLFKTLWKRKLMILIVALVTGAGAFAYSTFI + VKPEYTSTTRIYVVNRNQGDKPGLTNQDLQAGSYLVKDYREIILSQDALEKVATNLKL + DMPAKTLASKVQVTVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIELLDTRVKRPEDVEDVLKI + PLLGLVPDFDKIK" + misc_feature 3420..3536 + /gene="wzd" + /locus_tag="SPC35B_0006" + /note="Signal peptide predicted for SPC1670 by SignalP 2.0 + HMM (Signal peptide probability 0.625) with cleavage site + probability 0.411 between residues 39 and 40" + misc_feature 3441..3857 + /gene="wzd" + /locus_tag="SPC35B_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 3.1e-55" + misc_feature 3963..4040 + /gene="wzd" + /locus_tag="SPC35B_0006" + /note="PS00217 Sugar transport proteins signature 2." 
+ gene 4125..4814 + /gene="wze" + /locus_tag="SPC35B_0007" + CDS 4125..4814 + /gene="wze" + /locus_tag="SPC35B_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34307.1" + /db_xref="GOA:Q4JZK1" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4JZK1" + /translation="MPTLEISQAKLDSVKKAEEYYNALCTNLQLSGDGLKVFSITSVK + IGEGKSTTSANIAWAFARAGYKTLLIDGDIRNSVMLGVFKARNKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFTTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRNCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGIVLNKFDTSVDKYGSY + GNYGDYGKNKK" + gene 4829..6196 + /gene="wchA" + /locus_tag="SPC35B_0008" + CDS 4829..6196 + /gene="wchA" + /locus_tag="SPC35B_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI34308.1" + /db_xref="GOA:Q4JZD3" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4JZD3" + /translation="MNGKILRSSLAIIQSFLVILLTYLLSAVRETEIVSTTAIALYIL + HYFVFYISDYGQDFFKRRYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYF + LTLHALLVYVLNLFIKWYWKRAYLNFKGSKKILLLTATSHVEKVLDRLIESNEVVGKL + VAVSVLDKPDFQHDCLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + IDVTVNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHIMAKRIIDIMGALVGLIL + CGLVSIVLVPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVLM + KDGAK" + misc_feature 4829..4915 + /gene="wchA" + /locus_tag="SPC35B_0008" + /note="Signal peptide predicted for SPC1672 by SignalP 2.0 + HMM (Signal peptide probability 0.844) with cleavage site + probability 0.429 between residues 29 and 30" + misc_feature 5612..6193 + /gene="wchA" + /locus_tag="SPC35B_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 4.8e-158" + gene 
6183..6989 + /gene="wciB" + /locus_tag="SPC35B_0009" + CDS 6183..6989 + /gene="wciB" + /locus_tag="SPC35B_0009" + /note="member of homology group 16" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34309.1" + /db_xref="GOA:Q4JZB6" + /db_xref="UniProtKB/TrEMBL:Q4JZB6" + /translation="MERSRLIDVKIIVATHKEVKMPQDNSLYLPIHVGRDGKSDIGFI + GDNTGDNISSLNPYYCELTGLYWAWKNLDYNYLGLVHYRRYFTNKSQGYNENVNMDDV + ILSRSNVEILLEKSDVIVPKKRKYYIETLYSHYAHTLNGEHLDLARKIIEQNSSEYLS + SFDKVMKQRSGYMFNMFIMKKGLLDDYLPWLFSILDTMYEQMDLTDYTSFESRLFGRV + SELLFNVWLCKKGITPKEVPFMYMERVDLFEKGKSFLMAKFFGKKYGQSF" + gene 6998..8227 + /gene="wzy" + /locus_tag="SPC35B_0010" + CDS 6998..8227 + /gene="wzy" + /locus_tag="SPC35B_0010" + /note="member of homology group 45" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI34310.1" + /db_xref="UniProtKB/TrEMBL:Q4JZD1" + /translation="MKITIKRYSLPEILGLAALAIFLLFSLLDVSFYVQYISPMLYKA + AIFLIIMLIILKEFVSGSNSFESLLGLLGVSTLYFIIGSVTSYTSFIVLGLSLIYSLR + DIPFSKVVKVAFIISVAMLFLVILSSKIGFIPDYIEFSSTRVRHYLGFRYSLFPSTIM + MNIIAISFFLKQETVSYQRLFILFLVSMYLYLETDSRLTFISSSLLLLANLAMKLIPT + VIEKFSLLLKFFTLTYFVNAYLSYWISKNYLRTSNALLNHFFHQADQFLGGRIYLSNR + SLSLYGYGILGQKIAWVGNALNAQGERSTDAYLYVDNLYIQILQHFGLIALIIILSLL + TATLVKLLRKGQIVLSIIIVSLSFHALIDDLILSIHYNIFWILLGSLIYSNYQFSEER + YGEVENDSLRRTVREGY" + misc_feature 6998..7099 + /gene="wzy" + /locus_tag="SPC35B_0010" + /note="Signal peptide predicted for SPC1674 by SignalP 2.0 + HMM (Signal peptide probability 0.982) with cleavage site + probability 0.455 between residues 34 and 35" + gene 8239..9363 + /gene="wcrJ" + /locus_tag="SPC35B_0011" + CDS 8239..9363 + /gene="wcrJ" + /locus_tag="SPC35B_0011" + /note="member of homology group 129" + /codon_start=1 + /transl_table=11 + /product="putative glycerol phosphotransferase" + /protein_id="CAI34311.1" + /db_xref="GOA:Q4JZD0" + /db_xref="InterPro:IPR007554" + /db_xref="UniProtKB/TrEMBL:Q4JZD0" + 
/translation="MNNRDGKYYIGLVMKIITNPLKILKIKKRRVLLKSYNAETISCN + PKYIYNELKKINRYELVWVLKEPEKYPDVKAVKYMSLKWLYYIVTSQYVISNTGFNFW + LPKKKKQIYINTWHGGGAYKDSDNLNNISKAQVKQIKKSAELEDYFISSCAVFTKEYA + KKRVGFKGKILEIGTPRNDFLIRNQADDGLKNSIKNRLGIDDNCSIVIYAPTWRDDAS + AIEEIDYESLLESLRETYPKVSILVRGHHLQKNLIDIKNSNIVNVSDYDDMQELLLIS + DLLITDYSSTIWDMIHGGKKVLLYTPDLDEYLKYRGFHVDIKEWNIPYFKTNEELIAY + ISSNYFKNMEEMIENHKIRFGSFEHGNATQKIVELLEEGN" + misc_feature 8818..9354 + /gene="wcrJ" + /locus_tag="SPC35B_0011" + /note="HMMPfam hit to PF04464, + CDP-Glycerol:Poly(glycerophosphate) gl, score 2.8e-31" + gene 9364..10344 + /gene="wcrM" + /locus_tag="SPC35B_0012" + CDS 9364..10344 + /gene="wcrM" + /locus_tag="SPC35B_0012" + /note="member of homology group 117" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34312.1" + /db_xref="GOA:Q4JZC9" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JZC9" + /translation="MKVSVIIPVYNVEKYLRRCLDSVVNQTYKDIEVILVNDGSPDNS + KEICEEYVAKYSNIQLINQKNAGLGAARNTGLQYITGNAVTFVDSDDWLELDAIEYYV + ASMKKSDADIVVTQMIRKKEYFSNEGTNGTTIKEEVLNQEQFAKKYFKIDGNNIEYYA + CAKLYKREIAREVKYPVGLFAEDVPAAFGYIIRSQKIFYSTKVTYNYFFNDNSLTAKF + TDKDFDLEKIWDLVVEEAKVYGNEDYILYAKVNRYRIDFNLLCRIALSENKSDIEKYS + QEIVVLLGKVKENKKILLKYLPFSRKVIFRLFIVDYTLGRNVLRMFKNIV" + misc_feature 9373..9885 + /gene="wcrM" + /locus_tag="SPC35B_0012" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 1.4e-47" + gene 10365..11438 + /gene="wcrH" + /locus_tag="SPC35B_0013" + CDS 10365..11438 + /gene="wcrH" + /locus_tag="SPC35B_0013" + /note="member of homology group 51" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34313.1" + /db_xref="GOA:Q4JZC8" + /db_xref="InterPro:IPR016503" + /db_xref="UniProtKB/TrEMBL:Q4JZC8" + /translation="MIEMYYFIKVEKDLKNTAGIKAPDDIEKISEELGMKEIRFPKFP + FEKNKVIQKLWLFCVVGYNWISLLWRLKKNDVVIYQHPMYGVRVANFAIPLLKKYKNI + KFISVIHDLESLRKGIQGVIEDNETTNAIADKELLSKFDKVISHNPKMTEYLEGIGIK + 
KENLVELQIFDYLDPSEIEEKIEDGVVIAGNLAKGKSSYIYKLLENELNFKLNLFGPN + FINEELPENVEYFGSLPPNKLPQKLVGKFGLVWDGDSLETCSGNTGNYLKYNNPHKTS + LYLASGIPVIIWKEAALAQFIEENNVGITVNNLSEIEFVMQNISEGEYLSIKRNTMQL + GEKLRNGYFYRQAISKCKNDFMK" + gene order(11684..11989,12017..12406) + /gene="tnp" + /locus_tag="SPC35B_0014" + CDS join(11684..11989,12017..12406) + /gene="tnp" + /locus_tag="SPC35B_0014" + /note="member of homology group 19; + member of homology group 19" + /codon_start=1 + /transl_table=11 + /product="putative IS1381 transposase" + /protein_id="CAI34314.1" + /db_xref="GOA:Q4JZC7" + /db_xref="InterPro:IPR002559" + /db_xref="UniProtKB/TrEMBL:Q4JZC7" + /translation="MLAVLKTAYQLKHAKGGRKPKLSLEDLLMATLQYVREYRTYEEI + AADFGIHESNLLRRSQWVEVTLVQSGVTISRTPLSSEDTVMIDATEVQINRPKKRISE + MKAQAIVTSQGRIVSLDITVNYCHDMKLFKMSRRNIGQAGKILADSGYQGLMKIYPQA + QTSRKSSKLRPLIVEDKACNHALSKERSKVENIFAKAKTFKMFSTTYRNHRKRFGLRM + NLIAGIINHELGF" + misc_feature 11798..11863 + /gene="tnp" + /locus_tag="SPC35B_0014" + /note="Predicted helix-turn-helix motif with score + 1106.000, SD 2.95 at aa 39-60, sequence + RTYEEIAADFGIHESNLLRRSQ" + misc_feature join(11930..11989,12017..12397) + /gene="tnp" + /locus_tag="SPC35B_0014" + /note="HMMPfam hit to PF01609, Transposase DDE domain, + score 9.8e-14" + gene 12450..13865 + /gene="wzx" + /locus_tag="SPC35B_0015" + CDS 12450..13865 + /gene="wzx" + /locus_tag="SPC35B_0015" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI34315.1" + /db_xref="GOA:Q4JZC6" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4JZC6" + /translation="MKVLKNYAYNLSYQLLVIILPIITTPYVTRVFSSNDLGTYGYFN + SIVTYFILLATLGVANYGTKVISGHRKEIEKNFWGIYSLQLGATVFSLTLYCLLCLTL + PFMQNPVAYILGLALVSKGLDISWLFQGLEDFRKITVRNITVKFVGVISIFLFVKSAD + DLYLYVFLLTIFELLGQLSMWVPAREFIGRPHFDLEYARHHLKPVILLFLPQVAISLY + VTLDRTMLGALASTKDVGIYDQALKLVNILLTLVTSLGSVMLPRVSNLLSSGDHKAVN + KMHEISFLIYNLVIFPIMAGMLIVNDDFVTFFLGQDFQEARYAIAIMIFRMFFIGWTN + 
IMGIQILIPHNQNKEFMLSTTIPAIVSVGLNLLLLPKFGYIGAAIVSVLTEALVWAIQ + LYYIRAYLKDVPIIRTMIKIILASAIMYSVLLVSKTYIHFSPTINVLVFVVLGGIIYL + FSVLSLKVVDVIELKQVIRKN" + misc_feature 12456..13250 + /gene="wzx" + /locus_tag="SPC35B_0015" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 2.2e-71" + gene 13867..14865 + /gene="wciG" + /locus_tag="SPC35B_0016" + CDS 13867..14865 + /gene="wciG" + /locus_tag="SPC35B_0016" + /note="member of homology group 21" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI34316.1" + /db_xref="GOA:Q4JZC5" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q4JZC5" + /translation="MHKFKDINLDLLKVIACVGVVLLHTEMGGFKETGSWNFSTYLYY + LGTYSIPLFFIVNGYLLLGKKEITYSYILQKVKYILITVLSWTFIVWLFKRDFSVNPI + KKLIGSLVQKGYFFQFWFFGALILIYICLPVLKQFLNSKRSYLYFLSVLLVIGLIFEL + TNIVLQMPIQTYVIQTFRLWTWLFYYILGGFISQFDKNTIKNGFKRWMKVIAVLLLLV + SPFILFFIAKTTYHNFFAEYFYDILLVKVVSVGIFLTIFSIVLNENSNKWIIFLSNQT + MGIFIIHTYIMKVWEKLFGFNFIGSYLLFAIFTLSVSFIIVGMLMKIPYFNRIVKL" + gene 14878..15981 + /gene="glf" + /locus_tag="SPC35B_0017" + CDS 14878..15981 + /gene="glf" + /locus_tag="SPC35B_0017" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI34317.1" + /db_xref="GOA:Q4JZC4" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JZC4" + /translation="MYDYLVVGAGLFGAVFAHEAALKGKKVKVIEKRNHIAGNIYTRE + EEGIQVHQYGAHIFHTSDKEIWDYVNQFAEFNRYTNSPVANYKGEIYNLPFNMNTFNK + LWGVVTPAEAQAKIEEQRAILNGKTPENLEEQAISLVGTDIYEKLIKDYTEKQWGKPT + TELPSFIIRRLPVRLTYDNNYFNDTYQGIPIGGYTQIVEKMLDHENIDVETNVDFFVN + KEQYLKDFPKIVFTGMIDEFFDYKLGELEYRSLRFENETLDMENYQGNAVVNYTDAET + PYTRIIEHKHFEFGSQAKTIITKEHSKTWEKGDEPYYPVNNDRNNHLYKSYKKLADEQ + GNVIFGGRLGHYRYYDMHQVIGVALQCVRNELN" + misc_feature 15313..15921 + /gene="glf" + /locus_tag="SPC35B_0017" + /note="HMMPfam hit to PF03275, UDP-galactopyranose 
mutase, + score 1.7e-113" + gene 16299..>16658 + /gene="aliA" + /locus_tag="SPC35B_0018" + CDS 16299..>16658 + /gene="aliA" + /locus_tag="SPC35B_0018" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34318.1" + /db_xref="GOA:Q4K2T2" + /db_xref="InterPro:IPR000914" + /db_xref="UniProtKB/TrEMBL:Q4K2T2" + /translation="MMKSSKLFALAGVTLLAATTLAACSGSGSSTKGEKTFSYIYETD + PDNLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKD + AKWYTSEGEEYAAVKAQD" + misc_feature 16299..16385 + /gene="aliA" + /locus_tag="SPC35B_0018" + /note="Signal peptide predicted for SPC1683 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.277 between residues 29 and 30" + misc_feature 16545..16613 + /gene="aliA" + /locus_tag="SPC35B_0018" + /note="PS01040 Bacterial extracellular solute-binding + proteins, family 5 signature." +ORIGIN + 1 cgaccgtcgc ttcctagttg tggctaactt gtccaatgaa gagcaagact tgacagtaga + 61 aggaaaagtc aaatctgtct tgattgaaaa cactgcggct aaagaagtac ttgaaaaaca + 121 ggtcttggct ccatgggatg ctttctgtgt ggaattacta taaatatttt ttgcagaaaa + 181 atttaaaatt gaaatcatat aaaaacaagg gaggactgta taaaagacag aaatcctttg + 241 tttttttata accaaggttt ataaactttc attctcgaaa ttcaattaac tttacaaatt + 301 cccactatta aggagaaaga agataaacat aaagaagcgt gtccttagtg caggtctgac + 361 ttttgcatct gctttgcttt tagctgcttg cggccaatca ggttcagata caaaaactta + 421 ctcatcaacc tttagtggaa atccaactac atttaactat ctattagact attacgctga + 481 taatacagtc aattgaaaca agaacaagac aaaagagcct cgtaaaaagt attgcaactt + 541 ggtaatacct ttttgaggtg ctttttgata tgagcccatg ttttctcaat aggattgtac + 601 tcaggtgagt agggaggaag aaggtaaaag tttatgccca aactcttcgc ataaaagttc + 661 tagcttcccc agtctatgga atcttacatt atccataata ataaccgata gtgtggttaa + 721 tgttggtaag agaaatttct gaaaccaagc ttcaaaaaag tcgctcgtca tcgtctcttc + 781 gtaagtcatt ggagcaatta actcaccatt tgttagacct gcaaccaaag aaatcctctg + 841 atatcttctt ccagatactt tgcctcttct taactgacct tttaatgagc gaccatattc + 901 tcgataaaaa taagtatcga atcttgtttc gtcaatctaa acaggtgcta 
ggtgctttaa + 961 actattaaaa ttcttaagaa ataaggctac tttttctggg tcttgttcat aattagattg + 1021 aaactagaat agtacacctc tgcttctaaa acgttgttag aaatcgattt gactgtcctg + 1081 atcgttttat catgttctta tttcatttta ctatattttt ggttcgcggg aagtctacta + 1141 agatacttaa agatgcagat agtgaaaata aaggtgtaga cattaccgta aaaaagtgat + 1201 ataatcgtat gatgttcaat gtataggtgt taatcatgag tagacgtttt aaaaaatcag + 1261 gttcacagaa agtgaagcga agtgttaata tcgttttgct gactatttat ttattgttag + 1321 ttggtttttt attgttctta atctttaagt acaatatcct tgcttttaga tatcttaacc + 1381 tagtggtaac tgcgttagtc ctactagttg ccttggtagg gctactcttg gttatctata + 1441 aaaaagctga aaaatttact atttttctgt tgctgttctc tatccttgtc agctctgtgt + 1501 cgctctttgc agtacagcag tttgttggac tgaccaatcg tttaaatgcg acttctaatt + 1561 actcagaata ttcaatcagt gtcgctgttt tagcagatag tgatatcgaa aatgttacgc + 1621 aactgacgag tgtgacagca ccgactggga ctgataatga aaatattcaa aaactactag + 1681 ctgatatcaa gtcaagtcag aataccgatt tgacggtcaa ccagagttcg tcttacttgg + 1741 cagcttacaa gagtttgatt gcaggggaga ctaaggccat tgtcctaaat agtgtctttg + 1801 aaaatatcat cgagtcagag tatccagact acgcatcgaa gataaaaaag atttatacca + 1861 agggattcac taaaaaagta gaagctccta agacgtctaa gaatcagtct ttcaatatct + 1921 atgttagtgg aattgacacc tatggcccta ttagttcggt gtcgcgatca gatgtcaata + 1981 tcctgatgac tgtcaatcga gataccaaga aaatcctctt gaccacaacg ccacgtgatg + 2041 cctatgtacc aatcgcagat ggtggaaata atcaaaaaga taaattaacc catgcgggca + 2101 tttatggagt tgattcgtcc attcacacct tagaaaatct ctatggagtg gatatcaatt + 2161 actatgtgcg attgaacttc acttcgtttt tgaaattgat tgatttgttg ggtggaattg + 2221 atgtttataa tgatcaagaa tttactgccc atacgaatgg aaagtattac cctgcaggca + 2281 atgttcatct tgattcagaa caggctctcg gttttgttcg tgagcgctac tcactagcag + 2341 atggcgatcg tgaccgcggg cgcaatcaac aaaaggtgat tgtggctatc cttcaaaaat + 2401 taacgtcaac cgaagcactg aaaaattata gcacgatcat taatagcttg caagattcta + 2461 tccaaacaaa tatgccactt gagactatga taaatttggt caatgctcag ttagaaagtg + 2521 gagggaatta taaagtaaat tctcaagatt taaaaggtac aggtcggacg gatcttcctt + 2581 cttatgcaat 
gccagacagt aacctctatg tgatggaaat agatgatagt agtttagctg + 2641 tagttaaagc agctatacag gatgtgatgg agggtagatg aaatgataga catccattcg + 2701 catatcgttt ttgatgtaga tgacggtccc aagtcaagag aggaaagcaa ggctctcttg + 2761 acagaatcct acaggcaggg ggtgagaacc attgtctcta cctctcaccg tcgcaagggc + 2821 atgtttgaaa ctccggaaga gaagatagca gaaaactttc ttcaggttcg ggaaatagct + 2881 aaggaagtgg cgagtgactt ggtcattgct tacggggctg aaatttacta cacaccagat + 2941 gttctggata agctggaaaa aaagcggatt ccgaccctca atgatagtcg ttatgccttg + 3001 atagagttca gtatgaacac tccttatcgc gatattcata gcgccttgag caagatcttg + 3061 atgttgggaa ttactccagt cattgcccac attgagcgct atgatgctct tgaaaataat + 3121 gaaaaacgcg ttcgagaact gattgatagg ggctgttaca cgcaagtaaa tagttcacat + 3181 gtcctcaaac ccaaactttt tggcgaacgt tataaattca tgaaaaaaag agctcagtat + 3241 tttttagagc aggatttggt tcatatcatt gcaagtgata tgcacaatct agacggtaga + 3301 cctcctcata tggcagaagc atatgacctt gttacccaaa aatacggaga agcgaaggct + 3361 caggaacttt ttatagacaa tcctcgaaaa attgtaatgg atcaactaat ttaggagaaa + 3421 tgatgaaaga acaaaacacg atagaaatcg atgtatttca attatttaaa accttgtgga + 3481 aacgcaagct aatgatttta atagtggcac ttgtgacagg tgcgggggct tttgcatata + 3541 gcacttttat tgttaagcca gaatatacga gtaccacgcg aatttacgta gtgaatcgca + 3601 atcaaggaga caagccgggg ctgacaaatc aggatttgca ggcaggatct tatctggtaa + 3661 aagactaccg tgagattatc ctttcgcagg atgcattgga aaaagtagcg acaaatttga + 3721 agttggatat gccagcaaaa acgttagcca gcaaagttca agtgactgta ccagctgaca + 3781 ctcgtatcgt ctcaatctct gtcaaggata aacagccaga ggaagccagt cgtatcgcta + 3841 attctctacg agaagttgct gcagaaaaga tcgtcgctgt aacgcgagta tctgatgtaa + 3901 cgacacttga agaagcgcga ccagctacga ctccctcttc tccaaatgtt cgacgcaatt + 3961 ccttgtttgg ttttcttgga ggagcagtcg taacagtaat tgctgttctt ttgattgagt + 4021 tgctcgacac ccgtgtgaaa cgtcctgaag atgttgaaga tgtactgaaa attccacttt + 4081 tagggctcgt tccagatttt gacaaaataa aataggagga agttatgcca acattagaaa + 4141 tctcacaggc aaaattggat tctgtaaaaa aggcagagga atattataac gctttgtgca + 4201 cgaacctaca gttaagtgga gatggtttga 
aagtattttc tatcacttct gtgaaaatag + 4261 gagaaggaaa atcaacgact tccgccaata tcgcttgggc ttttgcgcgt gcaggttaca + 4321 aaacgctgct gattgatgga gatattcgca attctgttat gttaggtgtc tttaaagcaa + 4381 ggaataagat tacaggcctg acagaatttt tatcaggaac tacagactta tcacaagggc + 4441 tttgtgatac caatatcgaa aatctctttg taattcaggc tggctctgtg tcaccgaatc + 4501 cgacagctct tcttcaaagt aagaatttca ctacaatgct tgaaaccttg cgtaaatatt + 4561 ttgactacat cattgtagat actgctcctg ttggtgtcgt gattgatgcg gctattatta + 4621 cgcgaaactg cgatgcttct attttagtga cggaggcagg tgaaataaat cgtcgggata + 4681 ttcaaaaagc aaaagaacag ttggaacaca caggaaagcc gtttttggga attgtgttga + 4741 ataaattcga tacttcagta gacaaatacg gttcttatgg aaattatgga gattacggga + 4801 aaaataaaaa ataggtcggg ggatagagat gaatggaaaa atattaaggt cttcattggc + 4861 cataatccag agttttcttg ttattttatt gacttatcta cttagtgctg tgagagaaac + 4921 ggagattgtt tcaacaacag ctattgcact ttatatcctc cattattttg tcttttatat + 4981 cagtgattat ggacaggatt tctttaaaag gagatatttg attgaacttg tccagacatt + 5041 gaaatatatc ctattctttg cactagcgat tagtatttct aattttttct tagaggatcg + 5101 atttagtatt tccagacgag gcatgattta cttcctcaca ttacatgctc tcttagtcta + 5161 tgtgctaaac ctatttatca agtggtattg gaagcgggct tatctcaact ttaaaggaag + 5221 taagaagatt ctcctactta cagcaacttc tcatgtcgaa aaggtactgg atagattaat + 5281 agaatcaaat gaggttgttg ggaagttggt agccgtcagt gtcttagata aaccagattt + 5341 tcagcatgat tgtttaaagg tagtagcaga gggggagata gtaaactttg cgactcatga + 5401 ggtggtcgat gaagtcttta tcaatcttcc aagtgaaaaa tacaatattg gagagcttgt + 5461 ctctcagttt gaaacgatgg gaattgatgt aacagttaat ctaaatgctt ttgatcgtag + 5521 tttggcacgt aacaagcaaa ttcgtgagat ggcaggatta aacgttgtga ctttttctac + 5581 aacattttat aagactagtc atataatggc taagcggatt attgatatca tgggtgcatt + 5641 ggtagggctg atactatgtg gtttagtcag tattgtactg gttcctttga ttcgaaagga + 5701 tgggggttct gctatttttg ctcagacgcg tataggaaaa aatggtcgtc agttcacttt + 5761 ttataagttt cgctctatgt gtgtagatgc cgaggcgaaa aaaagagaac tcatggaaca + 5821 aaataccatg cagggtggaa tgtttaaggt ggacgatgat cctcgtatca 
cgaaaattgg + 5881 tcgttttata cggaagacta gcttggacga gctaccacag ttttataatg ttctaaaggg + 5941 agatatgagt ttggttggca cacggccacc aacagtggac gagtatgaac actatacccc + 6001 agaacaaaaa cgtcggctaa gttttaaacc tggtataaca ggcttatggc aggtcagtgg + 6061 acgaagtgag attaagaatt ttgatgaagt tgtcaaatta gatgtagcct atatagacga + 6121 ttggacaatt tggaaagata ttgagatttt attgaagaca gttaaagttg tattgatgaa + 6181 ggatggagcg aagtagattg atagatgtaa aaatcattgt ggcaacacat aaagaggtta + 6241 aaatgcctca agacaatagt ctttaccttc caatacatgt tgggagagac ggtaaatcag + 6301 atattggttt tatcggtgat aatactggcg ataatatatc ctctctaaat ccatattatt + 6361 gtgagttgac gggactttat tgggcatgga agaatcttga ttataattac ttaggtctag + 6421 ttcattaccg tcgttatttt acaaataaat ctcaagggta taatgaaaat gtcaatatgg + 6481 atgacgtcat tttgtctcga tctaatgttg aaatattatt agagaaatct gacgtaatag + 6541 ttccaaagaa gcgaaagtat tatattgaaa ctctttattc acattatgcc cataccctta + 6601 acggagaaca tctggatctt gctaggaaaa ttattgagca aaatagttca gagtatcttt + 6661 catcctttga taaagtgatg aaacaaagaa gcggttatat gttcaatatg tttatcatga + 6721 aaaaaggact attagatgat tatttaccgt ggcttttttc tattctggat actatgtacg + 6781 aacagatgga cttgaccgac tatacttcat ttgagtcacg tttattcggg cgagttagtg + 6841 agttgttgtt taatgtttgg ttatgtaaaa aaggaataac gcctaaagag gtaccattta + 6901 tgtacatgga gagagtggat ttgtttgaaa aaggaaaatc ttttttaatg gctaaatttt + 6961 ttggaaagaa gtatggacag agtttctagg agggaatatg aaaatcacta tcaaaaggta + 7021 ttcactgcca gaaattttag gactagcagc attagctata ttcctcctat tttcgctatt + 7081 ggatgtaagt ttttacgttc agtatatatc tcctatgcta tataaagctg caatcttttt + 7141 gataattatg ctaataattt tgaaggaatt tgtatctggg agtaatagct ttgagtctct + 7201 attgggttta ctaggggttt ctacgctcta ttttatcata ggtagtgtaa cgagctatac + 7261 ttcttttata gtcttagggc tatctctgat atatagcttg agggatattc ccttttcaaa + 7321 agtagtcaaa gtagccttta tcattagtgt tgctatgttg ttccttgtga tattgagtag + 7381 taagataggt tttattcctg attacattga gttttcatct actagagttc gacactatct + 7441 tggattccga tattcattat ttccatcaac gatcatgatg aatattatag ctatatcatt + 7501 ttttttgaag 
caagaaacag tatcgtatca gcgccttttt atattatttt tagtttcaat + 7561 gtacctatat ttagaaactg attcacgact gacttttatc agttcgagtt tgttactatt + 7621 agctaatttg gctatgaagc taatccctac tgttattgaa aaatttagtc ttttattaaa + 7681 atttttcacg cttacctatt ttgttaatgc ctatttaagt tattggattt caaaaaatta + 7741 cttaaggaca tcaaatgcct tgttgaatca tttttttcat caagcagatc aattcttagg + 7801 ggggcgtatt tatttatcta atcgttcgtt aagtttatat ggttatggga ttcttgggca + 7861 gaaaattgct tgggttggaa acgccttgaa tgcgcaagga gaacgaagta cggatgcata + 7921 tttatatgta gataatctat atattcagat tcttcaacat tttgggctga tagctttaat + 7981 tattatttta agtttactga ctgcgacttt agtgaagctt ttgagaaagg gacaaattgt + 8041 cttaagtatt attatagttt ctctgagttt ccatgctttg attgacgatt tgatattgag + 8101 tatccattat aatatttttt ggatattatt aggtagttta atctactcaa attatcagtt + 8161 ttctgaagaa aggtatggag aagttgagaa tgattcctta cgtagaactg taagggaagg + 8221 ttattaatag ggtttaatat gaataataga gatggaaaat attatattgg actagtaatg + 8281 aaaattatta ctaacccatt aaagatatta aagataaaaa aacgccgagt tctgctgaaa + 8341 agttataatg cagagactat ttcttgcaat ccaaagtata tttataacga acttaagaaa + 8401 attaatcgtt atgaattagt gtgggtgttg aaggagccag aaaaatatcc tgatgtaaaa + 8461 gcagtaaagt atatgtcgtt aaaatggttg tattatatag ttacttctca atacgtaata + 8521 tcaaatacgg gatttaactt ttggcttcct aaaaagaaaa aacagatata tataaataca + 8581 tggcatggag gtggagcata caaagatagt gacaatttaa acaatattag taaagcgcag + 8641 gtcaagcaaa ttaaaaagag tgcagagttg gaagattatt ttatatcgag ttgtgcagtc + 8701 tttacaaagg aatatgcaaa gaaaagagta ggatttaaag gtaaaatact agagataggg + 8761 acacctcgaa atgatttttt aattcgtaat caagcagatg atggtctaaa aaatagtata + 8821 aaaaatcgac ttggaataga tgataattgt tctatagtaa tttatgctcc aacatggcga + 8881 gatgatgctt cagctattga agagatagat tatgaaagct tactagaaag tttaagagag + 8941 acatatccaa aagtgagtat tttagtacgt ggtcatcatc ttcaaaagaa tttgattgat + 9001 ataaagaatt caaatattgt taatgtatct gactatgatg atatgcaaga attattatta + 9061 atttcagatt tattaattac tgattactct tcaacaatat gggatatgat tcatggaggg + 9121 aaaaaagtat tattatatac tcctgattta 
gatgaatatt taaaatatcg aggatttcat + 9181 gtagatataa aagaatggaa cattccatac tttaaaacta acgaagagtt gattgcatat + 9241 atctcttcaa attattttaa aaatatggaa gaaatgatag agaaccataa gattagattt + 9301 ggaagttttg aacacggaaa tgcaactcaa aaaatagtgg aattattaga agaaggtaat + 9361 taaatgaaag taagtgtaat aatacctgtt tataatgttg aaaaatattt aagaaggtgt + 9421 ttggattccg ttgttaatca aacatacaaa gatattgaag tgattttggt aaatgatggt + 9481 tctccagata attcaaaaga aatatgtgaa gaatacgttg ctaaatattc caatattcaa + 9541 ttaataaatc aaaagaatgc agggctaggt gcagcaagaa atactggtct acagtatata + 9601 acaggaaatg cggtaacttt tgtcgattct gatgattggt tagagttaga tgcaattgaa + 9661 tattatgttg catctatgaa aaagagtgac gcagatattg tagttactca aatgattaga + 9721 aaaaaagaat atttttctaa tgaaggaact aatgggacga ctataaaaga agaggtccta + 9781 aatcaggaac agtttgcaaa aaaatatttt aaaatagatg gtaataatat agagtattat + 9841 gcttgtgcaa aactttataa gagagagatt gctagagagg ttaaataccc tgttggttta + 9901 tttgcagaag acgtccctgc agcatttggt tatattatac gttcacaaaa aattttttat + 9961 agtacaaaag taacgtataa ttatttcttt aatgataata gtttaacggc taaatttaca + 10021 gataaagatt ttgatttgga aaagatatgg gatctagtcg tagaagaagc aaaggtttat + 10081 gggaacgagg attatatttt atatgccaag gtgaatagat atagaatcga ttttaatctt + 10141 ttgtgcagaa ttgctttatc ggaaaataaa tctgatatag aaaaatatag ccaagaaata + 10201 gtggttctac ttggaaaagt taaagaaaat aaaaaaattt tattaaagta tttaccgttt + 10261 tctaggaagg tgatatttag attgtttata gttgattata cgctaggaag aaatgttttg + 10321 agaatgttta agaatattgt gtagttaaca aatattggta taaggtgata gaaatgtatt + 10381 attttataaa agtagagaaa gatttaaaaa atacagccgg gattaaagcg cctgatgata + 10441 tagaaaaaat ttcagaagaa ttgggaatga aagaaatacg ctttcccaag tttccttttg + 10501 aaaaaaataa agttatacaa aaactctggc ttttttgtgt tgtaggttat aattggataa + 10561 gtctgttgtg gagacttaaa aagaatgatg tagttattta ccaacatcca atgtacggag + 10621 tgcgtgttgc aaattttgca attcctttat tgaaaaagta taaaaatata aaatttattt + 10681 cagtaataca tgatttagaa tcgttaagaa aaggaatcca aggagtcatt gaagataatg + 10741 aaacaacaaa tgctattgca gacaaagagt tgttgtcaaa 
atttgataaa gtgatttccc + 10801 ataatccgaa aatgacagaa tatttagaag ggatagggat aaaaaaagaa aatttagttg + 10861 aattgcaaat attcgactac ctagatccat cagaaataga agaaaagatt gaagatggag + 10921 tggttatagc ggggaatcta gcaaaaggaa aaagttcata tatatataag ttgttagaaa + 10981 atgaactgaa cttcaaatta aatctttttg ggccaaattt tattaacgaa gagctaccag + 11041 aaaacgttga gtattttggt agtttacctc caaataaatt gcctcaaaag ctagtaggta + 11101 agtttggttt ggtttgggac ggtgatagtc tagaaacttg tagtggaaat actggtaact + 11161 atttgaagta taataatcca cataaaacct cattatatct tgcttcagga atacctgtaa + 11221 ttatctggaa agaagctgcg ttagcacagt ttattgaaga aaataatgtt ggtattactg + 11281 taaataattt gtcagaaatt gagtttgtga tgcaaaatat atctgagggc gaatatttat + 11341 caataaaaag aaatacaatg caattgggtg aaaaattaag aaatggatat ttttatcgtc + 11401 aggcgatatc taagtgcaaa aatgatttca tgaagtaaga gggcatataa aaagacggaa + 11461 aatatttagc aataaatact gtagcttatt ttttattgaa gtggatgtgt aatttcagat + 11521 aactatggag ttgctcacca attaaatcag aactcaaaaa acaatagact ccctgcgaaa + 11581 caaaatatgg tatagtagtt ctatgaatga tgaagcaagt aaacaactaa ctgatgcacg + 11641 atttaagcgt cttgttggtg ttcagcgcac gacttttgaa gagatgttag ctgtattaaa + 11701 aacagcttat caacttaaac acgcaaaagg tggacgaaaa cctaaattaa gcctagaaga + 11761 ccttcttatg gccactcttc aatatgtgcg agaatatcga acttatgaag aaattgcggc + 11821 tgattttggt atccacgaaa gcaacttact ccgtcggagc caatgggttg aagtaactct + 11881 tgttcaaagt ggtgttacga tttcaagaac tcctctcagt tctgaggaca cggtaatgat + 11941 tgatgcgacg gaagtacaaa tcaatcgccc taaaaaaaga attagcgaat tattctggta + 12001 aaaaaaatgc cacgctatga aggctcaagc gattgtcaca agtcaaggga gaattgtttc + 12061 tttggatatc actgtgaact attgtcatga tatgaagttg ttcaaaatga gtcgcagaaa + 12121 tatcggacaa gctggtaaaa tcttggctga cagtggttat caagggctca tgaagatata + 12181 tcctcaagca caaacttcac gtaaatccag caaactcaga ccgctaatag ttgaagataa + 12241 agcctgtaac catgcgctat ctaaggagag aagcaaggtt gagaatatct ttgccaaagc + 12301 aaaaacgttt aaaatgtttt caacaaccta tcgaaatcat cgtaaacgct tcggattacg + 12361 gatgaatttg attgctggta ttatcaatca tgaactagga 
ttctagtttt gcaggaagtc + 12421 taataattaa attggaattg tgaacgtaaa tgaaagtact taaaaactat gcatacaatc + 12481 tatcttatca attattggtg attatacttc caatcattac gaccccctat gtgacacggg + 12541 tcttttcttc gaatgatcta gggacatatg gttattttaa ctccatcgtt acttatttta + 12601 tcctcttagc aacgctaggg gttgccaact atgggaccaa ggtcatttca gggcatcgca + 12661 aagaaattga aaaaaacttt tggggaatct actctctgca attaggtgca acagtttttt + 12721 ctctaacctt gtattgtctt ctttgtctaa ctcttccctt tatgcaaaat ccagtagcct + 12781 acattctagg cttggctttg gtttctaaag gattagatat atcctggctt tttcaagggc + 12841 tagaggattt tcgaaagatt actgttcgaa atatcacagt caagttcgtt ggtgtaatct + 12901 ctatcttcct ctttgtcaaa tctgcagatg atctatacct ctatgtcttt ttgctaacca + 12961 tatttgaact cttggggcag ctaagtatgt gggtgcctgc tcgtgagttt attggtagac + 13021 ctcattttga tttagaatat gctagacatc atttgaaacc agtcatatta ttgttccttc + 13081 cgcaagtggc gatttccttg tatgttacgc tagatcgtac catgcttgga gcgttagctt + 13141 ctacaaaaga tgtagggatt tatgaccagg ctttaaagtt ggtaaatatc cttctgacct + 13201 tggtaacttc cttgggaagt gtcatgttgc ctagagtttc aaatctttta tcctcagggg + 13261 atcataaagc agttaacaaa atgcatgaga tatcattttt aatttataat ttggttattt + 13321 tccccattat ggcaggaatg ctaattgtaa atgatgactt tgttaccttt ttcctcgggc + 13381 aagattttca agaggcacgt tatgcaatag caattatgat ttttagaatg ttctttattg + 13441 gttggaccaa tattatgggg attcaaattt tgatacctca taatcaaaat aaagaattta + 13501 tgctgtcaac aacaattcct gctattgtta gtgttggatt aaatcttctc ttgcttccca + 13561 agtttggata tataggagca gcaattgttt ctgtcttaac agaggcgcta gtatgggcta + 13621 ttcaattgta ctatattcgt gcatacctaa aagatgttcc gattattaga actatgataa + 13681 agattattct agcctcagct atcatgtata gcgttttgct agtttctaag acatacatac + 13741 atttttcccc aactataaat gttttggtat ttgtggtgtt aggtggaatc atttatcttt + 13801 tttcagtttt atctctaaaa gtggtagatg tgatagaatt aaaacaagta attaggaaaa + 13861 attagaatgc ataaatttaa agatattaac ttggatttac taaaagtaat tgcatgtgtt + 13921 ggagttgttt tactccatac agagatgggg ggatttaaag agacaggttc atggaatttt + 13981 tcgacatatt tatactactt aggaacctat tctatccctc 
tattttttat agttaatggt + 14041 tatttattgt tagggaagaa agagattacc tattcctaca tattacagaa agtaaaatat + 14101 attctaataa cagtgctgtc atggaccttt atagtttggt tatttaaacg ggatttttca + 14161 gttaatccaa taaaaaaact tataggatca ttggtgcaaa aaggttattt ctttcagttt + 14221 tggttttttg gtgcgcttat acttatttat atatgtctcc ccgttttgaa acaatttctt + 14281 aattcaaaaa gaagttattt atacttttta tctgtattgc tagttattgg tttaattttt + 14341 gagttaacaa atattgtact tcaaatgcca atacaaacat atgtaataca aacttttaga + 14401 ttatggactt ggcttttcta ttatatttta gggggcttta tatctcagtt tgataaaaat + 14461 accatcaaaa atgggtttaa gagatggatg aaagtaattg cagtactttt attattagtt + 14521 tcgccattta tattattttt catagcaaag accacttacc ataatttttt tgctgaatat + 14581 ttttatgata ttttattagt aaaagttgta agcgtaggga tttttctaac tattttctca + 14641 attgtattga atgaaaatag caacaaatgg attatttttc tttctaatca aactatgggt + 14701 atctttataa tacacactta tattatgaag gtatgggaaa aactatttgg ttttaatttt + 14761 ataggttcat atttactttt tgctatattt actttaagtg ttagttttat cattgttgga + 14821 atgttaatga aaattccgta ttttaatcga atcgtcaaat tataaaaagg agaaaaaatg + 14881 tacgattatc ttgttgttgg tgctggtctc tttggtgcag tctttgccca tgaagcagcc + 14941 ttaaaaggaa aaaaagtaaa agttattgaa aaacgaaatc atatcgcggg taatatctat + 15001 actcgtgaag aggaaggaat tcaagttcat caatatggtg ctcatatctt ccatacttct + 15061 gataaggaga tctgggatta tgtaaatcag tttgcagagt ttaaccgtta taccaattct + 15121 cctgttgcaa actataaggg tgagatttat aaccttcctt ttaatatgaa tactttcaat + 15181 aaactttggg gagttgtaac gccagcagaa gcacaagcta agattgagga acaacgtgct + 15241 attttaaatg gtaaaactcc tgaaaatttg gaagaacagg cgatttctct tgtaggtaca + 15301 gacatctacg aaaaattaat caaagactat acagagaaac agtggggcaa accaactact + 15361 gaacttccat cctttattat tcgccgtttg ccagtacgcc tgacctatga taacaactat + 15421 tttaacgata cctatcaagg gattccaatt ggtggataca ctcaaatagt tgaaaaaatg + 15481 ttggatcatg aaaatattga tgtagaaaca aatgttgatt tctttgtgaa taaagagcaa + 15541 tatctgaaag attttcctaa gattgtcttt actggtatga ttgatgaatt ctttgactat + 15601 aagttgggcg aactagagta ccgtagtctt cgttttgaaa 
atgagacctt ggatatggaa + 15661 aattaccaag gaaatgcagt tgtgaactat acggatgcag aaactccata tactcgcatt + 15721 attgaacaca aacattttga gtttgggagt caagcaaaga ctatcattac taaagaacat + 15781 tctaaaacat gggaaaaagg tgatgagcct tattatccag ttaataatga tcgtaataat + 15841 catttgtata aatcatacaa aaaacttgct gatgagcaag ggaatgttat ctttggtggc + 15901 cgcttaggac actatcgtta ttacgatatg caccaagtaa ttggagtagc tttgcagtgc + 15961 gtgagaaatg agttaaatta atactcaatg aaaattaaag agcaaactag gaagctagcc + 16021 acaggttgct caaaacactg ttttgaggtt gcagatggac gctgacgcgg tttgaagaga + 16081 ttttcgaaga gtataaacaa gtaaaactga ctaccagtta ttatttagaa atagtattaa + 16141 aaattccttg actatgtgat atagttgagg gatttttaaa tgatattcat attttttgca + 16201 aagatgttgt ttgaaaaata attttcaaaa attctgaaaa ttctgttgac aactttctga + 16261 aaagagtcta taatggagag aaagttttaa aggagaaaat gatgaaaagt tcaaaactat + 16321 ttgcccttgc gggcgtgaca ttattggcgg cgactacttt agctgcatgc tctggatcag + 16381 gttcaagcac taaaggtgag aaaacattct catacattta tgagacagac cctgataacc + 16441 tcaactattt gacaactgct aaggctgcga cagcaaatat taccagtaac gtggttgatg + 16501 gtttgctaga aaatgatcgc tacgggaact ttgtgccgtc tatggctgag gattggtctg + 16561 tatccaagga tggattgact tacacttata ctatccgtaa ggatgcaaaa tggtatactt + 16621 ctgaaggtga agaatacgcg gcagtcaaag ctcaagac +// + diff --git a/public/res/serotype_genbank/serotype_35C.gb b/public/res/serotype_genbank/serotype_35C.gb new file mode 100644 index 0000000..201b6d3 --- /dev/null +++ b/public/res/serotype_genbank/serotype_35C.gb @@ -0,0 +1,898 @@ +LOCUS CR931706 19741 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 7765/43 (serotype 35c). +ACCESSION CR931706 +VERSION CR931706.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. 
+REFERENCE 1 (bases 1 to 19741) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 19741) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..19741 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="7765/43" + /db_xref="taxon:1313" + gene <1..163 + /gene="dexB" + /locus_tag="SPC35C_0001" + CDS <1..163 + /gene="dexB" + /locus_tag="SPC35C_0001" + /codon_start=2 + /transl_table=11 + /protein_id="CAI34319.1" + /db_xref="GOA:Q4JZD8" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4JZD8" + /translation="DRRFLVVANLSNEEQDLTVEGKVKSVLIENTAAKEVLEKQVLAP + WDAFCVELL" + gene 323..491 + /gene="aliB" + /locus_tag="SPC35C_0002" + /pseudo + CDS 323..491 + /gene="aliB" + /locus_tag="SPC35C_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(order(492..1024,1026..1352)) + /gene="tnp" + /locus_tag="SPC35C_0003" + /pseudo + CDS complement(join(492..1024,1026..1352)) + /gene="tnp" + /locus_tag="SPC35C_0003" + /note="member of homology group 4; + member of homology group 4" + /pseudo + /codon_start=1 + 
/transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(join(962..1024,1026..1334)) + /gene="tnp" + /locus_tag="SPC35C_0003" + /note="HMMPfam hit to PF01710, Transposase, score 3.8e-23" + /pseudo + gene 1559..3013 + /gene="wzg" + /locus_tag="SPC35C_0004" + CDS 1559..3013 + /gene="wzg" + /locus_tag="SPC35C_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI34322.1" + /db_xref="GOA:Q4JYW1" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4JYW1" + /translation="MLIMSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNI + LAFRYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLLFSILVSSVSLFAVQQFVGL + TNRLNATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNT + DLTVNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKV + EAPKTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPI + ADGGNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGIDVY + NDQEFTAHTNGKYYPAGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKL + TSTEALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDL + PSYAMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1559..1684 + /gene="wzg" + /locus_tag="SPC35C_0004" + /note="Signal peptide predicted for SPC1688 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 42 and 43" + misc_feature 1772..2119 + /gene="wzg" + /locus_tag="SPC35C_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 8.6e-63" + misc_feature 2297..2740 + /gene="wzg" + /locus_tag="SPC35C_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 2.5e-69" + gene 3015..3746 + /gene="wzh" + /locus_tag="SPC35C_0005" + CDS 3015..3746 + /gene="wzh" + /locus_tag="SPC35C_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34323.1" + 
/db_xref="GOA:O86886" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:O86886" + /translation="MIDIHSHIVFDVDDGPKSREESKALLTESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDRGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEQDLVHIIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 3018..3626 + /gene="wzh" + /locus_tag="SPC35C_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 4.6e-36" + gene 3752..4447 + /gene="wzd" + /locus_tag="SPC35C_0006" + CDS 3752..4447 + /gene="wzd" + /locus_tag="SPC35C_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34324.1" + /db_xref="GOA:O86887" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:O86887" + /translation="MMKEQNTIEIDVFQLFKTLWKRKLMILIVALVTGAGAFAYSTFI + VKPEYTSTTRIYVVNRNQGDKPGLTNQDLQAGSYLVKDYREIILSQDALEKVATNLKL + DMPAKTLASKVQVTVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIELLDTRVKRPEDVEDVLKI + PLLGLVPDFDKIK" + misc_feature 3752..3868 + /gene="wzd" + /locus_tag="SPC35C_0006" + /note="Signal peptide predicted for SPC1690 by SignalP 2.0 + HMM (Signal peptide probability 0.625) with cleavage site + probability 0.411 between residues 39 and 40" + misc_feature 3773..4189 + /gene="wzd" + /locus_tag="SPC35C_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 3.1e-55" + misc_feature 4295..4372 + /gene="wzd" + /locus_tag="SPC35C_0006" + /note="PS00217 Sugar transport proteins signature 2." 
+ gene 4457..5146 + /gene="wze" + /locus_tag="SPC35C_0007" + CDS 4457..5146 + /gene="wze" + /locus_tag="SPC35C_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34325.1" + /db_xref="GOA:Q4JZK1" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4JZK1" + /translation="MPTLEISQAKLDSVKKAEEYYNALCTNLQLSGDGLKVFSITSVK + IGEGKSTTSANIAWAFARAGYKTLLIDGDIRNSVMLGVFKARNKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFTTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRNCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGIVLNKFDTSVDKYGSY + GNYGDYGKNKK" + gene 5161..6528 + /gene="wchA" + /locus_tag="SPC35C_0008" + CDS 5161..6528 + /gene="wchA" + /locus_tag="SPC35C_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI34326.1" + /db_xref="GOA:Q4JYV7" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4JYV7" + /translation="MNGKILRSSLAIIQSFLVILLTYLLSAVRETEIVSTTAIALYIL + HYFVFYISDYGQDFFKRRYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYF + LTLHALLVYVLNLFIKWYWKRAYLNFKGSKKILLLTATSRVEKVLDRLIESNEVVGKL + VAVSVLDKPDFQHDCLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + IDVTVNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHIMAKRIIDIMGALVGLIL + CGLVSIVLVPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVLM + KDGAK" + misc_feature 5161..5247 + /gene="wchA" + /locus_tag="SPC35C_0008" + /note="Signal peptide predicted for SPC1692 by SignalP 2.0 + HMM (Signal peptide probability 0.844) with cleavage site + probability 0.429 between residues 29 and 30" + misc_feature 5944..6525 + /gene="wchA" + /locus_tag="SPC35C_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 4.8e-158" + gene 
6515..7321 + /gene="wciB" + /locus_tag="SPC35C_0009" + CDS 6515..7321 + /gene="wciB" + /locus_tag="SPC35C_0009" + /note="member of homology group 16" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34327.1" + /db_xref="GOA:Q4JZB6" + /db_xref="UniProtKB/TrEMBL:Q4JZB6" + /translation="MERSRLIDVKIIVATHKEVKMPQDNSLYLPIHVGRDGKSDIGFI + GDNTGDNISSLNPYYCELTGLYWAWKNLDYNYLGLVHYRRYFTNKSQGYNENVNMDDV + ILSRSNVEILLEKSDVIVPKKRKYYIETLYSHYAHTLNGEHLDLARKIIEQNSSEYLS + SFDKVMKQRSGYMFNMFIMKKGLLDDYLPWLFSILDTMYEQMDLTDYTSFESRLFGRV + SELLFNVWLCKKGITPKEVPFMYMERVDLFEKGKSFLMAKFFGKKYGQSF" + gene 7330..8523 + /gene="wzy" + /locus_tag="SPC35C_0010" + CDS 7330..8523 + /gene="wzy" + /locus_tag="SPC35C_0010" + /note="member of homology group 45" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI34328.1" + /db_xref="UniProtKB/TrEMBL:Q4JYV5" + /translation="MKITIKRYSLPEILGLAALAIFLLFSLLSITLYAQYISIKVYFI + ALFGIILLIFLKELISESYNLKSVIGLFVIFTLCFIIGTVTNYAYFFILGLFLIYSLR + NLPFSDVAKVSFIISISVLLLVVLSSKLGIIPDYIEISPTRVRHYLGFRYSLLPSTLM + MNIIAISFFLKQENASYPRLLVLFLLSGWLYVETDSRLTFINSCLFLLVNLIMKLSPS + IIEKVGRLLKLFSFTYFINACLSYWIAKTYLNTSNVVLNQFFYQADQFLGGRIYYSNR + SLSLYGYKLLGQKIDWIGNGLSIQGERSTETYLYVDNLYIQILQHFGLIVSVIILSLL + TITLVKLLKKGQMVLGIILVILSFHALIDDLILNLYYNIFWVLIGMLIYKKYQFYDKK + QLTIE" + misc_feature 7330..7431 + /gene="wzy" + /locus_tag="SPC35C_0010" + /note="Signal peptide predicted for SPC1694 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.778 between residues 34 and 35" + gene 8678..9673 + /gene="wcrI" + /locus_tag="SPC35C_0011" + CDS 8678..9673 + /gene="wcrI" + /locus_tag="SPC35C_0011" + /note="member of homology group 128" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34329.1" + /db_xref="GOA:Q4JZB4" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JZB4" + 
/translation="MNKINLTDNLPLISVVLPVYNVENYLEKCLNSVVRQTYKNIEII + IVNDGSLDSSIDICNKYANKDSRIKVFTKPNGGLSDARNFGVKKSMGEFITFVDSDDY + VTDDYVEYLYSLVKKYNCKMSMCSIFVHYISNDKMINNGTGRELMMTAEQCIEKMCYH + DEVDTCAYAKLYHRSLFSEICFPKGRIFEDIGTIYRFFGTAGQIACGFNAKYYYEIRE + NSIVTSSFSEKKFDLLFMTDQMRNFVDQRYPSLKAATKRRAVYARFSTLNQLLDVQGY + NEEKKEIIRFIQDNKEALLENPKTPKRDRLAVRALSLGFCIYKLLWKQYLKIQRG" + misc_feature 8717..9220 + /gene="wcrI" + /locus_tag="SPC35C_0011" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 1.2e-47" + gene 9675..10826 + /gene="wcrJ" + /locus_tag="SPC35C_0012" + CDS 9675..10826 + /gene="wcrJ" + /locus_tag="SPC35C_0012" + /note="member of homology group 129" + /codon_start=1 + /transl_table=11 + /product="putative glycerol phosphotransferase" + /protein_id="CAI34330.1" + /db_xref="GOA:Q4JYV3" + /db_xref="InterPro:IPR007554" + /db_xref="UniProtKB/TrEMBL:Q4JYV3" + /translation="MNKEFLKYIYIRLLRNLRRIFFIIPIIRNRVVFESFSGDAYSCN + PKYISEELRKQYGDSVEIIWAFNDPNKFKKELPKEIVTCRYRSFNHLIYRITSKVYVC + NFLQAIEIPKRKGQLEIQTWHGGGCYKKVGVAEKGRQAAYVKRQRMHVEETDLFITSS + KYFENEVVKKQFGYKGEILSIGMPRNDILINLPISSQVEKLKEKLGLPNNKLIALYAP + TWRSGTKQYETLDIKKLTQAVDKKFGKKCIVLFRSHLYGNQSYDDVVDVSQYSDMQEL + LLLSDILITDYSSSMWDFSLSFKPCFLYTPDLKDYLDERGFDEDIHSWGFSVSESNKE + LVENILQFDNEEYRQKMKNHHQFLESYEQGDAAKRVVAKIAEYCNLYRG" + misc_feature 10275..10802 + /gene="wcrJ" + /locus_tag="SPC35C_0012" + /note="HMMPfam hit to PF04464, + CDP-Glycerol:Poly(glycerophosphate) gl, score 5.1e-37" + gene 10830..11735 + /gene="wcrK" + /locus_tag="SPC35C_0013" + CDS 10830..11735 + /gene="wcrK" + /locus_tag="SPC35C_0013" + /note="member of homology group 130" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34331.1" + /db_xref="GOA:Q4JYV2" + /db_xref="InterPro:IPR008441" + /db_xref="UniProtKB/TrEMBL:Q4JYV2" + /translation="MKKIAYLIKRYGVKNVVLRAINDVLPVNLIFPSQQLRRLNWQEK + VKKKLKKYVVISDSIKSEEECDIIWWLWFQGLDNAPAIVKKCRESVDKYAKRSGKRVI + ELTSQNLFEYIEVPNELYVKYKSGSLPLALFSDFCRISLLSNYGGLWIDSTVLITGEI + 
EDEILNQDIFMFQASPLDYSVTKISNWMLYSKYPGHPFISSIRDTLISFYNKNNTIPD + YFLFHLLVSCLIDDNRINQSFYDMDYYTNTYPHLLGRVLSEPYDTLKFENILRKTSIH + KLSYKNLDNVAEDSFYNAILGLDFS" + misc_feature 10884..11714 + /gene="wcrK" + /locus_tag="SPC35C_0013" + /note="HMMPfam hit to PF05704, Capsular polysaccharide + synthesis protein, score 4.7e-51" + gene 11753..12469 + /gene="mnp1" + /locus_tag="SPC35C_0014" + CDS 11753..12469 + /gene="mnp1" + /locus_tag="SPC35C_0014" + /note="member of homology group 131" + /codon_start=1 + /transl_table=11 + /product="putative IspD-family transferase (mannitol)" + /protein_id="CAI34332.1" + /db_xref="GOA:Q4JYV1" + /db_xref="InterPro:IPR001228" + /db_xref="InterPro:IPR018294" + /db_xref="UniProtKB/TrEMBL:Q4JYV1" + /translation="MNLAVIFAGGSGTRMNAKDRPKQFLLVHGKPIIVHTIELFENHP + EIDGIIVVCIEDWIPYMEEMKYCYRLDKIAKIVPGGATGQLSIYNGLVAAEQLYGIED + NVVLIHDGVRPLITADTISDNIQSVKEKGNAITCTVAKETVILVDDENKVDEVPSREH + SRFAKAPQSFWLKDILGAHRASVDNGRNNFIDSCTMMRYYGHDLHVVVGPYENIKITT + PDDFYTFRALYDLRENKQLK" + misc_feature 11759..12451 + /gene="mnp1" + /locus_tag="SPC35C_0014" + /note="HMMPfam hit to PF01128, Uncharacterized protein + family UPF000, score 3.9e-23" + misc_feature 11759..12448 + /gene="mnp1" + /locus_tag="SPC35C_0014" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 6.5e-05" + gene 12480..13550 + /gene="wcrH" + /locus_tag="SPC35C_0015" + CDS 12480..13550 + /gene="wcrH" + /locus_tag="SPC35C_0015" + /note="member of homology group 51" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34333.1" + /db_xref="GOA:Q4JYV0" + /db_xref="InterPro:IPR016503" + /db_xref="UniProtKB/TrEMBL:Q4JYV0" + /translation="MKYFVEETLLDEQDKKNAGGKARQDVTDILESIGYQKLIAESEM + NERQELNAVQRLVHHYKVKKMWKKTLSVVGKGDEVIIQFPLLNHSLFFNQVIKQLSKN + GVKVYFLIHDLESLRWSQSKSISLKSRIRLNIEEHSVLRLSEGIIAHNKKMKSYIKTY + SVESSKIIPLETFDYIIPSYHERKNLDNFQLNAPIVIAGNLKQHKAGYVYHLPSNVEF + NLYGIGYEQTDDKSVHYCGSFMPEELPFVLKGSFGLVWDGPSSESCIETYGEYLRVNN + 
PHKTSLYLASGIPVVVWSEAAIASFIKENNCGILVSNLSELPELLSMITVDEYELMKK + NTEIIGERLRQGFYTKQAVKGF" + gene 13566..14645 + /gene="mnp2" + /locus_tag="SPC35C_0016" + CDS 13566..14645 + /gene="mnp2" + /locus_tag="SPC35C_0016" + /note="member of homology group 132" + /codon_start=1 + /transl_table=11 + /product="putative dehydratase/epimerase (mannitol)" + /protein_id="CAI34334.1" + /db_xref="GOA:Q4JZA9" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JZA9" + /translation="MIESFNDKVLQEDLEIIAKEELPFRKFRNSTVFITGVTGLVGLQ + LFKALACINRVHQLNMKIIGLVRNLDKAEKIFGDLLKRKDIQIVLGDVSEDFHSYIPD + GLVIDYIIHGASVTTSKLMIEFPVDTIRVAFNGTYQMLELAKEKKVKSFVYLSSMEVY + GSFQSDRTTVVNENMLGYLDLTSVRTNYPECKRICENMCIAFLSQYQVPAKIARLSQT + FGAGTLPGENRVFAQFARSVMQGKDIVLHTLGQSEGNYCYTADTVVALLTILLRGENG + EAYNIANEESHTTIADMAKMVTSQFSQTSQVVFDIPKKNIFGYAVDTKMKLSTHKIQQ + LGWKPRVSLVDAYDRMMRSMNETGV" + misc_feature 13659..14411 + /gene="mnp2" + /locus_tag="SPC35C_0016" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 9.2e-23" + misc_feature 13662..14504 + /gene="mnp2" + /locus_tag="SPC35C_0016" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/iso, score 0.00013" + gene 14654..16069 + /gene="wzx" + /locus_tag="SPC35C_0017" + CDS 14654..16069 + /gene="wzx" + /locus_tag="SPC35C_0017" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI34335.1" + /db_xref="GOA:Q4JZA8" + /db_xref="InterPro:IPR002528" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4JZA8" + /translation="MKVLKNYLYNLSYQLLVIILPIITTPYVTRIFSSDDLGTYGYFN + SIVTYFILLATLGIANYGTKEISGNRKSIQKNFWGIYTLQFGATTFSIFLYILACLFI + PGMKNLVAYILGLGLVSKGLDISWLFQGLEDFRKITVRNITVKLVGVSAIFLFVKSAS + DLYLYVFLLTAFELLGQLSMWFPAREYIGKPHFDIEYARHHLKPVILLFLPQIAISLY + VTLDRTMLGALASTKDVGIYDQALKLVNILLTLVTSLGSVMLPRVAHLLATGDHKVVN + KMHEVSFLIYNLVIFPIMAGMLIVNDDFVQFFLGQDFQDARYAISIMIFRMFFIGWTN + 
IMGIQILIPHNQNKEFMISTTTPAIISVGLNLLFLPKLGYIGAAIVSVLTEALVWAIQ + LFYTRRYLKEVPIIGSMSKIILASAIMYGLLLSSKTVIHFSPTLNVLAFVALGGIIYL + FAILSLKVVDVKELKQIIRKN" + misc_feature 14660..15454 + /gene="wzx" + /locus_tag="SPC35C_0017" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 1.5e-65" + gene 16071..17069 + /gene="wciG" + /locus_tag="SPC35C_0018" + CDS 16071..17069 + /gene="wciG" + /locus_tag="SPC35C_0018" + /note="member of homology group 21" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI34336.1" + /db_xref="GOA:Q4JYU7" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q4JYU7" + /translation="MRKNRNINLDLLKVLACVGVVLLHTTMGGFKETGSWNLLAYLYY + LGTYSIPLFFMINGYLLLGKREITYLYILQKVKWILITVSSWSFIVWLFKRDFTTNPI + KKIVGSLIQRGYFFQFWFFGALILIYLCLPILRQFLNSKRSYLYSLSLLMTIGLIFEL + SNILLQMPIQTYVIQTFRLWTWFFYYLLGGYIAQFTIEEIESRFKNWMKIVSILLLLI + SPIILFFIAKTIYHNLFAEYFYDTLFVKVSTLGIFLTILMLTLNENRRESIVSLSNQT + MGVFIIHTYIMKVWEKVLGFNFVGAYLLFALFTLSVSFIIVGMLMKIPYFNRIVKL" + gene 17083..18192 + /gene="glf" + /locus_tag="SPC35C_0019" + CDS 17083..18192 + /gene="glf" + /locus_tag="SPC35C_0019" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI34337.1" + /db_xref="GOA:Q4JYU6" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR006076" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JYU6" + /translation="MYDYLIVGAGLSGAIFAYEATKRGKKVKVIDKRNHIGGNIYCEN + VEGVNVHKYGAHIFHTSNKKVWDYVNQFAEFNNYVNSPVANYKGSLYNLPFNMNTFYA + MWGTKTPQEVKDKITEQTADMKDVEPKNLEEQAIKLIGPDVYEKLIKGYTEKQWGRSA + TELPPFIIKRLPVRLTFDNNYFNDRYQGIPIGGYNVIIENMLKDVEVELGVDFFAHRE + ELEASAEKVVFTGMIDQYFDYKHGELEYRSLRFDHEILDEENYQGNAVVNYTEREIPY + TRIIEHKHFEYGTQAKTVITREYPADWKRGDEPYYPINDEKNNAMFAKYQEEASKNDK + VIFCGRLADYKYYDMHVVIERALEVVEKEFGYDKK" + misc_feature 17518..18120 + /gene="glf" + /locus_tag="SPC35C_0019" + /note="HMMPfam hit to 
PF03275, UDP-galactopyranose mutase, + score 1.2e-137" + gene 18173..19207 + /gene="wcjE" + /locus_tag="SPC35C_0020" + CDS 18173..19207 + /gene="wcjE" + /locus_tag="SPC35C_0020" + /note="member of homology group 18" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI34338.1" + /db_xref="GOA:Q4JYU5" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q4JYU5" + /translation="MDMTKSRINWIDFGKGFSIFLVLAGHVLLGLYQSEKFPTANNIL + SLLIAQVYIFHIPVFFALSGYFFKPVSDLKEFWQYAKKKTIVFGLPYIFYSIIHFGLQ + KVAGASVRVPTTISDLLNIYKHPLGVSWYLYILWSILIIYGLLSILVKNRRMLFLISV + FAYCLTLFVQTDIYIIQRTLVWGICFFLGSVLSEIHFDKINLKKFLFFFVLFDFIYMF + AWFLFYEVGSKKDYVSYINPGLWGIAFIVCVLVAFAIFPKMEKNFPKTFLYFTKYGKD + SLGIYILHAPICSMIRILMLKVGINSVFLHVVVGIVLGWYLSILATYILKKIPFLNIV + LLPQKYIKLK" + gene 19382..>19741 + /gene="aliA" + /locus_tag="SPC35C_0021" + CDS 19382..>19741 + /gene="aliA" + /locus_tag="SPC35C_0021" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34339.1" + /db_xref="GOA:Q4K2T2" + /db_xref="InterPro:IPR000914" + /db_xref="UniProtKB/TrEMBL:Q4K2T2" + /translation="MMKSSKLFALAGVTLLAATTLAACSGSGSSTKGEKTFSYIYETD + PDNLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKD + AKWYTSEGEEYAAVKAQD" + misc_feature 19382..19468 + /gene="aliA" + /locus_tag="SPC35C_0021" + /note="Signal peptide predicted for SPC1705 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.277 between residues 29 and 30" + misc_feature 19628..19696 + /gene="aliA" + /locus_tag="SPC35C_0021" + /note="PS01040 Bacterial extracellular solute-binding + proteins, family 5 signature." 
+ORIGIN + 1 cgaccgtcgc ttcctagttg tggctaactt gtccaatgaa gagcaagact tgacagtaga + 61 aggaaaagtc aaatctgtct tgattgaaaa cactgcggct aaagaagtac ttgaaaaaca + 121 ggtcttggct ccatgggatg ctttctgtgt ggaattacta taaatatttt ttgcagaaaa + 181 atttaaaatt gaaatcatat aaaaacaagg gaggactgta taaaagacag aaatcctttg + 241 ttttttataa ccaaggttta taaactttca ttctcgaaat tcaattaact ttacaaattc + 301 ccactattta aggagaaaga agatgaacat aaagaagcga gtccttagtg caggcctgac + 361 ttttgcatct gctttgcttt tagctgcttg cggccaatca ggttcagata caaaaactta + 421 ctcatcaacc tttggtggaa atccaactac atttaactat ctattagact attacgctga + 481 taacatagtc aattgaaaca agaacaggac aaaagagcct cataaaaggt attgcaactt + 541 ggtaatacct tttacgaggc tttttgatat gagcccatgt tttctcaata ggattgtact + 601 caggtgagta gggaggaaga ggtaaaagtt tatgcccaaa ctcctcgcat aaaagttcta + 661 acttacccat tctatggaat cttgcattat ccataataat aaccgatggt gtggttaatg + 721 ttggtaagag aaacttctga aaccaagctt caaaaaagtc gctcgtcacc atctcttcgt + 781 aagtcattgg agcgattaac tcaccatttg ttagacctgc aaccaaagaa atcctctgat + 841 atcttcttcc agatacttta cctcttatta actgaccttt taatgagcga ccatattctc + 901 gataaaaata agtatcgaat cctgtttcat caatctaaac aggtgctagg tgctttaaac + 961 tattaaaatt cttaagaaat aaggctactt tttctggctc ttgttcatag taggtgtggt + 1021 tctttttttc gagtgtagcc catagctttg agcgcatagt ggatggtagt tggatgacag + 1081 ccaaattcag aagctatttc agtcaaataa gcgtctggat tgtcagtaag atagttttta + 1141 agtctatctc tatcaacctt tcttggtttt gttcctttta cttggtggtt tagctctcct + 1201 gttttctctt ttagctttaa ccagccataa atggtattac gtgagatttg gaaaacgtgt + 1261 gacgcttctg ttatactacc tgttcgctca caataagaga gaactttttt acgaaaatct + 1321 attgaatatg ccataagaag attataccac attgtgtact atattagatt gaaactagag + 1381 tagtacacct ctgcttctaa aacattgtta gaaatcgatt tgactgtcct tatttcattt + 1441 tattatattt ttggttcgcg ggaagtctac taagatactt aaagatgcag atagtgaaaa + 1501 taaaggtgta gacattaccg taaaaaagtg atataatcgt atgatgttca atgtataggt + 1561 gttaatcatg agtagacgtt ttaaaaaatc acgttcacag aaagtgaagc gaagtgttaa + 1621 tatagttttg ctgactattt atttattgtt 
agtttgtttt ttattgttct taatctttaa + 1681 gtacaatatc cttgctttta gatatcttaa tctagtggta actgcgttag tcctactagt + 1741 tgccttggta gggctactct tgattatcta taaaaaagct gaaaaattta ctatttttct + 1801 gttgctgttc tctatccttg tcagctctgt gtcgctcttt gcagtacagc agtttgttgg + 1861 actgaccaat cgtttaaatg cgacttctaa ttactcagaa tattcaatca gtgtcgctgt + 1921 tttagcagat agtgatatcg aaaatgttac gcaactgacg agtgtgacag caccgactgg + 1981 gactgataat gaaaatattc aaaaactact agctgatatc aagtcaagtc agaataccga + 2041 tttgacggtc aaccagagtt cgtcttactt ggcagcttac aagagtttga ttgcagggga + 2101 gactaaggcc attgtcctaa atagtgtctt tgaaaatatc atcgagtcag agtatccaga + 2161 ctacgcatcg aagataaaaa agatttatac caagggattc actaaaaaag tagaagctcc + 2221 taagacgtct aagaatcagt ctttcaatat ctatgttagt ggaattgaca cctatggccc + 2281 tattagttcg gtgtcgcgat cagatgtcaa tatcctgatg actgtcaatc gagataccaa + 2341 gaaaatcctc ttgaccacaa cgccacgtga tgcctatgta ccaatcgcag atggtggaaa + 2401 taatcaaaaa gataaattaa cccatgcggg catttatgga gttgattcgt ccattcacac + 2461 cttagaaaat ctctatggag tggatatcaa ttactatgtg cgattgaact tcacttcgtt + 2521 tttgaaattg attgatttgt tgggtggaat tgatgtttat aatgatcaag aatttactgc + 2581 ccatacgaat ggaaagtatt accctgcagg caatgttcat cttgattcag aacaggctct + 2641 cggttttgtt cgtgagcgct actcactagc agatggcgat cgtgaccgcg ggcgcaatca + 2701 acaaaaggtg attgtggcta tccttcaaaa attaacgtca accgaagcac tgaaaaatta + 2761 tagcacgatc attaatagct tgcaagattc tatccaaaca aatatgccac ttgagactat + 2821 gataaatttg gtcaatgctc agttagaaag tggagggaat tataaagtaa attctcaaga + 2881 tttaaaaggt acaggtcgga cggatcttcc ttcttatgca atgccagaca gtaacctcta + 2941 tgtgatggaa atagatgata gtagtttagc tgtagttaaa gcagctatac aggatgtgat + 3001 ggagggtaga tgaaatgata gacatccatt cgcatatcgt ttttgatgta gatgacggtc + 3061 ccaagtcaag agaggaaagc aaggctctct tgacagaatc ctacaggcag ggggtgagaa + 3121 ccattgtctc tacctctcac cgtcgcaagg gcatgtttga aactccggaa gagaagatag + 3181 cagaaaactt tcttcaggtt cgggaaatag ctaaggaagt ggcgagtgac ttggtcattg + 3241 cttacggggc tgaaatttac tacacaccag atgttctgga taagctggaa 
aaaaagcgga + 3301 ttccgaccct caatgatagt cgttatgcct tgatagagtt cagtatgaac actccttatc + 3361 gcgatattca tagcgccttg agcaagatct tgatgttggg aattactcca gtcattgccc + 3421 acattgagcg ctatgatgct cttgaaaata atgaaaaacg cgttcgagaa ctgattgata + 3481 ggggctgtta cacgcaagta aatagttcac atgtcctcaa acccaaactt tttggcgaac + 3541 gttataaatt catgaaaaaa agagctcagt attttttaga gcaggatttg gttcatatca + 3601 ttgcaagtga tatgcacaat ctagacggta gacctcctca tatggcagaa gcatatgacc + 3661 ttgttaccca aaaatacgga gaagcgaagg ctcaggaact ttttatagac aatcctcgaa + 3721 aaattgtaat ggatcaacta atttaggaga aatgatgaaa gaacaaaaca cgatagaaat + 3781 cgatgtattt caattattta aaaccttgtg gaaacgcaag ctaatgattt taatagtggc + 3841 acttgtgaca ggtgcggggg cttttgcata tagcactttt attgttaagc cagaatatac + 3901 gagtaccacg cgaatttacg tagtgaatcg caatcaagga gacaagccgg ggctgacaaa + 3961 tcaggatttg caggcaggat cttatctggt aaaagactac cgtgagatta tcctttcgca + 4021 ggatgcattg gaaaaagtag cgacaaattt gaagttggat atgccagcaa aaacgttagc + 4081 cagcaaagtt caagtgactg taccagctga cactcgtatc gtctcaatct ctgtcaagga + 4141 taaacagcca gaggaagcca gtcgtatcgc taattctcta cgagaagttg ctgcagaaaa + 4201 gatcgtcgct gtaacgcgag tatctgatgt aacgacactt gaagaagcgc gaccagctac + 4261 gactccctct tctccaaatg ttcgacgcaa ttccttgttt ggttttcttg gaggagcagt + 4321 cgtaacagta attgctgttc ttttgattga gttgctggac acccgtgtga aacgtcctga + 4381 agatgttgaa gatgtactga aaattccact tttagggctc gttccagatt ttgacaaaat + 4441 aaaataggag gaagttatgc caacattaga aatctcacag gcaaaattgg attctgtaaa + 4501 aaaggcagag gaatattata acgctttgtg cacgaaccta cagttaagtg gagatggttt + 4561 gaaagtattt tctatcactt ctgtgaaaat aggagaagga aaatcaacga cttccgccaa + 4621 tatcgcttgg gcttttgcgc gtgcaggtta caaaacgctg ctgattgatg gagatattcg + 4681 caattctgtt atgttaggtg tctttaaagc aaggaataag attacaggcc tgacagaatt + 4741 tttatcagga actacagact tatcacaagg gctttgtgat accaatatcg aaaatctctt + 4801 tgtaattcag gctggctctg tgtcaccgaa tccgacagct cttcttcaaa gtaagaattt + 4861 cactacaatg cttgaaacct tgcgtaaata ttttgactac atcattgtag atactgctcc + 4921 tgttggtgtc 
gtgattgatg cggctattat tacgcgaaac tgcgatgctt ctattttagt + 4981 gacggaggca ggtgaaataa atcgtcggga tattcaaaaa gcaaaagaac agttggaaca + 5041 cacaggaaag ccgtttttgg gaattgtgtt gaataaattc gatacttcag tagacaaata + 5101 cggttcttat ggaaattatg gagattacgg gaaaaataaa aaataggtcg ggggatagag + 5161 atgaatggaa aaatattaag gtcttcattg gccataatcc agagttttct tgttatttta + 5221 ttgacttatc tacttagtgc tgtgagagaa acggagattg tttcaacaac agctattgca + 5281 ctttatatcc tccattattt tgtcttttat atcagtgatt atggacagga tttctttaaa + 5341 aggagatatt tgattgaact tgtccagaca ttgaaatata tcctattctt tgcactagcg + 5401 attagtattt ctaatttttt cttagaggat cgatttagta tttccagacg aggcatgatt + 5461 tacttcctca cattacatgc tctcttagtc tatgtgctaa acctatttat caagtggtat + 5521 tggaagcggg cttatctcaa ctttaaagga agtaagaaga ttctcctact tacagcaact + 5581 tctcgtgtcg aaaaggtact ggatagatta atagaatcaa atgaggttgt tgggaagttg + 5641 gtagccgtca gtgtcttaga taaaccagat tttcagcatg attgtttaaa ggtagtagca + 5701 gagggggaga tagtaaactt tgcgactcat gaggtggtcg atgaagtctt tatcaatctt + 5761 ccaagtgaaa aatacaatat tggagagctt gtttctcagt ttgaaacgat gggaattgat + 5821 gtaacagtta atctaaatgc ttttgatcgt agtttggcac gtaacaagca aattcgtgag + 5881 atggcaggat taaacgttgt gactttttct acaacatttt ataagactag tcatataatg + 5941 gctaagcgga ttattgatat catgggtgca ttggtagggc tgatactatg tggtttagtc + 6001 agtattgtac tggttccttt gattcgaaag gatgggggct ctgctatttt tgctcagacg + 6061 cgtataggaa aaaatggtcg tcagttcact ttttataagt ttcgctctat gtgtgtagat + 6121 gccgaggcga aaaaaagaga actcatggaa caaaatacca tgcagggtgg aatgtttaag + 6181 gtggacgatg atcctcgtat cacgaaaatt ggtcgtttta tacggaagac tagcttggac + 6241 gagctaccac agttttataa tgttctaaag ggagatatga gtttggttgg cacacggcca + 6301 ccaacagtgg acgagtatga acactatacc ccagaacaaa aacgtcggct aagttttaaa + 6361 cctggtataa caggcttatg gcaggtcagt ggacgaagtg agattaagaa ttttgatgaa + 6421 gttgtcaaat tagatgtagc ctatatagac gattggacaa tttggaaaga tattgagatt + 6481 ttattgaaga cagttaaagt tgtattgatg aaggatggag cgaagtagat tgatagatgt + 6541 aaaaatcatt gtggcaacac ataaagaggt 
taaaatgcct caagacaata gtctttacct + 6601 tccaatacat gttggaagag acggtaaatc agatattggt tttatcggtg ataatactgg + 6661 cgataatata tcctctctaa atccatatta ttgtgagttg acgggacttt attgggcatg + 6721 gaagaatctt gattataatt acttaggtct agttcattac cgtcgttatt ttacaaataa + 6781 atctcaaggg tataatgaaa atgtcaatat ggatgacgtc attttgtctc gatctaatgt + 6841 tgaaatatta ttagagaaat ctgacgtaat agttccaaag aagcgaaagt attatattga + 6901 aactctttat tcacattatg cccataccct taacggagaa catctggatc ttgctaggaa + 6961 aattattgag caaaatagtt cagagtatct ttcatccttt gataaagtga tgaaacaaag + 7021 aagcggttat atgttcaata tgtttatcat gaaaaaagga ctattagatg attatttacc + 7081 gtggcttttt tctattctgg atactatgta cgaacagatg gacttgaccg actatacttc + 7141 atttgagtca cgtttattcg ggcgagttag tgagttgttg tttaatgttt ggttatgtaa + 7201 aaaaggaata acgcctaaag aggtaccatt tatgtacatg gagagagtgg atttgtttga + 7261 aaaaggaaaa tcttttttaa tggctaaatt ttttggaaag aagtatggac agagtttcta + 7321 ggagggaata tgaaaatcac tatcaaaagg tattcactgc cagaaatttt aggattagca + 7381 gcattagcta tattcctact attttcgtta ttaagtataa ctctttatgc ccaatatata + 7441 tctattaaag tatattttat tgcacttttt ggcattattt tattaatatt tctgaaggaa + 7501 cttatatctg agagttataa tcttaaatct gtgattggat tattcgtgat ttttactctc + 7561 tgcttcatca taggtaccgt cacgaattac gcatactttt ttattttagg tctgtttttg + 7621 atttatagtc ttagaaatct ccctttttca gacgtagcca aagtctcctt tatcattagt + 7681 attagtgtat tgctcctagt agtattgagt agtaagcttg gtattattcc tgattatatt + 7741 gagatttcgc ctaccagagt tagacactat cttggtttcc gatattcatt acttccatca + 7801 acgcttatga tgaatatcat agctatatca ttttttttaa agcaagaaaa cgcttcatat + 7861 ccgcgtcttc ttgtattgtt tttactttca ggatggttat acgtagaaac agattcacgt + 7921 ttgactttta ttaattcgtg tttgtttcta ctggttaatt taataatgaa attgtcacct + 7981 tccatcattg aaaaggtagg gagactgtta aaactttttt cgttcaccta ctttattaat + 8041 gcctgtttga gttactggat tgcgaagact tacttaaaca cctcaaatgt tgttttgaat + 8101 caattctttt accaagcgga tcaatttctt ggaggacgta tttattattc taatcgttcg + 8161 ttatctttat atggatataa gttgttaggt caaaagattg attggattgg 
aaatggcttg + 8221 agcatacaag gggagcgtag cacagaaaca tatttgtatg tggataattt atatatccag + 8281 attcttcaac attttggttt gatagtttcg gtaattattt taagtctatt aactataact + 8341 ttagtaaagc ttttgaaaaa ggggcagatg gtattaggaa ttattttagt tattttgagt + 8401 tttcatgctt taattgatga tttgatacta aatctatatt ataatatctt ttgggttttg + 8461 ataggaatgt tgatatataa aaaatatcaa ttttatgata aaaagcagtt gacaatagaa + 8521 taagaagcaa gcattggaaa tagacattca gatatgtaca agaaaactcg atttaagttt + 8581 tttggtaaaa tttttaaaat taagttgtaa aatggatatc aaaatctcac cttttttgta + 8641 ggtgtgatta aacagaggga tattagatag gaaaataatg aataagatta atttaactga + 8701 taatttaccg ttaatttcag ttgttttacc agtatacaac gtagagaatt atttagaaaa + 8761 gtgtttgaat tctgttgtga gacagacgta taaaaacata gaaattataa tagtaaatga + 8821 tggcagctta gattcttcaa tagatatttg taataagtat gcaaataaag atagtcgaat + 8881 taaagtattt acaaaaccta atggaggttt gtctgatgct agaaatttcg gtgtcaaaaa + 8941 atctatgggt gagtttataa cattcgttga ttcagatgac tatgttacag atgattatgt + 9001 agaatatttg tatagcttag tcaaaaaata taattgtaaa atgtcaatgt gttcaatatt + 9061 tgtccattat atttctaatg ataaaatgat caataatggg acaggaagag aattgatgat + 9121 gacagcagag cagtgtattg aaaaaatgtg ctatcatgat gaggtggata catgtgctta + 9181 tgcaaaatta tatcatagaa gtctatttag tgaaatatgc ttccctaaag gaaggatatt + 9241 cgaagatatt ggaacaattt atcgcttttt tggtactgct gggcagattg cctgtggttt + 9301 taacgcaaaa tattattatg agattcggga aaattcgatt gttacatcat catttagtga + 9361 aaaaaaattt gatttgttat ttatgacaga tcaaatgcga aattttgttg atcaacgtta + 9421 tccatctttg aaagctgcaa caaaacgtcg agctgtctat gcaagattta gtacccttaa + 9481 ccaattatta gatgtacaag gatataatga agaaaaaaaa gaaataattc gttttatcca + 9541 agacaacaag gaagcgttac ttgaaaatcc taagactcct aagcgggata gattagctgt + 9601 tagagctctc tcccttggat tttgcattta taaattgtta tggaagcaat atctaaaaat + 9661 tcaaagaggt tagtatgaat aaagaatttt tgaagtatat ttatattcga ttattaagaa + 9721 atttaaggag aattttcttt attatcccga taataaggaa tagagttgtt tttgaatctt + 9781 tctcaggaga tgcttatagt tgcaatccta aatatatttc tgaagaatta agaaaacagt + 9841 atggtgattc 
tgttgaaatt atctgggctt ttaatgatcc aaacaaattc aaaaaagaat + 9901 taccaaagga gattgtgact tgtcgttacc gtagtttcaa tcatctgatc tatagaatca + 9961 cttcaaaagt ttatgtttgt aatttcctgc aagcaattga aattccaaag cgtaaaggac + 10021 aactagagat tcaaacttgg catggaggag gttgctataa aaaagttggg gtggctgaaa + 10081 aaggacgcca ggctgcttat gttaaacgac aacggatgca cgttgaagaa acagatctct + 10141 ttattacaag tagtaaatat tttgaaaatg aggtagtaaa aaaacaattt gggtataagg + 10201 gagaaatttt atctattggt atgcctcgaa atgatatttt aataaattta ccaatttcaa + 10261 gtcaagttga gaaattaaag gagaaattgg gattaccaaa caataaattg atagcacttt + 10321 atgctccgac ctggagatca ggtactaaac agtatgaaac acttgatata aaaaaactta + 10381 ctcaagccgt tgataaaaaa tttggtaaaa aatgtatcgt tcttttcaga tcgcatctat + 10441 atggaaatca atcttatgat gatgttgtgg atgtctctca gtatagtgat atgcaagaat + 10501 tattgttgct ttcagatata ctgattactg actattcttc gtctatgtgg gatttctctc + 10561 tctcttttaa accgtgtttt ttatataccc ccgatttgaa ggattatcta gatgaaagag + 10621 gttttgatga agatatacat tcatggggat tttcagtttc tgaatcaaat aaggaactag + 10681 ttgaaaatat tttacagttt gataatgaag aatatagaca aaaaatgaag aatcatcatc + 10741 agtttttaga atcttatgaa caaggagatg cagcgaaaag agtcgtggcg aagattgctg + 10801 aatattgtaa tttatataga ggatagataa tgaaaaaaat tgcttatttg atcaaaagat + 10861 atggtgtgaa aaatgtggtt ttacgtgcta ttaatgatgt tctaccagtc aatctcatct + 10921 ttcccagtca acaactcaga cgtttgaatt ggcaagaaaa agtcaaaaag aagttaaaaa + 10981 aatatgtagt tatttcggat tcaatcaaga gtgaggagga atgcgatatt atctggtggc + 11041 tatggtttca aggacttgat aatgcaccag ctattgtgaa aaaatgtaga gagtcggtag + 11101 ataaatatgc taaacgcagt ggcaaaaggg ttattgagtt aacatctcaa aatttatttg + 11161 aatatattga ggtacctaac gaactctatg tgaaatataa gtcaggtagt ttgccactag + 11221 ctttattttc agatttttgt cgaattagcc ttctttctaa ctatggagga ttatggattg + 11281 attcaactgt tctaattacg ggggaaattg aagatgagat attgaaccaa gatattttta + 11341 tgtttcaagc ttctccttta gactattcag ttactaaaat cagtaattgg atgttatatt + 11401 caaaatatcc aggacacccg ttcatatcat cgatacgtga tactttgatt tcattttata + 11461 ataagaataa 
tacgatccca gattattttt tatttcattt acttgtttcc tgtttaatag + 11521 atgataatag gataaatcaa agtttttatg atatggatta ttataccaat acctatcctc + 11581 acttattagg gagagttttg agcgaaccat atgatacttt gaaatttgaa aatattttaa + 11641 ggaaaacgtc tattcataaa ttatcatata aaaatttaga taatgttgct gaagatagct + 11701 tttataatgc tattttaggt ttagatttta gttagtaata aagaggagag aaatgaattt + 11761 agcagttatt tttgctggag gctccggtac gcgaatgaat gcaaaggata gacctaagca + 11821 gtttcttttg gtacatggta agccaattat tgttcacact attgagctat ttgagaacca + 11881 tccagagatt gatggaatta tcgttgtttg tattgaagat tggattccgt atatggagga + 11941 gatgaaatat tgctatagat tagataagat tgctaagatt gttccagggg gggcaactgg + 12001 tcaattatct atttataatg gtttagtcgc ggctgaacaa ctttatggaa tagaggataa + 12061 tgttgtgtta atccatgatg gagtccgtcc tttaattaca gcagacacta tttcagataa + 12121 catccaatcc gtaaaagaaa agggaaatgc tattacttgt acagtggcca aagaaacagt + 12181 tatcttagta gatgatgaaa ataaggtaga cgaagtgcct agtcgtgaac attcgcgatt + 12241 tgccaaggct cctcagagtt tttggctaaa agatattcta ggtgcacatc gagcctctgt + 12301 agataatggt agaaataatt ttattgattc atgcaccatg atgagatatt atggtcatga + 12361 tttacatgtt gttgttggtc cgtatgagaa tattaagatt acaacgcctg atgattttta + 12421 tacatttagg gctttgtacg atcttcgtga gaataagcaa ctaaaataat gaggaaaaga + 12481 tgaagtattt tgttgaagaa acgttacttg atgaacagga taaaaaaaat gcgggtggaa + 12541 aggctagaca agacgtcact gatattttag agtccatagg ttatcagaag ttaatagctg + 12601 agtccgaaat gaatgaacgt caggaattaa atgctgttca aagattggtt catcattata + 12661 aagttaagaa aatgtggaag aaaactcttt cagttgttgg taagggtgat gaagttatta + 12721 ttcaatttcc tttactaaat catagtttat tctttaatca ggttattaag caacttagta + 12781 agaatggagt taaagtttat tttttgattc atgatttaga atcgttgcga tggtcgcagt + 12841 caaaatcgat atcattaaaa agtaggattc gattaaacat tgaagaacat agtgttttaa + 12901 ggttatcaga aggcattatt gctcataata aaaaaatgaa atcttatatt aagacctact + 12961 ctgttgaaag ttctaaaatt attcctcttg aaacttttga ttatattatt ccatcttatc + 13021 atgaaagaaa aaatctggat aactttcagt taaatgctcc aattgttatt gctggaaatt + 13081 taaagcaaca 
taaagctgga tatgtctatc atttaccaag caatgtggag tttaatcttt + 13141 atggaattgg atatgaacag acagatgaca aaagtgtgca ctactgtggt tcttttatgc + 13201 cagaagaatt accattcgtt ttaaaaggaa gttttggatt ggtatgggat ggtccgtcat + 13261 cagagtcttg tatagaaact tatggagagt atcttcgtgt aaacaaccct cacaagactt + 13321 cactatattt agcttcaggc ataccagtag ttgtatggtc agaggcagca atagctagtt + 13381 tcattaagga gaataattgt ggtattcttg tatccaatct gagtgaacta cctgagttac + 13441 tttctatgat taccgttgat gaatatgaat tgatgaaaaa gaatactgag attattggag + 13501 aaaggcttcg acaaggtttt tatactaaac aagcagttaa aggtttctag actggaggaa + 13561 gtgtaatgat tgaaagtttt aatgataaag tgttgcagga agatttagag ataattgcaa + 13621 aagaagagct cccatttcga aaatttagaa attcaactgt ttttatcacg ggagtaacag + 13681 gtttagtagg ccttcaatta tttaaggctt tggcttgtat caatagagtc catcagttga + 13741 atatgaaaat tattggtcta gtcagaaatt tggataaagc agaaaaaatt tttggagatt + 13801 tattgaaacg gaaggatata caaatagttt taggagatgt ttcggaagat ttccactcgt + 13861 atatccctga tggtttagtt attgactata tcattcacgg agcaagcgtg actacctcta + 13921 aactcatgat tgaatttcca gtagatacaa ttcgagtagc ttttaatgga acgtatcaaa + 13981 tgttagaatt ggcaaaagaa aaaaaagtga aaagttttgt atatctttct tcaatggagg + 14041 tatatggtag ctttcagtca gatagaacaa ctgttgtaaa cgagaatatg ttagggtatc + 14101 ttgatttgac atctgttcga acaaattacc cagaatgcaa aagaatttgt gaaaatatgt + 14161 gcattgcatt tctaagtcag tatcaagtcc cggctaagat tgctcgtcta tcccagacct + 14221 ttggtgcagg cactctaccg ggtgaaaata gagtatttgc tcaatttgct cgtagtgtta + 14281 tgcaagggaa agatattgtt ttacatacgt tagggcaatc agaaggaaat tactgctaca + 14341 cagctgatac tgttgttgca ttattaacaa ttctattgag aggagaaaat ggggaggctt + 14401 ataatattgc taatgaagag agtcatacaa caatagcaga tatggcaaaa atggtaactt + 14461 cgcaattctc tcaaacgagt caagtggttt ttgatattcc gaagaaaaat atatttggtt + 14521 atgctgtaga tactaaaatg aagttatcaa cacacaaaat tcaacaattg ggttggaagc + 14581 cgagggtctc tcttgtagat gcttatgatc gaatgatgag aagtatgaat gaaactgggg + 14641 tatagataac tatatgaagg tattaaaaaa ctacttatat aatctctctt atcaactatt + 14701 agttattatt 
cttcctatca ttacgactcc ttatgtgacg cgcatatttt cttcagatga + 14761 tttagggaca tacggttact tcaattccat tgttacctac ttcattttac ttgctactct + 14821 gggtattgct aactatggaa cgaaggagat atctgggaat aggaagagta ttcagaaaaa + 14881 tttctgggga atatatactt tacagtttgg agcgactact ttttccattt ttctctatat + 14941 actagcctgt cttttcatcc cagggatgaa aaacctagtt gcatatatct tgggattggg + 15001 tttagtctct aaaggactag atatttcatg gttgtttcaa gggttagaag attttcgtaa + 15061 aattacggtc agaaatatca cagtgaagct tgttggtgta agtgccattt tcttgtttgt + 15121 aaaatcagcg agtgatctat acttgtatgt ttttcttcta acagcatttg aattgttggg + 15181 tcagttaagt atgtggtttc cagcccgtga atatattgga aaaccacatt ttgatataga + 15241 atatgctagg catcatctga agccagttat cttgctattc ttaccacaaa ttgctatctc + 15301 gctttatgtg actttagatc gtacaatgtt aggggcgcta gcttctacaa aagatgtcgg + 15361 catttatgat caggctttga agctggttaa tattttactg accttggtaa cttccttggg + 15421 aagtgttatg ctgccacgcg ttgcgcattt gttagcgaca ggtgatcata aggtagtcaa + 15481 taagatgcat gaggtatcct tcttaattta taatttggtt atttttccga ttatggcagg + 15541 gatgttgatt gtgaatgatg attttgttca atttttcctt gggcaagact ttcaagatgc + 15601 acgctatgca atttccatta tgatcttccg tatgttcttt atcggttgga ctaatataat + 15661 gggaattcag atactgatac ctcataatca aaataaagaa ttcatgattt caacaacaac + 15721 tcccgcaatt atcagtgtag gtttgaactt actattcctt cctaaactgg gatatatcgg + 15781 ggcagccatt gtctctgttt taacagaggc acttgtatgg gcaatccaat tattctatac + 15841 tcgcagatat ttaaaagaag ttcctataat cggatcaatg tcaaaaatta tactagcatc + 15901 tgccattatg tatggccttt tactaagttc aaaaacagtt atacattttt caccgacctt + 15961 aaatgttcta gcatttgtag cgcttggtgg aatcatttat ctttttgcaa ttctatctct + 16021 gaaagtggta gatgtgaaag aattaaaaca aattattagg aaaaactaga atgagaaaaa + 16081 atcgaaatat caacctagat ttactaaaag tgcttgcatg tgttggagtt gttttacttc + 16141 atacaacaat gggcggattt aaagagacag gttcatggaa tcttttggca tatttatatt + 16201 atttaggtac ttactctatt cccttgtttt ttatgatcaa tggttatttg ttgttaggca + 16261 agagggagat aacttatctt tacatactcc agaaagtaaa atggatttta ataacagtgt + 16321 catcatggtc 
atttatcgta tggcttttta agcgtgattt tacaactaat cctattaaaa + 16381 aaattgtagg ttctttgata caaagaggtt atttctttca gttttggttt ttcggtgcac + 16441 tcatacttat ctatttatgt ttgccaattt tgagacaatt tctaaattca aaaagaagct + 16501 atttatacag tttatcttta ttgatgacta ttggtttgat ttttgagtta tcaaatatcc + 16561 tacttcaaat gccaatacaa acatatgtaa tacaaacttt tagattatgg acgtggtttt + 16621 tttactatct tttaggtggt tatatagcgc aattcactat agaagaaatt gaatcaaggt + 16681 ttaagaattg gatgaaaata gttagcatac ttttgttatt gatttcacca ataatattat + 16741 ttttcatagc gaagactata taccataatc tatttgctga atacttttat gatactttat + 16801 ttgtaaaagt cagtacttta ggaatttttc taactatcct catgcttact ttgaatgaaa + 16861 accgaagaga atcgattgtt tccctttcta atcaaacaat gggggttttc ataatacata + 16921 cttatattat gaaagtgtgg gaaaaagtgc ttggttttaa ttttgtagga gcatatttac + 16981 tttttgctct atttacttta agtgttagtt ttattattgt tgggatgtta atgaagattc + 17041 cttacttcaa tcgaatcgtc aaattataaa aaggagaaca agatgtacga ttatcttatt + 17101 gtcggtgctg gtttgtcagg agcaattttt gcttatgagg cgaccaagcg tggaaaaaaa + 17161 gtaaaagtga ttgataaacg taaccacatt ggtgggaata tctactgtga gaatgtagaa + 17221 ggagttaatg ttcataaata tggtgcccat atctttcata cttctaataa gaaagtttgg + 17281 gattatgtta atcaatttgc tgaatttaac aactacgtca actcgcctgt agctaattac + 17341 aagggtagcc tctataatct acctttcaat atgaatacct tctatgctat gtgggggaca + 17401 aaaactcctc aagaagtcaa agataagatt actgagcaga cagctgatat gaaggatgtt + 17461 gagccgaaaa atctggaaga acaggctatc aagttgattg gtccagatgt ctatgaaaag + 17521 ttaatcaagg gttatactga aaagcagtgg ggacgctcag caacggaact tcctccattt + 17581 atcattaaac gtcttccagt tcgtttaaca tttgataata actattttaa cgaccgttac + 17641 caaggaattc ctattggtgg ttacaatgtc atcatcgaaa atatgcttaa agacgttgaa + 17701 gttgagcttg gtgttgattt ctttgctcat cgtgaagagt tagaagcatc agctgaaaaa + 17761 gttgtcttta cagggatgat cgaccagtat tttgactaca agcacggaga gttagaatac + 17821 cgtagccttc gctttgatca tgaaattttg gacgaggaaa attatcaagg aaatgctgta + 17881 gtgaactata cggagcgtga gattccttat actcgtatta tcgaacacaa gcattttgaa + 17941 tatggaacac 
aggcaaagac agttatcacg cgtgaatatc cagctgactg gaagcgtggg + 18001 gacgagcctt actatccgat caacgatgag aaaaataatg ctatgtttgc taagtaccaa + 18061 gaggaagctt caaagaatga taaggttatt ttctgtggac gtttagcaga ttataaatat + 18121 tacgatatgc atgtggtgat tgaacgggcg cttgaggttg tggagaaaga gtttggatat + 18181 gacaaaaagt agaatcaatt ggatagattt tggaaaaggc ttttccatat ttttagtctt + 18241 agcaggacat gtgttgcttg gactgtatca atcggaaaaa tttcccacag caaataacat + 18301 actatcgttg ttgatagcac aagtctacat atttcatata ccagtatttt ttgccttatc + 18361 aggatacttt ttcaaacctg tgtcggattt gaaggagttc tggcaatatg ctaaaaagaa + 18421 gacaattgtt tttggtctgc catatatttt ctattcgatc attcactttg gtcttcaaaa + 18481 agttgcaggg gcatctgttc gtgttcctac aaccatatct gatttgctaa atatctataa + 18541 acatcctctt ggagtttcat ggtatttata tatactctgg tcgattttga taatctatgg + 18601 attattgtct attttagtca aaaatcgtag aatgttattt ttgataagtg ttttcgctta + 18661 ttgtttaacc ctatttgttc aaacagatat ttatattatt caaagaacgc tagtttgggg + 18721 gatttgtttc tttcttggca gtgtattgag tgaaattcac tttgataaaa ttaatttgaa + 18781 aaaatttctt tttttctttg tgttatttga ttttatttat atgttcgctt ggttcttgtt + 18841 ttatgaagta gggtctaaga aggattatgt aagctatatt aacccaggtt tgtgggggat + 18901 tgcttttatt gtctgtgtat tagttgcttt tgcgattttt cctaaaatgg agaaaaattt + 18961 tcctaaaact ttcctatatt tcactaaata cgggaaagat agtttaggga tctatattct + 19021 tcatgcacca atttgtagca tgattcggat tctaatgttg aaagtgggaa taaactcagt + 19081 ttttcttcac gttgttgttg ggattgtgct aggctggtat ttatccatac tagcaactta + 19141 tatattgaaa aaaattccat ttttgaatat tgttttatta ccacaaaagt atattaaatt + 19201 aaaataaatt attttagatt tataatgtgg ctctttgtca actaacatct ggagaggaca + 19261 atcactgtct tctctttttt tgtcttttca gaatatacca aattaacaca aaaattctga + 19321 aaattctgtt gacatctttc tgaaaagagt ttataatgga gagaaagttt taaaggagaa + 19381 aatgatgaaa agttcaaaac tatttgccct tgcgggcgtg acattattgg cggcgactac + 19441 tttagctgca tgctctggat caggttcaag cactaaaggt gagaagacat tctcatacat + 19501 ttatgagaca gaccctgata acctcaacta tttgacaact gctaaggctg cgacagcaaa + 19561 tattaccagt 
aacgtggttg atggtttgct agaaaatgat cgctacggga actttgtgcc + 19621 gtctatggct gaggattggt ctgtatccaa ggatggattg acttacactt atactatccg + 19681 taaggatgca aaatggtata cttctgaagg tgaagaatac gcggcagtca aagctcaaga + 19741 c +// + diff --git a/public/res/serotype_genbank/serotype_35D.gb b/public/res/serotype_genbank/serotype_35D.gb new file mode 100644 index 0000000..e4b3e80 --- /dev/null +++ b/public/res/serotype_genbank/serotype_35D.gb @@ -0,0 +1,528 @@ +LOCUS KY084476 15484 bp DNA linear BCT 07-MAR-2017 +DEFINITION Streptococcus pneumoniae strain 3431-06 cps gene locus, complete + sequence; and AliA (aliA) gene, partial cds. +ACCESSION KY084476 +VERSION KY084476.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 15484) + AUTHORS Geno,K.A., Saad,J.S. and Nahm,M.H. + TITLE Discovery of novel pneumococcal serotype, 35D: a natural + WciG-deficient variant of serotype 35B + JOURNAL J. Clin. Microbiol. (2017) In press + PUBMED 28202800 + REMARK Publication Status: Available-Online prior to print +REFERENCE 2 (bases 1 to 15484) + AUTHORS Geno,K.A. and Nahm,M.H. 
+ TITLE Direct Submission + JOURNAL Submitted (03-NOV-2016) Medicine, University of Alabama at + Birmingham, 845 19th Street South, BBRB 614, Birmingham, AL 35226, + USA +COMMENT ##Assembly-Data-START## + Sequencing Technology :: Sanger dideoxy sequencing + ##Assembly-Data-END## +FEATURES Location/Qualifiers + source 1..15484 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="3431-06" + /serotype="35D" + /db_xref="taxon:1313" + /geo_loc_name="USA" + /note="Active Bacterial Core Surveillance; Centers for + Disease Control and Prevention; invasive pneumococcal + disease" + misc_feature 53..14807 + /note="cps gene locus" + gene 53..1507 + /gene="wzg" + /gene_synonym="cps35bA" + CDS 53..1507 + /gene="wzg" + /gene_synonym="cps35bA" + /note="Wzg" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein" + /protein_id="AQS23540.1" + /translation="MLIMSRRFKKSGSQKVKRSVNIVLLTIYLLLVGFLLFLIFKYNI + LAFRYLNLVVTALVLLVALVGLLLVIYKKAEKFTIFLLLFSILVSSVSLFAVQQFVGL + TNRLNATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNT + DLTVNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKV + EAPKTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPI + ADGGNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGIDVY + NDQEFTAHTNGKYYPAGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKL + TSTEALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDL + PSYAMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + gene 1509..2240 + /gene="wzh" + /gene_synonym="cps35bB" + CDS 1509..2240 + /gene="wzh" + /gene_synonym="cps35bB" + /note="Wzh" + /codon_start=1 + /transl_table=11 + /product="phosphotyrosine phosphatase" + /protein_id="AQS23541.1" + /translation="MIDIHSHIVFDVDDGPKSREESKALLTESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDRGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEQDLVHIIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + gene 2246..2941 + /gene="wzd" + /gene_synonym="cps35bC" + CDS 2246..2941 + 
/gene="wzd" + /gene_synonym="cps35bC" + /note="Wzd" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein" + /protein_id="AQS23542.1" + /translation="MMKEQNTIEIDVFQLFKTLWKRKLMILIVALVTGAGAFAYSTFI + VKPEYTSTTRIYVVNRNQGDKPGLTNQDLQAGSYLVKDYREIILSQDALEKVATNLKL + DMPAKTLASKVQVTVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIELLDTRVKRPEDVEDVLKI + PLLGLVPDFDKIK" + gene 2951..3640 + /gene="wze" + /gene_synonym="cps35bD" + CDS 2951..3640 + /gene="wze" + /gene_synonym="cps35bD" + /note="Wze" + /codon_start=1 + /transl_table=11 + /product="tyrosine kinase" + /protein_id="AQS23543.1" + /translation="MPTLEISQAKLDSVKKAEEYYNALCTNLQLSGDGLKVFSITSVK + IGEGKSTTSANIAWAFARAGYKTLLIDGDIRNSVMLGVFKARNKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFTTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRNCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGIVLNKFDTSVDKYGSY + GNYGDYGKNKK" + gene 3655..5022 + /gene="wchA" + /gene_synonym="cps35bE" + CDS 3655..5022 + /gene="wchA" + /gene_synonym="cps35bE" + /note="WchA" + /codon_start=1 + /transl_table=11 + /product="UDP-glucosyl transferase" + /protein_id="AQS23544.1" + /translation="MNGKILRSSLAIIQSFLVILLTYLLSAVRETEIVSTTAIALYIL + HYFVFYISDYGQDFFKRRYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYF + LTLHALLVYVLNLFIKWYWKRAYLNFKGSKKILLLTATSHVEKVLDRLIESNEVVGKL + VAVSVLDKPDFQHDCLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + IDVTVNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHIMAKRIIDIMGALVGLIL + CGLVSIVLVPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVLM + KDGAK" + gene 5009..5815 + /gene="wciB" + CDS 5009..5815 + /gene="wciB" + /note="WciB" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="AQS23545.1" + /translation="MERSRLIDVKIIVATHKEVKMPQDNSLYLPIHVGRDGKSDIGFI + GDNTGDNISSLNPYYCELTGLYWAWKNLDYNYLGLVHYRRYFTNKSQGYNENVNMDDV + 
ILSRSNVEILLEKSDVIVPKKRKYYIETLYSHYAHTLNGEHLDLARKIIEQNSSEYLS + SFDKVMKQRSGYMFNMFIMKKGLLDDYLPWLFSILDTMYEQMDLTDYTSFESRLFGRV + SELLFNVWLCKKGITPKEVPFMYMERVDLFEKGKSFLMAKFFGKKYGQSF" + gene 5824..7053 + /gene="wzy" + CDS 5824..7053 + /gene="wzy" + /note="Wzy" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase" + /protein_id="AQS23546.1" + /translation="MKITIKRYSLPEILGLAALAIFLLFSLLDVSFYVQYISPMLYKA + AIFLIIMLIILKEFVSGSNSFESLLGLLGVSTLYFIIGSVTSYTSFIVLGLSLIYSLR + DIPFSKVVKVAFIISVAMLFLVILSSKIGFIPDYIEFSSTRVRHYLGFRYSLFPSTIM + MNIIAISFFLKQETVSYQRLFILFLVSMYLYLETDSRLTFISSSLLLLANLAMKLIPT + VIEKFSLLLKFFTLTYFVNAYLSYWISKNYLRTSNALLNHFFHQADQFLGGRIYLSNR + SLSLYGYGILGQKIAWVGNALNAQGERSTDAYLYVDNLYIQILQHFGLIALIIILSLL + TATLVKLLRKGQIVLSIIIVSLSFHALIDDLILSIHYNIFWILLGSLIYSNYQFSEER + YGEVENDSLRRTVREGY" + gene 7065..8189 + /gene="wcrJ" + CDS 7065..8189 + /gene="wcrJ" + /note="WcrJ" + /codon_start=1 + /transl_table=11 + /product="putative glycerol phosphotransferase" + /protein_id="AQS23547.1" + /translation="MNNRDGKYYIGLVMKIITNPLKILKIKKRRVLLKSYNAETISCN + PKYIYNELKKINRYELVWVLKEPEKYPDVKAVKYMSLKWLYYIVTSQYVISNTGFNFW + LPKKKKQIYINTWHGGGAYKDSDNLNNISKAQVKQIKKSAELEDYFISSCAVFTKEYA + KKRVGFKGKILEIGTPRNDFLIRNQADDGLKNSIKNRLGIDDNCSIVIYAPTWRDDAS + AIEEIDYESLLESLRETYPKVSILVRGHHLQKNLIDIKNSNIVNVSDYDDMQELLLIS + DLLITDYSSTIWDMIHGGKKVLLYTPDLDEYLKYRGFHVDIKEWNIPYFKTNEELIAY + ISSNYFKNMEEMIENHKIRFGSFEHGNATQKIVELLEEGN" + gene 8190..9170 + /gene="wcrM" + CDS 8190..9170 + /gene="wcrM" + /note="WcrM" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="AQS23548.1" + /translation="MKVSVIIPVYNVEKYLRRCLDSVVNQTYKDIEVILVNDGSPDNS + KEICEEYVAKYSNIQLINQKNAGLGAARNTGLQYITGNAVTFVDSDDWLELDAIEYYV + ASMKKSDADIVVTQMIRKKEYFSNEGTNGTTIKEEVLNQEQFAKKYFKIDGNNIEYYA + CAKLYKREIAREVKYPVGLFAEDVPAAFGYIIRSQKIFYSTKVTYNYFFNDNSLTAKF + TDKDFDLEKIWDLVVEEAKVYGNEDYILYAKVNRYRIDFNLLCRIALSENKSDIEKYS + QEIVVLLGKVKENKKILLKYLPFSRKVIFRLFIVDYTLGRNVLRMFKNIV" + gene 9191..10264 + /gene="wcrH" + 
CDS 9191..10264 + /gene="wcrH" + /note="WcrH" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="AQS23549.1" + /translation="MIEMYYFIKVEKDLKNTAGIKAPDDIEKISEELGMKEIRFPKFP + FEKNKVIQKLWLFCVVGYNWISLLWRLKKNDVVIYQHPMYGVRVANFAIPLLKKYKNI + KFISVIHDLESLRKGIQGVIEDNETTNAIADKELLSKFDKVISHNPKMTEYLEGIGIK + KENLVELQIFDYLDPSEIEEKIEDGVVIAGNLAKGKSSYIYKLLENELNFKLNLFGPN + FINEELPENVEYFGSLPPNKLPQKLVGKFGLVWDGDSLETCSGNTGNYLKYNNPHKTS + LYLASGIPVIIWKEAALAQFIEENNVGITVNNLSEIEFVMQNISEGEYLSIKRNTMQL + GEKLRNGYFYRQAISKCKNDFMK" + misc_feature 10510..11232 + /note="similar to IS1381 transposase; similar to INSD + accession CR931705" + gene 11276..12691 + /gene="wzx" + CDS 11276..12691 + /gene="wzx" + /note="Wzx" + /codon_start=1 + /transl_table=11 + /product="flippase" + /protein_id="AQS23550.1" + /translation="MKVLKNYAYNLSYQLLVIILPIITTPYVTRVFSSNDLGTYGYFN + SIVTYFILLATLGVANYGTKVISGHRKEIEKNFWGIYSLQLGATVFSLTLYCLLCLTL + PFMQNPVAYILGLALVSKGLDISWLFQGLEDFRKITVRNITVKFVGVISIFLFVKSAD + DLYLYVFLLTIFELLGQLSMWVPAREFIGRPHFDLEYARHHLKPVILLFLPQVAISLY + VTLDRTMLGALASTKDVGIYDQALKLVNILLTLVTSLGSVMLPRVSNLLSSGDHKAVN + KMHEISFLIYNLVIFPIMAGMLIVNDDFVTFFLGQDFQEARYAIAIMIFRMFFIGWTN + IMGIQILIPHNQNKEFMLSTTIPAIVSVGLNLLLLPKFGYIGAAIVSVLTEALVWAIQ + LYYIRAYLKDVPIIRTMIKIILASAIMYSVLLVSKTYIHFSPTINVLVFVVLGGIIYL + FSVLSLKVVDVIELKQVIRKN" + gene 12693..13691 + /gene="wciG" + CDS 12693..13691 + /gene="wciG" + /note="WciG" + /codon_start=1 + /transl_table=11 + /product="putative integral membrane acetyl transferase" + /protein_id="AQS23551.1" + /translation="MHKFKDINLDLLKVIACVGVVLLHTEMGGFKETGSWNFSTYLYY + LGTYSIPLFFIVNGYLLLGKKEITYSYILQKVKYILITVLSWTFIVWLFKRDFSVNPI + KKLIGSLVQKGYFFQFWFFGALILIYICLPVLKQFLNSKRSYLYFLSVLLVIGLIFEL + TNIVLQMPIQTYVIQTFKLWTWLFYYILGGFISQFDKNTIKNGFKRWMKVIAVLLLLV + SPFILFFITKTTYHNFFAEYFYDILLVKVVSVGIFLTIFSIVLNENSNKWIIFLSNQT + MGIFIIHTYIMKVWEKLFGFNFIGSYLLFAIFTLSVSFIIVGMLMKIPYFNRIVKL" + gene 13992..14807 + /gene="glf" + CDS 13992..14807 + /gene="glf" + /note="Glf" + /codon_start=1 
+ /transl_table=11 + /product="UDP-galactopyranose mutase" + /protein_id="AQS23552.1" + /translation="MNTFNKLWGVVTPAEAQAKIEEQRAILNGKTPENLEEQAISLVG + TDIYEKLIKDYTEKQWGKPTTELPSFIIRRLPVRLTYDNNYFNDTYQGIPIGGYTQIV + EKMLDHENIDVETNVDFFVNKEQYLKDFPKIVFTGMIDEFFDYKLGELEYRSLRFENE + TLDMENYQGNAVVNYTDAETPYTRIIEHKHFEFGSQAKTIITKEHSKTWEKGDEPYYP + VNNDRNNHLYKSYKKLADEQGNVIFGGRLGHYRYYDMHQVIGVALQCVRNELN" + gene 15125..>15484 + /gene="aliA" + CDS 15125..>15484 + /gene="aliA" + /codon_start=1 + /transl_table=11 + /product="AliA" + /protein_id="AQS23553.1" + /translation="MMKSSKLFALAGVTLLAATTLAACSGSGSSTKGEKTFSYIYETD + PDNLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKD + AKWYTSEGEEYAAVKAQD" +ORIGIN + 1 tgtagacatt accgtaaaaa agtgatataa tcgtatgatg ttcaatgtat aggtgttaat + 61 catgagtaga cgttttaaaa aatcaggttc acagaaagtg aagcgaagtg ttaatatcgt + 121 tttgctgact atttatttat tgttagttgg ttttttattg ttcttaatct ttaagtacaa + 181 tatccttgct tttagatatc ttaacctagt ggtaactgcg ttagtcctac tagttgcctt + 241 ggtagggcta ctcttggtta tctataaaaa agctgaaaaa tttactattt ttctgttgct + 301 gttctctatc cttgtcagct ctgtgtcgct ctttgcagta cagcagtttg ttggactgac + 361 caatcgttta aatgcgactt ctaattactc agaatattca atcagtgtcg ctgttttagc + 421 agatagtgat atcgaaaatg ttacgcaact gacgagtgtg acagcaccga ctgggactga + 481 taatgaaaat attcaaaaac tactagctga tatcaagtca agtcagaata ccgatttgac + 541 ggtcaaccag agttcgtctt acttggcagc ttacaagagt ttgattgcag gggagactaa + 601 ggccattgtc ctaaatagtg tctttgaaaa tatcatcgag tcagagtatc cagactacgc + 661 atcgaagata aaaaagattt ataccaaggg attcactaaa aaagtagaag ctcctaagac + 721 gtctaagaat cagtctttca atatctatgt tagtggaatt gacacctatg gccctattag + 781 ttcggtgtcg cgatcagatg tcaatatcct gatgactgtc aatcgagata ccaagaaaat + 841 cctcttgacc acaacgccac gtgatgccta tgtaccaatc gcagatggtg gaaataatca + 901 aaaagataaa ttaacccatg cgggcattta tggagttgat tcgtccattc acaccttaga + 961 aaatctctat ggagtggata tcaattacta tgtgcgattg aacttcactt cgtttttgaa + 1021 attgattgat ttgttgggtg gaattgatgt ttataatgat caagaattta ctgcccatac + 1081 
gaatggaaag tattaccctg caggcaatgt tcatcttgat tcagaacagg ctctcggttt + 1141 tgttcgtgag cgctactcac tagcagatgg cgatcgtgac cgcgggcgca atcaacaaaa + 1201 ggtgattgtg gctatccttc aaaaattaac gtcaaccgaa gcactgaaaa attatagcac + 1261 gatcattaat agcttgcaag attctatcca aacaaatatg ccacttgaga ctatgataaa + 1321 tttggtcaat gctcagttag aaagtggagg gaattataaa gtaaattctc aagatttaaa + 1381 aggtacaggt cggacggatc ttccttctta tgcaatgcca gacagtaacc tctatgtgat + 1441 ggaaatagat gatagtagtt tagctgtagt taaagcagct atacaggatg tgatggaggg + 1501 tagatgaaat gatagacatc cattcgcata tcgtttttga tgtagatgac ggtcccaagt + 1561 caagagagga aagcaaggct ctcttgacag aatcctacag gcagggggtg agaaccattg + 1621 tctctacctc tcaccgtcgc aagggcatgt ttgaaactcc ggaagagaag atagcagaaa + 1681 actttcttca ggttcgggaa atagctaagg aagtggcgag tgacttggtc attgcttacg + 1741 gggctgaaat ttactacaca ccagatgttc tggataagct ggaaaaaaag cggattccga + 1801 ccctcaatga tagtcgttat gccttgatag agttcagtat gaacactcct tatcgcgata + 1861 ttcatagcgc cttgagcaag atcttgatgt tgggaattac tccagtcatt gcccacattg + 1921 agcgctatga tgctcttgaa aataatgaaa aacgcgttcg agaactgatt gataggggct + 1981 gttacacgca agtaaatagt tcacatgtcc tcaaacccaa actttttggc gaacgttata + 2041 aattcatgaa aaaaagagct cagtattttt tagagcagga tttggttcat atcattgcaa + 2101 gtgatatgca caatctagac ggtagacctc ctcatatggc agaagcatat gaccttgtta + 2161 cccaaaaata cggagaagcg aaggctcagg aactttttat agacaatcct cgaaaaattg + 2221 taatggatca actaatttag gagaaatgat gaaagaacaa aacacgatag aaatcgatgt + 2281 atttcaatta tttaaaacct tgtggaaacg caagctaatg attttaatag tggcacttgt + 2341 gacaggtgcg ggggcttttg catatagcac ttttattgtt aagccagaat atacgagtac + 2401 cacgcgaatt tacgtagtga atcgcaatca aggagacaag ccggggctga caaatcagga + 2461 tttgcaggca ggatcttatc tggtaaaaga ctaccgtgag attatccttt cgcaggatgc + 2521 attggaaaaa gtagcgacaa atttgaagtt ggatatgcca gcaaaaacgt tagccagcaa + 2581 agttcaagtg actgtaccag ctgacactcg tatcgtctca atctctgtca aggataaaca + 2641 gccagaggaa gccagtcgta tcgctaattc tctacgagaa gttgctgcag aaaagatcgt + 2701 cgctgtaacg cgagtatctg 
atgtaacgac acttgaagaa gcgcgaccag ctacgactcc + 2761 ctcttctcca aatgttcgac gcaattcctt gtttggtttt cttggaggag cagtcgtaac + 2821 agtaattgct gttcttttga ttgagttgct cgacacccgt gtgaaacgtc ctgaagatgt + 2881 tgaagatgta ctgaaaattc cacttttagg gctcgttcca gattttgaca aaataaaata + 2941 ggaggaagtt atgccaacat tagaaatctc acaggcaaaa ttggattctg taaaaaaggc + 3001 agaggaatat tataacgctt tgtgcacgaa cctacagtta agtggagatg gtttgaaagt + 3061 attttctatc acttctgtga aaataggaga aggaaaatca acgacttccg ccaatatcgc + 3121 ttgggctttt gcgcgtgcag gttacaaaac gctgctgatt gatggagata ttcgcaattc + 3181 tgttatgtta ggtgtcttta aagcaaggaa taagattaca ggcctgacag aatttttatc + 3241 aggaactaca gacttatcac aagggctttg tgataccaat atcgaaaatc tctttgtaat + 3301 tcaggctggc tctgtgtcac cgaatccgac agctcttctt caaagtaaga atttcactac + 3361 aatgcttgaa accttgcgta aatattttga ctacatcatt gtagatactg ctcctgttgg + 3421 tgtcgtgatt gatgcggcta ttattacgcg aaactgcgat gcttctattt tagtgacgga + 3481 ggcaggtgaa ataaatcgtc gggatattca aaaagcaaaa gaacagttgg aacacacagg + 3541 aaagccgttt ttgggaattg tgttgaataa attcgatact tcagtagaca aatacggttc + 3601 ttatggaaat tatggagatt acgggaaaaa taaaaaatag gtcgggggat agagatgaat + 3661 ggaaaaatat taaggtcttc attggccata atccagagtt ttcttgttat tttattgact + 3721 tatctactta gtgctgtgag agaaacggag attgtttcaa caacagctat tgcactttat + 3781 atcctccatt attttgtctt ttatatcagt gattatggac aggatttctt taaaaggaga + 3841 tatttgattg aacttgtcca gacattgaaa tatatcctat tctttgcact agcgattagt + 3901 atttctaatt ttttcttaga ggatcgattt agtatttcca gacgaggcat gatttacttc + 3961 ctcacattac atgctctctt agtctatgtg ctaaacctat ttatcaagtg gtattggaag + 4021 cgggcttatc tcaactttaa aggaagtaag aagattctcc tacttacagc aacttctcat + 4081 gtcgaaaagg tactggatag attaatagaa tcaaatgagg ttgttgggaa gttggtagcc + 4141 gtcagtgtct tagataaacc agattttcag catgattgtt taaaggtagt agcagagggg + 4201 gagatagtaa actttgcgac tcatgaggtg gtcgatgaag tctttatcaa tcttccaagt + 4261 gaaaaataca atattggaga gcttgtctct cagtttgaaa cgatgggaat tgatgtaaca + 4321 gttaatctaa atgcttttga tcgtagtttg gcacgtaaca 
agcaaattcg tgagatggca + 4381 ggattaaacg ttgtgacttt ttctacaaca ttttataaga ctagtcatat aatggctaag + 4441 cggattattg atatcatggg tgcattggta gggctgatac tatgtggttt agtcagtatt + 4501 gtactggttc ctttgattcg aaaggatggg ggttctgcta tttttgctca gacgcgtata + 4561 ggaaaaaatg gtcgtcagtt cactttttat aagtttcgct ctatgtgtgt agatgccgag + 4621 gcgaaaaaaa gagaactcat ggaacaaaat accatgcagg gtggaatgtt taaggtggac + 4681 gatgatcctc gtatcacgaa aattggtcgt tttatacgga agactagctt ggacgagcta + 4741 ccacagtttt ataatgttct aaagggagat atgagtttgg ttggcacacg gccaccaaca + 4801 gtggacgagt atgaacacta taccccagaa caaaaacgtc ggctaagttt taaacctggt + 4861 ataacaggct tatggcaggt cagtggacga agtgagatta agaattttga tgaagttgtc + 4921 aaattagatg tagcctatat agacgattgg acaatttgga aagatattga gattttattg + 4981 aagacagtta aagttgtatt gatgaaggat ggagcgaagt agattgatag atgtaaaaat + 5041 cattgtggca acacataaag aggttaaaat gcctcaagac aatagtcttt accttccaat + 5101 acatgttggg agagacggta aatcagatat tggttttatc ggtgataata ctggcgataa + 5161 tatatcctct ctaaatccat attattgtga gttgacggga ctttattggg catggaagaa + 5221 tcttgattat aattacttag gtctagttca ttaccgtcgt tattttacaa ataaatctca + 5281 agggtataat gaaaatgtca atatggatga cgtcattttg tctcgatcta atgttgaaat + 5341 attattagag aaatctgacg taatagttcc aaagaagcga aagtattata ttgaaactct + 5401 ttattcacat tatgcccata cccttaacgg agaacatctg gatcttgcta ggaaaattat + 5461 tgagcaaaat agttcagagt atctttcatc ctttgataaa gtgatgaaac aaagaagcgg + 5521 ttatatgttc aatatgttta tcatgaaaaa aggactatta gatgattatt taccgtggct + 5581 tttttctatt ctggatacta tgtacgaaca gatggacttg accgactata cttcatttga + 5641 gtcacgttta ttcgggcgag ttagtgagtt gttgtttaat gtttggttat gtaaaaaagg + 5701 aataacgcct aaagaggtac catttatgta catggagaga gtggatttgt ttgaaaaagg + 5761 aaaatctttt ttaatggcta aattttttgg aaagaagtat ggacagagtt tctaggaggg + 5821 aatatgaaaa tcactatcaa aaggtattca ctgccagaaa ttttaggact agcagcatta + 5881 gctatattcc tcctattttc gctattggat gtaagttttt acgttcagta tatatctcct + 5941 atgctatata aagctgcaat ctttttgata attatgctaa taattttgaa ggaatttgta + 6001 
tctgggagta atagctttga gtctctattg ggtttactag gggtttctac gctctatttt + 6061 atcataggta gtgtaacgag ctatacttct tttatagtct tagggctatc tctgatatat + 6121 agcttgaggg atattccctt ttcaaaagta gtcaaagtag cctttatcat tagtgttgct + 6181 atgttgttcc ttgtgatatt gagtagtaag ataggtttta ttcctgatta cattgagttt + 6241 tcatctacta gagttcgaca ctatcttgga ttccgatatt cattatttcc atcaacgatc + 6301 atgatgaata ttatagctat atcatttttt ttgaagcaag aaacagtatc gtatcagcgc + 6361 ctttttatat tatttttagt ttcaatgtac ctatatttag aaactgattc acgactgact + 6421 tttatcagtt cgagtttgtt actattagct aatttggcta tgaagctaat ccctactgtt + 6481 attgaaaaat ttagtctttt attaaaattt ttcacgctta cctattttgt taatgcctat + 6541 ttaagttatt ggatttcaaa aaattactta aggacatcaa atgccttgtt gaatcatttt + 6601 tttcatcaag cagatcaatt cttagggggg cgtatttatt tatctaatcg ttcgttaagt + 6661 ttatatggtt atgggattct tgggcagaaa attgcttggg ttggaaacgc cttgaatgcg + 6721 caaggagaac gaagtacgga tgcatattta tatgtagata atctatatat tcagattctt + 6781 caacattttg ggctgatagc tttaattatt attttaagtt tactgactgc gactttagtg + 6841 aagcttttga gaaagggaca aattgtctta agtattatta tagtttctct gagtttccat + 6901 gctttgattg acgatttgat attgagtatc cattataata ttttttggat attattaggt + 6961 agtttaatct actcaaatta tcagttttct gaagaaaggt atggagaagt tgagaatgat + 7021 tccttacgta gaactgtaag ggaaggttat taatagggtt taatatgaat aatagagatg + 7081 gaaaatatta tattggacta gtaatgaaaa ttattactaa cccattaaag atattaaaga + 7141 taaaaaaacg ccgagttctg ctgaaaagtt ataatgcaga gactatttct tgcaatccaa + 7201 agtatattta taacgaactt aagaaaatta atcgttatga attagtgtgg gtgttgaagg + 7261 agccagaaaa atatcctgat gtaaaagcag taaagtatat gtcgttaaaa tggttgtatt + 7321 atatagttac ttctcaatac gtaatatcaa atacgggatt taacttttgg cttcctaaaa + 7381 agaaaaaaca gatatatata aatacatggc atggaggtgg agcatacaaa gatagtgaca + 7441 atttaaacaa tattagtaaa gcgcaggtca agcaaattaa aaagagtgca gagttggaag + 7501 attattttat atcgagttgt gcagtcttta caaaggaata tgcaaagaaa agagtaggat + 7561 ttaaaggtaa aatactagag atagggacac ctcgaaatga ttttttaatt cgtaatcaag + 7621 cagatgatgg tctaaaaaat 
agtataaaaa atcgacttgg aatagatgat aattgttcta + 7681 tagtaattta tgctccaaca tggcgagatg atgcttcagc tattgaagag atagattatg + 7741 aaagcttact agaaagttta agagagacat atccaaaagt gagtatttta gtacgtggtc + 7801 atcatcttca aaagaatttg attgatataa agaattcaaa tattgttaat gtatctgact + 7861 atgatgatat gcaagaatta ttattaattt cagatttatt aattactgat tactcttcaa + 7921 caatatggga tatgattcat ggagggaaaa aagtattatt atatactcct gatttagatg + 7981 aatatttaaa atatcgagga tttcatgtag atataaaaga atggaacatt ccatacttta + 8041 aaactaacga agagttgatt gcatatatct cttcaaatta ttttaaaaat atggaagaaa + 8101 tgatagagaa ccataagatt agatttggaa gttttgaaca cggaaatgca actcaaaaaa + 8161 tagtggaatt attagaagaa ggtaattaaa tgaaagtaag tgtaataata cctgtttata + 8221 atgttgaaaa atatttaaga aggtgtttgg attccgttgt taatcaaaca tacaaagata + 8281 ttgaagtgat tttggtaaat gatggttctc cagataattc aaaagaaata tgtgaagaat + 8341 acgttgctaa atattccaat attcaattaa taaatcaaaa gaatgcaggg ctaggtgcag + 8401 caagaaatac tggtctacag tatataacag gaaatgcggt aacttttgtc gattctgatg + 8461 attggttaga gttagatgca attgaatatt atgttgcatc tatgaaaaag agtgacgcag + 8521 atattgtagt tactcaaatg attagaaaaa aagaatattt ttctaatgaa ggaactaatg + 8581 ggacgactat aaaagaagag gtcctaaatc aggaacagtt tgcaaaaaaa tattttaaaa + 8641 tagatggtaa taatatagag tattatgctt gtgcaaaact ttataagaga gagattgcta + 8701 gagaggttaa ataccctgtt ggtttatttg cagaagacgt ccctgcagca tttggttata + 8761 ttatacgttc acaaaaaatt ttttatagta caaaagtaac gtataattat ttctttaatg + 8821 ataatagttt aacggctaaa tttacagata aagattttga tttggaaaag atatgggatc + 8881 tagtcgtaga agaagcaaag gtttatggga acgaggatta tattttatat gccaaggtga + 8941 atagatatag aatcgatttt aatcttttgt gcagaattgc tttatcggaa aataaatctg + 9001 atatagaaaa atatagccaa gaaatagtgg ttctacttgg aaaagttaaa gaaaataaaa + 9061 aaattttatt aaagtattta ccgttttcta ggaaggtgat atttagattg tttatagttg + 9121 attatacgct aggaagaaat gttttgagaa tgtttaagaa tattgtgtag ttaacaaata + 9181 ttggtataag gtgatagaaa tgtattattt tataaaagta gagaaagatt taaaaaatac + 9241 agccgggatt aaagcgcctg atgatataga aaaaatttca 
gaagaattgg gaatgaaaga + 9301 aatacgcttt cccaagtttc cttttgaaaa aaataaagtt atacaaaaac tctggctttt + 9361 ttgtgttgta ggttataatt ggataagtct gttgtggaga cttaaaaaga atgatgtagt + 9421 tatttaccaa catccaatgt acggagtgcg tgttgcaaat tttgcaattc ctttattgaa + 9481 aaagtataaa aatataaaat ttatttcagt aatacatgat ttagaatcgt taagaaaagg + 9541 aatccaagga gtcattgaag ataatgaaac aacaaatgct attgcagaca aagagttgtt + 9601 gtcaaaattt gataaagtga tttcccataa tccgaaaatg acagaatatt tagaagggat + 9661 agggataaaa aaagaaaatt tagttgaatt gcaaatattc gactacctag atccatcaga + 9721 aatagaagaa aagattgaag atggagtggt tatagcgggg aatctagcaa aaggaaaaag + 9781 ttcatatata tataagttgt tagaaaatga actgaacttc aaattaaatc tttttgggcc + 9841 aaattttatt aacgaagagc taccagaaaa cgttgagtat tttggtagtt tacctccaaa + 9901 taaattgcct caaaagctag taggtaagtt tggtttggtt tgggacggtg atagtctaga + 9961 aacttgtagt ggaaatactg gtaactattt gaagtataat aatccacata aaacctcatt + 10021 atatcttgct tcaggaatac ctgtaattat ctggaaagaa gctgcgttag cacagtttat + 10081 tgaagaaaat aatgttggta ttactgtaaa taatttgtca gaaattgagt ttgtgatgca + 10141 aaatatatct gagggcgaat atttatcaat aaaaagaaat acaatgcaat tgggtgaaaa + 10201 attaagaaat ggatattttt atcgtcaggc gatatctaag tgcaaaaatg atttcatgaa + 10261 gtaagagggc atataaaaag acggaaaata tttagcaata aatactgtag cttatttttt + 10321 attgaagtgg atgtgtaatt tcagataact atggagttgc tcaccaatta aatcagaact + 10381 caaaaaacaa tagactccct gcgaaacaaa atatggtata gtagttctat gaatgatgaa + 10441 gcaagtaaac aactaactga tgcacgattt aagcgtcttg ttggtgttca gcgcacgact + 10501 tttgaagaga tgttagctgt attaaaaaca gcttatcaac ttaaacacgc aaaaggtgga + 10561 cgaaaaccta aattaagcct agaagacctt cttatggcca ctcttcaata tgtgcgagaa + 10621 tatcgaactt atgaagaaat tgcggctgat tttggtatcc acgaaagcaa cttactccgt + 10681 cggagccaat gggttgaagt aactcttgtt caaagtggtg ttacgatttc aagaactcct + 10741 ctcagttctg aggacacggt aatgattgat gcgacggaag tacaaatcaa tcgccctaaa + 10801 aaaagaatta gcgaattatt ctggtaaaaa aaatgccacg ctatgaaggc tcaagcgatt + 10861 gtcacaagtc aagggagaat tgtttctttg gatatcactg tgaactattg 
tcatgatatg + 10921 aagttgttca aaatgagtcg cagaaatatc ggacaagctg gtaaaatctt ggctgacagt + 10981 ggttatcaag ggctcatgaa gatatatcct caagcacaaa cttcacgtaa atccagcaaa + 11041 ctcagaccgc taatagttga agataaagcc tgtaaccatg cgctatctaa ggagagaagc + 11101 aaggttgaga atatctttgc caaagcaaaa acgtttaaaa tgttttcaac aacctatcga + 11161 aatcatcgta aacgcttcgg attacggatg aatttgattg ctggtattat caatcatgaa + 11221 ctaggattct agttttgcag gaagtctaat aattaaattg gaattgtgaa cgtaaatgaa + 11281 agtacttaaa aactatgcat acaatctatc ttatcaatta ttggtgatta tacttccaat + 11341 cattacgacc ccctatgtga cacgggtctt ttcttcgaat gatctaggga catatggtta + 11401 ttttaactcc atcgttactt attttatcct cttagcaacg ctaggggttg ccaactatgg + 11461 gaccaaggtc atttcagggc atcgcaaaga aattgaaaaa aacttttggg gaatctactc + 11521 tctgcaatta ggtgcaacag ttttttctct aaccttgtat tgtcttcttt gtctaactct + 11581 tccctttatg caaaatccag tagcctacat tctaggcttg gctttggttt ctaaaggatt + 11641 agatatatcc tggctttttc aagggctaga ggattttcga aagattactg ttcgaaatat + 11701 cacagtcaag ttcgttggtg taatctctat cttcctcttt gtcaaatctg cagatgatct + 11761 atacctctat gtctttttgc taaccatatt tgaactcttg gggcagctaa gtatgtgggt + 11821 gcctgctcgt gagtttattg gtagacctca ttttgattta gaatatgcta gacatcattt + 11881 gaaaccagtc atattattgt tccttccgca agtggcgatt tccttgtatg ttacgctaga + 11941 tcgtaccatg cttggagcgt tagcttctac aaaagatgta gggatttatg accaggcttt + 12001 aaagttggta aatatccttc tgaccttggt aacttccttg ggaagtgtca tgttgcctag + 12061 agtttcaaat cttttatcct caggggatca taaagcagtt aacaaaatgc atgagatatc + 12121 atttttaatt tataatttgg ttattttccc cattatggca ggaatgctaa ttgtaaatga + 12181 tgactttgtt acctttttcc tcgggcaaga ttttcaagag gcacgttatg caatagcaat + 12241 tatgattttt agaatgttct ttattggttg gaccaatatt atggggattc aaattttgat + 12301 acctcataat caaaataaag aatttatgct gtcaacaaca attcctgcta ttgttagtgt + 12361 tggattaaat cttctcttgc ttcccaagtt tggatatata ggagcagcaa ttgtttctgt + 12421 cttaacagag gcgctagtat gggctattca attgtactat attcgtgcat acctaaaaga + 12481 tgttccgatt attagaacta tgataaagat tattctagcc tcagctatca 
tgtatagcgt + 12541 tttgctagtt tctaagacat acatacattt ttccccaact ataaatgttt tggtatttgt + 12601 ggtgttaggt ggaatcattt atcttttttc agttttatct ctaaaagtgg tagatgtgat + 12661 agaattaaaa caagtaatta ggaaaaatta gaatgcataa atttaaagat attaacttgg + 12721 atttactaaa agtaattgca tgtgttggag ttgttttact ccatacagag atggggggat + 12781 ttaaagagac aggttcatgg aatttttcga catatttata ctacttagga acctattcta + 12841 tccctctatt ttttatagtt aatggttatt tattgttagg gaagaaagag attacctatt + 12901 cctacatatt acagaaagta aaatatattc taataacagt gctgtcatgg acctttatag + 12961 tttggttatt taaacgggat ttttcagtta atccaataaa aaaacttata ggatcattgg + 13021 tgcaaaaagg ttatttcttt cagttttggt tttttggtgc gcttatactt atttatatat + 13081 gtctccccgt tttgaaacaa tttcttaatt caaaaagaag ttatttatac tttttatctg + 13141 tattgctagt tattggttta atttttgagt taacaaatat tgtacttcaa atgccaatac + 13201 aaacatatgt aatacaaact tttaaattat ggacttggct tttctattat attttagggg + 13261 gctttatatc tcagtttgat aaaaatacca tcaaaaatgg gtttaagaga tggatgaaag + 13321 taattgcagt acttttatta ttagtttcgc catttatatt atttttcata acaaagacca + 13381 cttaccataa tttttttgct gaatattttt atgatatttt attagtaaaa gttgtaagcg + 13441 tagggatttt tctaactatt ttctcaattg tattgaatga aaatagcaac aaatggatta + 13501 tttttctttc taatcaaact atgggtatct ttataataca cacttatatt atgaaggtat + 13561 gggaaaaact atttggtttt aattttatag gttcatattt actttttgct atatttactt + 13621 taagtgttag ttttatcatt gttggaatgt taatgaaaat tccgtatttt aatcgaatcg + 13681 tcaaattata aaaaggagaa aaaatgtacg attatcttgt tgttggtgct ggtctctttg + 13741 gtgcagtctt tgcccatgaa gcagccttaa aaggaaaaaa agtaaaagtt attgaaaaac + 13801 gaaatcatat cgcgggtaat atctatactc gtgaagagga aggaattcaa gttcatcaat + 13861 atggtgctca tatcttccat acttctgata aggagatctg ggattatgta aatcagtttg + 13921 cagagtttaa ccgttatacc aattctcctg ttgcaaacta taagggtgag atttataacc + 13981 ttccttttaa tatgaatact ttcaataaac tttggggagt tgtaacgcca gcagaagcac + 14041 aagctaagat tgaggaacaa cgtgctattt taaatggtaa aactcctgaa aatttggaag + 14101 aacaggcgat ttctcttgta ggtacagaca tctacgaaaa attaatcaaa 
gactatacag + 14161 agaaacagtg gggcaaacca actactgaac ttccatcctt tattattcgc cgtttgccag + 14221 tacgcctgac ctatgataac aactatttta acgataccta tcaagggatt ccaattggtg + 14281 gatacactca aatagttgaa aaaatgttgg atcatgaaaa tattgatgta gaaacaaatg + 14341 ttgatttctt tgtgaataaa gagcaatatc tgaaagattt tcctaagatt gtctttactg + 14401 gtatgattga tgaattcttt gactataagt tgggcgaact agagtaccgt agtcttcgtt + 14461 ttgaaaatga gaccttggat atggaaaatt accaaggaaa tgcagttgtg aactatacgg + 14521 atgcagaaac tccatatact cgcattattg aacacaaaca ttttgagttt gggagtcaag + 14581 caaagactat cattactaaa gaacattcta aaacatggga aaaaggtgat gagccttatt + 14641 atccagttaa taatgatcgt aataatcatt tgtataaatc atacaaaaaa cttgctgatg + 14701 agcaagggaa tgttatcttt ggtggccgct taggacacta tcgttattac gatatgcacc + 14761 aagtaattgg agtagctttg cagtgcgtga gaaatgagtt aaattaatac tcaatgaaaa + 14821 ttaaagagca aactaggaag ctagccacag gttgctcaaa acactgtttt gaggttgcag + 14881 atggacgctg acgcggtttg aagagatttt cgaagagtat aaacaagtaa aactgactac + 14941 cagttattat ttagaaatag tattaaaaat tccttgacta tgtgatatag ttgagggatt + 15001 tttaaatgat attcatattt tttgcaaaga tgttgtttga aaaataattt tcaaaaattc + 15061 tgaaaattct gttgacaact ttctgaaaag agtctataat ggagagaaag ttttaaagga + 15121 gaaaatgatg aaaagttcaa aactatttgc ccttgcgggc gtgacattat tggcggcgac + 15181 tactttagct gcatgctctg gatcaggttc aagcactaaa ggtgagaaaa cattctcata + 15241 catttatgag acagaccctg ataacctcaa ctatttgaca actgctaagg ctgcgacagc + 15301 aaatattacc agtaacgtgg ttgatggttt gctagaaaat gatcgctacg ggaactttgt + 15361 gccgtctatg gctgaggatt ggtctgtatc caaggatgga ttgacttaca cttatactat + 15421 ccgtaaggat gcaaaatggt atacttctga aggtgaagaa tacgcggcag tcaaagctca + 15481 agac +// + diff --git a/public/res/serotype_genbank/serotype_35F.gb b/public/res/serotype_genbank/serotype_35F.gb new file mode 100644 index 0000000..9e93393 --- /dev/null +++ b/public/res/serotype_genbank/serotype_35F.gb @@ -0,0 +1,669 @@ +LOCUS CR931707 15137 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 361/39 (serotype 
35f). +ACCESSION CR931707 +VERSION CR931707.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 15137) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 15137) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..15137 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="361/39" + /db_xref="taxon:1313" + gene <1..137 + /gene="dexB" + /locus_tag="SPC35F_0001" + CDS <1..137 + /gene="dexB" + /locus_tag="SPC35F_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI34340.1" + /db_xref="GOA:Q4K0Y0" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K0Y0" + /translation="SNEEQDLTVEGKVKSVLIENTAAKEVLEKQVLAPWDAFCVEMTD + " + gene complement(284..1679) + /gene="tnp" + /locus_tag="SPC35F_0002" + /pseudo + CDS complement(join(284..418,418..963,963..1679)) + /gene="tnp" + /locus_tag="SPC35F_0002" + /note="member of homology group 17" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1202 transposase" + misc_feature complement(join(691..963,963..1196)) + /gene="tnp" + /locus_tag="SPC35F_0002" + /note="HMMPfam hit to PF00665, Integrase core domain, + score 5.4e-19" + /pseudo + gene 1848..3302 + /gene="wzg" + /locus_tag="SPC35F_0003" + CDS 1848..3302 + /gene="wzg" + /locus_tag="SPC35F_0003" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI34342.1" + /db_xref="GOA:Q4JZA2" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4JZA2" + /translation="MLIMSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNI + LAFRYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLLFSILVSSVSLFAVQQFVGL + TNRLNATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNT + DLTVNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKV + EAPKTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPI + ADGGNNQKDKLTHAGIYGVDSSIHTLENLYEVDINYYVRLNFTSFLKLIDLLGGIDVY + NDQEFTAHTNGKYYPAGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKL + TSTEALKNYSTIINSLQDSIQTNMPLETMIDLVNTQLESGGKYKVNSQDLKGTGRMDL + PSYAMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1848..1973 + /gene="wzg" + /locus_tag="SPC35F_0003" + /note="Signal peptide predicted for SPC1708 
by SignalP 2.0 + HMM (Signal peptide probability 0.991) with cleavage site + probability 0.537 between residues 42 and 43" + misc_feature 2061..2408 + /gene="wzg" + /locus_tag="SPC35F_0003" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 8.6e-63" + misc_feature 2586..3029 + /gene="wzg" + /locus_tag="SPC35F_0003" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 8.6e-68" + gene 3304..4035 + /gene="wzh" + /locus_tag="SPC35F_0004" + CDS 3304..4035 + /gene="wzh" + /locus_tag="SPC35F_0004" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34343.1" + /db_xref="GOA:Q4JYJ3" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4JYJ3" + /translation="MIDIHSHIVFDVDDGPKSREESKALLVESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNIPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRVQYFLERDLVHVVASDMHNLDSRPPYMQQAYDIIA + KKYGAKKAKEFFVDNPRKIIMDQLI" + misc_feature 3307..3915 + /gene="wzh" + /locus_tag="SPC35F_0004" + /note="HMMPfam hit to PF02811, PHP domain, score 4.7e-36" + gene 4044..4736 + /gene="wzd" + /locus_tag="SPC35F_0005" + CDS 4044..4736 + /gene="wzd" + /locus_tag="SPC35F_0005" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34344.1" + /db_xref="GOA:Q4JZA0" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4JZA0" + /translation="MKEQNTLEIDVLQLFRALWKRKLVILLVAIITSSVAFAYSTFVI + KPEFTSTTRIYVVNRNQEEKSGLTNQDLQAGSYLVKDYREIILSQDVLEEVISDLKLD + LTPKGLANKIKVTVPVDTRIVSVSVNDRVPEEASRIANSLREVAAQKIISITRVSDVT + TLEEARPAISPSSPNIKRNTLIGFLAGGIGTSVIVLLLELLDTHVKRPEDIEDTLQMT + LLGVVPNLSKLK" + misc_feature 4062..4478 + /gene="wzd" + /locus_tag="SPC35F_0005" + /note="HMMPfam hit 
to PF02706, Chain length determinant + protein, score 1.1e-53" + misc_feature 4584..4661 + /gene="wzd" + /locus_tag="SPC35F_0005" + /note="PS00217 Sugar transport proteins signature 2." + gene 4746..5429 + /gene="wze" + /locus_tag="SPC35F_0006" + CDS 4746..5429 + /gene="wze" + /locus_tag="SPC35F_0006" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34345.1" + /db_xref="GOA:Q4JZ99" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4JZ99" + /translation="MPTLEIAQKKLEFIKKAEEYYNALCTNIQLSGDKLKVISVTSVN + PGEGKTTTSVNIARSFARTGYKTLLIDGDTRNSVISGVFKSREKITGLTEFLSGTADL + SHGLCDTNIENLFVIQSGSVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTPPIGIVI + DAAIITQKCDASILVTAIGEVNKRDVQKAKQQLEQTEKLFLGVVLNKLDISVDKYGVY + GSYGNYRKE" + gene 5438..6079 + /gene="wcjH" + /locus_tag="SPC35F_0007" + CDS 5438..6079 + /gene="wcjH" + /locus_tag="SPC35F_0007" + /note="member of homology group 61" + /codon_start=1 + /transl_table=11 + /product="putative initial sugar transferase" + /protein_id="CAI34346.1" + /db_xref="GOA:Q4JYJ0" + /db_xref="InterPro:IPR003362" + /db_xref="UniProtKB/TrEMBL:Q4JYJ0" + /translation="MIKMYFVFKNILDRFLAFFLFITLIIIPIIPITILVIWIEDPGD + VFFFQDRIGLNGKSFKVIKFRSMYKDADQRIKKSIISGEIDRLNFKEHSQSMTTKVGK + VIRKLSIDELPQLVNIIKGDMAIVGPRPLQQFEITHHILTHKEMETTLKMSKRLSVKP + GLLCYWQVTPNKNDIPFSDRMNLDLLYIDNVSFKTDFLLILKGFYTVLMGNNN" + misc_feature 5474..6070 + /gene="wcjH" + /locus_tag="SPC35F_0007" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 1.1e-23" + gene 6081..6872 + /gene="wciB" + /locus_tag="SPC35F_0008" + CDS 6081..6872 + /gene="wciB" + /locus_tag="SPC35F_0008" + /note="member of homology group 16" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34347.1" + /db_xref="GOA:Q4JYI9" + /db_xref="UniProtKB/TrEMBL:Q4JYI9" + /translation="MKNIKILVATHKKYKMPSDSNMYLPIHVGCEGKKNLGFQGDNSE + 
ENISNLNPYYCELTGLFWAWKNLDCDYLGLVHYRRYFTKMTKRYNESINIDDVILNRF + EVEKLLENSDIIVPKRRKYYIETLYSHYDHTFDGSHLDLARKMIEMKNPEYLSSFDKV + MEQRSGYMFNMFIMKKELADDYFSWLFPILDSMYESMDLSGLTDFEARLFGRVSELLF + NVWLVKSNLTPKEVPFMYMEKVNLFKKGISFLMAKFFGKKYGQSF" + gene 6889..8109 + /gene="wzy" + /locus_tag="SPC35F_0009" + CDS 6889..8109 + /gene="wzy" + /locus_tag="SPC35F_0009" + /note="member of homology group 45" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI34348.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ96" + /translation="MMKVVIKRKSLPEILALSALTIFLVVSILDVTFYVQYLPKVVYK + ILIAISLILLVIKELYKRKFDYRTIISLFATVLMYLLIGRVSTLNSNIAIGIIFIYAL + RDIPFKSVAKTSLAVSVLILLFVITSAKLGVIINYLEISGTRVRSYLGFRYALFPSIL + MMNIVAIVFYLKQNKIQYWQWLLLSLSAYWLYDETDSRLTFYSSCILLICSLLIRWIP + ELFSKFGYIFKAFKLTFIINAVVSFWVSFTYLNLSHSYINNLFLKLDYILGGRIYLMN + KSLNLYGFGLFGRPVEWNGNGLTIEGVRNYQTYLYVDNLYVQILQKFGLLALGIMLLV + LTLTLFKVIKRREWVLSFILILMSFHSMIDDLNLYLHYNIFWILLGSLIYPDYQFSDE + SDEELGENSFEEII" + misc_feature 6889..6993 + /gene="wzy" + /locus_tag="SPC35F_0009" + /note="Signal peptide predicted for SPC1714 by SignalP 2.0 + HMM (Signal peptide probability 0.989) with cleavage site + probability 0.880 between residues 35 and 36" + gene 8205..9005 + /gene="wcrO" + /locus_tag="SPC35F_0010" + CDS 8205..9005 + /gene="wcrO" + /locus_tag="SPC35F_0010" + /note="member of homology group 46" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="CAI34349.1" + /db_xref="GOA:Q4JZ95" + /db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4JZ95" + /translation="MSDIKIIQDKILIILKEFISICEENNLTYYALGGTLLGAVRHKG + FIPWDDDIDIGMPREDYEKFKILAPDLLPSNLKIVNNPLNLDITQLVDKNVIVKIANS + ENNVFIDIFPLDGYPEKGFFAAKLHSFRLLFQRMLCKISVLDQLEDKDRGTVENLIVK + ISKMLRIQKVLPKDTLVENLHKVIQKYDFKTSRYVGNVLGRYREREIVPKEYFKEPVS + LIFEDTMINCPTKYKEYLSEIYGDYMKLPSVEDRVAHNIELISVGDAE" + misc_feature 8268..8927 + /gene="wcrO" + /locus_tag="SPC35F_0010" + /note="HMMPfam hit to PF04991, LICD Protein 
Family, score + 7.6e-51" + gene 9021..10127 + /gene="wcrC" + /locus_tag="SPC35F_0011" + CDS 9021..10127 + /gene="wcrC" + /locus_tag="SPC35F_0011" + /note="member of homology group 24" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34350.1" + /db_xref="GOA:Q4JZ94" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4JZ94" + /translation="MGKKICIVKWILDDSGGGERVAVSLANELTKKYEVHLIGITTKQ + SDLFFKINSQVRYSNFFDHRVRLSKNILKISKMLRKYFIDNEIEVGFGIGISANVFLS + LAGIGTQTKVVLCDHTNSITDNREFSQKFQRYVGTKLADKIITLTQEDRENYIKKYGV + PEERICYIYNWKEAALSDVSYNKKSTKIVTVGRFDYQKGYDYLIQVAKKVLEKRADWT + WEIYGSGNQDEVEKIRDLINENDLQDRLVIKGLEKNQDLIYGDKGIYVMTSRYEGLPL + VLLEAQQYNLPIASFSCPTGPNEIVEDGVNGYLVECYDVEAMSNRLLELMNDKELRNR + FSSHAKDNIEKFNKDRIIHQWIDLIEEVSGGGNV" + misc_feature 9534..10046 + /gene="wcrC" + /locus_tag="SPC35F_0011" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 3.4e-39" + gene 10120..11136 + /gene="wcrD" + /locus_tag="SPC35F_0012" + CDS 10120..11136 + /gene="wcrD" + /locus_tag="SPC35F_0012" + /note="member of homology group 32" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34351.1" + /db_xref="GOA:Q4JYI5" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JYI5" + /translation="MSNKILTITVPTYNIENYIGKCIESFKAVNPTYYSDFEVLIIND + GSTDNSVQVVKDLMEGSTLDLRIITKENGGHGSTINRGIKEASGKYFKVIDGDDWINV + PEFESLLDKLREINTDLVISDYTEQHVYNNSTIFKEFSSYLIPNQETRGIPSKWTPMH + ALVYKTSILKDNAITISENTFYVDQEYTMLPLQFVENYIYFKLDIYQYFLGRADQSMN + IDIMRKRADHHERVTKRILDLYKESYTQKPEIEKVVSDSLQYLVNKQNILYVMNEELD + KVYELFSYSEKSGFKFKFETKTKTSNLLYVNYKTKYLFNLVIKNLVKRKANSLEKEFQ + EKGF" + misc_feature 10138..10638 + /gene="wcrD" + /locus_tag="SPC35F_0012" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 1.4e-32" + gene 11226..12656 + /gene="wzx" + /locus_tag="SPC35F_0013" + CDS 11226..12656 + /gene="wzx" + /locus_tag="SPC35F_0013" + /note="member of homology group 7" + /codon_start=1 + 
/transl_table=11 + /product="flippase Wzx" + /protein_id="CAI34352.1" + /db_xref="GOA:Q4JZ92" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4JZ92" + /translation="MECACMKVLKNYAYNLSYQLLIIILPIITTPYVTRIFSSDNLGT + YGYFNSIVTYFLLLATLGIGNYGTKEISGNRKAIHQNFWGIYSIQLGASLFSTFLYVI + VCLILPAMQNTVAYILGLSLFSKGLDISWLFQGLEDFRKITVRNITVKVIGITSIFLF + VKSASDLYLYVFLLTIFELLGQLSMWVPAREFIGKPHFDWLYAKQHLKPVILLFLPQV + AISLYVTLDSTMLGSLASIRDVGIYDQSLKLVKILLTLVTSLGSVMLPRVSNLLSSGD + HKAVNKMHEISFLIYNLVIFPIMAGMLIVNDDFVTFFLGQDFQEARYAIAIMIFRMFF + IGWTNIMGIQILIPHNKNKEFMLSTIIPAIVSVGLNLLLLPKLGYIGAAIVSVLTEAL + VWAIQLYYTRTYLKDVPIIRTMIKIILASAIMYSVLLVSKTYIHFSPTINVLVFVVLG + GIIYLFSVLSLKVIDVIELKQVIRKN" + misc_feature 11247..12041 + /gene="wzx" + /locus_tag="SPC35F_0013" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 7e-63" + gene 12658..13656 + /gene="wciG" + /locus_tag="SPC35F_0014" + CDS 12658..13656 + /gene="wciG" + /locus_tag="SPC35F_0014" + /note="member of homology group 21" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI34353.1" + /db_xref="GOA:Q4JZ91" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q4JZ91" + /translation="MHKFKDINLDLLKVIACVGVVLLHTEMGGFKETGSWNFSTYLYY + LGTYSIPLFFIVNGYLLLGKKEITYSYILQKVKWILITVLSWTLIVWLFKRDFSVNPI + KKLIGSLVQKGYFFQFWFFGALILIYICLPVLKQFLNSKRSYLYFLSVLLVIGLIFEL + TNIVLQMPIQAYVIQTFRLWTWLFYYILGGFISQFDKNTIKNGFKRWMKVIAVLLLLV + SPFILFFIAKTTYYNFFAEYFYDILLVKVVSVGIFLTIFSLVLNENSNKWIIFLSNQT + MGIFIIHTYIMKVWEKLFGFSFMGSYLLFAIFTLSVSFIIVGMLMKIPYFNRIVKL" + gene 13669..14772 + /gene="glf" + /locus_tag="SPC35F_0015" + CDS 13669..14772 + /gene="glf" + /locus_tag="SPC35F_0015" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI34354.1" + /db_xref="GOA:Q4JZ90" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + 
/db_xref="UniProtKB/TrEMBL:Q4JZ90" + /translation="MYDYLIVGAGLFGAVFAHEAALKGKKVKVIEKRNHIAGNIYTRE + EEGIQVHQYGAHIFHTSDKEIWEYVNQFAEFNRYTNSPVANYKGEIYNLPFNMNTFNK + LWGVVTPAEAQVKIEEQRAILNGKTPENLEEQAISLVGTDIYEKLIKDYTEKQWGKPT + TELPAFIIRRLPVRLTYDNNYFNDTYQGIPIGGYTQIVEKMLDHENIDVETNVDFFVN + KEQYLKDFPKIVFTGMIDEFFDYKLGELEYRSLRFENETLDMENYQGNAVVNYTDAET + PYTRIIEHKHFEFGSQAKTIITKEHSKTWEKGDEPYYPVNNDRNNHLYKSYKKLADEQ + GNVIFGGRLGHYRYYDMHQVIGAALQCVRNELN" + misc_feature 14104..14712 + /gene="glf" + /locus_tag="SPC35F_0015" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 9.6e-115" + gene 15090..>15137 + /gene="aliA" + /locus_tag="SPC35F_0016" + CDS 15090..>15137 + /gene="aliA" + /locus_tag="SPC35F_0016" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34355.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ89" + /translation="MMKSSKLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acactgcggc taaagaagta cttgaaaaac aggtcttggc tccatgggat gctttctgtg + 121 tggaaatgac tgactagaat gagcaaacct caagtttttg aagcttgagg ttttttacta + 181 tagtggattg aaactagaat agtgcacctc tacttctaaa acattgttag aaatcgattt + 241 gactgtcctg actaatttgt cctattctta tttcatttta ctatatttgt agttgaggag + 301 aattaagctc ctcactagta aactcttcat aatccttttt atttttatga agatattgtt + 361 tgaaagatgt gagtttccac ggatgggttt gtggagggat atacttgcgt ctttcttttt + 421 ttgttctggt tcttgttcaa agtttttcga atagagttca tgatctagta gctcctttgt + 481 gtgatagatt ttgtcagcga tattgaggta gatgtctccg tcaaatgctt ttataactaa + 541 tgctttcgta tttctgatga aatagacttc ttttccttgt tcggtaggga tatagtaacg + 601 attttggaat cggatatggt gtccactatc gacgactctc tccgccagtc tggccagaat + 661 gagattcctt tcagaggggt taggaacctc ctcgaagaca gagagttttg tcttgtttcc + 721 aaactgttca ttaaaggttt ggatgtagga aagcaggaag gtattggctt cttccaaggt + 781 atgaatattg tttcgttcca gttcgatagg caggcgagat tgtagtgtct gattaagtct + 841 ttcgactctc cctttagctt gagggataga ggttgtctcc agaagaatcc ctagttggtg + 901 acaggcgtat ccaaattgtg tatgggtgtc gtcctccatt ttcttcgagt 
tggaggcttg + 961 atataggtaa agaccgttct cttatctgtt ttaatttgaa ggggaacgcc gtgattgcct + 1021 aaaatttgtt cgaggacatg atagtaagca ttcaaggtct cttgtttatc aaaataagcg + 1081 cctaggatat tgccagaagc atcatcaatg gctaagtgta agttagatgt ttgggctcca + 1141 aaccatgcat gagggctggc atccatttga atgagttctc cagcaaattt ctttctgggt + 1201 ctactaggat gtactttttt aggggcttca aggaagtttt cagccgtcgg taagattgga + 1261 ttgtctaggg gttgattcag gttcagttta gcttgttttc ttactctctt ctttgtcttt + 1321 ctatgggact taggcgacag gatatttttc ttatagagta tttttctaac agttgtatca + 1381 gagagctgaa ttccttcttc ttcagctagc aattcacaga aatgaaggac atttggttta + 1441 tatgtttcat aggagaggta tttctttagg agacgttctt tgatttcatc agggattgca + 1501 tgttttggtt ttcgatttct gtttccgtgt ctgaaggctt cttttccttt cagttgatag + 1561 gctagtagca gacgattgat ttgtctttca gaaagattga gctcgacaca ggttcgtttc + 1621 tttgttttct ttccttgcgc tatagctttt atcacaagat attttttagt ttcattcata + 1681 ttcagttgga tccttttcat atgactattc taccaaatgg gacattttca cgttcgattt + 1741 actaaagaca ttatcacatt cgaattacac aagatgcaga tagtgaaaat aaaggtgtag + 1801 acattaccgt aaaaaagtga tataatcgta tgatgttcaa ggtataggtg ttaatcatga + 1861 gtagacgttt taaaaaatca ggttcacaga aagtgaagcg aagtgttaat atcgttttgc + 1921 tgactattta tttattatta gtttgttttt tattgttctt aatctttaag tacaatatcc + 1981 ttgcttttag atatcttaat ctagtggtaa ctgcgttagt cctactagtt gccttggtag + 2041 ggctactctt gattatctat aaaaaagctg aaaaatttac tatttttctg ttgctgttct + 2101 ctatccttgt cagctctgtg tcgctctttg cagtacagca gtttgttgga ctgaccaatc + 2161 gtttaaatgc gacttctaat tactcagaat attcaatcag tgtcgctgtt ttagcagata + 2221 gtgatatcga aaatgttacg caactgacga gtgtgacagc accgactggg actgataatg + 2281 aaaatattca aaaactacta gctgatatca agtcaagtca gaataccgat ttgacggtca + 2341 accagagttc gtcttacttg gcagcttaca agagtttgat tgcaggggag actaaggcca + 2401 ttgtcctaaa tagtgtcttt gaaaacatca tcgagtcaga gtatccagac tacgcatcga + 2461 agataaagaa gatttatacc aagggattca ctaaaaaagt agaagctcct aagacgtcta + 2521 agaatcagtc tttcaatatc tatgttagtg gaattgacac ctatggccct attagttcgg + 2581 tgtcgcgatc 
agatgtcaat atcctgatga ctgtcaatcg agataccaag aaaatcctct + 2641 tgaccacaac gccacgtgat gcctatgtac caatcgcaga tggtggaaat aatcaaaaag + 2701 ataaattaac ccatgcgggc atttatggag ttgattcgtc cattcacacc ttagaaaatc + 2761 tctatgaagt ggatatcaat tactatgtgc gattgaactt cacttcgttt ttgaaattga + 2821 ttgatttgtt gggtggaatt gatgtttata atgatcaaga atttactgcc catacgaatg + 2881 gaaagtatta ccctgcaggc aatgttcatc ttgattcaga acaggctctc ggttttgttc + 2941 gtgagcgcta ctcactagca gatggcgatc gtgaccgtgg gcgcaatcaa caaaaggtca + 3001 ttgtggctat ccttcaaaaa ttaacgtcaa ccgaagcgct gaaaaattat agtacgatca + 3061 ttaatagctt gcaagattct atccaaacaa atatgccact tgagactatg atagatttag + 3121 tgaatactca gttggaaagt ggagggaagt ataaagtaaa ttctcaagat ttaaaaggta + 3181 caggtcggat ggatcttcct tcttatgcaa tgccagacag taacctctat gtgatggaaa + 3241 tagatgatag tagtttagct gtagttaaag cagctataca ggatgtgatg gagggtagat + 3301 gaaatgatag atatccattc gcacatcgtc tttgatgtag atgatggtcc caagtcaagg + 3361 gaggaaagca aggctctctt ggtagaatcc tacagacagg gggtgcgaac cattgtctct + 3421 acctctcacc gtcgcaaggg catgtttgaa actccggaag agaagatagc agaaaacttt + 3481 cttcaggttc gggaaatagc taaggaagtg gcgagtgact tggtcattgc ttacggggct + 3541 gaaatttact acacaccaga tgttctggat aagctggaaa aaaagcggat tccgaccctc + 3601 aatgatagtc gttatgcctt gatagagttt agtatgaaca ttccttatcg cgatattcat + 3661 agcgctttga gcaagatctt gatgttggga attactccag tcattgccca catcgagcgc + 3721 tatgatgctc ttgaaaataa tgaaaaacgc gttcgggaac tgatcgatat gggctgttac + 3781 acgcaagtaa atagttcaca tgtcctcaaa cccaaacttt ttggcgaacg ttataaattc + 3841 atgaaaaaaa gagttcagta ttttttggaa cgtgatttag ttcatgtagt tgcaagtgac + 3901 atgcacaatt tagacagtag acctccatat atgcaacagg catatgatat cattgctaag + 3961 aaatatggag cgaaaaaagc gaaagaattt tttgtagata atcccagaaa aattataatg + 4021 gatcaattaa tttaggagaa aatatgaagg aacaaaacac tttggaaatc gatgtattgc + 4081 aactattcag ggctttatgg aaaagaaagt tggtcatttt attagtggca attataactt + 4141 cttcagttgc ttttgcctac agtacttttg ttatcaaacc tgagtttact agtacgactc + 4201 ggatttatgt agttaaccgt aatcaggaag 
agaagtctgg tttaaccaat caagacttgc + 4261 aggcaggatc atacttggtt aaagactatc gtgaaattat cctatcgcag gatgttttgg + 4321 aggaagttat ttctgatttg aaactagatt tgacgccaaa aggtttggct aataaaatta + 4381 aagtaacagt accagttgat acccgtattg tctctgtctc agttaatgat cgagttcctg + 4441 aagaggcaag ccgtatcgct aactctttga gagaagtagc tgctcaaaaa attatcagta + 4501 ttactcgtgt ttctgatgtg acaacactgg aggaggcaag accggcgata tcaccatctt + 4561 cgccaaatat taaacgcaat acactaattg gttttttggc aggggggatt ggaactagtg + 4621 ttatagttct tcttcttgaa cttttggaca ctcatgtgaa acgtccggaa gatatcgaag + 4681 atacactgca gatgacactt ttgggagttg taccaaactt gagtaagttg aaataggaga + 4741 gaggaatgcc gacattagaa atagcacaaa aaaaactgga gttcattaag aaggcagaag + 4801 aatattacaa tgccttgtgt acaaatatac agttgagcgg agataaacta aaagtaattt + 4861 ccgttacttc tgttaaccct ggggaaggaa aaacaactac ttccgtaaat atagcaaggt + 4921 cgtttgcgcg tacaggctat aaaactcttt tgatcgatgg cgatactcga aattcagtta + 4981 tatcaggagt ttttaaatcg cgtgaaaaaa ttacagggct aacagaattt ttatctggga + 5041 cagctgattt atctcacggt ttatgtgata caaatattga aaatttattt gtaattcaat + 5101 cgggatctgt atcaccaaac cctacagcct tgttacaaag taaaaatttt aatgatatga + 5161 ttgaaacatt gcgtaaatat tttgattata tcattgttga tacaccacct attggaattg + 5221 ttattgatgc ggcaattatc actcaaaagt gtgatgcgtc catcttggta acagcaatag + 5281 gtgaggtgaa taaacgtgat gtccaaaaag cgaaacaaca attagaacaa acagagaaac + 5341 tgttcctagg agttgtttta aataaattgg atatctcggt tgataagtat ggagtttacg + 5401 gttcctatgg aaattatagg aaggaataac ggagtaattg ataaaaatgt attttgtttt + 5461 taaaaatatt ttagatagat ttttggcgtt tttcctattt atcacactga taatcatacc + 5521 gattattccg ataacaattc tggttatttg gatagaagat ccaggagatg tgtttttctt + 5581 tcaagataga attggtttaa atgggaagag ctttaaagta ataaagtttc ggagcatgta + 5641 taaagatgct gatcaaagga taaagaaaag tattattagt ggtgaaattg atcgtctaaa + 5701 ttttaaagaa cattctcaaa gtatgactac aaaagtcggt aaagtgatac gaaaactttc + 5761 aattgatgaa ttacctcaat tagtgaatat tataaaaggt gatatggcta tagtgggacc + 5821 tcgtccatta caacaatttg aaataactca tcatattctt acccataaag 
aaatggagac + 5881 tactttaaag atgtctaaaa gattgtctgt gaaacctggt ttgctttgtt attggcaagt + 5941 tacgccgaat aaaaatgaca ttccttttag tgatagaatg aatctagatt tattatacat + 6001 tgataatgta tctttcaaga ctgatttctt gcttattttg aagggatttt atacagtttt + 6061 aatgggtaat aacaattaac atgaaaaata taaaaatatt agtagcaaca cataaaaaat + 6121 ataaaatgcc cagtgattca aatatgtatc taccaattca tgtaggatgt gaaggaaaga + 6181 aaaatttagg atttcaaggt gacaattcag aagaaaatat ttctaattta aatccttatt + 6241 attgtgaatt aactggcttg ttttgggctt ggaaaaactt agattgtgat tatctgggtt + 6301 tagtacatta tcgtcgttat tttactaaaa tgacaaaaag gtacaatgaa tcaataaata + 6361 tcgatgatgt aattttaaat aggtttgaag ttgagaaatt gttagagaac tcagatatca + 6421 ttgttcctaa aagaagaaaa tattatattg aaactcttta ttctcattac gaccatactt + 6481 ttgatggttc tcatttagat ctagctagaa aaatgattga aatgaagaat ccagaatatc + 6541 tctctagttt tgataaggta atggaacaaa gaagcgggta catgtttaac atgttcatta + 6601 tgaaaaaaga actggcagac gattattttt cttggctgtt tcctatcttg gatagtatgt + 6661 atgaaagtat ggatttatca gggttaactg attttgaagc tagattattt ggaagagtaa + 6721 gtgagttgtt atttaacgta tggttggtga agagcaattt aactccaaag gaagtgccgt + 6781 ttatgtatat ggaaaaagtt aacttattta aaaaagggat ttcatttttg atggcgaaat + 6841 ttttcggaaa gaaatatgga cagagttttt agttaggaat aaaaaatagt gatgaaagta + 6901 gtaataaaaa gaaagtcttt gccagagatt ttagctctta gtgcactaac tatattttta + 6961 gttgtgtcaa ttttagatgt gactttttat gttcagtatc ttccaaaagt tgtttataag + 7021 atactgatag ctatttcgct tattctgcta gttataaaag agttgtacaa aagaaagttt + 7081 gattatagaa ctatcataag tctatttgct acagttttga tgtatctcct tatagggagg + 7141 gtgagtactc ttaactctaa tattgcaata ggaattattt tcatttatgc tttacgcgat + 7201 attcctttta aaagcgtggc aaaaacttct ttagcagtaa gtgtactcat attactgttt + 7261 gttataacta gcgcaaaatt gggagttatt ataaattatt tagagatttc tgggactcga + 7321 gtccgtagtt atttaggatt taggtacgca ctattcccat ctatcttgat gatgaacata + 7381 gtcgctattg tattttattt aaagcaaaat aaaatacaat attggcaatg gttattgtta + 7441 tctttatctg cttattggct gtatgatgaa acggattctc gattaacatt ttatagttcc + 7501 tgtatattgt 
tgatatgcag tttattaata agatggatcc cagaactatt ctctaagttc + 7561 ggatatatat ttaaagcttt taaactcacc tttattataa atgcagttgt tagtttttgg + 7621 gtctccttta cctatctcaa tttgagtcat tcttatatca ataatctttt tttaaaatta + 7681 gactatatat taggtggtcg tatatacttg atgaataaat cgttgaattt gtatggtttt + 7741 ggattattcg gacgaccagt tgaatggaat ggaaatggtc tgaccattga aggagttaga + 7801 aactatcaga cctatctgta tgttgataat ttgtatgttc aaattttaca aaaatttggt + 7861 ttactcgctc taggaataat gctcctagtc ctaactttaa ccttgtttaa agtgattaag + 7921 agacgcgaat gggttctgtc ttttattttg atattgatga gttttcattc catgattgat + 7981 gatttgaatt tgtaccttca ttacaatatt ttttggatat tattaggtag tttaatctac + 8041 cccgattatc aattttctga tgaaagtgat gaagagttag gggaaaattc ttttgaagaa + 8101 attatatagt gaaatgctaa gaaatatttg agaagaactc acaagagtat agctgagaag + 8161 acagttgtat atcgagtttt gctgttttta tataggaggg aagtatgtcg gatataaaaa + 8221 tcattcaaga taagatttta attatcttaa aagagtttat tagtatttgt gaagaaaata + 8281 acctgaccta ctatgctcta ggtgggacct tgttgggcgc ggtacgtcat aaaggattca + 8341 taccttggga tgacgatatt gatatcggta tgccaagaga agattatgaa aagtttaaaa + 8401 tactagcccc agacctgtta ccaagtaatt taaaaatagt taataatcca cttaatcttg + 8461 atataactca gttagtagat aaaaatgtta ttgttaaaat tgcgaattcg gaaaacaatg + 8521 tgtttattga catttttcct ctagatggtt atccagaaaa aggatttttt gcagctaaat + 8581 tgcatagttt taggctattg tttcaaagaa tgctttgtaa aatatcagtt ttagaccagc + 8641 ttgaagataa agaccgtggc actgtggaga atcttatagt taaaatatcg aaaatgctaa + 8701 gaatccaaaa agtacttcct aaggatacat tggtagaaaa tctgcataaa gttattcaaa + 8761 aatatgattt taaaacttct cgttacgtcg gtaatgttct aggtagatat agggagagag + 8821 aaatagttcc gaaagagtat tttaaagaac ctgtttctct tatttttgag gatacgatga + 8881 taaactgtcc gacaaagtac aaggaatatt taagcgaaat ctacggtgat tacatgaaat + 8941 taccatcagt agaagataga gtagcacata atatagaact tatatcagta ggtgatgcag + 9001 agtgaagggt aggatagaaa ttgggaaaaa aaatatgtat tgtgaaatgg attttggatg + 9061 attctggtgg cggtgagcga gttgctgtat ctttggcaaa cgaacttaca aaaaagtatg + 9121 aagttcattt aattggaatt acaacaaagc 
aatcggacct gttctttaaa atcaattccc + 9181 aagtaagata ctccaatttt tttgaccata gagtacgctt gtctaagaat attctaaaaa + 9241 tctcaaaaat gttaagaaaa tatttcatag ataatgaaat agaggttggt tttgggatag + 9301 ggatatctgc taatgtattt ttatctttgg caggaatagg aactcaaact aaagtagttt + 9361 tgtgtgatca taccaattcg attacggata atagagaatt ttctcagaaa ttccaaagat + 9421 atgttgggac aaagttggca gacaagatta tcactctcac tcaagaagac cgtgaaaatt + 9481 atataaaaaa atacggtgtt cctgaggaaa gaatttgcta catctataat tggaaagagg + 9541 ctgctctttc agatgtatct tataataaaa aatcaactaa aattgtgact gttggccgtt + 9601 ttgattatca aaaaggctat gattatctca ttcaagtcgc gaaaaaagtg ttagagaaaa + 9661 gggctgactg gacttgggaa atctacggtt ccggcaatca agatgaagta gagaaaatca + 9721 gagatttaat caacgaaaat gatttacagg ataggttagt cataaaagga ctcgaaaaaa + 9781 atcaagattt gatttatgga gataaaggga tttatgtcat gacttctcgc tatgaaggtc + 9841 tacctttagt cctgctggaa gcacaacaat ataatcttcc tatagctagc tttagttgtc + 9901 cgacaggacc gaacgaaatt gttgaagatg gagttaatgg ctatctggtt gagtgttatg + 9961 atgtagaagc gatgtctaat agattattag aactaatgaa tgataaggag ctaagaaatc + 10021 gtttttcatc tcatgcaaaa gataacattg aaaaatttaa taaagaccga attatacatc + 10081 agtggataga tttgatagaa gaagtatctg gggggggaaa tgtctaataa aatactgacg + 10141 attactgtgc caacctataa tattgaaaac tatattggta aatgcataga atcatttaaa + 10201 gctgtaaatc ctacctatta cagtgatttt gaagtgttaa tcattaatga cggaagtact + 10261 gataattctg tacaagttgt taaggattta atggaaggta gcactttaga tttaagaatt + 10321 atcacaaaag aaaatggggg ccatggctca actattaatc gcgggattaa agaagctagt + 10381 ggaaaatatt ttaaggtcat tgatggggat gattggatca atgttccaga atttgaaagc + 10441 ttattggata agttaagaga gattaacact gatttagtga tttctgacta tacagagcag + 10501 catgtatata ataatagcac tatttttaaa gaattctctt cttatctaat tccaaatcaa + 10561 gagacaagag gtattcctag caagtggaca cctatgcatg ccctggtcta taaaacaagt + 10621 atcttgaagg ataatgctat tacgattagt gaaaatacat tttatgtcga ccaagagtat + 10681 acaatgctcc ctcttcaatt tgtagaaaat tatatttatt ttaagttgga tatttatcag + 10741 tacttcttgg gaagagctga tcagagtatg aatattgata 
taatgagaaa gagagcagat + 10801 catcatgaga gagtaacgaa acgaatctta gacttatata aagagagtta tacacaaaag + 10861 ccagaaatag aaaaggttgt cagtgactct ttgcagtatc tggttaataa gcaaaatatt + 10921 ttgtatgtta tgaatgagga acttgataag gtatatgaac tgttttcata ttctgagaaa + 10981 agtggattca aatttaaatt tgaaacaaaa acaaagactt caaatttact ttatgtcaat + 11041 tataaaacga agtatctttt taaccttgtt attaaaaatc tagttaaaag aaaagcaaac + 11101 agtctagaaa aagaatttca agagaaggga ttttgatgaa atatgtcagg aagtaaaaca + 11161 aatcatcaat tttttctgaa ggaattcata acaaaattaa ctacactgta taagactgta + 11221 ttcaagtgga gtgtgcttgt atgaaagtac ttaaaaacta cgcttacaat ctttcatatc + 11281 agttactaat cataatctta ccgattatta ccactcccta cgttactagg atttttagtt + 11341 cggataatct agggacttat ggttatttta actcaattgt aacctatttt cttttgctgg + 11401 ctactttagg aataggaaat tatggaacaa aagagatttc aggtaatagg aaagctatcc + 11461 atcagaattt ttggggtatt tatagtatac aactgggagc atctctattc tccactttcc + 11521 tttatgttat tgtctgtcta attttaccag ctatgcaaaa tactgtagcc tatattttag + 11581 gcttaagttt gttttctaaa ggtttagata tttcttggtt atttcaaggt ttagaggatt + 11641 ttcggaaaat tacagtaaga aatataactg tgaaagtcat tgggataacc tcgattttct + 11701 tatttgtaaa atcagctagc gacctctacc tttatgtttt tcttttaacg atatttgagt + 11761 tattagggca acttagtatg tgggtaccag ctcgggaatt tattgggaaa ccgcactttg + 11821 actggttgta tgctaaacaa catttgaagc cagttatctt attattttta ccacaggtcg + 11881 ctatatcgct ttatgtgact ttagatagta ctatgcttgg ttctctagcc tcaataagag + 11941 atgttggaat ttatgatcaa tctctgaaac ttgtcaaaat attattaaca ttagtaactt + 12001 cattaggaag tgtcatgttg cctagagttt caaatctttt atcctcaggg gatcataaag + 12061 cagtcaacaa aatgcatgag atatcatttt taatttataa tttggttatt ttccccatta + 12121 tggcaggaat gctaattgta aatgatgact ttgtaacctt tttcctcggg caagattttc + 12181 aagaggcacg ttatgcgata gcaattatga tttttagaat gttctttatt ggttggacca + 12241 atattatggg gattcaaatt ttgatacctc ataataaaaa taaagaattt atgctgtcaa + 12301 caataattcc tgctattgtt agtgtaggct taaatcttct cttgcttcca aagctgggct + 12361 atataggagc agcaattgtt tctgtcttaa cagaggcgct 
agtatgggct attcaattgt + 12421 actatactcg tacatactta aaagatgttc cgattattag aactatgata aaaattattc + 12481 tagcctcagc tatcatgtat agcgttttgc tagtttctaa gacatacata catttttccc + 12541 caactataaa tgttttggta tttgtggtgt taggtggaat catttatctt ttttcagttt + 12601 tatctctaaa agtgatagat gtgatagaat taaaacaagt aattaggaaa aattagaatg + 12661 cataaattta aagatattaa cttggattta ctaaaagtaa ttgcatgtgt tggagttgtt + 12721 ttactccata cagagatggg gggatttaaa gagacaggtt catggaattt ttcgacatat + 12781 ttatactact taggaaccta ttctatccct ctatttttta tagttaatgg ttatttattg + 12841 ttagggaaga aagagattac ctattcctac atattacaga aagtaaaatg gattctaata + 12901 acagtgctgt catggaccct tatagtttgg ctatttaaac gggatttttc agttaatcca + 12961 ataaaaaaac ttataggatc attggtgcaa aaaggttatt tctttcagtt ttggtttttt + 13021 ggtgcgctta tacttattta tatatgtctc cccgttttga aacaatttct taattcaaaa + 13081 agaagttatt tatacttttt atctgtattg ctagttattg gtttgatttt tgagttaaca + 13141 aatattgtgc ttcaaatgcc aatacaagca tatgtaatac aaacttttag attatggact + 13201 tggcttttct attatatttt agggggcttt atatctcagt ttgataaaaa taccatcaaa + 13261 aatgggttta agagatggat gaaagtaatt gcagtacttt tattattagt ttcgccattt + 13321 atattatttt tcatagcaaa gaccacttac tataattttt ttgctgaata tttttatgat + 13381 attttattag taaaagttgt aagcgtaggg atttttctaa ctattttctc acttgtattg + 13441 aatgaaaata gcaacaaatg gattattttt ctttctaatc aaactatggg tatctttata + 13501 atacacactt atattatgaa ggtatgggaa aaactatttg gttttagttt tatgggttca + 13561 tatttacttt ttgctatatt tactttaagt gttagtttta tcattgttgg aatgttaatg + 13621 aaaattccgt attttaatcg aatcgtcaaa ttataaaaag gagaaaaaat gtacgattat + 13681 cttatcgttg gtgctggtct ctttggtgca gtctttgccc atgaagcagc cttaaaagga + 13741 aaaaaagtaa aagttattga aaaacgaaat catatcgcgg gtaatatcta tactcgtgaa + 13801 gaggaaggaa ttcaggttca tcaatatggt gctcatatct tccatacttc tgataaggag + 13861 atctgggagt atgtaaatca gtttgcagag tttaaccgtt ataccaattc tcctgttgca + 13921 aactataagg gagagattta taacttacct tttaatatga ataccttcaa taaactctgg + 13981 ggagttgtga cgccagcaga agcacaagtt aagattgagg 
aacaacgtgc tattttaaat + 14041 ggtaaaactc ctgaaaattt ggaagaacaa gcgatttctc ttgtaggtac agacatctac + 14101 gaaaaattaa tcaaagacta tacagagaaa cagtggggca aaccaactac tgaacttcca + 14161 gcctttatta ttcgccgttt gccagtacgt ctgacctatg ataacaacta ttttaacgat + 14221 acctatcaag ggattccaat tggtggatac actcaaatag ttgaaaaaat gttggatcat + 14281 gaaaatattg atgtagaaac aaatgttgat ttctttgtga ataaagagca atatctgaaa + 14341 gattttccta agattgtctt tactggtatg attgatgaat tctttgacta taagttgggc + 14401 gaactagagt accgtagtct tcgttttgaa aatgagacct tggatatgga aaattaccaa + 14461 ggaaatgcag ttgtgaacta tacggatgca gaaaccccat atactcgcat tattgaacac + 14521 aaacattttg agtttgggag tcaagcaaag actatcatta ctaaagaaca ttctaaaaca + 14581 tgggaaaaag gtgatgagcc ttattatcca gttaataatg atcgtaataa tcatttgtat + 14641 aaatcatata aaaaacttgc tgatgagcaa gggaatgtta tctttggtgg ccgcttagga + 14701 cactatcgtt attacgatat gcaccaagta attggagcag ctttgcagtg cgtgagaaat + 14761 gagttaaatt aatactcaat gaaaattaaa gagcaaacta ggaagctagc cgcaggttgc + 14821 tcaaaacact gttttgaggt tgcagatgga agctgacgcg gtttgaagag attttcgaag + 14881 agtataaaca agtaaaactg actaccagtt attatttaga aatagtatta aaaattcctt + 14941 gactatgtga tatagttgag ggatttttaa atgatattca tattttttgc aaagatgttg + 15001 tttgaaaaat aattttcaaa aattctgaaa attctgttga caactttctg aaaagagtct + 15061 ataatggaga gaaagtttta aaggagaaaa tgatgaaaag ttcaaaacta cttgcccttg + 15121 cgggcgtgac attattg +// + diff --git a/public/res/serotype_genbank/serotype_36A.gb b/public/res/serotype_genbank/serotype_36A.gb new file mode 100644 index 0000000..41ce297 --- /dev/null +++ b/public/res/serotype_genbank/serotype_36A.gb @@ -0,0 +1,804 @@ +LOCUS CR931708 19113 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 1095/39 (serotype 36). +ACCESSION CR931708 +VERSION CR931708.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. 
+REFERENCE 1 (bases 1 to 19113) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 19113) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..19113 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="1095/39" + /db_xref="taxon:1313" + gene <1..137 + /gene="dexB" + /locus_tag="SPC36_0001" + CDS <1..137 + /gene="dexB" + /locus_tag="SPC36_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI34356.1" + /db_xref="UniProtKB/TrEMBL:Q4K2K9" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVEMTD + " + gene complement(284..1659) + /gene="tnp" + /locus_tag="SPC36_0002" + /pseudo + CDS complement(join(284..400,400..1659)) + /gene="tnp" + /locus_tag="SPC36_0002" + /note="member of homology group 17" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1202 transposase" + misc_feature complement(676..1176) + /gene="tnp" + /locus_tag="SPC36_0002" + /note="HMMPfam hit to PF00665, Integrase core domain, + score 5.7e-19" + /pseudo + gene 1835..3280 + /gene="wzg" + /locus_tag="SPC36_0003" + CDS 1835..3280 + /gene="wzg" + /locus_tag="SPC36_0003" + /note="member of homology 
group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI34358.1" + /db_xref="GOA:Q4JZ87" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4JZ87" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSDIKNVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VDQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAIIQKLTST + EVLKNYSSILQGLQDSLQTNMPIETMIDLVNTQLESGGNYKVNSQDLKGTGRMDLPSY + AMPDSNLYVMEVDDSSLAVVKAAIQDVMEGR" + misc_feature 1835..1951 + /gene="wzg" + /locus_tag="SPC36_0003" + /note="Signal peptide predicted for SPC1724 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 39 and 40" + misc_feature 2039..2386 + /gene="wzg" + /locus_tag="SPC36_0003" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 4.8e-65" + misc_feature 2564..3007 + /gene="wzg" + /locus_tag="SPC36_0003" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 3.5e-70" + gene 3282..4013 + /gene="wzh" + /locus_tag="SPC36_0004" + CDS 3282..4013 + /gene="wzh" + /locus_tag="SPC36_0004" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34359.1" + /db_xref="GOA:Q4JZ86" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4JZ86" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTLDALEKLEKKEIPTLNDS + RYALIEFSMHTSYREIHTGLSNILMLGITPVIAHIERYDALENNEKRVCELIDMGCYT + QINSYHVLKPKFFGEKYKFMKKRARYFLERDLVHVVASDMHNLDSRPPHMAEAYDLVT + 
QKYGEAKAQELFVDNPRKIIMDQLI" + misc_feature 3285..3893 + /gene="wzh" + /locus_tag="SPC36_0004" + /note="HMMPfam hit to PF02811, PHP domain, score 7.1e-37" + gene 4022..4714 + /gene="wzd" + /locus_tag="SPC36_0005" + CDS 4022..4714 + /gene="wzd" + /locus_tag="SPC36_0005" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34360.1" + /db_xref="GOA:Q4JZ85" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4JZ85" + /translation="MKEQNTLEIDVLQLFRILWKRKLVILLVAIITSSVAFAYSTFVI + KPEFTSTTRIYVVNRNQEEKSGLTNQDLQAGSYLVKDYREIILSQDVLEEVISDLKLD + LTPKGLANKIKVTVPVDTRIVSVSVNDRVPEEASRIANSLREVAAQKIISITRVSDVT + TLEEARPAISPSLPNIKRNTLIGFLAGGIGTSVIVFLLELLDTHVKRPEDIEDTLQMT + LLGVVPNLSKLK" + misc_feature 4040..4456 + /gene="wzd" + /locus_tag="SPC36_0005" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 1.3e-53" + misc_feature 4562..4639 + /gene="wzd" + /locus_tag="SPC36_0005" + /note="PS00217 Sugar transport proteins signature 2." 
+ gene 4724..5407 + /gene="wze" + /locus_tag="SPC36_0006" + CDS 4724..5407 + /gene="wze" + /locus_tag="SPC36_0006" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34361.1" + /db_xref="GOA:Q4JZ84" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4JZ84" + /translation="MPTLEIAQKKLEFIKKAEEYYNALCTNIQLSGDKLKVISVTSVN + PGEGKTTTSVNIARSFARAGYKTLLIDGDTRNSVISGVFKSREKITGLTEFLSGTADL + SHGLCDTNIENLFVIQSGSVSPNPTALLQSKNFNDMIETLRKYFAYIIVDTAPIGIVI + DAAIITQKCDASILVTATGEVNKRDVQKAKQQLEQTGKLFLGVVLNKLDISVDKYGVY + GSYGNYGKK" + gene 5423..6790 + /gene="wchA" + /locus_tag="SPC36_0007" + CDS 5423..6790 + /gene="wchA" + /locus_tag="SPC36_0007" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI34362.1" + /db_xref="GOA:Q4JZ83" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4JZ83" + /translation="MDEKGLKIFLAVLQSIIVILLVYFLSFVRETELERSSMVILYLL + HFFVFYFSSYGNNFFKRGYLVEFNSTIRYIFFFAIAISVLNFFIAERFSISRRGMVYF + LTLEGISLYLLNFLVKKYWKHVFFNLKNSKKILLLTVTKNMEKVLDKLLESDELSWKL + VAVSVLDKSDFQHDKIPVIEKEKIIEFATHEVVDEVFVNLPGESYDIGEIISRFETMG + IDVTVNLKAFDKNLGRNKQIHEMEGLNVVTFSTNFYKTSHVISKRILDICGATIGLVL + FAIASLVLVPLIRKDGGPAIFAQTRIGKNGRHFTFYKFRSMRIDAEAIKEQLMDQNTM + QGGMFKMDNDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSGRSKIIDFDDVVKLDVAYIDNWTIWKDIEILLKTVKVVFM + RDGAK" + misc_feature 6206..6787 + /gene="wchA" + /locus_tag="SPC36_0007" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 1.2e-149" + gene 6795..7580 + /gene="wcrO" + /locus_tag="SPC36_0008" + CDS 6795..7580 + /gene="wcrO" + /locus_tag="SPC36_0008" + /note="member of homology group 46" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + 
/protein_id="CAI34363.1" + /db_xref="GOA:Q4JZ82" + /db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4JZ82" + /translation="MNKVREIQLGELSLLKNFIAICSKYNLRYYALGGTLLGVIRHKG + FIPWDDDMDLGMPRKDYEKFLSICNKELPEHVVLRLHDDNLGNTSIMDTSLQIPFGDE + LCSPFIDIFPLDGYPDDRFHYFIHTNKIKFYRALSKISVIDRLHDRDRGSFENAIVSI + SKVLKLNKLLKTATINNKLQNLIKQYDFETSSIVGNVLGSYRERELARKEVFGEPQLL + EFENLEISCHANPDEYLIKIYGDYMKLPKEAERKGHFESTWGD" + misc_feature 6858..7514 + /gene="wcrO" + /locus_tag="SPC36_0008" + /note="HMMPfam hit to PF04991, LICD Protein Family, score + 9.6e-43" + gene 7582..8322 + /gene="wchO" + /locus_tag="SPC36_0009" + CDS 7582..8322 + /gene="wchO" + /locus_tag="SPC36_0009" + /note="member of homology group 33" + /codon_start=1 + /transl_table=11 + /product="putative WecB-family glycosyl transferase" + /protein_id="CAI34364.1" + /db_xref="GOA:Q4JZ81" + /db_xref="InterPro:IPR004629" + /db_xref="UniProtKB/TrEMBL:Q4JZ81" + /translation="MNSFDLMGVRIDPLTMDETVEAVENFVIEKRPLHLMGVNADKIN + QCQLDDVIKKIVNDSEIINADGASVVLASRFLGYQVPERVAGIDLMQRLLKLADEKSY + SVYFFGAKEEVLQDMLQNFKEEYPNLRVAGHRNGYFSEEDEQDIQEDIREKNPDFVFV + GITSPKKEYIIQKFMGNEVNSIFMGVGGSFDVLSGHIQRAPLWMQKSNLEWLFRVANE + PKRLFKRYFVGNITFIKRVLDEKQKTKK" + misc_feature 7741..8256 + /gene="wchO" + /locus_tag="SPC36_0009" + /note="HMMPfam hit to PF03808, Glycosyl transferase + WecB/TagA/CpsF f, score 9.4e-93" + gene 8297..9382 + /gene="wcjA" + /locus_tag="SPC36_0010" + CDS 8297..9382 + /gene="wcjA" + /locus_tag="SPC36_0010" + /note="member of homology group 66" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34365.1" + /db_xref="GOA:Q4JZ80" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4JZ80" + /translation="MRNKKRKNNILHISRTMDIGGAERIVYQLSSDLQDEFDSVHIAS + TGGLWERELAAQGIIHHKIQDIDSKNPFTVLKLIISIYQIINNNDITLVHTHHRMAAF + YIRLLKLINPKLIHVYTAHNVFKDKLSLYRFSLKNAYSIAVSQAVNKNLKDDVGITDS + TVIYNGVILKQTNKQVDEIMKFDGIKLGCIARLSEQKGLNYLIDAMSLISKENIHLFI + 
VGDGELRTELENKVKDLNLEEKVIFFGYRQDIVECINSFDFCVLPSVFEGFGLVAIEA + FMNGKTMIATDISGLNEVVTKENGVLVPLKDARALASAIEGLSTDLQLRTKLATQAKK + DYEEKFSYPLFLENYRKLYQKLMGDPK" + misc_feature 8804..9301 + /gene="wcjA" + /locus_tag="SPC36_0010" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 2.1e-43" + gene 9379..10473 + /gene="mnaA" + /locus_tag="SPC36_0011" + CDS 9379..10473 + /gene="mnaA" + /locus_tag="SPC36_0011" + /EC_number="5.1.3.14" + /note="member of homology group 23" + /codon_start=1 + /transl_table=11 + /product="UDP-N-acetylglucosamine-2-epimerase MnaA" + /protein_id="CAI34366.1" + /db_xref="GOA:Q4JZ79" + /db_xref="InterPro:IPR003331" + /db_xref="UniProtKB/TrEMBL:Q4JZ79" + /translation="MKKVMLVFGTRPEAIKMCPLVNELKKNNSIKILVCVTGQHKEML + EQVLDVFKVVPDYDLGIMKTNQTLFTITTSILDKIQAVLEQEKPDIVLVHGDTTTTFA + TALAAFYMGIKVGHVEAGLRTYNLQSPFPEEFNRQTTSIIADFNFAPTEVAKENLLKE + GRENIYVTGNTVIDALKTTVQDYYEHPILEWAKDSKLIMLTAHRRENLGQPMENMFNA + VNRILNEFEDVKVVYPIHKNPKVRELASKVFGDNERMQIIEPLEVIDFHNFMNQSYMI + LTDSGGVQEEAPSLGKPVLVMRDTTERPEGIAAGTLKLVGTEDENIYRNFKLLLENEE + EYNKMSKASNPYGDGTACQQIVEVIMKGLV" + misc_feature 9442..10458 + /gene="mnaA" + /locus_tag="SPC36_0011" + /note="HMMPfam hit to PF02350, UDP-N-acetylglucosamine + 2-epimerase, score 1.9e-183" + gene 10473..11438 + /gene="wciF" + /locus_tag="SPC36_0012" + CDS 10473..11438 + /gene="wciF" + /locus_tag="SPC36_0012" + /note="member of homology group 25" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34367.1" + /db_xref="GOA:Q4JZ78" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JZ78" + /translation="MGKVSIVVPVYNVEDYLKYCIDSLINQSYKDIEIILVDDGSTDD + SGRICDKYAQEDDRIRVLHIENGGLSNARNTGVKFASAEWIIFIDSDDYYDRRTVEYL + VQLQKKYAVDLVATSVIEVRDFQSEDFLGSLTNIDSLKLDRYTALKEMFYGNIVGTHP + GGKLYKKEILMKFPFPEGMLYEDLAVSFEHIGACNEIAVGCINLYKYYRRPGSIVNSS + YSDKFLDFYKAIEMNREFVQRDYPNDKEMNKALTVRYVFKGLHVVHAMLSSEMYSDVN + KIRKEYTRYFNDIIPNPNITGKNKVKYLMLLVSPKLYEKIREKMG" + misc_feature 10485..10985 + /gene="wciF" 
+ /locus_tag="SPC36_0012" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 9.3e-47" + gene 11445..12860 + /gene="wzx" + /locus_tag="SPC36_0013" + CDS 11445..12860 + /gene="wzx" + /locus_tag="SPC36_0013" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI34368.1" + /db_xref="GOA:Q4JZ77" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4JZ77" + /translation="MKVLKNYAYNLSYQLLVIILPIITTPYVTRVFSSNDLGTFGYFN + SIVAYFIFLATLGVANYGTKEISAHRNNIPNNFWGIYTLQFTATCISIFLYIGLCFSF + SFMQNPVAYILVLSLLSRGLDITWLFQGLEDFRKITVRNITVKLIGVISIFLFIKSQN + DLYLYVFLLTIFEFLGQLSMWLPALEFIGKPQFDFNYAKKHLKPVILLFLPQIAISLY + VTLNRTMLGALASTTDVGIYDQSLKLVNILLTLVTSLGSVMLPRVSNLLSTGDKKSVN + RMNQLSFFIYNLVIFPTIAGMLIINNDFVKFFLGNDFQEAKYAIAIMIFRMFFIGWTN + IMGIQILIPHNKNKEFLTSTTVPAIISVGLNLLLLPEFGYIGAAIVSVLTEIFVWVIQ + LYFTRKYLKDVPIFKSTVKIFSASILMYVALSFLKSILTFTPIVNVVVCAIVGAILYG + LLILIFKVVSLKEIKEQLLNN" + misc_feature 11451..12245 + /gene="wzx" + /locus_tag="SPC36_0013" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 1.7e-62" + gene 12996..14192 + /gene="wzy" + /locus_tag="SPC36_0014" + CDS 12996..14192 + /gene="wzy" + /locus_tag="SPC36_0014" + /note="member of homology group 254" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI34369.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ76" + /translation="MFILYYSLLNNNMIKIKFENLLVSIVVSVVIFFNTISTTMLDRT + FFQAKANYLLLVVLLLGLRFMFPTRISFKYLIFSSLLLLSGILVYFQTGKLNFLVYSA + LLVLLVNVDMKVVLKTYLIVAGILVLSVFLLSLLGAVPNLQYNREGVIRNSFGFIYPT + DFASHCFYLFLAFSYLLKDKFIWIRSLIGVLLSFFIIKYCDARLNALSIILATIIFIF + FYFNEDKKFRIYSISPYSVVLCSSIMMYLSYIFSWGSPFLVSINKLITGRLALGKNAF + NTFDVHLFGTRDVLFKGSGGKTEAVIDYNYVDSSYVQMLFTYGVIPLVLLICMYVVIS + REQYKQGQYLYVVILSLVALNCMIEAFWFVPTYNIFMFLLFTKNTFLNKSLNNFNPLD + KTELLN" + gene 14354..15451 + /gene="glf" + /locus_tag="SPC36_0015" + CDS 14354..15451 + /gene="glf" + /locus_tag="SPC36_0015" + 
/EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI34370.1" + /db_xref="GOA:Q4JZ75" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR006076" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JZ75" + /translation="MYDYLIVGAGLSGAIFAYEATKRGKKVKVIDKRDHIGGNIYCEN + IEGVNVHKYGAHIFHTSNKKVWDYVNQFAEFNNYINSPVANYKGSLYNLPFNMNTFYA + MWGIKTPQEVKNKIAEQTAHMKDVEPKNLEEQAIKLIGPDIYEKLIKGYTEKQWGRSA + TDLPPFIIKRLPVRLTFDNNYFNDRYQGIPIGGYNVIIENMLKDVEVELGVDFFANRQ + ELEASAEKVVFTGMIDQYFDYKHGELEYRSLRFEHEVLDKENYQGNAVVNYTEREIPY + TRIIEHKHFEYGTQDKTVITREYPADWKRGDEPYYPINDERNNAMFAKYQEEAVQNDK + VIFCGRLADYKYYDMHVVIERALNVVEEEFK" + misc_feature 14789..15391 + /gene="glf" + /locus_tag="SPC36_0015" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 1.1e-135" + gene 15476..16528 + /gene="wcrH" + /locus_tag="SPC36_0016" + CDS 15476..16528 + /gene="wcrH" + /locus_tag="SPC36_0016" + /note="member of homology group 51" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34371.1" + /db_xref="GOA:Q4JZ74" + /db_xref="InterPro:IPR016503" + /db_xref="UniProtKB/TrEMBL:Q4JZ74" + /translation="MKYYLKEEFLTDSGVRNAGNKARNDVEEIVVREGYSPLLLMVDD + WYQMGTIRAQRHKAKALSKAISKLKEGDQLLIQFPMLHHSFFTTHLVKRMQCKGVKVH + FIIHDLEVLRYANLDTVPLKHKIRVHLQESSLLKQADGLIAHNPVMKSVLVDKGISEK + KIVSLGIFDYLIPNYQDKEDLSKEGAIIVAGNLVQEKAGYLYELPTRPAYNLYGVGFD + EARKLSNETYFGSFLPDELPSALEGSFGLVWDGGSSKTCSGVFGEYLRYNNSHKASLY + LASGFPIIVWGQSALANFVLEKECGISVESLLDLEEVLEHLSQEEYQDLVKNAKSVGQ + KIREGSYLLSALQALN" + gene 16621..17221 + /gene="tnp" + /locus_tag="SPC36_0017" + /pseudo + CDS join(16621..16890,16871..17221) + /gene="tnp" + /locus_tag="SPC36_0017" + /note="member of homology group 31" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1671 transposase" + misc_feature 16886..17212 + /gene="tnp" + /locus_tag="SPC36_0017" + 
/note="HMMPfam hit to PF05717, IS66 Orf2 like protein, + score 3.3e-54" + /pseudo + gene 17434..18870 + /gene="tnp" + /locus_tag="SPC36_0018" + /pseudo + CDS join(17434..18438,18438..18638,18637..18870) + /gene="tnp" + /locus_tag="SPC36_0018" + /note="member of homology group 12" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1670 transposase" + misc_feature 17611..18195 + /gene="tnp" + /locus_tag="SPC36_0018" + /note="HMMPfam hit to PF03050, Transposase IS66 family, + score 3.5e-10" + /pseudo + gene 19066..>19113 + /gene="aliA" + /locus_tag="SPC36_0019" + CDS 19066..>19113 + /gene="aliA" + /locus_tag="SPC36_0019" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34374.1" + /db_xref="UniProtKB/TrEMBL:Q4K1C2" + /translation="MMKSSKLFALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaaatgac tgactagaat gagcaaacct caagtttttg aagcttgagg ttttttacta + 181 tagtggattg aaactagaat agtgcacctc tacttctaaa acattgttag aaatcgattt + 241 gattgttctg aacgatttgt cctattctta tttcgtttta ctatacttgt agttgaggag + 301 aattaagctc ctcactagta aactcttcat aatccttttt atttttagat gtgagtttcc + 361 acggatgggt ttgtggaggg atatacttgt gtctttcttt ttttgttctg gttcttgttc + 421 aaagtttttc gaatagagtt catgatctag tagctccttt gtgcgataga ttttgtcagc + 481 gatattgagg tagatgtctc cgtcaaatgc ttttataact aatgctttcg tctttctgat + 541 gaaatagact tcttttcctt gttcggtagg gatatagtaa cgattttgga atcggatatg + 601 gtgtctacta tcgacgactc tctccgccag tctagccaga atgagatttc gttcagaggg + 661 cttaggagcc tcctcaaaaa cagagagttt tgtcttgttt acaaactgtt cattaaaggt + 721 ttggatgtag gaaagcagga aggtattgac ttcttccaag gtatgaatct tgtttcgttc + 781 cagttcgata ggcaggcgag attgtagtgt ctgattgagt ctttcgactc tccctttagc + 841 ttgagggata gaggttgtct ccagaagaat ccccagttgg tgacaggcgt atccgaattg + 901 tgtatgggtg tcgtcctcca ttttcttaga gttggaggct taataggtaa agaccgttat + 961 cttatctgtt ttaatttgaa ggggaacgcc gtgattgcct aaaatttgtt 
cgaggacatg + 1021 atagtaagca ttcagggtct tttgtttatc aaaataagcg cctaggatat tgccagaagc + 1081 atcatcaatg gctaagtgta agttagatgt ttgtgctcca aaccaggcat gagggctggc + 1141 atccatttga atgagttcac cagcaaattt ctttctgggt ctactaggat gtactttttt + 1201 agggtcttca aggaagtttt cagccgtcgg taagattgga ttatctaggg ggtgcttggg + 1261 gttcagttta gcttgttttc ttactctctt ctttgccttt ctatgagact taggcgacag + 1321 gatgttttcc ttatagagta tttttctaac agttgtatca gagagctgaa ttccctcttc + 1381 ttcagctagt aattcacaga aatgaaggac atttggttta tatgtttcat aggagaggta + 1441 tttctttagg atacattcgt tgatttcatc agggattgca tgctttggtt ttcgatttct + 1501 gtttccgtgt ctgaaggcct cttttccttt ttgttgatag gctagtagca gacgattgat + 1561 ttgtctttca gaaagattga gctcgacaca ggcccgtttc tttgttttct ttccttgggc + 1621 tatagctttt atcacaagat attttttcgt ttcattcata ttcagttgga tctttttcat + 1681 atgactattc tacaaaatgg gacattttca cgttcgattt actaaagaca ttatcacatt + 1741 cgaattacac aagatgcaga tagtaaaaaa aaatatagac attaccgtaa aaaagtgata + 1801 taattgtatg atgttcaagg tataggtgtt aatcatgagt agacgtttta aaaaatcacg + 1861 ttcacagaaa gtgaagcgaa gtgttaatat cgttttgctg actatttatt tattgttagt + 1921 ttgtttttta ttgttcttaa tctttaagta caatatcctt gcttttagat atcttaacct + 1981 agtggtaact gcgttagtcc tactagttgc cttggtaggg ctactcttga ttatctataa + 2041 aaaagctgaa aagtttacta tttttctgtt ggtgttctct atccttgtca gctctgtgtc + 2101 gctctttgca gtacagcagt ttgttggact gaccaatcgt ttaaatgcga cttctaatta + 2161 ctcagaatat tcaatcagtg tcgctgtttt agcagatagt gatatcaaaa atgttacgca + 2221 actgacgagt gtgacagcac cgactgggac tgataatgaa aatattcaaa aactactagc + 2281 tgatattaag tcaagtcaga ataccgattt gacggtcgac cagagttcgt cttacttggc + 2341 agcttacaag agtttgattg caggggagac taaggccatt gtcttaaata gtgtctttga + 2401 aaatatcatc gagtcagagt atccagacta cgcatcgaag ataaaaaaga tttataccaa + 2461 gggattcact aaaaaagtag aagctcctaa gacgtctaag aatcagtctt tcaatatcta + 2521 tgttagtgga attgacacct atggtcctat tagttcggtg tcgcgatcag atgtcaatat + 2581 cctgatgact gtcaatcgag ataccaagaa aatcctcttg accacaacgc cacgtgatgc + 2641 ctatgtacca 
atagcagatg gtggaaataa tcaaaaagat aaattaaccc atgcgggcat + 2701 ttatggagtt gattcgtcca ttcacacctt agaaaatctc tatggagtgg atatcaatta + 2761 ctatgtgcga ttgaacttca cttctttctt gaaaatgatt gacttattgg gaggggtaga + 2821 tgttcataat gatcaagagt tttcagctct acatgggaag ttccatttcc cagtagggaa + 2881 tgtccatcta gactctgagc aggctctagg ttttgtacgt gaacgctact cactagccga + 2941 tggagaccgt gaccgtggtc gcaaccaaca aaaggtcatt gtagcaatta ttcagaagtt + 3001 aacttctaca gaggttttga aaaactatag tagtattctc caaggattgc aggattctct + 3061 tcaaacaaat atgccgattg agactatgat agatttagtg aatactcagt tggaaagtgg + 3121 ggggaattat aaagtaaatt ctcaagattt aaaagggaca ggtcggatgg atcttccttc + 3181 ttatgcaatg ccagacagta acctctatgt gatggaagta gatgatagta gtttagctgt + 3241 agttaaagca gctatacagg atgtgatgga gggtagatga aatgatagac atccattcgc + 3301 atatcgtttt tgatgtagat gacggtccca agtcaagaga ggaaagcaag gctctcttgg + 3361 cagaatccta caggcagggg gtgcgaacca ttgtctctac ctctcaccgt cgcaagggca + 3421 tgtttgaaac tccggaagag aagatagcag aaaactttct tcaggttcgg gaaattgcaa + 3481 aagaagtagc agatgattta gtcattgctt atggcgcaga gatatactat actctggatg + 3541 ctctagaaaa gctagaaaaa aaagaaattc ctacccttaa tgatagtcgt tatgctttga + 3601 ttgagtttag catgcatact tcctatcgtg agattcatac gggattgagc aatattttga + 3661 tgttgggaat cacgccagta attgctcata ttgaacgtta tgatgcttta gagaataatg + 3721 agaaacgtgt ttgtgaactg attgatatgg ggtgctatac tcagataaat agttatcatg + 3781 ttttaaaacc taagttcttt ggtgaaaaat ataaattcat gaaaaagaga gctcggtatt + 3841 ttttggaacg tgatttagtt catgtagttg caagtgacat gcacaattta gacagtagac + 3901 ctcctcatat ggcagaagca tatgaccttg ttacccaaaa atacggagaa gcgaaggctc + 3961 aggaactttt tgtagataat cccagaaaaa ttataatgga tcaattaatt taggagaaaa + 4021 tatgaaggaa caaaacactt tggaaatcga tgtattgcaa ctattcagaa ttttatggaa + 4081 aagaaagttg gtcattttat tagtggcaat tataacttct tcagttgctt ttgcctacag + 4141 tacttttgtt atcaaacctg agtttactag tacgactcgg atttatgtag ttaaccgtaa + 4201 tcaggaagag aagtctggtt taaccaatca agacttgcag gcaggatcat acttggttaa + 4261 agactatcgt gaaattatcc tatcgcagga 
tgttttggag gaagttattt ctgatttgaa + 4321 attagatttg acgccaaaag gtttggctaa taaaattaaa gtaacagtac cagttgatac + 4381 ccgtattgtc tctgtttcag ttaatgatcg agttcctgaa gaggcaagcc gtatcgctaa + 4441 ctctttgaga gaagtagctg ctcaaaaaat tatcagtatt actcgtgttt ctgatgtgac + 4501 aacactggag gaggcaagac cggcgatatc accatctttg ccaaatatta aacgcaatac + 4561 actaattggt tttttggcag gggggattgg aactagtgtt atagtttttc ttcttgaact + 4621 tttggacact catgtgaaac gtccggaaga tatcgaagat acactgcaga tgacactttt + 4681 gggagttgta ccaaacttga gtaagttgaa ataggagaga ggaatgccga cattagaaat + 4741 agcacaaaaa aaactggagt tcattaagaa ggcagaagaa tattacaatg ccttgtgtac + 4801 aaatatacag ttgagcggag ataaactaaa agtaatttcc gttacttctg ttaaccctgg + 4861 ggaaggaaaa acaactactt ccgtaaatat agcaaggtcg tttgcgcgtg caggctataa + 4921 aactcttttg atcgatggcg atactcgaaa ttcagttata tcaggagttt ttaaatcgcg + 4981 tgaaaaaatt acagggctaa cagaattttt atctgggaca gctgatttat ctcacggttt + 5041 atgtgataca aatattgaaa atttatttgt aattcaatcg ggatctgtat caccaaaccc + 5101 tacagccttg ttacaaagta aaaattttaa tgatatgatt gaaacattgc gtaaatattt + 5161 tgcttatatc attgttgata cagcacctat tggaattgtt attgatgcgg caattatcac + 5221 tcaaaagtgt gatgcgtcca tcttggtaac agcaacaggt gaggtgaata aacgtgatgt + 5281 ccaaaaagcg aaacaacaat tagaacaaac agggaaactg ttcctaggag ttgttttaaa + 5341 taaattggat atctcggttg ataagtatgg agtttacggt tcctatggaa attatggtaa + 5401 aaaataactt aggaaatatt ttatggatga aaaaggattg aaaatttttc tggcagtatt + 5461 acagagtata attgtcattt tattggttta ttttcttagc tttgttagag agacagaact + 5521 tgaacgttct tcgatggtta tactatacct tctccacttt tttgtattct attttagttc + 5581 ctatggtaac aattttttta aaagagggta cttagttgag tttaatagta ctataagata + 5641 tatttttttc tttgcaatag ctataagtgt attaaacttt tttatagcgg aacggtttag + 5701 tatctctaga agaggaatgg tatacttctt aactttagaa ggaatatcct tatacttgtt + 5761 aaatttctta gtaaagaaat attggaagca tgtgtttttt aatctaaaaa atagcaagaa + 5821 aattttactg ttaacagtaa cgaaaaatat ggaaaaagtt cttgataaat tgctagaatc + 5881 tgatgaactt tcatggaaat tggtagcagt aagtgttttg gataaatctg 
attttcaaca + 5941 tgataaaata cctgtaattg aaaaggaaaa aattattgaa tttgcaacgc atgaagttgt + 6001 ggatgaggtg tttgtcaatc ttccaggaga gagctacgat attggagaaa ttatctctag + 6061 gtttgagaca atggggatag atgtaactgt aaatcttaaa gcatttgata agaatttggg + 6121 tcgcaataaa caaattcatg agatggaagg attgaatgta gtcactttct ctacaaattt + 6181 ttataaaact agtcatgtga tttcaaagag aattctcgat atttgtggtg ccactattgg + 6241 ccttgttctt tttgctatag ctagtctagt tttagttcca ttgattcgta aagatggcgg + 6301 accagctatt tttgctcaaa ctcgtatagg gaaaaatggt cgacatttta ccttttataa + 6361 attccgttcg atgcggatcg atgctgaagc tatcaaagaa caattgatgg atcaaaatac + 6421 gatgcaaggt ggtatgttta agatggacaa tgatccgcgt atcacgaaaa ttggtcgttt + 6481 tataaggaag actagcttgg acgagttgcc acagttttat aatgttttaa agggagatat + 6541 gagtttagtt ggcacacggc caccaacagt ggacgaatat gagcactata ctccagaaca + 6601 gaaacgtcga ctcagcttta aacctggtat tacaggttta tggcaggtta gcggccgtag + 6661 taaaataatc gattttgacg atgttgtaaa attagatgtg gcttatattg ataattggac + 6721 aatctggaaa gatattgaaa ttttgcttaa aactgttaaa gttgtattta tgagagatgg + 6781 agcgaagtga ttttatgaat aaagtgaggg aaattcaact aggagaatta tctttattga + 6841 aaaactttat tgctatttgt agtaaatata atttaagata ttatgctttg ggaggaacat + 6901 tgctaggagt aattcgtcat aaaggattta ttccttggga tgatgatatg gatttaggaa + 6961 tgcctcgaaa agattatgaa aaatttttgt ctatttgtaa caaggaactt ccagaacatg + 7021 ttgttttgag acttcatgat gataatttag gtaatacctc tattatggat acatccttac + 7081 aaattccatt tggagatgaa ctatgtagtc cattcataga tattttccct ttggatggtt + 7141 atccagatga tcgttttcat tattttattc atacaaacaa aattaaattc tatcgtgcac + 7201 tttctaaaat ttcggtaatc gatcgtctac atgacagaga tcggggaagt tttgaaaatg + 7261 caattgtgag tatatcaaaa gttttgaaat taaataaact tttaaaaaca gccactatta + 7321 acaacaaatt acaaaatcta attaaacaat atgattttga aactagttca atagtaggga + 7381 atgtactagg ttcatacaga gaacgtgaac ttgctagaaa agaagtattc ggtgaaccac + 7441 aattactaga gtttgagaac ttagaaataa gttgccatgc taacccagat gaatatttaa + 7501 taaaaatata cggtgattac atgaagttac caaaagaagc tgaacgtaag ggccacttcg + 7561 agtctacatg 
gggagattaa tttgaatagt tttgatttaa tgggggtcag gattgacccc + 7621 ttaacaatgg atgaaacagt agaggcggtt gagaattttg tcattgaaaa acgtcctctt + 7681 catttaatgg gcgtaaacgc tgataagatt aatcaatgtc aattagatga cgtcattaaa + 7741 aaaatagtta acgattctga aattatcaat gcagatggtg catcagtagt tctagcctct + 7801 cgatttttgg gctaccaagt tccagagcga gttgctggaa ttgatttaat gcaaagatta + 7861 ttaaaattag cggatgagaa atcttattct gtgtatttct ttggtgctaa agaagaagtt + 7921 ttgcaggata tgttacaaaa tttcaaagaa gagtatccaa atctacgagt tgctggacat + 7981 cgtaatggtt atttttcgga ggaagatgag caagatattc aggaagatat tcgtgaaaag + 8041 aaccctgact ttgtatttgt tggaatcacc tctccgaaaa aagaatacat cattcaaaaa + 8101 tttatgggca atgaagtaaa ttccattttt atgggtgtag gtggtagttt tgacgtattg + 8161 tccggtcata ttcaacgagc accactttgg atgcaaaaat caaatctaga gtggttgttt + 8221 cgagtcgcta atgaaccaaa gcgtctcttt aaacgatatt ttgtggggaa tattaccttt + 8281 attaagcgag ttttagatga gaaacaaaaa acgaaaaaat aatattttac atatttcacg + 8341 aacaatggat attggtggcg ctgagaggat tgtgtaccag ttgagttctg atttgcaaga + 8401 tgagtttgat agtgtacaca ttgcttctac aggaggcctt tgggaacgag aattagcagc + 8461 ccaaggaatt atccatcata aaatccagga tatagacagc aaaaatcctt ttacagtgtt + 8521 gaagttgatt attagtatct atcaaattat taataataat gatatcactc tggtccatac + 8581 tcatcatcga atggctgctt tttatattcg tttattaaaa ctgattaatc ccaaattaat + 8641 ccacgtctat actgcccata atgttttcaa agataagttg tctttatata gattttcact + 8701 gaaaaatgcc tacagtattg cagttagtca agcagttaat aaaaatttga aagatgatgt + 8761 ggggattacc gacagtactg tcatctataa cggagtaatc ttaaagcaga caaataaaca + 8821 ggttgatgag attatgaagt ttgatggaat caaacttggt tgtattgcaa gattatctga + 8881 acaaaagggc ttgaactatc ttattgatgc gatgtctctg atttcaaaag aaaatattca + 8941 tttatttatc gttggtgatg gagagcttag aactgaacta gaaaataaag ttaaagatct + 9001 caatctagaa gagaaagtaa ttttttttgg ctatagacaa gatattgttg agtgtattaa + 9061 tagttttgat ttttgtgtct taccctcagt atttgaggga tttggcctag ttgctattga + 9121 agcatttatg aatggaaaaa caatgattgc aacagatatt tcaggattaa atgaagttgt + 9181 tacaaaagaa aatggtgtgt tggttccgct 
taaagatgct agagccttag cttctgctat + 9241 tgaggggctg tcgactgact tgcaacttag aacaaagtta gctactcagg ctaaaaaaga + 9301 ttatgaggag aaatttagtt atcctttgtt tctagagaat tatcgtaaat tgtatcaaaa + 9361 actaatggga gatccaaaat gaaaaaagta atgttagttt ttgggacgcg tccagaagca + 9421 ataaaaatgt gtcctttagt caatgagttg aagaaaaaca actcgataaa aatacttgtg + 9481 tgtgtaactg gtcaacataa agaaatgtta gaacaagttt tggatgtctt taaagttgtt + 9541 cctgattatg acttaggaat tatgaagaca aatcaaacat tatttacaat cacgacaagt + 9601 attttagata aaattcaagc ggttttagag caggagaaac cagatattgt tcttgttcat + 9661 ggagatacta caaccacttt tgcaacagct ttagctgcat tttacatggg aattaaagtt + 9721 ggacatgtag aagcaggatt gagaacttat aatcttcaaa gcccatttcc tgaggaattc + 9781 aatcgtcaga ctacttcaat tattgcggat ttcaattttg ctccgacaga ggtggctaaa + 9841 gagaatctct taaaagaggg aagagagaat atctatgtta ctgggaatac agttattgat + 9901 gccttgaaga caaccgttca agattattat gaacatccta ttttagagtg ggctaaggac + 9961 agtaaactaa tcatgctgac agcccatcgg cgtgaaaatc ttggccaacc tatggaaaat + 10021 atgtttaacg cagttaatcg tatcctgaat gagtttgaag atgttaaagt cgtgtatcct + 10081 attcataaga atcctaaagt tcgtgagcta gcaagtaaag tgtttggtga caatgaacgt + 10141 atgcaaatca ttgaaccact agaagtcatt gatttccata attttatgaa tcaaagctat + 10201 atgattttaa cagattcagg tggtgtacaa gaagaagcac cttctttagg taaaccagta + 10261 ttagtaatgc gtgatacaac tgaacgtcca gaggggattg ctgcaggaac cttgaaatta + 10321 gtaggaacag aagatgaaaa tatttatagg aattttaagc ttcttttgga aaatgaagag + 10381 gaatacaaca agatgagtaa ggcaagcaat ccttatgggg atggaacagc ttgtcaacag + 10441 attgtagaag ttatcatgaa gggattagta taatggggaa agtttcgatt gttgttccag + 10501 tatacaacgt tgaagattat ttgaaatatt gtattgatag cttaattaat caatcgtaca + 10561 aggatattga gattattttg gtagatgatg gctctactga tgattctgga agaatatgtg + 10621 ataagtatgc ccaagaagat gaccgtatta gagtcttgca tattgagaat ggaggccttt + 10681 ctaatgctcg aaatacgggt gtaaagtttg cttctgctga gtggataatt ttcattgatt + 10741 ctgatgatta ctatgatcgt agaactgttg agtatttagt gcaacttcaa aagaagtatg + 10801 ctgttgatct tgtggcaact tccgtcatcg aagttaggga 
cttccaaagt gaggattttt + 10861 taggttcatt aactaacata gattctttga aattagatcg ctatacagct ttgaaggaga + 10921 tgttttatgg aaatatagtt ggaactcatc cagggggaaa actatacaaa aaagaaatct + 10981 tgatgaagtt tccttttcca gagggtatgc tctatgaaga tttggctgtc tcttttgagc + 11041 atatcggagc atgcaatgaa attgccgtag gatgtatcaa tttatacaaa tattatcgaa + 11101 gacctggaag tattgtcaat tcttcttata gtgataaatt tttagacttc tataaggcta + 11161 tagagatgaa tagagaattt gttcagagag attatcctaa tgataaggaa atgaataaag + 11221 cacttactgt acgttatgtc tttaaggggt tacatgtagt acatgctatg cttagttcag + 11281 agatgtattc ggatgtcaat aaaatcagaa aagaatacac tagatacttc aacgatatta + 11341 ttcctaatcc aaatataaca gggaaaaata aagtgaaata cctgatgctt ttggtttctc + 11401 caaaactgta tgaaaaaatt agagagaaga tgggttaggt aagaatgaag gttttaaaaa + 11461 attatgcata taatctctct taccagctac tagtgataat tcttcctatt ataacaacac + 11521 cttatgtaac tagggtattt agttcaaatg atttaggaac ttttggctac tttaattcga + 11581 ttgttgctta ttttattttt ttagcaacat taggagtagc taattatggg acaaaagaga + 11641 tttcagctca tagaaataat atccctaata atttttgggg tatttatact ttgcagttta + 11701 ctgcgacttg tatatcgata tttctatata ttggtctgtg cttttcattt tcatttatgc + 11761 aaaatccagt agcttatata ttggtattat ctctattatc taggggatta gatattactt + 11821 ggctttttca aggactagaa gattttagga agataactgt tagaaatatc actgtcaaac + 11881 tcataggtgt tatttcaata tttttgttca taaagtctca gaatgattta tatctatatg + 11941 tctttttatt aactatattt gaatttttag gacaattaag tatgtggctg ccagctctag + 12001 aatttatagg taagccacaa tttgatttca attatgccaa gaaacatctt aaaccggtga + 12061 tattactgtt tttacctcaa atagcgatat ctttatatgt tacgttaaat aggacaatgc + 12121 ttggcgcttt agcatcaaca acagatgttg gaatttatga tcaatcttta aagttggtaa + 12181 atatcctact tactttggta acttcactag gtagtgttat gctaccacgt gtttcgaatc + 12241 ttttatcaac aggggataag aagtctgtga atcgcatgaa tcaattatct ttctttatat + 12301 acaatcttgt gatttttcca actattgcag gtatgttaat tatcaataat gactttgtga + 12361 aatttttctt aggaaatgac tttcaagaag caaaatatgc tattgcaatc atgattttta + 12421 ggatgttttt tattggttgg acgaacatta tggggattca 
aattttgata cctcataata + 12481 agaacaaaga atttttgact tcaacaacgg ttccagcaat tattagtgtt ggtttaaatt + 12541 tgcttttact gcctgaattt ggatatattg gggctgcgat tgtttctgta ttaacagaaa + 12601 tatttgtatg ggttatccaa ttgtatttta caagaaaata tttaaaagat gtaccaattt + 12661 ttaaatcaac tgttaaaata ttttcagcat caattcttat gtatgttgct ctttcatttt + 12721 tgaagtcaat tttgactttt acacctattg ttaatgttgt tgtatgtgct attgtggggg + 12781 cgatacttta tggtttacta attttaatat ttaaagtagt tagcttaaag gagataaaag + 12841 agcagctgtt aaataattag tatgatgata atctatacag aaataatcaa agttattttt + 12901 gtaagaattt gttttagcta agttagttga ttgaaaaaat ttagaaaagg aaggatgaaa + 12961 gattgtagat gaactaaaag ataaaattat taattatgtt cattctatat tattctttac + 13021 taaataataa tatgataaaa attaaatttg aaaatctact ggttagtatt gttgtatctg + 13081 tagtgatatt ttttaatact atatctacta caatgctgga tagaactttt tttcaagcta + 13141 aagcaaatta tcttttatta gtagttttgt tattaggtct tcgttttatg tttccaacac + 13201 gtatttcatt taaatatcta atattttctt ctttgctatt attatcagga attttagtat + 13261 attttcagac tggaaaactt aattttcttg tctattcagc ccttctggtt ttattagtta + 13321 atgtagatat gaaagtagtt ttgaaaacgt atctcattgt agcgggcatt cttgtactaa + 13381 gtgtatttct tttatctctc ttaggtgcag ttcccaattt acaatataat cgcgaaggag + 13441 ttattcggaa ttcatttgga tttatttatc ctacagattt tgcatcccac tgtttctatc + 13501 ttttcttggc tttttcttat ttattaaaag ataaatttat atggattagg tctctaatag + 13561 gtgtactttt atctttcttt attataaaat attgtgatgc acgtttaaat gccttatcaa + 13621 ttattttagc aacaattatt tttatatttt tctactttaa tgaagataag aaattccgga + 13681 tctattcaat ttccccttat tctgtagttc tatgttcgtc aataatgatg tatttatctt + 13741 atattttctc ttggggatct ccatttttag tatctatcaa taaattaatt acaggtagat + 13801 tagctttggg gaaaaatgca tttaatactt ttgatgtaca tctatttgga actagagacg + 13861 tattatttaa ggggtcagga ggtaaaacgg aggctgttat tgattataac tacgtagatt + 13921 catcgtatgt tcaaatgtta tttacatatg gtgttatacc tcttgtactg cttatatgta + 13981 tgtatgttgt aatttcgaga gaacagtata aacagggtca atatttatat gtagtaatat + 14041 tatctttagt ggctctaaac tgcatgattg aagctttttg 
gtttgtccct acttacaata + 14101 tattcatgtt tttgttattc acaaaaaata cttttcttaa taagtcgttg aataatttta + 14161 atcctttgga taaaacggaa ttgttgaact gataaaatta aattttttga tttgtaaaat + 14221 tatttttttc ataaaatgaa ctattctaac taatatttca aaaaaatttt ttaaaatcta + 14281 tttttgcatg atattttaat gaggataact ttacaatgct acaaaagtgt cgagtctaat + 14341 aaaggagtgt aatatgtacg actatctaat cgttggtgct ggattgtcag gtgcaatctt + 14401 tgcttatgaa gcaaccaagc gtggaaaaaa agtaaaagtt attgataaac gtgaccacat + 14461 tggtggaaat atctactgtg agaatataga aggagttaat gttcataaat atggtgcaca + 14521 tatcttccat acttctaata agaaagtctg ggattatgtg aatcaatttg ctgaatttaa + 14581 caactacatc aactcgcctg tagctaatta caagggtagc ctttataatc tacctttcaa + 14641 tatgaatact ttctatgcta tgtgggggat aaaaactcct caagaagtga aaaataagat + 14701 tgctgagcaa acggctcaca tgaaagacgt tgaaccgaaa aacttggaag aacaggctat + 14761 caagttgatc ggtccagata tttatgaaaa gttgattaaa ggatatactg aaaagcaatg + 14821 gggacgttcc gcgactgacc ttccaccgtt tatcatcaaa cgtctaccag ttcgtttgac + 14881 ttttgataat aactacttta atgaccgtta ccaaggtatt ccaatcggtg gctataatgt + 14941 cattatcgaa aatatgctga aagatgttga agtagaactt ggagttgact tttttgccaa + 15001 tcgtcaggaa ttagaagctt ctgctgaaaa agttgtcttt acagggatga ttgaccaata + 15061 tttcgattat aaacatggtg agctagaata ccgtagtctt cgttttgagc atgaagttct + 15121 agataaggaa aattatcaag gaaatgccgt tgttaattat acagaacgag aaattcctta + 15181 tactcgcatt attgagcaca aacattttga gtacggaaca caagataaaa cggttattac + 15241 tcgtgaatac ccagctgatt ggaaacgtgg agatgaacct tattatccaa tcaatgatga + 15301 gagaaacaat gccatgtttg ctaaatatca agaagaagca gtacagaatg ataaggtaat + 15361 tttctgtgga cgtttggctg attataaata ctacgacatg catgtggtca ttgaacgtgc + 15421 cctaaatgtt gtagaggaag aatttaaata agataacgaa ggataaaatt gatagatgaa + 15481 atattatcta aaagaagaat ttctgacgga ttctggtgta cgaaatgcgg gaaataaggc + 15541 tcgaaacgat gttgaagaaa tagtagttcg tgagggctat agtcctttgt tattgatggt + 15601 agatgattgg tatcaaatgg ggactattag agcccaacga cacaaggcta aagcgctatc + 15661 caaagctatc tctaagttga aggaaggcga tcagctactt 
attcaatttc ctatgcttca + 15721 tcatagtttc tttacgactc atttagtcaa aagaatgcaa tgtaaaggag tgaaggttca + 15781 ctttattatc catgatttag aagttttgcg ctatgccaat ttggatacag tacccttaaa + 15841 gcataaaatt cgtgttcatc ttcaagagtc aagtcttttg aaacaagctg atggtcttat + 15901 tgctcataat ccagttatga aatcagtgct tgttgataag gggatttctg aaaaaaaaat + 15961 agttagttta ggcatttttg actatctgat cccgaattat caggacaaag aagatttatc + 16021 gaaggaaggg gctattattg tagctggaaa tttagttcaa gaaaaagcag gttatttata + 16081 tgagttgcct acaagaccgg catataacct ctatggtgtt ggttttgatg aggctagaaa + 16141 actatccaat gaaacctatt ttggttcatt tcttccagat gaattaccat cagcattaga + 16201 aggaagcttt ggtttggttt gggacggtgg tagttctaaa acttgtagcg gcgtgtttgg + 16261 tgagtatttg agatacaata attcccacaa ggcctccctt tatttggctt ctggttttcc + 16321 tattattgtc tgggggcaat ctgctttggc taatttcgtc ttagaaaaag agtgtggaat + 16381 tagtgttgag agtttacttg atttagaaga agtattggaa catttgtctc aagaagagta + 16441 tcaggatttg gtcaaaaatg ctaagtccgt aggtcaaaaa attcgtgaag gttcttatct + 16501 tctttctgca ttacaagctt taaattaatg aatctaaaaa ttatacaaat agatagatga + 16561 gggagttact ggattccctc ttttcttata tcaagggagt tttaagtgaa gaattaaagt + 16621 aagcgcgtca taacaaggta tctatcattc atggagctcc tcctgtatac tattagtaaa + 16681 gtaaaactat tggaggatat tttaatgcca caacctattg ttcctgtaga gattccacaa + 16741 tctcgtcgtt ttgattctaa aaagagaaat gatattctgc ttaaaattcg tattggcaag + 16801 cttgaagtaa gtttttttca atctctcaat ctcgaaatgg tagaacagct tttggataag + 16861 gtgttgctct atgacaattc atctatctag cctagggcag gtctatctcg tatgtgggaa + 16921 aacggatatg aggcaaggca ttgattcact ggcttatctg gttaaaaccc actttgaatt + 16981 agatcctttc tcaggtcaag tttttctctt ttgtggtgga cgtaaagacc gctttaaagc + 17041 cttttactgg gatggtcaag gattttggct actatataaa cgctttgaga acggcagact + 17101 gacttggcta agtacagaaa aggatgtcaa agctctcaca ccagaacaag tagactggct + 17161 tatgaagggc ttttctatca ctcccaaaat aaatttatca gaaagtcgtg atttctattg + 17221 aaatgaggac tttcttttta gtataataaa gttagaaaac agagagggaa gctcatggaa + 17281 gaagattgaa aatcattcaa caacagagcg ctacaattga 
tagtctcacc aatgaacttg + 17341 cccttctgcg tgaacaagtg gcttatctga ctcaaaagct ctatggaaaa tcctctgaga + 17401 aaagtgtttg cccctctgga caactcaacc tttttgagga agagtctcca tctgaggaag + 17461 atggagatgt tcccagttga aacagaggaa attacctaca aacgtaagaa atctaaaggg + 17521 aaacgccaag ctcttcttgc ccaatttgat tcagaagaag ttcatcatca agtagaagag + 17581 aggatttgcc ctgattgtca gggagatcta aaagagattg gagggagtct tcaaggacaa + 17641 gaattggtct ttattcctgc gcaattaaaa cgcatagatc atatccaaca cgcttacaaa + 17701 tgccaagcat gcagtgataa aaatccgagt gataaaatcg tgaaagttcc tattcctaaa + 17761 gcccctttgg cgcatagcta tggctcagtt tctattatcg ctcacaccat ccatcagaag + 17821 tttaatctga aggtacccaa ttatcgccaa gaagaagatt gggctaagat gggtttacca + 17881 atcacacgca aggaaatctc taattggcat atcaagacga gtcaatacta tttggagccc + 17941 ctatataacc tcttgcgaga gagactattg actcagccct tacttcatgc ggatgaaact + 18001 tcttataggg tgctagagag tgatagtcag ctgacttact attggacttt tttgtctggg + 18061 aaagctgaga aacaagggat tacgctttac caccatgatc agtgtcgaag tggttcagta + 18121 gtacaagaat tcctaggaga ttattctggc tatgtgcatt gtgatatgtt gcggcagtaa + 18181 cttaggactt tagtcctcta gttctgccta tgcgatagca gtccaaggtt taggagcaag + 18241 gcgacgctaa gcttggtaaa ctgcgaaccg ctagaagctt atcgtcaact ggaagaagct + 18301 gaacttgttg gatgttgggt acatgtgaga aggaagtttt ttgaagcgac ccccaagcaa + 18361 gcggataaat catccttagg agctaaaggt ttagcttatt gtaatcagtt attttccttg + 18421 gaaagagact ggaagacttc tttgcttggt gccggcgtca gtcagtttta tcgggttcaa + 18481 aactaggaag ggcaattgaa tacagcctca agtataaaga aacctttaag actattttga + 18541 aagacggaca tctggtcctt tccaataatc tagctgaatg cgccattaaa tcattggtta + 18601 tgggacggag taaaagagtc cagtggactc ttttagccta agctcagttt aaaaaagcga + 18661 gggtggttat tttctcaaag ttttgaagga gctaaagcaa gagctattat tatgagtttg + 18721 ttggaaacag ctaaacgtca tcaattaaat agcgagaaat atctattcta tcttctagaa + 18781 tgtcttccaa acgaggaaac tctcgtaaac aaagaggttt tagaggttta tttatcatgg + 18841 actaaagttg tacaagaaaa gtgcaaataa gaaatctcca gattaggaac tatccgtgag + 18901 ttctctagtc tggagatttt tcaatatact tcgttattgg 
gcggttacga tattcatatt + 18961 ttttgcaaag atgttgtttg aaaaataatt ttcaaaaatt ctgaaaattc tgttgacatc + 19021 tttctgaaaa gagtctataa tggagagaaa gttttaaagg agaaaatgat gaaaagttca + 19081 aaactatttg cccttgcggg cgtgacatta ttg +// + diff --git a/public/res/serotype_genbank/serotype_36B.gb b/public/res/serotype_genbank/serotype_36B.gb new file mode 100644 index 0000000..dc80cb9 --- /dev/null +++ b/public/res/serotype_genbank/serotype_36B.gb @@ -0,0 +1,865 @@ +LOCUS MK606436 21895 bp DNA linear BCT 30-SEP-2020 +DEFINITION Streptococcus pneumoniae strain GPS_NP_1196 cps gene cluster, + complete sequence. +ACCESSION MK606436 +VERSION MK606436.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 21895) + AUTHORS van Tonder,A.J., Gladstone,R.A., Lo,S.W., Nahm,M.H., du Plessis,M., + Cornick,J., Kwambana-Adams,B., Madhi,S.A., Hawkins,P.A., + Benisty,R., Dagan,R., Everett,D., Antonio,M., Klugman,K.P., von + Gottberg,A., Breiman,R.F., McGee,L., Bentley,S.D. and The Global + Pneumococcal Sequencing,C.O. + TITLE Putative novel cps loci in a large global collection of pneumococci + JOURNAL Microb Genom 5 (7) (2019) + PUBMED 31184299 +REFERENCE 2 (bases 1 to 21895) + AUTHORS van Tonder,A.J. + TITLE Direct Submission + JOURNAL Submitted (06-MAR-2019) Parasites and Microbes, Wellcome Sanger + Institute, Wellcome Genome Campus, Hinxton, Cambridge CB10 1SA, + United Kingdom +COMMENT ##Assembly-Data-START## + Assembly Method :: Velvet v. 
1.2 + Sequencing Technology :: Illumina + ##Assembly-Data-END## +FEATURES Location/Qualifiers + source 1..21895 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="GPS_NP_1196" + /isolation_source="nasopharyngeal swab" + /host="Homo sapiens" + /db_xref="taxon:1313" + /geo_loc_name="Nepal" + /collection_date="2009" + misc_feature 1..21895 + /note="cps gene cluster" + gene 1..1608 + /gene="dexB" + CDS 1..1608 + /gene="dexB" + /EC_number="3.2.1.70" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3280" + /inference="protein motif:CLUSTERS:PRK10933" + /inference="protein motif:Pfam:PF00128.18" + /inference="protein motif:TIGRFAMs:TIGR02403" + /inference="similar to AA sequence:RefSeq:YP_004326655.1" + /inference="similar to AA sequence:UniProtKB:Q99040" + /note="trehalose-6-phosphate hydrolase; maltooligosyl + trehalose synthase; alpha,alpha-phosphotrehalase; alpha + amylase catalytic domain protein" + /codon_start=1 + /transl_table=11 + /product="glucan 1,6-alpha-glucosidase" + /protein_id="QCO92024.1" + /translation="MQEKWWHNAVVYQVYPKSFMDSNGDGVGDLPGITSKLDYLAKLG + ITAIWLSPVYDSPMDDNGYDIADYQAIAAIFGTMEDMDQLIAEAKKRDIRIIMDLVVN + HTSDEHAWFVEACENTDSPERDYYIWRDEPNDLDSIFSGSAWEYDEKSGQYYLHFFSK + KQPDLNWENEKLRQKIYEMMNFWIDKGIGGFRMDVIDMIGKIPDEKVVNNGPMLHPYL + KEMNQATFGDKDLLTVGETWGATPEIAKLYSDPKGQELSMVFQFEHIGLQYQEGQPKW + HYQKELNIAKLKEIFNKWQTELGVEDGWNSLFWNNHDLPRIVSIWGNDQEYREKSAKA + FAILLHLMRGTPYIYQGEEIGMTNYPFEILDQVEDIESLNYAREALEKGVPIEEIMDS + IRVIGRDNARTPMQWDESKNAGFSTDQPWLAVNPNYEMINVQEALANPDSIFYTYQKL + VQIRKENSWLIRADFELLDTADKVFAYIRKDGDRRFLVVANLSNEEQDLTVEGKVKSV + LIENTLAQEVFEKQILVPWDAFCVELL" + CDS 2163..2411 + /inference="ab initio prediction:Prodigal:2.60" + /codon_start=1 + /transl_table=11 + /product="hypothetical protein" + /protein_id="QCO92025.1" + /translation="MLVRKTSETILQKSRSSSSLRKSLERLTHHLLDLQPKKSSDIFF + QILYLLLTDLLMSDHILDKNKYRILFRQSKQVLGALNY" + gene 2675..4120 + /gene="wzg" + CDS 2675..4120 + /gene="wzg" + 
/inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK09379" + /inference="protein motif:Pfam:PF03816.8" + /inference="protein motif:TIGRFAMs:TIGR00350" + /inference="similar to AA sequence:RefSeq:YP_001835063.1" + /inference="similar to AA sequence:UniProtKB:Q7WY78" + /note="putative transcriptional regulator ywtF; + membrane-bound transcriptional regulator LytR; cell + envelope-related function transcriptional attenuator + common domain; cell envelope-related transcriptional + attenuator domain protein" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Cps14A" + /protein_id="QCO92026.1" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLSIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSINVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VDQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAIIQKLTST + EVLKNYSNILQGLQDSLQTNMPIETMIDLVNTQLESGGNYKVNSQDLKGTGRMDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + gene 4122..4853 + /gene="cpsB" + CDS 4122..4853 + /gene="cpsB" + /EC_number="3.1.3.48" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG4464" + /inference="protein motif:Pfam:PF02811.13" + /inference="similar to AA sequence:RefSeq:YP_002739714.1" + /inference="similar to AA sequence:UniProtKB:Q54518" + /note="capsular polysaccharide biosynthesis protein; PHP + domain protein" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein phosphatase CpsB" + /protein_id="QCO92027.1" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTLDALEKLEKKEIPTLNDS + RYALIEFSMHTSYREIHTGLSNILMLGITPVIAHIERYDALENNEKRVCELINMGCYT + QINSYHVLKPKFFGEKYKFMKKRARYFLERDLVHVVASDMHNLDSRPPYMQQAYDIIA + KKYGAKKAKEFFVDNPRKIIMDQLI" + 
gene 4862..5554 + /gene="wzd" + CDS 4862..5554 + /gene="wzd" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3944" + /inference="protein motif:Pfam:PF02706.9" + /inference="protein motif:TIGRFAMs:TIGR01006" + /inference="similar to AA sequence:RefSeq:YP_001835065.1" + /inference="similar to AA sequence:UniProtKB:P72367" + /note="capsular polysaccharide type 8 biosynthesis protein + cap8A; capsular polysaccharide biosynthesis protein; MPA1 + family polysaccharide export protein; chain length + determinant protein" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Cps14C" + /protein_id="QCO92028.1" + /translation="MKEQNTLEIDVLQLFRILWKRKLVILLVAIITSSVAFAYSTFVI + KPEFTSTTRIYVVNRNQEEKSGLTNQDLQAGSYLVKDYREIILSQDVLEEVISDLKLD + LTPKGLANKIKVTVPVDTRIVSVSVNDRVPEEASRIANSLREVAAQKIISITRVSDVT + TLEEARPAISPSSPNIKRNTLIGFLAGGIGTSVIVFLLELLDTHVKRPEDIEDTLQMT + LLGVVPNLSKLK" + gene 5564..6247 + /gene="wze" + CDS 5564..6247 + /gene="wze" + /EC_number="2.7.10.2" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3944" + /inference="protein motif:CLUSTERS:PRK11519" + /inference="protein motif:Pfam:PF01656.17" + /inference="protein motif:TIGRFAMs:TIGR01007" + /inference="similar to AA sequence:RefSeq:YP_001835066.1" + /inference="similar to AA sequence:UniProtKB:Q54520" + /note="tyrosine-protein kinase CpsD; tyrosine kinase; + capsular polysaccharide biosynthesis protein; capsular + exopolysaccharide family protein; CobQ/CobB/MinD/ParA + nucleotide binding domain" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Cps14D" + /protein_id="QCO92029.1" + /translation="MPTLEIAQKKLEFIKKAEEYYNALCTNIQLSGDKLKVISVTSVN + PGEGKTTTSVNIARSFARAGYKTLLIDGDTRNSVISGVFKSREKITGLTEFLSGTADL + SHGLCDTNIENLFVIQSGSVSPNPTALLQSKNFNDMIETLRKYFAYIIVDTAPIGIVI + DAAIITQKCDASILVTATGEVNKRDVQKAKQQLEQTGKLFLGVVLNKLDISVDKYGVY + GSYGNYGKK" + gene 6263..7630 + /gene="wchA" + 
CDS 6263..7630 + /gene="wchA" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK15204" + /inference="protein motif:Pfam:PF02397.10" + /inference="protein motif:TIGRFAMs:TIGR03025" + /inference="similar to AA sequence:RefSeq:YP_001835067.1" + /inference="similar to AA sequence:UniProtKB:P71241" + /note="putative colanic biosynthesis UDP-glucose lipid + carrier transferase; undecaprenyl-phosphate galactose + phosphotransferase; exopolysaccharide biosynthesis + polyprenyl glycosylphosphotransferase; Bacterial sugar + transferase" + /codon_start=1 + /transl_table=11 + /product="glucosyl-1-phosphate transferase" + /protein_id="QCO92030.1" + /translation="MDEKGLKIFLAVLQSIIVILLVYFLSFVRETELERSSMVILYLL + HFFVFYFSSYGNNFFKRGYLVEFNSTIRYIFFFAIAISVLNFFIAERFSISRRGMVYF + LTLEGISLYLLNFLVKKYWKHVFFNLKNSKKILLLTVTKNMEKVLDKLLESDELSWKL + VAVSVLDKSDFQHDKIPVIEKEKIIEFATHEVVDEVFVNLPGESYDIGEIISRFETMG + IDVTVNLKAFDKNLGRNKQIHEMVGLNVVTFSTNFYKTSHVISKRILDICGATIGLVL + FAIASLVLVPLIRKDGGPAIFAQTRIGKNGRHFTFYKFRSMRIDAEAIKEQLMDQNTM + QGGMFKIDNDPRVTKIGRFIRKTSLDELPQFWNVFIGDMSLVGTRPPTVDEYDQYTPE + QKRRLSFKPGITGLWQVSGRSKITDFDDVVKLDVAYIDNWTIWKDIEILFKTVKVVFI + RDGAK" + gene 7617..8420 + /gene="wefL" + CDS 7617..8420 + /gene="wefL" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3475" + /inference="protein motif:Pfam:PF04991.7" + /inference="similar to AA sequence:RefSeq:YP_004326645.1" + /note="LPS biosynthesis protein" + /codon_start=1 + /transl_table=11 + /product="LicD superfamily protein" + /protein_id="QCO92031.1" + /translation="MERSDFMNKVREIQLGELSLLKNFIAICSKYNLRYYALGGTLLG + AIRHKGFIPWDDDMDLGMPRKDYEKFLSICNKELPEHVVLRLHDDNLGNTSIMDTSLQ + IPFGDELCSPFIDIFPLDGYPDDRFHYFIYTNKIKFYRALSKISVIDRLHDRDRGSFE + NVIVGISKVLKLNKLLKTATINNKLQNLIKQYDFETSSIVGNVLGSYRERELARKEVF + GEPQLLEFENLEISCHANPDEYLTKIYGDYMKLPEEAERKGHFESTWGD" + gene 8440..9162 + /gene="cpsF" + CDS 8440..9162 + /gene="cpsF" + /EC_number="2.4.1.187" + /inference="ab initio 
prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK03692" + /inference="protein motif:Pfam:PF03808.7" + /inference="protein motif:TIGRFAMs:TIGR00696" + /inference="similar to AA sequence:RefSeq:YP_002037034.1" + /inference="similar to AA sequence:UniProtKB:Q7A714" + /note="putative N-acetylmannosaminyltransferase; putative + UDP-N-acetyl-D-mannosaminuronic acid transferase; + WecB/TagA/CpsF family glycosyltransferase" + /codon_start=1 + /transl_table=11 + /product="UDP-N-acetyl-D-mannosamine transferase WchO" + /protein_id="QCO92032.1" + /translation="MGVRIDPLTMDETVQAVEKFVIEQRPLHLMGVNADKINQCQSDE + AIKKIVNESEIINADGASVVLASRFLGYQVPERVAGIDLMQRLLKLADEKSYSVYFFG + AKEEVLQDMLQNFKEEYPNLRIVGHRNGYFSEEDEQDIQEDIREKNPDVVFVGITSPK + KEYTIQKFMDNGVNSIFMGVGGSFDVLSGHIQRAPLWMQKSNLEWLFRVANEPKRLFK + RYFVGNVTFIKRVLDEKRKTKK" + gene 9137..10222 + /gene="tagE" + CDS 9137..10222 + /gene="tagE" + /EC_number="2.4.1.52" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG0297" + /inference="protein motif:CLUSTERS:PRK09922" + /inference="protein motif:Pfam:PF00534.14" + /inference="protein motif:TIGRFAMs:TIGR03088" + /inference="similar to AA sequence:RefSeq:NP_344886.1" + /inference="similar to AA sequence:UniProtKB:P13484" + /note="putative poly(glycerol-phosphate) + alpha-glucosyltransferase; + UDP-D-galactose:(glucosyl)lipopolysaccharide-1, + 6-D-galactosyltransferase; glycogen synthase; + PEP-CTERM/EpsH1 system-associated sugar transferase, ; + glycosyl transferase group 1 protein; Glycosyl + transferases group 1" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Cps4H" + /protein_id="QCO92033.1" + /translation="MKNEKRKNNILHILRTMDIGGAERIVYQLSSDLQDEFDSVHVAS + TGGLWEPELETQGIIHHKIQDIDSKNPLTVLKLLLTIYQIIKTNDITLIHTHHRMAAF + YIRLLKLINPKLVHVYTAHNVFKDKLSLYRFSLKNAYSIAVGQAVNQNLKDDVGVANS + TVIYNGVILKQSNRQVDEIMKFGGIKLGCIARLSGQKGLTYLLDAISLISDENLRLFI + VGDGELRDELENKVKELELEDKITFLGYRQDVVECINSFDFLVSSSLFEGMALNVIEA + 
FMNGKTMVATDIPGNNEVVTKENGILVPAKDARALASAIESLATDSTLRTRLAHQAKK + DYEEKFRYPLFLENYRKFYQKLMGDSK" + gene 10231..11313 + /gene="mnaA" + CDS 10231..11313 + /gene="mnaA" + /EC_number="5.1.3.14" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG0381" + /inference="protein motif:CLUSTERS:PRK13609" + /inference="protein motif:Pfam:PF02350.13" + /inference="protein motif:TIGRFAMs:TIGR00236" + /inference="similar to AA sequence:RefSeq:YP_004622336.1" + /inference="similar to AA sequence:UniProtKB:P39131" + /note="diacylglycerol glucosyltransferase" + /codon_start=1 + /transl_table=11 + /product="UDP-N-acetylglucosamine 2-epimerase" + /protein_id="QCO92034.1" + /translation="MLVFGTRPEAIKMCPLVNELKKNDSIKTLVCVTGQHKEMLEQVL + DVFKVVPDYDLGIMKANQTLFTITTSILDKIQAVLEQEKPDIVLVHGDTTTTFATALA + AFYMGIKVGHVEAGLRTYNLQSPFPEEFNRQATSIIADFNFAPTEVAKENLLKEGREN + IYVTGNTVIDALKTTVQDHYDHPILEWAKNSKLIMLTAHRRENLGQPMENMFNAVNRI + LNEFEDVKVVYPIHKNPKVRELASKVFGDNERMQIIEPLEVIDFHNFMNQSYMILTDS + GGVQEEAPSLGKPVLVMRDTTERPEGIAAGTLKLVGTEDENIYRNFKLLLENEEEYNK + MSKASNPYGDGTACQQIVEVIMKGLV" + gene 11313..12278 + /gene="wefD" + CDS 11313..12278 + /gene="wefD" + /EC_number="2.4.1.212" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3858" + /inference="protein motif:CLUSTERS:PRK10073" + /inference="protein motif:Pfam:PF00535.20" + /inference="protein motif:TIGRFAMs:TIGR03937" + /inference="similar to AA sequence:RefSeq:YP_004326642.1" + /inference="similar to AA sequence:UniProtKB:Q7BLV3" + /note="hyaluronan synthase; putative glycosyl transferase; + putative glycosyl hydrolase; poly-beta-1,6 + N-acetyl-D-glucosamine synthase; Glycosyl transferase + family 2" + /codon_start=1 + /transl_table=11 + /product="glycosyl transferase family 2 protein" + /protein_id="QCO92035.1" + /translation="MRKVSIVVPVYNVEDYLKYCVDSLINQSYKDIEIILVDDGSTDD + SGRICDKYAQEDDRIRVLHIENGGLSNARNTGVKFASAEWIIFIDSDDYYDRRTVEYL + VQLQKKYAVDLVATSVIEVRDFQSEDFLGSLTNIDSLKLDRYTALKEMFYGNIVGTHP + 
GGKLYKKEILMKFPFPEGMIYEDLAVSFEHIGACNEIAVGCINLYKYYRRPGSIVNSS + YSDKFLDFYKAIEMNREFVQRNYPNDKEMNKALTVRYVFKGLHVVHAMLSSEMYSDVN + KIRKEYIRYFNDIIPNPNITGKNKVKYLMLLVSPKLYEKIREKMG" + gene 12285..13700 + /gene="wzx" + CDS 12285..13700 + /gene="wzx" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF01943.11" + /inference="similar to AA sequence:RefSeq:YP_008510121.1" + /inference="similar to AA sequence:UniProtKB:P37746" + /note="putative O-antigen transporter; integral membrane + protein MviN; polysaccharide biosynthesis protein" + /codon_start=1 + /transl_table=11 + /product="flippase" + /protein_id="QCO92036.1" + /translation="MKVLKNYAYNLSYQLLVIILPIITTPYVTRVFSSNDLGTFGYFN + SIVAYFIFLATLGVANYGTKEISAHRNNIPNNFWGIYTLQFTATCISIFLYIGLCFSF + SFMQNPVAYILVLSLLSRGLDITWLFQGLEDFRKITVRNITVKLIGVISIFLFIKSQN + DLYLYVFLLTIFEFLGQLSMWLPALEFIGKPQFDFNYAKKHLKPVILLFLPQIAISLY + VTLNRTMLGALASTTDVGIYDQSLKLVNILLTLVTSLGSVMLPRVSNLLSTGDKKSVN + RMNQLSFFIYNLVIFPTIAGMLTINNDFVKFFLGNDFQEAKYAIAIMIFRMFFIGWTN + IMGIQILIPHNKNKEFLTSTTVPAIISVGLNLLLLPEFGYIGAAIVSVLTEIFVWVIQ + LYFTRKYLKDVPIFKSTVKIFSASILMYVALSFLKSILTFTPIVNVVVCAIVGAILYG + LLILIFKVVSLKEIKEQLLNN" + CDS complement(13660..13842) + /inference="ab initio prediction:Prodigal:2.60" + /codon_start=1 + /transl_table=11 + /product="hypothetical protein" + /protein_id="QCO92037.1" + /translation="MNIINNLSFSSSTIFHPSFSKLFQSTNLAKTNSYKNNFDYFCID + YHHTNYLTAALLSPLS" + gene 13872..15032 + /gene="wzy" + CDS 13872..15032 + /gene="wzy" + /inference="ab initio prediction:Prodigal:2.60" + /inference="similar to AA sequence:RefSeq:YP_006040928.1" + /codon_start=1 + /transl_table=11 + /product="polysaccharide polymerase" + /protein_id="QCO92038.1" + /translation="MIKIKFENLLVSIVVSVVIFFNTISTTMLDRTFFQAKANYLLLV + VLLLGLRFMFPTRISFKYLIFSSLLLLSGILVYFQTGKLNFLVYSALLVLLVNVDMKV + VLKTYLIVAGILVLSVFLLSLLGAVPNLQYNREGVIRNSFGFIYPTDFASHCFYLFLA + FSYLLKDKFIWIRSLIGVLLSFFIIKYCDARLNALSIILATIIFIFFYFNEDKKFRIY + SISPYSVVLCSSIMMYLSYIFSLGSPFLVSINKLITGRLALGKNAFNTFDVHLFGTRD 
+ VLFKGSGGKTEAVIDYNYVDSSYVQMLFTYGVIPLVLLICMYVVISIEQYKQGQYLYV + VILSLVALNCMIEAFWFVPTYNIFMFLLFTKNTFLNKSLNNFNPLDKTELLN" + gene 15194..16291 + /gene="glf" + CDS 15194..16291 + /gene="glf" + /EC_number="5.4.99.9" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG1232" + /inference="protein motif:CLUSTERS:PRK07208" + /inference="protein motif:Pfam:PF03275.7" + /inference="protein motif:TIGRFAMs:TIGR00031" + /inference="similar to AA sequence:RefSeq:YP_004326638.1" + /inference="similar to AA sequence:UniProtKB:P37747" + /note="protoporphyrinogen oxidase" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase" + /protein_id="QCO92039.1" + /translation="MYDYLIVGAGLSGAIFAYEATKRGKKVKVIDKRNHIGGNIYCEN + IEGVNVHKYGAHIFHTSNKKVWDYVNQFAEFNNYINSPVANYKGSLYNLPFNMNTFYA + MWGTKTPQEVKNKIAEQTAHMKDVEPKNLEEQAIKLIGPDIYEKLIKGYTEKQWGRSA + TDLPPFIIKRLPVRLTFDNNYFNDRYQGIPIGGYNVIIENMLKDVEVELGVDFFANRQ + ELEASAEKVVFTGMIDQYFDYKHGELEYRSLRFEHEVLDKENYQGNAVVNYTEREIPY + TRIIEHKHFEYGTQDKTVITREYPADWKRGDEPYYPINDERNNAMFAKYQEEAVQNDK + VIFCGRLADYKYYDMHVVIERALNVVEEEFK" + CDS 16316..17368 + /EC_number="2.4.1.-" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK09814" + /inference="similar to AA sequence:RefSeq:YP_008510117.1" + /note="beta-1,6-galactofuranosyltransferase" + /codon_start=1 + /transl_table=11 + /product="putative glycosyltransferase" + /protein_id="QCO92040.1" + /translation="MKYYLKEEFLTDSGVRNAGNKARNDVEEIVVREGYSPLLLMVDD + WYQMGTIRAQRHKAKALSKAISKLKEGDQLLIQFPMLHHSFFTTHLVKRMQCKGVKFH + FIIHDLEVLRYANLDTVPLKHKIRVHLQESSLLKQADGLIAHNPVMKSVLVDKGISEK + KIVSLGIFDYLIPNYQDKEDLSKEGAIIVAGNLAQEKAGYLYELPTRPAYNLYGVGFD + EARKLSNETYFGSFLPDELPSALEGSFGLVWDGGSSKTCSGVFGEYLRYNNSHKASLY + LASGFPIIVWGQSALANFVLEKECGISVESLLDLEEVLEHLSQEEYQNLVKNAKSVGQ + KIREGSYLLSALQALN" + CDS 17491..17730 + /inference="ab initio prediction:Prodigal:2.60" + /inference="similar to AA sequence:RefSeq:YP_001836149.1" + /codon_start=1 + /transl_table=11 + 
/product="IS66 family Orf1" + /protein_id="QCO92041.1" + /translation="MELLLYTISKVKLLEDIVMPQPIVPVEIPQSRPFDSKKRNDILL + KIRIGKLEVSFFQSLNLEMIEQLLDKVLLYDNSSI" + CDS 18224..19033 + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3436" + /inference="protein motif:Pfam:PF03050.8" + /inference="similar to AA sequence:RefSeq:YP_003445207.1" + /note="transposase IS66 family protein" + /codon_start=1 + /transl_table=11 + /product="ISSmi4 transposase" + /protein_id="QCO92042.1" + /translation="MENPLRKVFAPLDNSVFLKRNKIWKKTLTYPVEREEITYKRKKA + KGKRQALLAQFDSEEVHHRLEACICPDYQGDLKEIGASLQRQELVFIPAQLKRIDHIQ + HAYKCQACSDKNRSDKIVKAPIPKAPLAHSFGSVSIIAHTIHQKFNLKVPNYRQEEDW + ARMGLPITRKEISNWHIKASQYYLESLYNLLREKLLEQPLLHADETSYRVLESDSHLT + YYWTFLSGKSEKQGITLYHHDQRRSGSVVQEFLGNYSAYAIAVQSLGARRR" + CDS 19036..19485 + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3436" + /inference="protein motif:Pfam:PF03050.8" + /inference="similar to AA sequence:RefSeq:YP_003879023.1" + /note="transposase IS66 family protein" + /codon_start=1 + /transl_table=11 + /product="transposase" + /protein_id="QCO92043.1" + /translation="MVNYEPLEAYRQLEEAELVGCWAHVRRKFFEAPPKQADKSSLGA + KGLAYCDQLFALERDWEALLADERLQKRQEELQPLMEDFFAWCRRQSVLSGSKLGRAI + EYSLKYKETFKTILKDGHLVLSNNLAERAIKSLVMGRSKRVQWTLLA" + CDS 19556..19714 + /inference="ab initio prediction:Prodigal:2.60" + /inference="similar to AA sequence:RefSeq:YP_006253052.1" + /codon_start=1 + /transl_table=11 + /product="transposase" + /protein_id="QCO92044.1" + /translation="MSLLETAKRHQLNSEKYLSYLLECLPNEETLVNKEVLEAYLPCT + KVVQEKCK" + gene 19913..21895 + /gene="aliA" + CDS 19913..21895 + /gene="aliA" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG4166" + /inference="protein motif:CLUSTERS:PRK15104" + /inference="protein motif:Pfam:PF00496.16" + /inference="protein motif:TIGRFAMs:TIGR02294" + /inference="similar to AA sequence:RefSeq:YP_001835080.1" + /inference="similar to AA 
sequence:UniProtKB:P31306" + /note="76 kDa cell surface lipoprotein; oligopeptide ABC + transporter substrate-binding protein OppA; ABC-type + oligopeptide transport system, periplasmic component; + nickel ABC transporter, nickel/metallophore periplasmic + binding protein; Bacterial extracellular solute-binding + proteins, family 5 Middle" + /codon_start=1 + /transl_table=11 + /product="oligopeptide ABC transporter + oligopeptide-binding protein AliA" + /protein_id="QCO92045.1" + /translation="MKSSKLFALAGVTLLAATTLAACSGSGSSTKGEKTFSYIYETDP + DNLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKDA + KWYTSEGEEYAAVKAQDFVTGLKYAADKKSDALYLVQESIKGLDAYVKGEINDFSQVG + IKALDEQTVQYTLNKPESFWNSKTTMGVLAPVNEEFLNSKGDDFAKATDPSSLLYNGP + YLLKSIVTKSSVEFAKNPNYWDKDNVHIDKVKLSFWDGQDTSKPAENFKDGSLTAARL + YPTSASFAELEKSMKDNIVYTQQDSITYLVGTNIDRQSYKYTSKTSDEQKASTKKALL + NKDFRQAIAFGFDRTAYASQLNGQTGASKILRNIFVPPTFVQADGKNFGDMVKEKLVT + YGDEWKDVNLADSQDGLYNPEKAKAEFAKAKSALQAEGVTFPIHLDMPVDQTATTKVQ + RVQSMKQSLEATLGADNVIIDIQQLQKDEVNNITYFAENAAGEDWDLSDNVGWGPDFA + DPSTYLDIIKPSVGESTKTYLGFDSGEDNVAAKKVGLYDYEKLVTEAGDETTDVAKRY + DKYAAAQAWLTDSALIIPTTSRTGRPILSKMVPFTIPFALSGNKGTSEPVLYKYLELQ + DKAVTVDEYQKAQEKWMKEKEESNKKAQEDLAKHVK" +ORIGIN + 1 atgcaagaaa aatggtggca caatgccgta gtctatcaag tctatccaaa gagttttatg + 61 gatagtaatg gagatggagt tggtgatttg ccaggtatta ccagtaagtt ggactatcta + 121 gccaagctag gaatcacagc aatttggctt tctcccgttt atgacagccc tatggatgat + 181 aatggctatg atattgctga ttatcaagcg attgcggcta tttttggaac catggaggac + 241 atggatcagc tgattgcaga agctaagaag cgtgacattc gtatcatcat ggacttggtg + 301 gttaatcata cctcagatga acatgcttgg tttgtcgaag cctgtgaaaa tactgacagc + 361 cctgagcgag actactatat ctggcgcgat gaacccaatg acctagattc tatctttagt + 421 gggtctgctt gggaatacga tgaaaagtca ggtcaatact atctccactt tttcagcaag + 481 aaacagccgg atctcaactg ggaaaatgaa aaacttcgcc agaaaattta tgagatgatg + 541 aacttctgga ttgataaagg tattggtggt ttccgtatgg atgttattga catgattggc + 601 aaaattcctg acgagaaggt agtcaataat ggtcctatgc tccatcccta tctcaaggaa + 661 
atgaatcagg cgacctttgg agataaggat ctcttgacag taggggagac ttggggagca + 721 acgccagaga ttgccaagct ctactctgat ccaaaggggc aagaattgtc tatggtcttc + 781 cagtttgaac atatcggtct tcagtatcag gaaggtcagc ctaaatggca ctatcaaaaa + 841 gagctgaata tcgctaagtt aaaagaaatc ttcaacaaat ggcagacaga gttaggagtt + 901 gaggacggct ggaattccct cttctggaac aaccatgacc tccctcgtat tgtctcaatc + 961 tggggaaatg accaagaata ccgcgaaaaa tctgccaaag cctttgcaat cttgcttcat + 1021 cttatgagag gaactcctta tatctaccaa ggtgaggaga ttgggatgac caactatccg + 1081 tttgaaatac tggatcaagt agaagatatt gaatctctca actatgcgcg tgaggctctt + 1141 gaaaaaggtg ttccgattga agaaatcatg gacagtatcc gtgttattgg acgtgacaat + 1201 gcccgtaccc ctatgcaatg ggacgagagc aaaaacgctg gtttctcaac agatcaacct + 1261 tggttggcag ttaatccaaa ttacgagatg atcaacgtcc aagaagcgct ggcaaatcca + 1321 gattctattt tctataccta tcagaaactg gtccaaattc gcaaggagaa tagttggcta + 1381 attcgagctg actttgaatt gcttgatacg gctgataagg tctttgctta tatacgtaag + 1441 gatggcgacc gtcgcttcct agttgtggct aacttgtcca atgaagagca agacttgaca + 1501 gtagaaggaa aagtcaaatc tgtcttgatt gaaaacaccc tagctcaaga agtctttgaa + 1561 aaacaaatct tagttccatg ggatgctttc tgtgtggaat tactataaat attttttgca + 1621 gaaaaattta aaattgaaat cgtataaaaa caagggagga ctgtataaaa ggcagaaatc + 1681 ctttgttttt tataaccaag gtttataaac cttcattctc gaaattcaat taactttaca + 1741 aattcccact attaaggaga aagaagacga acataaagaa gcgtatcctt agtgcaggcc + 1801 tgacttttac atctgctttg cttttagctg cttgcgacca atcaggttca gatacaaaaa + 1861 cttactcatc aacctttagt ggaaatccaa ctacatttaa ctatctatta gactattacg + 1921 ctgataatat agtcaattga aacaagagaa agacaaaaga gcctcgtaaa aggtattgca + 1981 acttggtaat acctttttga ggtgcttttt gatatgagcc catgttttct caataggatt + 2041 gtactcaggt gagtagggag gaagaggtaa aagtttatgc ccaaactctt cacacaagag + 2101 ttctagcttc cccattctat ggaatcttgc attatccata ataataaccg atggtgtggt + 2161 taatgttggt aagaaaaact tctgaaacca tacttcaaaa aagtcgctcg tcatcgtctc + 2221 ttcgtaagtc attggagcga ttaactcacc atttgttaga cctgcaacca aagaaatcct + 2281 ctgatatctt cttccagata ctttacctct 
tattaactga ccttttaatg agcgaccata + 2341 ttctcgataa aaataagtat cgaatcctgt ttcgtcaatc taaacaggtg ctaggtgctt + 2401 taaactatta aaattcttaa gaaataaggc tactttttct gggtcttgtt cataattaga + 2461 ttgaaactag aatagtacac ctctgcttct aaaacattgt tagaaatcga tttgactgtc + 2521 ctgatcgatt tgtcatgttc ttatttcatt ttactatatt tttgtttcgc gggaagtcta + 2581 ctaagatact taaagatgca gatagtaaaa aaatgtagac attaccgtaa aaaagtgata + 2641 taattgtatg atgttcaagg tataggtgtt aatcatgagt agacgtttta aaaaatcacg + 2701 ttcacagaaa gtgaagcgaa gtgttaatat cgttttgctg actatttatt tattgttagt + 2761 ttgtttttta ttgttcttaa tctttaagta caatatcctt gcttttagat atcttaacct + 2821 agtggtaact gcgttagtcc tactagttgc cttggtaggg ctactctcga ttatctataa + 2881 aaaagctgaa aagtttacta tttttctgtt ggtgttctct atccttgtca gctctgtgtc + 2941 gctctttgca gtacagcagt ttgttggact gaccaatcgt ttaaatgcga cttctaatta + 3001 ctcagaatat tcaatcaatg tcgctgtttt agcagatagt gagatcgaaa atgttacgca + 3061 actgacgagt gtgacagcac cgactgggac tgataatgaa aatattcaaa aactactagc + 3121 tgatatcaag tcaagtcaga ataccgattt gacggtcgac cagagttcgt cttacttggc + 3181 agcttataag agtttgattg caggtgagac taaggccatt gtcttaaata gtgtctttga + 3241 aaatatcatc gagtcagagt atccagacta tgcatcgaag ataaaaaaga tttataccaa + 3301 gggatttact aaaaaagtag aagctcctaa gacgtctaag aatcagtctt tcaatatcta + 3361 tgttagtgga attgacacct atggtcctat tagttcggtg tcgcgatcag atgtcaatat + 3421 cctgatgact gtcaatcgag ataccaagaa aatcctcttg accacaacac cacgtgatgc + 3481 ctatgtacca atcgcagatg gtggaaataa tcaaaaagat aaattgactc atgcgggcat + 3541 ttatggagtt gattcgtcca ttcacacctt agaaaatctc tatggagtgg atatcaatta + 3601 ctatgtgcga ttgaacttca cttcgttttt gaaattgatt gacttattgg gaggggtaga + 3661 tgttcataat gatcaagagt tttcagctct acatgggaag ttccatttcc cggtagggaa + 3721 tgtccatcta gactctgagc aagctctagg ttttgtacgt gaacgctact cactagcaga + 3781 tggcgatcgt gaccgtggtc gcaaccaaca aaaggtcatt gtagcaatta ttcagaagtt + 3841 aacttctaca gaggttttga aaaactatag taatattctt caaggattgc aggattctct + 3901 tcaaacaaat atgccgattg agactatgat agatttagtg aatactcagt 
tggaaagtgg + 3961 ggggaattat aaagtaaatt ctcaagattt aaaagggaca ggtcggatgg atcttccttc + 4021 ttatgcaatg ccagacagta acctctatgt gatggaaata gatgatagta gtttagctgt + 4081 agttaaagca gctatacagg atgtgatgga gggtagatga aatgatagac atccattcgc + 4141 atatcgtttt tgatgtagat gacggtccca agtcaagaga ggaaagcaag gctctcttgg + 4201 cagaatccta caggcagggg gtgcgaacca ttgtctctac ctctcaccgt cgcaagggca + 4261 tgtttgaaac tccggaagag aagatagcag aaaactttct tcaggttcgg gaaattgcaa + 4321 aagaagtagc agatgattta gtcattgctt atggcgcaga gatatactat actctggatg + 4381 ctctagaaaa gctagaaaaa aaagaaattc ctacccttaa tgatagtcgt tatgctttga + 4441 ttgagtttag catgcatact tcctatcgtg agattcatac gggattgagc aatattttga + 4501 tgttgggaat cacgccagta attgctcata ttgaacgtta tgatgcttta gagaataatg + 4561 aaaaacgtgt ttgtgaactg attaatatgg ggtgctatac tcagataaat agttatcatg + 4621 ttttaaaacc taagttcttt ggtgaaaaat ataaattcat gaaaaagaga gctcggtatt + 4681 ttttggaacg tgatttagtt catgtagttg caagtgacat gcacaattta gacagtagac + 4741 ctccatatat gcaacaggca tatgatatca ttgctaagaa atatggagcg aaaaaagcga + 4801 aagaattttt tgtagacaat cccagaaaaa ttataatgga tcaattaatt taggagaaaa + 4861 tatgaaggaa caaaacactt tggaaatcga tgtattgcaa ctattcagaa ttttatggaa + 4921 aagaaagttg gtcattttat tagtggcaat tataacttct tcagttgctt ttgcctacag + 4981 tacttttgtt atcaaacctg agtttactag tacgactcgg atttatgtag ttaaccgtaa + 5041 tcaggaagag aaatctggtt taaccaatca agacttgcag gcaggatcat acttggttaa + 5101 agactatcgt gaaattatcc tatcgcagga tgttttggag gaagttattt ctgatttgaa + 5161 actagatttg acgccaaaag gtttggctaa taaaattaaa gtgacagtac cagttgatac + 5221 ccgtattgtc tctgtttcag ttaatgatcg agttcctgaa gaggcaagcc gtatcgctaa + 5281 ctctttgaga gaagtagctg ctcaaaaaat tatcagtatt actcgtgttt ctgatgtgac + 5341 aacactggag gaggcaagac cggcgatatc accatcttcg ccaaatatta aacgtaatac + 5401 actaattggt tttttggcag gggggattgg aactagtgtt atagtttttc ttcttgaact + 5461 tttggacact catgtgaaac gtccggaaga tatcgaagat acactgcaga tgacactttt + 5521 gggagttgta ccaaacttga gtaagttgaa ataggagaga ggaatgccga cattagaaat + 5581 agcacaaaaa 
aaactggaat tcattaagaa ggcagaagaa tattacaatg ccttgtgtac + 5641 aaatatacag ttgagcggag ataaactaaa agtaatttcc gttacttctg ttaaccctgg + 5701 ggaaggaaaa acaactactt ccgtaaatat agcaaggtcg tttgcgcgtg caggctataa + 5761 aactcttttg atcgatggcg atactcgaaa ttcagttata tcaggagttt ttaaatcgcg + 5821 tgaaaaaatt acagggctaa cagaattttt atctgggaca gctgatttat ctcacggttt + 5881 atgtgataca aatattgaaa atttatttgt aattcaatcg ggatctgtat caccaaaccc + 5941 tacagccttg ttacaaagta aaaattttaa tgatatgatt gaaacattgc gtaaatattt + 6001 tgcttatatc attgttgata cagcacctat tggaattgtt attgatgcgg caattatcac + 6061 tcaaaagtgt gatgcgtcca tcttggtaac ggcaacaggt gaggtgaata aacgtgatgt + 6121 ccaaaaagcg aaacaacaat tagaacaaac agggaaactg ttcctaggag ttgttttaaa + 6181 taaattggat atctcggttg ataagtatgg agtttacggt tcctatggaa attatggtaa + 6241 aaaataactt aggaaatatt ttatggatga aaaaggattg aaaatttttc tggcagtatt + 6301 acagagtata attgtcattt tattggttta ttttcttagc tttgttagag agacagaact + 6361 tgaacgttct tcgatggtta tactatacct tctccacttt tttgtattct attttagttc + 6421 ctatggtaac aattttttta aaagagggta cttagttgag tttaatagta ctataagata + 6481 tatttttttc tttgcaatag ctataagtgt attaaacttt tttatagcgg aacggtttag + 6541 tatctctaga agaggaatgg tatacttctt aactttagaa ggaatatcct tatacttgtt + 6601 aaatttctta gtaaagaaat attggaagca tgtgtttttt aatctaaaaa atagcaagaa + 6661 aattttactg ttaacagtaa cgaaaaatat ggaaaaagtt cttgataaat tgctagaatc + 6721 tgatgaactt tcatggaaat tggtagcagt aagtgttttg gataaatctg attttcaaca + 6781 tgataaaata cctgtaattg aaaaggaaaa aattattgaa tttgcaacgc atgaagttgt + 6841 ggatgaggtg tttgtcaatc ttccaggaga gagctacgat attggagaaa ttatctctag + 6901 gtttgagaca atggggatag atgtaactgt aaatcttaaa gcatttgata agaatttggg + 6961 tcgcaataaa caaattcatg agatggtagg attgaatgta gtcactttct ctacaaattt + 7021 ttataaaact agtcatgtga tttcaaagag aattctcgat atttgtggtg ccactattgg + 7081 ccttgttctt tttgctatag ctagtctagt tttagttcca ttgattcgta aagatggcgg + 7141 accagctatt tttgctcaaa ctcgtatagg gaaaaatggt cgacatttta ccttttataa + 7201 attccgttcg atgcggatcg atgctgaagc 
tatcaaagaa caattgatgg atcaaaatac + 7261 gatgcaaggt ggtatgttta agattgacaa tgatcctcgt gttacaaaaa ttggtcgctt + 7321 tattcgtaaa accagtttgg atgaattgcc gcagttttgg aatgtcttta taggagatat + 7381 gagtttggtg ggaacacgtc cacctacagt agacgagtat gatcagtata ctccagaaca + 7441 gaaacgtcga ctcagcttta aacctggtat tacaggttta tggcaggtta gcggccgtag + 7501 taaaataacc gattttgacg atgttgtaaa attagatgtg gcttatattg ataattggac + 7561 aatctggaaa gatattgaaa ttttgtttaa aactgttaaa gttgtattta taagagatgg + 7621 agcgaagtga ttttatgaat aaagtgaggg aaattcaact aggagaatta tctttattga + 7681 aaaactttat tgctatttgt agtaaatata atttaagata ttatgctttg ggaggaacat + 7741 tgctaggagc aattcgtcat aaaggattta ttccttggga tgatgatatg gatttaggaa + 7801 tgcctcgaaa agattatgaa aaatttttgt ctatttgtaa caaggaactt ccagaacatg + 7861 ttgttttgag acttcatgat gataatttag gtaatacctc tattatggat acatccttac + 7921 aaattccatt tggagatgaa ctatgtagtc cattcataga tattttccct ttggatggtt + 7981 atccagatga tcgttttcat tattttattt atacaaacaa aattaaattc tatcgtgcac + 8041 tttctaaaat ttcggtaatc gatcgtctac atgacagaga tcggggaagt tttgaaaatg + 8101 taattgtggg tatatcaaaa gttttgaaat taaataaact tttaaaaaca gccactatta + 8161 acaacaaatt acaaaatcta attaaacaat atgattttga aactagttca atagtaggga + 8221 atgtactagg ttcatacaga gaacgtgaac ttgctagaaa agaagtattc ggtgaaccac + 8281 aattactaga gtttgagaac ttagaaataa gttgccatgc aaacccagat gaatatttaa + 8341 caaaaatata tggtgattac atgaaattac ccgaagaagc agaacgtaag ggccatttcg + 8401 agtctacatg gggagattaa tttgaatagt tttgatttaa tgggggtcag gattgaccct + 8461 ttaacaatgg atgaaacagt acaagcggtt gaaaaatttg tcattgaaca acgtcctctt + 8521 catttaatgg gcgtaaatgc tgataagatt aaccaatgtc aatcagatga agccattaag + 8581 aagatagtta acgagtctga aatcatcaat gcagatggtg catcagtcgt tctagcttct + 8641 cgatttttgg gctaccaagt tccagaacga gttgctggaa ttgatttaat gcaaagatta + 8701 ttaaaattag ccgatgaaaa atcttattca gtgtatttct ttggtgctaa agaagaagtt + 8761 ttgcaagata tgttacaaaa ttttaaagaa gagtatccaa atctacgaat tgttggacat + 8821 cgtaatggtt atttttctga ggaagatgag caagatattc aggaagatat 
tcgtgaaaag + 8881 aatcccgacg ttgtatttgt tggaattact tcacctaaaa aagaatacac catccaaaaa + 8941 tttatggata atggagtgaa ttctattttt atgggtgtag gtggtagttt tgatgtattg + 9001 tctggtcaca ttcagcgtgc cccactttgg atgcagaaat caaacttgga gtggttgttc + 9061 cgagttgcta atgaaccaaa gcgtctcttt aaacgatact ttgtagggaa tgttaccttt + 9121 attaagcgag ttttagatga aaaacgaaaa acgaaaaaat aatattttac atattttacg + 9181 aacgatggat attggtggtg ctgagagaat cgtgtaccag ttaagttctg atttgcaaga + 9241 tgaatttgat agtgtccatg ttgcttctac aggaggcctt tgggaaccag aattagagac + 9301 ccaaggaatt atccatcata aaattcaaga tatagacagc aaaaatcctc ttactgtgtt + 9361 gaagttgctt cttactattt atcaaattat taagacaaat gatattactc tgattcatac + 9421 gcatcatcga atggcagctt tttatattcg tttgttaaaa ctgattaatc ccaagctagt + 9481 ccacgtttac actgctcata atgtctttaa agataagttg tctttatata gattttcact + 9541 gaagaatgcc tatagtattg cagttggtca agcagttaat caaaatttga aagatgatgt + 9601 gggagttgca aatagcactg ttatctataa cggagtgatc ttgaaacagt cgaatagaca + 9661 agttgatgag attatgaagt ttggtggaat caagctaggc tgtattgcaa gattatctgg + 9721 acaaaaaggt ttgacttatc tgcttgatgc tatctctttg atttctgatg aaaatctccg + 9781 tttatttatc gttggggatg gagaacttag agacgaatta gaaaataagg ttaaagaact + 9841 cgaattagaa gataagataa cttttttagg ctatagacag gatgtagtcg agtgtattaa + 9901 tagttttgat ttcctagtgt cttcgtcgtt atttgaaggc atggctctaa atgttattga + 9961 agcatttatg aatggaaaaa caatggttgc taccgatatt cctggcaata atgaagttgt + 10021 tacaaaagaa aatgggatct tggttcctgc taaagatgct agggccttag cttctgctat + 10081 tgagagtctg gcgactgact caactcttag aactaggtta gctcatcaag ctaaaaaaga + 10141 ttatgaagag aagtttaggt atcctttatt tttagagaat tatcgtaaat tttatcaaaa + 10201 actaatggga gattcaaaat gaaaaaagta atgttagttt ttgggacgcg tccagaagca + 10261 ataaaaatgt gtcccttagt gaatgagttg aagaaaaatg attcaatcaa aacacttgtg + 10321 tgtgtaactg gtcaacataa agaaatgtta gagcaagttt tagatgtctt taaagttgtt + 10381 cctgattatg atttaggaat tatgaaggca aatcaaacac tatttacaat cacgacaagt + 10441 attttagata aaattcaagc agttttagag caggaaaaac cagatattgt tcttgttcat + 10501 
ggggatacta caaccacttt tgcgacagct ttagctgcat tttacatggg aattaaagtt + 10561 ggacatgtag aggcaggatt gagaacttat aatcttcaaa gcccgtttcc tgaagaattc + 10621 aatcgtcagg ctacttcaat tattgcggat ttcaattttg ctccgacaga agtggctaaa + 10681 gagaatcttc taaaagaggg aagagagaat atctatgtta ccggaaatac tgtcatcgac + 10741 gccttgaaga caactgttca agatcattat gatcatccta ttttagagtg ggctaagaac + 10801 agtaaactaa tcatgctgac agcccataga cgtgaaaatc ttggtcaacc catggaaaat + 10861 atgtttaatg cagttaatcg tatactgaat gagtttgaag atgttaaagt cgtatatcct + 10921 attcacaaga atcctaaagt tcgtgagcta gcaagtaaag tgtttggtga caatgaacgt + 10981 atgcaaatca ttgaaccact agaagtcatt gatttccata atttcatgaa tcaaagctat + 11041 atgattttaa cagattcagg tggtgtacaa gaagaagcac cttctttagg taaaccagta + 11101 ttagtaatgc gtgatacaac tgaacgtcca gaggggattg ctgcaggaac cttgaaatta + 11161 gtaggaacag aagatgaaaa tatttatagg aattttaagc ttcttttgga aaatgaagag + 11221 gaatacaaca agatgagtaa ggcaagcaat ccttatgggg atggaacagc ttgtcaacag + 11281 attgtagaag ttatcatgaa gggattagta taatgaggaa agtttcgatt gttgttccag + 11341 tatacaacgt tgaagattat ttgaaatatt gtgttgatag cttaattaat caatcgtaca + 11401 aggatattga gattattttg gtagatgatg gctctacgga tgattctgga agaatatgtg + 11461 ataagtatgc ccaagaagat gaccgtatta gagtcttgca tattgagaat ggaggccttt + 11521 ctaatgctcg aaatacgggt gtaaagtttg cttctgctga gtggataatt ttcattgatt + 11581 ctgatgatta ctatgatcgt agaactgttg agtatttagt gcaacttcaa aagaagtatg + 11641 ctgttgatct tgttgcaact tccgtcatcg aagttaggga cttccaaagt gaggattttt + 11701 taggttcatt aactaacata gattctttga aattagatcg ctatacagct ttgaaggaga + 11761 tgttttatgg aaatatagtt ggaactcatc cagggggaaa actatacaaa aaagaaatct + 11821 tgatgaagtt tccttttcca gagggtatga tctatgaaga tttggctgtc tcttttgagc + 11881 atatcggagc atgcaatgaa attgccgtag gatgtatcaa tttatacaaa tattatcgaa + 11941 gacctggaag tattgtcaat tcttcttata gtgataaatt tttagacttc tataaggcta + 12001 tagagatgaa tagagaattt gttcagagaa attatcctaa tgataaggaa atgaataaag + 12061 cacttactgt acgttatgtc tttaaggggt tacatgtagt acatgctatg cttagttcag + 12121 
agatgtattc ggatgttaat aaaatcagaa aagaatacat taggtacttc aacgatatta + 12181 ttcctaatcc aaatataaca gggaaaaata aagtgaaata cctgatgctt ttggtttctc + 12241 caaaactgta tgaaaaaatt agagagaaga tgggttaggt aagaatgaag gttttaaaaa + 12301 attatgcata taatctctct taccagctac tagtgataat tcttcctatt ataacaacac + 12361 cttatgtaac tagggtattt agttcaaatg atttaggaac ttttggctac tttaattcga + 12421 ttgttgctta ttttattttt ttagcaacat taggagtagc taattatggg acaaaagaaa + 12481 tttcagctca tagaaataat atccctaata atttttgggg tatttatacc ttgcagttta + 12541 ctgcgacttg tatatcgata tttctatata ttggtctgtg cttttcattt tcatttatgc + 12601 aaaatccagt agcttatata ttggtattat ctctattatc taggggatta gatattactt + 12661 ggctttttca aggactagaa gattttagga agataactgt tagaaatatc actgtcaaac + 12721 tcataggtgt tatttcaata tttttgttca taaagtctca gaacgattta tatttatatg + 12781 tctttttatt aactatattt gaatttttag gacaattaag tatgtggctg ccagctctag + 12841 aatttatagg taagccacaa tttgatttca attatgccaa gaaacatctt aaaccggtga + 12901 tattactgtt tttacctcaa atagcgatat ctttatatgt tacgttaaat aggacaatgc + 12961 ttggcgcttt agcatcaaca acagatgttg gaatttatga tcaatcttta aagttggtaa + 13021 atatcctact tactttggta acttcactag gtagtgttat gttaccacgt gtttcgaatc + 13081 ttttatcaac aggggataag aagtctgtga atcgcatgaa tcaattatct ttctttatat + 13141 acaatcttgt gatttttcca actattgcag gtatgttaac tatcaataat gactttgtga + 13201 aatttttctt aggaaatgac tttcaagaag caaaatatgc tattgcaatc atgattttta + 13261 ggatgttttt tattggttgg acgaacatta tggggattca aattttgata cctcataata + 13321 agaacaaaga atttttgact tcaacaacgg ttccagcaat tattagtgtt ggtttaaatt + 13381 tacttttact gcctgaattt ggatatattg gggctgcgat tgtttctgta ttaacagaaa + 13441 tatttgtatg ggttatccaa ttgtatttta caagaaaata tttaaaagat gtaccaattt + 13501 ttaaatcaac tgttaaaata ttttcagcat caattcttat gtatgttgct ctttcatttt + 13561 tgaagtcaat tttgactttt acacctattg ttaatgttgt tgtatgtgct attgtggggg + 13621 cgatacttta tggtttacta attttaatat ttaaagtagt tagcttaaag gagataaaag + 13681 agcagctgtt aaataattag tatgatgata atctatacag aaataatcaa agttattttt + 13741 
gtaagaattt gttttagcta agttagttga ttgaaaaagt ttagaaaagg aaggatgaaa + 13801 gattgtagat gaactaaaag ataaattatt aattatgttc attctatatt attctttact + 13861 aaataaataa tatgataaaa attaaatttg aaaatctact ggttagtatt gttgtatctg + 13921 tagtgatatt ttttaatact atatctacta caatgctgga tagaactttt tttcaagcta + 13981 aagcaaatta tcttttatta gtagttttgt tattaggtct tcgttttatg tttccaacac + 14041 gtatttcatt taaatatcta atattttctt ctttgctatt attatcagga attttagtat + 14101 attttcagac tggaaaactt aattttcttg tctattcagc ccttctggtt ttattagtta + 14161 atgtagatat gaaagtagtt ttgaaaacgt atctcattgt agcgggcatt cttgtactaa + 14221 gtgtatttct tttatctctc ttaggtgcag ttcccaattt acaatataat cgcgaaggag + 14281 ttattcggaa ttcatttgga tttatttatc ctacagattt tgcatcccac tgtttctatc + 14341 ttttcttggc tttttcttat ttattaaaag ataaatttat atggattagg tctctaatag + 14401 gtgtactttt atctttcttt attataaaat attgtgatgc acgtttaaat gccttatcaa + 14461 ttattttagc aacaattatt tttatatttt tctactttaa tgaagataag aaattccgga + 14521 tctattcaat ttccccttat tctgtagttc tatgttcgtc aataatgatg tatttatctt + 14581 atattttctc tttgggatct ccatttttag tatctatcaa taaattaatt acaggtagat + 14641 tagctttggg gaaaaatgca tttaatactt ttgatgtaca tctatttgga actagagacg + 14701 tattatttaa agggtcagga ggtaaaacgg aggctgttat tgattataac tacgtagatt + 14761 catcgtatgt tcaaatgtta tttacatatg gtgttatacc tcttgtactg cttatatgta + 14821 tgtatgttgt aatttcgata gaacagtata aacagggtca atatttatat gtagtaatat + 14881 tatctttagt ggctctaaac tgcatgattg aagctttttg gtttgtccct acttacaata + 14941 tattcatgtt tttgttattc acaaaaaata cttttcttaa taagtcgttg aataatttta + 15001 atcctttgga taaaacggaa ttgttgaact gataaaatta aattttttga tttgtaaaat + 15061 tatttttttc ataaaatgaa ctattctaac taatatttca aaaaaatttt ttaaaatcta + 15121 tttttgcatg atattttaat gaagataact ttacaatgct acaaaagtgt cgagtctaat + 15181 aaaggagtgt aatatgtacg actatctaat cgttggtgct ggattgtcag gtgcaatctt + 15241 tgcttatgaa gcaaccaagc gtggaaaaaa agtaaaagtt attgataaac gtaaccacat + 15301 tggtggaaat atctactgtg agaatataga aggagttaat gttcataaat atggtgcaca + 15361 
tatcttccat acttctaata agaaagtctg ggattatgtg aatcaatttg ctgaatttaa + 15421 caactacatc aactcgcctg tagctaatta caagggtagc ctttataatc tacctttcaa + 15481 tatgaatact ttctatgcta tgtgggggac aaaaactcct caagaagtga aaaataagat + 15541 tgctgagcaa acggctcaca tgaaagacgt tgaaccgaaa aacttggaag aacaggctat + 15601 caagttgatc ggtccagata tttatgaaaa gttgattaaa ggatatactg aaaagcaatg + 15661 gggacgttcc gcgactgacc ttccaccgtt tatcatcaaa cgtctaccag ttcgtttgac + 15721 ttttgataat aactacttta atgaccgtta ccaaggtatt ccaatcggtg gctataatgt + 15781 cattatcgaa aatatgctga aagatgttga agtagaactt ggagttgact tttttgccaa + 15841 tcgtcaggaa ttagaagctt ctgctgaaaa agttgtcttt acagggatga ttgaccaata + 15901 tttcgattat aaacatggtg agctagaata ccgtagtctt cgttttgagc atgaagttct + 15961 agataaggaa aattatcaag gaaatgccgt tgttaattat acagaacgag aaattcctta + 16021 tactcgcatt attgagcaca aacattttga gtacggaaca caagataaaa cggttattac + 16081 tcgtgaatac ccagctgatt ggaaacgtgg agatgaacct tattatccaa tcaatgatga + 16141 gagaaacaat gccatgtttg ctaaatatca agaagaagca gtacagaatg ataaggtaat + 16201 tttctgtgga cgtttggctg attataaata ctacgacatg catgtggtta ttgaacgtgc + 16261 cctaaatgtt gtagaggaag aatttaaata agataacgaa ggataaaatt gatagatgaa + 16321 atattatcta aaagaagaat ttctgacgga ttctggtgta cgaaatgcgg gaaataaggc + 16381 tcgaaacgat gttgaagaaa tagtagttcg tgagggctat agtcctttgt tattgatggt + 16441 agatgattgg tatcaaatgg ggactattag agcccaacga cacaaggcta aagcgctatc + 16501 caaagctatc tctaagttga aggaaggcga tcagctactt attcaatttc ctatgcttca + 16561 tcatagtttc tttacgactc atttagtcaa aagaatgcaa tgtaaaggag tgaagtttca + 16621 ctttattatc catgatttag aagttttgcg ctatgccaat ttggatacag tacccttaaa + 16681 gcataaaatt cgtgttcatc ttcaagagtc aagtcttttg aaacaagctg atggtcttat + 16741 tgctcataat ccagttatga aatcagtgct tgttgataag gggatttctg agaaaaaaat + 16801 agttagttta ggcatttttg actatctgat cccgaattat caggacaaag aagatttatc + 16861 gaaggaaggg gctattattg tagctggaaa tttagctcaa gaaaaagcag gttatttata + 16921 tgagttgcct acaagaccgg catataacct ctatggtgtt ggttttgatg aggctagaaa + 16981 
actatccaat gaaacctatt ttggttcatt tcttccagat gaattaccat cagcattaga + 17041 aggaagcttt ggtttggttt gggacggtgg tagttctaaa acttgtagcg gcgtgtttgg + 17101 tgagtatttg agatacaata attcccacaa ggcctccctt tatttggctt ctggttttcc + 17161 tattattgtc tgggggcaat ctgccttggc taatttcgtc ttagaaaaag agtgtggaat + 17221 tagtgttgag agtttacttg atttagaaga agtattggaa catttgtctc aagaagagta + 17281 tcagaatttg gtcaaaaatg ctaagtccgt aggtcaaaaa attcgtgaag gttcttatct + 17341 cctttctgca ttacaagctt taaattaatg aatctaaaaa ttatacaaat agatagatga + 17401 gggagttact ggattccctc ttttcttata tcaagggagt tttaagtgaa gaattaaagt + 17461 aagcgcgtca taacaaggta tctatcattc atggagctcc tcctgtatac tattagtaaa + 17521 gtaaaactat tggaggatat tgtaatgcca caacctattg ttcctgtaga gattccacaa + 17581 tctcgtcctt ttgattctaa aaagagaaat gatattctgc ttaaaattcg tattggcaag + 17641 cttgaagtaa gtttttttca atctctcaat ctcgaaatga tagaacagct tttggataag + 17701 gtgttgctct atgacaattc atctatctag cctagggtag gtctatctcg tgtgtgggaa + 17761 aactgatatg aggcaaggca ttgattcact ggcttatctg gttaaaaccc actttgaatt + 17821 ggatcctttc tccggtcaag tctttctctt ttgtggtgga cgtaaagacc gctttaaagt + 17881 cctttactga gatggtcaag gattttggct actatataaa cgctttgaga acggcagact + 17941 gacttggccc agtacagaaa aggatgtcaa agctctcaca tctgaacaag tagactggct + 18001 tatgaagggc ttttctatca ctccaaaaat aaatccatca gaaagtcgtg atttctattg + 18061 aaatgaggac tttcttttta gtataataaa ggtagaaaac aaggagggga agcccatgga + 18121 agaagattga aaatcattca acaacagagt gctacaattg atagtctcac caatgaactt + 18181 gcccttcttc gtgaacaagt ggcttatctg actcaaaagc tctatggaaa atcctctgag + 18241 aaaagtgttt gcccctctgg acaactcagt ctttttgaag aggaacaaaa tatggaagaa + 18301 gactctgact tacccagttg aaagagaaga aatcacctat aaacgtaaga aagctaaagg + 18361 gaaacgtcaa gctcttcttg cccaatttga ttcagaagaa gttcatcatc gcttagaggc + 18421 ctgcatttgc cctgactatc agggagatct aaaagagatt ggagcgagcc ttcaacgaca + 18481 agaattagtc tttattcctg cgcaattaaa acgaatagat catatccaac acgcttataa + 18541 gtgccaagca tgcagtgata aaaatcggag tgataaaatc gtgaaagctc ctattcctaa + 18601 
agcccctttg gcgcatagct ttggctcagt ttctattatc gctcacacca tccatcagaa + 18661 gtttaatctg aaggtaccca attatcgcca agaagaagat tgggctagga tgggtttacc + 18721 aatcacacgt aaggaaatct ctaattggca tatcaaggca agtcaatact atttagagtc + 18781 cctttataac cttttacgag aaaagttgtt agaacaacct cttcttcatg cggatgaaac + 18841 ctcttatcgg gttctagaga gtgatagcca tctgacctac tattggacct ttttgtctgg + 18901 gaaatcagag aaacaaggga ttacgcttta ccatcatgat cagcgtcgga gtggttcggt + 18961 agtgcaagaa ttcctaggaa attattctgc ctatgcgata gcagtccaaa gtttaggagc + 19021 aaggcgacgc taagcttggt aaactacgaa ccgctagaag cttatcgtca actggaagaa + 19081 gctgaacttg ttggatgttg ggcgcatgtg agaaggaagt tttttgaagc gccccccaag + 19141 caagcggata aatcatcgtt aggagctaaa ggtttagctt attgtgatca gttatttgcc + 19201 ttggaaagag actgggaggc tttgctagct gatgaacgac tacagaaacg tcaagaagag + 19261 ctccaacccc taatggaaga tttctttgct tggtgccggc gtcagtcagt tttatcgggt + 19321 tcaaaactag gaagggcaat tgaatacagc ctcaagtata aagaaacctt taagaccatt + 19381 ttaaaagacg gacatctggt cctttccaat aatctagctg aacgcgccat taaatcattg + 19441 gttatgggac ggagtaaaag agtccagtgg actcttttag cctaagctca gtttaaaaaa + 19501 gtgagggtgg ttattttctc aaagttttga aggagctaaa gcaagagcta ttattatgag + 19561 cttattggaa acagctaaac gtcatcaact aaatagcgag aaatatctat cctatcttct + 19621 agaatgtctt ccaaacgagg aaactctcgt aaacaaagag gttttagagg cttatttacc + 19681 atgtactaaa gttgtacaag aaaagtgcaa ataagaaatc tccagattag gaactatata + 19741 tgagttctct agtctggaga tttttcaata tacttcgtta ttggacggtt acgatattca + 19801 tattttttgc aaagatgttg tttgaaaaat aattttcaaa aattctgaaa attctgttga + 19861 caactttctg aaaagagtct ataatggaga gaaagtttta aaggagaaaa tgatgaaaag + 19921 ttcaaaacta tttgcccttg cgggcgtgac attattggcg gcgactactt tagctgcatg + 19981 ctctggatca ggttcaagta ctaaaggtga gaagacattc tcatacattt atgagacaga + 20041 ccctgataac ctcaactatt tgacaactgc taaggctgcg acagcaaata ttaccagtaa + 20101 cgtggttgat ggtttgctag aaaatgatcg ctacgggaac tttgtgccgt ctatggctga + 20161 ggattggtct gtatccaagg atggattgac ttacacttat actatccgta aggatgcaaa + 20221 
atggtatact tctgaaggtg aagaatacgc agcagtcaaa gctcaagact ttgtaacagg + 20281 actaaaatat gctgctgata aaaaatcaga tgctctttac cttgttcaag aatcaatcaa + 20341 agggttggat gcctatgtaa aaggggaaat caacgatttc tcacaagtag gaattaaggc + 20401 tctggatgaa cagacagttc agtacacttt gaacaaacca gaaagcttct ggaattctaa + 20461 gacaaccatg ggtgtgcttg cgccagttaa tgaagagttt ttgaattcaa aaggggatga + 20521 ttttgccaaa gctacggatc caagtagtct cttgtataac ggtccttatt tgttgaaatc + 20581 cattgtgacc aaatcttctg ttgaatttgc gaaaaatccg aactactggg ataaggacaa + 20641 tgtgcatatt gacaaagtta aattgtcatt ctgggatggt caagatacca gcaaacctgc + 20701 agaaaacttt aaagatggta gccttacagc agctcgtctc tatccaacaa gtgcaagttt + 20761 cgcagagctt gagaagagta tgaaggacaa tattgtctat actcaacaag actctattac + 20821 gtatctagtt ggtacaaaca ttgaccgtca gtcctataaa tacacatcta agaccagcga + 20881 cgaacaaaag gcatcgacta aaaaggctct cttaaacaag gatttccgtc aggctattgc + 20941 ctttggtttt gatcgtacag cctatgcctc tcagttgaat ggacaaactg gagcaagcaa + 21001 aatcttacgt aatatctttg ttccaccaac atttgttcaa gcagatggta aaaactttgg + 21061 cgatatggtc aaagagaaat tggttactta tggggatgaa tggaaggatg ttaatcttgc + 21121 agattctcag gatggtcttt acaatccaga aaaagccaag gctgaatttg ctaaagctaa + 21181 atcagcctta caagcagaag gtgtgacatt cccaattcat ttggatatgc cagttgacca + 21241 aacagcaact acaaaagttc agcgcgtcca atctatgaaa caatccttgg aagcaacttt + 21301 aggagctgat aatgtcatta ttgatattca acaactacaa aaagacgaag taaacaatat + 21361 tacatatttt gctgaaaatg ctgctggcga agactgggat ttatcagata atgtcggttg + 21421 gggtccagac tttgccgatc catcaactta ccttgatatc atcaaaccat ctgtaggaga + 21481 aagtactaaa acatatttag ggtttgactc aggggaagat aatgtagctg ctaaaaaagt + 21541 aggtctatat gactacgaaa aattggtcac tgaggctggt gatgagacta cagatgttgc + 21601 taaacgctat gataaatacg ctgcagccca agcttggttg acagatagtg ctttgattat + 21661 tccaactaca tctcgtacag ggcgtccaat cttgtctaag atggtaccat ttacaatacc + 21721 atttgcattg tcaggaaata aaggtacaag tgaaccagtc ttgtataaat acttggaact + 21781 tcaagacaag gcagtcactg tagatgaata tcaaaaagct caggaaaaat ggatgaaaga + 21841 
aaaagaagag tctaataaaa aggctcaaga agatctcgca aaacatgtga aataa +// + diff --git a/public/res/serotype_genbank/serotype_37.gb b/public/res/serotype_genbank/serotype_37.gb new file mode 100644 index 0000000..6a00549 --- /dev/null +++ b/public/res/serotype_genbank/serotype_37.gb @@ -0,0 +1,772 @@ +LOCUS CR931709 17777 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 264/73 (serotype 37). +ACCESSION CR931709 +VERSION CR931709.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 17777) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 17777) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..17777 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="264/73" + /db_xref="taxon:1313" + gene <1..163 + /gene="dexB" + /locus_tag="SPC37_0001" + CDS <1..163 + /gene="dexB" + /locus_tag="SPC37_0001" + /codon_start=2 + /transl_table=11 + /protein_id="CAI34375.1" + /db_xref="GOA:Q4K2R1" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K2R1" + /translation="DRRFLVVANLSNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVP + WDAFCVELL" + gene 322..490 + /gene="aliB" + /locus_tag="SPC37_0002" + /pseudo + CDS 322..490 + /gene="aliB" + /locus_tag="SPC37_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(491..1353) + /gene="tnp" + /locus_tag="SPC37_0003" + /pseudo + CDS complement(join(491..1024,1024..1353)) + /gene="tnp" + /locus_tag="SPC37_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(join(962..1024,1024..1335)) + /gene="tnp" + /locus_tag="SPC37_0003" + /note="HMMPfam hit to PF01710, Transposase, score 4.9e-23" + /pseudo + gene 1587..3032 + /gene="wzg" + /locus_tag="SPC37_0004" + CDS 1587..3032 + /gene="wzg" + /locus_tag="SPC37_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI34378.1" + /db_xref="GOA:Q4JZ71" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4JZ71" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLAVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLTDIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KMSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKRILLTTTPRDSYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGIDVYNDQ + 
GFTAHTNGKYYPEGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRMDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1587..1703 + /gene="wzg" + /locus_tag="SPC37_0004" + /note="Signal peptide predicted for SPC1746 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.526 between residues 39 and 40" + misc_feature 1791..2138 + /gene="wzg" + /locus_tag="SPC37_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 1.5e-64" + misc_feature 2316..2759 + /gene="wzg" + /locus_tag="SPC37_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 1.8e-68" + gene 3034..3765 + /gene="wzh" + /locus_tag="SPC37_0005" + CDS 3034..3765 + /gene="wzh" + /locus_tag="SPC37_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34379.1" + /db_xref="GOA:Q4JZ70" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4JZ70" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTLDALEKLEKKEIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSLHVLKPKLFGERYKFMKKRAQYFLEQDLVHIIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKSQELFIDNPRKIVMDQLI" + misc_feature 3037..3645 + /gene="wzh" + /locus_tag="SPC37_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 7.4e-36" + gene 3771..4466 + /gene="wzd" + /locus_tag="SPC37_0006" + CDS 3771..4466 + /gene="wzd" + /locus_tag="SPC37_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34380.1" + /db_xref="GOA:Q4JZ69" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4JZ69" + /translation="MMKEQNTIEIDVFQLFKTLWKRKLMILIVALVTGAGAFAYSTFI + 
VKPEYTSTTRIYVVNRNQGDKPGLTNQDLQAGTYLVKDYREIILSQDALEKVATNLKL + DMPAKTLASKVQVAVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAFLLIELLDTRVKRPEDVEDVLQI + PLLGIVPDLNKMK" + misc_feature 3771..3887 + /gene="wzd" + /locus_tag="SPC37_0006" + /note="Signal peptide predicted for SPC1748 by SignalP 2.0 + HMM (Signal peptide probability 0.625) with cleavage site + probability 0.411 between residues 39 and 40" + misc_feature 3792..4208 + /gene="wzd" + /locus_tag="SPC37_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 3.7e-55" + misc_feature 4314..4391 + /gene="wzd" + /locus_tag="SPC37_0006" + /note="PS00217 Sugar transport proteins signature 2." + gene 4476..5165 + /gene="wze" + /locus_tag="SPC37_0007" + CDS 4476..5165 + /gene="wze" + /locus_tag="SPC37_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34381.1" + /db_xref="GOA:Q4K1K6" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K1K6" + /translation="MPTLEISQAKLDFVKKAEEYYNALCTNLQLSGDGLKVFSITSVK + LGEGKSTTSTNIAWAFARAGYKTLLIDGDIRNSVMLGVFKARDKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRKCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGVVLNKFDTSVDKYGSY + GNYGDYGKNKK" + gene 5180..6547 + /gene="wchA" + /locus_tag="SPC37_0008" + CDS 5180..6547 + /gene="wchA" + /locus_tag="SPC37_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI34382.1" + /db_xref="GOA:Q4JZ67" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4JZ67" + /translation="MNGKIVKPSLAIIQSFLVILLTYLLSAVREAEIVSTTAIALYIL + HYFVFYISVYGQDFFKRGYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYF + LTLHALLVYVLNLFIKWYWKRAYPNFKGSKKILLLTATSRVEKVLDRLIESNEVVGEL + 
VAVSVLDKPDFQHDCLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + IDVTVNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHVIAKRIIDIVGALVGLIL + CGLVSIVLVPLIQKDGGSAIFAQTRIEKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSERSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVLM + KDGAK" + misc_feature 5180..5272 + /gene="wchA" + /locus_tag="SPC37_0008" + /note="Signal peptide predicted for SPC1750 by SignalP 2.0 + HMM (Signal peptide probability 0.845) with cleavage site + probability 0.335 between residues 31 and 32" + misc_feature 5963..6544 + /gene="wchA" + /locus_tag="SPC37_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 4.7e-154" + gene 6534..7340 + /gene="wciB" + /locus_tag="SPC37_0009" + CDS 6534..7340 + /gene="wciB" + /locus_tag="SPC37_0009" + /note="member of homology group 16" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34383.1" + /db_xref="GOA:Q4JZ66" + /db_xref="UniProtKB/TrEMBL:Q4JZ66" + /translation="MERSRLIDVKIIVATHKEVKMPQDNSLYLPIHVGRDGKSDIGFI + GDNTGDNISSLNPYYCELTGLYWAWKNLDYNYLGLVHYRRYFTNKSQGYNENVNMDDV + ILSRFNVEILLEKSDVIVPKKRKYYIETLYSHYAHTLNGEHLDLARKIIEQNSSEYLS + SFDKVMKQRSGYMFNMFIMKKELLDDYLPWLFSILDTMYEQMDLTDYTPFESRLFERV + SELLFNVWLCKKGITPKEVPFMYMERVDLFEKGKSFLMAKFFGKKYGQSF" + gene order(7344..7838,7850..8401) + /gene="wciC" + /locus_tag="SPC37_0010" + /pseudo + CDS join(7344..7838,7850..8401) + /gene="wciC" + /locus_tag="SPC37_0010" + /note="member of homology group 125" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /db_xref="PSEUDO:CAI34384.1" + misc_feature join(7812..7838,7850..8332) + /gene="wciC" + /locus_tag="SPC37_0010" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 2.8e-14" + /pseudo + gene 8398..9396 + /gene="wciD" + /locus_tag="SPC37_0011" + CDS 8398..9396 + /gene="wciD" + /locus_tag="SPC37_0011" + /note="member of homology group 60" + /codon_start=1 + /transl_table=11 
+ /product="putative glycosyl transferase" + /protein_id="CAI34385.1" + /db_xref="GOA:Q4JZ65" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JZ65" + /translation="MTKKKNTGKILTVVVPSYNAENYLQETMPTILSAKNIERGELLI + VNDGSTDRTEEIARQFEREYEGIVRVISKENCGHGSAVNAGIENAVGNYFKVVDADDW + VNTNNLEDLIVFLSEVDVDQVLSPYDKIFVNYRGDIEREEECNEFSQVENEVIYSAEE + FYTRIKQTVGMHSITVKTSLLQENNIRLSEKMFYVDMEYIVYMLPYVKKVVLFDKSIY + RYRLGTETQSISMASYIKNRDMHKQVIYHLVDFYNQMRSSAVLRRITWKLILNLIRQQ + WIIYFNLSKKEGKNSECFEFDNWLIKEGRIKKIPLYFFKAVKYIRFKVKYFLGIRK" + misc_feature 8431..8976 + /gene="wciD" + /locus_tag="SPC37_0011" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 7.5e-30" + gene 9398..10366 + /gene="wciE" + /locus_tag="SPC37_0012" + CDS 9398..10366 + /gene="wciE" + /locus_tag="SPC37_0012" + /note="member of homology group 44" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34386.1" + /db_xref="GOA:O86892" + /db_xref="InterPro:IPR008441" + /db_xref="UniProtKB/TrEMBL:O86892" + /translation="MRKIGKVINEYFVLRKSFTPAIARNKLFEKFWGRIGNYKIFNNI + ASNFYQYKHETIINFLEKDFSQFLKSYNFKEVSHKEIEQRKIFSMWIQGYESAPKLVQ + KTIDSQRKYAEKYGYKFVFLDENNIREYVTLPSEIVEKYENGTIDFIKYSDVVRGTLL + SKYGGVWLDSTIYVDSSRELNYLKKDFYTIRAKTHERVPKYIANGRWSAFCLSGEKQN + IVFDFLEKFHVAYFMKYDIVLDYFLIDYIIELGYRTNDLIRNYIDKVEENNQELFFLA + DNFSNQYDEKEWAGVLSTTALFKCSYKCPINEATGTYFDRLMKGEL" + misc_feature 9497..10348 + /gene="wciE" + /locus_tag="SPC37_0012" + /note="HMMPfam hit to PF05704, Capsular polysaccharide + synthesis protein, score 1.1e-144" + gene 10386..11357 + /gene="wciF" + /locus_tag="SPC37_0013" + CDS 10386..11357 + /gene="wciF" + /locus_tag="SPC37_0013" + /note="member of homology group 25" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34387.1" + /db_xref="GOA:O86893" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:O86893" + /translation="MISVIVPVYNVADYLRFALDSLLEQTYKDFEVILVNDGSTDNSG + 
EICDEYGKLYDNIHVFHKKNGGLSDARNFGLEKSRGEFITFLDSDDYFEPYALELLIT + IQKKYDVDIVSTKGGITYSHDIYSKKLMAEDYLTVKILTNKEFLAAVYYNDEMTVSAW + GKLYKRDLFKTIFPKGKIYEDLYVVAERLLNIKTVAHTDLPIYHYYQRQGSIVNSTFS + DRQYDFFDAIDHNEAIIKKFYCGDKELLAALNAKRVIGSFILSNSAFYNSKNDITKII + RIIKPYYWEVIKNKKIPMKRKVQCVLFLLSPNYYYKIKDKMLQRGRI" + misc_feature 10392..10904 + /gene="wciF" + /locus_tag="SPC37_0013" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 6.8e-50" + gene 11358..12581 + /gene="wzy" + /locus_tag="SPC37_0014" + CDS 11358..12581 + /gene="wzy" + /locus_tag="SPC37_0014" + /note="member of homology group 126" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI34388.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ62" + /translation="MHVRLDGLLDYIFLFSVIITCNTMYSTSQGFDGLGKWATLLLVV + SVFLKLLISRISMKAINVIVSRSLIFILIILLIVILNGFKISETSFVYYFVLFPIFMM + ILQMYYDVNEIANLIRKFVRIIFLLAIGSLLFWLIGSVFHIISPTVYVLNYWNGGGIV + EGYYNLHFEAQKIEILGAILIRNTGIFAEAPMWSLVLSLALIFQTLHIKKWNFTTWIL + IITIMTTTSTTGVYIIGLIFLYVLFSKTSGVKRYVSSLFILATICCFSILWDNKSGTG + SATIRFDDYKAGFLAWQKSPIWGLGISDGLRAIEQHMDRTVRYNLGYSNSFFVVLAQG + GIMLASYYFYPVIKIILNKFSSNDLKFSALLIIFLMITTIFIETYMFLFVISLYYSLD + FGDDRDCHEKQYITN" + misc_feature 12180..12377 + /gene="wzy" + /locus_tag="SPC37_0014" + /note="HMMPfam hit to PF04932, O-Antigen Polymerase, score + 3.2e-11" + gene 12612..14027 + /gene="wzx" + /locus_tag="SPC37_0015" + CDS 12612..14027 + /gene="wzx" + /locus_tag="SPC37_0015" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI34389.1" + /db_xref="GOA:O86895" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:O86895" + /translation="MKILKNYAYNLSYQLLVIILPIITTPYVTRVFSSDDLGTYGYFS + SIVTYFTLLATLGVANYGTKEISAHRKEIGKNFWGIYSLQFGATWLSILLYLALCFLF + TSMQNPVAYILGLSLVSKGLDISWLFQGLEDFRKITVRNITVKLVGAISIFLFVKSAN + DLYLYVFLLTIFELLGQLSMWLPARQFIGKSYFDWKYAKKHLKPVILLFLPQIAISLY + VTLDRTMLGVLASTKDVGIYDQALKLVNILLTLVTSLGSVMLPRVSSLLSSGDYKAVN + 
KMHEMSFLIYNLVIFPIIAGMLIVNDDFVRFFLGQNFQDARYAIAIMTFRMFFIGWTN + IMGIQILIPHNKNKEFMVSTTVPAILSVGLNLLLLPQFGYIGAAIVSVLTEAFVWGIQ + LFYTRFYLKEVPIIGSMTKTALASAVMYGLLLGSKTSIHFSPTINVLIFSVLGGIIYL + FAILSLKVVDVKELKQIIRKN" + misc_feature 12618..13412 + /gene="wzx" + /locus_tag="SPC37_0015" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 4.4e-79" + gene 14029..15011 + /gene="wciG" + /locus_tag="SPC37_0016" + /pseudo + CDS join(14029..14934,14934..15011) + /gene="wciG" + /locus_tag="SPC37_0016" + /note="member of homology group 21" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /db_xref="PSEUDO:CAI34390.1" + gene order(15025..15864,15868..16125) + /gene="glf" + /locus_tag="SPC37_0017" + /pseudo + CDS join(15025..15864,15868..16125) + /gene="glf" + /locus_tag="SPC37_0017" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /pseudo + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /db_xref="PSEUDO:CAI34391.1" + misc_feature join(15460..15864,15868..16062) + /gene="glf" + /locus_tag="SPC37_0017" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 1.6e-135" + /pseudo + gene 16196..17243 + /gene="wcjE" + /locus_tag="SPC37_0018" + /pseudo + CDS join(16196..16534,16533..17243) + /gene="wcjE" + /locus_tag="SPC37_0018" + /note="member of homology group 18" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /db_xref="PSEUDO:CAI34392.1" + gene 17418..>17777 + /gene="aliA" + /locus_tag="SPC37_0019" + CDS 17418..>17777 + /gene="aliA" + /locus_tag="SPC37_0019" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34393.1" + /db_xref="GOA:Q4JZ60" + /db_xref="InterPro:IPR000914" + /db_xref="UniProtKB/TrEMBL:Q4JZ60" + /translation="MMKSSRLFALAGVTLLAATTLAACSGSGSSTKGEKTFSYIYETD + PDNLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKD + AKWYTSEGEEYAAVKAQD" + misc_feature 17418..17504 + /gene="aliA" + /locus_tag="SPC37_0019" + 
/note="Signal peptide predicted for SPC1761 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.277 between residues 29 and 30" + misc_feature 17664..17732 + /gene="aliA" + /locus_tag="SPC37_0019" + /note="PS01040 Bacterial extracellular solute-binding + proteins, family 5 signature." +ORIGIN + 1 cgaccgtcgc ttcctagttg tggctaactt gtccaatgaa gagcaagact tgacagtaga + 61 aggaaaagtc aaatctgtct tgattgaaaa caccctagct caagaagtct ttgaaaaaca + 121 aatcttagtt ccatgggatg ctttctgtgt ggaattacta taaatatttt ttgcagaaaa + 181 atttaaaatt gaaatcgtat aaaaacaagg gaggactgta taaaaggcag aaatcctttg + 241 ttttttataa ccaaggttta taaaccttca ttctcgaaat tcaattaact ttacaaattc + 301 ccactattaa ggagaaagaa gacgaacata aagaagcgta tccttagtgc aggcctgact + 361 tttacatctg ctttgctttt agctgcttgc gaccaatcag gttcagatac aaaaacttac + 421 tcatcaacct ttagtggaaa tccaactaca tttaactatc tattagacta ttacgctgat + 481 aatatagtca attgaaacaa gaacaagaca aaagagcctc ataaaaggta ttgcaacttg + 541 gtaatacctt tttgaggtgc tttttgatat gagcccatgt tttctcaata ggattgtact + 601 caggtgagta gggaggaaga ggtaaaagtt tatgcccaaa ctcttcgcat aaaagttcta + 661 gcttccccat tctatggaat cttgcattat ccataataat aaccgatggt gtggttaatg + 721 ttggtaagag aaaattctga aaccaagctt caaaaaagtc gctcgtcatc gtctcttcgt + 781 aagtcattgg agcgattaat tcaccatttg ttagacctgc aaccaaagaa atcctctgat + 841 atcttcttcc agatactttg cctcttatta actgaccttt taatgagcga ccatattctc + 901 gataaaaata agtatcgaat cctgtttcgt caatctaaac aggtgctagg tgctttaaac + 961 tattaaaatt cttaagaaat aaggctactt tttctggctc ttgttcatag taggtgtggt + 1021 tctttttttt cgagtgtagc ccatagcttt gagcgcatag tggatggtag ttggatgaca + 1081 gccaaattca gaagctattt cagtcaaata agcatctgga ttgtcagtaa gatagttttt + 1141 aagtctatct ctatcaacct ttcttggttt tgttcctttt acttggtggt ttagctctcc + 1201 tgttttctct tttagcttta accagccata aatggtatta cgtgagattt ggaaaacgtg + 1261 tgatgcttct gttatactac ctgttcgctc acaataagag agaacttttt tacgaaaatc + 1321 tattgaatat gccataaaaa gattatacca cattgtgtac tacagtagat tgaaactaga + 1381 
acagtacacc tctgattcta aaacattgtt agaaatcgat ttgactgtcc tgatcgattt + 1441 gtcatgttct tatttccttt tactatattt ttggttcgcg ggaagtctac taagatactt + 1501 aaagatgcag atagtgaaaa taaaggtgta gacattaccg taaaaagtga tataatcgta + 1561 tgatgttcaa ggtataggtg ttaatcatga gtagacgttt taaaaaatca cgttcacaga + 1621 aagtgaagcg aagtgttaat atcgttttgc tgactattta tttattgtta gtttgttttt + 1681 tattattctt aatctttaag tacaatatcc ttgcttttag atatcttaat ctagcggtaa + 1741 ctgcgttagt cctactagtt gccttggtag ggctactctt gattatctat aaaaaagctg + 1801 aaaagtttac tatttttctg ttggtgttct ctatccttgt cagctctgtg tcgctctttg + 1861 cagtacagca gtttgttgga ctgaccaatc gtttaaatgc gacttctaat tactcagaat + 1921 attcaatcag tgtcgctgtt ttagcagata gtgagatcga aaatgttacg caactgacga + 1981 gtgtgacagc accgactggg actgataatg aaaatattca aaaactacta actgatatca + 2041 agtcaagtca gaataccgat ttgacggtca accagagttc gtcttacttg gcagcttaca + 2101 agagtttgat tgcaggggag actaaggcca ttgtcctaaa tagtgtcttt gaaaatatca + 2161 tcgagtcaga gtatccagac tacgcatcga agataaaaaa gatttatacc aagggattca + 2221 ctaaaaaagt agaagctcct aagatgtcta agaatcagtc ttttaatatc tatgttagtg + 2281 gaattgacac ctatggtcct attagttcgg tgtcgcgatc agatgtcaat atcctgatga + 2341 ctgtcaatag ggatacgaag agaatccttc ttacaacaac tcctcgagat tcatatgttc + 2401 ctattgctga tggtggaaat aatcaaaaag ataaattaac ccatgcgggc atttatggag + 2461 ttgattcgtc cattcacacc ttagaaaatc tctatggagt ggatatcaat tactatgtgc + 2521 gattgaactt cacttcgttt ttgaaattga ttgatttgtt gggtggaatt gatgtttata + 2581 atgatcaagg atttactgcc catacgaatg gaaagtatta ccctgaaggc aatgttcatc + 2641 ttgattcaga acaggctctc ggttttgttc gtgagcgcta ctcactagca gatggcgatc + 2701 gtgaccgcgg gcgcaatcaa caaaaggtga ttgtggctat ccttcaaaaa ttaacgtcaa + 2761 ccgaagcact gaaaaattat agtacgatca ttaatagctt gcaagattct atccaaacaa + 2821 atatgccact tgagactatg ataaatttgg tcaatgctca gttagaaagt ggagggaatt + 2881 ataaagtaaa ttctcaagat ttaaaaggta caggtcggat ggatcttcct tcttatgcaa + 2941 tgccagacag taacctctat gtgatggaaa tagatgatag tagtttagct gtagttaaag + 3001 cagctataca ggatgtgatg 
gagggtagat gaaatgatag acatccattc gcacatcgtt + 3061 tttgatgtag atgacggtcc caagtcaaga gaggaaagca aggctctctt ggcagaatcc + 3121 tacaggcagg gggtgcgaac cattgtctct acctctcacc gtcgcaaggg catgtttgaa + 3181 actccggaag agaagatagc agaaaacttt cttcaggttc gggaaattgc aaaagaagta + 3241 gcagatgatt tagtcattgc ttatggcgca gagatatatt atactctgga tgctctagaa + 3301 aagctagaaa aaaaagaaat tcctaccctt aatgatagtc gttatgcctt aatagagttt + 3361 agtatgaaca ctccttatcg cgatattcat agcgccttga gcaagatctt gatgttggga + 3421 attactccag tcattgccca tattgagcgc tatgatgctc ttgaaaataa tgaaaaacgc + 3481 gttcgggaac tgatcgatat gggctgttac acgcaagtaa atagtttaca tgtcctcaaa + 3541 cccaaacttt ttggcgaacg ttataaattc atgaaaaaaa gagctcagta ttttttagag + 3601 caggatttgg ttcatatcat tgcaagtgat atgcacaatc tagacggtag acctcctcat + 3661 atggcagaag catatgacct tgttacccaa aaatacggag aagcgaagtc tcaggaactt + 3721 tttatagaca atcctcgaaa aattgtaatg gatcaactaa tttaggagaa atgatgaaag + 3781 aacaaaacac gatagaaatc gatgtatttc aattatttaa aaccttgtgg aaacgcaagc + 3841 taatgatttt aatagtggca cttgtgacag gtgcgggggc ttttgcatat agcactttta + 3901 ttgttaagcc agaatatacg agtaccacgc gaatttatgt agtgaatcgc aatcaaggag + 3961 acaagccggg gttgacaaat caggatttgc aggcaggaac ttatctggta aaagactacc + 4021 gtgagattat cctttcgcag gatgcattgg aaaaagtagc gacaaatttg aagttggata + 4081 tgccagcaaa aacgttagcc agcaaagttc aagtggctgt accagctgac actcgtatcg + 4141 tctcaatctc tgtcaaggat aaacagccag aggaagccag tcgtatcgct aattctctac + 4201 gagaagttgc tgcagaaaag atcgtcgctg taacgcgagt atctgatgta acgacacttg + 4261 aagaagcgcg accagctacg actccctctt ctccaaatgt tcgacgcaat tccttgtttg + 4321 gttttcttgg aggagcagtc gtaacagtaa ttgcttttct tttgattgag ttgctcgaca + 4381 cccgtgtgaa acgtcctgaa gatgttgaag atgtactgca aattccactt ttagggatcg + 4441 ttccagattt gaacaaaatg aaataggagg aagttatgcc aacgttagaa atctcacagg + 4501 caaaattgga ttttgtaaaa aaggcagagg aatattataa cgctttgtgc acgaacctac + 4561 agttaagtgg agatggtttg aaagtatttt ctatcacttc tgtgaaacta ggagaaggaa + 4621 aatcaacgac ttccaccaat atcgcttggg cttttgcgcg 
tgcaggttac aaaacgctgc + 4681 tgattgatgg agatattcgc aattctgtta tgttaggtgt ctttaaagca agggataaga + 4741 ttacaggcct gacagaattt ttatcaggaa ctacagacct atcacaaggg ctttgtgata + 4801 ccaatatcga aaatctcttt gtaattcagg ctggctctgt gtcaccgaat ccgacagctc + 4861 ttcttcaaag taagaatttc agtacaatgc ttgaaacctt gcgtaaatat tttgactaca + 4921 tcattgtaga tactgctcct gtcggtgtcg tgattgatgc ggctattatt acgcgaaaat + 4981 gcgatgcttc tattttagtg acggaggcag gtgaaataaa tcgacgggat attcaaaaag + 5041 caaaagaaca gttggaacac acagggaagc cgtttttggg agttgtgttg aataaattcg + 5101 atacttcagt agacaaatac ggttcttatg gaaattatgg agattacggg aaaaataaaa + 5161 aataggtcgg gggatagaga tgaatggaaa aatagtaaag ccttcattgg ccataatcca + 5221 gagttttctt gttattttat tgacttatct acttagtgct gtgagagaag cggagattgt + 5281 ttcaacaaca gctattgcac tttatatcct ccattatttt gtcttttata tcagtgttta + 5341 tgggcaggat ttctttaaaa ggggatattt gattgaactt gtccagacat tgaaatatat + 5401 cctattcttt gcactagcga ttagtatttc taattttttc ttagaggatc gatttagtat + 5461 ttccagacga ggcatgattt acttcctcac attacatgct ctcttagtct atgtgctaaa + 5521 cctatttatc aagtggtatt ggaagcgggc ttatcccaac tttaaaggaa gtaagaagat + 5581 tctcctactt acagcaactt ctcgtgtcga aaaggtactg gatagattaa tagaatcaaa + 5641 tgaggttgtt ggggagttgg tagccgtcag tgtcttagat aaaccagatt ttcagcatga + 5701 ttgtttaaag gtagtagcag agggggagat agtaaacttt gcgactcatg aggtggtcga + 5761 tgaagtcttt atcaatcttc cgagtgaaaa atacaatatt ggagagcttg tctctcagtt + 5821 tgaaacgatg ggaattgatg taacagttaa tctaaatgct tttgatcgta gtttggcacg + 5881 taacaagcaa attcgtgaga tggcaggatt aaacgttgtg actttttcta caacatttta + 5941 taagactagt catgtaattg ctaagcggat tattgatatc gtgggtgcat tggtagggct + 6001 gatattatgt ggtttagtca gtattgtact ggttcctttg attcaaaagg atgggggctc + 6061 tgctattttt gctcagacgc gtatagaaaa aaatggtcgt cagttcactt tttataagtt + 6121 tcgctctatg tgtgtagatg ccgaggcgaa aaaaagagaa ctcatggaac aaaataccat + 6181 gcagggtgga atgtttaagg tggacgatga tcctcgtatc acgaaaattg gtcgttttat + 6241 acggaagact agcttggacg agctaccaca gttttataat gttctaaagg gagatatgag + 6301 
tttggttggc acacggccac caacagtgga cgagtatgaa cactataccc cagaacaaaa + 6361 acgtcggcta agttttaaac ctggtataac aggcttatgg caggtcagtg aacgaagtga + 6421 gattaagaat tttgatgaag ttgtcaaatt agatgtagcc tatatagacg attggacaat + 6481 ttggaaagat attgagattt tattgaagac agttaaagtt gtattgatga aggatggagc + 6541 gaagtagatt gatagatgta aaaatcattg tggcaacaca taaagaggtt aaaatgcctc + 6601 aagacaatag tctttacctt ccaatacatg ttgggagaga cggtaaatca gatattggtt + 6661 ttatcggtga taatactggc gataatatat cctctctaaa tccatattat tgtgagttga + 6721 cgggacttta ttgggcatgg aagaatcttg attataatta cttaggtcta gttcattacc + 6781 gtcgttattt tacaaataaa tctcaagggt ataatgaaaa tgtcaatatg gatgacgtca + 6841 ttttgtctcg atttaatgtt gaaatattat tagagaaatc tgacgtaata gttccaaaga + 6901 agcgaaagta ttatattgaa actctttatt cacattatgc ccataccctt aacggagaac + 6961 atctggatct tgctaggaaa attattgagc aaaatagttc agagtatctt tcatcctttg + 7021 ataaagtgat gaaacaaaga agcggttata tgttcaatat gtttatcatg aaaaaagaac + 7081 tattagatga ttatttaccg tggctttttt ctattctgga tactatgtac gaacagatgg + 7141 acttgaccga ctatactcca tttgagtcac gtttattcga gcgagttagt gagttgttgt + 7201 ttaatgtttg gttatgtaaa aaaggaataa cgcctaaaga ggtaccattt atgtacatgg + 7261 agagagtgga tttgtttgaa aaaggaaaat cttttttaat ggctaaattt tttggaaaga + 7321 agtatggaca gagtttttag gatatgaaag taactattat tggacaaata aaaaataaga + 7381 gaacaggtct tggaaaggcg attaatgatt ttagggatta ttgttgcaat cgtgctacaa + 7441 gagtaacgga aatagatata acaaataatt ttaatttttt aagctctctt tttcaaattt + 7501 taatatctga tacagatgtt tattatttta ctccagctgg ttcagtagct ggtaatatta + 7561 gggattcact gtttttgttc tttatgataa tgaaaaggaa aaaaatagtg acccattttc + 7621 ataatagtgc ttttggaaat gtgatgagac aacatccgac tctaatgata ataaatagaa + 7681 tattgtattc taaagttgat ttgattatat tattgggaga gaaatcgaaa ataatgtttc + 7741 aacaactaag aattttagac gaaaaattta aaataattag gaatggtgtg gatggatatt + 7801 tatttattga aaaaaatgaa ttaaataaaa aaatgaatta aataaaaaaa tgagcgatct + 7861 acccataaat attatttttt ttagtaatat gattagagaa aaaggttacg aaattttatt + 7921 agaagttgct aagaagatgg 
tgggggatga gaaatatcac ttttattttt ctggaaaatt + 7981 tcaggataat aatttaaaga ctaggtttat taatgaaatt tatagtatga ataatttaac + 8041 atatttagat ggtgtatatg gtagtgataa gaaaaagtta ttgcaaaaaa tgcattactt + 8101 tgttttacca tcgtattata aagatgaaac tttacctatc agtatgttag aagcaatggc + 8161 aaatggtctc tatattattg taagcgatgt gggagttgtg tcagaggtga ttaataaaga + 8221 aactgctagt cttattgaaa tgataaacga agaaacagca gacagtatca tagaaattat + 8281 taatcagact tcaaataaac ttaatgagtt cgattttaat gtatcaaaat ataagcaaga + 8341 gttgttaaat gaaaatatac aagcatcaat ttatcagcaa ttagagagga tagcaaattg + 8401 acgaagaaaa aaaatactgg aaaaatatta acagtagttg taccatcata taatgcagaa + 8461 aattatttac aagagacgat gccgacgata ctttctgcta agaatataga gaggggagaa + 8521 ttactgattg taaacgatgg ttctacagac agaaccgaag aaatagcaag acaattcgag + 8581 agagaatatg agggaattgt cagagttata agtaaggaaa actgtggtca cggttcggca + 8641 gtaaatgcgg ggattgagaa tgctgttggt aattacttta aagtggtaga tgcagatgat + 8701 tgggtgaaca ccaataattt agaagatttg atagtgtttc tatctgaggt ggatgtggat + 8761 caagttttat caccatatga taaaattttt gtgaattatc gaggtgatat agagcgtgaa + 8821 gaagagtgca acgagttttc gcaagttgag aacgaggtga tctattctgc agaagaattc + 8881 tatacacgaa ttaaacaaac ggtaggaatg cattccatta ctgtgaaaac gagtcttttg + 8941 caagagaaca atattcggct gtctgaaaaa atgttctatg tagatatgga atatattgtt + 9001 tatatgcttc catatgtaaa aaaggttgtt ttatttgata aaagtatcta tagatatcgt + 9061 ctaggaacag agacacaaag cattagtatg gcgagttata ttaaaaatcg tgatatgcat + 9121 aaacaagtga tctatcattt ggttgatttt tataatcaaa tgagatctag cgctgtttta + 9181 aggagaataa catggaaatt gattttaaat ttaataagac agcaatggat aatttatttt + 9241 aatttatcta aaaaagaggg gaaaaacagc gagtgttttg aatttgataa ttggctaata + 9301 aaagaaggac ggataaaaaa aataccacta tactttttta aagctgtgaa atatatcaga + 9361 tttaaggtga aatattttct ggggataaga aaataatatg agaaaaatag gaaaagtaat + 9421 aaacgagtat tttgtattaa gaaaatcatt tactcctgct attgctcgga ataaattatt + 9481 tgaaaagttt tggggacgga tagggaatta taaaattttc aataatatag ctagtaattt + 9541 ttatcaatac aaacatgaaa caatcataaa ttttttggaa 
aaagatttta gccaattttt + 9601 aaaatcctat aactttaaag aggtatcgca caaggagata gaacaaagaa aaatcttctc + 9661 tatgtggata caaggatacg aaagtgctcc taagttggtt cagaagacga ttgatagcca + 9721 aaggaaatat gcagaaaaat acggatataa atttgttttt ttggatgaaa acaatatccg + 9781 tgaatatgtg acacttccat cagagatagt agaaaaatat gagaatggaa ctatagattt + 9841 tataaaatat tcggatgttg taaggggaac attgctttca aaatatggag gagtgtggtt + 9901 agattcgact atttatgttg attcttcacg agaactgaat tatttaaaaa aagattttta + 9961 tactattcga gcaaagacac atgagagagt gcccaaatat atcgcaaatg gtaggtggtc + 10021 tgcattttgt ttgtcagggg aaaagcaaaa catagtattt gattttttag agaaatttca + 10081 tgtagcatat tttatgaaat acgatatagt gctagattat tttttgattg actatattat + 10141 agaattaggt tataggacaa atgacttgat tagaaactat attgataaag tcgaagaaaa + 10201 taatcaggag ttgttctttt tggcagacaa tttttctaac cagtatgatg aaaaagagtg + 10261 ggcaggagtt ttatcaacaa ctgcattgtt taagtgtagt tataagtgtc cgataaatga + 10321 agcgacagga acctattttg atagattgat gaagggtgaa ctgtagcata aagagaggga + 10381 atggtatgat ttcagttatt gttccagtat acaatgtcgc ggattatctg cgctttgcgt + 10441 tggatagtct tttggaacag acgtataaag attttgaggt tattctagta aatgatggat + 10501 ccactgataa ttctggggaa atatgtgatg aatatgggaa actgtatgat aatattcatg + 10561 ttttccataa gaagaatggc ggactttcgg atgctagaaa ttttggtttg gagaagagtc + 10621 gaggagagtt tataactttt cttgattcag atgattattt tgaaccgtat gcattagaat + 10681 tgttaattac tattcaaaaa aaatatgatg tagatatcgt atcaactaaa gggggaataa + 10741 cctattctca tgatatttat agcaaaaaac tgatggctga ggactaccta actgtaaaaa + 10801 tattgacaaa taaagaattt ttggcagctg tatattataa cgatgaaatg acggtatctg + 10861 cttggggaaa attgtataaa agagatttat ttaaaacgat ttttccaaaa ggaaagatct + 10921 acgaggattt gtatgttgtt gcagagcgtt tgttgaatat taaaacagtt gctcataccg + 10981 atttgcctat atatcattat tatcagagac agggaagtat tgttaattca acattttcgg + 11041 atagacagta tgattttttt gatgcgattg atcataatga agccataata aaaaaattct + 11101 attgtggaga taaggaattg ctagcagcct taaatgctaa aagagtaatt ggctccttta + 11161 ttttgagtaa tagcgcattt tataatagta aaaacgatat 
tactaaaata ataagaataa + 11221 ttaaaccgta ttattgggaa gtaataaaaa ataaaaaaat tccaatgaaa aggaaagttc + 11281 aatgtgtttt gtttctgctt tccccaaatt actactataa aataaaagat aagatgttac + 11341 agagaggcag gatatagatg catgttagat tagatggttt gctggactat atatttctat + 11401 ttagtgtgat tattacttgt aatactatgt attcaactag tcaaggattt gatggactag + 11461 ggaaatgggc gactctgtta cttgtggtat cagtttttct gaaattgctt atctctagaa + 11521 tatctatgaa ggcaatcaat gtgattgtgt cgcgttcttt aatatttata ttaattattc + 11581 tactcatagt aatattaaat ggttttaaga tttctgagac aagtttcgtc tattattttg + 11641 tattatttcc gatttttatg atgattttgc agatgtacta tgatgttaat gaaatcgcaa + 11701 atctgatacg gaaatttgtt cgtataatat ttcttttagc aattggctct ctcctatttt + 11761 ggcttattgg tagtgtattt catattatat ccccaacggt ttatgtgttg aattattgga + 11821 atggtggggg aatagtagaa gggtactata atcttcattt tgaagcacaa aaaatagaga + 11881 ttttgggggc gatactgata agaaatacgg ggatttttgc tgaagcacct atgtggagtt + 11941 tggtattgag ccttgcattg atatttcaaa cgcttcatat aaaaaaatgg aatttcacaa + 12001 cttggattct tattattaca attatgacaa ctacgtcaac aacaggggtt tatataatag + 12061 gtttgatttt cctatatgtt ttattttcaa aaacaagtgg tgtgaagaga tatgtttcta + 12121 gtttatttat tttagcgact atatgttgtt tttcaatatt atgggataat aaatctggaa + 12181 ctggttcagc aactatacgc tttgatgatt ataaggctgg ttttttggca tggcagaaaa + 12241 gtcctatttg gggattaggt atttcagacg gtcttagagc cattgaacaa catatggata + 12301 gaactgttag atataatctt gggtatagca atagcttttt tgttgtttta gctcaaggag + 12361 ggataatgtt ggcttcgtat tacttttatc cagtaattaa aattattttg aataaattta + 12421 gttcgaatga tttgaagttt tctgcgctat taataatttt ccttatgata actactatat + 12481 ttatagagac ctatatgttt ttatttgtca tttctttata ctattctctt gattttgggg + 12541 acgatagaga ttgtcatgag aaacagtaca ttactaatta ataataaagg tgtgaacaga + 12601 aataagaaga aatgaaaata ctaaaaaact atgcctataa tctttcttat caattgttgg + 12661 tgatcatact ccctatcatt acgactccct atgtaacgag ggtttttagt tctgacgatt + 12721 taggaacgta tggctacttt agctccattg ttacctattt taccttgctt gcaactcttg + 12781 gtgttgccaa ctacggtacc aaagagattt cagcacatcg 
taaggaaatt gggaagaatt + 12841 tctggggaat ttattctctc cagtttggtg caacttggct atccattttg ctttatcttg + 12901 ccctttgttt cttatttact tcaatgcaaa atccggtagc ttatatattg ggattaagtt + 12961 tagtgtcaaa aggtttggat atttcttggt tatttcaagg tttggaggat tttagaaaga + 13021 ttacagttcg gaacatcact gttaagttag ttggtgcaat ctctattttc ctatttgtaa + 13081 aatcagctaa tgacttatac ttatatgtat ttcttcttac cattttcgaa ttgttagggc + 13141 aattaagcat gtggttaccc gcaagacaat ttattggtaa atcatatttt gattggaaat + 13201 acgctaagaa gcatttgaaa ccagttatct tgttattctt gccacagatt gccatctcgc + 13261 tttatgtgac tttggaccgt acgatgctgg gggtgttggc ttcgacaaag gatgttggaa + 13321 tttatgatca agctttgaag cttgttaata ttttactgac tttggttacc tcactgggga + 13381 gtgttatgtt gccacgagta tctagccttt tatcgtctgg ggattacaaa gccgttaata + 13441 agatgcacga gatgtctttt ttaatctata acttggtgat tttcccaatc atagcaggaa + 13501 tgttgattgt caacgatgat tttgttcgtt tcttccttgg gcaaaatttt caagatgctc + 13561 gctatgcgat tgctattatg accttccgta tgttctttat tggttggacc aatataatgg + 13621 gaattcaaat cttgattccg cacaataaaa ataaggaatt tatggtttca acgacagttc + 13681 ccgctattct gagtgtggga ttgaatttgt tgcttcttcc ccaatttggt tatataggtg + 13741 ctgcgattgt ttcagttttg actgaggcgt ttgtatgggg gattcagtta ttctatacac + 13801 gtttttattt aaaagaagtt cctattatcg gttcaatgac aaaaactgca cttgcatctg + 13861 ctgttatgta tggtctcttg ctaggttcaa aaacatctat acatttttcg ccaaccataa + 13921 atgttttaat attttcggtg ctaggcggaa ttatctatct ttttgcaatt ctatctctga + 13981 aagtggtaga tgtgaaagaa ttaaaacaaa taatcaggaa aaattagaat gagcaaattt + 14041 cgaaatatta acttagattt actaaaagtg cttgcatgtg ttggagtcgt tctacttcat + 14101 acagctatgg gtgggtttaa agagacaggt gcatggaatt ttttgacata tttatattac + 14161 ttaggaacct attctatccc tctatttttt atggtcaatg gttatttatt gttggggaag + 14221 agagaaatta cctattccta catattgcaa aaaataaaat ggctcctaat aacagtgtcg + 14281 tcatggactt ttatcgtttg gctgtttaaa agagacttta cagagaactt aattaaaaaa + 14341 attataggtt ctttgataca aaaggggtat ttcttccagt tttggttttt tggtgcactc + 14401 atacttattt atatatgttt gcctattttg aaaaatttcc 
ttaatttaaa aagaaattat + 14461 ttatacattc tatctgtatt gctggttatt ggtttgattt ttgagttagc gaatattgta + 14521 tttcaaatgc cagcacaaac atatgttata caaaccttta gattatggac ttggtttttt + 14581 tactaccttt taggtggttt tatagcgcaa tttaacaagg atattatcag aaataggttt + 14641 aagatatgga tgaaagtagc tactgtactc ttattattaa tttcaccatt aatattattt + 14701 ttcttagcga agaccactta ccataatctt tttgctgaat atttttatga tattttattt + 14761 gtaaaagttg taagtttagg aatttttcta actatattct cacttgcatt gaatcaagat + 14821 atcaacaaat ggattatttt tctttctaac caaactatgg gtgtctttat aatacacact + 14881 tatattatga aagtgtggga aaaactattt ggttttagtt ttgtaggagc atatttactt + 14941 taagtattag ttttattatt gctggaatgt taatgaaaat tccttatttc aatcgaattg + 15001 tcaaattata aaaaggagaa caaaatgtac gactatctaa tcgtcggtgc gggtttgtct + 15061 ggagctattt ttgctcacga agctacaaaa cgtggaaaaa aagtaaaagt gattgataaa + 15121 cgcgatcaca ttggagggaa catctactgt gaaaatgtag aaggtatcaa tgtccataaa + 15181 tatggtgccc atatcttcca tacctcaaac aaaaaagttt gggactatgt caatcaattc + 15241 gctgaattta acaactatat caattcacct gtcgcgaact ataaaggaag tctttataat + 15301 cttcctttca atatgaatac tttctatgct atgtggggga caaaaactcc acaggaagtg + 15361 aaagataaga ttgctgagca gacggctgat acgaaggatg ttgagccaaa aaatctggaa + 15421 gaacaagcta tcaagttgat tggtccggat atctatgaaa agttgatcaa gggctatact + 15481 gaaaagcaat ggggacgctc agcaacggaa cttcctccat ttatcattaa acgtcttcca + 15541 gttcgtctaa catttgataa taactatttt aacgaccgtt accaaggaat tcctattggt + 15601 ggttataatg tgattatcga aaacatgctt aaagacgttg aagttgagct tggtgttgat + 15661 ttctttgctc accgtgaaga gttagaagca tcagctgaaa aagttgtctt cacaggaatg + 15721 atcgaccagt attttgacta caaacacggg gagttagaat accgtagcct tcgctttgag + 15781 catgaaattt tggacgagga aaattatcaa gggaatgctg tagtgaacta tacagagcgt + 15841 gagatccctt atactcgtat catctaacac aaacattttg aatatggaac gcagccaaag + 15901 acagttatca cgcgtgaata tccagccgac tggaagcgcg gggacgagcc ctactatccg + 15961 atcaatgatg agaaaaataa tgctatgttt gctaagtatc aagaggaagc ttcaaagaat + 16021 gataaggtta tcttctgtgg gcgcttagca gattataaat 
attatgatat gcatgtggtg + 16081 attgaacgag ctcttgaagt tgtagagaaa gagttaggta actaaagatt tgatattaaa + 16141 atgagggact acttcttttc ctcattttat tcaccttaag aggagatgga aaaaaatgaa + 16201 tgcttatagt aaacaaaagt ctggtcgaat cgaatggata gattttggaa agggctctgc + 16261 catattttta gttttagtgg gacatgtatt acttggtctg tatcaatcgg aaaaatttcc + 16321 catagcaaac aacatactat cactgttgat agcacaaatc tacatatttc acataccagt + 16381 attttttgct ttatcaggat actttttcaa acctgtgtcg aatttgaaag agttctggca + 16441 atatgctaag aagaagacga ttatttttgg cctaccatat attttttatt cgatcattca + 16501 tttttgtctt caaaaagttg cagggggcga ctgttagagt cccgacgact atatttgatt + 16561 taataaatat ctataaaaat cctattggag tctcatggta tttatacata ctctggtcga + 16621 ttttgataat gtatggatta gtatctattt taatcaaaaa tcgtagaata ttatttttga + 16681 taagtgtttt tgcttattgt ttaaccctat ttgttcaaac agatatttat atcattcaaa + 16741 gaacgctagt ttggggtatt tgtttctttc ttggaagtgt attgaacgaa attcacttta + 16801 ataaaattag tttgaaaaaa tttcttgttt tctttgtgat atttgacttt atttatatgc + 16861 ttgtatggtt cttattttat gaagtagagt ctaaaaggga tagtgtaagc tatagtaacc + 16921 caggggtgtg ggggattgct tttattgtct gtatattagt tgcgtttgta atcttcccta + 16981 aaatatcgga aaaatttcct aaaactttcc tatatttcac taaatatggt aaagatagtt + 17041 taggtatcta tatcctccat gcaccaattt gtagcatgat tcggattcta atgttgaaag + 17101 tgggaataaa ctcagttttt cttcacgttg ttgttgggat tgtcttgggt tggtatttat + 17161 ccatactggc aacttatata ttgaaaaaaa ttccattttt gaatattgtt ttattaccac + 17221 aaaagtatat taaattaaaa taaattattt tagatttata atgtggctct ttgtcaacta + 17281 acatctggag aggacaatca ctgtcttctc cttttttgtc ttttcagaat ataccaaatt + 17341 aacacaaaaa ttctgaaaat tctgttgaca actttctgaa aagagtctat aatggagaga + 17401 aagttttaaa ggagaaaatg atgaaaagtt caagactatt tgcccttgcg ggcgtgacat + 17461 tattggcggc gactacttta gctgcatgct ctggatcagg ttcaagcact aaaggtgaga + 17521 agacattctc atatatttat gagacagacc ctgataacct caactatttg acaactgcta + 17581 aggctgcgac agcaaatatt accagtaacg tggttgatgg tttgctagaa aatgatcgct + 17641 acgggaactt tgtgccgtct atggctgagg attggtctgt 
atccaaggat ggattgactt + 17701 acacttatac tatccgtaag gatgcaaaat ggtatacttc tgaaggtgaa gaatacgcgg + 17761 cagtcaaagc tcaagac +// + diff --git a/public/res/serotype_genbank/serotype_38.gb b/public/res/serotype_genbank/serotype_38.gb new file mode 100644 index 0000000..3155ea5 --- /dev/null +++ b/public/res/serotype_genbank/serotype_38.gb @@ -0,0 +1,1232 @@ +LOCUS CR931710 30298 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 9687/39 (serotype 38). +ACCESSION CR931710 +VERSION CR931710.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 30298) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 30298) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..30298 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="9687/39" + /db_xref="taxon:1313" + gene <1..163 + /gene="dexB" + /locus_tag="SPC38_0001" + CDS <1..163 + /gene="dexB" + /locus_tag="SPC38_0001" + /codon_start=2 + /transl_table=11 + /protein_id="CAI34394.1" + /db_xref="GOA:Q4JZD8" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4JZD8" + /translation="DRRFLVVANLSNEEQDLTVEGKVKSVLIENTAAKEVLEKQVLAP + WDAFCVELL" + gene order(322..1752,1788..2273) + /gene="aliB" + /locus_tag="SPC38_0002" + /pseudo + CDS join(322..1752,1788..2273) + /gene="aliB" + /locus_tag="SPC38_0002" + /note="member of homology group 169" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + misc_feature join(538..1752,1788..1871) + /gene="aliB" + /locus_tag="SPC38_0002" + /note="HMMPfam hit to PF00496, Bacterial extracellular + solute-binding prot, score 1.3e-37" + /pseudo + gene complement(order(2414..2998,3052..3225,3228..3740)) + /gene="tnp" + /locus_tag="SPC38_0003" + /pseudo + CDS complement(join(2414..2998,3052..3225,3228..3740)) + /gene="tnp" + /locus_tag="SPC38_0003" + /note="member of homology group 13" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1167 transposase" + /db_xref="PSEUDO:CAI34396.1" + misc_feature complement(join(2918..2998,3052..3225,3228..3284)) + /gene="tnp" + /locus_tag="SPC38_0003" + /note="HMMPfam hit to PF01610, Transposase, score 8.5e-33" + /pseudo + gene 3892..4275 + /gene="tnp" + /locus_tag="SPC38_0004" + /pseudo + CDS 3892..4275 + /gene="tnp" + /locus_tag="SPC38_0004" + /note="member of homology group 19" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1381 transposase (fragment)" + gene complement(4295..5248) + /gene="tnp" + /locus_tag="SPC38_0005" + CDS complement(4295..5248) + /gene="tnp" + /locus_tag="SPC38_0005" + /note="member of homology group 39" + /codon_start=1 + 
/transl_table=11 + /product="putative IS1239 transposase" + /protein_id="CAI34398.1" + /db_xref="GOA:Q4K0X9" + /db_xref="InterPro:IPR001584" + /db_xref="InterPro:IPR012337" + /db_xref="UniProtKB/TrEMBL:Q4K0X9" + /translation="MQEHYTPKGKHLTIDNRRLIERWKNENKSNREIAGLLGKAPQTI + HNEVKRGTTLQQVRKGLYKKVYSADYAQTVYQFNRKRSVKKLILTKEIREKILHYHKQ + KFSPEMMVNKKQVKVGISTIYYWFHNGHLGLTKADMLYPRKRKGVKKQASPNFKPAGK + SIEERPDVINLRLENGHYEIDTVLLTKIKNYCLLVLTDRRSRHQIIRLIPNKTAESVN + QALTLLLGEHRILSITADNGSEFKRLSEVFPEEHIYYAHAYSSWERGSNENHNRLIRR + WLPKGTKKTTPKEVAFIENWINNYPKKCLDYKSPSEFLLGG" + misc_feature complement(4304..4741) + /gene="tnp" + /locus_tag="SPC38_0005" + /note="HMMPfam hit to PF00665, Integrase core domain, + score 6.6e-23" + misc_feature complement(5102..5167) + /gene="tnp" + /locus_tag="SPC38_0005" + /note="Predicted helix-turn-helix motif with score + 1087.000, SD 2.89 at aa 28-49, sequence + KSNREIAGLLGKAPQTIHNEVK" + gene 5802..6899 + /gene="glf" + /locus_tag="SPC38_0006" + CDS 5802..6899 + /gene="glf" + /locus_tag="SPC38_0006" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI34399.1" + /db_xref="GOA:Q4JZ57" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR006076" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JZ57" + /translation="MYDYLIVGAGLSGAIFAYEATKRGKKVKVIDKRNHIGGNIYCEN + IEGVNVHKYGAHIFHTSNKKVWDYVNQFAEFNNYINSPVANYKGSLYNLPFNMNTFYA + MWGTKTPQEVKNKIAEQTAHMKDVEPKNLEEQAIKLIGPDIYEKLIKGYTEKQWGRSA + TDLPPFIIKRLPVRLTFDNNYFNDRYQGIPIGGYNVIIENMLKDVEVELGVDFFANRQ + ELEASAEKVVFTGMIDQYFDYKHGELEYRSLRFEHEVLDKENYQGNAVVNYTEREIPY + TRIIEHKHFEYGTQDKTVITREYPADWKRGDEPYYPINDERNNAMFAKYQEEAVQNDK + VIFCGRLADYKYYDMHVVIERALEVVRNEFS" + misc_feature 6237..6839 + /gene="glf" + /locus_tag="SPC38_0006" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 1.1e-135" + gene 7217..7897 + /gene="wzd" + /locus_tag="SPC38_0007" + CDS 
7217..7897 + /gene="wzd" + /locus_tag="SPC38_0007" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34400.1" + /db_xref="GOA:Q4JZ56" + /db_xref="InterPro:IPR003856" + /db_xref="UniProtKB/TrEMBL:Q4JZ56" + /translation="MNNRIVDISLFDLLNVLWLRKWIIVFVSFVFGCISFLYYQFFVP + KTYTSDTRIYVVSKGDNKNLSNADLQAGSALTKDYKEIILSDEVLEETISDLKLESTL + ESLASKIKISIPAETRIISISVTNTNSDEAARIANGIRKVAALKIKEVTQVTDVTTLQ + TARPPQTPSGPHVRKSTTAGLVLGAFLTVFLVVAKEILDDRIKRFEELEKLGIPILGS + IPLSKNIK" + misc_feature 7232..7642 + /gene="wzd" + /locus_tag="SPC38_0007" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 2.5e-41" + gene 7904..8593 + /gene="wze" + /locus_tag="SPC38_0008" + CDS 7904..8593 + /gene="wze" + /locus_tag="SPC38_0008" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34401.1" + /db_xref="GOA:Q4JZ55" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4JZ55" + /translation="MGKLELTRKYYQLYNETKEYFNALQTNIQLSGDGLKVISVTSTV + KNEGKSTISVGLSMSLALSGYKVLLLDVDLRNSVMSGMFHSRERITGLTEYLSGKAGM + ADSMQETTLDNLYILQAGVVSPNPLSLLRSVKFETLIDSMKKYFDYIIVDTPPIGQVI + DAAIIAQQCDGIFLVTEMRKTTRRQIFSSLQQLEQTGVPVLGLVANKAIIKKDSYGYY + GKNTASETERY" + gene order(8703..9092,9118..9183,9188..9508) + /gene="tnp" + /locus_tag="SPC38_0009" + /pseudo + CDS join(8703..9092,9118..9183,9188..9508) + /gene="tnp" + /locus_tag="SPC38_0009" + /note="member of homology group 19; + member of homology group 19" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1381 transposase" + misc_feature join(9030..9092,9118..9183,9188..9496) + /gene="tnp" + /locus_tag="SPC38_0009" + /note="HMMPfam hit to PF01609, Transposase DDE domain, + score 7.9e-11" + /pseudo + gene 9726..11177 + /gene="wzg" + /locus_tag="SPC38_0010" + CDS 9726..11177 + /gene="wzg" + 
/locus_tag="SPC38_0010" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI34403.1" + /db_xref="GOA:Q4JZ54" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4JZ54" + /translation="MRYFMSREKKRGTAVHLKSYINSVLLILYTGIASLFLFQIFRYN + ILNFRNLNLLVALLVVLVFILGVSLIVRKKAEKLTMLLLILAVASSSISLLAVQQFIG + FTSRLNATSNVSEYAISLVVLKDSEISELEQVSHVMAPTDTDYEAIQSLLADIKEKQG + KDLIVDKSKSYLEAYKSLISGDTKVIFLNSIFEHMIESDFPDFRDKIKKIYTKEMTKK + VEAPKVSKGQTFTIYFSGIDTYGPINSVSRSDVNILMTVNSETKKILLTTTPRDSYVA + IADGGKNQKDKLTHAGIYGIDSSIHTLEHLYGVEINYYVRVNFTSFLKIVDLLNGIDV + DNSQEFTIDGNDYPVGNLHLNSKSALGFVRERHSLADGDRDRGRNQQKVLAAIIQKLT + SIESLKNYRQIMQGLEDSIQTNLSPTTIMDLANTQLESGGNYKINSQDLKGTGRMDLP + SYAMPDSQLYMMEIDENSLSAIKENIQAVLEGR" + misc_feature 9942..10289 + /gene="wzg" + /locus_tag="SPC38_0010" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 9.5e-40" + misc_feature 10467..10904 + /gene="wzg" + /locus_tag="SPC38_0010" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 2.5e-65" + gene 11116..11910 + /gene="wzh" + /locus_tag="SPC38_0011" + CDS 11116..11910 + /gene="wzh" + /locus_tag="SPC38_0011" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34404.1" + /db_xref="GOA:Q4JZ53" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4JZ53" + /translation="MMRIASQLSKKIFRLFWRVGKMIDVHSHIIFDVDDGPKSIEDSR + ALLLEAYDQGIRTIVSTSHRRQGMFETPEDKIAENFRAVQKIARDIADDLTILYGAEI + YYTQDIINKLEKKTFPTLNGSRYALIEFSSETSYRSIHSALQQLLLSGITPLIAHIER + YDALENNKQAVLELIRMGCYTQINSSHLLKKKLFKDDAKIMKKRVHYFLKHDLVHIVA + SDMHNLDTRPPYMAEAYEIISKRYGKEKAEEFFIKNPQRILMDQLI" + misc_feature 11182..11790 + /gene="wzh" + /locus_tag="SPC38_0011" + /note="HMMPfam hit to PF02811, PHP domain, score 3.6e-36" + gene 11929..12516 + 
/gene="wciI" + /locus_tag="SPC38_0012" + CDS 11929..12516 + /gene="wciI" + /locus_tag="SPC38_0012" + /note="member of homology group 29" + /codon_start=1 + /transl_table=11 + /product="putative initial sugar transferase" + /protein_id="CAI34405.1" + /db_xref="GOA:Q4JZ52" + /db_xref="InterPro:IPR003362" + /db_xref="UniProtKB/TrEMBL:Q4JZ52" + /translation="MYKVIKRFIDIALALLGIVLLSPLFLGIIVFIKLESKGTIFFKQ + KRIGLHKKEFYILKFRTMRIDTPSAVPTHLLKNPYQWITKVGKVLRRTSLDELPQIWN + ILVGHMSLVGPRPALWNQFDLIEERDKYGANDILPGLTGWAQINGRDELSIPVKAKFD + GYYVKNCSFVLDCRCVVESFLVVFKRYGHREGGAD" + misc_feature 11929..12030 + /gene="wciI" + /locus_tag="SPC38_0012" + /note="Signal peptide predicted for SPC1774 by SignalP 2.0 + HMM (Signal peptide probability 0.966) with cleavage site + probability 0.674 between residues 34 and 35" + misc_feature 11944..12498 + /gene="wciI" + /locus_tag="SPC38_0012" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 1.1e-31" + gene 12529..13659 + /gene="wcyA" + /locus_tag="SPC38_0013" + CDS 12529..13659 + /gene="wcyA" + /locus_tag="SPC38_0013" + /note="member of homology group 170" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34406.1" + /db_xref="GOA:Q4JZ51" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4JZ51" + /translation="MGNRKKVFVVANVVKEHILKFHIPTIKEMTKRGWTVDVGASGDE + TVPYCHQQYSLPHQRSPFHLGTLKSIWKLRKILKSGGYDIVYCHTPVGGLVGRLASLG + LRKQGTRVIYFVHGYHFYKGATFFNWLVYYPIEKLLSLFTDSIILINQEDYHLTKTKF + KQVQSYLVSGMGVKQERFSPQSNQVRERYRKELKLPEDATVLIYCAELIKNKNQTFLL + HAMKKLVDQGENLYCLLVGIDYTKGEMVEYIQSLNLSDRVLLLGWREDIANLYACSDI + CVATSIREGFGLNIVEAMFCHVPVVATINRGHASIIQDGQNGLLVQLGNTKQLVEAIY + VLMKDTKKKQELVEQASANLEQYHSQKIVNSLLEIIEQTAMK" + misc_feature 13084..13599 + /gene="wcyA" + /locus_tag="SPC38_0013" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 2.6e-41" + gene 13656..15086 + /gene="wzy" + /locus_tag="SPC38_0014" + CDS 13656..15086 + /gene="wzy" + /locus_tag="SPC38_0014" + 
/note="member of homology group 171" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI34407.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ50" + /translation="MSEGCEKVKIQIDKIYYLFFWLVVSFGYFFMMPTFTEDLEGVVS + ASLVQLLLFIIGYVYVSYLNRSFISLYSIFMIVFYLFQNGQVLLYSLGVEYDYFYVLR + YDETIVLQSVIFSTQCLIAAFMAGVFSTKKEVSKPLYSYMDQLEREKLITTGKLFWGA + FAIFALPFMMMKLVITSTSGYFAMIRFVGSLPTITVLFEKMFIASSVFLIVYLKSEET + WSKFLKVVILGWSIMAALTGDRTVGLAGIVTLALIQTLIGNRKKKIKFSQYALLVGAA + VVVMYLMSFAFQFRMQQDSKVSGLQTAVVEMIGTLGFSFFPLVLTIRIVPTSINFFRG + KSYIAAIITGLIPSNFDFLHLTNTLSEWNAYPTELLDTIYHYGFGLDYSLIAEAYINF + GSYGWIAIFFLCSLIAYFVRDVDFKRKDNLFSQYASLILLYSWFTLPRRKSYFIFNNF + FWYVLFFGLALILVSRSIKQRKEFKK" + gene 15083..15850 + /gene="wcyB" + /locus_tag="SPC38_0015" + CDS 15083..15850 + /gene="wcyB" + /locus_tag="SPC38_0015" + /note="member of homology group 172" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34408.1" + /db_xref="GOA:Q4JZ49" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JZ49" + /translation="MKISIIMGIHNGEKRFETAVQSIFNQTYDNWEFIICDDASTDKT + FEKLQGLYGQDSRFILLKNEKNVGLSATLNRCIEASSGEFIARMDDDDICYPERFERQ + VDYLFHHPEIDFVSSSIDIFDGEVVVGTRILLDFPSKKDLIWNSPFVHPVTMFRRDAL + LEVGGYRVSPETVRGQDYDLFMRLYSCEKKGGNILEPLFRYTIDQNTMKRRTFKARIG + EMIIRYKGYRAMKVPFYNYVFIFKPLVAHLVTLVKRR" + misc_feature 15092..15574 + /gene="wcyB" + /locus_tag="SPC38_0015" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 3.2e-39" + gene 15850..17031 + /gene="wcyC" + /locus_tag="SPC38_0016" + CDS 15850..17031 + /gene="wcyC" + /locus_tag="SPC38_0016" + /note="member of homology group 173" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34409.1" + /db_xref="GOA:Q4JZ48" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4JZ48" + /translation="MFMKILITTHTYLPNKDGVQFVNQYLAEGLVKRGHQVTVLTYCY + PSRTRVPREVINGVRVIRWNARTSCTFHKGEKLAYQNFILNSQSDYDVLVNVGTQTAL + 
TDWLFPIFSQLTIPKVLYIHSIWDFNWLHWHRQSFKRFVAKAWANVRWKYYYWTKASI + FKQYHEVIQLHPKDYSVAFFKEKYGIESQILENAADASFFQNRNAVKKQSYIVNVSNF + NDRKNQKKAVEYFLKSNLPNEWKLVLVGSEKNQYLQSLQTFEKELRNQLGITSGKEIE + YRIGLSREEVVKTVKEASFCLMTSIWEAFPISLIEVMAAGIPFISSDVGIVNYLSGGI + TACSDQEFIRAIEEFASCPEIRNQYGKKGQMEAKEHYQVDDKVKELEALLQKVVKEEK + E" + misc_feature 16435..16947 + /gene="wcyC" + /locus_tag="SPC38_0016" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 7.5e-15" + gene 17028..17993 + /gene="wcyD" + /locus_tag="SPC38_0017" + CDS 17028..17993 + /gene="wcyD" + /locus_tag="SPC38_0017" + /note="member of homology group 174" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34410.1" + /db_xref="GOA:Q4JZ47" + /db_xref="UniProtKB/TrEMBL:Q4JZ47" + /translation="MKKIVFLCPYFGTLPPHTQLWLNSCKMNPSVTWYLFTDDKRKFD + YPENVQVFYTTLEETKALYQKKFDFEISLEGAYKLGDYKPLFGYLYEEMIQEFDAWGH + IDVYDEIYGDIRAFVTDELLEKYDKLMIFGHMGIYKNSPEVNRRFELSSDLNRTYQEI + FSSSQFYNFEEYVAGSITRIYQKNGFPIGKLDEVIADLSGTSYHFRRGYISDDFETFT + YLPYEPMIFSWEEGKTYCYSVKNHQVQKDEFMYVHFKRRKMIQDIPDDASTYLIVPSG + FALMPEEITVDLIRKYSQKKLFYPVYFEEKWKGFKRLWNKIWRSE" + gene 17990..18871 + /gene="wcyV" + /locus_tag="SPC38_0018" + CDS 17990..18871 + /gene="wcyV" + /locus_tag="SPC38_0018" + /note="member of homology group 187" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34411.1" + /db_xref="GOA:Q4JZ46" + /db_xref="UniProtKB/TrEMBL:Q4JZ46" + /translation="MKNILKKLIQQLPDKLFLQIKYFYIFKKKLNLKNPKTFNEKLQW + LKLYDRNPFYTILADKILVKDYIAKTLGEEYVIPTLGVYHHFDEIDFDELPNSFVMKT + NHDSGSIIIVKNKEDLNIQEAREKLQKSLERDYFIFGREWPYKNIERKIIIEEFMTDE + SNQELKDYKIYCFNGLPKFVHVDYDRFTNHKRNIYDSNWKQQEFMYAFPSDKNKTIEK + PAELSEMIELVRKLSKEMPFVRCDFYIVNHKILFGEMTFCPGSGFEKFYPEQYDVEFG + KDITLPEKHEWKQKKNV" + gene 18847..20262 + /gene="wzx" + /locus_tag="SPC38_0019" + CDS 18847..20262 + /gene="wzx" + /locus_tag="SPC38_0019" + /note="member of homology group 176" + /codon_start=1 + /transl_table=11 + 
/product="flippase Wzx" + /protein_id="CAI34412.1" + /db_xref="GOA:Q4JZ45" + /db_xref="InterPro:IPR002528" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4JZ45" + /translation="METKEKRLVHNTIIFTIGSLGSKFIQFLLVPLYTYTLTASQFGI + TEILLTAVNLLIPVFSISIADGLLRFGLDKTLRRENVLKSAFIISILGTILSIISIPI + FSLYPTLSEWMVYFIIILNLRMYRDVFAIQLKVEGKNTLFACDSMIYTFVLSLASIVF + LVPFSLGISGYFFAYIVSNGISIFFILFFGGVWKSFTSGRFEKQLMIQLLKYSAPMIL + NGIAWWITNASDRFMLQWFMDDRAVGLYGVVAKLPLLIGTFTGVFNQAWIISAVEEFE + EENEEWFYQKVFHQYYAALFLSVSVFLLLLQPFMKVYVSPSFYEAWQYAPFLLLSSVV + SGIAAFMTGFYVAQKKNLNIIYTTIAGAFANILLNAMFIPMLGVLGASIATFLSWFVI + AIYRMKDVENFACFPLDKKVFWYLFLLCIQTITMTFLPILGIVFSVVLIPYFFYQEQE + FLAVLFDKGRKKVCSFKKSKR" + misc_feature 18868..19671 + /gene="wzx" + /locus_tag="SPC38_0019" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 8.3e-10" + gene 20235..20897 + /gene="wcyF" + /locus_tag="SPC38_0020" + CDS 20235..20897 + /gene="wcyF" + /locus_tag="SPC38_0020" + /note="member of homology group 177" + /codon_start=1 + /transl_table=11 + /product="conserved hypothetical protein" + /protein_id="CAI34413.1" + /db_xref="InterPro:IPR015037" + /db_xref="UniProtKB/TrEMBL:Q4JZ44" + /translation="MFIQKIKKIIRVFLRKSLVKDYRQRIQNKEFTLITSNCVGGLIS + HDLGLQFRSPTINMYIEAADFIQFCSHLERYLKEDLSFIEVNQDGHFVALCGDIKIYI + VHYNSFEEFAKKWSERAKRVDFDQLYLMMSERDGCRYEDIVKFDTLPYKNKVIFTSKK + MPEIQSAFYIPGIETKNNQKHKVKSVTTYLNSFTGKRYIDLFDFVEFLNTGRKQLSKY + EK" + gene 20887..21969 + /gene="gla" + /locus_tag="SPC38_0021" + CDS 20887..21969 + /gene="gla" + /locus_tag="SPC38_0021" + /note="member of homology group 96" + /codon_start=1 + /transl_table=11 + /product="putative epimerase" + /protein_id="CAI34414.1" + /db_xref="GOA:Q4JZ43" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR008089" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JZ43" + /translation="MKSKIILKNKTILVTGAAGFIGANLVMSLLQEENPLQIIGIDNL + NDYYDVSLKEYRLSTIQEECQSSLNKKWVFIKGDIADSDLMEEIFETYRPQIVVNLAA + 
QAGVRYSITNPDVYMKSNIIGFHTILEKCRKYQENIEHLVYASSSSVYGGNTKIPFSE + LDAVDNPVSLYAVTKKTNELEAHAYSKLYNIPTTGLRFFTVYGPAGRPDMAYFSFTKQ + LIDKKPIEIFNYGNCQRDFTYIDDIVEGVKRVMTGAPQKEIGEDGLPIPPYAIYNIGN + HQPENLLNFVEILQEKLIAASILPEDYDFSSAQKLVPMQAGDVVATYADISLLEKDFN + FKPKTSLRNGLRNFAEWYRNFYQRGE" + misc_feature 20887..20976 + /gene="gla" + /locus_tag="SPC38_0021" + /note="Signal peptide predicted for SPC1783 by SignalP 2.0 + HMM (Signal peptide probability 0.974) with cleavage site + probability 0.471 between residues 30 and 31" + misc_feature 20917..21948 + /gene="gla" + /locus_tag="SPC38_0021" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.00023" + misc_feature 20920..21825 + /gene="gla" + /locus_tag="SPC38_0021" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 7.1e-05" + misc_feature 20920..21711 + /gene="gla" + /locus_tag="SPC38_0021" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 8.3e-55" + misc_feature 20923..21789 + /gene="gla" + /locus_tag="SPC38_0021" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 5.4e-09" + gene 21929..23197 + /gene="ugd" + /locus_tag="SPC38_0022" + CDS 21929..23197 + /gene="ugd" + /locus_tag="SPC38_0022" + /note="member of homology group 20" + /codon_start=1 + /transl_table=11 + /product="UDP-glucose 6-dehydrogenase Ugd" + /protein_id="CAI34415.1" + /db_xref="GOA:Q4JZ42" + /db_xref="InterPro:IPR001732" + /db_xref="InterPro:IPR008927" + /db_xref="InterPro:IPR013328" + /db_xref="InterPro:IPR014026" + /db_xref="InterPro:IPR014027" + /db_xref="InterPro:IPR014028" + /db_xref="InterPro:IPR016040" + /db_xref="InterPro:IPR017476" + /db_xref="UniProtKB/TrEMBL:Q4JZ42" + /translation="MQNGIEIFIKGVNRMKITVVGMGYVGLSLAVLLAQHHEVTALDI + IDKKIQLINEKKSPIQDEYIEQYFLEKNLHLSATTNEVEAYKDAEMIIIAAPTDYDTH + KNFFDTSAVEQVIENIISMNNEALIVIKSTVPVGYTESIREKYGKKNILFSPEFLREA + NGLYDNLYPNRIIVGTDLNDGALVSKAHEFVSLLQEGALKENIDTLIMGFSEAEAVKL + 
FSNAYLALRVSYFNELDTYAELKGLNTKAIIDGVGLDPRIGQFYNNPSFGYGGYCLPK + DSKQLLSNYHDVPENIISAIVSSNETRKKFIAERILEIVGANHIDEYYNLKQEIVVGI + YRLVMKKGSDNFRHSSIQGIIKRLKANGVTLMIYEPSLPDGQLFFGSEVVHDFPKFKE + KSHLIVANRFDETLMDVKDKVYTRDLFGRD" + misc_feature 21971..22528 + /gene="ugd" + /locus_tag="SPC38_0022" + /note="HMMPfam hit to PF03721, UDP-glucose/GDP-mannose + dehydrogenase, score 1.3e-45" + misc_feature 21971..22369 + /gene="ugd" + /locus_tag="SPC38_0022" + /note="HMMPfam hit to PF01210, NAD-dependent + glycerol-3-phosphate deh, score 0.0013" + misc_feature 22556..22837 + /gene="ugd" + /locus_tag="SPC38_0022" + /note="HMMPfam hit to PF00984, UDP-glucose/GDP-mannose + dehydrogenase, score 1.6e-35" + misc_feature 22937..23176 + /gene="ugd" + /locus_tag="SPC38_0022" + /note="HMMPfam hit to PF03720, UDP-glucose/GDP-mannose + dehydrogenase, score 8.5e-05" + gene complement(23327..24576) + /gene="tnp" + /locus_tag="SPC38_0023" + /pseudo + CDS complement(join(23327..24061,24058..24576)) + /gene="tnp" + /locus_tag="SPC38_0023" + /note="member of homology group 13" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1167 transposase" + misc_feature complement(join(23834..24061,24058..24120)) + /gene="tnp" + /locus_tag="SPC38_0023" + /note="HMMPfam hit to PF01610, Transposase, score 6e-23" + /pseudo + gene 25509..26786 + /gene="intron" + /locus_tag="SPC38_0024" + CDS 25509..26786 + /gene="intron" + /locus_tag="SPC38_0024" + /note="member of homology group 108" + /codon_start=1 + /transl_table=11 + /product="putative group II intron protein" + /protein_id="CAI34417.1" + /db_xref="GOA:Q4JZ41" + /db_xref="InterPro:IPR000477" + /db_xref="InterPro:IPR013597" + /db_xref="InterPro:IPR015706" + /db_xref="UniProtKB/TrEMBL:Q4JZ41" + /translation="MSKLLDKILSRENMLEAYNQVKSDKGSAGIDGMTIEEMDNYLRQ + NWRLTKELIKQRKYKPQPVLRVEIPKPGGGIRQLGIPTVMDRMIQQTIVQVMSPICEP + HFSDTSYGFRPNRSCEKAIMKLLEYLNDGYEWIVDIDLEKFFDTVPQDRLMSLVHNII + EDGDTESLIRKYLHSGVIINGQLYKTLVGTPQGGNLSPLLSNIMLNELDKELEKRGLR + 
FVRYADDCVITVGSEAASKRVMYSVSRFIEKRLGLKVNMTKTKITRPRELKYLGFGFW + KSSDGWKSRPHQDSVRRFKFKLKKLTQRKWSIDLTRRIEQLNLSIRGWINYFSLGNMK + SIVASIDERLRTRLRVIIWKQWKKKSRRLWGLLKLGVPKWIADKVSGWGDHYQLVAQK + SVLKRAISKPVLEKRGLVSCLDYYLERHALKVS" + misc_feature 25683..26333 + /gene="intron" + /locus_tag="SPC38_0024" + /note="HMMPfam hit to PF00078, Reverse transcriptase + (RNA-dependent DNA pol, score 1.1e-63" + misc_feature 26379..26630 + /gene="intron" + /locus_tag="SPC38_0024" + /note="HMMPfam hit to PF08388, Group II intron, + maturase-specific domain, score 3.5e-30" + gene complement(order(26843..27319,27321..27647)) + /gene="tnp" + /locus_tag="SPC38_0025" + /pseudo + CDS complement(join(26843..27319,27321..27647)) + /gene="tnp" + /locus_tag="SPC38_0025" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(join(27257..27319,27321..27629)) + /gene="tnp" + /locus_tag="SPC38_0025" + /note="HMMPfam hit to PF01710, Transposase, score 2.2e-23" + /pseudo + gene order(27827..28225,28242..28736) + /gene="tnp" + /locus_tag="SPC38_0026" + /pseudo + CDS join(27827..28225,28242..28736) + /gene="tnp" + /locus_tag="SPC38_0026" + /note="member of homology group 19; + member of homology group 19" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1381 transposase" + misc_feature join(28154..28225,28242..28616) + /gene="tnp" + /locus_tag="SPC38_0026" + /note="HMMPfam hit to PF01609, Transposase DDE domain, + score 0.00054" + /pseudo + gene 28879..29862 + /gene="tnp" + /locus_tag="SPC38_0027" + /pseudo + CDS 28879..29862 + /gene="tnp" + /locus_tag="SPC38_0027" + /note="member of homology group 39" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1239 transposase" + misc_feature 29386..29820 + /gene="tnp" + /locus_tag="SPC38_0027" + /note="HMMPfam hit to PF00665, Integrase core domain, + score 1.1e-18" + /pseudo + gene 29939..>30298 + /gene="aliA" + 
/locus_tag="SPC38_0028" + CDS 29939..>30298 + /gene="aliA" + /locus_tag="SPC38_0028" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34421.1" + /db_xref="GOA:Q4JZ40" + /db_xref="InterPro:IPR000914" + /db_xref="UniProtKB/TrEMBL:Q4JZ40" + /translation="MMKSSKLFALAGVTLLAATTLAACSGSGSSAKGEKTFSYIYETD + PDNLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKD + AKWYTSEGEEYAAVKAQD" + misc_feature 29939..30031 + /gene="aliA" + /locus_tag="SPC38_0028" + /note="Signal peptide predicted for SPC1791 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.782 between residues 31 and 32" + misc_feature 30185..30253 + /gene="aliA" + /locus_tag="SPC38_0028" + /note="PS01040 Bacterial extracellular solute-binding + proteins, family 5 signature." +ORIGIN + 1 cgaccgtcgc ttcctagttg tggctaactt gtccaatgaa gagcaagact tgacagtaga + 61 aggaaaagtc aaatctgtct tgattgaaaa cactgcggct aaagaagtac ttgaaaaaca + 121 ggtcttggct ccatgggatg ctttctgtgt ggaattacta taaatatttt ttgcagaaaa + 181 atttaaaatt gaaatcatat aaaaacaagg gaggactgta taaaaagcag aaatcctttg + 241 ttttttataa ccaaggttta taaactttca ttctcgaaat tcaattaact ttacaaattc + 301 ccactattaa ggagaaagaa gatgaacata aagaagcgtg tccttagtgc aggtctgact + 361 tttgcatctg ctttgctttt agctgcttgc ggccaatcag gttcagatac aaaaacttac + 421 tcatcaacct ttagtggaaa tccaactaca tttaactatc tattagacta ttacgctgat + 481 aatacattga ttatcaccaa tctagttgat ggtttgcttg aaaatgacaa tcacggaaac + 541 ctagttccat ctttgccaga ggactggtct gtttcgagcg acggtctgac ttatacttac + 601 aaattgagaa aagatgccaa atggttcaca gctgacggtg aagagtactc cccagtcaag + 661 gcccaggatt ttgtgacagg tatcaagtac gtagtggata ataaatcaca ggctattgac + 721 ttgattcaaa actcgatcaa aggtttgaat gattatatta caggagcgga ttctgacttt + 781 tctaaggttg ggatgaaggc cattgacaac cagactgttg agtatacttt ggtacgccca + 841 gaaccttact ggaactcaaa aacaaccaac agtattcttt tcccggtaaa ctaagagttt + 901 ctaaattcaa aagggaaaga ttttgggacc ctatctccag atagtattct ctacagcggt + 961 ccttatttgt taaaagattt cacatcaaaa tcatttatcg agtatgtgaa 
aaacccacat + 1021 tactatgatc atgccaaagt atcgattgaa cacgtgaaat tggcttactt taatggatca + 1081 gatcaagaat tgactatccg taactttgaa agtggagctt attctatcgc tggagtttat + 1141 ccaaatagtt cgaactttgc taagaccaag gagaaatata aggataatat cgtctatagc + 1201 ttgcaggaca agacttcttg gtatttaaat ttcaatgtca atcgcgaggc ttgcaatcac + 1261 actactaaaa cgacagatga gcagaagaag tcaactgaga cagctgtctt gaacaaaaac + 1321 ttccgccaag cagtaaactt tgccttggac cgcacagccc attctgccca gtcaaatggg + 1381 gaagaggcgg ctagcaagac ccttcgtaac accttggtgc tcctacattt gtccaagttg + 1441 gagacaagac ctttggagaa gtagttgctt ctaaattggt caactatggt acagaatgga + 1501 ggtattgact tggcagatgc tcaggatgcc tatttcaaca aagaaaaagc ccaagcaaaa + 1561 tttgcggaag ctaaaaaaga attggcaagt caaggtgtga ctttccctat ttacgtgaat + 1621 gtggcagtag atcagacaag taaaaatgcc gttacaggca tgaactcagt taagcagact + 1681 ctggagtcag ttttaggtgc tgataacatt gttattgatg ttcagcaact ttcaacagat + 1741 gattttaata atgtaccttc ttggcaccga tgccagctga tagaggctat gatttgagct + 1801 ttgatggttg ggtgggtgac tatcaggatc catcaactta tctcaatcct ttcaatgcag + 1861 agaatggctt ctatctcaaa atttttggac cggatgccaa ggaagataag gaaaaaatca + 1921 ctagcctagg tcttgatacc tacactaaga tgctcaaaga tgcagatagt gaaaacaaag + 1981 atgtagccaa acgctatgaa aaatatgctg aagcacaggc ttggatgatt gacaattctc + 2041 tcattatgtc agctatgtca agtggtggca cagcatctgt aaccaaagtg atgccattta + 2101 caagagggca ttaattggtt ggtattaagg gtgatggcaa taactacaag tacatgaaac + 2161 tgcaaaaaga tactgtaaca accaaacggt ttgaaaaagc taagaccaaa tgggagcaag + 2221 aaagcaaaaa agcaatcgaa aaagcccaaa aagaagcaga aaaacatgtt aaatagttat + 2281 aaatagcttt ttcaaggaga attataaaga caaacatcag ttttggtgct tgtcttttta + 2341 aatcactcgg ttattgaaaa ttagacttct tgcgaaacag gctctttgtc aactgtagtg + 2401 ggttgaagaa aagctaagct cgagaaagga caaatttcgt cctttctttt ttgatgttca + 2461 aagtgataac aatccgtttt ttgaagtttt caaagtttcg aaaaccaaag gcattgcgct + 2521 tgataagttt gatgagatta ttggtcgctt ccaattttgc gttggaataa ggtaattgaa + 2581 gagcgttgac gattttttct ttgttcttta gaaaggtttt aaagacagtc tgaaaaatag + 2641 gatgaacctg 
cttaagattg tcctcaataa gtccgaaaaa tttctctggt tccttattct + 2701 ggaagtgaaa cagcaagagt tgatagagct gatagtgatg tttcaagtct tgtgaatagc + 2761 tcaaaagctt gtcaagaatt tctttatttg ttaagtgcat gcgaaaagta gggcgataaa + 2821 aacgtttatc gctcaattta cggctatcct gttgaatgag tttccagtag cgcttgatag + 2881 ccttgtattc atgggatttt cgatgaaact gattcatgat ttggacacgc acacgactca + 2941 tagcacggct aagatgttgt acaatgtgaa agcgatcaag aacgatttta gcattcggga + 3001 gtgaaacagc ctgggagact gtttcagcct gagcctagaa atttgaaagc gaagctgttt + 3061 agccaagtca tagtaagggc taaacatatc catagtaatg attttgacgc gacatcggac + 3121 ggctctatca tatttaagaa agtgatctcg gatgacagct tgtgttctgc cttcaagaac + 3181 agtgataata ttaagattat caaaatcttg cgcaatgaag ctcatctcca tctcccgatt + 3241 gaaacagtca ctccccggac tgtttcaacc tcccaagaca taatctcagg cagatttcta + 3301 aaattacact caaagtggaa gtcattgagc ttgcgaatga cagttgaagt tgaaatggcc + 3361 agctgatggg caatatcagt catagaaatt ttttcaatta acttttgagc aattttttgg + 3421 ttgatgatac gagggatttg gtgatttttc tttaccaggg gagtctcagc aaccatcatt + 3481 tttgaacagt gatagcactt gaaacggcgt tttctaagga gaattctaga aggcatacca + 3541 gttgtttcga ggtaagggat cttagacggt ttttgaaagt catatttctt cattagactt + 3601 ccacaatcag ggcaagatgg agcctcataa tccagcttag cgataatttc tttgtgggta + 3661 tccatattga tgatatctag aatcttgatg tttgggtctt taatatcgag cagttttgtg + 3721 ataaaatgta attgttccat atgaatcttt ctaatgagtt gttttgtcgc ttttcattat + 3781 aggtcatatg ggactttttt tctacaacaa aataggctcc ataatatcta taggggattt + 3841 acccactaca aatattatag agccgcgaaa caaatatggt ataatagttc tatggattat + 3901 gaagcaagta aacaactaac tgatgcacga tttaagcgtc ttgttggtgt tcagcgtacc + 3961 acttttgaag agatgttagc tgtattaaaa acagcttatc aacttaaaca cgcaaaaggt + 4021 ggacgaaaac ctaaattaag cctagaagac cttcttatgg ccactcttca atatgtgcga + 4081 gaatatcgca cttatgaaca aattgcggcc gattttggta ttcacgaaag caacttaatc + 4141 cgtcggagcc aatgggttga agtaactctt gttcaaagtg gttttacgat ttcaagaact + 4201 cctctcagtt ctgaggacac ggtaatgatt gatgcgacgg aagtaaaaat caatcgccct + 4261 aaaaaaagaa ttagccccaa atttcaagtt 
gaagttagcc acccaaaaga aattcacttg + 4321 gcgacttgta gtccaagcat tttttagggt agttgttaat ccaattttcg ataaaagcta + 4381 cttctttcgg agtcgttttc ttggttcctt taggtaacca tctccgaatt aatcgattat + 4441 gattttcatt tgaacctctc tcccatgaag agtaagcatg tgcgtagtag atatgttcct + 4501 caggaaatac ctcagacaat cgtttgaact ccgaaccatt atctgcagta atggacagaa + 4561 tacgatgctc ccctaatagt aacgtaagcg cctgattgac agattcagca gttttatttg + 4621 gaattaacct tataatttgg tgtctgctcc gccggtcggt taagactaac aggcaataat + 4681 tttttatctt agtcagtagg acggtatcaa tttcataatg accattttcc aagcgaagat + 4741 taataacgtc aggacgttct tcgatagatt tacctgccgg cttaaagttc ggactagctt + 4801 gcttcttgac acctttcctt tttctgggat aaagcatgtc ggccttcgtc aatcctaaat + 4861 gaccattatg aaaccagtag tagatggttg aaataccaac tttcacttgc ttcttgttaa + 4921 ccatcatttc aggcgaaaat ttttgcttat gatagtgtaa gatcttctct ctgatttcct + 4981 ttgttaaaat taactttttc accgaccgtt ttcgattgaa ttggtaaaca gtttgtgcgt + 5041 aatcggcaga atagaccttt ttgtatagcc cttttctcac ttgttgtaaa gttgtacctc + 5101 ttttgacttc attatgaatc gtttgaggcg cctttcctaa caagcctgca atttcacgat + 5161 tggacttatt ttcattcttc caccgctcaa tcaagcgacg gttatctatt gtcaaatgtt + 5221 tcccttttgg ggtataatgt tcttgcatct ctgtgccttt ccttgtgttt gtggttgaac + 5281 aacaagtata gcacagaggt gttttcttat accttaaatc acatttcatt tgacaacagg + 5341 aacccttgaa cctgtttttt cagctaaacc aaggctatga ttagccttgg ccacctagcc + 5401 taacagtttc aaacctgtta tcaaatgaaa tcatcaactt actcaaacat agtgaaacat + 5461 ctaattcttg actaaggtaa ggtggctaac ttcattatag aactttcaaa aaaagaatta + 5521 gcaaattatt ctggtaaaaa gaaatgccgc gctatggaaa aatgatttgt tttgtgctaa + 5581 aatagattga aactaatact caatgaaaat caaagagtaa cttggaagtt agctcaaagt + 5641 acagctttaa ggtggtagat agaactgacg aagtcagctc aaaatactgt tttgaggttg + 5701 cagatggacg ctgacgtggt ttgaagagat tttcgaagag tataagatcc tctcttttgc + 5761 tatagttaag gagatgagag gtaaatgata agggagagac tatgtacgac tatctaatcg + 5821 ttggtgctgg tttgtcggga gcaatttttg cttatgaagc aaccaagcgt ggaaaaaaag + 5881 taaaagttat tgataaacgt aaccacattg gtggaaatat ctactgtgag 
aatatagaag + 5941 gagttaatgt tcataaatat ggtgcacata tcttccatac ttctaataag aaagtctggg + 6001 attatgtgaa tcaatttgct gaatttaaca actacatcaa ctcgcctgta gctaattaca + 6061 agggtagcct ttataatcta cctttcaata tgaatacttt ctatgctatg tgggggacaa + 6121 aaactcctca agaagtgaaa aataagattg ctgagcaaac ggctcacatg aaagacgttg + 6181 aaccgaaaaa cttggaagaa caggctatca agttgatcgg tccagatatt tatgaaaagt + 6241 tgattaaagg atatactgaa aagcaatggg gacgttccgc gactgacctt ccaccgttta + 6301 tcatcaaacg tctaccagtt cgtttgactt ttgataataa ctactttaat gaccgttacc + 6361 aaggtattcc aatcggtggc tataatgtca ttatcgaaaa tatgctgaaa gatgttgaag + 6421 tagaacttgg agttgacttt tttgccaatc gtcaggaatt agaagcttct gctgaaaaag + 6481 ttgtctttac agggatgatt gaccaatatt tcgattataa acatggtgag ctagaatacc + 6541 gtagtcttcg ttttgagcat gaagttctag ataaggaaaa ttatcaagga aatgccgttg + 6601 ttaattatac agaacgagaa attccttata ctcgcattat tgagcacaaa cattttgagt + 6661 acggaacaca agataaaacg gttattactc gtgaataccc agctgattgg aaacgtggag + 6721 atgaacctta ttatccaatc aatgatgaga gaaacaatgc catgtttgct aaatatcaag + 6781 aagaagcagt acagaatgat aaggtaattt tctgtggacg tttggctgat tataaatact + 6841 acgacatgca tgtggttatt gaacgggctt tggaagtggt aaggaatgag ttctcatgag + 6901 agaaacaggc atatatgaaa gttaatgtag aggagttgag ctttttattt gaatattggg + 6961 tgaaaaagta gtatacttag atagtctgtt tttaaaaatc aaaatgggga aatcgattct + 7021 tatcaacttc agagtgaact gaattaaaac tgcataggag tatataaaat gctgaagtaa + 7081 gatttacaga acatggtatg ataagtgttc gacagcttgt ttggcaggag ttcgaatatt + 7141 caagtaattg agagggtttt tgaacttctg ataagataga tagtagatta ctttcgagta + 7201 aaggatagtt gagaaaatga ataatcgtat agtagacatc agtttgtttg atttattgaa + 7261 tgtcttatgg cttcgtaaat ggatcattgt ttttgtatca tttgtttttg gatgtatttc + 7321 ttttttatat tatcaatttt ttgtacccaa aacctataca agtgatactc gtatatatgt + 7381 ggtaagcaaa ggggataata aaaatctgtc taatgcagat ttgcaagcag gaagtgctct + 7441 aacaaaggat tacaaagaaa tcattttatc agatgaagtg ttagaagaaa caatttctga + 7501 tttaaaacta gaatcaactt tggaatctct agcttcgaaa attaaaattt ctatccctgc + 7561 ggaaactcga 
attatttcca ttagtgttac aaatacgaac tcagatgaag ctgctcgaat + 7621 agcaaatggg ataaggaagg tagctgccct taaaatcaag gaagtaactc aagttacaga + 7681 tgtcaccact ttacagactg cacgccctcc ccaaactccg tcaggaccgc atgtgcgaaa + 7741 atctactaca gcagggcttg ttcttggtgc attcttaaca gtctttctag tagttgccaa + 7801 ggaaatatta gatgatcgca taaaacgttt tgaagaactt gaaaaattgg gaatccctat + 7861 tttaggctca atccctttat caaaaaatat aaagtagaaa atcatgggaa aattagaact + 7921 aacacgtaag tactatcaat tgtacaatga aacgaaagaa tattttaatg ccttacagac + 7981 caatattcaa cttagtggtg atggactgaa agtcatttct gttacttcca cagtaaaaaa + 8041 cgaaggcaaa tcgactatat cagttggctt gtccatgtcc ttggccttat caggctataa + 8101 agtcctgtta ctggatgtgg atttacgtaa ttcagtgatg tcaggaatgt ttcattctag + 8161 ggaaagaata acaggtttga ctgaatattt atctggcaaa gcgggaatgg cggattctat + 8221 gcaggaaact actttagata atctctatat attacaagca ggagtcgttt caccgaatcc + 8281 cttatctcta ttaaggagtg ttaagtttga aaccttgata gattctatga aaaagtactt + 8341 tgactatatt atagtagata ctccaccaat cggccaagta atagatgctg caattattgc + 8401 ccaacaatgt gatgggatat ttttggtcac tgaaatgagg aaaacgacac gcagacaaat + 8461 tttttcttcc ctccagcaat tggaacaaac tggagttccc gttttgggcc ttgtggccaa + 8521 taaagcaatt ataaaaaaag atagctatgg ctattatgga aaaaacaccg cgagcgagac + 8581 tgaaagatat tgatggacta cctcctctac ctcacaaatt gcattttttg tgaggtagag + 8641 gggtaagttg atactattat atattagact tcctgcgaaa caaaatatgg tatagtagtt + 8701 ctatgaatga tgaagcaagt aaacaactaa ctgatgcacg atttaagcgt cttgttggtg + 8761 ttcagcgtac cacttttgaa gagatgttag ctgtattaaa aacagcttat caacttaaac + 8821 acgcaaaagg tggacgaaaa cctaaattaa gcctagaaga ccttcttatg gctactcttc + 8881 aatatgtgcg agaatatcga acttatgaag aaattacggc tgattttggt attcacgaaa + 8941 gcaacttact ccgtcggagc caatgggttg aagtaactct tgttcaaagt ggtgttacga + 9001 tttcaagaac tcctctcagc tctgaggaca cggtaatgat tgatgcgacg gaagtacaaa + 9061 tcaaccgccc taaaaaaaga attagcgaat gattctggta aaaagaaatg ccacgctatg + 9121 aaggctcaag cgattgtcac aagtcaaggg agaattgttt ctttggatat cgctgtgaac + 9181 tatttgttat gatatgaagt tgttcaaaat 
gagtcgcaga aatatcggac aagctggtaa + 9241 aatcttggct gacagtggtt atcaagggct catgaagata tatcctcaag cacaaactcc + 9301 acgtaaatcc agcaaactca agccgctaac agctgaagat aaagcctgta accatgcgct + 9361 atccaaggag agaagcaagg ttgagaacat ctttgccaaa gtaaaaacgt ttaaaatgtt + 9421 ttcaacaacc tatcgaaatc atcgtaaacg cttcggatta cgaatgaatt tgattgctgc + 9481 tattatcaat catgaactag gattctagtt tggcaggaag tctattttgg aatgctatta + 9541 tgtttagttg tgctcaatga aaatgaaaga actagtaagc taggcgcagt cagctcaaaa + 9601 cagtgttttg aggttgtaga tagaactgac gaagtcagta acatatatat gacaaaccga + 9661 tgctgacgtg gtttgaagag atttttgaag agtataagac ggtattttaa gggaatgatt + 9721 actatttgag gtattttatg agtagagaga aaaaaagagg aacagcagtc cacttgaaat + 9781 cttatatcaa tagtgtgctg ctaatcctgt acacaggaat agcgagccta tttctttttc + 9841 agatattccg atacaatatt ttaaatttta ggaatctcaa tttattagta gctctgctag + 9901 tagtattggt atttatttta ggagtgagtt tgattgtccg aaaaaaagct gaaaagttga + 9961 caatgcttct cctaatctta gctgtcgcaa gtagttcaat atcgcttttg gctgttcaac + 10021 aatttatcgg ttttacaagt cgcttaaatg caacttcaaa cgtttcagaa tatgctatta + 10081 gtcttgtagt tttgaaagat agcgaaatta gtgaactaga acaagtatca catgtgatgg + 10141 cgcctaccga tacagattat gaagctattc aaagtttgtt agcagatata aaagaaaagc + 10201 aaggtaaaga tctaatagta gataaaagca aatcttattt agaagcctat aagagtttga + 10261 tttcaggtga caccaaggtg atttttttaa atagtatttt tgaacatatg attgagtcgg + 10321 attttcctga ctttagagac aaaattaaga aaatatatac aaaagaaatg acaaagaaag + 10381 tagaagctcc aaaggtttca aaggggcaga cttttactat ttatttcagt gggattgata + 10441 cttatggacc aattaactct gtatcacgtt cggatgtcaa tattttgatg acagtcaata + 10501 gcgagaccaa aaaaattctt ttgacaacta cacctcgtga ctcctatgtc gcaattgcag + 10561 atggaggaaa gaatcaaaaa gataaattga ctcatgctgg aatttatggt attgattctt + 10621 ccattcatac cttggaacat ttatatggtg tagagattaa ctactatgtt cgtgtaaatt + 10681 tcacttcttt cttaaagata gttgatttat tgaatggtat tgatgtggac aatagtcaag + 10741 aatttacaat tgacgggaac gactatcctg ttggaaatct ccatctaaat tctaagtcag + 10801 cacttggttt cgttcgagaa cgtcattctc tagcagatgg 
agatcgtgat cgaggacgga + 10861 atcaacagaa ggtgctcgct gcaattattc aaaaattaac ctcaatagaa tcattgaaaa + 10921 attatcgtca aatcatgcaa ggattagagg attcaataca aacaaatctc tctccaacaa + 10981 ctatcatgga cttagccaat actcaattgg aaagtggagg gaattataaa ataaattctc + 11041 aagatttaaa agggacaggg cggatggatc ttccttctta tgcaatgcct gatagtcagt + 11101 tgtatatgat ggaaattgat gagaatagcc tctcagctat caaagaaaat attcaggctg + 11161 ttctggaggg taggtaagat gatagatgtt cattctcaca ttatttttga tgtggatgat + 11221 gggccaaagt ccatagaaga tagtagagct ttgttgttag aagcctatga tcaaggaatt + 11281 cggacaattg tttcaacatc ccaccgccgt caaggtatgt ttgaaacacc agaagacaag + 11341 attgcggaaa attttcgtgc ggtacagaaa atagctagag atattgcaga tgatttaaca + 11401 attttatatg gtgcagaaat ctactatact caagacatta tcaataaact tgaaaagaaa + 11461 actttcccaa ctttaaatgg gagtcgatat gccttgattg aatttagtag cgagacttct + 11521 tatcgttcta ttcatagcgc tcttcagcag ttgcttttgt caggaattac cccgcttatc + 11581 gcccatatcg aacgttatga tgctcttgaa aacaataaac aagcagttct cgaattgatt + 11641 cgtatgggct gttatacaca gattaatagt tcccatctac tcaaaaaaaa attatttaaa + 11701 gatgatgcaa aaatcatgaa gaaacgagtt cactattttt tgaaacatga tttagtccat + 11761 attgtagcaa gtgacatgca taatcttgat actagaccgc cttatatggc ggaagcttat + 11821 gaaatcattt ctaaaagata cggaaaagaa aaagctgaag aattttttat aaaaaatccg + 11881 caacgaatcc taatggatca attgatttaa tgaaaaagga aacaacaaat gtataaagtt + 11941 atcaaacgat ttatagatat agctttagct ttgctaggaa ttgtattatt atcaccacta + 12001 tttttaggaa ttatagtgtt cataaaatta gaatctaaag ggactatttt ctttaaacaa + 12061 aaaagaattg ggctacataa aaaagaattt tacattctaa aatttagaac gatgagaatt + 12121 gacactcctt cagctgtccc tacacatctt ttaaaaaatc cttatcaatg gattacaaag + 12181 gttggtaaag tcttacgtag aacctctctg gatgaattgc cacagatttg gaatattttg + 12241 gtcggtcaca tgtcgcttgt aggaccaaga cctgcccttt ggaatcaatt tgatttgatt + 12301 gaagaaagag acaaatatgg agcaaatgat attttacctg gtttaacagg ttgggcacaa + 12361 atcaatggaa gagatgaatt atctattcca gtcaaagcca aatttgatgg ctactatgtg + 12421 aagaactgtt catttgtttt agattgtcga tgtgttgtag 
aaagtttttt agtagtattt + 12481 aagagatatg ggcatcgaga aggtggtgca gattagagga actgatatat gggaaatcgt + 12541 aaaaaagttt ttgtagtagc caatgtagtc aaagaacata ttctaaaatt tcacattccg + 12601 actatcaaag aaatgacaaa aagagggtgg acggtagacg taggtgcttc tggggatgaa + 12661 acagttccct attgtcacca acaatattca ctgccccacc aacgttctcc gtttcatcta + 12721 ggcactctca aaagtatctg gaaattgaga aaaattttga agtctggagg ctatgatatt + 12781 gtttactgtc atactcctgt tggaggtttg gtgggacgac tggcttcttt aggattgcga + 12841 aaacaaggaa caagagtcat ttattttgtt catggatatc atttttacaa aggagcaact + 12901 tttttcaatt ggttagtgta ttacccaatt gaaaagctac tgtccctttt tacagatagt + 12961 atcattctaa tcaatcaaga agattatcat ctcacaaaaa caaaatttaa acaggttcaa + 13021 tcctatctag tgagtggaat gggagtaaaa caagaacggt tttcacccca atcaaatcaa + 13081 gttagagaac gttatcgtaa agaattgaaa ctgcctgagg atgcgactgt tttaatttat + 13141 tgtgctgagc taataaaaaa taaaaatcaa acatttttac ttcatgctat gaaaaagctt + 13201 gtggatcagg gagaaaatct ttattgctta ttagtaggaa ttgattatac caagggtgaa + 13261 atggtagaat atattcaatc cttgaattta tccgatcgag ttttactttt agggtggaga + 13321 gaagatattg ccaatcttta cgcttgttct gatatatgtg ttgcaacaag tattcgagaa + 13381 ggatttggat taaatatagt ggaagcaatg ttttgtcacg ttccagttgt tgcgaccatc + 13441 aatagaggac acgccagtat tatacaagat ggacaaaacg gtctattagt ccaattagga + 13501 aatacaaagc aattagtaga ggctatttat gtactaatga aggatactaa gaagaagcaa + 13561 gaattagtgg agcaagctag tgcgaattta gaacaatatc atagtcagaa aattgtaaat + 13621 agcttactag aaataataga acagactgca atgaagtgag tgaaggatgt gaaaaagtga + 13681 aaatacaaat tgataaaata tactatctat ttttttggct ggtagtttcc tttggatatt + 13741 tttttatgat gccaaccttt acagaagatt tagaaggcgt tgtcagtgct agtttagtac + 13801 aattgttatt atttattata ggatatgtat atgtatctta tttaaatcgt tcttttatct + 13861 cactgtatag tatctttatg attgtatttt acctttttca aaatggacag gtattgttat + 13921 attcacttgg agtagagtat gattactttt atgttttaag atatgatgaa accatcgtac + 13981 tacaatcagt tattttttca acacaatgtc ttattgcagc ctttatggct ggagtctttt + 14041 ctacgaagaa agaggtatca aaaccccttt attcttatat 
ggatcaatta gaacgagaaa + 14101 aactgattac tactggaaag ttattttggg gtgcgtttgc gatttttgct ttacccttta + 14161 tgatgatgaa gcttgttatc accagtacat ctgggtattt tgcgatgata cgtttcgttg + 14221 gaagcctacc tacaataaca gtgttatttg aaaaaatgtt cattgcttca agtgtttttt + 14281 tgattgttta tttaaaatct gaggaaactt ggagcaagtt tttaaaagtt gttatcttag + 14341 gttggagtat aatggctgct ttaacaggag atagaaccgt aggtttagca gggattgtta + 14401 cgttagcttt aattcaaaca ttaattggta atcgtaaaaa aaagattaag ttttctcagt + 14461 atgccttgtt agttggggca gctgttgtag tgatgtattt aatgtccttt gcttttcaat + 14521 ttaggatgca acaagattct aaagtttcag gactacaaac tgcggtagta gaaatgatag + 14581 gaactctagg gtttagtttt ttcccactcg tattaacgat tagaattgtt ccaacttcta + 14641 ttaacttttt tagaggaaaa tcatatattg cagccatcat tacaggacta attccatcta + 14701 attttgattt tttacattta acaaatacat tatcagaatg gaatgcatat ccaacggaat + 14761 tattagatac aatctatcat tatggtttcg gattagatta ttctttaatt gcggaagcct + 14821 atattaattt tggttcttat ggatggatag cgattttttt cctttgttct ctaatagctt + 14881 attttgtaag agatgtggat tttaaaagaa aggacaactt attctcacaa tatgctagct + 14941 tgattttgct gtattcatgg tttacccttc caagaagaaa atcttatttt atttttaata + 15001 attttttttg gtatgtatta ttttttggac tagcactcat acttgtctct cgttctatta + 15061 aacaacgaaa ggaatttaaa aaatgaaaat ttcaattatt atgggcattc ataatggtga + 15121 aaagcgcttt gaaacagctg ttcaaagtat tttcaatcaa acttatgata attgggaatt + 15181 tattatttgt gatgatgctt ccacagataa aacgtttgaa aagttacaag gattatatgg + 15241 acaggattca cgttttatct tattaaaaaa tgaaaaaaat gtaggtcttt ccgcgacatt + 15301 aaaccgttgc attgaagcaa gtagtggaga atttattgct agaatggatg atgatgatat + 15361 ttgttatccc gagcgctttg aaagacaagt cgactatttg ttccatcatc cagagattga + 15421 ttttgtttct tcatctattg atatttttga tggagaagta gttgtaggta cacggatttt + 15481 acttgatttt cctagtaaaa aggatttgat ttggaatagc ccctttgttc atcctgttac + 15541 catgtttcgt agagatgcct tgcttgaagt tggcggttat agagtttctc cagaaactgt + 15601 tcgtgggcaa gattatgatt tgtttatgcg actatattca tgcgagaaaa aaggtggaaa + 15661 tattttagaa ccactatttc gctatacgat tgatcaaaat 
acgatgaagc gacgtacgtt + 15721 taaagctcga attggggaaa tgattattcg ctataaaggt tatcgtgcga tgaaagttcc + 15781 attttataat tatgttttta tatttaaacc attagtagct catctagtaa cactcgttaa + 15841 aaggagataa tgtttatgaa aattttaata accactcata cttatcttcc taataaagat + 15901 ggtgttcaat ttgttaatca atatttagca gaaggattgg ttaaaagagg acatcaagta + 15961 acggtgctga cctattgtta tccatcacgt acaagggtac ctagagaagt gataaatggt + 16021 gttagagtca ttcgttggaa tgctcgaaca agctgtactt tccataaagg agaaaaatta + 16081 gcttatcaaa acttcatctt aaactcccaa tcagattatg atgttttagt gaatgttgga + 16141 acacagactg ctttaacaga ttggttattt ccgatatttt ctcagctaac aattccgaaa + 16201 gtcttatata ttcattcgat atgggatttc aactggttgc attggcatag acaatcattc + 16261 aagcgatttg ttgctaaagc ttgggcaaat gtacgatgga aatattatta ttggacaaag + 16321 gcttctatct ttaagcaata tcatgaagtg attcagctgc acccaaaaga ttatagtgtg + 16381 gcttttttta aagaaaaata tggcatagaa agtcagattt tagaaaatgc tgctgatgct + 16441 tctttttttc aaaatagaaa tgctgtcaaa aagcaatctt acattgtaaa tgtttctaat + 16501 tttaatgatc gaaaaaatca gaagaaagcg gttgagtatt ttttgaaaag caatcttcca + 16561 aatgaatgga agctcgtttt agttggttca gaaaagaatc agtatttaca aagtctacaa + 16621 acttttgaaa aagaactccg aaaccaatta ggtatcactt caggtaaaga aatagaatat + 16681 cgcatcggac tgtcaagaga agaagtcgta aaaactgtaa aagaagcttc tttttgttta + 16741 atgacaagta tatgggaagc ttttccaatt tccttaattg aagtgatggc tgcaggaatt + 16801 ccatttatct cttctgatgt aggaattgtc aactatttgt ctggaggaat cactgcttgt + 16861 agtgatcaag aatttataag agctattgaa gagtttgcca gttgtccaga aattagaaat + 16921 caatatggca aaaagggaca aatggaagca aaagaacatt atcaagtgga tgataaagta + 16981 aaagagcttg aagctttgtt acaaaaggtc gtaaaggaag aaaaagagtg aaaaaaatag + 17041 tatttttgtg tccatacttt gggactttac caccccatac gcagttatgg ctaaattctt + 17101 gtaaaatgaa tccgtctgtg acatggtatc tttttacaga tgacaagaga aaatttgact + 17161 atccagaaaa tgtgcaagta ttttatacga ctttggaaga aacaaaggcg ttgtatcaaa + 17221 agaaatttga ttttgagatt tctttagagg gggcttataa actcggagat tataaacctt + 17281 tatttggtta tctttatgag gaaatgatac aagagtttga 
tgcttgggga catattgatg + 17341 tttatgatga aatctatgga gatattcgtg catttgtaac agatgaatta ctagaaaaat + 17401 acgataaatt gatgattttt gggcatatgg ggatttataa aaattctccc gaagtcaatc + 17461 gtagatttga attgtcgtct gatttgaatc gtacttatca agaaatattt tcttcatcac + 17521 aattttataa ttttgaagaa tatgttgcag gaagtattac tcgtatctat cagaaaaatg + 17581 gattccccat tggaaaatta gatgaggtga ttgcggatct ttctggtaca agttatcatt + 17641 ttcgacgagg gtacatttca gatgattttg aaacatttac ttatttacca tatgagccta + 17701 tgattttttc atgggaagag gggaaaacgt attgttattc ggttaagaat catcaagtgc + 17761 aaaaagatga gtttatgtat gttcacttta agcgtcgaaa aatgattcaa gatataccag + 17821 atgatgcttc tacttattta atcgtcccaa gtggttttgc cttgatgcct gaagagataa + 17881 cggttgattt gattcgaaaa tatagtcaga aaaaattatt ttatccagtt tattttgaag + 17941 aaaagtggaa aggtttcaaa cgattatgga ataaaatttg gaggtcggaa tgaagaacat + 18001 tttaaaaaaa ttgatacaac aattaccgga taaactgttt ctacaaatta agtatttcta + 18061 catttttaag aagaaattaa atttaaaaaa tcctaagacc ttcaatgaaa aattacaatg + 18121 gctaaaatta tatgatagaa atccttttta taccatttta gcggataaga ttttagtgaa + 18181 ggactatatt gccaagacac ttggggaaga atatgttatt ccgactcttg gtgtttatca + 18241 tcattttgat gagattgatt ttgatgagct tccaaattct tttgtgatga aaaccaatca + 18301 tgatagtggc agtattatca ttgtaaaaaa caaagaagac ttgaatattc aagaagcaag + 18361 agaaaagcta caaaaaagtt tggaaagaga ttattttatt tttggtcgtg aatggcctta + 18421 taaaaatatt gaacgaaaaa ttattattga agagtttatg acggatgaat cgaatcaaga + 18481 attaaaggat tataaaattt attgttttaa tggtcttcct aagtttgttc atgtagatta + 18541 tgaccgtttt acaaatcata agagaaatat ttatgatagc aactggaagc agcaagaatt + 18601 tatgtatgct tttccgtccg ataaaaataa gacgatagag aagcctgctg aactgtctga + 18661 aatgattgaa cttgtgagaa aattatcaaa agagatgcca tttgtgagat gtgattttta + 18721 tatcgtcaat cacaaaattt tgtttggtga gatgactttt tgtccaggtt cagggtttga + 18781 aaaattttat ccagaacagt atgatgtaga gtttggaaag gatattactt taccggagaa + 18841 gcatgaatgg aaacaaaaga aaaacgttta gttcataata cgattatttt tacaattgga + 18901 agtttaggtt caaaatttat tcagtttttg ttagttcctt 
tgtataccta tactttaaca + 18961 gcttctcagt ttgggattac cgaaatttta ttaaccgctg ttaatctttt aatacctgta + 19021 ttttctattt ccattgctga tggattatta agatttggat tagataagac cttaagaaga + 19081 gaaaatgtct tgaaatcagc ttttatcatt tcgatacttg ggactatttt atccattatt + 19141 tcgattccaa ttttttcgct ctatcctact ttgtcagagt ggatggttta ttttatcatc + 19201 attttgaact tgagaatgta tcgggatgtt tttgcgattc aattgaaagt tgaagggaaa + 19261 aatacattat ttgcttgcga tagtatgatt tatacatttg ttttatcttt agcgagtatt + 19321 gtctttctag ttcctttttc tttaggcatt tcaggttatt ttttcgctta tattgtcagt + 19381 aatggaattt ccattttctt tatcttattt ttcggaggag tctggaaaag ttttactagc + 19441 ggaagatttg aaaaacaatt gatgatacaa ctattgaaat attcagcacc catgatttta + 19501 aatggtattg catggtggat tacaaatgcc tcagatcggt ttatgttgca atggtttatg + 19561 gatgatagag cggtaggttt gtatggtgtt gttgcaaagt tacccttatt aatcggaacg + 19621 tttactggag tatttaatca ggcatggatt atttcagcag tagaagagtt tgaagaagaa + 19681 aatgaagaat ggttttatca aaaagttttt caccaatatt atgcagcact ctttttaagt + 19741 gtttcagtat ttttgcttct acttcaacca tttatgaaag tatatgttag tccaagcttt + 19801 tatgaagcat ggcaatatgc tccgttttta ttattgtcaa gtgtagtttc aggaatcgcc + 19861 gcatttatga caggttttta tgttgcgcaa aagaaaaatt tgaatattat atacacgacg + 19921 attgctggtg cttttgcgaa tattttgtta aatgcgatgt ttattcctat gcttggagta + 19981 ttaggcgctt ccattgcgac ctttctatca tggtttgtta ttgcaatcta tcgtatgaaa + 20041 gatgttgaaa actttgcttg ttttccatta gataaaaaag ttttttggta tttatttcta + 20101 ttatgtattc agaccattac gatgactttt ctgccaatcc ttggcattgt tttttcagtc + 20161 gtattgattc cttatttctt ttaccaagaa caggaatttc tagcagtttt atttgataaa + 20221 ggaaggaaaa aagtatgttc attcaaaaaa tcaaaaagat aataagagta tttttaagga + 20281 aatctttagt aaaagattat cgacaaagaa ttcaaaataa agagtttact cttattactt + 20341 ctaattgtgt gggtggactg attagtcatg atttgggtct acaatttcgt tctcccacta + 20401 tcaatatgta tatagaagca gcagacttta ttcagttttg ttcacattta gaacgctatt + 20461 taaaagaaga cttatctttt attgaagtaa atcaagatgg acattttgta gctctttgtg + 20521 gggatataaa aatttatatt gttcattata atagctttga 
agagtttgct aaaaaatggt + 20581 ctgaacgtgc caaaagagta gattttgatc aattatatct tatgatgtct gaacgagatg + 20641 gctgtcgtta tgaagatatt gtgaagtttg atacgttacc ctataagaat aaagtaattt + 20701 ttacaagtaa aaagatgcca gaaattcaat ccgcttttta tataccaggt attgaaacaa + 20761 aaaataatca aaaacataag gtgaaatcag taacaactta tcttaactcc tttacaggaa + 20821 aacgatatat agatttattc gactttgtag agtttttgaa tacaggaagg aaacaattaa + 20881 gtaagtatga aaagtaagat aatattaaaa aataaaacaa ttcttgttac aggagcagct + 20941 ggctttattg gtgctaatct tgtcatgagt ttattacaag aagaaaatcc attacagatt + 21001 attggaatag ataatttgaa tgattattat gatgtttctt taaaagagta tcgtttatca + 21061 acaattcaag aggagtgtca atcatcttta aataaaaaat gggtatttat caaaggagat + 21121 attgctgatt ctgatttgat ggaagaaatt tttgagacgt atagacctca aattgtagtg + 21181 aatttggcag cacaagcagg tgttcgttat tctatcacta atcctgatgt ttatatgaaa + 21241 agtaatatca ttggatttca tactattctt gaaaaatgta gaaagtatca agaaaatatt + 21301 gaacatttag tttatgcatc atcctcttct gtttatggtg gaaatacaaa aattcctttt + 21361 tctgaattag atgcagtaga caatcctgtt tctttatatg cagttacgaa gaaaacaaat + 21421 gaattagaag cacatgcgta ttcaaaattg tacaatattc caacaacagg cctgagattt + 21481 tttacagttt atggaccagc tggaagacct gatatggctt attttagttt tacaaagcaa + 21541 ttaattgata aaaagccaat tgaaattttc aattatggga attgtcaacg tgattttact + 21601 tatattgacg atattgttga aggcgttaaa agagtgatga ctggagctcc tcaaaaagaa + 21661 attggagaag atgggttacc aattcctcct tatgctatct ataatattgg aaatcaccaa + 21721 ccagaaaatt tattgaattt tgtcgaaatc ttgcaagaaa aattgatagc tgcttctatt + 21781 ttaccagaag attatgattt ctcatctgct cagaaacttg ttccaatgca agctggtgat + 21841 gtagttgcaa cctatgcaga tataagtcta ttggagaagg attttaattt caaacctaag + 21901 actagtctta gaaatggctt gagaaatttt gcagaatggt atagaaattt ttatcaaagg + 21961 ggtgaataga atgaaaatta ctgtagtagg aatgggatat gtcggattgt ccttggcggt + 22021 attattagcg caacatcatg aagtaacagc gttagatatt attgataaaa aaattcaact + 22081 catcaatgag aaaaaatctc caattcaaga tgagtatatt gaacaatact ttttagaaaa + 22141 aaatcttcat ttaagcgcaa caacaaacga agtagaggcg 
tataaagatg cggaaatgat + 22201 tattatagct gctcctacag attatgatac acacaaaaat ttctttgata catctgccgt + 22261 agaacaagta atcgaaaata ttatttctat gaataacgag gctttaattg tcattaaatc + 22321 aactgttcct gttggctata cggagtcgat tcgagaaaaa tatggtaaaa agaatatact + 22381 gtttagccca gaatttcttc gtgaagcaaa tggattgtat gataatcttt atcctaatcg + 22441 aattatcgta ggtacagatt tgaatgatgg agcattagtt tctaaagcac atgaatttgt + 22501 gtctttacta caagaaggtg ctctcaaaga gaatattgat actttaatca tgggattttc + 22561 tgaagcagaa gctgtgaaat tattttccaa tgcttatctg gctttaagag tgtcttattt + 22621 taatgagttg gatacttatg ctgaactgaa aggattgaat acgaaagcca ttattgatgg + 22681 agtaggattg gatcctagaa ttggtcagtt ttataacaat ccatcctttg gttatggtgg + 22741 ttactgttta ccaaaggata gtaagcaact gttgtcaaat tatcatgatg ttcctgaaaa + 22801 tattatttca gcaattgttt ctagtaatga aactcgtaaa aaatttattg cagaacgtat + 22861 tcttgaaata gtcggagcta atcatattga tgaatactat aatttgaagc aggaaatcgt + 22921 tgtaggtatt tatcgtttag tcatgaaaaa aggttcggat aattttagac attcttctat + 22981 ccaaggaatt ataaagagac taaaagcgaa tggagtgaca ttaatgatct atgaaccttc + 23041 acttccagat ggacaattat tttttggaag tgaagttgtt catgattttc caaaatttaa + 23101 agaaaaaagc caccttattg tagccaatcg ttttgatgaa acattaatgg atgtaaagga + 23161 taaagtatat acaagggatt tgtttggaag agattaaggg agataggttt tgaacaagtt + 23221 ctattctcaa aaaatcacac cgttactatc ttcgaataaa ttaaaagcaa agcaagtgat + 23281 tgatagaaaa tcggctcttt gtcaactgta gtgggttgaa gaaaagctaa gctcgagaaa + 23341 ggacaaattt cgtcctttct tttttgatgt tcaaagtgat aacaatccgt tttttgaagt + 23401 tttcaaagtt tcgaaaacca aaggcattgc gcttgataag tttgatgaga ttattggtcg + 23461 cttccagttt ggcattagaa tagtgtagtt gaagggcgtt gacaatcttt tctttatctt + 23521 tgaggaaggt tttaaagaca gtctgaaaaa taggatgaac ctgcttaaga ttgtcctcaa + 23581 taagtccgaa aaatttctct ggttccttat tctggaagtg aaaaagcaag agttgataga + 23641 gctgatagtg gtgtttcaag tcttccgaat agctcaaaag cttgtttaaa atctctttat + 23701 tggttaagtg catacgaaaa gtaggacgat aaaatcgctt atcactcagt ttacggctat + 23761 cctgttgaat gagtttccag tagcgcttga tagccttgta 
ttcatgagac tttcgatcca + 23821 attgattcat gatttggaca cggatacgac tcatagcacg gctaagatgt tgtacaatgt + 23881 gaaagcgaag ctgtttagcc aagtcatagt aagggctaaa catatccata gtaatgattt + 23941 tgacgcgaca tcggacggct ctatcatatt taagaaagtg atctcggatg acagcttgtg + 24001 ttctaccctc aagaacagtg atgatatcga gcttttcaaa atcttgcgca ataaagctca + 24061 tctccatctc ccgattgaaa cagtcactcc ccggactgtt ttaacgtccc aggacataat + 24121 ctcaggaaga caagaaaaat catgtttaaa gtgaaaatca ttgagctttc gaatgacagt + 24181 tgaagttgaa atggccagct gatgggcaat atcggtcata gaattctttt caattaactt + 24241 ttgagcaatc ttttggttga tgatacgagg gatttggtga ttcttcttga ctatagaagt + 24301 ttcagcgacc atcatttttg aacagtgata gcacttgaat cgacgctttc taaggagaat + 24361 tctagtaggc ataccagtcg tttcaagata aggaatttta gaaggttttt gaaagtcata + 24421 tttcttcaat tggtttccgc actcagggca agatggggcg tcgtagtcca gtttggcgat + 24481 gatttccttg tgtgtatcct tattgatgat gtctaaaatc tggatattag tgtctttaat + 24541 gtctagtaat tttgtgataa aatgtaattg ttccatatga ttctttctaa tgagttgttt + 24601 tgtcgctttt cattataggt catatgggac tttttttcta caacaaaata ggctccataa + 24661 tatccatagg ggatttaccc actacaaata ttatagagcc agaaaatcac ctgctttttg + 24721 tatcaatgtt tttttcacaa aatctaaaat ataatggatt gaatttggaa tagaacacta + 24781 tggtttctaa agcattgtta gaaattatag tcaattgaaa caagagcagg acaaaagagc + 24841 ctcgtaaaag gtattgcaac ttggtaatac ctttttgatg tacgacgggc atgtcgtgca + 24901 tctgaggtgt aagtcctcgg tgggcacctg ctaccggtga acccaatagc gatttccaag + 24961 cctgactatc gtgaggtagc agggagagga agggatagcg aaatcgtggc tctacgaaca + 25021 ggaacgtgat agtaaggcgt atatagcgga taagggggcc tcaaactcta aagtccaaaa + 25081 aggtagtcgt aacctatatg cgtaaatcac gagagtaatt gaattcggac taaggtttgt + 25141 gtgaaaaaga taaatctttc tagagtctaa agactctgcg tcagatttcc tattttcact + 25201 gtaacctttt aacgtcctca tatcttgtat aaacgaggaa agatgtacga cttatcccgt + 25261 gaggtttcat gagcgctgaa agcgtagtaa caacgaatca tgagaagtca gccgagccca + 25321 tagtagtgag gaaacttccg taatggaagt ggagcgaagg ggtgaacaac taatcgaagt + 25381 aatcctactt cacttgtgtc tgtaaaatga gtggtctgat 
agaactggac tttgacacgt + 25441 aatgactaga tgaaggttca ccaatataag atgtccctca ggcaccaaaa caagaaagga + 25501 ataggcacat gtcaaaattg ctagataaaa tattatcacg cgaaaatatg ctggaagcct + 25561 acaatcaagt aaaatccgat aaaggctcag ctgggattga tggaatgact atcgaagaga + 25621 tggataatta tctcagacaa aactggcgct tgactaagga actgataaaa cagagaaaat + 25681 ataagcctca accagttctt agagttgaga tacctaaacc aggcggaggt atccgtcaac + 25741 taggaattcc aacagttatg gatagaatga ttcaacagac cattgtccaa gtcatgagcc + 25801 ccatttgtga accccatttc tcagatacga gttatggttt cagaccaaat aggtcatgtg + 25861 aaaaagccat catgaagctc ttagaatact taaatgacgg ctatgagtgg atagtggata + 25921 tagacctaga gaaatttttc gatacagttc ctcaagatag attgatgtcc ttagtacata + 25981 acattatcga agacggagat acggaatcct tgattcgtaa gtatcttcat tcaggtgtta + 26041 tcattaatgg tcaactttat aaaacactag ttggtacacc acagggagga aatttatctc + 26101 ctctcttatc caatatcatg cttaatgaat tggacaagga attagaaaag aggggacttc + 26161 gatttgtgcg ctacgcagat gattgtgtga ttacggtcgg aagcgaggca gcctctaagc + 26221 gtgtgatgta ttcagtcagt cgttttattg agaaacggct aggtttgaaa gtaaacatga + 26281 ccaagactaa gattaccaga ccaagagagt tgaaatatct aggttttggg ttctggaaat + 26341 catcagatgg ttggaaaagc cgtccacatc aagatagtgt tcggagattt aagtttaaat + 26401 tgaagaaact aacacagagg aaatggagta tagacctaac aagacgtatt gagcaactga + 26461 atttgtctat tcgaggatgg ataaactatt tctcattggg aaatatgaaa agtatagtcg + 26521 ccagcataga tgagcgcttg cgtactcgcc tacgagtgat tatctggaag caatggaaga + 26581 agaaatcgag acgattatgg ggattgctta agttaggggt tcctaaatgg atagcagata + 26641 aggtatctgg ctggggcgac cattatcaat tagtagctca gaagtcggta cttaaacgtg + 26701 ctatatcaaa accagtcctg gaaaaacgtg gactggtttc gtgtttggat tattaccttg + 26761 aacgacatgc gttaaaagtt agttgaaccg ccgtatgccg aacggcacgt acggtggtgt + 26821 gagaggggct agagattatc ccctactcta tgtgcttttt gatatgagcc catgttttct + 26881 caataggatt gtactcaggt gagtagggag gaagaggtaa aagtttatgc ccaaactctt + 26941 tgcataaaag ttctagcttc cccattctat ggaatcttgc attatccata ataataaccg + 27001 atggtgtggt taatgttggt aagagaaact tctgaaacca 
agcttcaaaa aagtcgctcg + 27061 tcatcatctc ttcgtaagtc attggagcga ttaactcacc atttgttaga cctgcaacca + 27121 aagaaatcct ctgatatctt cttccagata ctttgcctct tcttaactga ccttttaatg + 27181 agcgaccata ttctcgataa aaataagtat cgaatcctgt ttcatcaatc taaacaggtg + 27241 ataggtgctt taaactatta aaattcttaa gaaataaggc tactttttct gggtcttgtt + 27301 catagtaggt gtggttcttt ttttcgagtg tagtccatag ctttgagcgc atagtggatg + 27361 gtagttggat gacagccaaa ttcagaagct atttcagtca aataagcgtc tggattgtca + 27421 gtaagatagt ttttaagtct atctctatca acttttcttg gttttgttcc ttttacttgg + 27481 tggtttagct ctcctgtttt ctcttttagc tttaaccagc cataaatagt attacgtgag + 27541 atttggaaaa cgtgtgatgc ttctgttata ctacctgttc gctcacaata agagagaact + 27601 tttttacgaa aatctattga atatgccata agaagattat accacattgt gtactatttt + 27661 tggttcattt tactataatt taaaattccc tcatcgattt gttcacattc tattgcaatc + 27721 aactgtaaat atgcttttca gaatatatca aatataacaa atataacaaa taactaaaag + 27781 ttctataata gactccctgc gaaacaaaat atggtatagt agttctatga atgatgaagc + 27841 aagtaaacaa ctaaccgatg cacgatttaa gcgtcttgtt ggtgttcagc gtaccacttt + 27901 tgaagagatg ttagctgtat taaaaacagc ttatcaactt aaacacgcaa aaggtggacg + 27961 aaaacctaaa ttaagcctag aagaccttct tatggccact cctcactatg tgcgagaata + 28021 tcgaacttat gaagaaattg cggctgattt tggtatccac gaaagcaact tactccgtcg + 28081 gagccaatgg gttgaagtaa ctcttgttca aagtggtttt acgatttcaa gaactcctct + 28141 cagttctgag gacacggtaa tgattgatgc gacgaaagta aaaatcaatc gccctaaaaa + 28201 aagaattagc gaattattct ggtaaaaaga aatgccacgc tatgaagtct caggcgattg + 28261 tcacaagtca agggagaatt gtttctttgg atatcactgt gaactattgt catgatatga + 28321 agttgttcaa aatgagttgc agaaatatcg gacaagctgg taaaatcttg gccgacagtg + 28381 gttatcaagg gctcatgaag atatatcctc aagcacaaac tccacgtaaa tccagcaaac + 28441 tcaagccgct aacagctgaa gataaagcct gtaaccatgc gctatctaag gagagaagca + 28501 aggttgagaa catctttgcc aaagcatagt atattgaaac tagaatagta cacctctact + 28561 tctaaaacat tgttagaaat cgatttgact gccctgatcg attcgtccta ttcttgtttc + 28621 attttgatat aaaaacgttt aaaatgtttt caacaaccta 
tcgaaatcat cgtaaacgct + 28681 tcggattacg aatgaatttg attgctgcta ttatcaatca tgaactagga ttctagtttt + 28741 gcaggaagtt taatgaagtt agccacccag ccctcctaaa aattagatgg ttcaactagc + 28801 tgaaagctct tgtaggcata agaaaacacc tctgtgttat acttgttgtt caaccacaaa + 28861 cacaagaaag gcacagaaat gcaagacaat tatactacaa aaggtaaaca tttgacaatc + 28921 gatagccgtc gcttaatcga aagatggaaa aaagaaggaa aatcaaatag agaaattgcc + 28981 tctctacttg gaaaagctcc tcaaactatc cacactgaaa tcaagcgtag gacagtccga + 29041 aaatgtcttg gaaaagggcg cttcaaagag gtttattctg ccgactatgc tcaacagtct + 29101 tatgaaaata atcgcaagca ctcggtcaag agatcaagcg tgaccaagga actaaaggaa + 29161 aagattctcc actatcataa ccaaaaattt ttgcctgaaa tgatggttat ggctaaaggg + 29221 gttaacgtgg gaatttcaac catttactat tggattcatc atggaaaatt ggggttaagc + 29281 aagcaggatc tgctttaccc tagaaaagga aaagcgctta agaaacaggc tagcaccaac + 29341 tttaaacctg ctggtcaatc catcgaacag cggcctgaag ctatcaatct tcgcttggag + 29401 aatgggcatt atgagattga tacggttcta cttacgagat cgaaaaacta ctgcttgctt + 29461 gtcttgacgg atcgaaagag tagacatcag atcatccgat tgattccaaa taaaagtgct + 29521 gaggtggtca atcaggctct aaaactcatc ttaaaacaac acaagattct ttccatcacg + 29581 gcagataatg gaacggaatt caatcgcttg tttgatatat tttctgagga gcacatctat + 29641 tatgcgcacc cctatgcctc ttgggaaagg ggaactaatg agaatcacaa caggctcatt + 29701 cgtagatagt tacctaaggg aaccaagaaa atgactccca aagaagtcgc attcatcgaa + 29761 aagtggatta acaactatcc taaaaaatgc ttggactaca agtcacccag agaagacttc + 29821 tggatggcta acttgaactt gaaatttagc tataacaaat aactcttaaa attctgaaaa + 29881 ttctgttgac aactttctga aaagagtcta taatggagag aaagttttaa aggagaaaat + 29941 gatgaaaagt tcaaaactat ttgcccttgc tggcgtgaca ttattggcgg cgactacttt + 30001 agctgcatgc tctggatcag gttcaagcgc taaaggtgag aagacattct catacattta + 30061 tgagacagac cctgataacc tcaactattt gacaactgct aaggctgcaa cagcaaatat + 30121 taccagtaac gtggttgatg gtttgctaga aaatgatcgc tacgggaact ttgtgccgtc + 30181 tatggctgag gattggtctg tatccaagga tggattgact tacacttata ctatccgtaa + 30241 ggatgcaaaa tggtatactt ctgaagggga agaatacgcg 
gcagtcaaag ctcaagac +// + diff --git a/public/res/serotype_genbank/serotype_39.gb b/public/res/serotype_genbank/serotype_39.gb new file mode 100644 index 0000000..95dbd99 --- /dev/null +++ b/public/res/serotype_genbank/serotype_39.gb @@ -0,0 +1,818 @@ +LOCUS CR931711 17810 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 203/40 (serotype 39). +ACCESSION CR931711 +VERSION CR931711.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 17810) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 17810) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..17810 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="203/40" + /db_xref="taxon:1313" + gene <1..163 + /gene="dexB" + /locus_tag="SPC39_0001" + CDS <1..163 + /gene="dexB" + /locus_tag="SPC39_0001" + /codon_start=2 + /transl_table=11 + /protein_id="CAI34422.1" + /db_xref="GOA:Q4K2R1" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K2R1" + /translation="DRRFLVVANLSNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVP + WDAFCVELL" + gene 323..491 + /gene="aliB" + /locus_tag="SPC39_0002" + /pseudo + CDS 323..491 + /gene="aliB" + /locus_tag="SPC39_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(492..1010) + /gene="tnp" + /locus_tag="SPC39_0003" + /pseudo + CDS complement(492..1010) + /gene="tnp" + /locus_tag="SPC39_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase (fragment)" + gene 1232..2677 + /gene="wzg" + /locus_tag="SPC39_0004" + CDS 1232..2677 + /gene="wzg" + /locus_tag="SPC39_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI34425.1" + /db_xref="GOA:Q4JZ38" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4JZ38" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGIDINYYVRLNFTSFLKLIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGTYKVNSQDLKGTDRMDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1232..1348 + /gene="wzg" + 
/locus_tag="SPC39_0004" + /note="Signal peptide predicted for SPC1795 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 39 and 40" + misc_feature 1436..1783 + /gene="wzg" + /locus_tag="SPC39_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 2.3e-64" + misc_feature 1961..2404 + /gene="wzg" + /locus_tag="SPC39_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 6.6e-70" + gene 2679..3410 + /gene="wzh" + /locus_tag="SPC39_0005" + CDS 2679..3410 + /gene="wzh" + /locus_tag="SPC39_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34426.1" + /db_xref="GOA:Q4JZ37" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4JZ37" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTLDALEKLEKKEIPTLNDS + RYALIEFSMHTSYRQIHTGLSNILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QINSYHVLKSKLFGERYKFMKKRARYFLERDLVHVVASDMHNLNKRPPYIKEAYELIS + KQYGERRARELFIENPRLILSDQII" + misc_feature 2682..3290 + /gene="wzh" + /locus_tag="SPC39_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 2.7e-37" + gene 3419..4111 + /gene="wzd" + /locus_tag="SPC39_0006" + CDS 3419..4111 + /gene="wzd" + /locus_tag="SPC39_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34427.1" + /db_xref="GOA:Q4JYU0" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4JYU0" + /translation="MKENKEITIDVFQLFKVLWKKKTSIILTAIVAAVLAFAVSSFVL + TPEYSSTTRIYVVNRNQSEKAGLTNQDLQAGTYLVKDYKEIILSQDVLEKVISNLKLE + KTVKELSKKIQVTVPVDTRIVSITVKNAQPEEASRIANALREVAAEKIISVTRVSDVT + TLEEARAALSPSSPNIRRNTLLAFLAGGAVMVVSVLLLELLDDRVKRPEDVEEVMQIA + LLGVVLDLNKLK" + misc_feature 
3419..3565 + /gene="wzd" + /locus_tag="SPC39_0006" + /note="Signal peptide predicted for SPC1797 by SignalP 2.0 + HMM (Signal peptide probability 0.987) with cleavage site + probability 0.704 between residues 49 and 50" + misc_feature 3437..3853 + /gene="wzd" + /locus_tag="SPC39_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 6.4e-48" + gene 4122..4823 + /gene="wze" + /locus_tag="SPC39_0007" + CDS 4122..4823 + /gene="wze" + /locus_tag="SPC39_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34428.1" + /db_xref="GOA:Q4JZ35" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4JZ35" + /translation="MPTLAIEQKRLDFAKKAEENYNALRTNIQLSGDNLRVLSISSVK + PGEGKSTTSINIAWAFARAGYKALLVDADIRNSIMSGVFKSREKITGLTDFLAGTTDL + SHGLCDTNIENLFVIQAGPVSPNPTALLQSENFATMIDTMRKYFDYVIVDTAPIGMVI + DAAIITQKCDASILVTAARETKRRDILKAKEQLEQTGVPFLGVVLNKFNTEVEKYGAY + GGYGAYSLYGNYRKE" + gene 4832..5473 + /gene="wcjH" + /locus_tag="SPC39_0008" + CDS 4832..5473 + /gene="wcjH" + /locus_tag="SPC39_0008" + /note="member of homology group 61" + /codon_start=1 + /transl_table=11 + /product="putative initial sugar transferase" + /protein_id="CAI34429.1" + /db_xref="GOA:Q4JZ34" + /db_xref="InterPro:IPR003362" + /db_xref="UniProtKB/TrEMBL:Q4JZ34" + /translation="MIKIYFVFKNILDRFLAFFLFITLIIIPIIPITILAIWIEDPGD + VFYLQDRVGLNGKKFKVIKFRSMYKDADQRIKESINSGKTDRLNFKEHSQSMTTKVGK + VIRKLSIDELPQLLNIIKGDMSIVGPRPLQQFEITHHILTYQEMGIDLKMSKRLSVKP + GLLCYWQVTPNKNDMPFADRMDLDLLYIDNVSFKTDFLLILKGFFTVLMGNNS" + misc_feature 4832..4939 + /gene="wcjH" + /locus_tag="SPC39_0008" + /note="Signal peptide predicted for SPC1799 by SignalP 2.0 + HMM (Signal peptide probability 0.806) with cleavage site + probability 0.797 between residues 36 and 37" + misc_feature 4856..5464 + /gene="wcjH" + /locus_tag="SPC39_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + 
transferase, score 1.2e-25" + gene 5475..6266 + /gene="wciB" + /locus_tag="SPC39_0009" + CDS 5475..6266 + /gene="wciB" + /locus_tag="SPC39_0009" + /note="member of homology group 16" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34430.1" + /db_xref="GOA:Q4JZ33" + /db_xref="UniProtKB/TrEMBL:Q4JZ33" + /translation="MKNIKILVATHKKYKMPSDTNMYLPIHVGCEGKKKLGFQGDNSG + ENISVLNPYYCELTGLYWAWKNLECDYLGLVHYRRYFTKMTKGYNESINIDDVILNRF + EVEKLLENSEVIVPKKRKYYIETLYSHYAHTLDASHLDLARKMIEQKNPEYLASFDKV + MKQRSGYMFNMFIMKKELADDYFSWLFPILDSMYESMDLSGLTDFEARLFGRVSELLF + NVWLDKNNLNIKEVPFMYMEKIDLFKKGKSFLMAKFLGKKYGQSF" + gene 6318..7154 + /gene="whaI" + /locus_tag="SPC39_0010" + CDS 6318..7154 + /gene="whaI" + /locus_tag="SPC39_0010" + /note="member of homology group 149" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="CAI34431.1" + /db_xref="GOA:Q4JZ32" + /db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4JZ32" + /translation="MKSEIEIIQSKIIELLKLFIDICENNDLTYYALGGTLLGAVRHK + GFIPWDDDIDLGMPREDYERFKQIATEQINGKYQFLSEDTPGYRKAFSVIRDTSTRIV + MNYSNVEQEESLWIDIFPIDGLPSKGIKKKIHEKRYLYRRMMVQLSQFNNIVNQNKTD + RPWHEKLIIKIANHLKIENILSFEKQQYKYLKTIKKYSVMEGYAGNFTGAYKLCELVP + SCYFGEPVKLDFEGIKLNCPNKYKDYLKAIYGENYITPPPIEHRVPHQYRVISLGENI + GE" + misc_feature 6384..7067 + /gene="whaI" + /locus_tag="SPC39_0010" + /note="HMMPfam hit to PF04991, LICD Protein Family, score + 2.6e-49" + gene order(7248..7793,7866..8048) + /gene="wciE" + /locus_tag="SPC39_0011" + /pseudo + CDS join(7248..7793,7866..8048) + /gene="wciE" + /locus_tag="SPC39_0011" + /note="member of homology group 44" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + misc_feature join(7254..7793,7866..8045) + /gene="wciE" + /locus_tag="SPC39_0011" + /note="HMMPfam hit to PF05704, Capsular polysaccharide + synthesis protein, score 6.7e-22" + /pseudo + gene 8126..9217 + /gene="wcrC" + /locus_tag="SPC39_0012" + CDS 
8126..9217 + /gene="wcrC" + /locus_tag="SPC39_0012" + /note="member of homology group 24" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34433.1" + /db_xref="GOA:Q4JZ31" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4JZ31" + /translation="MKKIALVKWIIDGTDGGLKVSTDLANELSKVYEVHLISVISTEE + IFFPLNNAVRYKNLSSQKISMSKNFVKAVKLLRTYIKKNNIEVLFGIGMTMNIVGITS + TIGLKTKFISCDHTNSIVDIDTTMKKLQRYVGAKLSDKIITLTTADRNNYIKKYKINP + KRVDYIYNWMNSIDAEKKYTLDSKKLITVGRFHKQKGYDYLSKVAIKILSIYPEWQWD + IYGSGDEQIKQDLITELDKGGVLSQVHFKGNVKGTDNIYPDHTIYVMTSRYEGLPLVL + LEAKQYGLPIVSFNCPTGPAEIVLDGENGYLIENFDINQMSQKIIELIENNELRLGFS + QNAMLDTDKFNKKNITKQWIELIEKMTGE" + misc_feature 8633..9145 + /gene="wcrC" + /locus_tag="SPC39_0012" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 3.9e-34" + gene 9219..10226 + /gene="wcrD" + /locus_tag="SPC39_0013" + CDS 9219..10226 + /gene="wcrD" + /locus_tag="SPC39_0013" + /note="member of homology group 32" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34434.1" + /db_xref="GOA:Q4JZ30" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JZ30" + /translation="MYDKLVTIIVPMYNIEQYITKCIESFKQVDKKYYADFEVIVVND + GSTDNSLQVVEDLITNSSCLNIRVVNKENGGHGSTINVGIKESKGKFFKVIDGDDWID + VPSFEKLLEELKGIDVDMVITNYTEQHIYNQTEKEIGFSEILDCNKIYEGIPFKRIPM + HALTYKTSILKESRINISEKTFYVDMEYTLLPLQYVKSYVYIDLNVYQYFLGRKDQSM + NLNVMKQKADHHNRVTKKILDYYEVIRFDKNLEPVVRDVLTYLINKQCQLFIMNKNIE + EASRLFSYAHKCHYRWKYDYSKKIVSLIYINSRFKNIFNLILKPLINKQQKEWSEMDE + Y" + misc_feature 9237..9740 + /gene="wcrD" + /locus_tag="SPC39_0013" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 3.7e-31" + gene 10216..11178 + /gene="wciF" + /locus_tag="SPC39_0014" + CDS 10216..11178 + /gene="wciF" + /locus_tag="SPC39_0014" + /note="member of homology group 25" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34435.1" + /db_xref="GOA:Q4JZ29" + 
/db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JZ29" + /translation="MNISVVIPVYNVEDYLHYAIDSLVNQTHKNFEVLLINDGSTDNS + GNLCDKYAQEYDWIRVFHKENGGLSDARNYGVLRATNEWIFFLDPDDYIEYFTFELLS + LIQEKYQADLISTKVQTTNEYEKFSKEQFNLESSKIVTKEEALELMLEDKVATVSACA + KLYKKQILEMRPFPVGKIYEDFFVVAEHLRLAEQIVISPVITYHYYRRPGSIVQSQFT + DKRFDFFDAGEYNRSQIKQFYDGNSVEKALNLKIVQGSFSISEAAALTDTKALRNIVK + KISSLYWSIIFNSKVSIKFKFKYNWFLLTPNLYCRIKKLLKRSI" + misc_feature 10225..10728 + /gene="wciF" + /locus_tag="SPC39_0014" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 6e-36" + gene 11178..12455 + /gene="wzy" + /locus_tag="SPC39_0015" + CDS 11178..12455 + /gene="wzy" + /locus_tag="SPC39_0015" + /note="member of homology group 67" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI34436.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ28" + /translation="MFLVFLLFFGVFLLFPIITTPVLLLPIVYRFRYSRYYLMLFVIG + ISLIALRYIPYFTDDGAYHYKAAYLFQFYDNVFDWFGNLMSKNIPTEEYGYYNYPLFA + LLLYIFSKTGTYSLVSFTVILIVYFLYTKIIYEIYREYNISKFLFLLALLTMVAIVNV + RFTTSGMRYHLAGAIIVFLFYKEIKNGFELNKTLFYYLIPILIHSSAVIFVATRLIFP + WFKDASFFKKIIILFSLPIFTLLSPLLQTLNVEYLSFLLEKFNAYQKTEIFIKLYSTS + DLINVYLGVLISLLYIFLYHTTFRFQKNLNMKLFLSFVLYICLLTLSVLPFLTILDRF + VWFVYPLVAISMILHIGYNKTHIERVQYIRNNYLPFFIVLTLCFIGGVIGNRRFLDFL + RLVDFNTMEILTKNVFDYFSDLHHFSLSEVLRR" + misc_feature 11178..11267 + /gene="wzy" + /locus_tag="SPC39_0015" + /note="Signal peptide predicted for SPC1806 by SignalP 2.0 + HMM (Signal peptide probability 0.657) with cleavage site + probability 0.472 between residues 30 and 31" + gene 12485..13426 + /gene="wcrG" + /locus_tag="SPC39_0016" + CDS 12485..13426 + /gene="wcrG" + /locus_tag="SPC39_0016" + /note="member of homology group 102" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34437.1" + /db_xref="GOA:Q4JZ27" + /db_xref="InterPro:IPR003406" + /db_xref="UniProtKB/TrEMBL:Q4JZ27" + /translation="MKQAYLIIAHNKIEQLKFLLSLLDYEKNDIFILFDKKATITEKQ 
+ KNELTQIVTKSGVFFTREIPIYWGDYSLVEAEIELFETANKQENYSMYHLLSGVDLPL + DTAENIYNFFDSRKGYNFLTMVSDELFIRNKVYERVAFKTMFPHLTVRTINNNFLRLI + LKIYRKFEVELQRIFKVDCFKKFNLELGYASNWCSLNKEAVDILLEEKQLIATIFKNT + KVSDELFIPTVLQKHQLLNTVYSIEPTNDKPTDFQGNLRYINWWDGSPYTWTDSSDDI + DQLKRGKVLGHKFSRKFDLERNPNLKEEILTIINRTD" + misc_feature 12491..13189 + /gene="wcrG" + /locus_tag="SPC39_0016" + /note="HMMPfam hit to PF02485, Core-2/I-Branching enzyme, + score 0.00047" + gene 13428..14852 + /gene="wzx" + /locus_tag="SPC39_0017" + CDS 13428..14852 + /gene="wzx" + /locus_tag="SPC39_0017" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI34438.1" + /db_xref="GOA:Q4JZ26" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4JZ26" + /translation="MKVLKNYAYNLSYQLLLIILPIITTPYVTRVFSAKDLGTYGYFN + SIVSYFILLATLGVASYGTKEISSNRKNIPKNFWGIYTLQFGATSLSILLYTLLCLGI + YIMRNPVAYILGMSLISKGLDISWLFQGLEDFRKIIVRNILVKLVGVISIFLLIKSAN + DLYLYVFLLTIFELLGQLSMWLPARKFIGKPHFDIDYTKYHLKPILLLFLPQIAISLY + ATLDRTMLGMISSTNDVGIYDQALKLINILLTVVTSLGSVMLPRVSNLLATGNHKAVN + KMHEMSFLIYNLIIFPIMAGMLIVNDDFVNFFLGKDFQDARYAIAIMIFRMFFIGWSN + IMGFQMLIVHNKNKEYMISTTVPAILSVALNLLFLPKLGYIGAAIVSVLTEAVVWGIQ + LFYTRSYLREVPILGSLFKIIVSSGFMYVNLLFVKHLLNVSPMINVGIYAVLGAMIYL + ILILIFRVINPNELKQQLLKNKGA" + misc_feature 13434..14228 + /gene="wzx" + /locus_tag="SPC39_0017" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 9.5e-65" + gene 14854..15954 + /gene="glf" + /locus_tag="SPC39_0018" + CDS 14854..15954 + /gene="glf" + /locus_tag="SPC39_0018" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI34439.1" + /db_xref="GOA:Q4JZ25" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR006076" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JZ25" + /translation="MYDYLVVGAGLSGAIFAYEATKRGKKVKVIDKRDHIGGNIYCEN + 
VEGVNVHKYGAHIFHTSNKKVWDYVNQFAEFNNYINSPVANYKGSLYNLPFNMNTFYA + MWGTKTPQEVKDKIAEQTAHMKDIEPKNLEEQAIKLIGPDVYEKLIKGYTEKQWGRSA + TELPPFIIKRLPVRLTFDNNYFNDRYQGIPIGGYNVIIENMLKDVEVELGVDFFTHRE + ELEASAEKVVFTGMIDQYFDYKHGELEYRSLRFDHEILDEENYQGNAVVNYTEREIPY + TRIIEHKHFEYGTQAKTVITREYPADWKRGDEPYYPINDERNNAMFAKYQEEAAQNDK + VIFCGRLADYKYYDMHVVIERALEVVLSELGK" + misc_feature 15289..15891 + /gene="glf" + /locus_tag="SPC39_0018" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 6e-136" + gene 16035..17093 + /gene="wcyO" + /locus_tag="SPC39_0019" + CDS 16035..17093 + /gene="wcyO" + /locus_tag="SPC39_0019" + /note="member of homology group 80" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI34440.1" + /db_xref="GOA:Q4JZF8" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q4JZF8" + /translation="MKKIKEYDILKIMAIILVVLSHSAYYKISSNYGGMDYQQYLNSH + SAFTLYKILGKFMEIIYYFHMPLFMAISGVFFSIQIKKDRWNKIEKLLTSKFKRLILP + FFVFTLLYSLPLKYISNYYNGVSFWRAITGQFLLLGNSHLWYLYALFIIFIISFYCLR + RDTSIFVYLSLYIIHVLSFLIHITLVSAPLQFLFWFSMGFLFESKRRKYNIFLENHKW + ISLLFFVLFIFLVVLNFLFKSDFKVLSRFFVDLLAILGSLICYNISYFLSNKTKILDS + KLLNLILINGLGIYIFSDTLNYFILSISYFVSDRFMFTSFGIIIIFLIRFVFTLFLGL + VFTLLFKKVFPKYSWLVN" + misc_feature 16044..17075 + /gene="wcyO" + /locus_tag="SPC39_0019" + /note="HMMPfam hit to PF01757, Acyltransferase family, + score 6.5e-06" + gene 17451..>17810 + /gene="aliA" + /locus_tag="SPC39_0020" + CDS 17451..>17810 + /gene="aliA" + /locus_tag="SPC39_0020" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34441.1" + /db_xref="GOA:Q4JZ60" + /db_xref="InterPro:IPR000914" + /db_xref="UniProtKB/TrEMBL:Q4JZ60" + /translation="MMKSSRLFALAGVTLLAATTLAACSGSGSSTKGEKTFSYIYETD + PDNLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKD + AKWYTSEGEEYAAVKAQD" + misc_feature 17451..17537 + /gene="aliA" + /locus_tag="SPC39_0020" + /note="Signal peptide predicted for SPC1811 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 
0.277 between residues 29 and 30" + misc_feature 17697..17765 + /gene="aliA" + /locus_tag="SPC39_0020" + /note="PS01040 Bacterial extracellular solute-binding + proteins, family 5 signature." +ORIGIN + 1 cgaccgtcgc ttcctagttg tggctaactt gtccaatgaa gagcaagact tgacagtaga + 61 aggaaaagtc aaatctgtct tgattgaaaa caccctagct caagaagtct ttgaaaaaca + 121 aatcttagtt ccatgggatg ctttctgtgt ggaattacta taaatatttt ttgcagaaaa + 181 atttaaaatt gaaatcgtat aaaaacaaag gagtgctgta taaaagacag aaatcctttg + 241 ttttttataa ctaaggttta taaactttca ttctcgaaat tcaattaact ttacaaattc + 301 ccactatcta aggagaaaga aaatgaacat aaagaagcgt gtccttagtg caggtctgac + 361 ttttgcatct gctttgcttt tagctgcttg cggccaatca ggttcagata caaaaactta + 421 ctcatcaacc tttagtggaa atccaactac atttaattac ctgttagact attacgctga + 481 taatatagtc aattgaaaca agagcaggac aaaagagcct cgtaaaaggt attgcaactt + 541 ggtaatacct ttttgaggtg ctttttgata tgagcccatg ttttctcaat aggattgtac + 601 tcaggcgagt agggaggaag atgtaaaagt ttatgcccaa actcctcgca taaaagttct + 661 aacttaccca ttctatggaa tcttgtatta tccataataa taaccgatgg tgtgtttaat + 721 gttggtaaga gaaatttctg aaactaagct tcaaaaaagt cgctcgtcat cgtctcttcg + 781 taagtcattg gagcgattaa ctcaccattt gttagacctg caaccaaaga aatcctctga + 841 tatcttcttc cagatacttt gcctcttatt aactgacctt ttaatgagcg accatattct + 901 cgataaaaat aagtatcaaa tcctgtttcg tcaatctaaa caggtgctag gtgctttaaa + 961 ctattaaaat tcttaagaaa taaggctact ttttctgggt cttgttcata attagattga + 1021 aactagaata gtagacctct gcttctaaaa cattgttaga aatcgatttg actgtcctga + 1081 tcgatttgtc atgttcttat ttcattttac tatatttttg tttcgcggga agtctactaa + 1141 gatacttaaa gatgcagata gtaaaaaaaa tgtagacatt accgtaaaaa agtgatataa + 1201 tcgtatgatg ttcaaggtat aggtgttaat catgagtaga cgttttaaaa aatcacgttc + 1261 acagaaagtg aagcgaagtg ttaatatcgt tttgctgact atttatttat tgttagtttg + 1321 ttttttattg ttcttaatct ttaagtacaa tatccttgct tttagatatc ttaacctagt + 1381 ggtaactgcg ttagtcctac tagttgcctt ggtagggcta ctcttgatta tctataaaaa + 1441 agctgaaaag tttactattt ttctgttggt gttctctatc cttgtcagct 
ctgtgtcgct + 1501 ctttgcagta cagcagtttg ttggactgac caatcgttta aatgcgactt cgaattactc + 1561 agaatattca atcagtgtcg ctgttttagc agatagtgag atcgaaaatg ttacgcaact + 1621 gacgagtgtg acagcaccga ctgggactga taatgaaaat attcaaaaac tattagctga + 1681 tatcaagtca agtcagaata ccgatttgac ggtcaaccag agttcgtctt acttggcagc + 1741 ttacaagagt ttgattgcag gggagactaa ggccattgtc ctaaatagtg tctttgaaaa + 1801 tatcatcgag tcagagtatc cagactacgc atcgaagata aagaagattt ataccaaggg + 1861 attcactaaa aaagtagaag ctcctaagac gtctaagaat cagtctttca atatctatgt + 1921 tagtggaatt gacacctatg gtcctattag ttcggtgtcg cgatcagatg tcaatatcct + 1981 gatgactgtc aatcgagata ccaagaaaat cctcttgacc acaacgccgc gtgatgccta + 2041 tgtaccaatc gcagatggtg gaaataatca aaaggataaa ttgactcatg ctggtatata + 2101 tggggttgat tcatccattc ataccctaga aaacctttat ggtatagata ttaattatta + 2161 tgttcgtttg aattttacct catttttgaa attgattgac ttattgggag gggtagatgt + 2221 tcataatgat caagagtttt cagctctaca tgggaagttc catttcccag tagggaatgt + 2281 ccatctagac tctgagcagg ctctaggttt tgtacgtgaa cgctactcac tagccgatgg + 2341 agaccgtgac cgtggtcgca accaacaaaa ggtgattgtg gctatccttc aaaaattaac + 2401 gtcaaccgaa gcactgaaaa attatagtac gatcattaat agcttgcaag attctatcca + 2461 aacaaatatg ccacttgaga ctatgataaa tttggtcaat gctcagttag aaagtggtgg + 2521 aacttacaaa gtgaattctc aagatttaaa agggacagat cggatggatc ttccttctta + 2581 tgcaatgcca gacagtaacc tctatgtgat ggaaatagat gatagtagtt tagctgtagt + 2641 taaagcagct atacaggatg tgatggaggg tagatgaaat gatagacatc cattcgcata + 2701 tcgtttttga tgtagatgac ggtcccaagt caagagagga aagcaaggct ctcttggcag + 2761 aatcctacag gcagggggtg cgaaccattg tctctacctc tcaccgtcgc aagggcatgt + 2821 ttgaaactcc agaagagaag atagcagaaa actttcttca ggttcgggaa attgcaaaag + 2881 aagtagcaga tgatttagtc attgcttatg gtgcagagat atactatact ctggatgcac + 2941 tagaaaagct agaaaaaaaa gaaattccta cccttaatga tagtcgttat gccttgattg + 3001 agtttagcat gcatacttcc tatcgtcaga ttcatacggg attgagcaat attttgatgt + 3061 tgggaattac tccagtcatt gcccacatcg agcgctatga tgctcttgaa aataatgaaa + 3121 aacgtgttcg 
tgaactgatt gatatggggt gctatactca gataaatagt tatcatgttt + 3181 taaaatctaa gctctttggt gaaagatata aatttatgaa aaagagagct cggtattttt + 3241 tggaacgtga tttagttcat gtagttgcaa gtgacatgca caatttgaac aaacgtcccc + 3301 cttatataaa agaagcctat gaacttatct caaaacaata cggtgaaaga agagcgagag + 3361 aattatttat tgaaaatcct cgcttaatct tatctgatca aattatttag gagttgacat + 3421 gaaagaaaat aaagaaatta cgattgacgt ttttcaattg tttaaagtcc tttggaagaa + 3481 gaaaacctct attatactaa ctgcgattgt agcagctgtc ctagcttttg ctgtaagtag + 3541 ttttgtactg acacctgagt attctagtac gacacgtatt tatgtggtca atcgaaatca + 3601 atcggaaaaa gcagggttga cgaaccagga tttgcaggct ggaacctatc tggtaaagga + 3661 ctataaggaa atcatcctct ctcaagatgt acttgagaaa gtcatttcaa atcttaaact + 3721 agagaaaaca gttaaggaat taagcaagaa gattcaggta acagtacctg tggatactcg + 3781 tatcgtatca attactgtaa aaaatgcaca accagaagaa gctagccgta tcgcaaatgc + 3841 tcttcgtgaa gtggctgctg aaaaaatcat ttctgtaact cgtgtatctg atgtgacaac + 3901 attggaagaa gccagggcag ccctaagtcc ttcatcacct aatattcgtc gtaataccct + 3961 gttagctttt ttagcgggag gagcagtgat ggtagtttca gtcttgttac ttgagttgtt + 4021 ggatgatcgt gttaaacgac cagaagatgt ggaagaagta atgcagattg cacttctagg + 4081 ggttgttcta gatttgaata agttaaaata agggagaaaa tatgccaaca ttagcaatag + 4141 aacaaaaacg tttagatttt gcgaaaaaag cagaagagaa ttacaatgct ttgcgaacaa + 4201 atattcaatt gagtggtgat aatctgagag ttctttccat ctcgtctgtt aaacctggtg + 4261 aggggaaatc gacaacatca ataaatattg cttgggcctt tgcgcgtgca ggctataaag + 4321 ctttattggt ggatgcggat attcgtaatt ctatcatgtc aggagtcttt aaatcaagag + 4381 aaaaaattac tgggctaacg gattttctgg caggtaccac tgacctttct catggacttt + 4441 gtgatacaaa tattgaaaat ttatttgtta ttcaggcagg acctgtatcc cctaacccaa + 4501 cagcactttt acagagtgaa aactttgcca ctatgattga tactatgcgt aagtattttg + 4561 attatgtcat tgtcgatact gcaccgattg ggatggtcat tgatgctgct attatcacac + 4621 aaaaatgtga tgcttctatt ttggtaacag cagcgaggga aacaaagcgt cgtgatattt + 4681 tgaaagcaaa ggaacagtta gaacagacag gagtaccttt tttaggagtt gttctaaata + 4741 aattcaatac agaagttgaa aaatatggag 
cttatggtgg ttatggagct tatagtttat + 4801 atggaaatta taggaaggaa tgacggagta attgataaaa atatattttg tttttaaaaa + 4861 tattttagat agatttttgg cgtttttcct atttattacc ttgataatca taccgattat + 4921 tcctataaca attttggcta tttggataga agatccagga gatgttttct atttacaaga + 4981 tagagttggt ttaaatggaa aaaaattcaa agtaataaag tttcggagca tgtataaaga + 5041 tgccgatcag agaataaagg aaagtattaa tagtggtaaa actgatcgtc taaattttaa + 5101 agaacattct caaagtatga ctacaaaagt cggtaaagtg atacgaaaac tttcaattga + 5161 tgaattacct caattattga atattataaa aggtgatatg tctatagtcg gacctcgtcc + 5221 attacaacag tttgaaatca ctcatcatat tcttacctat caagaaatgg gtattgattt + 5281 aaagatgtct aaaagattgt ctgtgaaacc tggtttgctt tgttattggc aagttacgcc + 5341 aaataaaaat gacatgcctt ttgctgacag aatggatctc gatttattat atattgataa + 5401 tgtatctttc aagactgatt tcttgcttat tttgaaggga ttttttacag ttttaatggg + 5461 taataatagt taacatgaag aatataaaaa tattagtagc gacacataaa aaatataaaa + 5521 tgcccagtga tacaaatatg tatctaccaa ttcatgtagg atgtgaagga aagaaaaaat + 5581 taggatttca aggtgataat tctggtgaaa atatttctgt tttaaatcct tactattgtg + 5641 aacttactgg cctctattgg gcatggaaaa atttagagtg cgactattta ggtttggtac + 5701 actatcgtcg ttattttact aaaatgacta aagggtacaa tgaatcaata aatattgatg + 5761 atgtaatttt aaataggttt gaagtggaga aattgttaga gaactcagaa gtcatcgttc + 5821 ctaaaaaaag aaagtactat atagaaaccc tctattctca ctatgctcat accttggatg + 5881 ctagccactt agacctagct agaaaaatga ttgaacagaa aaatcctgaa tatctagcaa + 5941 gttttgataa ggtaatgaag caaagaagcg gatacatgtt taacatgttc attatgaaaa + 6001 aagaactggc agacgattat ttttcttggc tatttcctat tttggatagt atgtatgaaa + 6061 gtatggattt atcagggtta actgattttg aagctagatt atttggaaga gttagtgaac + 6121 tactatttaa tgtgtggtta gataaaaaca atctaaatat taaggaagtt ccttttatgt + 6181 acatggaaaa gattgacttg tttaaaaaag ggaagtcatt tttaatggcg aaatttttgg + 6241 gaaagaaata tggacagagt ttctaataat tatatagact attttactag aaaagattga + 6301 gagaaattgg tcaataaatg aaatcagaga tagaaattat tcagagtaaa attatagagt + 6361 tgttaaaatt atttatagat atctgtgaaa ataatgacct gacatattat 
gccttgggtg + 6421 gaaccttgtt aggtgctgtg aggcataagg gctttatacc ttgggatgat gatatcgatt + 6481 tgggtatgcc aagagaggat tatgaacgat ttaaacaaat tgctactgaa caaattaatg + 6541 gtaagtatca gtttttgagt gaggatacac caggatatag aaaagcattt tctgtgattc + 6601 gagatacttc aacaagaata gtgatgaatt atagtaatgt cgaacaagaa gaaagtttgt + 6661 ggattgatat atttccaata gatggcttac ccagcaaagg tataaagaaa aaaattcatg + 6721 aaaaaaggta tttatataga cgaatgatgg ttcaattatc tcagtttaat aatattgtaa + 6781 atcagaataa aactgataga ccttggcatg aaaaattgat aataaaaata gccaatcatt + 6841 taaaaataga aaatattcta tcatttgaaa aacaacagta caaatattta aaaacgataa + 6901 agaaatattc agtgatggag ggttatgcag gtaattttac aggggcatat aaactttgtg + 6961 agttagtgcc aagttgttat tttggtgaac ctgttaaatt agattttgaa ggaataaaac + 7021 tgaactgtcc aaataaatat aaagattatc tcaaagcaat atatggtgag aattatataa + 7081 caccacctcc aattgaacac agagttcctc atcaatatag agtcataagt ttaggagaga + 7141 atataggtga gtaaaattag aaaagcgcaa gcatattatt tggatattaa aaataaaaaa + 7201 agtattttcc tccaaatgtt ttaaattggc aacttttagg aaaattcttg ggacaagtac + 7261 caaatgtgat aggtgaaaac caggcaagat ttttttgtga aaaacgtcac cagaaaacta + 7321 aaggattttt attacaatat tttaatgaat ttgtagaaaa ttataatttt actaaagata + 7381 atctagaaaa tagtaagatt gtttggacat tgtggtggca aggttatgat aacgctcctg + 7441 aaattgtaaa gtattgttta gataatatga aaaaattagc tcatgaaaat ggttttgagt + 7501 tttattgttt agatgaatcc tcctttgagc gctatgttaa aattcctgaa tatctaaaat + 7561 taaaaattaa aaaaggctat atttcaattg caaatatttc agatatgata cgtgtttgtc + 7621 ttcttttgca gtatggtggg acttggattg attcaactgt gtttattcat tcgtctttta + 7681 aatgggataa cttttctaaa tcttatttta caataaagac tggtgagatg acagattatt + 7741 ctccaaatgt ttccaagaat cgatggaaga catttttatt atcagggaat agttagttat + 7801 atgagtttac tcgtgatttt ttctttgaat attttaaaaa atttgattat gtcattgatt + 7861 atttattgat tgactatatt tttgatatag catttgatac aaatatcgag ataaaaaaac + 7921 aaatgttgga attggaatca acaaatccga atttgttttg gcttgaaagt catttttctg + 7981 aaaaatttga tagaaaatat gggaatatat ttcagaagaa acgaagattt ttaaaacgac + 8041 atataagtta 
gatacaaaaa taaaatgtga ttctgagaat tattactcag ccttaattaa + 8101 aagtaaattg aaatgatggt aaaaaatgaa gaaaatagct ttagttaagt ggattataga + 8161 cggtacagat ggtggcttga aagtttccac agatcttgct aatgaattat caaaagtgta + 8221 cgaggtacat ctaatttcag tcataagtac tgaagaaata ttttttccac taaataatgc + 8281 agttcgttat aaaaatttat cttcacaaaa gatatcaatg agtaagaact tcgttaaggc + 8341 ggtgaaatta ctaagaacat atataaaaaa aaataacata gaagttctat ttggaatagg + 8401 gatgactatg aatattgtag gcataacaag tacaattggt ttaaaaacta aatttatttc + 8461 ttgtgatcac actaattcta tcgtagatat agacactact atgaaaaaac ttcaaagata + 8521 tgtgggagct aaactttcag ataagataat tacactaact actgctgata gaaataatta + 8581 tataaaaaag tataagataa acccaaaaag agttgattac atttataatt ggatgaattc + 8641 tatagatgca gaaaaaaaat atactcttga ttcgaaaaaa ttaattactg taggtagatt + 8701 tcacaagcaa aaaggttatg actatttatc taaagttgct atcaagatat tatcaatata + 8761 tcctgaatgg caatgggata tatatggttc gggtgatgag caaataaaac aagatttgat + 8821 aactgaattg gataaaggtg gagttttatc acaagttcat tttaagggga atgtcaaagg + 8881 tacagataat atttatccag accatactat ttatgtaatg acttcccgtt atgaaggact + 8941 tcccttagta cttttagaag caaaacaata tggactacct attgtcagtt ttaattgtcc + 9001 tacaggtcca gcagaaattg tattggatgg agaaaatggt tatctaattg agaattttga + 9061 tataaatcaa atgagtcaaa aaataataga attaattgaa aataatgaat tgagattagg + 9121 attttcgcaa aatgcgatgt tagatactga taaattcaat aaaaagaaca ttactaaaca + 9181 atggattgaa ttgatagaaa aaatgacggg agaatgaaat gtacgataaa ttagtaacaa + 9241 tcatagtacc aatgtataat attgaacaat atattactaa gtgtatagaa tcatttaaac + 9301 aagtagataa aaaatattat gcggattttg aagtgattgt tgttaatgac ggtagtacgg + 9361 ataactcact tcaagttgtc gaagatttaa ttactaatag tagttgccta aatattagag + 9421 ttgttaataa agaaaatggt ggacatgggt caacgattaa tgttggtata aaagaatcta + 9481 aaggaaaatt ttttaaagtt atcgatgggg atgactggat tgatgtacca agttttgaaa + 9541 aattattaga agaacttaaa ggtatagatg tagatatggt tattacaaat tatactgaac + 9601 aacatatcta taatcagact gaaaaagaga ttggcttttc tgagatatta gattgtaata + 9661 aaatatatga gggaatacct ttcaaacgga 
ttcccatgca tgctctgaca tacaaaacat + 9721 ctatattgaa agaatctaga attaatataa gtgaaaagac cttttatgta gatatggaat + 9781 atactttgtt acctttgcaa tatgtaaaaa gttatgttta tattgattta aatgtttacc + 9841 agtatttctt aggtagaaaa gatcagagta tgaatttaaa tgtgatgaaa caaaaagcag + 9901 atcatcacaa tagagtaaca aaaaaaattc tcgattatta tgaagtaatt cgatttgata + 9961 agaacttaga accagtagtc agagacgtat tgacatactt aatcaacaag caatgtcagt + 10021 tgtttataat gaataagaat atcgaggaag cgagccgatt atttagttac gctcataaat + 10081 gtcattatag atggaaatat gattattcga aaaaaatagt ctcactaatt tatataaatt + 10141 ctagatttaa aaatatattt aatctcatct taaaaccgtt aatcaataag caacaaaaag + 10201 aatggagcga gatggatgaa tattagtgta gttattcctg tatataatgt tgaggattac + 10261 cttcattatg ctatagacag tttagtaaat caaactcata aaaattttga ggttttacta + 10321 atcaatgatg gttctactga taattcagga aatttatgtg ataaatatgc tcaagaatat + 10381 gattggatta gggtatttca taaagagaat ggtggcttat cagatgcgcg taattatggt + 10441 gtattaagag caactaatga gtggatattc tttttggatc cggatgatta tatagagtac + 10501 tttacatttg aattattgag tctaattcaa gagaaatatc aagctgattt gatttcaaca + 10561 aaagttcaaa ctacaaatga atatgaaaaa tttagcaagg aacaatttaa tttagaatct + 10621 agtaaaatag ttacaaaaga agaagcacta gaattaatgt tggaagataa agttgctacg + 10681 gtatctgcat gtgcaaaact ttataaaaaa caaattttag aaatgagacc atttcctgta + 10741 ggaaaaatct acgaagactt ttttgttgta gctgaacatt taagattagc tgaacaaata + 10801 gttatttcac ctgttattac gtatcattac tatcgtcgtc ctggtagtat cgtacaatct + 10861 cagtttacag ataagcgatt tgattttttt gatgcaggtg agtataacag aagtcaaata + 10921 aaacaatttt atgatggtaa tagcgtagaa aaggcgttaa atttaaaaat tgttcaaggt + 10981 tctttttcta tatctgaagc tgcagctctt acggacacaa aggctttaag aaatattgtt + 11041 aaaaaaataa gttcattata ctggagtata atctttaatt ctaaagtttc tataaaattt + 11101 aaatttaaat ataattggtt tttacttact cccaatttat actgccgtat aaaaaaattg + 11161 ttaaaaagga gtatataatg tttttagttt ttttactgtt ttttggtgta tttctattat + 11221 ttccaattat aactacacca gtcttattac tcccaatagt ttatagattt agatatagca + 11281 gatattattt aatgttattt gttataggta 
tttccttaat tgcgctaagg tatattccgt + 11341 attttactga tgatggagcc tatcattata aagcagctta tttatttcag ttttatgata + 11401 atgtttttga ttggtttggg aacttgatgt ctaaaaatat tccgacggaa gagtatggtt + 11461 attataatta tcccttattt gccttattgc tatatatatt cagtaagaca ggtacctatt + 11521 cactagttag ttttacagtc attctgattg tttatttctt atatactaaa ataatatatg + 11581 aaatctatcg ggaatataat atctcaaaat ttttattttt attagcttta ttaacaatgg + 11641 ttgcaatcgt aaatgttcgt tttacaacta gtggtatgag gtatcattta gcaggggcca + 11701 ttattgtttt cttattctat aaagaaataa agaatggatt tgaactaaat aaaactttat + 11761 tttattatct tattccaata ttaatccatt ctagtgcagt aatatttgta gcgactagat + 11821 taatatttcc atggtttaaa gatgcgagtt tttttaagaa aataattatt ctattttctt + 11881 taccaatttt tacgctctta tctccattgt tgcaaactct caatgttgaa tatttatcat + 11941 ttttattaga gaagtttaat gcttatcaaa aaacagaaat atttataaaa ttatatagta + 12001 catctgattt aataaatgta tatttaggtg ttcttatttc tttattatat atttttttat + 12061 accatacaac atttcgtttt cagaagaatc ttaatatgaa acttttttta tcttttgttt + 12121 tgtacatttg tttattaact ttatcagtac tcccattttt aacaatatta gatcgttttg + 12181 tttggtttgt ttatccttta gttgccattt cgatgatttt acatattggc tacaataaaa + 12241 cccatattga aagagtacaa tacattagaa ataattattt accatttttc attgtattaa + 12301 ccctatgctt tattggtgga gttatcggaa ataggagatt tttagatttt ttaagattgg + 12361 tagatttcaa tacaatggag atactcacta aaaatgtatt tgattatttt tctgatttgc + 12421 accatttctc tttgagtgaa gttttaagac gataaatata ttttataaac ataataggag + 12481 ttatatgaaa caagcttatt taatcatagc tcataataaa atagagcaat taaaattttt + 12541 actttcatta ttagattatg aaaaaaacga tattttcatt ttatttgata aaaaagcaac + 12601 aattactgaa aaacaaaaaa atgaactaac tcaaatagta acgaagtcag gcgtattctt + 12661 cacaagggaa ataccaattt attggggaga ttattcttta gttgaagcag aaatagaact + 12721 ttttgaaacc gcaaataaac aagaaaatta cagtatgtat catttgttat caggtgtaga + 12781 tttaccatta gatactgcag aaaatatata taactttttt gatagcagaa aaggatataa + 12841 ttttttaacg atggtttctg atgaattatt tattcgaaat aaagtctatg agcgtgtagc + 12901 gtttaaaaca atgtttcctc atttaacggt 
aagaactata aataataatt tcttaaggtt + 12961 gattttaaaa atttatagaa agtttgaagt tgaactgcaa agaatattta aagttgattg + 13021 ttttaaaaag tttaatttag aattgggata tgcttctaat tggtgttctc ttaataagga + 13081 ggcggtagat atactgctag aagaaaagca attgattgct accattttta aaaataccaa + 13141 agtaagtgac gaattattca ttcctacagt tttacagaaa catcagctat tgaataccgt + 13201 ttattcgata gaacctacaa atgataagcc tactgatttt caaggtaatc ttcgctatat + 13261 taattggtgg gatggaagtc catatacatg gactgattct tctgatgata ttgatcaatt + 13321 gaaaagaggt aaggttttag gccataagtt ttctagaaaa tttgatttag agagaaatcc + 13381 gaatctaaaa gaagaaattc taactatcat aaataggaca gattgatatg aaagtactaa + 13441 aaaattacgc gtataacctc tcttatcaat tattactcat tatacttccc atcattacaa + 13501 ctccctatgt gacacgggta ttttctgcaa aggatcttgg aacatatgga tactttaatt + 13561 ccattgttag ctattttatt ttgttagcta ctttgggggt cgctagctat gggactaagg + 13621 agatttcgag taatagaaaa aatatcccga agaatttctg ggggatatat actcttcaat + 13681 ttggtgcaac atcattatca attctcttat acactttatt atgtttagga atttacataa + 13741 tgagaaatcc tgttgcgtat atattaggaa tgagtttgat ttctaaagga ttagatatat + 13801 cctggctttt tcaggggttg gaagattttc gtaagattat agtcagaaac atattagtga + 13861 agctcgttgg tgtaatttca atatttttat tgataaaatc agcgaatgat ctttatcttt + 13921 atgtctttct cttaacgata tttgagttat tgggacaatt aagtatgtgg ttacctgctc + 13981 gaaagtttat tggaaaacca cattttgata tagattatac taaatatcat ttaaagccaa + 14041 ttcttttatt atttctccct cagattgcta tatcactata tgcaacttta gaccgtacga + 14101 tgttaggaat gatatcatct acaaatgatg tcgggatcta tgatcaagca ttaaaattga + 14161 tcaatatttt attaactgta gtaacttcgt taggaagtgt catgttgccg agagtatcta + 14221 atctcttggc gacagggaat cataaggcag ttaataaaat gcatgagatg tcatttctga + 14281 tctataattt gattattttt cctattatgg caggaatgct aattgtaaat gatgattttg + 14341 ttaacttttt cctcgggaaa gattttcaag acgcacgtta tgcgatagca attatgattt + 14401 ttagaatgtt ctttattggt tggagcaata ttatgggatt tcaaatgcta atcgtacata + 14461 ataagaataa agaatatatg atctcaacaa ctgtgcctgc aattcttagt gttgccttga + 14521 atttgttatt tcttcctaaa ctcggatata 
taggagcggc aattgtatct gttttaacag + 14581 aggcggtagt ttgggggata cagttattct atactcgttc ttatttgaga gaagttccta + 14641 ttctaggttc attgtttaaa attatagttt catcgggatt tatgtatgtc aatttattat + 14701 ttgtaaaaca tcttctgaac gtatcaccta tgataaatgt agggatttat gctgttctgg + 14761 gagcaatgat ttatctcata ttaattttga tttttagggt tataaatcca aatgagttaa + 14821 aacaacaatt attaaaaaat aaaggagctt aatatgtacg attatcttgt tgttggtgct + 14881 ggtttgtctg gagcaatttt tgcttatgaa gcaaccaagc gtggaaaaaa agtaaaagtt + 14941 attgataaac gtgaccacat tggtgggaat atctattgtg agaatgtaga aggtgttaat + 15001 gttcataaat atggtgcaca tatcttccat acttctaata aaaaagtctg ggattatgtt + 15061 aatcaatttg ctgaatttaa caactacatc aactcgcctg tagcaaatta caagggtagc + 15121 ctttataatc tgcctttcaa tatgaatact ttctatgcta tgtgggggac aaaaactcct + 15181 caagaggtca aagataagat tgctgagcaa acggctcaca tgaaggacat tgaacctaaa + 15241 aacttggaag aacaggctat caagttgatc ggtccagatg tctatgaaaa attaatcaag + 15301 ggttatactg aaaagcagtg gggacgctca gcaacggaac ttcctccatt tatcattaaa + 15361 cgtcttccag ttcgtttaac atttgataat aactatttta acgaccgtta ccaaggaatt + 15421 cctattggtg gttacaatgt catcatcgaa aatatgctta aagacgttga agttgagctt + 15481 ggtgttgatt tctttactca tcgtgaagag ttagaagcat cagctgaaaa agttgtcttc + 15541 acagggatga tcgaccagta ttttgactac aagcatggag agttagaata ccgtagcctt + 15601 cgctttgatc atgaaatttt ggacgaggaa aattatcaag gaaatgctgt agtgaactat + 15661 acggagcgtg agattcctta tactcgtatt attgagcata aacactttga gtatggtacg + 15721 caagctaaaa cggtcattac tcgtgaatac ccagctgatt ggaaacgcgg agatgaacct + 15781 tattatccaa tcaatgatga gagaaacaat gctatgtttg ctaaatatca agaagaagca + 15841 gcacagaatg ataaggtgat tttctgcgga cgtttggccg attataaata ctacgacatg + 15901 catgtggtca ttgaacgtgc cttagaagtc gtattaagtg agttaggaaa gtagtcaatt + 15961 acattaaggt caagtttaat gaccttatat cttttctata aagaaaaact acaattagag + 16021 gagcgagatt taatgtgaaa aagataaaag aatatgatat tttaaaaatt atggctatta + 16081 ttttagttgt gttaagtcat agtgcgtatt ataaaatatc gagcaattat ggtggaatgg + 16141 attatcaaca atatttaaat agtcattcag 
catttactct atataagata cttggtaaat + 16201 ttatggaaat tatctattat tttcatatgc cattatttat ggctatatcg ggtgtatttt + 16261 tctctattca aataaaaaaa gatcgatgga ataagattga gaaattatta actagtaagt + 16321 ttaaaagatt aatattgcca ttttttgttt ttactttatt atatagtttg ccattaaaat + 16381 atatatcaaa ctactacaat ggtgtttcat tttggagagc tataactggt caattcttgt + 16441 tattaggaaa ttctcactta tggtatttgt atgcattatt tattatcttt ataattagtt + 16501 tttattgttt aagaagagat acttctatat ttgtatactt gtccttatat attatacatg + 16561 tactgagttt cttgattcat ataacgttag taagtgcacc attgcagttt cttttttggt + 16621 tttccatggg atttttgttc gaatctaaaa gaaggaagta taatattttt ttggaaaatc + 16681 acaaatggat tagcctttta ttctttgtgt tatttatatt tttggtggtt ttaaattttc + 16741 tatttaaaag cgattttaaa gtattgagtc gattttttgt tgacttatta gctattttag + 16801 gatcacttat ttgttacaat atttcgtact ttttaagtaa taaaactaaa attttagata + 16861 gtaaactact taatctcatt ttgattaatg gtttagggat atatattttt tctgatactt + 16921 taaactattt tatattaagt atttcttatt ttgtaagtga tagatttatg tttacttcat + 16981 ttggtataat tattatattt ttaattagat ttgttttcac tttatttttg ggattagtct + 17041 ttacattgct atttaaaaaa gtatttccaa aatattcttg gctagttaac tagaaaatac + 17101 aatatcagtg attatgcact ataagctatc ctgtaattct tacagttaaa tattttatcc + 17161 tatatactga ggagacaaat aaaataactt atagtatttt gcaccttatc tagtttaatt + 17221 gtaatataaa agaaaatatc caggaagtgg tatagtactc tctcattgtt taacttcgct + 17281 taaatatata ggttaattcc ttgactatgt gatgtagttg agggattttt gataatattc + 17341 atattttttg caaagatgtt gtttgaaaaa taattttcaa aaattctgaa aattctgttg + 17401 acaactttct gaaaagagtc tataatggag agaaagtttt aaaggagaaa atgatgaaaa + 17461 gttcaagact atttgccctt gcgggcgtga cattattggc ggcgactact ttagctgcat + 17521 gctctggatc aggttcaagc actaaaggtg agaagacatt ctcatacatt tatgagacag + 17581 accctgataa cctcaactat ttgacaactg ctaaggctgc gacagcaaat attaccagta + 17641 acgtggttga tggtttgcta gaaaatgatc gctacgggaa ctttgtgccg tctatggctg + 17701 aggattggtc tgtatccaag gatggattga cttacactta tactatccgt aaggatgcaa + 17761 aatggtatac ttctgaaggt gaagaatacg 
cggcagtcaa agctcaagac +// + diff --git a/public/res/serotype_genbank/serotype_4.gb b/public/res/serotype_genbank/serotype_4.gb new file mode 100644 index 0000000..bcb595a --- /dev/null +++ b/public/res/serotype_genbank/serotype_4.gb @@ -0,0 +1,947 @@ +LOCUS CR931635 20936 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 600/62 (serotype 4). +ACCESSION CR931635 +VERSION CR931635.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 20936) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 20936) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..20936 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="600/62" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC04_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC04_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI32760.1" + /db_xref="GOA:Q4K1T1" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K1T1" + /translation="SNEEQDLTVEGKVKSVLIENTAAKEVLEKQVLAPWDAFCVELL" + gene 293..466 + /gene="aliB" + /locus_tag="SPC04_0002" + /pseudo + CDS 293..466 + /gene="aliB" + /locus_tag="SPC04_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + /db_xref="PSEUDO:CAI32761.1" + gene complement(order(459..995,997..1323)) + /gene="tnp" + /locus_tag="SPC04_0003" + /pseudo + CDS complement(join(459..995,997..1323)) + /gene="tnp" + /locus_tag="SPC04_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(join(933..995,997..1305)) + /gene="tnp" + /locus_tag="SPC04_0003" + /note="HMMPfam hit to PF01710, Transposase, score 1.9e-22" + /pseudo + gene 1558..3003 + /gene="wzg" + /locus_tag="SPC04_0004" + CDS 1558..3003 + /gene="wzg" + /locus_tag="SPC04_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI32763.1" + /db_xref="GOA:Q9AHD5" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q9AHD5" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTNNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKSQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGIDVYNDQ + 
EFTAHTNGKYYPAGNVHLDSEQALGFVRERYSLADGDRDRGRHQQKVIVAILQKLTST + EVLKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRMDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1558..1674 + /gene="wzg" + /locus_tag="SPC04_0004" + /note="Signal peptide predicted for SPC0077 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 39 and 40" + misc_feature 1762..2109 + /gene="wzg" + /locus_tag="SPC04_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 2.2e-63" + misc_feature 2287..2730 + /gene="wzg" + /locus_tag="SPC04_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 1.7e-69" + gene 3005..3736 + /gene="wzh" + /locus_tag="SPC04_0005" + CDS 3005..3736 + /gene="wzh" + /locus_tag="SPC04_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI32764.1" + /db_xref="GOA:Q4K337" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K337" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEQDLVHVIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 3008..3616 + /gene="wzh" + /locus_tag="SPC04_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 3e-37" + gene 3742..4437 + /gene="wzd" + /locus_tag="SPC04_0006" + CDS 3742..4437 + /gene="wzd" + /locus_tag="SPC04_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI32765.1" + /db_xref="GOA:Q9AHD3" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q9AHD3" + /translation="MMKEQNTIEIDVFQLVKSLWKRKLMILIVALVTGAGAFAYSTFI + 
VKPEYTSTTRIYVVNRNQGDKPGLTNQDLQAGTYLVKDYREIILSQDVLEEVVSDLKL + DLTPKGLANKIKVTVPVDTRIVSISVNDRVPEEASRIANSLREVAAQKIISITRVSDV + TTLEEARPAISPSSPNIKRNTLIGFLAGVIGTSVIVLHLELLDTRVKRPEDIENTLQM + TLLGVVPNLGKLK" + misc_feature 3763..4179 + /gene="wzd" + /locus_tag="SPC04_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 3.8e-56" + misc_feature 4285..4362 + /gene="wzd" + /locus_tag="SPC04_0006" + /note="PS00217 Sugar transport proteins signature 2." + gene 4447..5130 + /gene="wze" + /locus_tag="SPC04_0007" + CDS 4447..5130 + /gene="wze" + /locus_tag="SPC04_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI32766.1" + /db_xref="GOA:Q4K335" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K335" + /translation="MPTLEIAQKKLEFIKKAEEYYNALCTNIQLSGDKLKVISVTSVN + PGEGKTTTSINIAWSFARAGYKTLLIDGDTRNSVMLGVFKSREKITGLTEFLSGTADL + SHGLCDTNIENLFVVQSGSVSPNPTALLQSKNFNDMIETLRKYFDYIIIDTPPIGIVI + DAAIITQKCDASILVTATGEANKRDIQKAKQQLKQTGKLFLGVVLNKLDISVNKYGVY + GSYGNYGKK" + gene 5143..5253 + /gene="HG261" + /locus_tag="SPC04_0008" + /pseudo + CDS 5143..5253 + /gene="HG261" + /locus_tag="SPC04_0008" + /note="member of homology group 261" + /pseudo + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase) (fragment)" + gene 5471..6106 + /gene="wciI" + /locus_tag="SPC04_0009" + CDS 5471..6106 + /gene="wciI" + /locus_tag="SPC04_0009" + /note="member of homology group 29" + /codon_start=1 + /transl_table=11 + /product="putative initial sugar transferase" + /protein_id="CAI32768.1" + /db_xref="GOA:Q9AHD1" + /db_xref="InterPro:IPR003362" + /db_xref="UniProtKB/TrEMBL:Q9AHD1" + /translation="MKNGNRIYSWRLFMYGIIKRLGDILLSLIGIIILCPVFMIIAIA + IKLDSEGPVIFKQKRFGIHKEYFYILKFRSMKIDAPKNVAPRNLYNPEQWITKVGAFL + RKTSLDELPQLFNILVGNMSIVGPRPAGINELDLIAERDKYGANDILPGLTGWAQING + 
RDTLSVEMKTELDGYYVKHLSLIMDIRCIVKTIPYVLKRKGIVEGSGKKES" + misc_feature 5471..5602 + /gene="wciI" + /locus_tag="SPC04_0009" + /note="Signal peptide predicted for SPC0082 by SignalP 2.0 + HMM (Signal peptide probability 0.809) with cleavage site + probability 0.562 between residues 44 and 45" + misc_feature 5525..6079 + /gene="wciI" + /locus_tag="SPC04_0009" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 4.3e-37" + gene 6115..7344 + /gene="wciJ" + /locus_tag="SPC04_0010" + CDS 6115..7344 + /gene="wciJ" + /locus_tag="SPC04_0010" + /note="member of homology group 35" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI32769.1" + /db_xref="GOA:Q97SJ5" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q97SJ5" + /translation="MKILFVCQHYKPEPFRLSDICEDLVRKGHEVSVLAGIPNYPEGK + IYADYRHNKKRREIIEGVTIYRSYTIPRKKSVVFRLLNYFSFAISSTLGVLLGRYKTK + DGSNFDCVFVNQLSPVMMAWAGMAYKKKYKKPMFLYCMDVWPDSLTVGGVKQDGLIFK + LFKFISKKVYRASDYIFVTSPSFKNYFVKQFDISEQKITYLPQYAEDLFIPDESIVNK + ESVDLTFAGNIGKAQNLETILKAASLIEKNTNLPKKIHFHFVGDGTELLSMKALAHEL + ELKNISFYGRRSLEEMPSFYKKSDAMLVSLIGDSIVSRTIPGKVQSYMAAGKPIIGAI + SGDAKIIVEEANCGYVSPERDVKQLAKNICKFSMLSIKRQRELGKKARCYYENHFSKE + QFMLELETCLERESKKE" + misc_feature 6733..7266 + /gene="wciJ" + /locus_tag="SPC04_0010" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 2.1e-12" + gene 7349..8425 + /gene="wciK" + /locus_tag="SPC04_0011" + CDS 7349..8425 + /gene="wciK" + /locus_tag="SPC04_0011" + /note="member of homology group 212" + /codon_start=1 + /transl_table=11 + /product="putative sugar transferase wciK" + /protein_id="CAI32770.1" + /db_xref="GOA:Q4K332" + /db_xref="UniProtKB/TrEMBL:Q4K332" + /translation="MRVLFILSDNIYLTPYFNFYKELLKKLSISYDVIYWDKNINEII + TKQNYYRISFSGKGKLSKILGYVKFRKEIKKKLKENDYDMILPLHSIVSFILVDFLLF + SFKNRYIYDIRDYSYEKFLVYRLVQKQLVKNSLMNIVSSDGYKFFLPMGEYFTTHNLP + NMIELNEVKQLKNNSTFPIQLSYIGLIRFQEQNKKIIDFFANDSRFQLNFIGTNAGEL + 
REFCQEKNISNVNLVDTFQPKDTMSFYKNTDAVLNLYGNHTPLLDYALSNKLYFAALL + YKPILVCEDTYMEKVSIENGFGFVLPMKDESEKDCLALYIQNLDRKQLIKNCDNFMDR + ISLEKQKTEIELEKRILSLRKKND" + gene 8418..9536 + /gene="wciL" + /locus_tag="SPC04_0012" + CDS 8418..9536 + /gene="wciL" + /locus_tag="SPC04_0012" + /note="member of homology group 30" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI32771.1" + /db_xref="GOA:Q9AHC8" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q9AHC8" + /translation="MIKVLHLFTTLDSGGVESFLFNYYSHIDRKKIQFDFIVPGKEQG + FLEDKMKELGAKVYHVPLLRKKPLHQFLSLARIIKKGDYDIVHCHGYKSAIGLILSKI + IGCKIRIIHSHMAYVTENSFQKVLRKLVTILVKILATHWFACGEDSAKWLYGEKAYKD + GKIEIIFNAIDLKKYQFLSDVREKCRRELDVSNKFVLGNIARLSDQKNQSYLFNVLKE + LILIKPNVILLLVGNGEDEQKLKQKALELNLTPYVLFLGRRTDISDLLSAMDVFLLPS + KYEGLPVSLVEAQASGLQILSSDTVTQEVDVTKNISYLPINEESVLLWKDKVLSLTSE + ECNRFEINNSMTDGLYDICYQASKLLNRYQEMCVIKEI" + misc_feature 8961..9455 + /gene="wciL" + /locus_tag="SPC04_0012" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 2.6e-26" + gene 9537..10937 + /gene="wzy" + /locus_tag="SPC04_0013" + CDS 9537..10937 + /gene="wzy" + /locus_tag="SPC04_0013" + /note="member of homology group 213" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI32772.1" + /db_xref="UniProtKB/TrEMBL:Q9AHC7" + /translation="MQTKYICRVTLVTLSFIFAFCYLFWTLDNWNNGFLISNYVPSIF + IWVCFLIIFQITGFILQKVSIYDFSVWYLILSYFFMFGLIFNEYMGFQTTLLWSPSNF + YNNEELFHSYIFIIWILFCYSVGYLFFYSDGKVHYHSEVQNYQENEEKILYNAGRILT + GVGFISRVITDSKTVLAVRAANSYSAYSEAASSGIIDDLGVLMLPGVFSLFYSDKLSR + VIKRTIFWVMLFYLILIMILTGSRKIQVFSILALVLVYTQSLGITFSKKRVLVFLIVT + VFLLNVLVVIRGHRFDLNTIGIYLFDSFSSLDFVKNILGEVFSESGLTSLTVASAVTV + VPSSIPYEYGMTFLRTILSIFPIGWLVGDFFDKASATVVINKFLGLPVGSSFVEELFW + NFGYYGGVFWSFVLGIFSGWRLNFRAFQTSKISKVIYFSVISQLLLLVRSSSIDVYRP + IMYSLIMIFIFRRLKK" + gene 10937..12019 + /gene="wciM" + /locus_tag="SPC04_0014" + CDS 10937..12019 + /gene="wciM" + /locus_tag="SPC04_0014" + 
/note="member of homology group 214" + /codon_start=1 + /transl_table=11 + /product="putative pyruvyl transferase WciM" + /protein_id="CAI32773.1" + /db_xref="GOA:Q97SJ4" + /db_xref="InterPro:IPR007345" + /db_xref="UniProtKB/TrEMBL:Q97SJ4" + /translation="MVKKIMLHGATDYGSSNYGDYLYGEIVYDLLESKGYEVSFYNPS + DFFQMYLKEYRQKQSFTKKQADAILYIPGGYFGEGHNARFRDNLIQFKRFLPLGIWAS + YFKKPIGVLGIGAGPNNDSLMNYGIKRIINHAQFITVRDRESFDSLKHLSPSAPVHET + FDLIISSKLREEKTEQLCQLKREAKDKKIILVHYNHSKKALEKFAESISLFLENNPNY + YVVVTSDSILPYEDAYYQEFRKLVRTEDCFQFKYHSPAEMTSLLKMVDVVLTCKLHVG + VVATCFNKSVIAIACHPEKTARYYGAIGELQRCESLFDSSVNSIVKKLETFHLKPITI + PSELVLKARSSLDYLDLFLEGLVRES" + misc_feature 10952..11986 + /gene="wciM" + /locus_tag="SPC04_0014" + /note="HMMPfam hit to PF04230, Polysaccharide pyruvyl + transferase, score 5.9e-109" + gene 12009..13250 + /gene="wzx" + /locus_tag="SPC04_0015" + CDS 12009..13250 + /gene="wzx" + /locus_tag="SPC04_0015" + /note="member of homology group 215" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI32774.1" + /db_xref="GOA:Q97SJ3" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q97SJ3" + /translation="MKVDRISFIKNTSSLYILNIVKLLFPLLTLPYLTRVLSLDAYGM + VIYVKALIAYVQLVIDFGFMISATKNIVNACTTPSKIGRIVGDTLVEKIFLSIISILI + YTILMWQIPIMRENILFSVFYLLATVTNIFIFDFLFRGIEKMHAVAIPYIISKTIITI + LTFIVVKDDSSILWIPILEGIGNLVAAVVSYRFLHYYGIKLSFSYLSVWVKDLKESSI + YFLSNFATTIFGVFTTVISGFYLQSQEIAFWGIAMQLLSAAKSLYNPIANSLYPHMIR + TKDIQSVKSINRIMFIPIIFGVLIVLFFSNQILSIIGGEKYTVSADFLKYLLPAFVAS + FYSMIYGWPVLGAIDKVKETTMTTILASIVQTLGLGIFILSDNFSLVTLAICSSMSEV + VLWISRYLIYFKNRSLFVRSK" + misc_feature 12030..12842 + /gene="wzx" + /locus_tag="SPC04_0015" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 1.4e-23" + gene 13255..14352 + /gene="mnaA" + /locus_tag="SPC04_0016" + CDS 13255..14352 + /gene="mnaA" + /locus_tag="SPC04_0016" + /EC_number="5.1.3.14" + /note="member of homology group 23" + /codon_start=1 + /transl_table=11 + 
/product="UDP-N-acetylglucosamine-2-epimerase MnaA" + /protein_id="CAI32775.1" + /db_xref="GOA:Q9AHC4" + /db_xref="HSSP:1O6C" + /db_xref="InterPro:IPR003331" + /db_xref="UniProtKB/TrEMBL:Q9AHC4" + /translation="MKKVVVVFGTRPEAIKMCPLVKELRTRKNIETLVCVTGQHRQML + DQVLDTFGIIPDFDLSIMKDKQTLFDVTIGILEGMKAILESEKPDLVLVHGDTSTTFA + SSLAAFYLQIPIGHVEAGLRTYDIYSPYPEEFNRQAVGVLAQYHFTPTQLSKDNLLRE + GKTPESIFVTGNTAIDALQTTIQEDYTHPELEWIGESRFILITAHRRENLGEPMRHMF + RAIRRIIEEYSDVKAIYPIHMNPRVRQIAEEELSGCERIKMIEPLEVLDFHNFLSRSY + LILTDSGGIQEEAPSLGKPVLVMRDTTERPEGIEAGTLKLVGADENNIYRHFKELLEN + DSVYQAMSQASNPYGDGTACKKIADILEGEV" + misc_feature 13318..14340 + /gene="mnaA" + /locus_tag="SPC04_0016" + /note="HMMPfam hit to PF02350, UDP-N-acetylglucosamine + 2-epimerase, score 1.3e-183" + gene 14356..15411 + /gene="fnlA" + /locus_tag="SPC04_0017" + CDS 14356..15411 + /gene="fnlA" + /locus_tag="SPC04_0017" + /note="member of homology group 36" + /codon_start=1 + /transl_table=11 + /product="FnlA" + /protein_id="CAI32776.1" + /db_xref="GOA:Q9AHC3" + /db_xref="InterPro:IPR003869" + /db_xref="InterPro:IPR013692" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q9AHC3" + /translation="MSQFTGKTLLITGGTGSFGNAVLKRFLETDVSEIRIFSRDEKKQ + DDMRHEFQVKVPEVAGKIRFYLGDVRDLASVKNAMHGVDYVFHAAALKQVPSCEFFPV + EAVKTNILGTENVLTAAIEAGVKQVICLSTDKAAYPVNAMGTSKAMMEKIAVAKSRTV + NPEHTKICVTRYGNVLCSRGSVVPLWIEQIKQGNALTITEPSMTRFVMTLEEAVDLVL + FAFEEGKSGDILVQKAPACTIEVLAKAVSEIFASEQDIKIIGIRHGEKRYETLLTNEE + CANAIDLGDFYRVPSDNRNLNYDKYFKDGSTNRNLLTEFNSNNTDLMDVEQVKRKLLE + LDEIQTAIRDMVADEEM" + misc_feature 14377..15231 + /gene="fnlA" + /locus_tag="SPC04_0017" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.00099" + misc_feature 14380..15228 + /gene="fnlA" + /locus_tag="SPC04_0017" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 1.2e-162" + misc_feature 14380..15051 + /gene="fnlA" + /locus_tag="SPC04_0017" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 
4.8e-09" + misc_feature 14383..15018 + /gene="fnlA" + /locus_tag="SPC04_0017" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 5.8e-09" + misc_feature 15229..15372 + /gene="fnlA" + /locus_tag="SPC04_0017" + /note="HMMPfam hit to PF08485, Polysaccharide biosynthesis + protein C, score 2e-23" + gene 15511..16740 + /gene="fnlB" + /locus_tag="SPC04_0018" + CDS 15511..16740 + /gene="fnlB" + /locus_tag="SPC04_0018" + /note="member of homology group 37" + /codon_start=1 + /transl_table=11 + /product="FnlB" + /protein_id="CAI32777.1" + /db_xref="GOA:Q97SJ2" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q97SJ2" + /translation="MIKNILITGAKGFVGKNLICTLEALKDGRDRTRPNLEIGEIFQY + DRDTDPILLDEYCKKADFVFHLAGVNRPQNPDEFMEGNYGFSSRLLEILEKYENTCPV + LLSSSTQASLEGRFSNSIYGQSKLAGEELFFEYGKKTGAPVLVYRFPNLYGKWCRPNY + NSAVATFCYNLAHDLPIQVNDPSVELELLYIDDLIQECLTALEGNPHRCNLDGLQILP + SPSGNYCYVPTTHRATLGEIVSLLETFKKQPDSLVMPEIPQGSFKKKLYSTYLSYLPV + DKFKFPLKMNIDERGSFTELLKTENTGQFSVNISKPGITKGQHWHHSKWEFFMVVSGR + ALIQERRIGLDENGQEYPILNFEVSGDKIEAIHMIPGYAHNIINLSDTENLITVMWAN + ESFDPRHPDTFFEQVEK" + misc_feature 15523..16146 + /gene="fnlB" + /locus_tag="SPC04_0018" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 8.6e-09" + gene 16741..17925 + /gene="fnlC" + /locus_tag="SPC04_0019" + CDS 16741..17925 + /gene="fnlC" + /locus_tag="SPC04_0019" + /note="member of homology group 38" + /codon_start=1 + /transl_table=11 + /product="UDP-L-fucosamine FnlC" + /protein_id="CAI32778.1" + /db_xref="GOA:Q9AHC1" + /db_xref="InterPro:IPR003331" + /db_xref="UniProtKB/TrEMBL:Q9AHC1" + /translation="MKIKTDYSDIHFKDNGKLKLLIIVGTRPEIIRLSSVITKCRKYF + DVILAHTGQNYDYNLNGIFFDNLGLDTPDVYMDAVGDDLGATVGNIINTSYKLMNQIK + PDALLILGDTNSCLSAIAAKRLHIPIFHMEAGNRCKDECLPEETNRRIVDVISDVNLA + YSEHARKYLHECGLPKERTYVTGSPMAEVLHKNLSAIESSDIHERLGLKKGGYILLSA + 
HREENIDTDKNFISLFTAINQLAEKYNMPILYSCHPRSKKRLQESGFKLDKRVIQHEP + LGFHDYNCLQMNAFVVVSDSGTLPEESSFFTSQGYPFPAVCIRTSTERPESLDKAGFI + LAGIDENSLLQAVETAVSLAQDEDFGLPVPDYVEENVSTKVVKIIQSYTGIVDKIVWR + KS" + misc_feature 16852..17880 + /gene="fnlC" + /locus_tag="SPC04_0019" + /note="HMMPfam hit to PF02350, UDP-N-acetylglucosamine + 2-epimerase, score 8.3e-105" + gene complement(18120..18209) + /gene="tnp" + /locus_tag="SPC04_0020" + /pseudo + CDS complement(18120..18209) + /gene="tnp" + /locus_tag="SPC04_0020" + /note="member of homology group 12" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS element transposase (fragment)" + gene complement(18291..19362) + /gene="tnp" + /locus_tag="SPC04_0021" + /pseudo + CDS complement(join(18291..18608,18610..19362)) + /gene="tnp" + /locus_tag="SPC04_0021" + /note="member of homology group 12" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1670 transposase" + gene 19465..19650 + /gene="tnp" + /locus_tag="SPC04_0022" + /pseudo + CDS 19465..19650 + /gene="tnp" + /locus_tag="SPC04_0022" + /note="member of homology group 0047 7" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase (fragment)" + gene complement(19886..20457) + /gene="tnp" + /locus_tag="SPC04_0023" + /pseudo + CDS complement(join(19886..20209,20193..20393,20392..20457)) + /gene="tnp" + /locus_tag="SPC04_0023" + /note="member of homology group 31" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1671 transposase" + misc_feature complement(19889..20191) + /gene="tnp" + /locus_tag="SPC04_0023" + /note="HMMPfam hit to PF05717, IS66 Orf2 like protein, + score 9e-53" + /pseudo + gene 20577..>20936 + /gene="aliA" + /locus_tag="SPC04_0024" + CDS 20577..>20936 + /gene="aliA" + /locus_tag="SPC04_0024" + /codon_start=1 + /transl_table=11 + /protein_id="CAI32783.1" + /db_xref="GOA:Q4K2T2" + /db_xref="InterPro:IPR000914" + /db_xref="UniProtKB/TrEMBL:Q4K2T2" + 
/translation="MMKSSKLFALAGVTLLAATTLAACSGSGSSTKGEKTFSYIYETD + PDNLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKD + AKWYTSEGEEYAAVKAQD" + misc_feature 20577..20663 + /gene="aliA" + /locus_tag="SPC04_0024" + /note="Signal peptide predicted for SPC0098 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.277 between residues 29 and 30" + misc_feature 20823..20891 + /gene="aliA" + /locus_tag="SPC04_0024" + /note="PS01040 Bacterial extracellular solute-binding + proteins, family 5 signature." +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acactgcggc taaagaagta cttgaaaaac aggtcttggc tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcgta taaaaacaag + 181 ggaggactgt ataaaagaca gaaatccttt gttttttata accaaagttt ataaactttc + 241 attcttgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga agatgaacat + 301 aaagaagcgt gtccttagtg caggcctgac ttttgcatct gctttgcttt tagctgcttg + 361 cggccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaactat ctattagact attacgctga taatatagtc aattgaaaca agaacaagac + 481 aaaagagcct cataaaaggt attgcaactt ggtaatacct ttttgaggtg ctttttgata + 541 tgagcccatg ttttctcaat aggattgtac tcaggtgagt agggaggaag aggtaaaagt + 601 ttatacccaa actcttcaca caagagttct aacttaccca ttctatggaa tcttgcatta + 661 tccataataa taaccgatgg tgtgtttaat gttggtaaga gaaatttctg aaaccaagct + 721 tcaaaaaagt cgctcgtcat cgtctcttcg taagttattg gagcgattaa ctcaccattt + 781 gttagacctg caaccaaaga aatcctctga tatcttcttc cagatacttt gcctcttctt + 841 aactgacctt ttaatgagcg accatattct cgataaaaat aagtatcgaa tcctgtttca + 901 tcaatctaaa caggtgctag gtgctttaaa ctattaaaat tcttaagaaa taaggctact + 961 ttttctgggt tttgttcata gtaggtgtgg ttcttttttt cgagtgtagc ccatagcttt + 1021 gagcgcatag tggatggtag ttggatgaca gccaaattca gaagctattt cagtcaaata + 1081 agcgtctgga ttgtcagtaa gatagttttt aagtctatct ctatcaactt ttcttggttt + 1141 tgttcctttt acttggtggt ttagctctcc tgttttctct tttagcttta accagccata + 1201 
aatggtatta cgtgatattt ggaaaacgtg tgatgcttct gttatactac ctgttcgctc + 1261 acaataagag agaacttttt tacgaaaatc tattgaatat gccataagaa gattatacca + 1321 cattgtgtac tatattagat tgaaactaga atagtacacc tctgcttcta aaacattgtt + 1381 agaaatcgat ttgactgtcc tgaacgattt gttctgttct tatttcattt tactatattt + 1441 ttgtttcgcg ggaagtctac taagatactt aaagatgcag atagtaaaaa taaaggtgta + 1501 gacattaccg taaaaaagtg atataatcgt ataatgttca atgtataggt attaattatg + 1561 agtagacgtt ttaaaaaatc acgttcacag aaagtgaagc gaagtgttaa tatagttttg + 1621 ctgactattt atttattgtt agtttgtttt ttattgttct taatctttaa gtacaatatc + 1681 cttgctttta gatatcttaa tctagtggta actgcgttag tcctactagt tgccttggta + 1741 gggctactct tgattatcta taaaaaagct gaaaagttta ctatttttct gttggtgttc + 1801 tctatccttg tcagctctgt gtcgctcttt gcagtacagc agtttgttgg actgaccaat + 1861 cgtttaaatg cgacttctaa ttactcagaa tattcaatca gtgtcgctgt tttagcagat + 1921 agtgagatcg aaaatgttac gcaactgacg agtgtgacag caccgactgg gactaataat + 1981 gaaaatattc agaaattact agctgatatc aagtcaagtc agaataccga tttgacggtc + 2041 aaccagagtt cgtcttactt ggcagcttac aagagtttga ttgcagggga gactaaggcc + 2101 attgtcctaa atagtgtctt tgaaaacatc atcgagtcag agtatccaga ctacgcatcg + 2161 aagataaaaa agatttatac taagggattc actaaaaaag tagaagctcc taagacgtct + 2221 aagagtcagt ctttcaatat ctatgttagt ggaattgaca cctatggtcc tattagttcg + 2281 gtgtcgcgat cagatgtcaa catcctgatg actgtcaatc gagataccaa gaaaatcctc + 2341 ttgaccacaa cgccacgtga tgcctatgta ccaatcgcag atggtggaaa taatcaaaaa + 2401 gataaattga ctcatgcggg catttatgga gttgattcgt ccattcacac cttagaaaat + 2461 ctctatggag tggatatcaa ttactatgtg cgattgaact tcacttcgtt tttgaaattg + 2521 attgatttgt tgggtggaat tgatgtttat aatgatcaag aatttactgc ccatacgaat + 2581 ggaaagtatt accctgcagg caatgttcat cttgattcag aacaggctct cggttttgtt + 2641 cgtgagcgct actccctagc agatggcgat cgtgaccgcg ggcgccatca acaaaaggtg + 2701 attgtggcta tccttcaaaa attaacgtca accgaagtgc tgaaaaatta tagtacgatc + 2761 attaatagct tgcaagattc tatccaaaca aatatgccac ttgagaccat gataaatttg + 2821 gtcaatgctc agttagaaag 
tggagggaat tataaagtaa attctcaaga tttaaaaggg + 2881 acaggtcgga tggatcttcc ttcttatgca atgccagaca gtaacctcta tgtgatggaa + 2941 atagatgata gtagtttagc tgtagttaaa gcagctatac aggatgtgat ggagggtaga + 3001 tgaaatgata gacatccatt cgcatatcgt ttttgatgta gatgacggtc ccaagtcaag + 3061 agaggaaagc aaggctctct tggcagaatc ctacagacag ggggtgcgaa ccattgtttc + 3121 tacctctcac cgtcgcaagg gcatgtttga aactccggaa gagaagatag cagaaaactt + 3181 tcttcaggtt cgggaaatag ctaaggaagt ggcgagtgac ttggtcattg cttacggggc + 3241 tgaaatttat tacacaccag atgttctgga taagctggaa aaaaagcgga ttccgaccct + 3301 caatgatagt cgttatgcct tgatagagtt tagtatgaac actccttatc gcgatattca + 3361 tagcgccttg agcaagatct tgatgttggg aattactcca gtcattgccc acattgagcg + 3421 ctatgatgct cttgaaaata atgaaaaacg cgttcgagaa ctgatcgata tgggctgtta + 3481 cacgcaagta aatagttcac atgtcctcaa acccaaactt tttggcgaac gttataaatt + 3541 catgaaaaaa agagctcagt attttttaga gcaggatttg gttcatgtca ttgcaagtga + 3601 tatgcacaat ctagacggta gacctcctca tatggcagaa gcatatgacc ttgttaccca + 3661 aaaatacgga gaagcgaagg ctcaggaact ttttatagac aatcctcgaa aaattgtaat + 3721 ggatcaacta atttaggaga aatgatgaaa gaacaaaata cgatagaaat cgatgtattt + 3781 caattagtta aaagcttgtg gaaacgcaag ctaatgattt taatagtggc acttgtgaca + 3841 ggtgcggggg cttttgcata tagcactttt attgttaagc cagaatatac gagtaccacg + 3901 cgaatttacg tagtgaatcg caatcaagga gacaagccgg ggttgacaaa tcaggatttg + 3961 caggcaggaa cttatctggt aaaagactac cgtgagatta tcctttcgca ggatgttttg + 4021 gaggaagttg tttctgattt gaaactagat ttgacgccaa aaggtttggc taataaaatt + 4081 aaagtgacag taccagttga tacccgtatt gtctctattt cagttaatga tcgagttcct + 4141 gaagaggcaa gccgtatcgc taactctttg agagaagtag ctgctcaaaa aattatcagt + 4201 attactcgtg tttctgacgt gacaacactg gaggaggcaa ggccggcgat atccccgtct + 4261 tcgccaaata ttaaacgcaa tacactaatt ggttttttgg caggggtgat tggaactagt + 4321 gttatagttc ttcatcttga acttttggat actcgtgtga aacgtccgga agatatcgaa + 4381 aatacattgc agatgacact tttgggagtt gtgccaaact tgggtaagtt gaaataggag + 4441 agaaggatgc cgacattaga aatagcacaa aaaaaactgg 
agttcattaa gaaggcagaa + 4501 gaatattaca atgccttgtg tacaaatata cagttgagcg gagataaact aaaagtaatt + 4561 tccgttactt ctgttaaccc tggggaagga aaaacaacta cttccataaa tatagcatgg + 4621 tcgtttgcgc gtgcaggcta taaaactctt ttgatcgatg gcgatactcg aaattcagtt + 4681 atgttaggag tttttaaatc tcgtgaaaaa attacagggc taacagaatt tttatctggg + 4741 acagctgatt tatctcacgg tttatgtgat acaaatattg aaaatttatt tgtagttcaa + 4801 tcgggatctg tatcaccaaa ccctacagcc ttgttacaaa gtaaaaattt taatgatatg + 4861 attgaaacat tgcgtaaata ttttgattat atcattattg atacaccgcc tattggaatt + 4921 gttattgatg cggcaattat cactcaaaag tgtgatgcgt ccatcttggt aacagcaaca + 4981 ggtgaggcga ataaacgtga tatccaaaaa gcgaaacaac aattaaaaca aacagggaaa + 5041 ctgttcctag gagttgtttt aaataaattg gatatctcgg ttaataagta tggagtttac + 5101 ggttcctatg gaaattatgg taaaaaataa aatgaatata gtatggaagg ggactacaat + 5161 ataactctgg cattcttaca gagcatactt atcagtttat tagcttatgt actgattgca + 5221 atttcagaaa ccgatatgtc ttcaaataat attcggtcta tttggaagaa taattgaact + 5281 ggaccttcta attcattatt gagaactcat atattactga aacaaataaa ttttgtttag + 5341 atggagaaaa gttttatctg acgtagagga taaaagaatt atatttctga aaatcattga + 5401 gtgaccaaat atatattgag tttctgtagt tgcatgtact gcctgattta atttgtcaaa + 5461 tggaaataga atgaaaaatg gaaatagaat ttatagttgg aggttgttta tgtacggtat + 5521 aataaaacga ttaggtgata tattattatc tttaataggg ataataatat tgtgtccggt + 5581 ttttatgata attgcaattg cgattaaact tgattcagaa ggtccggtta tatttaagca + 5641 aaaacgcttt ggtattcata aagaatactt ctatattttg aaatttaggt ctatgaaaat + 5701 agatgcacct aaaaatgtgg cgcctcgaaa cttatataat ccagagcaat ggattacaaa + 5761 agtaggggct ttcttgcgaa aaacatcttt ggatgaacta ccacaattgt ttaatattct + 5821 tgttggtaat atgagtattg taggtcctag accagcgggt ataaatgaac tagatttgat + 5881 tgcagagaga gataagtatg gagcaaatga tatcttgcca gggttaactg gatgggcaca + 5941 aattaacggg cgtgatactt tgtctgttga gatgaagacg gagttagatg gctactatgt + 6001 taaacatctg tctttgataa tggatattag atgtatagtt aagacaatac cttacgtact + 6061 gaaacgaaaa ggtattgtag agggtagtgg taagaaagaa agttaaattg gacaatgaaa + 6121 
atactatttg tttgccaaca ttataagcca gaaccattca ggttgtcaga tatttgtgaa + 6181 gatttagttc gaaaagggca tgaagtctct gttttggctg ggattcctaa ttaccctgaa + 6241 gggaagatat atgcagatta tcgtcataat aaaaaaagac gtgagattat agaaggtgtt + 6301 acgatatatc gttcttatac aatccctaga aaaaaaagtg ttgtatttcg attgttgaat + 6361 tattttagct ttgcaattag ttctacttta ggagttttat tggggaggta taaaacgaaa + 6421 gatggatcga attttgactg tgtattcgtt aaccaattgt ctccagttat gatggcatgg + 6481 gctggtatgg cttataaaaa aaaatataag aaaccgatgt ttctatattg tatggatgtt + 6541 tggccagata gtttaaccgt aggtggagtg aaacaagatg gcttgatttt caagctgttt + 6601 aaatttatct caaaaaaagt ttaccgagct agtgattata tatttgtcac tagtccatca + 6661 tttaaaaatt attttgtgaa gcaatttgac atatccgaac aaaagattac atatttgcca + 6721 caatatgcag aagatctttt tatccctgat gaatctatag ttaataaaga aagtgttgac + 6781 ctaacttttg ctggtaatat tggcaaagca caaaatttgg aaactatttt gaaagctgcc + 6841 agtttgatag agaagaatac caatttaccc aagaaaattc attttcattt tgttggagat + 6901 ggtacggaat tgttaagcat gaaagcatta gctcatgaat tggagttaaa gaatatttcc + 6961 ttctatggaa gacgttcttt ggaggaaatg ccatccttct ataaaaaatc agatgctatg + 7021 ttagtttctt taataggaga ctcgatagtt tctcgtacta tacctgggaa ggtacaatct + 7081 tatatggcgg caggcaaacc aattataggt gcaatttcag gagatgctaa aataattgta + 7141 gaagaagcaa attgtggata tgttagtccc gaacgagatg taaaacaatt ggcaaaaaat + 7201 atttgtaaat ttagtatgtt atctattaag agacaaagag agttaggaaa gaaagctcgt + 7261 tgttactatg aaaatcactt ttcaaaagag cagtttatgc tcgaactgga gacatgttta + 7321 gagagggaaa gtaagaaaga ataatttaat gagagtactg tttatactat ctgataatat + 7381 atatctaact ccttacttca atttttataa agaattattg aagaaactgt ctattagtta + 7441 cgatgttata tattgggata agaatattaa cgagattatt acaaaacaaa actactatcg + 7501 tatttctttt tctggtaaag gaaaattaag taagatatta ggttatgtaa aattcagaaa + 7561 agaaattaaa aagaagctaa aagaaaatga ttatgatatg atattgccgt tacatagtat + 7621 tgtgtctttc attttagtag attttcttct cttttcattt aaaaatagat atatttatga + 7681 tattcgtgat tacagttatg aaaaattttt ggtttatcgt ttggttcaga aacaattggt + 7741 gaaaaattct ttaatgaata 
tcgtttcttc agacggctat aaattttttt taccaatggg + 7801 agagtatttt actacccata acctacccaa tatgatagaa ttaaacgagg taaagcagtt + 7861 aaaaaataat agtacgtttc caattcaact ttcctacatt ggtttaattc gttttcaaga + 7921 acaaaataaa aaaataatcg atttttttgc aaatgacagt cgatttcagt tgaattttat + 7981 aggtactaat gcaggagaat taagggaatt ttgtcaagaa aaaaatatca gcaatgttaa + 8041 cttggtggac acattccagc ctaaagatac catgtctttt tataagaata cagatgctgt + 8101 tttgaattta tacgggaatc acactccctt actagactat gctttgtcta ataaactcta + 8161 ctttgctgca ttgttgtata aacctatttt agtttgtgaa gatacttata tggaaaaagt + 8221 gtcaatagag aatggttttg gtttcgtttt acctatgaag gatgaatcgg aaaaagattg + 8281 tttggctttg tatattcaaa accttgacag gaaacagcta attaagaatt gtgataactt + 8341 catggacaga attagtttag aaaaacaaaa aacagaaata gaattagaga agcgaatctt + 8401 aagcttaagg aagaagaatg attaaagtat tacatctatt tacaacacta gatagtggtg + 8461 gagtagaaag ttttctattc aactattatt ctcacattga tagaaaaaaa attcaatttg + 8521 attttattgt gcctggaaaa gaacaaggat ttttagagga taaaatgaaa gaattgggtg + 8581 caaaggttta tcatgtgcct ctattaagga aaaagcctct acatcagttt ctctctcttg + 8641 ctagaataat aaagaaagga gattatgata tagttcattg ccatggctat aaatctgcaa + 8701 ttggtctgat cttatctaaa ataattggtt gtaaaattag aattattcat agtcatatgg + 8761 cttatgtaac agaaaacagt tttcaaaaag tattgcgtaa attagtaaca attttggtaa + 8821 aaatcttagc aactcattgg tttgcatgtg gggaagattc ggctaagtgg ttatatggag + 8881 agaaagcgta taaagacgga aaaattgaaa ttatttttaa tgcaattgat ttgaaaaagt + 8941 atcaattttt gtcagatgtt agagaaaaat gtcgtagaga attagatgtg tcaaataagt + 9001 tcgtattagg aaatatagct cgcctatcag atcaaaaaaa ccaaagttat ttatttaacg + 9061 ttttaaaaga actcatttta atcaaaccaa atgttatttt actcctagtt ggtaatggtg + 9121 aggatgagca gaaattaaaa cagaaagctt tagaactaaa tctgacccca tatgtgctat + 9181 ttttagggag aaggactgat atttctgatt tattatctgc gatggatgtt tttttgcttc + 9241 cgtctaaata tgaggggttg cctgtttctc tagtagaggc tcaggcatcg ggattacaaa + 9301 ttttatcgtc agatacagtg acgcaagaag tagatgtgac caaaaacatt agttacttac + 9361 ctatcaacga agagtctgtg ttgctatgga aagataaagt 
actgtcttta acatctgagg + 9421 aatgcaatcg ttttgaaata aataacagta tgacagatgg actctatgat atttgttatc + 9481 aagctagtaa attattgaat cgttatcaag aaatgtgtgt aataaaggag atatagatgc + 9541 agacaaagta tatttgtaga gtgacactag tgacattaag ttttatattt gctttctgtt + 9601 acttgttctg gactctcgat aattggaata atggttttct tatatctaat tatgttccgt + 9661 ctatatttat atgggtttgc tttctaatta tttttcaaat tactggtttt attttacaaa + 9721 aagttagtat atatgatttt tctgtatggt atctgatttt atcttatttt tttatgtttg + 9781 gattaatttt caatgagtat atggggtttc aaacaactct gctgtggagc cctagtaact + 9841 tctataataa tgaagaatta tttcattcat atatttttat aatttggatt ttgttttgtt + 9901 attctgtagg ctatttattt ttttatagtg atggaaaggt acattatcat tcagaagtac + 9961 aaaattatca ggaaaatgaa gagaaaattt tgtacaatgc gggtaggatt ttaacaggag + 10021 tgggctttat ttctagggta ataactgatt ctaaaacagt actagcagtt agagcggcga + 10081 atagctattc agcatattca gaggcagcta gttcaggaat aatagatgat ttaggagtac + 10141 ttatgcttcc tggtgtgttc tccttgtttt attcagataa gctgtcccga gttataaagc + 10201 gtactatttt ttgggtaatg ttgttttacc taattttgat aatgatccta acaggaagtc + 10261 gtaaaatcca ggtgttttca atcttggcgt tggttttagt atacacacaa tctttaggga + 10321 ttactttttc gaagaaaaga gtacttgtat ttttaatagt aactgtattt ctattaaatg + 10381 tattagttgt tattaggggg caccgtttcg acttgaatac tataggtata tacttatttg + 10441 attccttttc ttcattagat tttgtaaaga atatactagg ggaagtattt tcagagtcgg + 10501 gactgaccag cctaacagta gcttctgctg taactgttgt gcctagtagc attccatatg + 10561 aatatgggat gacatttcta cgcactatcc tatcaatttt tcctattgga tggttagttg + 10621 gtgatttttt tgataaagca tcagcgacgg ttgttattaa taaatttttg gggttacctg + 10681 taggctcttc ttttgtggaa gaattatttt ggaactttgg ttactatggt ggtgtttttt + 10741 ggagttttgt tttgggaata tttagtggat ggcgattaaa tttcagagct tttcaaacaa + 10801 gtaaaatctc aaaagttatt tatttttcgg taatttctca actattgctt ttagtgagaa + 10861 gtagttcaat agatgtttat cgtcctatta tgtatagttt gattatgata tttattttta + 10921 ggaggttgaa aaaatagtgg tgaaaaaaat tatgttacat ggtgcaacgg attatggttc + 10981 aagtaattac ggtgattatc tttacggtga gattgtctat gatttattag 
aatctaaagg + 11041 atatgaagtt tctttttata atccatcaga tttctttcaa atgtacttga aagaatatcg + 11101 ccaaaaacaa agttttacta aaaaacaagc agatgctatt ttgtatatcc cgggaggata + 11161 ttttggggaa gggcataatg cacgttttcg tgataattta atccaattta aacgattttt + 11221 acctttggga atttgggctt catattttaa aaagcctata ggagtattag gtattggtgc + 11281 agggcctaat aacgattctt tgatgaatta tggtataaag agaattatta atcatgctca + 11341 atttattaca gttcgtgatc gagaatcatt tgattctttg aagcatttgt cgccttcggc + 11401 tccagtgcat gaaacctttg atttaattat ttcaagtaaa ttaagagaag aaaaaacaga + 11461 gcagctgtgt caattgaaaa gagaagctaa agataagaag ataattcttg ttcactataa + 11521 tcattccaaa aaagctcttg aaaaatttgc ggaatcaatt agtctttttc tagaaaacaa + 11581 tcctaactat tatgttgtag taacttcgga ttccattcta ccttatgaag atgcttatta + 11641 tcaggaattt agaaaattag ttagaactga ggattgtttt caattcaagt atcattctcc + 11701 tgcagaaatg acatcattgt tgaaaatggt agatgtggtt ttaacttgta aattacatgt + 11761 tggggtagtg gcaacatgtt ttaataaatc tgtgattgcc attgcatgcc atccagaaaa + 11821 aacagcacgt tattatggag caattggaga gttacaacgt tgtgaatctt tatttgattc + 11881 aagtgttaat agtattgtaa agaaacttga aacttttcat ctaaaaccga taacaatacc + 11941 ttcagaattg gtgttgaaag cgagaagtag tttggactat ttagatcttt ttttggaagg + 12001 actagttcgt gaaagttgat agaatttcat ttataaaaaa tacaagttct ctctatattc + 12061 tgaatattgt taaattacta tttcctttat taacactccc gtatttgaca agggtgcttt + 12121 cgctagacgc gtatggaatg gttatttatg ttaaagcgtt aatagcttat gttcaactgg + 12181 tgattgattt tggtttcatg atatcagcta caaaaaatat tgtaaatgct tgtactactc + 12241 cctcaaagat tggaaggata gttggagata ctctagttga aaaaatattt ttatctatca + 12301 tttcgattct aatttacacc atattgatgt ggcaaatccc aataatgaga gagaatattc + 12361 ttttttcagt tttttatttg ttagctacag tgaccaatat ttttatcttt gactttttat + 12421 ttcgtggaat tgaaaagatg catgcagttg caattcctta tattatttct aaaactatca + 12481 ttacaatttt gacatttatt gtagtaaaag atgattcttc tattttatgg attcctatat + 12541 tggaaggaat tgggaattta gttgctgcag tagtttctta tagattcctt cattattatg + 12601 gaattaaatt atcattttct tatctgtctg tttgggttaa agatttaaag 
gaatcctcta + 12661 tttatttttt atccaatttt gcaactacta tttttggcgt ctttacgaca gtcatttcgg + 12721 gtttttattt acaaagtcaa gagatagcct tttgggggat agcaatgcaa ctgctttcag + 12781 cagcaaaatc attgtataat cctatagcga atagtttata tccgcatatg atacgtacta + 12841 aagatataca atcggttaag agtattaatc ggattatgtt tattcctatt atctttggag + 12901 ttttgatagt tttattcttt tcaaatcaaa ttctttctat aattggtggt gaaaaatata + 12961 ccgtttcagc agattttctt aagtacttat tacccgcttt tgttgctagt ttttattcta + 13021 tgatttacgg atggcctgtc ttaggagcta ttgataaagt gaaagaaact acaatgacaa + 13081 ctatattagc ttcgattgtc caaactttgg gattaggaat atttatcttg tctgataatt + 13141 ttagtttagt aacattagct atttgttcaa gtatgtctga ggtggtgtta tggattagcc + 13201 gttatctaat ttattttaag aaccgttcat tatttgttag gagtaagtaa atatatgaaa + 13261 aaagtagttg tagtatttgg aactcgtcca gaagccatca agatgtgtcc tttggtcaaa + 13321 gagttaagaa cacgtaagaa tattgaaaca ttagtttgcg ttacgggcca acaccgtcaa + 13381 atgttggatc aggtcttgga cacatttggg attattcccg attttgattt gtctattatg + 13441 aaagataaac aaactttatt tgatgtgacc attggcattt tggaaggaat gaaggctatt + 13501 ttagagtcag aaaaacctga tttggtgtta gttcatgggg atacaagtac gaccttcgct + 13561 agttcactgg cggcctttta tttacagatt ccaattggtc atgttgaagc tggtttgcgc + 13621 acttacgata tctattcacc atatcctgaa gagtttaatc gtcaagcagt tggggttttg + 13681 gctcagtatc attttacacc aacacaactt tcaaaagata atcttttaag agaaggaaaa + 13741 actccagaga gcatatttgt gacaggtaat acggcgattg atgctttaca aactacaatt + 13801 caagaggact atacgcatcc tgagttagaa tggataggag aaagcaggtt tattctaatt + 13861 acagctcatc gtcgtgaaaa tcttggtgaa ccgatgagac atatgtttag agcaattaga + 13921 aggattattg aagaatattc agatgtcaag gctatttatc ctatccatat gaatcctcgt + 13981 gttcgccaaa ttgctgagga agaactaagt ggctgtgaac gtatcaagat gatcgaacct + 14041 ttagaagtat tagattttca caatttttta tcaagaagtt atttaatttt aacagatagt + 14101 ggtggtattc aggaagaggc tccaagttta ggaaaacctg ttttggttat gagagataca + 14161 actgaacgtc cagagggaat tgaagcaggg actttgaaac ttgtaggtgc tgatgaaaat + 14221 aatatttata ggcattttaa agaattatta gaaaatgatt cagtttatca 
agcaatgagt + 14281 caagcttcaa atccatatgg agatggaacg gcttgtaaga aaattgcaga catactagaa + 14341 ggagaagtgt aatatatgtc acaatttaca ggaaaaactc tcctaattac aggagggaca + 14401 ggttcatttg ggaatgcggt tctcaagcgt tttttagaaa cagatgtctc agagattcgt + 14461 atattttcgc gagatgaaaa gaaacaagat gatatgcgtc atgagtttca ggtaaaagta + 14521 ccagaagtgg ctgggaaaat ccgtttttac cttggagatg tgcgtgactt agcttcggta + 14581 aaaaatgcta tgcatggtgt ggattatgtt tttcacgctg ctgctcttaa acaagtacct + 14641 tcttgtgaat ttttccctgt agaagcggta aaaactaaca ttttgggaac ggagaatgtc + 14701 ctcactgcgg ctatcgaagc tggtgtaaag caagttatct gtctttctac agataaggcg + 14761 gcttatcctg tcaatgctat gggaacatcc aaggctatga tggaaaagat tgctgttgct + 14821 aagtccagga cggtaaatcc tgagcataca aagatatgtg tgactcgcta tgggaatgtt + 14881 ctgtgtagcc gtggatctgt cgttcctctt tggattgagc aaattaagca aggaaatgct + 14941 cttacaatta ctgaacctag catgacacgt tttgtgatga cattggaaga agcagtagac + 15001 ttggttttat ttgcatttga agaagggaaa tctggagata tactagttca gaaagcacca + 15061 gcatgtacga ttgaagtgtt ggctaaggct gtatcagaaa tttttgcctc agaacaagat + 15121 attaagatta taggtattag acacggagaa aaaaggtatg aaacactatt aactaacgaa + 15181 gagtgcgcaa atgcaattga tttgggtgat ttttatagag ttcctagtga taatcgtaat + 15241 cttaactatg ataagtattt caaagatggt agtacgaata gaaatttgtt gacagaattc + 15301 aatagtaata ataccgattt gatggatgta gagcaagtta aaagaaagtt gctagaatta + 15361 gatgaaatac agacagcaat tcgtgatatg gtagcagacg aagagatgta aaatctttta + 15421 agatacatta aaattatcaa ggatatataa tgtatcatgt attgtcgaga gagttaacta + 15481 ttaaaacagc atataaaata aggagggggc atgattaaaa atattttaat cacaggagcg + 15541 aaaggatttg taggaaaaaa tcttatctgt actctggaag ctttgaaaga tggacgagat + 15601 aggactcgtc ctaatttaga gattggagag atttttcagt atgatcgtga tacagatccg + 15661 attttattag atgaatattg taagaaggcc gatttcgtat tccatttagc tggtgtcaat + 15721 cgtccacaga atcctgatga attcatggag ggaaattacg gtttttcaag tagattattg + 15781 gagattttag aaaagtatga aaacacttgt cctgttctac tctcaagttc tactcaagct + 15841 agtttagaag gccgattttc aaactctata tatggacaat ctaagctagc 
aggggaagaa + 15901 ctcttctttg aatatggaaa gaaaacggga gcacctgtct tagtttaccg tttcccgaat + 15961 ctttatggga agtggtgccg tcctaactac aattctgctg tagcaacttt ctgttataat + 16021 ctagctcacg atttacctat tcaagtaaat gatccaagtg tagaattgga gttgctgtat + 16081 attgatgatt tgatacaaga gtgtctaact gcattggaag gaaatcctca tcgttgtaat + 16141 ctagatggat tacaaatctt acctagccca tcaggaaact actgctacgt accaacgact + 16201 catcgtgcaa ccttaggaga gattgtctct ctattagaaa catttaaaaa acagcctgat + 16261 agtttagtta tgcctgaaat tcctcaggga tcgtttaaaa agaaattgta ttctacctac + 16321 ctatcttatt taccagtaga taagtttaag tttcctctaa aaatgaatat agatgaacga + 16381 ggtagtttta cggaattatt aaaaacagaa aatacgggtc aattttctgt taatatttct + 16441 aaacctggca ttaccaaagg gcaacattgg catcattcta agtgggaatt tttcatggtt + 16501 gtttctggtc gtgctttaat acaagagcgt aggatagggc tggatgaaaa cggtcaagag + 16561 tatcctattc tgaactttga agtgtcgggc gataagattg aagcaataca tatgataccg + 16621 ggctatgcac ataatattat taatctttct gatacagaaa atctaattac tgtcatgtgg + 16681 gctaatgagt catttgatcc tagacatcca gatacttttt ttgaacaagt ggagaaataa + 16741 atgaaaatta agacagatta tagtgatatt cactttaaag ataatggcaa acttaagtta + 16801 ttgattattg tgggaacacg tccagagatt atacgtctaa gtagtgttat cactaaatgt + 16861 cgaaagtatt ttgatgttat tttggcacat actggacaaa actatgatta caatttaaat + 16921 ggtattttct ttgataattt agggttagac actccggacg tatacatgga tgctgttgga + 16981 gatgatcttg gtgctactgt agggaatatt attaatactt catacaaatt gatgaatcaa + 17041 attaaaccag atgctttatt gattttaggg gatacaaatt cttgtttatc agctattgct + 17101 gccaagcgtt tacatattcc aatttttcat atggaggctg gcaatcgctg taaagatgag + 17161 tgcctaccgg aagagactaa tcgtcggatt gttgatgtta tttcagatgt taacttagca + 17221 tactctgaac atgcacgtaa gtatttacat gagtgtggtt tacctaaaga gcgcacatat + 17281 gtaactggtt ctcctatggc agaagtgtta cataaaaatt tatctgctat tgagtcttca + 17341 gatatccatg aacgtttggg attgaaaaaa ggaggttata tcttactttc agctcaccgt + 17401 gaggaaaata ttgatacaga taaaaatttt atttctctct ttacagcaat taatcaatta + 17461 gctgaaaagt ataatatgcc aatcttatat tcttgccatc ctagatcaaa 
gaaaaggcta + 17521 caagagagcg gttttaaact agataaacgt gtgattcagc atgagccact aggattccat + 17581 gactataatt gtttacagat gaatgcattt gttgtagtat ctgattcggg aactttaccg + 17641 gaagaaagta gtttctttac tagtcaaggt tatccttttc ccgctgtatg tattcgtaca + 17701 agtacagaac gtcctgagtc cttagataag gcaggattta ttttggcagg cattgatgaa + 17761 aattctcttc ttcaagcagt tgaaactgct gttagcttgg cacaagatga ggattttgga + 17821 ttaccggttc cggattatgt tgaggaaaat gtctctacta aagttgttaa gataatacag + 17881 agctatacag ggatagtgga taaaatagtt tggaggaaaa gctgaattgt atatttttaa + 17941 taaatcaaaa cgagatgatt aattcttagt agaacaagag taaaattgaa cgtatttgat + 18001 ggaaatgtct tacttgatag tcgagggata gccattctat cggatttttg gcttgttttt + 18061 gcgcttcatg tttgatagaa taaagggctc tttgtcaact gtagtgggtt gaagaaaagc + 18121 taagcttgag aaaggacaaa tttcgtcctt tcttttttga tgttcagagc gataaaaatc + 18181 cgttttttga agttttcaaa gtttcgaaag taaccgccca ataacgaagt ctattgaaaa + 18241 atctccagac tagagaactc atatatagtt cctaatctgg agatttctta tttgcacttt + 18301 tcttgtacaa ctttagtcca cggtaaatag gcctctaaaa cctctttgtt tacgagagtt + 18361 tcctcgtttg gaagacattc tagaagatag gatagatatt tctcgctatt tataatggat + 18421 tgtaataaga tatgaacaaa tcgattagga aaggaaaatt gatttataga aatattttag + 18481 cagtcgatgc gtactgttat agattcaacg cactataatt gatgacgttt agctgtttcc + 18541 aacaaactca taataatagc tcttgcttta gctccttcaa aactttgaga aaataaccac + 18601 cctcgctttt ttaaaaataa ccaccctcgc ttttttaaac tgagcttagg ctaaaagagt + 18661 ccactggact cttttactcc gtcccataac caatgattta atggcgcgtt cagctagatt + 18721 attggaaagg accagatgtc cgtcttttaa aatggtctta aaggtttctt catacttgag + 18781 gctgtattca attgcccttc ctagttttga acccgataaa actgactgac gacggcacca + 18841 agcaaagaag tcttccagta ggggttggag atgttcttga cgtttctgta gccgttcatc + 18901 agctggcaaa gcctcccagt ctctttccaa ggaaaataac tgatcacaat aggctaaacc + 18961 tttagctcct aaggatgatt tatctgcttg cttggggggc acttcaaaaa acttccttct + 19021 cacatgcgcc caacatccaa caagtgcagc ttcttccagt tgacgataag cttctagctg + 19081 ttcgcagttt accaagctta gcgtcgcctt actcctaaac cttggactgc 
tatcgcatag + 19141 gcagaactag aggactaaag tcctaagtta ctgccgcaac atgtcacaat gaacatagcc + 19201 agaataatct cctaggaatt cttgtactac tgaaccactt cgacactgat catggtggta + 19261 aagcgtaatc ccttgtttct ctgctttacc tgacaaaaaa gtccaatagt aggtcagatg + 19321 gctatcactc tctagaaccc gataggaggt ttcatccgca tgaagtaagg gctgagtcaa + 19381 tagtctctct cgcaagaggt tataaagggg ctttaggaat aggagctttc acaagcttat + 19441 ccagatgatt atcttttact cgttatggac aatgctatat ggcataaatc aagtacctta + 19501 aagattccga ctaatattgg ctttgcattt attcctccat acacaccaga gatgaacccc + 19561 attgaacaag tgtggaaaga gattcgtaaa cgtggattta agaataaagc ctttcgaact + 19621 ttggaagatg tcatgaatca acttcaagat gttatacaag gactggagaa ggaggtgata + 19681 aagtccatcg ttaatcggag atggactaga gtgctttttg aaagcagatg agtataaaaa + 19741 gaaagtcctc atttcaatag aaatcacgac tttctgatgg atttatagta aaatgaaata + 19801 ataacaggac aaatcgatca ggacagtaaa atcgatttct aacaatgttt tagaagcaga + 19861 ggtgtactat tctagtttca atctactata tttttggagt gatagaaaag cctttcatca + 19921 gccaatctac ttgttcaggt gcgagagctt tgacatcctt ttctgtactg ggccaagtca + 19981 gtctgccgtt ctcaaagcgt ttatatagta gccaaaatcc ttgaccatcc cagtaaagga + 20041 ctttaaagcg gtctttacgt ccaccacaaa agagaaagat ttgaccggag aaaggatcca + 20101 attcaaagtg ggttttaacg agataagcca gtgaatcgat tccttgtctc atatcagttt + 20161 tcccacacac gagatagacc tgccctaggc tagatagatg aattgtcata gagcaacacc + 20221 ttatccaaaa gctgttctat catttcgaga ttgagagatt gaaaaaaact tacttcaagc + 20281 ttgccaatac gaattttaag tagaatatca tttctctttt tagaatcaaa acgacgagat + 20341 tgtggaatct ctacaggaac aataggttgt ggcattaaaa tatcctccaa tatttacttt + 20401 actaatagta tacaggagga gctccatgaa tgatagatac cttgttatga cgcgcttacg + 20461 atattcatat tttttgcaaa gatgttgttt gaaaaataat tttcaaaaat tctgaaaatt + 20521 ctgttgacaa ctttctgaaa agagtctata atggagagaa agttttaaag gagaaaatga + 20581 tgaaaagttc aaaactattt gcccttgcgg gcgtgacatt attggcggcg actactttag + 20641 ctgcatgctc tggatcaggt tcaagcacta aaggtgagaa gacattctca tacatttatg + 20701 agacagaccc tgataacctc aactatttga caactgctaa ggctgcgaca 
gcaaatatta + 20761 ccagtaacgt ggttgatggt ttgctagaaa atgatcgcta cgggaacttt gtgccgtcta + 20821 tggctgagga ttggtctgta tccaaggatg gattgactta cacttatact atccgtaagg + 20881 atgcaaaatg gtatacttct gaaggtgaag aatacgcggc agtcaaagct caagac +// + diff --git a/public/res/serotype_genbank/serotype_40.gb b/public/res/serotype_genbank/serotype_40.gb new file mode 100644 index 0000000..8096862 --- /dev/null +++ b/public/res/serotype_genbank/serotype_40.gb @@ -0,0 +1,971 @@ +LOCUS CR931712 22089 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain Colemore (serotype 40). +ACCESSION CR931712 +VERSION CR931712.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 22089) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 22089) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..22089 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="Colemore" + /db_xref="taxon:1313" + gene <1..166 + /gene="dexB" + /locus_tag="SPC40_0001" + CDS <1..166 + /gene="dexB" + /locus_tag="SPC40_0001" + /codon_start=2 + /transl_table=11 + /protein_id="CAI34442.1" + /db_xref="GOA:Q4K241" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K241" + /translation="DRRFLVVANLSNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVP + WDAFCVEMTD" + gene complement(313..1707) + /gene="tnp" + /locus_tag="SPC40_0002" + /pseudo + CDS complement(join(313..447,447..1577,1576..1707)) + /gene="tnp" + /locus_tag="SPC40_0002" + /note="member of homology group 17" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1202 transposase" + misc_feature complement(723..1223) + /gene="tnp" + /locus_tag="SPC40_0002" + /note="HMMPfam hit to PF00665, Integrase core domain, + score 1.1e-21" + /pseudo + gene 1874..3328 + /gene="wzg" + /locus_tag="SPC40_0003" + CDS 1874..3328 + /gene="wzg" + /locus_tag="SPC40_0003" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI34444.1" + /db_xref="GOA:Q4JZ21" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4JZ21" + /translation="MLIMSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNI + LAFRYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGL + TNRLNATSNYSEYSLSVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKLSQNT + DLTVDQSSSYLVAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKV + EAPKTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPI + ADGGNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVH + NDQEFSALHGKFHFPVGNVHLDSEQALSFVRERYSLADGDRDRGRNQQKVIVAILQKL + TSTEALKNYSTIIDSLQDSIQTNMPLETMIDLVNAQLESGGTYKVNSQDLKGTGRMDL + PSYAMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1874..1999 + /gene="wzg" + /locus_tag="SPC40_0003" + /note="Signal peptide predicted for SPC1814 by 
SignalP 2.0 + HMM (Signal peptide probability 0.991) with cleavage site + probability 0.537 between residues 42 and 43" + misc_feature 2087..2434 + /gene="wzg" + /locus_tag="SPC40_0003" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 3.9e-61" + misc_feature 2612..3055 + /gene="wzg" + /locus_tag="SPC40_0003" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 2e-69" + gene 3330..4061 + /gene="wzh" + /locus_tag="SPC40_0004" + CDS 3330..4061 + /gene="wzh" + /locus_tag="SPC40_0004" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34445.1" + /db_xref="GOA:Q4JZ20" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4JZ20" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTLDALEKLEKKEIPTLNDS + RYALIEFSMHTSYRQIHTGLSNILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QINSCHVSKPKFFGEKYKFMKKRARYFLERDLVHVVASDMHNLDSRPPYMQQAYDIIA + KKYGAKKAKELFVDNPRKIIMDQLI" + misc_feature 3333..3941 + /gene="wzh" + /locus_tag="SPC40_0004" + /note="HMMPfam hit to PF02811, PHP domain, score 1.9e-38" + gene 4070..4762 + /gene="wzd" + /locus_tag="SPC40_0005" + CDS 4070..4762 + /gene="wzd" + /locus_tag="SPC40_0005" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34446.1" + /db_xref="GOA:Q4JZ19" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4JZ19" + /translation="MQDQNTLEIDVLQLFRALWKRKLVILLVAIITSSVAFAYSTFVI + KPEFTSTTRIYVVNRNQEEKSGLTNQDLQAGTYLVKDYREIILSQDVLEEVISDLKLD + LTPKGLANKIKVIVPIDTRIVSVSVNDRVPEEASRIANSLREVAAKKIISITRVSDVT + TLEEARPAISPSSPNIKRNTLIGFLAGGLGTSVIVLLLELLDTRVKRPEDIEDTLQMT + LLGVVPNLSKLK" + misc_feature 4088..4504 + /gene="wzd" + /locus_tag="SPC40_0005" + /note="HMMPfam hit to PF02706, 
Chain length determinant + protein, score 5.8e-51" + misc_feature 4610..4687 + /gene="wzd" + /locus_tag="SPC40_0005" + /note="PS00217 Sugar transport proteins signature 2." + gene 4772..5455 + /gene="wze" + /locus_tag="SPC40_0006" + CDS 4772..5455 + /gene="wze" + /locus_tag="SPC40_0006" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34447.1" + /db_xref="GOA:Q4JZ18" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4JZ18" + /translation="MPTLEIAQKKLEFIKKAEEHYNALCTNIQLSGDKLKVISVTSVN + PGEGKTTTSVNIARSFARAGYKTLLIDGDTRNSVMSGFFKSREKITGLTEFLSGTADL + SHGLCDTNIENLFVVQSGSVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTAPIGIVI + DAAIITQKCDASILVTATGEVNKRDAQKAKQQLEQTGKLFLGVVLNKLDISVDKYGVY + GSYGNYGKK" + gene 5471..6838 + /gene="wchA" + /locus_tag="SPC40_0007" + CDS 5471..6838 + /gene="wchA" + /locus_tag="SPC40_0007" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI34448.1" + /db_xref="GOA:Q4JZ17" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4JZ17" + /translation="MDEKGLKIFLAVLQSIIVILLVYFLSFVRETEVERSSMVILYLL + HFFVFYFSSYGNNFFKRGYLVEFNSTIRYIFFFAIAIGVLNFFIVERFSISRRGMVYF + LTLEGISLYLLNFLVKKYWKHVFFNLKNSKKILLLTVTKNMEKVLDKLLESDELSWKL + VAVSVLDKSDFQHDKIPVIEKEKIIEFATHEVVDEVFINLPGESYDIGEIISRFETMG + IDVTVNLNAFDKNLGRNKQIHEMVGLNVVTFSTNFYKTSHLISKRILDICGATIGLIL + FAIASLVLVPLIRKDGGPAIFAQTRIGKNGRHFTFYKFRSMRIDAEAIKEQLMDQNTM + QGGMFKINNDPRVTKIGRFIRKTSLDELPQFWNVFIGDMSLVGTRPPTVDEYDQYTPK + QKRRLSFKPGITGLWQVSGRSKITDFDAVVKLDVAYIDNWTIWKDIEILLKTVKVVFM + RDGAK" + misc_feature 6254..6835 + /gene="wchA" + /locus_tag="SPC40_0007" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 2.3e-145" + gene 6869..8050 + /gene="wchF" + /locus_tag="SPC40_0008" + CDS 6869..8050 + 
/gene="wchF" + /locus_tag="SPC40_0008" + /note="member of homology group 15" + /codon_start=1 + /transl_table=11 + /product="putative rhamnosyl transferase WchF" + /protein_id="CAI34449.1" + /db_xref="GOA:Q4JZ16" + /db_xref="InterPro:IPR001296" + /db_xref="InterPro:IPR015393" + /db_xref="UniProtKB/TrEMBL:Q4JZ16" + /translation="MKKSVYIIGSKGIPAKYGGFETFVEKLTAFQQDKAIQYYVACMR + ENSAKSGTTEDVFEHNGAICYNVDVPNIGPARAIAYDIAAINRAIEIAKENKDENPIF + YILACRIGPFIHGIKKRIQAIGGTLLVNPDGHEWLREKWSLPVRKYWKYSERLMVKYA + DLLVCDSKNIEQYIQEDYKQFQPKTTYIAYGTDTTPSILKFEDTKVRNWYQEKGISEN + GYYLVVGRFVPENNYEAMIREFIKSQSKKDFVLITNVEQNKFYDKLLRETGFDQDPRI + KFVGTVYDQELLKYIRENAFAYLHGHEVGGTNPSLLEALGSTKLNLLLDVGFNREVGE + DGAIYWQKDELSRVIEYVETINQATIANLNFKSTQRILSDFTWEKIVADYEGVFCFAK + S" + misc_feature 7484..7978 + /gene="wchF" + /locus_tag="SPC40_0008" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 0.0035" + gene 8007..8897 + /gene="wcwI" + /locus_tag="SPC40_0009" + CDS 8007..8897 + /gene="wcwI" + /locus_tag="SPC40_0009" + /note="member of homology group 99" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34450.1" + /db_xref="GOA:Q4JZ15" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JZ15" + /translation="MWQIMKEYFVLRRVSVPNLYAVVVLYNSLLSEAKILKTLNTLNC + KELNLIVVDNSDRKEIQLKNKNFSTENNITLVNMNGNQGLSKAYNKVLELLKGRIGYV + VWLDDDTEISVEYLTKLLYASRGNYDIILPIIQDTHGKIVSPNSRGLLSNKPIKSYKD + GKKLEKFNAINSCTAVNLDIYEEYRYDERLFLDEIDHSFFYDHRNKNLKIELINTIVI + QNFSQRADNLNFDTAWSRLKIRIRDLIVAYKIRGGIFMGLVAVLKSILLGLQLYLKIK + DLRIVIYSFTSALCIFFRKT" + misc_feature 8064..8561 + /gene="wcwI" + /locus_tag="SPC40_0009" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 4.9e-11" + gene 8894..10090 + /gene="wcwL" + /locus_tag="SPC40_0010" + CDS 8894..10090 + /gene="wcwL" + /locus_tag="SPC40_0010" + /note="member of homology group 100" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34451.1" + 
/db_xref="GOA:Q4JZ14" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4JZ14" + /translation="MKMKILYFMNNTDHGGAALALLDLVTQINENYPEYELIVVTGKK + NNLNVKLTEIGIENYFFPFRNFISSYKKPAILWTILYKIRHYIGNRMALKKIEKKIDL + KKIDIIHSNLNRIDIGAILAKKHSIPHLCHIREHLDVWYFYNKLDHRKFEYDFKVLTT + EKNYIFYMCSFSTKYIAISNSVAMDWCKKGLSQSSIVKVYDGIKLPQVFGDKKWFRNK + KINIVFVGGYDIKKGQELFLSYFLKLPKEIQMQYTLTFYGSGKSKYIKKLQKMSQHLC + SDQVKFHSYIDNLTELLPNYDIGINFSTMEGFGRVTVEYLANGLCVVANKSGASPELI + TEEVGFLIDKDNQDEFIQLFTKLSIEKNKIRQMGNKAVNQAQKFSINQHTREIINVYQ + EMRNKQ" + misc_feature 9509..10015 + /gene="wcwL" + /locus_tag="SPC40_0010" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 3.2e-19" + gene 10087..11094 + /gene="wcwK" + /locus_tag="SPC40_0011" + CDS 10087..11094 + /gene="wcwK" + /locus_tag="SPC40_0011" + /note="member of homology group 64" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34452.1" + /db_xref="GOA:Q4JZ13" + /db_xref="UniProtKB/Swiss-Prot:Q4JZ13" + /translation="MKNMEQIDFVVTWVNNKDVDWCKRKSEFEKEYNIFQDLNSEERY + REWGFMKYWFRAVEKYAPWVNKIYFITEGHVPNWLDVNHPKLVHVKHEDYIEKQFLPT + FNSNVIEMNLIHLKDLSEKFVLFNDDTFINDFVKQSDFFENNLPKDTGIFSPLIPREN + SLTPIVLNNMEIINKYFSKKKILEQNFSKFFNIKYGKHLLKNICLLPWSDLLGFYNSH + IPVSYCKSNFLEVYEKEYDIFNLTFKNKFRNKNEINHWLIRYWQLSSGNFIPRNINFG + KNYAISNDPTDIINELKFSKYKIICINDGESIDSFDEVKDLMIDAFEKKFPEKSSFEK + K" + gene 11091..11951 + /gene="wcxU" + /locus_tag="SPC40_0012" + CDS 11091..11951 + /gene="wcxU" + /locus_tag="SPC40_0012" + /note="member of homology group 101" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34453.1" + /db_xref="GOA:Q4JZ12" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JZ12" + /translation="MRQIRMNLEDLVLIILNYNSAKDTLRCLEILRSFNMNFKIIVVD + NNSTDNSIELLKNIEDPQTTFLISDENRGYGAGNNIGIHFAENNFSSNIIGIINPDIV + IPNQEVIISMYNVLKNSDFAMVGGSVIDNEGNYRLLNSSWNLPSFKSVVLERFLIYNR + HKVPYCLNMYNDETAIVDCVAGCFFMIKADVMKEIGYFDENVFLYNEENILGMKLREK + 
GFQSIILTKQFYYHLHDFEKDKVELSLSKKCKRDWVKFQSRKYFTEKYYSKFLGFLLF + LLKYLICFKL" + misc_feature 11124..11678 + /gene="wcxU" + /locus_tag="SPC40_0012" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 1.6e-20" + gene 12003..13235 + /gene="wzy" + /locus_tag="SPC40_0013" + CDS 12003..13235 + /gene="wzy" + /locus_tag="SPC40_0013" + /note="member of homology group 65" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI34454.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ11" + /translation="MKKSSTLHIGLILFLIVLSKNFFNLVPNIALFSDFNLMIIIIIM + TVVNIKYYNRSTKYQYRWYIIFTLIFVLYSAINEKLLYGQPFLLGLLPQRQFFLCLMT + YFPLRKYFQEQNISLKKLYVGIMNLGSISSLIYILQKIVILYGGTQFVNVMYSFAGYF + SGYRLYVGSSLIILATLISTAYFLETLKLKYLCHLILGWFTQIWITQGRIEMIVLLIS + TIVCIIVQGRLTRKKIIYWLLTILGLWMITLTPIFENIVGAILKVDGAGRGSDSLTIR + AIGRQLYWDQLNETTSKLLFGTGYPNYNYALAFQRTGFSSNIFLTDNGFMTHIYIYGI + VGSSIMGLLFLKYLKNSIKYARQSADMIPLMYIISLLIVAYNIILWYWNADGTFILVI + MICALEHGEQLLHQRNGV" + gene 13240..15192 + /gene="rbsF" + /locus_tag="SPC40_0014" + CDS 13240..15192 + /gene="rbsF" + /locus_tag="SPC40_0014" + /note="member of homology group 49" + /codon_start=1 + /transl_table=11 + /product="putative phosphotransferase" + /protein_id="CAI34455.1" + /db_xref="GOA:Q4JZ10" + /db_xref="InterPro:IPR005834" + /db_xref="InterPro:IPR006439" + /db_xref="UniProtKB/TrEMBL:Q4JZ10" + /translation="MNLNKEVRWKDKQYIAFDFFDTTIHRNCHPEVILFEWSKKISIY + FSFKISATEIYSIRKKSEIHEKQEKQLEEIKYERLLQLVFYTILSRLKSDVTDYNLED + FLIYARTCEEEIELRHISIDTDTINFIEFLKQNGKKIILISDFYSDKKLIEKLMVSLG + IRDYFSKIFISSEIGLRKSSGNLYEYVINELSCKPINLLMIGDNIYSDVKVPKKLGID + SYHKSYSDSHVTVSPNDIVKAMNNVISQACTESLFNLYIPEILYFISKLYKELSVNKA + SDILFCAREGFFIKKLFDLYQKKMNLKLINSHYFYVSRKSTLYPSFKNIEDEDFEVIF + RQFPEITLENFLINLNFSNNDINNISKQTEIKQTDKVSDKSIINKLKQNKLFKDVYDL + NCKEEKYSFREYLKSVGVENDNSTINMVDIGWKGTIQDNIQKAFPSLNIKGYYMGLNF + QRYSTRNSMNKTGILFTDDPQKTKFFNLFNYKYLFYERIFVADHGPTVRYEFMNGVGV + PTLDTDENHIEIYRFSEEFQITFFNTFEKILDLFNESLVTPDELFNEIANLSLKKHCI + 
YLPRLSVSIKKLDRAAKENFGIIKSTNRNSDNKVRNFWKNRDFLFLDYIYKAYGKNRL + LNPILDIYGYFVYLIKTLQIKIVGDI" + misc_feature 13273..13914 + /gene="rbsF" + /locus_tag="SPC40_0014" + /note="HMMPfam hit to PF00702, haloacid dehalogenase-like + hydrolase, score 1.8e-07" + gene 15189..16649 + /gene="wzx" + /locus_tag="SPC40_0015" + CDS 15189..16649 + /gene="wzx" + /locus_tag="SPC40_0015" + /note="member of homology group 47" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI34456.1" + /db_xref="GOA:Q4JZ09" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4JZ09" + /translation="MMSMKEKSINKNAILNIILTLTNIVFPLITFPYISRILNPSGIG + AISFFSSIGSYGVLVASLGISTYGIRVIAKDRYHKDKITKIFQELIVINSVMSIIVTF + FLVLMSFRLEQLSSEKGLLIITCITILSSPFNLNWFYSGIEEYSYITKRSIFFKLVSL + ILTFLFVKSKDDYILYAVITLFSTLASNFINILESRKYINFNLRRDLEFRYHLKPMWY + LFASLLAVNIYINLDSVMLGIINGNDAVGIYSIASKVKWILLSVVTSVSSVLLPRLSF + YSNKYDETKFNNILRKSSTIIFMISIPLTIFFMIKAKESILLLGGEQYIQAVLAMQIL + MPILVISGFSNITGNQILIPTGNEKYFMRAVSIGAIVNLCLNLLLMPILGIIGGAIAT + LCAESVQMIIQFYFSRNKLMGNISLNSIKKIAYSSIFAGILLIVIQNIIENFNSFLNL + AASSFLYFGVYFFLLVLFKESTIKKFLNQIFYKDIS" + misc_feature 15213..16022 + /gene="wzx" + /locus_tag="SPC40_0015" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 1.3e-61" + gene 16791..17693 + /gene="rmlA" + /locus_tag="SPC40_0016" + CDS 16791..17693 + /gene="rmlA" + /locus_tag="SPC40_0016" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI34457.1" + /db_xref="GOA:Q4JZ08" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q4JZ08" + /translation="MKTNLKRRDYSMKGIILAGGSGTRLYPLTRAASKQLMPVYDKPM + IYYPLSTLMLAGIRDILIISTPQDLHRFQELLQDGSEFGLKLSYAEQPSPDGLAQAFI + IGEEFISDDSVALILGDNIYHGSGLSKMLQKAASKESGATVFGYHVKDPERFGVVEFD + QDMKAISIEEKPEQPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDR + 
GDLSVELMGRGFAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISRED + VLALAQPLKKNEYGQYLLRLIGEA" + misc_feature 16827..17543 + /gene="rmlA" + /locus_tag="SPC40_0016" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 1.1e-119" + gene 17694..18290 + /gene="rmlC" + /locus_tag="SPC40_0017" + CDS 17694..18290 + /gene="rmlC" + /locus_tag="SPC40_0017" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI34458.1" + /db_xref="GOA:Q4JZ07" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:Q4JZ07" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPASFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKHHPLLKDVKPLKKEDLE" + misc_feature 17730..18260 + /gene="rmlC" + /locus_tag="SPC40_0017" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 8.1e-16" + gene 18300..19349 + /gene="rmlB" + /locus_tag="SPC40_0018" + CDS 18300..19349 + /gene="rmlB" + /locus_tag="SPC40_0018" + /EC_number="4.2.1.46" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI34459.1" + /db_xref="GOA:O54546" + /db_xref="HSSP:1KEP" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:O54546" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPDVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAAD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 18315..19271 + /gene="rmlB" + 
/locus_tag="SPC40_0018" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.00012" + misc_feature 18318..19058 + /gene="rmlB" + /locus_tag="SPC40_0018" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 5.4e-77" + misc_feature 18321..19133 + /gene="rmlB" + /locus_tag="SPC40_0018" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/iso, score 1.4e-05" + gene 19415..20266 + /gene="rmlD" + /locus_tag="SPC40_0019" + CDS 19415..20266 + /gene="rmlD" + /locus_tag="SPC40_0019" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI34460.1" + /db_xref="GOA:Q9AH81" + /db_xref="HSSP:1N2S" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q9AH81" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAKMDITNEEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 19415..20263 + /gene="rmlD" + /locus_tag="SPC40_0019" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 4.3e-146" + misc_feature 19418..20059 + /gene="rmlD" + /locus_tag="SPC40_0019" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.00011" + misc_feature 19418..20047 + /gene="rmlD" + /locus_tag="SPC40_0019" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 2e-18" + misc_feature 19421..20149 + /gene="rmlD" + /locus_tag="SPC40_0019" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 3.6e-08" + gene 20413..21412 + /gene="glf" + /locus_tag="SPC40_0020" + /pseudo + CDS join(20413..20832,20820..20933,20909..21412) + /gene="glf" + /locus_tag="SPC40_0020" + /EC_number="5.4.99.9" + 
/note="member of homology group 6" + /pseudo + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + misc_feature join(20749..20820,20832..20909,20933..21352) + /gene="glf" + /locus_tag="SPC40_0020" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 1.5e-101" + /pseudo + gene 21730..>22089 + /gene="aliA" + /locus_tag="SPC40_0021" + CDS 21730..>22089 + /gene="aliA" + /locus_tag="SPC40_0021" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34462.1" + /db_xref="GOA:Q4JZ60" + /db_xref="InterPro:IPR000914" + /db_xref="UniProtKB/TrEMBL:Q4JZ60" + /translation="MMKSSRLFALAGVTLLAATTLAACSGSGSSTKGEKTFSYIYETD + PDNLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKD + AKWYTSEGEEYAAVKAQD" + misc_feature 21730..21816 + /gene="aliA" + /locus_tag="SPC40_0021" + /note="Signal peptide predicted for SPC1832 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.277 between residues 29 and 30" + misc_feature 21976..22044 + /gene="aliA" + /locus_tag="SPC40_0021" + /note="PS01040 Bacterial extracellular solute-binding + proteins, family 5 signature." 
+ORIGIN + 1 cgaccgtcgc ttcctagttg tggctaactt gtccaatgaa gagcaagact tgacagtaga + 61 aggaaaagtc aaatctgtct tgattgaaaa caccctagct caagaagtct ttgaaaaaca + 121 aatcttagtt ccatgggatg ctttctgtgt ggaaatgact gactagaatg agcaaacctc + 181 aagtttttga agcttgaggt tttttactat agtggattga aactagaata gtgcacctct + 241 gcttctaaaa cattgttaga aatcgatttg actgtcccga tcgatttgtc ctattcttat + 301 ttcattttgc tatacttgta gttgaggaga attaagctcc tcactagtaa actcttcata + 361 atccttttta tttttatgaa gatattgttt gaaagatgtg agtttccacg gatgggtttg + 421 tggagggata tacttgcgtc tttctttttt tgttctggtt cttgttcaaa gtttttcgaa + 481 tagagttcat gatttagtag ctcctttgtg tgatagattt tgtcagcgat attgaggtag + 541 atgtctccgt caaatgcttt tataactaat gctttcgtct ttctgatgaa atagacttct + 601 tttccttgtt cggtagggat atagtaacga ttttggaatc ggatatggtg tccactatcg + 661 acgactctct ccgccagtct agccagaatg agattccttt cagaggggtt aggaacctcc + 721 tcgaagacag agagttttgt cttgtttcca aactgttcat taaaggtttg aatgtaggaa + 781 agcaggaagg tattggcttc ttccaaggta tgaatattgt tttgttccag ttcgataggt + 841 aggcgagatt gtagtgtctg attgagtctt tcgactctcc ctttagcttg agggatagag + 901 gttgtctcaa ggagaatccc tagttggtga caggcgcatc caaactgtgt atgggtatcg + 961 tcctccattt tcttagagtt ggaggcttga taggtaaaga ccgttctctt atctgtttta + 1021 atttgaaggg gaatgccgtg attggctaag atttgttcga ggacatgata gtaagcattc + 1081 aagttctctt gtttatcaaa ataagcgcct aggatattgc cagaagcatc atcaatggct + 1141 aagtgtaagt tagatgtttg ggctccaaac taggcatgag gactggcatc catttgaatg + 1201 agttcaccag caaatttctt tctgggtcta ctaggatgta cttttttagg gtcttcaagg + 1261 aagttttcag ccgtcggtaa gattggattg tctaggggtt gattcaggtt cagtttagct + 1321 tgttttctta ctctcttctt tgtctttcta tgggacttag gcgacaggat atttttctta + 1381 tagagtattt ttctaacagt agtatcagag agctgaattc cttcttcttc agctagcaat + 1441 tcacagaaat gaaggacatt tggtttatat gtttcatagg agaggtattt ttttaggaga + 1501 cgttctttga tttcatcagg gattgcatgt tttggttttc gatttctgtt tccgtgtctg + 1561 aaggcttctt tgtcctttca gttgataggc tagtagcaga cgattgattt gtctttcaga + 1621 aagattgagc tcgacacagg ctcgtttctt 
tgttttcttt ccttgggcta tagcttttat + 1681 cacaagatat tttttcgttt cattcatatt cagttggatc cttttcatat gactattcta + 1741 ccaaatggga cattttcacg ttcgatttac taaagacatt atcacattcg aattacacaa + 1801 gatgcagata gtgaaaaaag gtgtagacat taccgtaaaa aagtgatata atcataagat + 1861 gttcaatgta taggtgttaa tcatgagtag acgttttaaa aaatcaggtt cacagaaagt + 1921 gaagcgaagt gttaatatag ttttgctgac tatttattta ttgttagttt gttttttatt + 1981 gttcttaatc tttaagtaca atatccttgc ttttagatat cttaatctag tggtaactgc + 2041 gttagtctta ctagtagcct tggtagggct actcttgatt atctataaaa aagctgaaaa + 2101 atttactatt tttctgttgg tgttctctat ccttgtcagc tcagtgtcgc tctttgcagt + 2161 acagcagttt gttggactga ccaatcgttt aaatgcgact tctaattact cagaatattc + 2221 gctcagtgtc gctgttttag cagatagtga gatcgaaaat gttacgcaac tgacgagtgt + 2281 gacagcaccg actgggactg ataatgaaaa tattcaaaaa ctactagctg atatcaagtt + 2341 aagtcagaat accgatttga cagtcgacca gagttcgtct tacttggttg cttacaagag + 2401 tttgattgca ggggagacta aggccattgt cctaaatagt gtctttgaaa atatcatcga + 2461 gtcagagtat ccagactacg catcgaagat aaagaagatt tataccaagg gatttactaa + 2521 aaaagtagaa gctcctaaga cgtctaagaa tcagtctttc aatatctatg ttagtggaat + 2581 tgacacctat ggtcctatta gttcggtgtc gcgatcagat gtcaatatcc tgatgactgt + 2641 caatcgtgat accaagaaaa tcctcttgac cacaacgcca cgtgatgcct atgtaccaat + 2701 cgcagatggt ggaaataatc aaaaagataa attaacccat gcgggcattt atggagttga + 2761 ttcgtccatt cacaccttag aaaatctcta tggagtggat atcaattact atgtgcgatt + 2821 gaacttcact tctttcttga aaatgattga cttattggga ggggtagatg ttcataatga + 2881 tcaagagttt tcagctctac atgggaagtt ccatttccca gtagggaatg tccacctaga + 2941 ctctgagcag gctctaagtt ttgtacgtga acgctactca ctagccgatg gagaccgtga + 3001 ccgtggtcgc aaccaacaaa aggtgattgt ggctatcctt caaaaattaa cgtcaaccga + 3061 agcactgaaa aattatagta cgatcattga tagcttgcaa gattctatcc aaacaaatat + 3121 gccacttgag accatgatag atttggtcaa tgctcagtta gaaagtggtg gaacttacaa + 3181 agtgaattcg caagacttga aaggtacagg tcggatggat cttccttctt atgcaatgcc + 3241 agacagtaac ctctatgtga tggaaataga tgatagtagt ttagctgtag 
ttaaagcagc + 3301 tatacaggat gtgatggagg gtagatgaaa tgatagacat ccattcgcat atcgtttttg + 3361 atgtagatga cggtcccaag tcaagagagg aaagcaaggc tctcttggca gaatcctaca + 3421 ggcagggggt gcgaaccatt gtctctacct ctcaccgtcg caagggcatg tttgaaactc + 3481 cggaagagaa gatagcagaa aactttcttc aggttcggga aattgcaaaa gaagtagcag + 3541 atgatttagt cattgcttat ggtgcagaga tatactatac tctggatgct ctagaaaagc + 3601 tagaaaaaaa agaaattcct acccttaatg atagtcgtta tgccttgatt gagtttagca + 3661 tgcatacttc ctatcgtcag attcatacgg gattgagcaa tattttgatg ttgggaatca + 3721 caccagtaat tgctcatatt gaacgttatg atgctttaga gaataacgaa aaacgtgttc + 3781 gtgaactgat tgatatgggg tgctatactc agataaatag ttgtcatgtt tcaaaaccta + 3841 agttctttgg tgaaaaatat aaattcatga aaaagagagc tcggtatttt ttggaacgtg + 3901 atttagttca tgtagttgca agtgacatgc acaatttaga cagtagacct ccatatatgc + 3961 aacaggcata tgatatcatt gctaagaaat atggagcgaa aaaagcgaaa gaactttttg + 4021 tagataatcc cagaaaaatt ataatggatc aattaattta ggagaaaata tgcaagatca + 4081 aaacactttg gaaatcgatg tattgcagct attcagagct ttatggaaaa gaaagttggt + 4141 cattttatta gtggcaatta taacttcttc agttgctttt gcctacagta cttttgttat + 4201 caaacctgag tttactagta cgactcggat ttatgtagtt aaccgtaatc aggaagagaa + 4261 gtctggttta accaatcaag acttgcaggc aggaacttat ctggtaaaag actaccgtga + 4321 aattatccta tcgcaggatg ttttggagga agttatttct gatttgaaac tagatttgac + 4381 gccaaaaggt ttggctaata aaattaaagt aatagtacca attgataccc gtattgtctc + 4441 tgtttcagtt aatgatcgag ttcctgaaga agcaagccgt atcgctaact ctttgagaga + 4501 agtagctgct aaaaaaatta tcagtattac tcgtgtttct gatgtgacaa cactggagga + 4561 ggcaagaccg gcgatatcac cgtcttcgcc aaatattaaa cgcaatacac taattggttt + 4621 tttggcaggg gggcttggaa ctagtgttat agttcttctt cttgaacttt tggacactcg + 4681 tgtgaaacgt ccagaagata tcgaagatac actgcagatg acacttttgg gagttgtacc + 4741 aaacttgagt aagttgaaat aggagagagg aatgccgaca ttagaaatag cacaaaaaaa + 4801 actggagttc attaagaagg cagaagaaca ttacaatgcc ttgtgtacaa atatacagtt + 4861 gagcggagat aaactaaaag taatttccgt tacttctgtt aaccctgggg aaggaaaaac + 4921 aactacttcc 
gtaaatatag caaggtcgtt tgcgcgtgca ggctataaaa ctcttttgat + 4981 cgatggcgat actcgaaatt cagttatgtc aggatttttt aaatctcgtg aaaaaattac + 5041 agggctaaca gaatttttat ctgggacagc tgatttatct cacggtttat gtgatacaaa + 5101 tattgaaaat ttatttgtag ttcaatcggg atctgtatca ccaaacccta cagccttgtt + 5161 acagagtaaa aattttaatg atatgattga aacattgcgt aaatattttg attatatcat + 5221 tgttgataca gcacctattg gaattgttat tgatgcggca attatcactc aaaagtgtga + 5281 tgcgtccatc ttggtaacag caaccggtga ggtgaataaa cgtgatgccc aaaaagctaa + 5341 acaacaatta gaacaaacag ggaaactgtt cctaggagtt gttttaaata aattggatat + 5401 ctcggttgat aagtatgggg tatacggttc ctatggaaat tatggtaaaa aataacttag + 5461 gaaagatttt atggatgaaa aaggattgaa aatttttctg gcagtattac agagtattat + 5521 tgtcatttta ttggtttatt ttcttagctt tgttagagag acagaagttg aacgttcttc + 5581 gatggttata ctataccttc tccacttttt tgtattctat tttagttcct atggtaacaa + 5641 tttttttaaa agagggtacc tagttgagtt taatagtacc ataagatata tttttttctt + 5701 tgcaatagct ataggtgtat taaacttttt tatagtggaa cggtttagta tctctagaag + 5761 aggaatggta tacttcttaa ctttagaagg aatatcctta tacttgttaa atttcttagt + 5821 aaagaaatat tggaagcatg tgttttttaa tctaaaaaat agcaagaaaa ttttactgtt + 5881 aacagtaacg aaaaatatgg aaaaagttct tgataaattg ctagaatctg atgaactttc + 5941 atggaaattg gtagcagtaa gtgttttgga taaatctgat tttcaacatg ataaaatacc + 6001 tgtaattgaa aaggaaaaaa ttattgaatt tgcaacgcat gaagttgtgg atgaggtgtt + 6061 tatcaatctt ccaggagaga gctacgatat tggagaaatt atctctaggt ttgagacaat + 6121 ggggatagat gtaactgtaa atcttaatgc atttgataag aatttgggtc gcaataaaca + 6181 aattcatgag atggtaggat tgaatgtagt cactttctct acaaattttt ataaaactag + 6241 tcatttgatt tcaaagagaa ttctcgatat ttgtggtgcc actattggcc ttattctttt + 6301 tgctatagct agtctagttt tagttccatt gattcgtaaa gatggcggac cagctatttt + 6361 tgctcaaact cgtataggga aaaatggtcg acattttacc ttttataaat tccgttcaat + 6421 gcggatcgat gctgaagcta tcaaagaaca gttgatggat caaaatacga tgcaaggtgg + 6481 tatgtttaag ataaacaatg atcctcgtgt tacaaaaatt ggtcgcttta ttcgtaaaac + 6541 cagtttggat gaattgccac aattttggaa 
tgtctttatt ggagatatga gtttggttgg + 6601 gacgcgtcca ccgacagtag acgaatatga tcagtatact ccaaaacaga aacgtcgact + 6661 cagctttaag cctggtatta caggcttatg gcaggttagt gggcgtagta aaataaccga + 6721 ttttgatgct gttgtaaaat tagatgtggc ttatattgat aattggacaa tctggaaaga + 6781 tattgaaatt ttgcttaaaa ctgttaaagt tgtatttatg agagatggag cgaagtaatt + 6841 tctgtatatc catcatatta ggagagaaat gaaaaagtca gtttatatca ttggttcaaa + 6901 aggaattcct gctaagtatg gaggatttga aacttttgtt gaaaaattaa cagccttcca + 6961 acaagataag gctatccaat attatgtggc ttgtatgcgt gaaaactctg caaaatcagg + 7021 gactactgag gatgtttttg aacataatgg tgctatctgt tataacgtcg atgttcctaa + 7081 tattggtcca gcgcgagcta tagcgtatga tatcgctgca attaacagag ctattgaaat + 7141 tgccaaagaa aataaggatg aaaatccaat cttctatatt ttagcttgtc gaattggtcc + 7201 gttcatccat ggaattaaga aaagaattca agcaataggt gggactcttc tggttaatcc + 7261 ggatggtcat gagtggctac gagaaaaatg gagtttacct gttcgcaaat attggaaata + 7321 ctctgaaaga cttatggtca aatatgcaga tttattggtt tgtgacagta aaaatatcga + 7381 acagtatatc caagaagatt ataaacagtt ccaacctaag accacctata tcgcttatgg + 7441 gaccgataca actccctcaa tcttgaaatt tgaagatact aaagtccgaa attggtatca + 7501 agagaaggga attagtgaaa acggttatta tttagtggtg ggacgatttg tccctgagaa + 7561 taactatgaa gctatgattc gtgaatttat caaatcccag tctaaaaagg attttgtcct + 7621 cattacaaat gtggaacaaa ataaatttta cgacaagttg cttcgggaaa caggttttga + 7681 ccaagaccca agaatcaaat ttgttggtac tgtttatgat caggaattgt taaaatatat + 7741 tcgagaaaat gcctttgcat atttacatgg tcatgaggtg gggggtacaa atccatcact + 7801 tttagaggct ttaggatcaa caaagttaaa tttgttgctt gatgttggtt ttaaccgtga + 7861 agttggtgag gatggagcta tttattggca aaaagatgaa ctttcacgag tcatcgaata + 7921 tgtggaaacg ataaatcaag caactatcgc aaacttaaat tttaaatcaa cccaaagaat + 7981 cctctcagat ttcacatggg aaaaaattgt ggcagattat gaaggagtat tttgttttgc + 8041 gaagagttag tgtgcccaat ttatatgcag tagtagtttt atacaatagt ttattatcag + 8101 aagcaaaaat tttaaaaacc ttaaatacat taaattgtaa agaattaaac ttaattgtag + 8161 tagacaatag tgataggaaa gaaatacagt taaaaaataa gaacttttcc 
actgaaaata + 8221 atataacatt ggtgaatatg aatggaaatc agggattatc taaagcttat aataaagtcc + 8281 tagaattatt aaagggtaga ataggttatg tggtttggtt agatgatgat actgagatta + 8341 gtgtagaata tttaacaaaa ttattgtatg catcaagagg taattacgac attattttgc + 8401 ctattattca agatacccat ggtaaaattg tttctccaaa ttctcgtggt ttactttcaa + 8461 ataaaccgat taaaagttac aaagatggaa aaaaacttga aaaatttaac gcaataaata + 8521 gttgtacagc tgtcaattta gacatttatg aagaatatag atatgatgaa cgacttttct + 8581 tggatgaaat tgatcattcg tttttctatg accacagaaa taaaaattta aagatcgaat + 8641 taattaatac aatagttatt caaaattttt ctcaaagggc tgataattta aattttgata + 8701 ctgcatggag tagattgaaa attagaattc gggatttgat agtggcttat aaaattagag + 8761 gtgggatttt tatgggtctt gtagctgttt taaaaagtat cctacttgga ctccagttat + 8821 acttgaaaat taaggatttg cgtatagtta tctatagttt cacatctgct ttatgtattt + 8881 tttttagaaa gacttgaaaa tgaagatttt atattttatg aataatacag atcatggtgg + 8941 ggctgcttta gcattattag atttagttac tcagataaat gagaattatc ctgagtatga + 9001 acttattgtt gtaacaggaa aaaaaaataa tttaaatgtt aagttaacag aaattggtat + 9061 tgaaaattac ttttttccat ttagaaattt tattagttca tataaaaagc ctgcaatact + 9121 atggacgatt ttatataaaa ttcgtcatta tatcggaaat cgaatggctc taaaaaaaat + 9181 agaaaaaaaa attgatttga aaaaaatcga tattattcat tctaatttaa atagaatcga + 9241 tataggagca atattagcca aaaagcacag tataccccat ttatgtcata taagagagca + 9301 tttggatgta tggtattttt ataataaatt agatcataga aagtttgagt atgactttaa + 9361 ggtcttgact acggaaaaaa attatatttt ttatatgtgt tctttttcaa cgaaatatat + 9421 tgcaatctct aactctgtag ctatggattg gtgtaaaaaa ggactatctc agtcatctat + 9481 tgttaaagtt tacgacggta tcaagttacc tcaggtattt ggtgataaga aatggtttag + 9541 aaataaaaaa ataaatattg tatttgttgg tggttacgat attaaaaaag gtcaggagtt + 9601 gtttttaagc tattttttaa aattaccaaa agaaatacaa atgcaatata ctttgacttt + 9661 ctatggaagt ggaaaatcta agtatataaa gaaattacaa aagatgtctc aacatctatg + 9721 ttctgatcaa gttaaatttc atagttatat agataatctt acagaattac taccaaatta + 9781 tgatattggg attaattttt caacaatgga aggttttgga agagtgactg ttgaatattt + 9841 agcgaacggt 
ctttgtgttg ttgcaaataa aagtggagct agtccagaat taataacaga + 9901 agaagttgga tttttaatcg acaaggataa tcaggatgaa tttattcagt tatttactaa + 9961 attgtctatt gaaaagaata agataagaca aatggggaat aaagcagtta atcaggcaca + 10021 aaagttttca ataaaccaac atacaagaga gattataaat gtatatcaag aaatgagaaa + 10081 taaacagtga aaaatatgga acaaattgat tttgtggtga catgggttaa taataaagat + 10141 gtagattggt gtaaaagaaa gtctgaattt gagaaagaat ataatatatt tcaagattta + 10201 aatagtgaag aacgatatcg tgaatggggc tttatgaaat attggttcag agctgtggaa + 10261 aaatatgccc cttgggtaaa taaaatttat tttataactg aagggcatgt accaaattgg + 10321 ttagatgtaa atcatcctaa attggttcat gttaaacatg aggattatat tgaaaaacag + 10381 tttttgccaa cttttaattc aaacgttata gagatgaatt tgattcattt gaaagattta + 10441 tcagagaaat ttgttctttt taatgatgat actttcataa atgattttgt aaaacaaagt + 10501 gatttttttg aaaataattt acccaaagat acgggtattt ttagtccttt aatacctaga + 10561 gaaaattctt taactcctat tgtattaaac aatatggaga ttattaacaa atatttttca + 10621 aagaaaaaaa ttcttgagca gaatttttct aagtttttta acatcaaata tggaaaacat + 10681 ctattgaaga atatttgttt actgccatgg tcagatttgt taggctttta taatagtcat + 10741 attccagtaa gttattgtaa aagtaatttc ttggaagtct atgagaaaga atatgacatt + 10801 tttaatttga cgtttaaaaa taaatttagg aataaaaatg agattaatca ttggttaatt + 10861 agatattggc aattgtctag cggtaatttc atacctagaa acattaattt tgggaaaaat + 10921 tatgccattt caaatgatcc tacggatatt attaatgaat taaaattttc taaatataag + 10981 attatatgta ttaatgatgg tgaaagtata gatagttttg atgaagtgaa agatctaatg + 11041 attgatgctt ttgaaaaaaa gtttcctgag aaatcgagtt ttgagaaaaa gtgaggcaga + 11101 taagaatgaa tttggaagat ttagtattaa taattttaaa ttataatagt gctaaagata + 11161 cactacgttg tttagaaatt ctacgttctt ttaatatgaa ttttaaaatc attgtagtgg + 11221 ataataattc tacggacaat tcaatagaac tactcaagaa tatagaggat cctcaaacta + 11281 cttttttaat ttctgatgag aatagaggat atggagcagg taataatatt gggattcact + 11341 ttgcagaaaa taatttttct tcaaatatca taggtattat taatccagat atagtcattc + 11401 ccaatcagga agtgataatt tcaatgtata atgttttgaa aaatagtgac tttgctatgg + 11461 ttggtgggtc 
agtaatcgat aatgagggaa attatagact attaaattca tcatggaatt + 11521 taccttcttt taagagtgtt gtacttgaaa gatttttaat atataatcga cataaagttc + 11581 catattgttt aaatatgtat aatgatgaaa cagcgattgt agattgtgta gcaggttgct + 11641 tttttatgat aaaagctgat gtaatgaagg aaatcggtta ttttgatgaa aatgtttttt + 11701 tatataatga agagaacatt cttggaatga aactgagaga aaagggcttc caatcaatta + 11761 tattaaccaa acagttttac tatcatttgc atgattttga aaaggataag gtagaattat + 11821 ccttgagtaa aaaatgtaaa cgagattggg tgaaatttca gtcacgtaag tattttaccg + 11881 aaaaatatta ttcaaaattt ttaggttttc ttcttttttt gttgaaatat ttaatttgtt + 11941 tcaaattata ataggacact taaaaaataa tattataaag aagaatctga aaggaaactc + 12001 tagtgaaaaa aagtagtacg ttacatatag ggcttattct ttttttgatt gtactgagta + 12061 aaaacttctt taatttagta ccaaatatag cactgttttc tgattttaat cttatgatta + 12121 ttataatcat catgacagtt gttaatatta aatactataa tcgctcaacc aaatatcagt + 12181 atcgttggta tattattttc acattgatat ttgtgttgta tagtgcaatt aatgagaaac + 12241 tattatatgg ccaaccattt ctattaggtt tacttcctca aagacaattt tttttatgtt + 12301 taatgactta tttcccttta agaaagtatt tccaagaaca aaatattagt ttaaaaaaac + 12361 tttatgttgg tattatgaat ttgggatcta tttcatcgtt aatttacatt ttacaaaaga + 12421 tagtaatatt atatggggga acacaatttg ttaacgtaat gtatagtttt gccggatatt + 12481 ttagcgggta tagattgtat gtaggtagtt ctttaattat tttagcaaca ttaatttcta + 12541 ccgcttattt tttagaaaca ttaaaactca agtatctgtg tcaccttata ttaggttggt + 12601 ttactcaaat ttggataacg caaggtcgaa tagagatgat tgttttgcta atttcaacga + 12661 tagtttgcat aatagttcaa ggaagattaa ctagaaagaa aataatttat tggttgctga + 12721 caattttggg actgtggatg attactctaa cacctatttt tgaaaatatt gttggagcta + 12781 ttttaaaagt agatggagca ggtagaggaa gtgattcatt gactattcga gcaattggac + 12841 gacagttata ttgggatcaa ttgaatgaga caacttcaaa acttcttttt ggaacaggat + 12901 atcctaatta taattatgct ttagcctttc aacgtacagg tttttcaagc aatatttttt + 12961 taacagacaa tggttttatg acacatatat atatatatgg tattgtgggt tcctcaatta + 13021 tgggattatt atttttaaaa tatcttaaaa attcaataaa gtatgctaga caatctgcag + 13081 atatgattcc 
gttgatgtat attatttctt tactaattgt agcctataat attattcttt + 13141 ggtattggaa tgcggacggt acttttatat tagtaatcat gatttgcgca ttggagcatg + 13201 gagaacaatt attacatcag aggaatggag tgtgattaga tgaatttaaa taaagaagtt + 13261 agatggaagg ataagcaata tattgctttt gatttttttg atacaactat ccatagaaat + 13321 tgtcatcctg aagtgatttt atttgaatgg tctaaaaaaa tttctattta tttctctttc + 13381 aaaatatctg ctacagaaat ttattcaatt aggaaaaaat ctgaaataca tgagaagcaa + 13441 gaaaaacaat tggaagaaat taaatatgaa agattacttc aacttgtttt ttatactatt + 13501 ttaagtcgtt tgaagtcaga tgttaccgac tataatcttg aagatttttt aatttatgca + 13561 agaacgtgtg aagaggaaat agaattaaga catattagta ttgatacaga tacaattaat + 13621 tttattgaat ttttaaaaca aaatgggaaa aaaataattt taatttcaga tttttattct + 13681 gataaaaagc taattgaaaa attaatggtt tcattaggga ttagagatta tttctctaaa + 13741 atatttattt caagtgaaat tggcttacgt aagtcatcag gaaatttata tgaatatgtg + 13801 atcaatgaat tgagctgtaa gcctataaat ttacttatga ttggtgataa tatttattct + 13861 gatgtaaaag ttccaaaaaa actaggaata gattcttatc ataaatctta ttcagattca + 13921 catgtgactg tgagtcctaa cgatattgta aaagcgatga ataatgttat ttctcaagct + 13981 tgtactgaat ctttatttaa tctctatata cctgaaatac tttattttat ttcaaagtta + 14041 tacaaagaat tatctgttaa caaagctagt gatatattat tttgtgcaag agaaggtttt + 14101 tttataaaaa aattatttga tctttatcaa aaaaaaatga acttaaagct tattaattca + 14161 cattattttt atgtttctag aaaatcaacg ctatatccat catttaaaaa tattgaggat + 14221 gaagattttg aagttatttt tagacaattt cctgaaatta ctttagaaaa ttttttgatt + 14281 aatttaaatt tttccaataa tgatattaac aatatttcta agcaaacaga aattaaacaa + 14341 acagacaaag tatcagataa atctattatt aacaaattaa aacaaaataa attatttaaa + 14401 gatgtttatg atttgaactg taaagaagaa aaatattctt ttagagaata tttaaagtct + 14461 gtaggagttg agaatgacaa ttctacaata aatatggtag atattggttg gaaaggcacg + 14521 atacaagaca atattcaaaa agcttttcca tctttaaata taaaagggta ttatatgggg + 14581 ttgaattttc aacggtattc tactaggaat agtatgaata agacgggaat actgtttact + 14641 gacgatcctc aaaaaacaaa gttttttaac ttatttaatt ataaatattt attctatgaa + 14701 agaatttttg 
ttgcagatca tggaccgaca gttagatatg aatttatgaa tggtgttggg + 14761 gtaccaacat tggatacaga tgaaaatcat atagaaattt atagattttc tgaggaattt + 14821 cagattacat ttttcaacac atttgagaaa attttagatt tgttcaatga atcactagta + 14881 acaccagatg aattatttaa cgaaatagct aatttatcgt taaaaaaaca ttgcatctat + 14941 ttacctaggc tttcagtaag tataaaaaaa ttagatagag cagcaaaaga aaattttggt + 15001 attataaaat ctactaacag gaatagtgat aataaggtaa gaaatttttg gaaaaataga + 15061 gattttttat ttttagatta tatatataaa gcgtatggaa agaatagatt gttaaaccct + 15121 atattggata tttacggata ttttgtatat ctgattaaaa cactgcaaat aaaaatagta + 15181 ggggatattt gatgagcatg aaagaaaaat caataaataa aaatgctatt ttgaatatta + 15241 ttttaacact aacaaatatt gtgtttccat taattacttt tccttatatt tctagaattc + 15301 tgaatccgtc aggaataggt gcaatctctt ttttttcatc tattggttct tatggtgttt + 15361 tagttgcctc gcttggaatt tcaacttatg ggattcgggt gattgcaaag gatcgttatc + 15421 ataaagataa gataactaaa atattccaag aattgatagt tattaatagt gtaatgtcta + 15481 ttatagtgac gttcttcctt gttttaatga gtttccgatt agagcagtta agttcagaaa + 15541 aaggtttatt aataatcaca tgtattacta ttttgtcctc tccttttaat ttgaattggt + 15601 tttatagtgg aatagaagag tattcatata taacaaaacg ttcaatattt tttaaattag + 15661 tttcgttgat attaaccttt ttatttgtta aaagtaaaga cgattatatt ctatatgctg + 15721 tgataacatt gttttcaaca ttggcttcca attttataaa tattttggag agtagaaaat + 15781 acatcaattt taatttgaga agggatttag aatttagata tcatctaaaa ccaatgtggt + 15841 atttatttgc ttcgttactt gcagttaata tttatataaa tttggattct gtgatgttag + 15901 gaattattaa tggaaatgat gcggtaggta tttactcaat cgcatcaaaa gtaaaatgga + 15961 ttttattatc agtcgttact tcagtgagtt cagttttatt acccagatta tcattttata + 16021 gcaataaata tgacgaaacg aagtttaata atattttgag aaagtcatct acaataattt + 16081 ttatgatttc aattcctcta acaatttttt ttatgataaa agcgaaagag agtatattat + 16141 tgttaggtgg agagcagtat attcaggcag ttttagcaat gcaaatatta atgccgatct + 16201 tggtaatatc aggtttttct aatattacag gtaatcagat attgatccct actggtaatg + 16261 agaaatattt tatgagagca gtttctatag gagcaatagt aaatttatgt ttaaatttgt + 16321 tgcttatgcc 
tattttggga attatcggag gtgcgatcgc aactctttgt gcagaatcag + 16381 tccaaatgat tattcaattt tatttttctc gtaataaatt aatgggtaat atttcattaa + 16441 attcaatcaa aaaaatagcc tattcatcaa tttttgcggg tatactgtta atagtaatac + 16501 aaaatattat agagaatttt aatagcttct taaatttagc tgcatctagt tttctatatt + 16561 ttggagtata ttttttctta ttggtattgt ttaaagaaag tacaattaag aaatttctaa + 16621 atcaaatttt ttataaggat atttcatgaa tttattacca attatttatg gagcgattct + 16681 tgatttaata tcagaataat tttttaaagt gaatgaaatc aaagcaataa aagattaaaa + 16741 aataaattgc tatctattat gtttttctca agttaagtaa aacataactc atgaaaacaa + 16801 atttaaaaag gagggactat agtatgaaag gtattattct agcaggtggt tcggggacac + 16861 gtttatatcc tttgactcgc gctgcatcaa aacaacttat gccggtttat gataaaccga + 16921 tgatttacta cccactttca acattgatgc tggctgggat tagggatatt ttgattattt + 16981 ccactccaca ggatttacat cgattccaag agcttcttca agacggatct gagtttgggc + 17041 tcaaactttc ttatgcagag caaccaagtc cagatggttt ggcacaagcc tttatcattg + 17101 gggaagagtt tatttctgat gatagcgttg cgctgatctt aggtgacaat atctatcacg + 17161 gttctgggct ttccaagatg ctacaaaagg cagcgagtaa ggagtcggga gcaactgttt + 17221 ttggctacca tgtcaaggat ccagagcgct ttggtgtggt tgagtttgat caggatatga + 17281 aggctatttc tattgaagaa aagccagagc aacctcgttc aaactatgca gttacaggtc + 17341 tctatttcta tgataatgat gtagtagaga ttgccaagag tattaaacca agtcctcgtg + 17401 gtgaactgga aattacagat gtaaacaagg cttacctaga tcgtggtgat ttgtctgttg + 17461 agcttatggg acgtggcttt gcttggttgg atactggcac tcatgaaagt ttactagagg + 17521 cttcgcagta catcgaaaca gtccaacgga tgcaaaatgt tcaggtagca aacttagaag + 17581 aaattgctta ccgtatgggc tatatcagtc gagaagatgt attggcctta gcccaaccac + 17641 ttaagaaaaa tgaatacgga cagtatctgc tccgtttgat tggagaagca tagatgacag + 17701 ataatttttt cggtaagacg cttgcggcac gcaaggttga agctattcca ggcatgttgg + 17761 agtttgatat ccccgttcat ggagataatc gtggctggtt taaagaaaat ttccaaaagg + 17821 aaaaaatgct tccacttgga tttccagcgt ctttctttgc agaaggaaaa ttgcaaaaca + 17881 atgtatcctt ctcacgtaaa aatgtccttc gaggcctcca cgcagagcct tgggataagt + 17941 acatctctgt 
agcagatgga gggaaagttc tgggttcttg ggttgatcta cgcgagggtg + 18001 aaacctttgg gaatacctat cagacagtaa ttgatgcaag caagggaatc tttgttcctc + 18061 gaggcgtagc taatggcttc caagttttat cagatacagt gtcatatagc tatctggtca + 18121 atgattactg ggcgcttgaa ctcaaaccca agtatgcctt tgtgaactac gctgatccaa + 18181 gccttggtat tgaatgggaa aatattgcag aagcagaggt ttcagaagca gataaacatc + 18241 atcccctact taaggacgtg aagcctttga aaaaagaaga tttggaataa ggaaaaaata + 18301 tgactgaata caaaaatatt atcgtgacag gtggagctgg ctttatcggt tctaactttg + 18361 tccattatgt ttacgagaac tttccagatg ttcacgtgac agtcctagat aagttgactt + 18421 atgctggaaa tcgcgcgaat attgaggaaa ttttaggtaa tcgtgttgag ttagttgttg + 18481 gtgacattgc tgatgcggag ttggtagaca agttggctgc tcaagcagat gctatcgttc + 18541 attatgcagc ggaaagccac aatgataatt cgctcaatga tccatcgcca tttattcata + 18601 ctaacttcat tggaacctat actcttttag aagctgctcg taagtatgat attcgcttcc + 18661 accatgtatc gacagatgaa gtttatgggg atctcccttt acgcgaagat ttgccaggtc + 18721 atggagaagg gccgggtgag aaatttacgg ctgaaaccaa gtacaatcca agctcgcctt + 18781 actcatcaac caaggcagcc tcagatttga ttgtcaaagc ctgggtgcgt tcttttggag + 18841 tcaaggcaac gatttccaac tgttcaaata actacggtcc ttaccagcat attgagaagt + 18901 ttattccacg acaaatcacc aatatcttga gcggtatcaa gccaaaactt tacggtgaag + 18961 gtaagaacgt tcgtgactgg attcatacca atgaccattc ttcaggagtt tggacaatct + 19021 tgacaaaagg gcaaatcggt gaaacctact tgattggggc tgatggtgag aagaacaata + 19081 aggaagtttt ggaacttatc cttaaggaaa tgggacaagc tgcggatgcc tatgatcatg + 19141 tgactgaccg tgcaggacat gaccttcgct atgcgattga tgctagcaag ctccgtgatg + 19201 agttggggtg gaaacctgaa tttaccaact ttgaagctgg gctcaaggca acaatcaagt + 19261 ggtatacaga taaccaagaa tggtggaaag cagaaaaaga agctgttgaa gccaattatg + 19321 ctaagactca ggagattatt acagtataaa aagcaggaaa tagctgcttt ttattgctat + 19381 attgggaaga gttacatatt agaaaggtct agagatgatt ttaattacag gggcaaatgg + 19441 ccaattagga acggaacttc gctatttatt ggatgaacgt aatgaagaat acgtggcagt + 19501 agatgtggct aagatggaca ttaccaatga agaaatggtt gagaaagttt ttgaagaggt + 19561 gaaaccgact 
ttagtctacc attgtgcagc ctacaccgct gttgatgcag cagaggatga + 19621 aggaaaagag ttggacttcg ccatcaatgt gacggggaca aaaaatgtcg caaaagcatc + 19681 tgaaaagcat ggtgcaactc tagtttatat ttctacggac tatgtctttg atggtaagaa + 19741 accagttgga caagagtggg aagttgatga ccgaccagat ccacagacag aatatggacg + 19801 cactaagcgt atgggggaag agttagttga gaagcatgtg tctaatttct atattatccg + 19861 tactgcctgg gtatttggaa attatggcaa aaacttcgtt tttaccatgc aaaatcttgc + 19921 gaaaactcat aagactttaa cagttgtaaa tgaccagtac ggtcgtccga cttggactcg + 19981 taccttggct gagttcatga cctacctagc tgaaaatcgt aaggaatttg gttattatca + 20041 tttgtcaaat gatgcgacag aagatacaac atggtatgat tttgcagttg aaattttgaa + 20101 agatacagat gtcgaagtca agccagtaga ttccagtcaa tttccagcca aagctaaacg + 20161 tccgctaaac tcaacgatga gcctggccaa agccaaagct actggatttg ttattccaac + 20221 ttggcaagat gcattgcaag aattttacaa acaagaagtg agataagtag tagaatgatt + 20281 ttctagtcta ataaaagagg cagagaatga actccaaagg agcttaagat gtacgattat + 20341 cttgttgttg gtgcagtctt tgcccatgaa gcagtcttaa aaggaaaaaa agtaaaagtt + 20401 attgaaaaat gaaatcatat cgcgggtaat atctatactc gtgaagagga aggaattcaa + 20461 gttcatcaat atggtgctca tatcttccat acttctgata aggagatctg ggattatgta + 20521 aatcagtttg cagagtttaa ccgttacata aattctcctg ttgcaaacta taagggtgag + 20581 atttataacc ttccttttaa tatgaatact ttcaataaac tctggggagt tgtaacgcca + 20641 gcagaagcac aagctaagat tgatgaacaa cgtgctattt taaatggtaa aactcctgaa + 20701 aatttggaag aacaggcgat ttctcttgta gctacagaca tctacgaaaa attaatcaaa + 20761 gactatacag agaaacagtg gggcaaacca actactgaac ttccatcctt tattattgtt + 20821 tgccagtacg cctgacctat gataacaact attttaacga tacctatcaa gggattccaa + 20881 ttggtggata cactcaaata gttgaaaaat gttggatcat gaaaatattg atgtagaaac + 20941 aaacgttgat ttctttgtga ataaagagca atatctgaaa gattttccta agattgtctt + 21001 tactggtatg attgatgaat tctttgacta taagttgggc gaactagagt accgtagtct + 21061 tcgttttgaa aatgagacct tggatatgga aaattaccaa ggaaatgcag ttgtgaacta + 21121 tacggatgca gaaaccccat atactcgcat tattgaacac aaacattttg agtttgggag + 21181 tcaagcaaag 
actatcatta ctaaagaaca ttctaaaaca tgggaaaaag gtgatgagcc + 21241 ttattatcca gttaataatg atcgtaataa tcatttgtat aaatcatata aaaaacttgc + 21301 tgatgagcaa gggaatgtta tctttggtgg ccgcttagga cactatcgtt attacgatat + 21361 tcaccaagta attggagcag ctttgcagtg cgtgagaaat gagttaaatt aatactcaat + 21421 gaaaatcaaa gagcaaacta ggaagctagc cacaggttgc tcaaaacact gttttgaggt + 21481 tgcagatgga cgctgacgcg gtttgaagag attttcgaag agtataaaca agtaaaactg + 21541 actaccagtt attatttaga aatagtatta aaaattcctt gactatgtga tatagttgag + 21601 ggatttttaa atgatattca tattttttgc aaagatgttg tttgaaaaat aattttcaaa + 21661 aattctgaaa attctgttga caactttctg aaaagagtct ataatggaga gaaagtttta + 21721 aaggagaaaa tgatgaaaag ttcaagacta tttgcccttg cgggcgtgac attattggcg + 21781 gcgactactt tagctgcatg ctctggatca ggttcaagca ctaaaggtga gaagacattc + 21841 tcatacattt atgagacaga ccctgataac ctcaactatt tgacaactgc taaggctgcg + 21901 acagcaaata ttaccagtaa cgtggttgat ggtttgctag aaaatgatcg ctacgggaac + 21961 tttgtgccgt ctatggctga ggattggtct gtatccaagg atggattgac ttacacttat + 22021 actatccgta aggatgcaaa atggtatact tctgaaggtg aagaatacgc ggcagtcaaa + 22081 gctcaagac +// + diff --git a/public/res/serotype_genbank/serotype_41A.gb b/public/res/serotype_genbank/serotype_41A.gb new file mode 100644 index 0000000..348b22f --- /dev/null +++ b/public/res/serotype_genbank/serotype_41A.gb @@ -0,0 +1,1049 @@ +LOCUS CR931713 22520 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 6803 (serotype 41a). +ACCESSION CR931713 +VERSION CR931713.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 22520) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. 
+ TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 22520) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..22520 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="6803" + /db_xref="taxon:1313" + gene <1..163 + /gene="dexB" + /locus_tag="SPC41A_0001" + CDS <1..163 + /gene="dexB" + /locus_tag="SPC41A_0001" + /codon_start=2 + /transl_table=11 + /protein_id="CAI34463.1" + /db_xref="GOA:Q4JZD8" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4JZD8" + /translation="DRRFLVVANLSNEEQDLTVEGKVKSVLIENTAAKEVLEKQVLAP + WDAFCVELL" + gene 322..490 + /gene="aliB" + /locus_tag="SPC41A_0002" + /pseudo + CDS 322..490 + /gene="aliB" + /locus_tag="SPC41A_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(order(463..1023,1025..1351)) + /gene="tnp" + /locus_tag="SPC41A_0003" + /pseudo + CDS complement(join(463..1023,1025..1351)) + /gene="tnp" + /locus_tag="SPC41A_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(join(961..1023,1025..1333)) + /gene="tnp" + /locus_tag="SPC41A_0003" + /note="HMMPfam hit to PF01710, Transposase, score 7.7e-24" + /pseudo + gene 1584..3029 + /gene="wzg" + /locus_tag="SPC41A_0004" + CDS 1584..3029 + 
/gene="wzg" + /locus_tag="SPC41A_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI34466.1" + /db_xref="GOA:Q4JZ02" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4JZ02" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSLSVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIELEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIINSLQDSIQTNVPLETMINLVNAQLESGGNYKVNSQDLKGTGRMDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1584..1700 + /gene="wzg" + /locus_tag="SPC41A_0004" + /note="Signal peptide predicted for SPC1836 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 39 and 40" + misc_feature 1788..2135 + /gene="wzg" + /locus_tag="SPC41A_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 1.6e-63" + misc_feature 2313..2756 + /gene="wzg" + /locus_tag="SPC41A_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 5.7e-70" + gene 3031..3762 + /gene="wzh" + /locus_tag="SPC41A_0005" + CDS 3031..3762 + /gene="wzh" + /locus_tag="SPC41A_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34467.1" + /db_xref="GOA:Q4JZ01" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4JZ01" + /translation="MIDVHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTPDVLDKLGKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMSGITPVIAHIERYDALGNNEKRVRELIDMGCYT + 
QVNSSHVLKPKLFGERYKFMKKRAQYFLEQDLVHVIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 3034..3642 + /gene="wzh" + /locus_tag="SPC41A_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 1.5e-36" + gene 3768..4463 + /gene="wzd" + /locus_tag="SPC41A_0006" + CDS 3768..4463 + /gene="wzd" + /locus_tag="SPC41A_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34468.1" + /db_xref="GOA:Q4JZ00" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4JZ00" + /translation="MMKEQNTIEIDVFQLFKTLWKRKLMILLVALVTGAGAFAYSTFI + VKPEYTSTTRIYVVNRNQGDKSGLTNQDLQAGSYLVKDYREIILSQDALEKVATNLKL + DMPAKTLASKVQVTVPTDTRIVSISVKDKQPEEASRIANSLREVAVEKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIELFDTRVKRPEDIEDVLQI + PLLGLVPDLDKMK" + misc_feature 3768..3884 + /gene="wzd" + /locus_tag="SPC41A_0006" + /note="Signal peptide predicted for SPC1838 by SignalP 2.0 + HMM (Signal peptide probability 0.721) with cleavage site + probability 0.467 between residues 39 and 40" + misc_feature 3789..4205 + /gene="wzd" + /locus_tag="SPC41A_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 1e-55" + misc_feature 4311..4388 + /gene="wzd" + /locus_tag="SPC41A_0006" + /note="PS00217 Sugar transport proteins signature 2." 
+ gene 4473..5162 + /gene="wze" + /locus_tag="SPC41A_0007" + CDS 4473..5162 + /gene="wze" + /locus_tag="SPC41A_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34469.1" + /db_xref="GOA:Q4JYZ9" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4JYZ9" + /translation="MPTLEISQAKLDFVKKAEEYYNSLCTNLQLSGDGLKVFSITSVK + LGEGKSTTSTNIAWAFARAGYKTLLIDGDIRNSVMLGVFKARDKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVI + DAAIITQKCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGVVLNKFDTSVNKYGSY + RNYGDYGKNKK" + gene 5177..6544 + /gene="wchA" + /locus_tag="SPC41A_0008" + CDS 5177..6544 + /gene="wchA" + /locus_tag="SPC41A_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI34470.1" + /db_xref="GOA:Q4JYZ8" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4JYZ8" + /translation="MNGKVVKPSLAIIHSFLVILLTYLLSAVREAEIASATAIALYIL + HYFVFYISDYGQDFFKRGYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYF + LTLHALLVYVLNLFIKWYWKRAYPNFKGSKKILLLTATSRVEKVLDRLIESNEVVGEL + VAVSVLDKPDFQHDCLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + IDVTVNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHLIAKRIIDIVGALVGLIL + CGLVSIVLVPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKIGCFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSGRSEIKNFDEIVKLDVAYIDDWTIWKDIEILLKTVKVVLM + KDGAK" + misc_feature 5177..5284 + /gene="wchA" + /locus_tag="SPC41A_0008" + /note="Signal peptide predicted for SPC1840 by SignalP 2.0 + HMM (Signal peptide probability 0.897) with cleavage site + probability 0.441 between residues 36 and 37" + misc_feature 5960..6541 + /gene="wchA" + /locus_tag="SPC41A_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 2.7e-160" + gene 
6531..7337 + /gene="wciB" + /locus_tag="SPC41A_0009" + CDS 6531..7337 + /gene="wciB" + /locus_tag="SPC41A_0009" + /note="member of homology group 16" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34471.1" + /db_xref="GOA:Q4JYZ7" + /db_xref="UniProtKB/TrEMBL:Q4JYZ7" + /translation="MERSRLIDVKIIVATHKEVKMPQDNSLYLPIHVGRDGKSDIGFI + GDNTGDNISSLNPYYCELTGLYWAWKNLDYNYLGLVHYRRYFTKKSQRYSDYISMDEV + VLSRGDLDNLLSQNDVLVPKKRRYYIETLYSHYAHTLDGSHLDVARDVIKQLSSEYLT + TFDKVMKQRSGYMFNMFIMKKDLANQYFSWLFPILDKMYEQIDVSQLTPFEARLFGRV + SELLFNVWLKHKDIKPKELPFMYMEKVDLFEKGKSFLMAKFFGKKYGQSF" + gene 7321..8418 + /gene="wcrP" + /locus_tag="SPC41A_0010" + CDS 7321..8418 + /gene="wcrP" + /locus_tag="SPC41A_0010" + /note="member of homology group 89" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34472.1" + /db_xref="GOA:Q4JYZ6" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JYZ6" + /translation="MDRVFEMLEKESPLFSVIVPTYKISESNLRQCIDSLLYDNQDVE + IILVDDNANSDICGKVIDEYAEKYNNISVIHQENQGVSVARNAGMSIAVGKYLVFVDP + DDWVAENFYSQMAFAVQKNPSSDVIILAAIVDYNGKRFTNYFWHTSRSFCGKDKDDLE + LQLIAKGATSYFPTEIGVGVPWAKIYRNEFVRANGLVFNPSLRRMQDNIFNMYAFEFA + NEIVYINEPIYYYRKSMDSVTNKKNDKVIYYFDLVNDEVEKFIQKFNKPKIFEDALHI + KRLIGINSYYKLYFQFATTSSEKKKMRQEFRELLEREEYANSLKQVNTAYLLPKEKIF + ISILKQKHLRIFSFLQKLEKLSARLKSRHFS" + misc_feature 7366..7905 + /gene="wcrP" + /locus_tag="SPC41A_0010" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 2.9e-31" + gene 8426..9343 + /gene="wcrQ" + /locus_tag="SPC41A_0011" + CDS 8426..9343 + /gene="wcrQ" + /locus_tag="SPC41A_0011" + /note="member of homology group 106" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34473.1" + /db_xref="GOA:Q4JYX5" + /db_xref="InterPro:IPR008441" + /db_xref="UniProtKB/TrEMBL:Q4JYX5" + /translation="MRQLTLKLVSIIYKVTKRIPISFISNLGERIYSLKDSYVFDVLS + KLGVDKESTYDLMPPDLFLNKIWICWFQGEDKAPDLVKKCINSVRKHASGYDVIILTE + 
DNIEEYVTLPNIVLTKYKNGLFSRTHFSDIVRLNLLAQQGGLWIDATIFMTRDLDLSI + FFKNDFVSLRTTIKSSPLFITGYWTTYFVYMPSNFKLVQYTALLLNKYIEKYDRFIDY + FLQDYIITKAIKDLNYESYMEERPVLGNQRWLLADLANKVVTSELLQQFKQDTVGIYK + VTYKSKYIRKKNGRETVYKKIVEDGECLE" + misc_feature 8477..9316 + /gene="wcrQ" + /locus_tag="SPC41A_0011" + /note="HMMPfam hit to PF05704, Capsular polysaccharide + synthesis protein, score 2.8e-47" + gene 9324..10214 + /gene="wcrR" + /locus_tag="SPC41A_0012" + CDS 9324..10214 + /gene="wcrR" + /locus_tag="SPC41A_0012" + /note="member of homology group 90" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34474.1" + /db_xref="GOA:Q4JYX4" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JYX4" + /translation="MENALNNKIGIVILNYLNWEDTLECINSLRSQSDQDFEAVIVEN + GSPNESVSRIRDYIKNDKNIHLYVVENNLGYANGNNMGILYLKNRYSINRILLTNNDV + IFDDEDYIKKLEDIKYSNTIGAIGTKIIGSDGLNQNPAYFPISFSSSIKSLLINLLAF + SKVITFIKKRFLSSWTKRANDFSNPKTDEQKYFLHGSVIFLTENYLDRFMGLYGGTFL + YYEEVILGIIFEKAGLDMLYVPDFSIYHKEDQSSLESFANDDLIRRKFLLKSIFSSFK + VHFCATNRLSILVKESIKYD" + misc_feature 9351..9851 + /gene="wcrR" + /locus_tag="SPC41A_0012" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 1.9e-13" + gene 10207..11466 + /gene="wzy" + /locus_tag="SPC41A_0013" + CDS 10207..11466 + /gene="wzy" + /locus_tag="SPC41A_0013" + /note="member of homology group 121" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI34475.1" + /db_xref="InterPro:IPR007016" + /db_xref="UniProtKB/TrEMBL:Q4JYZ3" + /translation="MIKFNYSKLALIYQFIIIFFLGAWYKNSIQFKIFLISIDTIISL + FYLYKNNLSRSDLKKVYILITTVLVSLFLPSFMNRVSFILLILQKLYIFNHIINDIKF + EYLLSVFLQFIVLLTFCMGLEFISLGQFNPFKTFYAPRVLLDMSFKVGTPLYFLRSSL + EHPLITSIVLVVTGPFLFLLEKKWLRYVCVFLNISLIFFIQKRTAYILVSIGVVCFAL + YYLKYINRRFQLNKITSVIFLMTLFIIALSFIRVQGDYVLNIIFSKFSALQDADSFSL + NNRVINAKTGLDVIFDQNVINIFIGNGYDFLPNFFEQYNVYVIRNGFYVIDNTYISFL + ADYGMIGLFLVLLYIINAIRKSMTNIYKIKSKKEQLFMLYSIIGIINLMVSIAFFDIY + 
AWYTLLTLLIFLISVVTSYCKFHSNKF" + gene 11508..12752 + /gene="wcrW" + /locus_tag="SPC41A_0014" + CDS 11508..12752 + /gene="wcrW" + /locus_tag="SPC41A_0014" + /note="member of homology group 122" + /codon_start=1 + /transl_table=11 + /product="conserved hypothetical protein" + /protein_id="CAI34476.1" + /db_xref="UniProtKB/TrEMBL:Q4JYZ2" + /translation="MTLKNEVKNIKRTIEKNFFHKDFTSISDIKNYQIEISKNLRPRL + NLLITSMNSQDVYAGIKSAVDFFMKFKKFDIDLRIIVMGKKIDEPSLYQVPGFEFIKD + YSIENDSESRIICDLSKNRSPLFIRERDYFLSTMWYTAYNANNVLDEQKRIFGKRMPM + VYLVQDYEPGFYPWSSEYLLAESTYHLDNQLVVFNSKYLKEFFDANGYRFENSYYFDP + VLNEKLGEILNLAELSNIERKNRILFYGRPSKARNAFQLICMALEKWSVLDERSSNWE + IFSAGEDLKDIKLNNSIVIKSLGKMSVEEYAKFMLESKIGISLMASPHPSYPPLEMAT + FGMKVITNSFVTKDISDFNENIISIEHININKLAEELHFLTTSDIEYKISKNDDYING + ISQLDTIVDEIAGHLQFRHSEV" + gene 12749..14197 + /gene="wzx" + /locus_tag="SPC41A_0015" + CDS 12749..14197 + /gene="wzx" + /locus_tag="SPC41A_0015" + /note="member of homology group 123" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI34477.1" + /db_xref="GOA:Q4JYZ1" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4JYZ1" + /translation="MIVKRKSIARNYLLNLIKTTLSILFPLISYPYVSRILSVDGLGA + INFSTSFVNYFVLIAIFGINVYAVREGAKYRDDKKLLGKFVTEMLLVSICTAMISFSL + LTVSLLLPALSEYRSLILIFSITIIFNVVGMEWFFQLMEDYQYITLRAIIFQILSLIF + LFIFVKNRNDIYVYALITVAANAGSQILNLFRLRKEVEIFRYKDYNIRNYFKPMFLIF + LTLLSMNMYRYLDVTFLGFFKNDRSVGYYSLATKITSAIISMLSSVTVILTPRLAYHY + KKEEFDKFYKIAYSSFDLILLLAIPVVIGVFSFSSILVDFLGGSTFVSSVLTVEILSL + TILFSNLNALLITPILTVMNREKAVLKIFIIALIFNVITNMLLIPVMDFNGSALVTVL + TEGIICILSLISIKSVFNVRRLFKNLFQYLVASIFIIVIKIVISQYVSSNYIIFISTA + LLSAILYFLTLILLRNELVLQLIIEVRKKIYR" + misc_feature 12770..13576 + /gene="wzx" + /locus_tag="SPC41A_0015" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 1.1e-44" + gene 14213..14885 + /gene="wcrX" + /locus_tag="SPC41A_0016" + /pseudo + CDS join(14213..14239,14239..14469,14469..14885) + /gene="wcrX" + /locus_tag="SPC41A_0016" + /note="member of 
homology group 124" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + gene 14956..16176 + /gene="ugd" + /locus_tag="SPC41A_0017" + CDS 14956..16176 + /gene="ugd" + /locus_tag="SPC41A_0017" + /note="member of homology group 20" + /codon_start=1 + /transl_table=11 + /product="UDP-glucose 6-dehydrogenase Ugd" + /protein_id="CAI34479.1" + /db_xref="GOA:Q4JYZ0" + /db_xref="InterPro:IPR001732" + /db_xref="InterPro:IPR008927" + /db_xref="InterPro:IPR013328" + /db_xref="InterPro:IPR014026" + /db_xref="InterPro:IPR014027" + /db_xref="InterPro:IPR014028" + /db_xref="InterPro:IPR016040" + /db_xref="InterPro:IPR017476" + /db_xref="UniProtKB/TrEMBL:Q4JYZ0" + /translation="MKIAVAGTGYVGLSIAVLMAQHHEVVAVDIISEKVNLINNGKSP + IKDDYIEEYLATKPLNLVATLDTNLAYQNADFVIIAAPTNYDSEKNFFDTSAVESVIE + TVLETNPNAVMVIKSTVPVGYTQSIRNKYKTSNILFSPEFLRESKALYDNLYPSRIIV + GLDMDDAYLKERAETFAELLQEGAVKEAIEILYMGFTEAEAVKLFANTYLALRVSYFN + ELDTYAEVKGLDTKAIIEGIGLDPRIGSQYNNPSFGYGGYCLPKDSKQLLANYKDVPQ + NMITAIVESNRTRKDFIAEQILKLAGVSNNGEIYPKDVIIGLYRLTMKSNSDNFRQSS + IQGVMKRLKAEGANVIIYEPTLSDDETFFGSKIVNDLEHFKSISNVIVANRYDDLLKD + VSDKVYSRDIFKRD" + misc_feature 14956..15513 + /gene="ugd" + /locus_tag="SPC41A_0017" + /note="HMMPfam hit to PF03721, UDP-glucose/GDP-mannose + dehydrogenase, score 1.1e-50" + misc_feature 15541..15822 + /gene="ugd" + /locus_tag="SPC41A_0017" + /note="HMMPfam hit to PF00984, UDP-glucose/GDP-mannose + dehydrogenase, score 1.8e-36" + misc_feature 15904..16155 + /gene="ugd" + /locus_tag="SPC41A_0017" + /note="HMMPfam hit to PF03720, UDP-glucose/GDP-mannose + dehydrogenase, score 9e-07" + gene 16189..17289 + /gene="glf" + /locus_tag="SPC41A_0018" + CDS 16189..17289 + /gene="glf" + /locus_tag="SPC41A_0018" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI34480.1" + /db_xref="GOA:Q4JYY9" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR006076" + 
/db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JYY9" + /translation="MYDYLIIGAGLSGAIFAHEATKRGKKVKVIDKRDHIGGNIYCEN + VEGINVHKYGAHIFHTSNKKVWDYINQFAEFNNYINSPVANYKGSLYNLPFNMNTFYA + MWGTKTPQEVKDKIAEQTADMKDVEPKNLEEQAIKLIGPDIYEKLIKGYTEKQWGRSA + TELPPFIIKRLPVRLTFDNNYFNDRYQGIPIGGYNVIIENMLKDVEVELGIDFFAHRE + ELEASAEKVVFTGMIDRYFDYKHGELEYRSLRFEHEILDEENYQGNAVVNYTEREIPY + TRIIEHKHFEYGMQPKTVITHEYPADWKRGDEPYYPINDEKNNAMFAKYQEEAAQNDK + VIFCGRLADYKYYDMHVVIERALEVVEKEFSN" + misc_feature 16624..17226 + /gene="glf" + /locus_tag="SPC41A_0018" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 5e-138" + gene 17317..18186 + /gene="rmlA" + /locus_tag="SPC41A_0019" + CDS 17317..18186 + /gene="rmlA" + /locus_tag="SPC41A_0019" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI34481.1" + /db_xref="GOA:Q4JYY8" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q4JYY8" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLT + GIKDILIISTPQDLPRFKDLLLDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFIGDDSV + ALILGDNIYHGPGLSTMLQKAAKKEKGATVFGYQVKDPERFGVVEFDTDMNAISIEEK + PEHPRSNYAVTGIYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLGRGDLSVEVMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLTLAQPLKKN + EYGQYLLRLIGEA" + misc_feature 17320..18036 + /gene="rmlA" + /locus_tag="SPC41A_0019" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 6.4e-118" + gene 18187..18780 + /gene="rmlC" + /locus_tag="SPC41A_0020" + CDS 18187..18780 + /gene="rmlC" + /locus_tag="SPC41A_0020" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI34482.1" + /db_xref="GOA:Q7BTQ6" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + 
/db_xref="UniProtKB/TrEMBL:Q7BTQ6" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKHHPLLKDVKPLKKEDL" + misc_feature 18223..18753 + /gene="rmlC" + /locus_tag="SPC41A_0020" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 8.8e-16" + gene 18793..19842 + /gene="rmlB" + /locus_tag="SPC41A_0021" + CDS 18793..19842 + /gene="rmlB" + /locus_tag="SPC41A_0021" + /EC_number="4.2.1.46" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI34483.1" + /db_xref="GOA:Q4JYY6" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JYY6" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPGVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGERPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAAD + AYDHVTDRAGHDLRYAIDASKLREELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 18808..19764 + /gene="rmlB" + /locus_tag="SPC41A_0021" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 7.3e-05" + misc_feature 18811..19755 + /gene="rmlB" + /locus_tag="SPC41A_0021" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.0047" + misc_feature 18811..19551 + /gene="rmlB" + /locus_tag="SPC41A_0021" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 3.3e-76" + misc_feature 18814..19626 + /gene="rmlB" + /locus_tag="SPC41A_0021" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 1.7e-05" + gene 19908..20759 + /gene="rmlD" + /locus_tag="SPC41A_0022" + CDS 19908..20759 + /gene="rmlD" + 
/locus_tag="SPC41A_0022" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI34484.1" + /db_xref="GOA:O54665" + /db_xref="HSSP:1N2S" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:O54665" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITDAEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 19908..20756 + /gene="rmlD" + /locus_tag="SPC41A_0022" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 3.4e-148" + misc_feature 19911..20552 + /gene="rmlD" + /locus_tag="SPC41A_0022" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.0001" + misc_feature 19911..20540 + /gene="rmlD" + /locus_tag="SPC41A_0022" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 5.6e-19" + misc_feature 19914..20642 + /gene="rmlD" + /locus_tag="SPC41A_0022" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 1.8e-08" + gene order(20835..21730,21753..21962) + /gene="tnp" + /locus_tag="SPC41A_0023" + /pseudo + CDS join(20835..21245,21245..21730,21753..21962) + /gene="tnp" + /locus_tag="SPC41A_0023" + /note="member of homology group 12" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1670 transposase" + /db_xref="PSEUDO:CAI34485.1" + misc_feature join(20841..21245,21245..21280) + /gene="tnp" + /locus_tag="SPC41A_0023" + /note="HMMPfam hit to PF03050, Transposase IS66 family, + score 0.00045" + /pseudo + gene 22161..>22520 + /gene="aliA" + /locus_tag="SPC41A_0024" + CDS 22161..>22520 + /gene="aliA" + /locus_tag="SPC41A_0024" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34486.1" + 
/db_xref="GOA:Q4JYY4" + /db_xref="InterPro:IPR000914" + /db_xref="UniProtKB/TrEMBL:Q4JYY4" + /translation="MMKSSKLLALAGVTLLAATTLAACSGSGSSAKGEKTFSYIYETD + PDNLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKD + AKWYTSEGEEYAAVKAQD" + misc_feature 22161..22253 + /gene="aliA" + /locus_tag="SPC41A_0024" + /note="Signal peptide predicted for SPC1856 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.804 between residues 31 and 32" + misc_feature 22407..22475 + /gene="aliA" + /locus_tag="SPC41A_0024" + /note="PS01040 Bacterial extracellular solute-binding + proteins, family 5 signature." +ORIGIN + 1 cgaccgtcgc ttcctagttg tggctaactt gtccaatgaa gagcaagact tgacagtaga + 61 aggaaaagtc aaatctgtct tgattgaaaa cactgcggct aaagaagtac ttgaaaaaca + 121 ggtcttggct ccatgggatg ctttctgtgt ggaattacta taaatatttt ttgcagaaaa + 181 atttaaaatt gaaatcgtat aaaaacaagg gaggactgta taaaagacag aaatcctttg + 241 ttttttataa ccaaagttta taaactttca ttcttgaaat tcaattaact ttacaaattc + 301 ccactattaa ggagaaagaa gatgaacata aagaagcgtg tccttagtgc aggcctgact + 361 tttgcatctg ctttgctttt agctgcttgc ggccaatcag gttcagatac aaaaacttac + 421 tcatcaacct ttagtggaaa tccaactaca tttaactatc tattagacta ttacgctgat + 481 aatatagtca attgaaacaa gaacaagaca aaagagcctc ataaaaggta ttgcaacttg + 541 gtaatacctt tttgaggtgc tttttgatat gagcccatgt tttctcaata ggattgtact + 601 caggtgagta gggaagaaga ggtaaaagtt tatgccaaac ttttcgcata aaagttctag + 661 cttccccatt ctatggaatc ttgcattatc cataataata accgatggtg tggttaatgt + 721 tggtaagaga aacttctgaa accatacttc aaaaaagtcg ctcgtcatcg tctcttcgta + 781 agtcattgga acgattaatt caccatttat tagacctgca accaaagaaa tcctctgata + 841 tcttcttcca gatactttgc ctcttcttaa ctgacctttt aatgagcgac catattctcg + 901 ataaaaataa gtatcgaatc ctgtttcgtc aatctaaaca ggtgctaggt gctttaaact + 961 attaaaattc ttaagaaata aggctacttt ttctgggtct tgttcatagt aggtgtggtt + 1021 ctttttttcg agtgtagccc atagctttga gcgcatagtg gatggtagtt ggatgacagc + 1081 caaattcaga agctatttca gtcaaataag cgtctggatt attagtaaga 
tagtttttaa + 1141 gtctatctct atcaactttt cttggttttg ttccttttac ttggtggttt agctctcctg + 1201 ttttctcttt tagctttaac cagccataaa tggtattacg tgagatttgg aaaacgtgtg + 1261 atgcttctgt tatactacct gttcgctcac aataagagag aactttttta cgaaaatcta + 1321 ttgaatatgc cataaaaaga ttataccaca ttgtgtacta tattatattg aaactagaat + 1381 agtacacatc tgcttctaaa atattgttag aaaacgattt gactgtcctg atcaatttgt + 1441 catgttctta tttcatttta ctatattttt ggttcgcggg aagtctacta agatacttaa + 1501 agatgcagat agtgaaaaaa ggtgtagaca ttaccgtaaa aaagtgatat aatcgtaaga + 1561 tgttcaatgt ataggtgtta atcatgagta gacgttttaa aaaatcacgt tcacagaaag + 1621 tgaagcgaag tgttaatata gttttgttga ctatttattt attgttagtt tgttttttat + 1681 tgttcttaat ctttaagtac aatatccttg cttttagata tcttaatcta gtggtaactg + 1741 cgttagtcct actagttgcc ttggtagggc tactcttgat tatctataaa aaagctgaaa + 1801 aatttactat ttttctgttg gtgttctcta tccttgtcag ctctgtgtcg ctctttgcag + 1861 tccagcagtt tgttggactg accaatcgtt taaatgcgac ttctaattac tcagaatatt + 1921 cgctcagtgt cgctgtttta gcagatagtg agatcgaaaa tgttacgcaa ctgacgagtg + 1981 tgacagcacc gactgggact gataatgaaa atattcaaaa actactagct gatatcaagt + 2041 caagtcagaa taccgatttg acggttaacc agagttcgtc ttacttggca gcttacaaga + 2101 gtttgattgc aggggagact aaggccattg tcctaaatag tgtctttgaa aatatcatcg + 2161 agttagagta tccagactac gcatcgaaga taaagaagat ttataccaag ggattcacta + 2221 aaaaagtaga agctcctaag acgtctaaga atcagtcttt caatatctat gttagtggaa + 2281 ttgacaccta tggtcctatt agttcggtgt cgcgatcaga tgtcaatatc ctgatgactg + 2341 tcaatcgtga taccaagaaa atcctcttga ccacaacgcc acgtgatgcc tatgtaccaa + 2401 tcgcagatgg tggaaataat caaaaagata aattaaccca tgcgggcatt tatggagttg + 2461 attcgtccat tcacacctta gaaaacctct atggagtgga tatcaattac tatgtgcgat + 2521 tgaacttcac ttctttcttg aaaatgattg acttattggg aggggtagat gttcataatg + 2581 atcaagagtt ttcagctcta catgggaagt tccatttccc agtagggaat gtccatctag + 2641 actctgagca agctctaggt tttgtacgtg aacgctactc actagccgat ggagaccgtg + 2701 accgcgggcg caatcaacaa aaggtgattg tggctatcct tcaaaaatta acgtcaaccg + 2761 aagcactgaa 
aaattatagt acgatcatta atagcttgca agattctatc caaacaaatg + 2821 tgccacttga gactatgata aatttggtca atgctcagtt agaaagtgga ggaaattata + 2881 aagtaaattc tcaagattta aaagggacag gtcggatgga tcttccttct tatgcaatgc + 2941 cagacagtaa cctctatgtg atggaaatag atgatagtag tttagctgta gttaaagcag + 3001 ctatacagga tgtgatggag ggtagatgaa atgatagacg tccattcgca tatcgttttt + 3061 gatgtagatg acggtcccaa gtcaagagag gaaagcaagg ctctcttggc agaatcctac + 3121 aggcaggggg tgcgaaccat tgtctctacc tctcaccgtc gcaagggtat gtttgaaact + 3181 ccggaagaga agatagcaga aaactttctt caggttcggg aaattgcaaa agaagtagca + 3241 gatgatttag tcattgctta cggggctgaa atttactaca caccagatgt tctggataag + 3301 ctgggaaaaa agcggattcc gaccctcaat gatagtcgtt atgccttgat agaatttagt + 3361 atgaacactc cttatcgcga tattcatagc gccttgagca agatcttgat gtcgggaatt + 3421 actccagtca ttgcccacat tgagcgctat gatgctcttg gaaataatga aaaacgcgtt + 3481 cgagaactga ttgatatggg ctgttacacg caagtaaata gttcacatgt cctcaaacca + 3541 aaactttttg gagaacgtta taaattcatg aaaaaaagag ctcagtattt tttagagcag + 3601 gatttggttc atgtcattgc aagtgatatg cacaatctag acggtagacc tcctcatatg + 3661 gcagaagcat atgaccttgt tacccaaaaa tacggagaag cgaaggctca ggaacttttt + 3721 atagacaatc ctcgaaaaat tgtaatggat caactaattt aggagaaatg atgaaagaac + 3781 aaaacacgat agaaatcgat gtatttcaat tatttaaaac cttgtggaaa cgcaagctaa + 3841 tgattttatt agtggcactt gtgacaggtg cgggggcttt tgcatatagc acttttattg + 3901 ttaagccaga atatacgagt accacgcgaa tttacgtagt gaatcgcaat caaggagaca + 3961 agtcggggct gacaaatcag gatttgcagg caggatctta tctggtaaaa gactaccgtg + 4021 agattatcct ttcgcaggat gcattggaaa aagtagcgac aaatttgaag ttggacatgc + 4081 cagcaaaaac gttagctagc aaagttcaag tgactgtacc aactgacact cgtatcgtct + 4141 caatctctgt caaggataaa cagccagagg aagccagtcg tatcgccaat tctctacgag + 4201 aagttgctgt agaaaagatc gtcgctgtaa cgcgagtatc tgatgtaacg acgcttgaag + 4261 aagcgcgacc agctacgact ccttcttctc caaatgttcg acgcaattcc ttgtttggtt + 4321 ttcttggagg agcagtcgta acagtaattg ctgttctttt gattgagttg ttcgacaccc + 4381 gtgtgaaacg tcctgaagat attgaagatg 
tactgcaaat tccactttta gggctcgttc + 4441 cagatttgga caaaatgaaa taggaggaag ttatgccaac gttagaaatc tcacaggcaa + 4501 aattggattt tgtaaaaaag gcagaggaat attataactc tttgtgcacg aacctacagt + 4561 taagtggaga tggtttgaaa gtattttcta tcacttctgt gaaactagga gaaggaaaat + 4621 caacgacttc caccaatatc gcttgggctt ttgcgcgtgc aggttacaaa acgctgctga + 4681 ttgatggaga tattcgcaat tctgttatgt taggtgtctt taaagcaagg gataagatta + 4741 caggcctgac agaattttta tcaggaacta cagacctatc acaagggctt tgtgatacca + 4801 atatcgaaaa tctctttgta attcaggctg gctctgtgtc accgaatccg acagctcttc + 4861 ttcaaagtaa gaatttcagt acaatgcttg aaaccttgcg taaatatttt gactacatca + 4921 ttgtagatac tgctcctgtc ggtgtcgtga ttgatgcggc tattattacg caaaaatgcg + 4981 atgcttctat tttagtgacg gaggcaggtg aaataaatcg acgggatatt caaaaagcaa + 5041 aagaacagtt ggaacacaca gggaagccgt ttttgggagt tgtgttgaat aaattcgata + 5101 cttcagtaaa caaatacggt tcttatagaa attatggaga ttacgggaaa aataaaaaat + 5161 agattgaggg atagagatga atggaaaagt agtaaagcct tcattggcca taatccatag + 5221 ttttcttgtt attttattga cttatctact tagtgctgtg agagaagcgg agattgcttc + 5281 agcaacagct attgcacttt atatcctcca ttattttgtc ttttatatca gtgattatgg + 5341 acaggatttc tttaaaaggg gatatttgat tgaacttgtc cagacattga aatatatcct + 5401 attctttgca ctagcgatta gtatttctaa ttttttctta gaggatcgat ttagtatttc + 5461 cagacgaggc atgatttact tcctcacatt acatgctctc ttagtctatg tgctaaacct + 5521 atttatcaag tggtattgga agcgggctta tcccaacttt aaaggaagta agaagattct + 5581 cctgcttaca gcaacttctc gtgtcgaaaa ggtactggat agattaatag aatcaaatga + 5641 ggttgttggg gagttggtag ccgtcagtgt cttagataaa ccagattttc agcatgattg + 5701 tttaaaggta gtagcagagg gggagatagt aaactttgcg actcatgagg tggtcgatga + 5761 agtctttatc aatcttccaa gtgaaaaata caatattgga gagcttgtct ctcagtttga + 5821 aacgatggga attgatgtaa cagtcaatct aaatgctttt gatcgtagtt tggcacgtaa + 5881 caagcaaatt cgtgagatgg cagggttaaa cgttgtgact ttttctacaa cattttataa + 5941 gactagtcat ctaattgcta agcggattat tgatatcgtg ggtgcattgg tagggctgat + 6001 attatgtggt ttagtcagta ttgtactggt tcctttgatt cgaaaggatg 
ggggctctgc + 6061 tatttttgct cagacgcgta taggaaaaaa tggtcgtcag ttcacttttt ataagtttcg + 6121 ctctatgtgt gtagatgccg aggcgaaaaa aagagaactc atggaacaaa ataccatgca + 6181 gggtggaatg tttaaggtgg acgatgatcc tcgtatcacg aaaattggtt gttttatacg + 6241 gaagactagc ttggacgagc taccacagtt ttacaatgtt ctaaagggag atatgagttt + 6301 ggtaggtaca cgaccaccaa cagtggacga gtatgagcac tataccccag aacaaaaacg + 6361 ccgactaagt tttaaacctg gcataacagg tttatggcag gtcagcggac gaagtgagat + 6421 caagaatttc gatgaaattg tcaaattaga tgtagcctat atagacgatt ggacaatttg + 6481 gaaagatatt gagattttat tgaagacagt taaagttgta ttgatgaagg atggagcgaa + 6541 gtagattgat agatgtaaaa atcattgtgg caacacataa agaagttaaa atgcctcaag + 6601 acaatagtct ttaccttcca atacatgttg ggagagacgg taaatcagat attggtttta + 6661 tcggtgataa tactggcgat aatatatcct ctctaaatcc atattattgt gaattgacgg + 6721 gactttattg ggcatggaag aatcttgatt ataattactt aggtttagtt cattaccgtc + 6781 gttattttac aaaaaaatca caaagatatt cagattatat cagtatggat gaagttgttt + 6841 tatctcgagg tgatttagat aatcttcttt cccaaaatga cgttttagtt cctaagaaga + 6901 ggcgatacta tattgaaacg ctctattcac actacgctca tactttggat ggaagtcatc + 6961 ttgatgttgc tcgtgatgta attaaacagt taagttcaga atatttaacg accttcgata + 7021 aggtcatgaa gcaacgtagt ggttacatgt tcaatatgtt tattatgaaa aaagatttgg + 7081 caaatcagta tttttcttgg ttatttccta ttttagacaa gatgtatgag caaatagatg + 7141 tatcccagtt aacacccttt gaagctagac tattcggtcg tgttagtgaa ttattattta + 7201 atgtgtggtt aaaacataag gacattaaac caaaagagct accatttatg tatatggaaa + 7261 aagtagattt gtttgaaaaa gggaaatcct tcttaatggc caaattcttc gggaaaaaat + 7321 atggacagag tttttgaaat gttagaaaaa gaatctccac tttttagtgt tattgttcca + 7381 acctataaga tatcagaatc taatctacgc caatgcatag actctctgtt atatgataat + 7441 caagatgttg aaattatttt ggtggatgat aacgcgaact cagatatatg tggtaaagta + 7501 atagacgaat atgctgaaaa atataataat atttcagtta ttcatcagga aaaccaaggt + 7561 gtgtcagtcg caagaaatgc tggtatgtct attgctgtag gaaagtatct tgtttttgta + 7621 gaccctgatg attgggttgc tgaaaatttt tatagccaaa tggcttttgc ggttcaaaaa + 7681 aatccttcaa 
gcgatgtgat tatattagct gctattgtag actacaatgg taaacgattt + 7741 acgaattatt tttggcacac ttctcgttct ttttgtggaa aagacaaaga tgatttggaa + 7801 cttcaattga ttgccaaagg agcaacgagt tattttccaa ctgagatagg ggttggtgtt + 7861 ccttgggcaa aaatttatcg taatgagttt gtgcgagcaa atggcttggt ttttaatcct + 7921 tctcttcgtc gaatgcaaga taatattttc aatatgtatg cattcgaatt tgcgaatgaa + 7981 atcgtctaca ttaatgagcc gatttactat tatagaaaga gtatggatag tgtaactaat + 8041 aagaaaaatg ataaagtaat ttattatttc gacttagtta atgatgaggt tgaaaaattt + 8101 attcaaaaat ttaataaacc taaaatattt gaagatgctc tgcatataaa aagacttata + 8161 ggaatcaatt cgtattataa gttgtatttt cagtttgcga ctacttcaag cgagaaaaag + 8221 aaaatgcgac aagaatttcg tgaactttta gaaagggaag aatatgcaaa ttcgttaaaa + 8281 caagtgaata cagcctatct tctcccaaaa gaaaaaattt ttataagtat tttaaagcag + 8341 aaacacttgc gaatattttc ctttttacaa aaacttgaaa aattatctgc gagattaaag + 8401 agccgtcatt ttagttagag ggaatatgag acagttaaca ttaaaattag ttagtatcat + 8461 ttataaagta acaaaacgaa tacctatatc ttttatttct aatttaggcg agaggattta + 8521 ttcactaaag gattcctatg tttttgacgt attaagtaaa ttgggagtcg ataaagagag + 8581 cacctatgat ttgatgccac cagatttatt tttgaataaa atttggattt gctggtttca + 8641 gggtgaggat aaagcaccag atttagtaaa aaagtgcatc aatagtgtta gaaaacatgc + 8701 ctcaggctac gatgtcatta ttttaacgga agataatata gaagaatatg ttacacttcc + 8761 aaatattgtt ttaacaaaat ataaaaatgg attatttagc cggactcatt tttcggatat + 8821 agttcgattg aatcttcttg cacaacaggg aggactttgg attgatgcaa cgatttttat + 8881 gactagggat ttagatttgt ctatattttt caaaaatgat tttgtaagct tgagaactac + 8941 aataaaatct agtcctcttt ttattacggg gtactggacg acatattttg tatatatgcc + 9001 ctctaatttt aaattggttc aatatactgc tttattatta aataaataca ttgagaaata + 9061 tgatcgcttt atagattatt tcttacaaga ttatataatt actaaggcaa ttaaagattt + 9121 gaattatgaa tcatacatgg aagaacggcc tgtattggga aatcaacgtt ggcttttagc + 9181 agatttagct aataaagttg tgacctcaga acttcttcaa caatttaagc aagatacggt + 9241 aggaatttat aaagtgacat ataaatccaa gtatattaga aaaaaaaatg gtagggaaac + 9301 ggtttataaa aaaattgtag aggatggaga 
atgccttgaa taataaaata ggaattgtta + 9361 ttttaaatta tcttaattgg gaggatactt tagaatgcat aaatagtttg cgctcacaaa + 9421 gtgatcaaga ttttgaagct gtcatagtag aaaatggttc tccaaatgaa tctgtttcta + 9481 ggattagaga ttatataaaa aatgacaaga atattcatct ttatgtagta gagaataact + 9541 taggttatgc aaatggaaat aatatgggca tcctctactt aaaaaataga tactctataa + 9601 atagaattct attaactaat aatgatgtta tttttgatga tgaagactac ataaaaaaat + 9661 tagaagatat taagtatagt aacacaattg gagctattgg aacaaaaatt attggttctg + 9721 atggtttaaa ccaaaatcca gcttattttc caatttcttt tagttctagt ataaaatcac + 9781 ttcttattaa cttattggca ttttctaaag ttatcacttt tatcaaaaag cgttttctat + 9841 cttcatggac gaaaagagct aatgactttt caaatccaaa aaccgatgaa caaaaatact + 9901 tcctacatgg atcagtcatt tttcttacgg aaaattattt agataggttt atgggattgt + 9961 atggagggac ttttctttac tatgaagaag taatcctagg tattatattt gaaaaagcag + 10021 gtcttgatat gttgtatgta cctgactttt caatttacca taaagaagat caatcatctt + 10081 tggaaagttt tgcaaatgat gatttgatta ggcgtaaatt tttattgaaa agcatattct + 10141 ctagctttaa ggtacatttt tgtgcaacga atagactctc tatactggtg aaggagtcaa + 10201 taaagtatga ttaaatttaa ttattctaaa ttagcattaa tttaccagtt tataataatt + 10261 ttttttctgg gtgcttggta taagaatagc attcagttta aaattttttt gatatctatt + 10321 gatactatca tttctttatt ttatttatat aaaaataatt tatctagaag tgacttaaaa + 10381 aaagtttata tcttgataac tacagtgtta gtaagcttat ttttaccatc gtttatgaat + 10441 agagtatctt ttatacttct catattgcaa aaattatata tatttaacca tattattaat + 10501 gatataaagt ttgaatattt gctctcagtc tttctacaat ttattgtact actaaccttt + 10561 tgtatgggat tagaattcat ttcattagga caatttaatc cgtttaaaac attttatgca + 10621 ccaagagttc ttcttgatat gagttttaaa gtcggaacac ctttatattt tttgagatca + 10681 agtttagagc atcctctaat aacttcgatt gtattagtag ttactggccc tttcttattc + 10741 cttttagaaa agaaatggtt gagatatgta tgtgtgtttc taaatattag tttaatcttt + 10801 tttattcaga agagaactgc gtatatattg gtatcgattg gagttgtatg ttttgctttg + 10861 tattatctaa aatatattaa tcgtagattt caattgaata aaataacttc agtgatattt + 10921 ttaatgacac tatttataat tgctttatcc tttataaggg 
tgcaaggtga ttatgtatta + 10981 aatattattt ttagtaaatt ttctgcttta caagatgcag atagtttctc gctaaataat + 11041 cgtgtaatta atgctaaaac tggattagat gtaattttcg atcaaaatgt tataaatata + 11101 ttcattggga atggatatga ctttttacct aatttttttg aacaatacaa tgtgtatgta + 11161 attcggaatg gtttttatgt gattgacaat acatatattt catttcttgc cgactatgga + 11221 atgattggtc tgttcttagt attgttatat attataaatg cgatccgaaa aagtatgact + 11281 aatatttaca aaataaagag taaaaaagaa caattattta tgttgtatag tattataggt + 11341 attatcaatt taatggtatc aatagctttt tttgatatat atgcttggta cacgctatta + 11401 acgttattga tttttttaat atcagtagtg acttcttatt gtaaatttca ttccaataag + 11461 ttttagtgtg tacaatcatt ataattagca aaaagaagga aatctgaatg actctcaaaa + 11521 acgaagttaa aaacataaaa cgaacaatag aaaaaaattt ttttcataag gattttacat + 11581 ctatatctga tattaagaat tatcagattg aaatttctaa gaatctaagg ccacgtctta + 11641 atttattaat tacttcaatg aactctcagg atgtatatgc tggcatcaaa tcagcagtgg + 11701 atttttttat gaagttcaaa aaatttgata tagatttaag aatcattgta atgggaaaaa + 11761 aaatcgatga accgtctctt tatcaagttc ctggttttga atttattaaa gactattcaa + 11821 ttgagaatga tagtgagtct aggattattt gcgatttatc taagaatcgt tctccattgt + 11881 ttattaggga gcgtgattat tttctatcaa caatgtggta cactgcttat aatgctaaca + 11941 atgtgctgga tgagcaaaaa agaatttttg ggaaacggat gcccatggtt tatctagttc + 12001 aagactatga accaggtttc tatccatggt cctcagagta tcttttggct gagagcacat + 12061 atcatctaga taaccagctt gttgtcttta attctaagta tttaaaagaa ttttttgatg + 12121 caaatggtta tagatttgaa aatagttatt attttgatcc agttttaaat gaaaaattgg + 12181 gggagattct taatttagca gagctttcta atattgaaag gaaaaatcgt attttatttt + 12241 atggaaggcc tagtaaagct agaaatgctt ttcagttaat ctgtatggca ttggaaaaat + 12301 ggagcgtttt ggacgaacgt agttcaaatt gggaaatttt ttctgcagga gaagatttaa + 12361 aagatattaa attgaataat agcatagtaa taaaatcgtt agggaagatg tcagttgaag + 12421 aatacgcaaa atttatgttg gaatctaaaa tcggaatctc tctaatggcc tcaccgcatc + 12481 ctagctatcc tccgttagaa atggctacgt ttggtatgaa agtcataacg aattctttcg + 12541 ttacaaaaga tatttctgat tttaatgaaa acataatttc 
tattgaacat attaatatta + 12601 ataaattggc ggaagaatta cattttttaa caacatctga tatagaatat aaaatttcga + 12661 aaaacgatga ttatataaat ggtattagcc agcttgatac aattgtagat gaaattgcgg + 12721 gacatttaca atttcggcat agcgaggtgt gattgtgaaa aggaaatcca ttgcccgaaa + 12781 ttatttactt aatttgataa aaacgacctt gtctattcta tttcccctga tatcataccc + 12841 atatgtgtcg cgtattttat ctgtggatgg gctgggtgca atcaattttt caacctcgtt + 12901 tgttaattat ttcgtactaa ttgcaatctt tggaattaat gtctacgctg ttagagaagg + 12961 tgccaaatat cgagatgata aaaagttact tgggaagttt gtaacggaga tgttacttgt + 13021 tagtatttgc acggcaatga tttcattctc tttattaact gtttccttac tcctacctgc + 13081 tctatcagaa tatagaagtc ttattctaat tttttcaatt accattatat ttaatgttgt + 13141 ggggatggag tggttttttc aattgatgga agactatcaa tatataacac ttcgtgcaat + 13201 tatatttcaa attctatctt tgatattttt attcatattt gtcaaaaata ggaatgatat + 13261 ttatgtgtac gctctaatta cagttgcagc aaatgcaggt tctcaaatac tgaatttatt + 13321 tagacttaga aaagaagttg aaatatttag atataaagac tataatatta gaaattattt + 13381 taaaccgatg tttctgatat ttttaacctt attgtctatg aatatgtata gatatttaga + 13441 tgttactttt ctgggcttct ttaaaaatga tcgaagtgtg ggctactata gcttagctac + 13501 aaaaataaca agtgctataa tttcaatgtt atcttctgtt acagttattt tgacacctcg + 13561 tctagcatat cattataaga aggaggagtt tgataaattc tataaaattg cttatagttc + 13621 ctttgatttg attttattac ttgctatacc agttgttata ggtgtattta gttttagttc + 13681 tattttagta gattttttgg gtgggagtac ttttgtttct tctgtgttaa cggtggagat + 13741 attaagttta acaattctat tctctaattt gaatgcttta ttaattacac ctattttaac + 13801 ggttatgaat cgtgagaaag cggttttaaa aatttttatt atcgcattga ttttcaatgt + 13861 tattacaaac atgttactta ttccagtaat ggattttaat ggttcagctt tggttacagt + 13921 tttgacagaa ggaattattt gcatattatc tttaattagt ataaaaagtg tgtttaatgt + 13981 tagaaggcta tttaagaatc tttttcaata tctggtagct agtatcttta taattgttat + 14041 caagattgtt atttctcagt acgtttcatc aaattatatt atttttattt caactgcttt + 14101 actaagcgca attttatatt tccttacttt gatattattg agaaatgagt tagtactaca + 14161 attaataata gaagttagaa agaaaatata tagatagtgg 
agttaaatat aaatgtttac + 14221 catatataga gccataaaaa aataattata attattttgt cgcttcccaa gattttttat + 14281 ataaatttta aatgccttcc gttgaatcag gcggttaaac ctcctatata tgttcatttt + 14341 aatactcgat taatgattag gggagacata aaaatcattg atactcattt atcacgtttt + 14401 actattattt tggggaaaga tggctctaat catatctctc ctcatgagag tagattattt + 14461 atgatggggg gcaattaatt ctagggagaa atattctatt atctagtgga tttaatttgt + 14521 gtatagagca aggaggtacg gttaaattag gagataatgt ctcttttaac agaaattctt + 14581 cgatcttttg taaaaaacaa attaatattg gtaaaaatag tttgtttggt tggaactgta + 14641 atttacgtga taataatgga cataggatct attatcaggg gaactgtatt aagagtgagg + 14701 gagttattgt aataggagag aattgctgga taacagcaga ctcagtcatt cttaaaaata + 14761 gtgttcttcc tttttctact gtagttgcta caggtagttt agtaaataaa gagtttaatc + 14821 agagtaacat tttgatagct ggaaggcctg ctagaattat tagagacgat ataaaatggg + 14881 aaagataaga tagtaattga ttaattaggt cgtgtaattt ttaacagaga taacgaaagg + 14941 taatgggtga agtaaatgaa aattgcagtt gcaggtacag gatatgtagg actatctatt + 15001 gcagttttaa tggctcagca tcatgaggtg gtagctgttg atattatttc tgaaaaggtc + 15061 aatctgatta ataatggaaa atctccaatt aaggatgact atattgaaga atacttagca + 15121 acaaagcccc tcaacttagt ggcaacattg gatacaaatc tagcgtacca aaatgcagat + 15181 tttgttatta tagcagctcc aacaaattat gattcagaaa agaacttttt tgatacatct + 15241 gctgtagaat cagttattga aacggtgtta gagactaatc ctaacgctgt aatggtaatt + 15301 aaaagtactg ttcctgtagg ctatactcaa tcgattcgta ataaatataa aacaagtaat + 15361 attttattta gtccagaatt tttacgtgag tcaaaggctt tatatgataa tttatatcct + 15421 agccgtataa ttgttgggct tgatatggac gatgcatatt taaaggagag agccgaaact + 15481 tttgcagaac tgctacaaga aggagctgtt aaagaggcta tagaaattct ttacatggga + 15541 tttacagagg cagaagcagt caaacttttt gcaaatacat atttagcctt acgtgtttct + 15601 tatttcaatg agttggatac ttatgcagaa gttaaagggc tagataccaa agctattatt + 15661 gaaggtattg gcttagatcc acgtatcgga agccaatata acaatccttc ttttggatat + 15721 gggggatatt gccttccaaa agatagtaaa caactattgg caaactataa agatgttcca + 15781 cagaatatga taacagctat cgttgagagc aatcgtacta 
gaaaagattt tattgcagag + 15841 cagattttga aacttgcagg agtttcaaat aatggggaaa tttacccaaa agatgtaata + 15901 ataggccttt atcggttaac tatgaagagc aactccgata attttcgtca atcttctatt + 15961 caaggtgtta tgaaacgatt gaaggcagaa ggagcaaatg tcataattta tgagccaact + 16021 cttagtgatg acgagacgtt ttttggtagt aagattgtaa atgatttgga acactttaaa + 16081 tcaattagta atgttatcgt ggcaaatcgt tatgatgatt tgcttaaaga tgtgagtgac + 16141 aaggtttata gtcgtgatat ttttaagaga gattaggtag aagttataat gtatgattat + 16201 ttaatcattg gagctggttt gtctggtgca atctttgcgc acgaagctac aaaacgtgga + 16261 aaaaaagtaa aagtgattga taaacgtgat cacatcggtg ggaacatcta ttgtgagaat + 16321 gtagaaggta tcaatgttca taaatatggt gcccatattt tccatacttc taataaaaaa + 16381 gtttgggact atatcaatca attcgctgag tttaacaact atatcaactc acctgtcgca + 16441 aactacaaag gaagtcttta caatcttcct ttcaatatga ataccttcta tgctatgtgg + 16501 ggcacaaaaa ctccacagga agtaaaagat aagattgctg agcagacagc tgatatgaag + 16561 gatgttgagc ctaaaaatct ggaagaacag gctatcaagt tgattggtcc agatatctat + 16621 gaaaagttga ttaagggtta tactgaaaag cagtgggggc gctcagcaac ggaacttcct + 16681 ccatttatca ttaagcgtct tccagttcgt ttaacatttg ataataacta ttttaacgac + 16741 cgttaccaag gaattcctat tggtggttac aatgtcatta tcgaaaacat gcttaaagac + 16801 gttgaagttg agcttggtat tgatttcttt gctcaccgtg aagagttaga agcatcagct + 16861 gaaaaagttg tcttcacagg aatgatcgac cggtattttg actacaagca cggagagtta + 16921 gaataccgta gccttcgttt tgagcatgag attttagacg aggaaaatta tcaagggaat + 16981 gctgtagtga actatacaga gcgtgagatc ccttatactc gtatcatcga acacaaacat + 17041 tttgaatatg gaatgcagcc aaagacagtt atcacgcatg aatatccagc tgactggaag + 17101 cgtggggacg agccctacta tcctattaac gatgagaaaa ataatgctat gtttgctaaa + 17161 taccaagaag aagcagcgca gaatgataaa gttatctttt gtgggcgttt agcagactat + 17221 aaatattacg atatgcatgt ggtgattgaa cgggcgcttg aggttgtgga gaaagaattt + 17281 agtaattgaa aaacaacgaa gaaaggttgc ttatatatga aaggtattat tcttgcaggt + 17341 ggttcgggga cacgattata tcctttgact cgggctgcat caaaacaact tatgccggtt + 17401 tatgataaac ccatgattta ctatcctttg tcaaccctga 
tgttgactgg aataaaggac + 17461 attttgatta tctcaacacc acaggatttg ccccgtttta aggacttgct cttggatggt + 17521 tccgaatttg ggatcaagct ttcctatgcg gaacaaccta gtcccgatgg acttgctcag + 17581 gcttttatta tcggtgaaga gtttatcggt gacgatagcg ttgccttgat tttaggtgac + 17641 aatatttacc atggtcctgg tctgagcaca atgcttcaaa aagcagccaa gaaagagaaa + 17701 ggtgcgactg tttttggcta ccaagtgaag gatccagagc gttttggtgt ggttgagttt + 17761 gatacagaca tgaatgctat ttctatcgaa gaaaagccag agcaccctcg ttcaaactat + 17821 gcagttacag gaatctattt ctatgataat gatgtagtag agattgccaa aagtataaaa + 17881 ccaagccctc gtggtgaact ggaaattaca gatgtaaaca aggcttacct aggtcgtgga + 17941 gatttatccg ttgaggttat gggacgaggc tttgcttggc tggatactgg aactcatgaa + 18001 agtttattag aggcttcgca gtacatcgaa acagtccaac ggatgcaaaa tgttcaggta + 18061 gcaaacttag aagaaattgc ctatcgcatg ggttatatca gtcgtgaaga tgtattgacc + 18121 ttagcccaac cacttaagaa aaatgaatac ggacagtatc tgctccgttt gattggagaa + 18181 gcatagatga cagataattt tttcggtaag acgcttgcgg cacgcaaggt tgaagctatt + 18241 ccaggcatgt tggagtttga tatccccgtt catggagata atcgtggctg gtttaaagaa + 18301 aatttccaaa aggaaaaaat gcttccactt ggatttccag agtctttctt tgcagaagga + 18361 aaattgcaaa acaatgtatc cttctcacgt aaaaatgtcc ttcgaggcct ccacgcagag + 18421 ccttgggata agtacatctc tgtagcagat ggagggaaag ttctgggttc ttgggttgat + 18481 ctacgcgagg gtgaaacctt tgggaatacc tatcagacag taattgatgc aagcaaggga + 18541 atctttgttc ctcgaggcgt agctaatggc ttccaagttc tatcagatac agtgtcatat + 18601 agctatctgg tcaatgatta ctgggctctc gagctcaaac ccaagtatgc ctttgtgaac + 18661 tacgctgatc caagccttgg tattgaatgg gaaaatattg cagaagcaga ggtttcagaa + 18721 gcagataaac atcatcccct acttaaggat gtaaaacctt tgaaaaaaga agatttgtaa + 18781 aaaggaaaga atatgactga atacaaaaat attatcgtga caggtggagc tggctttatc + 18841 ggttctaact ttgtccatta tgtttacgag aactttccag gtgttcacgt gacagtccta + 18901 gataagttga cttatgctgg aaatcgcgcg aatattgagg aaattttagg taatcgtgtt + 18961 gagttagttg ttggtgacat tgctgatgcg gagttggtag acaagttggc tgctcaagca + 19021 gatgctatcg ttcattatgc agcggaaagc cacaatgata 
attcgctcaa tgatccatcg + 19081 ccatttattc atactaactt catcggaacc tatactcttt tagaagctgc tcgtaagtat + 19141 gatattcgct tccaccatgt atcgacagat gaagtttatg gggatctccc tttacgcgaa + 19201 gatttgccag gtcatggtga aagaccaggt gagaaattta cggctgaaac aaaatacaac + 19261 ccaagctctc cgtactcatc aaccaaggca gcctcagatt tgattgtcaa agcctgggtg + 19321 cgttcttttg gagtcaaggc aacgatttcc aactgttcaa ataactacgg tccttatcaa + 19381 catatcgaaa aattcatccc acgtcagatt actaacatcc taagtggtat caagccaaaa + 19441 ctttacggtg aaggtaagaa cgttcgtgat tggattcata ccaatgacca ttcttcagga + 19501 gtttggacaa tcttgacaaa agggcaaatc ggtgaaacct acttgattgg ggctgatggt + 19561 gagaagaaca ataaggaagt tttggaactt atccttaagg aaatgggaca agctgcggat + 19621 gcctatgatc atgtgactga ccgtgcagga catgaccttc gctatgcgat tgatgccagc + 19681 aagctccgtg aggagttggg gtggaaacct gaatttacca actttgaagc tgggctcaag + 19741 gcaacaatca agtggtatac agataaccaa gaatggtgga aagcagaaaa agaagctgtt + 19801 gaagccaatt atgctaagac tcaggagatt attacagtat aaaaagcagg aaatagctgc + 19861 tttttattgc tatattggga agagttacat attagaaagg tctagagatg attttaatta + 19921 caggggcaaa tggccaatta ggaacggaac ttcgctattt attggatgaa cgtaatgaag + 19981 aatacgtggc agtagatgtg gctgagatgg acattaccga tgcagaaatg gttgagaaag + 20041 tttttgaaga ggtgaaaccg actttagtct accactgtgc agcctacacc gctgttgatg + 20101 cagcagagga tgaaggaaaa gagttggact tcgccatcaa tgtgacgggg acaaaaaatg + 20161 tcgcaaaagc atctgaaaag catggtgcaa ctctagttta tatttctacg gactatgtct + 20221 ttgacggtaa gaaaccagtt ggacaagagt gggaagttga tgaccgacca gatccacaga + 20281 cagaatatgg acgcactaag cgtatggggg aagagttagt tgagaagcat gtgtctaatt + 20341 tctatattat ccgtactgcc tgggtatttg gaaattatgg caaaaacttc gtttttacca + 20401 tgcaaaatct tgcgaaaact cataagactt taacagttgt aaatgaccag tacggtcgtc + 20461 cgacttggac tcgtaccttg gctgagttca tgacctacct agctgaaaat cgtaaggaat + 20521 ttggttatta tcatttgtca aatgatgcga cagaagacac aacatggtat gattttgcag + 20581 ttgaaatttt gaaagataca gatgtcgaag tcaagccagt agattccagt caatttccag + 20641 ccaaagctaa acgtccgcta aactcaacga tgagcctggc 
caaagccaaa gctactggat + 20701 ttgttattcc aacttggcaa gatgcattgc aagaatttta caaacaagaa gtgagataag + 20761 tagtagaatg attttctagt ctaataaaag aggcagataa tgaactccaa aggagcttaa + 20821 gatgtacgat tatcttgttg ttggtgctgg tctctttggc gcatagcttt ggctcagttt + 20881 ctattatcgc tcacaccatc catcagaagt ttaatctgaa ggtacccaat tatcgccatg + 20941 aagaagattg ggctaggatg ggtttaccaa tcacacgtaa ggaaatctct aattggcata + 21001 tcaaggcaag tcaatactat ttagagtccc tttataacct tttacgagaa aagttgttag + 21061 aacaacctct tcttcatgcg gatgaaacct cttatcgggt tctagagagt gatagccatc + 21121 tgacctacta ttggaccttt ttgtctggga aatcagagaa acaagggatt acgctttacc + 21181 atcatgatca gcgtcggagt ggttcggtag tgcaagaatt cctaggaaat tattctgcct + 21241 atgcgatagc agtccaaagt ttaggagcaa ggcgacgcta agcttggtaa actacgaacc + 21301 gctagaagct tatcgtcaac tggaagaagc tgaacttgtt ggatgttggg cgcatgtgag + 21361 aaggaagttt tttgaagcgc cccccaagca agcggataaa tcatcgttag gagctaaagg + 21421 tttagcttat tgtgatcagt tatttgcctt ggaaagagac tgggaggctt tgctagctga + 21481 tgaacgacta cagaaacgtc aagaagagct ccaaccccta atggaagatt tctttgcttg + 21541 gtgccggcgt cagtcagttt tatcgggttc aaaactagga agggcaattg aatacagcct + 21601 caagtataaa gaaaccttta agaccatttt aaaagacgga catctggtcc tttccaataa + 21661 tctagctgaa cgcgccatta aatcattggt tatgggacgg agtaaaagag tccagtggac + 21721 tcttttagcc taagctcagt ttaaaaaagt gagggtggtt attttctcaa agttttgaag + 21781 gagctaaagc aagagctatt attatgagct tattggaaac agctaaacgt catcaactaa + 21841 atagcgagaa atatctatcc tatcttctag aatgtcttcc aaacgaggaa actctcgtaa + 21901 acaaagaggt tttagaggcc tatttaccat ggactaaagt tgtacaagaa aagtgcaaat + 21961 aagaaatctc cagattagga actatccgtg agttctctag tctggagatt tttcaatata + 22021 cttcgttatt gggcgcttac aatgatattc atattttttg caaagatgtt gtttgaaaaa + 22081 taattttcaa aaattctgaa aattctgttg acaactttct gaaaagagtc tataatggag + 22141 agaaagtttt aaaggagaaa atgatgaaaa gttcaaaact acttgccctt gcgggcgtga + 22201 cattattggc ggcgactact ttagctgcat gctctggatc aggttcaagc gctaaaggtg + 22261 agaagacatt ctcatacatt tatgagacag accctgataa 
cctcaactat ttgacaactg + 22321 ctaaggctgc gacagcaaat attaccagta acgtggttga tggtttgcta gaaaatgatc + 22381 gctacgggaa ctttgtgccg tctatggctg aggattggtc tgtatccaag gatggattga + 22441 cttacactta tactatccgt aaggatgcaa aatggtatac ttctgaaggt gaagaatacg + 22501 cggcagtcaa agctcaagac +// + diff --git a/public/res/serotype_genbank/serotype_41F.gb b/public/res/serotype_genbank/serotype_41F.gb new file mode 100644 index 0000000..46e96b3 --- /dev/null +++ b/public/res/serotype_genbank/serotype_41F.gb @@ -0,0 +1,1046 @@ +LOCUS CR931714 22917 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 8211/40 (serotype 41f). +ACCESSION CR931714 +VERSION CR931714.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 22917) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 22917) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..22917 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="8211/40" + /db_xref="taxon:1313" + gene <1..166 + /gene="dexB" + /locus_tag="SPC41F_0001" + CDS <1..166 + /gene="dexB" + /locus_tag="SPC41F_0001" + /codon_start=2 + /transl_table=11 + /protein_id="CAI34487.1" + /db_xref="GOA:Q4JYY3" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4JYY3" + /translation="DRRFLVVANLSNDKQNFSVDGKVRSVLIENTAAKEVLEKQVLAP + WDAFCVEMTD" + gene complement(316..1721) + /gene="tnp" + /locus_tag="SPC41F_0002" + /pseudo + CDS complement(join(316..447,447..1721)) + /gene="tnp" + /locus_tag="SPC41F_0002" + /note="member of homology group 17" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1202 transposase" + misc_feature complement(720..1238) + /gene="tnp" + /locus_tag="SPC41F_0002" + /note="HMMPfam hit to PF00665, Integrase core domain, + score 2.1e-17" + /pseudo + gene 1889..3343 + /gene="wzg" + /locus_tag="SPC41F_0003" + CDS 1889..3343 + /gene="wzg" + /locus_tag="SPC41F_0003" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI34489.1" + /db_xref="GOA:Q4JYY2" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4JYY2" + /translation="MLIMSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNI + LAFRYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLLFSILVSSVSLFAVQQFVGL + TNRLNATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNT + DLTVNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKV + EAPKTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPI + ADGGNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVH + NDQEFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKL + TSTEALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRMDL + PSYAMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1889..2014 + /gene="wzg" + /locus_tag="SPC41F_0003" + /note="Signal peptide predicted for SPC1859 by SignalP 
2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 42 and 43" + misc_feature 2102..2449 + /gene="wzg" + /locus_tag="SPC41F_0003" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 8.6e-63" + misc_feature 2627..3070 + /gene="wzg" + /locus_tag="SPC41F_0003" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 5.7e-70" + gene 3345..4076 + /gene="wzh" + /locus_tag="SPC41F_0004" + CDS 3345..4076 + /gene="wzh" + /locus_tag="SPC41F_0004" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34490.1" + /db_xref="GOA:Q4JYY1" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4JYY1" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAEAYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTLDVLDKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEQDLVHVIASDMHNLDGRPPYMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 3348..3956 + /gene="wzh" + /locus_tag="SPC41F_0004" + /note="HMMPfam hit to PF02811, PHP domain, score 4.1e-38" + gene 4082..4777 + /gene="wzd" + /locus_tag="SPC41F_0005" + CDS 4082..4777 + /gene="wzd" + /locus_tag="SPC41F_0005" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34491.1" + /db_xref="GOA:Q4JYY0" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4JYY0" + /translation="MMKEQNTIEIDVFQLVKILWKRKLMILLVALVTGAGAFAYSTFI + VKPEYTSTTRIYVVNRNQEDKPGLTNQDLQAGTYLVKDYREITLSHDVLEKVATNLKL + DMPAKTLASKVQVTVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIVTVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIELLDTRVKRPEDFEDVLQI + PLLGLVPDLDKMK" + misc_feature 4082..4198 + /gene="wzd" + /locus_tag="SPC41F_0005" + /note="Signal peptide 
predicted for SPC1861 by SignalP 2.0 + HMM (Signal peptide probability 0.639) with cleavage site + probability 0.424 between residues 39 and 40" + misc_feature 4103..4519 + /gene="wzd" + /locus_tag="SPC41F_0005" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 1.1e-53" + misc_feature 4625..4702 + /gene="wzd" + /locus_tag="SPC41F_0005" + /note="PS00217 Sugar transport proteins signature 2." + gene 4787..5476 + /gene="wze" + /locus_tag="SPC41F_0006" + CDS 4787..5476 + /gene="wze" + /locus_tag="SPC41F_0006" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34492.1" + /db_xref="GOA:Q4JYX9" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4JYX9" + /translation="MPTLEISQAKLDFVKKAEEYYNALCTNLQLSGDNLRVFSITSVK + LGEGKSTTSTNIAWAFARAGYKTLLIDGDIRNSVMSGVFKARDKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRKCDASILVTEAGEITRRDIQKAKEQLEHTGKPFLGVVLNKFDTSVDKYGSY + GNYGDYGKNKK" + gene 5491..6858 + /gene="wchA" + /locus_tag="SPC41F_0007" + CDS 5491..6858 + /gene="wchA" + /locus_tag="SPC41F_0007" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI34493.1" + /db_xref="GOA:Q4JYX8" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4JYX8" + /translation="MNGKIVKYSLAIIQSFLVILLTYLLSAVREAEIVSTTAIALYIL + HYFVFYISDYGQDFFKRGYLIELIQTLKYILFFALAISISNFFLEDQFSISRRGMIYF + LTLHALLVYGLNLFIKWYWKRAYPNFKGSKKILLLTATFRVEKVLDRLIESNEVVGEL + VAVSVLDKPDFQHDCLKVVAEGEIVNFVTNEVVDEVFINLPSEKYNIGELVSQFETMG + IDVTVNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHVIAKRIIDIMGALVGLIL + CGLVSIVLVPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + 
QKRRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYIEDWTIWKDIEILLKTVKVVLM + KDGAK" + misc_feature 5491..5583 + /gene="wchA" + /locus_tag="SPC41F_0007" + /note="Signal peptide predicted for SPC1863 by SignalP 2.0 + HMM (Signal peptide probability 0.776) with cleavage site + probability 0.312 between residues 31 and 32" + misc_feature 6274..6855 + /gene="wchA" + /locus_tag="SPC41F_0007" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 9.2e-158" + gene 6845..7651 + /gene="wciB" + /locus_tag="SPC41F_0008" + CDS 6845..7651 + /gene="wciB" + /locus_tag="SPC41F_0008" + /note="member of homology group 16" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34494.1" + /db_xref="GOA:Q4JYX7" + /db_xref="UniProtKB/TrEMBL:Q4JYX7" + /translation="MERSRLIDVKIIVATHKEVKMPQDSSLYLPIHVGRDGKSDIGFI + GDNTGDNISSLNPYYCELTGLYWAWKNLDYNYLGLVHYRRYFTNKSQGYNENINMDDV + ILSRSNVEILLEKSDIIVPKKRKYYIETLYSHYAHTLNGEHLDLARKIIEQNSSEYLS + SFDKVMKQRSGYMFNMFIMKKELLDDYLPWLFSILDTMYEQMDLTDHTPFESRLFGRV + SELLFNVWLCKKGITPKEVPFMYMERVDLFEKGKSFLMAKFFGKKYGQSF" + gene 7623..8732 + /gene="wcrP" + /locus_tag="SPC41F_0009" + CDS 7623..8732 + /gene="wcrP" + /locus_tag="SPC41F_0009" + /note="member of homology group 89" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34495.1" + /db_xref="GOA:Q4JYX6" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JYX6" + /translation="MERSMDRVFEMLEKESPLFSVIVPTYKISESNLRQCIDSLLYDS + QDVEIILVDDNKNLDICGKVLDEYAEKYNNISVIHQENQGVSVARNAGMSIAVGKYLI + FVDPDDWVAENFYSQMTLAVQKNPSSDVIILAAIVDYNGKQFTNHFWHTSRSFQGTDK + DDLELQLIAKGATSYFPTEIGVGVPWAKIYRNEFVRENGLDFNPSLRRMQDNIFNMYA + FEFANEIVYIDEPIYYYRKSMDSVTNKKNDKVIYYFDLVNDEVEKFIQKFNKPKIFED + ALHIKRLIGINSYYKLYFQFATTSSEKKKMRQEFRELLEREEYANSLKQVNTAYLLPK + EKIFISILKQKHLRIFSFLQKLEKLSARLKSRHFS" + misc_feature 7680..8219 + /gene="wcrP" + /locus_tag="SPC41F_0009" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 1.6e-30" + gene 
8740..9657 + /gene="wcrQ" + /locus_tag="SPC41F_0010" + CDS 8740..9657 + /gene="wcrQ" + /locus_tag="SPC41F_0010" + /note="member of homology group 106" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34496.1" + /db_xref="GOA:Q4JYX5" + /db_xref="InterPro:IPR008441" + /db_xref="UniProtKB/TrEMBL:Q4JYX5" + /translation="MRQLTLKLVSIIYKVTKRIPISFISNLGERIYSLKDSYVFDVLS + KLGVDKESTYDLMPPDLFLNKIWICWFQGEDKAPDLVKKCINSVRKHASGYDVIILTE + DNIEEYVTLPNIVLTKYKNGLFSRTHFSDIVRLNLLAQQGGLWIDATIFMTRDLDLSI + FFKNDFVSLRTTIKSSPLFITGYWTTYFVYMPSNFKLVQYTALLLNKYIEKYDRFIDY + FLQDYIITKAIKDLNYESYMEERPVLGNQRWLLADLANKVVTSELLQQFKQDTVGIYK + VTYKSKYIRKKNGRETVYKKIVEDGECLE" + misc_feature 8791..9630 + /gene="wcrQ" + /locus_tag="SPC41F_0010" + /note="HMMPfam hit to PF05704, Capsular polysaccharide + synthesis protein, score 2.8e-47" + gene 9638..10528 + /gene="wcrR" + /locus_tag="SPC41F_0011" + CDS 9638..10528 + /gene="wcrR" + /locus_tag="SPC41F_0011" + /note="member of homology group 90" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34497.1" + /db_xref="GOA:Q4JYX4" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JYX4" + /translation="MENALNNKIGIVILNYLNWEDTLECINSLRSQSDQDFEAVIVEN + GSPNESVSRIRDYIKNDKNIHLYVVENNLGYANGNNMGILYLKNRYSINRILLTNNDV + IFDDEDYIKKLEDIKYSNTIGAIGTKIIGSDGLNQNPAYFPISFSSSIKSLLINLLAF + SKVITFIKKRFLSSWTKRANDFSNPKTDEQKYFLHGSVIFLTENYLDRFMGLYGGTFL + YYEEVILGIIFEKAGLDMLYVPDFSIYHKEDQSSLESFANDDLIRRKFLLKSIFSSFK + VHFCATNRLSILVKESIKYD" + misc_feature 9665..10165 + /gene="wcrR" + /locus_tag="SPC41F_0011" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 1.9e-13" + gene 10521..11780 + /gene="wzy" + /locus_tag="SPC41F_0012" + CDS 10521..11780 + /gene="wzy" + /locus_tag="SPC41F_0012" + /note="member of homology group 121" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI34498.1" + /db_xref="InterPro:IPR007016" + 
/db_xref="UniProtKB/TrEMBL:Q4JYX3" + /translation="MIKFNYSKLALIYQFIIIFFLGAWYKNSIQFKIFLISIDTIISL + FYLYKNNLSRSDLKKVYILITTVLVSLFLPSFMNRVSFILLILQKLYIFNHIINDIKF + EYLLSVFLQFIVLLTFCMGLEFISLGQFNPFKTFYAPRVLLDMSFKVGTPLYFLRSSL + EHPLITSIILVVTGPFLFLLEKKWLRYVCVFLNISLIFFIQKRTAYILVSIGVVCFAL + YYLKYINRRFQLNKITSVIFLMTLFIIALSFIRVQGDYVLNIIFSKFSALQDADSFSL + NNRVINAKTGLDVIFDQNVINIFIGNGYDFLPNFFEQYNVYVIRNGFYVIDNTYISFL + ADYGMIGLFLVLLYIINAIRKSMTNIYKIKSKKEQLFMLYSIIGIINLMVSIAFFDIY + AWYTPLTLLIFLISVVTSYCKFHSNKF" + gene 11822..13066 + /gene="wcrW" + /locus_tag="SPC41F_0013" + CDS 11822..13066 + /gene="wcrW" + /locus_tag="SPC41F_0013" + /note="member of homology group 122" + /codon_start=1 + /transl_table=11 + /product="conserved hypothetical protein" + /protein_id="CAI34499.1" + /db_xref="UniProtKB/TrEMBL:Q4JYX2" + /translation="MTLKNEVKNIKRTIEKNFFHKDFTSISDIKNYQIEISKNLRPRL + NLLITSMNSQDVYAGIKSAVDFFMKFKKFDIDLRIIVMGKKIDEPSLYQVPGFEFIKD + YSIENDSESRIICDLSKNRSPLFIRERDYFLSTMWYTAYNANNVLDEQKRIFGKRMPM + VYLVQDYEPGFYPWSSEYLLAESTYHLDNQLVVFNSKYLKEFFDANGYRFENSYYFDP + VLNEKLGEILNSAELSNIERKNRILFYGRPSKARNAFQLICMALEKWSVLDERSSNWE + IFSAGEDLKDIKLNNSIVIKSLGKMSVEEYAKFMLESKIGISLMASPHPSYPPLEMAT + FGMKVITNSFVTKDISDFNENIISIEHININKLAEELHFLTTSDIEYKISKNDDYING + ISQLDTIVDEIAGHLQFRHSEV" + gene 13069..14511 + /gene="wzx" + /locus_tag="SPC41F_0014" + CDS 13069..14511 + /gene="wzx" + /locus_tag="SPC41F_0014" + /note="member of homology group 123" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI34500.1" + /db_xref="GOA:Q4JYX1" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4JYX1" + /translation="MKRKSIARNYLLNLIKTTLSILFPLISYPYVSRILSVDGLGAIN + FSTSFVNYFVLIAIFGINVYAVREGAKYRDDKKLLGKFVTEMLLVSICMAMISFSLLT + ISLLLPALSEYRSLILIFSITILFNVVGMEWFFQLMEDYQYITLRAIIFQILSLLSLF + IFVKDRNDIYVYALITVAANAGSQMLNLFRLRKEVEIFRYKDYNIRHYFKPMFLIFLT + LLSMNIYRYLDVTFLGFFKNDQSVGYYSLATKITNVIISMVSSVTVILTPRLAYHYKQ + KEFDKFYKIAYSSFDFILLLAIPVVIGVLSFSSILVDFLGGSAFISSVLTVEILSLTI + 
LFSNLNALLITPILTVMNHEKAVLKIFIIALIFNVIANMFLIPVMDFNGSALVTVLTE + GIICILSLISIKNVFDVKRLFKNLFQYLVASIFIIVVKIVISQYVSSNYIIFISTALL + SAILYFFTLILLRNELVSQLIIEVRKKIYR" + misc_feature 13084..13890 + /gene="wzx" + /locus_tag="SPC41F_0014" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 1.3e-44" + gene 14527..15207 + /gene="wcrX" + /locus_tag="SPC41F_0015" + CDS 14527..15207 + /gene="wcrX" + /locus_tag="SPC41F_0015" + /note="member of homology group 124" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34501.1" + /db_xref="GOA:Q4JYX0" + /db_xref="InterPro:IPR011004" + /db_xref="UniProtKB/TrEMBL:Q4JYX0" + /translation="MFTIYRAMKKIIIIILSLPKIFYINLKCLPLNQAVKLPIYVHFN + TRLMIKGDIKIIDTHLSRFTIILGKDGSNHISPHESRLFIYDGGQLILGRNILLSSGF + NLCIEQGGTVKLGDNVSFNRNSSIFCKKQINIGKNSLFGWNCSLRDNNGHRIYYQDNC + IKSEEVIVIGENCWITADSVILKNSVLPFSTVVATGSLVNKEFNQSNILIAGRPARII + REDIKWER" + gene 15275..16495 + /gene="ugd" + /locus_tag="SPC41F_0016" + CDS 15275..16495 + /gene="ugd" + /locus_tag="SPC41F_0016" + /note="member of homology group 20" + /codon_start=1 + /transl_table=11 + /product="UDP-glucose 6-dehydrogenase Ugd" + /protein_id="CAI34502.1" + /db_xref="GOA:Q4JYW9" + /db_xref="InterPro:IPR001732" + /db_xref="InterPro:IPR008927" + /db_xref="InterPro:IPR013328" + /db_xref="InterPro:IPR014026" + /db_xref="InterPro:IPR014027" + /db_xref="InterPro:IPR014028" + /db_xref="InterPro:IPR016040" + /db_xref="InterPro:IPR017476" + /db_xref="UniProtKB/TrEMBL:Q4JYW9" + /translation="MKIAVAGTGYVGLSIAVLMAQHHEVVAVDIISEKVNLINNGKSP + IKDDYIEEYLASKPLNLVATLDTNIAYQNADFVIIAAPTNYDSEKNFFDTSAVEAVIE + TVLETNPNAVMVIKSTVPVGYTQSIRNKYKTNNILFSPEFLRESKALYDNLYPSRIIV + GLDMDDAYLKERAETFAELLQEGAIKENIEILYMGFTEAEAVKLFANTYLALRVSYFN + ELDTYAEVKGLDTKAIIEGVGLDPRIGSQYNNPSFGYGGYCLPKDSKQLLANYKDVPQ + NMITAIVESNRTRKDFIAEQILKFAGVSSNGEIHPKDVIIGLYRLTMKSNSDNFRQSS + IQGVMKRLKAEGTNVIIYEPTLSDDETFLGSKIVNDLEHFKSISNVIVANRYDDLLKD + VSDKIYSRDIFKRD" + misc_feature 15275..15829 + /gene="ugd" + 
/locus_tag="SPC41F_0016" + /note="HMMPfam hit to PF03721, UDP-glucose/GDP-mannose + dehydrogenase, score 1.8e-51" + misc_feature 15860..16141 + /gene="ugd" + /locus_tag="SPC41F_0016" + /note="HMMPfam hit to PF00984, UDP-glucose/GDP-mannose + dehydrogenase, score 1.9e-36" + misc_feature 16223..16474 + /gene="ugd" + /locus_tag="SPC41F_0016" + /note="HMMPfam hit to PF03720, UDP-glucose/GDP-mannose + dehydrogenase, score 3.1e-06" + gene 16508..17608 + /gene="glf" + /locus_tag="SPC41F_0017" + CDS 16508..17608 + /gene="glf" + /locus_tag="SPC41F_0017" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI34503.1" + /db_xref="GOA:Q4JYW8" + /db_xref="InterPro:IPR003953" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JYW8" + /translation="MYDYLIVGAGLSGAIFAHEATKCGKKVKVIDKRDHIGGNIYCEN + VEGINVHKYGAHIFHTSNKKVWDYVNQFAEFNNYINSPVANYKGSLYNLPFNMNTFYA + MWGTKTPQEVKDKIAEQTAGMKDVEPKNLEEQAIKLIGPDIYEKLIKGYTEKQWGRSA + TELPPFIIKRLPVRLTFDNNYFNDRYQGIPIGGYNVIIENMLKDVEVELGVDFFAHRE + ELEASANKVVFTGMIDQYFDYKHGELEYRSLRFEHEILDEENYQGNAVVNYTEREIPY + TRIIEHKHFEYGMQPKTVITHEYPADWKRGDEPYYPINDEKNNAMFAKYQEEAAQNDK + VIFCGRLADYKYYDMHVVIERALEVVEKEFSN" + misc_feature 16943..17545 + /gene="glf" + /locus_tag="SPC41F_0017" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 5.3e-139" + gene 17636..18505 + /gene="rmlA" + /locus_tag="SPC41F_0018" + CDS 17636..18505 + /gene="rmlA" + /locus_tag="SPC41F_0018" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI34504.1" + /db_xref="GOA:Q4JYW7" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q4JYW7" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLT + 
GIKDILIISTPQDLPRFKDLLLDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFIGDDSV + ALILGDNIYHGPGLSTMLQKAAKKEKGATVFGYQVKDPERFGVVEFDTDMNAISIEEK + PEHPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLGRGDLSVEVMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLTLAQPLKKN + EYGQYLLRLIGEA" + misc_feature 17639..18355 + /gene="rmlA" + /locus_tag="SPC41F_0018" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 1e-117" + gene 18506..19102 + /gene="rmlC" + /locus_tag="SPC41F_0019" + CDS 18506..19102 + /gene="rmlC" + /locus_tag="SPC41F_0019" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI34505.1" + /db_xref="GOA:P97005" + /db_xref="HSSP:1NZC" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:P97005" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKHHPLLKDVKPLKKEDLE" + misc_feature 18542..19072 + /gene="rmlC" + /locus_tag="SPC41F_0019" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 8.8e-16" + gene 19112..20161 + /gene="rmlB" + /locus_tag="SPC41F_0020" + CDS 19112..20161 + /gene="rmlB" + /locus_tag="SPC41F_0020" + /EC_number="4.2.1.46" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI34506.1" + /db_xref="GOA:Q4JYW5" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JYW5" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPGVHVTVLDKLTYAGN + RANIEEILGNRVELVVGGIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + 
GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQATD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 19127..20083 + /gene="rmlB" + /locus_tag="SPC41F_0020" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.00022" + misc_feature 19130..19870 + /gene="rmlB" + /locus_tag="SPC41F_0020" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 9e-74" + misc_feature 19133..19945 + /gene="rmlB" + /locus_tag="SPC41F_0020" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/iso, score 7.5e-05" + gene 20227..21078 + /gene="rmlD" + /locus_tag="SPC41F_0021" + CDS 20227..21078 + /gene="rmlD" + /locus_tag="SPC41F_0021" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI34507.1" + /db_xref="GOA:Q4JYW4" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JYW4" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITNEEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAAFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 20227..21075 + /gene="rmlD" + /locus_tag="SPC41F_0021" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 3.8e-147" + misc_feature 20230..20859 + /gene="rmlD" + /locus_tag="SPC41F_0021" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 4.8e-18" + misc_feature 20230..20811 + /gene="rmlD" + /locus_tag="SPC41F_0021" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.00018" + misc_feature 20233..20961 + /gene="rmlD" + /locus_tag="SPC41F_0021" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 1.5e-08" + gene 
order(21225..22030,22032..22325) + /gene="glf" + /locus_tag="SPC41F_0022" + /pseudo + CDS join(21225..21725,21725..22030,22032..22325) + /gene="glf" + /locus_tag="SPC41F_0022" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /pseudo + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + misc_feature join(21561..21725,21725..22030,22032..22181) + /gene="glf" + /locus_tag="SPC41F_0022" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 9.6e-104" + /pseudo + gene 22559..>22917 + /gene="aliA" + /locus_tag="SPC41F_0023" + CDS 22559..>22917 + /gene="aliA" + /locus_tag="SPC41F_0023" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34509.1" + /db_xref="GOA:Q4JYW3" + /db_xref="InterPro:IPR000914" + /db_xref="UniProtKB/TrEMBL:Q4JYW3" + /translation="MMKSSKLFALAGVTLLAATTLAACSGSGSSTKGEKTFSYIYETD + PDNLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKD + AKWYTSEGEEYAAVKAQ" + misc_feature 22559..22645 + /gene="aliA" + /locus_tag="SPC41F_0023" + /note="Signal peptide predicted for SPC1879 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.277 between residues 29 and 30" + misc_feature 22805..22873 + /gene="aliA" + /locus_tag="SPC41F_0023" + /note="PS01040 Bacterial extracellular solute-binding + proteins, family 5 signature." 
+ORIGIN + 1 cgaccgtcgc ttcctagttg tggctaactt atccaatgac aaacaaaact tttcagtaga + 61 tggaaaagtt agatctgtct tgattgaaaa cactgcggct aaagaagtac ttgaaaaaca + 121 ggtcttggcc ccatgggatg ctttctgtgt ggaaatgact gactagaatg agcaaacctc + 181 aagcttttga agcttgaggt tttttactat agtagattga aactggaata gtacacctct + 241 acttctaaaa cattgttaga aatcgatttg attgtcctga tcgatttgtc ctattcttat + 301 ttcattttac tatgcttgta gttgaggaga attaagctcc tcactagtaa actcttcata + 361 atccttttta tttttatgaa gatattgttt gaaagatgtg agtttccacg gataggtttg + 421 tggagggata tacttgcgtc tttctttttt tgttctggtt cttgttcaaa gtttttcgaa + 481 tagagttcat gatctagtag ctcctttgtg cgatagattt tgtcagcgat attgaggtag + 541 atgtctccgt caaatgcttt tataactaat gctttcgtct ttctgatgaa atagacttct + 601 ttttcttgtt cggtagggat atagtaacga ttttggaatc ggatatggtg tccactatcg + 661 gcgactctct ccgccagtct agccagaatg agattccttt cagaggggtt aggaacctcc + 721 tcgaagacag agagttttgt cttgtttcca aactgttcat taaaggtttg gatgtaggaa + 781 agcaggaagg tcttggcttc ttccaaggta tgaatcttgt ttcgttccag ttcgataggc + 841 aggcgagatt gtagtgtctg atggagtctt tcgactctcc ctttagcttg agggatagag + 901 gttgtctcca gaagaatccc cagttggtga caggcgtatc cgaattgtgt atgagtgtcg + 961 tcctccattt tcttagagtt ggagacttga taggtaaaga ctgttctttt atctgttttg + 1021 atttgaaggg gaatgccgtg attgcctaaa atttgttcga ggacatgata gtaagtattc + 1081 aaggtctctt gtttatcaaa ataagcgcct aaaaaataag cgcctaagat attgccagaa + 1141 gcatcatcaa tggctaagtg taagttagat gtttgtgctc caaaccaggc atgagggctg + 1201 gcatccattt gaatgagttc accagcaaat ttctttctgg gtctactagg atgtactttt + 1261 ttagggtctt caaggaagtt ttcagccgtc ggtaagattg gattatctag gggttgcttg + 1321 gggttcagtt tagcttgttt tcttactctc ttctttgtct ttctatgaga cttaggcgac + 1381 aggatgtttt ccttatagag tatttttcta acagttgtat cagagagctg aattccttct + 1441 tcttcagcta gcaattcaca gaaatgaagg acatttggtt tatatgtttc ataggagagg + 1501 tattttttta ggagacgttc tttgatttca tcagggattg catgttttgg ttttcgattt + 1561 ctgtttccgt gtctgaaggc ttcttttcct ttcagttgat aggctagtag cagacgattg + 1621 atttgccttt cagaaagatt gagttcggca 
caggctcgtt tctttgtttt ctttccttgg + 1681 gctatagctt ttatcacaag atattttttc atttcattca tatttagttg gatccttttc + 1741 atatgactat tctaccaaat gggacatttt cacgttcgat ttactaaaga cattatcacc + 1801 ttcgaatcac aaagatgcag atagtgaaaa taaaggtgta gacattaccg taaaaaagtg + 1861 atataatcgt aagatgttca atgtataggt gttaatcatg agtagacgtt ttaaaaaatc + 1921 acgttcacag aaagtgaagc gaagtgttaa tatagttttg ctgactattt atttattgtt + 1981 agtttgtttt ttattgttct taatctttaa gtacaatatc cttgctttta gatatcttaa + 2041 tctagtggta actgcgttag tcctactagt tgccttggta gggctactct tgattatcta + 2101 taaaaaagct gaaaaattta ctatttttct gttgctgttc tctatccttg tcagctctgt + 2161 gtcgctcttt gcagtacagc agtttgttgg actgaccaat cgtttaaatg cgacttctaa + 2221 ttactcagaa tattcaatca gtgtcgctgt tttagcagat agtgatatcg aaaatgttac + 2281 gcaactgacg agtgtgacag caccgactgg gactgataat gaaaatattc aaaaactact + 2341 agctgatatc aagtcaagtc agaataccga tttgacggtc aaccagagtt cgtcttactt + 2401 ggcagcttac aagagtttga ttgcagggga gactaaggcc attgtcctaa atagtgtctt + 2461 tgaaaatatc atcgagtcag agtatccaga ctacgcatcg aagataaaaa agatttatac + 2521 caagggattc actaaaaaag tagaagctcc taagacgtct aagaatcagt ctttcaatat + 2581 ctatgttagt ggaattgaca cctatggccc tattagttcg gtgtcgcgat cagatgtcaa + 2641 tatcctgatg actgtcaatc gagataccaa gaaaatcctc ttgaccacaa cgccacgtga + 2701 tgcctatgta ccaatcgcag atggtggaaa taatcaaaaa gataaattaa cccatgcggg + 2761 catttatgga gttgattcgt ccattcacac cttagaaaat ctctatggag tggatatcaa + 2821 ttactatgtg cgattgaact tcacttcttt cttgaaaatg attgacttat tgggaggggt + 2881 agatgttcat aatgatcaag agttttcagc tctacatggg aagttccatt tcccagtagg + 2941 gaatgtccat ctagactctg agcaggctct aggttttgtt cgtgagcgct actcactagc + 3001 agatggcgat cgtgaccgcg ggcgcaatca acaaaaggtg attgtggcta tccttcaaaa + 3061 attaacgtca accgaagcac tgaaaaatta tagtacgatc attaatagct tgcaagattc + 3121 tatccaaaca aatatgccac ttgagactat gataaatttg gtcaatgctc agttagaaag + 3181 tggagggaat tataaagtaa attctcaaga tttaaaaggg acaggtcgga tggatcttcc + 3241 ttcttatgca atgccagaca gtaacctcta tgtgatggaa atagatgata 
gtagtttagc + 3301 tgtagttaaa gcagctatac aggatgtgat ggagggtaga tgaaatgata gacatccatt + 3361 cgcatatcgt ttttgatgta gatgacggtc ccaagtcaag agaggaaagc aaggctctct + 3421 tggcagaagc ctacagacag ggggtgcgaa ccattgtctc tacctctcac cgtcgcaaag + 3481 gcatgtttga aactccggaa gagaagatag cagaaaactt tcttcaggtt cgggaaatag + 3541 ctaaggaagt ggcgagtgac ttggtcattg cttacggggc tgaaatttac tacacactag + 3601 atgttctaga taagctggaa aaaaagcgga ttccgaccct caatgatagt cgttatgcct + 3661 tgatagagtt tagtatgaac actccttatc gcgatattca tagcgccttg agcaagatct + 3721 tgatgttggg aattactcca gtcattgccc acattgagcg ctatgatgct cttgaaaata + 3781 atgaaaaacg cgttcgagaa ctgatcgata tgggctgtta cacgcaagta aatagttcac + 3841 atgtcctcaa acccaaactt tttggcgaac gttataaatt catgaaaaaa agagctcagt + 3901 attttttaga gcaggatttg gttcatgtca ttgcaagtga tatgcacaat ctagacggta + 3961 gacctcctta tatggcagaa gcatatgacc ttgttaccca aaaatacgga gaagcgaagg + 4021 ctcaggaact ttttatagac aatcctcgaa aaattgtaat ggatcaacta atttaggaga + 4081 aatgatgaaa gaacaaaaca cgatagaaat cgatgtattt caattagtta aaatcttgtg + 4141 gaaacgcaag ctaatgattt tattagtggc acttgtgaca ggtgcggggg cttttgcata + 4201 tagcactttt attgttaagc cagaatatac gagtaccacg cgaatttacg tagtgaatcg + 4261 caatcaagaa gacaagccgg ggctgacaaa tcaggatttg caggcaggaa cttatctggt + 4321 aaaagattac cgtgagatta ccctttcgca tgatgtattg gaaaaagtag cgacaaattt + 4381 gaagttggat atgccagcaa aaacgttagc cagcaaagtt caagtgactg taccagctga + 4441 cactcgtatc gtctcaatct ctgtcaagga taaacagcca gaggaagcca gtcgtatcgc + 4501 taattctcta cgagaagttg ctgcagaaaa gatcgtcact gtaacgcgag tatctgatgt + 4561 aacgacactt gaagaagcgc gaccagctac gactccctct tctccaaatg ttcgacgcaa + 4621 ttccttgttt ggttttcttg gaggagcagt cgtaacagta attgctgttc ttttgattga + 4681 gttgctcgac acccgtgtga aacgtcctga agatttcgaa gatgtactgc aaattccact + 4741 tttagggctc gttccagatt tagacaaaat gaaataggag gaagttatgc caacgttaga + 4801 aatctcacag gcaaaattgg attttgtaaa aaaggcagag gaatattata atgccttgtg + 4861 cacgaaccta cagttaagtg gagataattt aagagtattt tctatcactt ctgtgaaact + 4921 aggagaagga 
aaatcaacga cttccaccaa tatcgcttgg gcttttgcgc gtgcaggtta + 4981 caaaacgctg ctgattgatg gagatattcg caattctgtt atgtcaggtg tctttaaagc + 5041 aagggataag attacaggcc tgacagaatt tttatcagga actacagacc tatcacaagg + 5101 gctttgtgat accaatatcg aaaatctctt tgtaattcag gctggctctg tgtcaccgaa + 5161 tccgacagct cttcttcaaa gtaagaattt cagtacaatg cttgaaacct tgcgtaaata + 5221 ttttgactac atcattgtag atactgctcc tgtcggtgtc gtgattgatg cggctattat + 5281 tacgcgaaaa tgcgatgctt ctattttagt gacggaggca ggtgaaataa ctcgacggga + 5341 tattcaaaaa gcaaaagaac agttggaaca cacagggaag ccgtttttgg gagttgtgtt + 5401 gaataaattc gatacttcag tagacaaata cggttcttat ggaaattatg gagattacgg + 5461 gaaaaataaa aaataggtcg ggggatagag atgaacggaa aaatagtaaa gtattcattg + 5521 gccataatcc agagttttct tgttatttta ttgacttatc tacttagtgc tgtgagagaa + 5581 gcggagattg tttcaacaac agctattgca ctttatatcc tccattattt tgtcttttat + 5641 atcagtgatt atggacagga tttctttaaa aggggatatt tgattgaact tatccagaca + 5701 ttgaaatata tcctattctt tgcactagcg attagtatct ctaatttttt cttagaggat + 5761 caatttagta tttccagacg aggcatgatt tacttcctca cattacatgc tctcttagtc + 5821 tatgggctaa acctatttat caagtggtat tggaagcggg cttatcccaa ctttaaagga + 5881 agtaagaaga ttctcctact tacagcaact tttcgtgtcg aaaaggtact ggatagatta + 5941 atagaatcaa atgaggttgt tggggagttg gtagctgtca gtgtcttaga taaaccagat + 6001 tttcagcatg attgtttaaa ggtagtagca gagggggaga tagtaaactt tgtgactaat + 6061 gaggtggtcg atgaagtctt tatcaatctt ccaagtgaaa aatacaatat tggagagctt + 6121 gtctctcagt ttgaaacgat gggaattgat gtaacagtca atctaaatgc ttttgatcgt + 6181 agtttggcac gtaacaagca aattcgtgag atggcaggat taaacgttgt gactttttct + 6241 acaacatttt ataagactag tcatgtaatt gctaagcgga ttattgatat catgggtgca + 6301 ttggtagggc tgatactatg tggtttagtc agtattgtac tggttccttt gattcgaaag + 6361 gatgggggct ctgctatttt tgctcagacg cgtataggaa aaaatggtcg tcagttcact + 6421 ttttataagt ttcgctctat gtgtgtagat gccgaggcga aaaaaagaga actcatggaa + 6481 caaaatacca tgcagggtgg aatgtttaag gtggacgatg atcctcgtat cacgaaaatt + 6541 ggtcgtttta tacggaagac tagcttggac 
gagctaccac agttttataa tgttctaaag + 6601 ggagatatga gtttggttgg cacacgacca ccaacagtgg acgagtatga acactataca + 6661 ccagaacaaa aacgtcgtct gagttttaaa cctggcataa cagggttatg gcaggtcagt + 6721 ggacgaagtg agattaagaa ttttgatgaa gttgtcaaat tagatgtagc ctatatagaa + 6781 gattggacaa tttggaaaga tattgagatt ttattgaaga cagttaaagt tgtattgatg + 6841 aaggatggag cgaagtagat tgatagatgt aaaaatcatt gtggcaacac ataaagaggt + 6901 taaaatgcct caagacagta gtctttacct tccaatacat gttgggagag acggtaaatc + 6961 agatattggt tttatcggtg ataatactgg cgataatata tcctctttaa atccatatta + 7021 ttgtgagttg acgggacttt attgggcatg gaaaaatctt gattataatt acttaggttt + 7081 agttcattac cgtcgttatt ttacaaataa atctcaaggg tataatgaaa atatcaatat + 7141 ggatgacgtc attttgtctc gatctaatgt tgaaatatta ttagagaaat ctgacataat + 7201 agttccaaag aagcgaaagt attatattga aactctttat tcacattatg cccataccct + 7261 taacggcgaa catctggatc ttgctaggaa aattattgag caaaatagtt cagagtatct + 7321 ttcatccttt gataaagtga tgaaacaaag aagcggttat atgttcaata tgtttatcat + 7381 gaaaaaagaa ctattagatg attatttacc gtggcttttt tctattctgg atactatgta + 7441 cgaacagatg gacttgaccg accatactcc atttgagtca cgtttattcg ggcgagttag + 7501 tgagttgttg tttaatgttt ggttatgtaa aaaaggaata acgcctaaag aggtaccatt + 7561 tatgtacatg gagagagtgg atttgtttga aaaaggaaaa tcttttttaa tggctaaatt + 7621 ttttggaaag aagtatggac agagtttttg aaatgttaga aaaagaatct ccacttttta + 7681 gtgttattgt tccaacctat aagatatcag aatctaatct acgccaatgt atagactctc + 7741 tgttatatga tagtcaagat gttgagatta ttttggtaga tgacaataaa aacttggata + 7801 tatgtggaaa agtgttggac gaatatgctg aaaaatataa taatatttca gttattcatc + 7861 aagaaaacca aggtgtgtca gtcgcaagaa atgctggtat gtcaattgct gtaggaaagt + 7921 atcttatttt tgtagatccc gatgattggg ttgctgaaaa tttttatagt caaatgactc + 7981 ttgcggttca aaaaaatcct tcaagcgatg tgattatatt agctgctatt gtagactaca + 8041 atggtaaaca atttacgaat catttttggc acacctctcg ttcttttcag ggaacagata + 8101 aagatgatct ggaacttcaa ttgattgcta aaggagcaac gagttatttc ccaactgaga + 8161 taggggttgg tgttccctgg gcaaaaattt atcgtaatga gtttgtgcga 
gaaaatggct + 8221 tagattttaa tccttctctt cgccgaatgc aagataatat tttcaatatg tatgcattcg + 8281 aatttgcgaa tgaaatcgtc tacattgatg agccgattta ctattataga aagagtatgg + 8341 atagtgtaac taataagaaa aatgataaag taatttatta tttcgactta gttaatgatg + 8401 aggttgaaaa atttattcaa aaatttaata aacctaaaat atttgaagat gctctacata + 8461 taaaaagact tataggtatc aattcgtatt ataagttgta ttttcagttt gcgactactt + 8521 caagcgagaa aaagaaaatg cgacaagaat ttcgtgaact tttagaaagg gaagaatatg + 8581 caaattcgtt aaaacaagtg aatacagcct atcttctccc aaaagaaaaa atttttataa + 8641 gtattttaaa gcagaaacac ttgcgaatat tttccttttt acaaaaactt gaaaaattat + 8701 ctgcgagatt aaagagccgt cattttagtt agagggaata tgagacagtt aacattaaaa + 8761 ttagttagta tcatttataa agtaacaaaa cgaataccta tatcttttat ttctaattta + 8821 ggcgagagga tttattcact aaaggattcc tatgtttttg acgtattaag taaattggga + 8881 gtcgataaag agagcaccta tgatttgatg ccaccagatt tatttttgaa taaaatttgg + 8941 atttgctggt ttcagggtga ggataaagca ccagatttag taaaaaagtg catcaatagt + 9001 gttagaaaac atgcctcagg ctacgatgtc attattttaa cggaagataa tatagaagaa + 9061 tatgttacac ttccaaatat tgttttaaca aaatataaaa atgggttatt tagccggact + 9121 catttttcgg atatagttcg attgaatctt cttgcacaac agggagggct ttggattgat + 9181 gcaacgattt ttatgactag ggatttagat ttgtctatat ttttcaaaaa tgattttgta + 9241 agcttgagaa ctacaataaa atctagtcct ctttttatta cggggtactg gacgacatat + 9301 tttgtatata tgccctctaa ttttaaattg gttcaatata ctgctttatt attaaataaa + 9361 tacattgaga aatatgatcg ctttatagat tatttcttac aagattatat aattactaag + 9421 gcaattaaag atttgaatta tgaatcatac atggaagaac ggcctgtatt gggaaatcaa + 9481 cgttggcttt tagcagattt agctaataaa gttgtgacct cagaacttct tcaacaattt + 9541 aaacaagata cggtaggaat ttataaagtg acatataaat ccaagtatat tagaaaaaaa + 9601 aatggtaggg aaacggttta taaaaaaatt gtagaggatg gagaatgcct tgaataataa + 9661 aataggaatt gttattttaa attatcttaa ttgggaggat actttagaat gcataaatag + 9721 tttgcgctca caaagtgatc aagattttga agctgtcata gtagaaaatg gttctccaaa + 9781 tgaatctgtt tctaggatta gagattatat aaaaaatgac aagaatattc atctttatgt + 9841 agtagagaat 
aacttaggtt atgcaaatgg aaataatatg ggcatcctct acttaaaaaa + 9901 tagatactct ataaatagaa ttctattaac taataatgat gttatttttg atgatgaaga + 9961 ctacataaaa aaattagaag atattaagta tagtaatacc attggagcta ttggaacaaa + 10021 aattattggt tctgatggtt taaaccaaaa tccagcttat tttccaattt cttttagttc + 10081 tagtataaaa tcacttctta ttaacttatt ggcattttct aaagttatca cttttatcaa + 10141 aaagcgtttt ctatcttcat ggacgaaaag agctaatgac ttttcaaatc caaaaaccga + 10201 tgaacaaaaa tacttcctac atggatcagt catttttctt acggaaaatt atttagatag + 10261 gtttatggga ttgtatggag ggacttttct ttactatgaa gaagtaatcc taggtattat + 10321 atttgaaaaa gcaggtcttg atatgttgta tgtacctgac ttttcaattt accataaaga + 10381 agatcaatca tctttggaaa gttttgcaaa tgatgatttg attaggcgta aatttttatt + 10441 gaaaagcata ttctctagct ttaaggtaca tttttgtgca acgaatagac tctctatact + 10501 ggtgaaggag tcaataaagt atgattaaat ttaattattc taaattagca ttaatttacc + 10561 agtttataat aatttttttt ctgggtgctt ggtataagaa tagcattcag tttaaaattt + 10621 ttttgatatc tattgatact atcatttctt tattttattt atataaaaat aatttatcta + 10681 gaagtgactt aaaaaaagtt tatatcttga taactacagt gttagtaagc ttatttttac + 10741 catcgtttat gaatagagta tcttttatac ttctcatatt gcaaaaatta tatatattta + 10801 accatattat taatgatata aagtttgaat atttgctctc agtctttcta caatttattg + 10861 tactactaac cttttgtatg ggattagaat tcatttcatt aggacaattt aatccgttta + 10921 aaacatttta tgcaccaaga gttcttcttg atatgagttt taaagtcgga acacctttat + 10981 attttttgag atcaagttta gagcatcctc taataacttc gattatatta gtagttactg + 11041 gccctttctt attcctttta gaaaagaaat ggttgagata tgtatgtgtg tttctaaata + 11101 ttagtttaat cttttttatt cagaagagaa ctgcgtatat attggtatcg attggagttg + 11161 tatgttttgc tttgtattat ctaaaatata ttaatcgtag atttcaattg aataaaataa + 11221 cttcagtgat atttttaatg acactattta taattgcttt atcctttata agggtgcaag + 11281 gtgattatgt attaaatatt atttttagta aattttctgc tttacaagat gcagatagtt + 11341 tctcgctaaa taatcgtgta attaatgcta aaactggatt agatgtaatt ttcgatcaaa + 11401 atgttataaa tatattcatt gggaatggat atgacttttt acctaatttt tttgaacaat + 11461 acaatgtgta 
tgtaattcgg aatggttttt atgtgattga caatacatat atttcatttc + 11521 ttgccgacta tggaatgatt ggtctgttct tagtattgtt atatattata aatgcgatcc + 11581 gaaaaagtat gactaatatt tacaaaataa agagtaaaaa agaacaatta tttatgttgt + 11641 atagtattat aggtattatc aatttgatgg tatcaatagc tttttttgat atatatgctt + 11701 ggtacacgcc attaacgtta ttgatttttt taatatcagt agtgacttct tattgtaaat + 11761 ttcattccaa taagttttag tgtgtacaat cattataatt agcaaaaaga aggaaatctg + 11821 aatgactctc aaaaacgaag ttaaaaacat aaaacgaaca atagaaaaaa atttttttca + 11881 taaggatttt acatctatat ctgatattaa gaattatcag attgaaattt ctaagaatct + 11941 aaggccacgt cttaatttat taattacttc aatgaactct caggatgtat atgctggcat + 12001 caaatcagca gtggattttt ttatgaagtt caaaaaattt gatatagatt taagaatcat + 12061 tgtaatggga aaaaaaatcg atgaaccgtc tctttatcaa gttcctggtt ttgaatttat + 12121 taaagactat tcaattgaga atgatagtga gtctaggatt atttgcgatt tatctaagaa + 12181 tcgttctcca ttgtttatta gggagcgtga ttattttcta tcaacaatgt ggtacactgc + 12241 ttataatgct aacaatgtgc tggatgagca aaaaagaatt tttgggaaac ggatgcccat + 12301 ggtttatcta gttcaagact atgaaccagg tttctatcca tggtcctcag agtatctttt + 12361 ggctgagagc acatatcatc tagataacca gcttgttgtc tttaattcta agtatttaaa + 12421 agaatttttt gatgcaaatg gttatagatt tgaaaatagt tattattttg atccagtttt + 12481 aaatgaaaaa ttgggggaga ttcttaattc agcagagctt tctaatattg aaaggaaaaa + 12541 tcgtatttta ttttatggaa ggcctagtaa agctagaaat gcttttcagt taatctgtat + 12601 ggcattggaa aaatggagcg ttttggacga acgtagttca aattgggaaa ttttttctgc + 12661 aggagaagat ttaaaagata ttaaattgaa taatagcata gtaataaaat cgttagggaa + 12721 gatgtcagtt gaagaatacg caaaatttat gttggaatct aaaatcggaa tctctctaat + 12781 ggcctcaccg catcctagct atcctccgtt agaaatggct acgtttggta tgaaagtcat + 12841 aacgaattct ttcgttacaa aagatatttc tgattttaat gaaaacataa tttctattga + 12901 acatattaat attaataaat tggcggaaga attacatttt ttaacaacat ctgatataga + 12961 atataaaatt tcgaaaaacg atgattatat aaatggtatt agccagcttg atacaattgt + 13021 agatgaaatt gcgggacatt tacaatttcg gcatagcgag gtgtgattgt gaaaaggaaa + 13081 tccattgccc 
gaaattattt acttaatttg ataaaaacga ccttgtctat tctatttccc + 13141 ctgatatcat acccatatgt gtcgcgtatt ttatctgtgg atgggctggg tgcaatcaat + 13201 ttttcaacct cgtttgttaa ttatttcgta ctaattgcaa tctttggaat taatgtctac + 13261 gctgttagag aaggtgctaa atatcgagat gataaaaagt tacttgggaa gtttgtaacg + 13321 gagatgctac ttgttagtat ttgcatggca atgatttcat tctctttatt aactatttcc + 13381 ttactattac ctgctctatc agaatataga agtcttattc taattttttc aattaccatt + 13441 ctatttaatg ttgtgggaat ggagtggttt tttcaattga tggaagacta tcaatatata + 13501 acacttcgtg caattatatt tcaaatttta tctttgctat ctttattcat atttgtcaaa + 13561 gacaggaatg acatctatgt gtacgctcta attacagttg cggctaatgc aggttctcaa + 13621 atgctgaatt tatttaggct tagaaaagaa gttgaaatat ttagatataa agactataat + 13681 attagacatt attttaaacc gatgtttctg atatttttaa ccttattatc tatgaatata + 13741 tatagatatt tagatgttac ttttctgggc ttctttaaaa atgatcaaag tgtgggctac + 13801 tatagtttag ctacaaaaat aacaaatgtt ataatttcaa tggtatcttc tgttacagtt + 13861 attttgacac ctcgtctagc ataccattat aagcaaaagg agtttgataa attctataaa + 13921 attgcttata gctcctttga ttttatttta ttacttgcta taccagttgt tataggggta + 13981 ttgagtttta gttctatttt agtggatttt ttgggaggaa gtgcttttat ttcttctgtg + 14041 ctaacagtgg agatattaag tttaacaatt ctattctcta atttgaatgc tttattaatt + 14101 acacctattt taacagttat gaatcatgag aaagcggttt taaaaatttt tattatagca + 14161 ttgattttca atgttattgc aaacatgttc cttattccag taatggattt taatggttca + 14221 gctttggtta cagttttgac agaaggaatc atttgcatat tatctttaat tagtataaaa + 14281 aatgtatttg atgttaaaag attatttaag aatctttttc aatatctagt agctagtata + 14341 tttataattg ttgtcaagat tgttatttct cagtacgttt catcaaatta tattattttt + 14401 atttcaactg ctttactaag cgcaatttta tatttcttta ctttgatatt attgagaaat + 14461 gagttagtat cacaattaat aatagaagtc agaaagaaaa tatatagata atggagttaa + 14521 atataaatgt ttaccatata tagagctatg aaaaaaataa ttataatcat tttgtctctt + 14581 cccaagattt tttatataaa tttaaaatgt cttccgttga atcaggcagt taaacttcct + 14641 atatatgttc attttaatac tcgattaatg attaagggag acataaaaat cattgatact + 14701 catttatcac 
gttttactat cattttggga aaagatggct ctaatcatat ctctcctcat + 14761 gagagtagat tatttattta tgatgggggc caattaattc tagggagaaa tattctatta + 14821 tctagtggat ttaatttgtg tatagagcaa ggaggtacgg ttaaattagg agataatgtc + 14881 tcttttaaca gaaattcttc gatcttttgt aaaaaacaaa ttaatattgg taaaaatagt + 14941 ttatttggtt ggaactgtag tttacgtgat aacaatggac ataggatcta ttatcaggac + 15001 aactgtatta agagtgaaga agttattgta ataggagaga attgctggat aacagcagac + 15061 tcagtcattc ttaaaaatag tgttcttcct ttttctactg tagttgctac aggtagttta + 15121 gtaaacaaag agtttaatca gagtaacatt ttgatagctg gaaggcctgc tagaattatt + 15181 agagaggata taaaatggga aagataagat agtaattgat taactaggtc gtgtaatttt + 15241 taacagagat aacgaaaggt aatgggtgaa gtaaatgaaa attgcggttg caggtacagg + 15301 atatgtagga ctgtctattg cagttttaat ggctcaacat catgaggtgg tagctgttga + 15361 tattatttct gaaaaggtca atctgattaa taatggaaaa tctccaataa aggatgacta + 15421 tattgaagaa tatttagcat caaagcccct caacttagtg gcaacattgg atacaaatat + 15481 agcgtaccaa aatgcagatt ttgtaattat agcagctcca acaaattatg attcagaaaa + 15541 gaattttttt gatacatctg ctgtagaagc agttattgaa acggtgttag agactaatcc + 15601 taacgctgta atggtgatta aaagtactgt tcctgtaggc tatactcaat cgattcgtaa + 15661 taaatataaa acaaataata ttttatttag tccagaattt ttacgtgagt caaaggcttt + 15721 atatgataat ttatatccta gccgtataat tgttgggctt gatatggacg atgcatattt + 15781 aaaggagaga gcagaaactt ttgcagaact actacaagaa ggagctatta aagagaatat + 15841 agaaattctt tacatgggat ttacagaggc agaagcagtc aaactttttg caaatacata + 15901 tttagccttg cgagtttctt atttcaatga gttggatact tatgcagaag ttaaagggtt + 15961 agatactaaa gctattattg aaggtgttgg cttagatcca cgtatcggaa gccaatataa + 16021 caatccttct tttggatatg ggggatattg ccttccaaaa gatagtaaac aactattggc + 16081 aaactataaa gatgttccac agaatatgat aacagctatc gttgagagca accgtactag + 16141 aaaagatttt attgcagagc agattttgaa atttgcagga gtttcaagta atggggaaat + 16201 tcatccaaaa gatgtaataa taggacttta tcggttgact atgaagagta attccgataa + 16261 ttttcgtcaa tcttctattc aaggtgttat gaaacgattg aaggcagaag gcacaaatgt + 16321 tataatttat 
gagccaactc ttagtgatga tgagacattt ttgggtagta agattgtaaa + 16381 tgatttggag cactttaaat caattagtaa tgttatcgtg gcaaatcgtt atgatgattt + 16441 gcttaaagat gtgagtgaca agatttatag tcgtgatatt tttaagagag attaggtaga + 16501 agttataatg tatgattatt taatcgttgg agctggtttg tctggagcta tttttgctca + 16561 cgaagctaca aaatgtggaa aaaaagtaaa agtgattgat aaacgcgatc acattggagg + 16621 gaacatatac tgtgagaatg tagaaggtat caatgttcat aaatatggtg cccatatctt + 16681 ccatacttct aataaaaaag tctgggacta cgtcaatcaa tttgctgagt ttaacaacta + 16741 tatcaactca cctgtcgcaa actataaggg aagtctttat aaccttcctt tcaatatgaa + 16801 taccttctat gctatgtggg gcacaaaaac tccacaagaa gtgaaggata agattgctga + 16861 gcagacagct ggtatgaagg atgttgagcc gaaaaatctg gaagaacaag ctatcaagtt + 16921 gattggtccg gatatctatg aaaagttgat caagggttat acagaaaagc aatggggacg + 16981 ctcagcgaca gaacttcctc catttatcat aaaacgcctt ccagttcgtt taacctttga + 17041 taataactat tttaatgacc gttaccaagg gattcctatt ggtggttaca atgtcatcat + 17101 cgaaaatatg ctgaaagatg tagaagttga acttggagta gacttttttg ctcatcgtga + 17161 agagttggaa gcatctgcta acaaagttgt cttcacagga atgatcgacc aatattttga + 17221 ctacaagcac ggagagttag aataccgtag ccttcgtttt gagcatgaga ttttagacga + 17281 ggaaaattat caagggaatg ctgtagtgaa ctatacagag cgtgagatcc cttatactcg + 17341 tatcatcgaa cacaaacatt ttgaatatgg aatgcagcca aagacagtta tcacgcatga + 17401 atatccagct gactggaagc gtggggacga gccctactat cctattaacg atgagaaaaa + 17461 taatgctatg tttgctaaat accaagaaga agcagcgcag aatgataaag ttatcttttg + 17521 tgggcgttta gcagactata aatattacga tatgcatgtg gtgattgaac gggcgcttga + 17581 ggttgtggag aaagaattta gtaattgaaa aacaacgaag aaaggttgct tatatatgaa + 17641 aggtattatt cttgcaggtg gttcggggac acgattatat cctttgactc gggctgcatc + 17701 aaaacaactt atgccggttt atgataaacc catgatttac tatcctttgt caaccctgat + 17761 gttgactgga ataaaggaca ttttgattat ctcaacacca caggatttgc cccgttttaa + 17821 ggacttgctc ttggatggtt ccgaatttgg gatcaagctt tcctatgcgg aacaacctag + 17881 tcccgatgga cttgctcagg cttttattat cggtgaagag tttatcggtg acgatagcgt + 17941 tgccttgatt 
ttaggtgaca atatctacca tggtcctggt ctgagcacaa tgcttcaaaa + 18001 agcagccaag aaagagaaag gtgcgactgt ttttggctac caagtgaagg atccagagcg + 18061 ttttggtgtg gttgagtttg atacagacat gaatgctatt tctatcgaag aaaagccaga + 18121 gcaccctcgt tcaaactatg cagttacagg actctatttc tatgataatg atgtagtaga + 18181 gattgccaaa agtataaaac caagccctcg tggtgaactg gaaattacag atgtaaacaa + 18241 ggcttaccta ggtcgtggag atttatccgt tgaggttatg ggacgaggct ttgcttggct + 18301 ggatactgga actcatgaaa gtttattaga ggcttcgcag tacatcgaaa cagtccaacg + 18361 gatgcaaaat gttcaggtag caaacttaga agaaattgcc tatcgcatgg gttatatcag + 18421 tcgtgaagat gtattgacct tagcccaacc acttaagaaa aatgaatacg gacagtatct + 18481 gctccgtttg attggagaag catagatgac agataatttt ttcggtaaga cgcttgcggc + 18541 acgcaaggtt gaagctattc caggcatgtt ggagtttgat atccccgttc atggagataa + 18601 tcgtggctgg tttaaagaaa atttccaaaa ggaaaaaatg cttccacttg gatttccaga + 18661 gtctttcttt gcagaaggaa aattgcaaaa caatgtatcc ttctcacgta aaaatgtcct + 18721 tcgagggctc cacgcagagc cttgggataa gtacatctct gtagcagatg gagggaaagt + 18781 tctgggttct tgggttgatc tacgcgaggg tgaaaccttt gggaatacct atcagacagt + 18841 aattgatgca agcaagggaa tctttgttcc tcgaggcgta gctaatggct tccaagttct + 18901 atcagataca gtgtcatata gctatctggt caatgattac tgggctctcg agctcaaacc + 18961 caagtatgcc tttgtgaact acgctgatcc aagccttggt attgaatggg aaaatattgc + 19021 agaagcagag gtttcagaag cagataaaca tcatccccta cttaaggatg taaaaccttt + 19081 gaaaaaagaa gatttggaat aaggaaagaa tatgactgaa tacaaaaata ttatcgtgac + 19141 aggtggagct ggctttatcg gttctaactt tgtccattat gtttacgaga actttccagg + 19201 tgttcacgtg acagtcctag ataagttgac ttatgctgga aatcgcgcga atattgagga + 19261 aattttaggt aatcgtgttg agttagttgt tggtggcatt gctgatgcgg agttggtaga + 19321 caagttggct gctcaagcag atgctatcgt tcattatgca gcggaaagcc acaatgataa + 19381 ttcgctcaat gatccatcgc catttattca tactaacttc atcggaacct atactctttt + 19441 agaagctgct cgtaagtatg atattcgctt ccaccatgta tcgacagatg aagtttatgg + 19501 ggatctccct ttacgcgaag atttgccagg tcatggtgaa ggaccaggtg agaaatttac + 19561 tgctgaaaca 
aaatacaacc caagctctcc gtactcatca accaaggcag cctcagattt + 19621 gattgtcaaa gcctgggtgc gttcttttgg agtcaaggca acgatttcca actgttcaaa + 19681 taactacggt ccttatcaac atatcgaaaa attcatccca cgtcagatta ctaacatcct + 19741 aagtggaatt aagccaaaac tttacggtga aggtaagaat gttcgtgact ggattcatac + 19801 caatgaccat tcttcaggag tttggacaat cttgacaaaa gggcaaatcg gtgaaaccta + 19861 cttgattggg gctgatggtg agaagaacaa taaggaagtt ttggaactta tccttaagga + 19921 aatgggacaa gctacggatg cctatgatca tgtgactgac cgtgcaggac atgaccttcg + 19981 ctatgcgatt gatgccagca agctccgtga tgagttgggg tggaaacctg aatttaccaa + 20041 ctttgaagct gggctcaagg caacaatcaa gtggtataca gataaccaag aatggtggaa + 20101 agcagaaaaa gaagctgttg aagccaatta tgctaagact caggagatta ttacagtata + 20161 aaaagcagct atttcctgct ttttattgct atattgggaa gagttacata ttagaaaggt + 20221 ctagagatga ttttaattac aggggcaaat ggccaattag gaacggaact tcgctattta + 20281 ttggatgaac gtaatgaaga atacgtggca gtagatgtgg ctgagatgga cattaccaat + 20341 gaagaaatgg ttgagaaagt ttttgaagag gtgaaaccga ctttagtcta ccattgtgca + 20401 gcctacaccg ctgttgatgc agcagaggat gaaggaaaag agttggactt cgccatcaat + 20461 gtgacgggga caaaaaatgt cgcaaaagca tctgaaaagc atggtgcaac tctagtttat + 20521 atttctacgg actatgtctt tgacggtaag aaaccagttg gacaagagtg ggaagttgat + 20581 gaccgaccag atccacagac agaatatgga cgcactaagc gtatggggga agagttagtt + 20641 gagaagcatg tgtctaattt ctatattatc cgtactgcct gggtatttgg aaattatggc + 20701 aaaaacttcg tttttaccat gcaaaatctt gcgaaaactc ataagacttt aacagttgta + 20761 aatgaccagt acggtcgtcc gacttggact cgtaccttgg ctgcgttcat gacctaccta + 20821 gctgaaaatc gtaaggaatt tggttattat catttgtcaa atgatgcgac agaagacaca + 20881 acatggtatg attttgcagt tgaaattttg aaagatacag atgtcgaagt caagccagta + 20941 gattccagtc aatttccagc caaagctaaa cgtccgctaa actcaacgat gagcctggcc + 21001 aaagccaaag ctactggatt tgttattcca acttggcaag atgcattgca agaattttac + 21061 aaacaagaag tgagataagt agtagaatga ttttctagtc taataaaaga ggcagagaat + 21121 gaactccaaa ggagcttaag atgtacgatt atcttgttgt tggtgcagtc tttgcccatg + 21181 aagcagtctt 
aaaaggaaaa aaagtaaaag ttattgaaaa atgaaatcat atcgcgggta + 21241 atatctatac tcgtgaagag gaaggaattc aagttcatca atatggtgct catatcttcc + 21301 atacttctga taaggagatc tgggattatg taaatcagtt tgcagagttt aaccgttata + 21361 ccaattctcc tgttgcaaac tataagggag agatttataa cttacctttt aatatgaata + 21421 ccttcaataa actctgggga gttgtgacgc cagcagaagc acaagctaag attgatgaac + 21481 aacgtgctat tttaaatggt aaaactcctg aaaatttgga agaacaggcg atttctcttg + 21541 taggtacaga catctacgaa aaattaatca aagactatac agagaaacag tggggcaaac + 21601 caactactga acttccatcc tttattattc gccgtttacc agtacacctg acctatgata + 21661 acaactattt taacgatacc tatcaaggga ttccaattgg tggatacact caaatagttg + 21721 aaaaatgttg gatcatgaaa atattgatgt agaaacaaat gttgatttct ttgtgaacaa + 21781 agagcaatat ctgaaagatt ttcctaagat tgtctttact ggtatgattg atgaattctt + 21841 tgactataag ttgggcgaac tagagtaccg tagtcttcgt tttgaaaatg agaccttgga + 21901 tatggaaaat taccaaggaa atgcagttgt gaactatacg gatgcagaaa ccccatatac + 21961 tcgcattatt gaacacaaac attttgagtt tgggagtcaa gcaaagacta tcattactaa + 22021 tagaacattc taaaacatgg gaaaaaggtg atgagcctta ttatccagtt aataatgatc + 22081 gtaataatga tcgtaataat catttgtata aatcatataa aaaacttgct gatgagcaag + 22141 ggaatgttat ctttggtggc cgcttaggac actatcgtta ttacgatatg caccaagtaa + 22201 ttggagcagc tttgcagtgc gtgagaaatg agttagattc atactcaatg aaaattaaag + 22261 agcaaactag gaagctagcc gcaggttgct caaaacactg ttttgaggtt gcagatggaa + 22321 gctgacgcgg tttgaagaga ttttcgaaga gtataaacaa gtaaaactga ctaccagtta + 22381 ttatttagaa atagtattaa aaattccttg actatatgat atagttgagg gatttttaaa + 22441 tgatattcat attttttgca aagatgttgt ttgaaaaata attttcaaaa attctgaaaa + 22501 ttctgttgac aactttctga aaagagtcta taatggagag aaagtttaaa aggagaaaat + 22561 gatgaaaagt tcaaaactat ttgcccttgc gggcgtgaca ttattggcgg cgactacttt + 22621 agctgcatgc tctggatcag gttcaagcac taaaggtgag aagacattct catacattta + 22681 tgagacagac cctgataacc tcaactattt gacaactgct aaggctgcga cagcaaatat + 22741 taccagtaac gtggttgatg gtttgctaga aaatgatcgc tacgggaact ttgtgccgtc + 22801 tatggctgag 
gattggtctg tatccaagga tggattgact tacacttata ctatccgtaa + 22861 ggatgcaaaa tggtatactt ctgaagggga agaatacgcg gcagtcaaag ctcaaga +// + diff --git a/public/res/serotype_genbank/serotype_42.gb b/public/res/serotype_genbank/serotype_42.gb new file mode 100644 index 0000000..0ab2f64 --- /dev/null +++ b/public/res/serotype_genbank/serotype_42.gb @@ -0,0 +1,880 @@ +LOCUS CR931715 19403 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 198/71 (serotype 42). +ACCESSION CR931715 +VERSION CR931715.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 19403) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 19403) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..19403 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="198/71" + /db_xref="taxon:1313" + gene <1..33 + /gene="dexB" + /locus_tag="SPC42_0001" + CDS <1..33 + /gene="dexB" + /locus_tag="SPC42_0001" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34510.1" + /db_xref="UniProtKB/TrEMBL:Q4JZU9" + /translation="PWDAFCVELL" + gene 192..360 + /gene="aliB" + /locus_tag="SPC42_0002" + /pseudo + CDS 192..360 + /gene="aliB" + /locus_tag="SPC42_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(order(378..893,895..1221)) + /gene="tnp" + /locus_tag="SPC42_0003" + /pseudo + CDS complement(join(378..893,895..1221)) + /gene="tnp" + /locus_tag="SPC42_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(join(831..893,895..1203)) + /gene="tnp" + /locus_tag="SPC42_0003" + /note="HMMPfam hit to PF01710, Transposase, score 1.4e-21" + /pseudo + gene 1428..2882 + /gene="wzg" + /locus_tag="SPC42_0004" + CDS 1428..2882 + /gene="wzg" + /locus_tag="SPC42_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI34513.1" + /db_xref="GOA:Q4JYW1" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4JYW1" + /translation="MLIMSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNI + LAFRYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLLFSILVSSVSLFAVQQFVGL + TNRLNATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNT + DLTVNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKV + EAPKTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPI + ADGGNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGIDVY + NDQEFTAHTNGKYYPAGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKL + TSTEALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDL + 
PSYAMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1428..1553 + /gene="wzg" + /locus_tag="SPC42_0004" + /note="Signal peptide predicted for SPC1883 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 42 and 43" + misc_feature 1641..1988 + /gene="wzg" + /locus_tag="SPC42_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 8.6e-63" + misc_feature 2166..2609 + /gene="wzg" + /locus_tag="SPC42_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 2.5e-69" + gene 2884..3615 + /gene="wzh" + /locus_tag="SPC42_0005" + CDS 2884..3615 + /gene="wzh" + /locus_tag="SPC42_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34514.1" + /db_xref="GOA:Q4JYW0" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4JYW0" + /translation="MIDIHSHIVFDVDDGPKSREESKALLTESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGEPDKFMKKRAQYFLERDLVHVIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 2887..3495 + /gene="wzh" + /locus_tag="SPC42_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 1.6e-37" + gene 3621..4316 + /gene="wzd" + /locus_tag="SPC42_0006" + CDS 3621..4316 + /gene="wzd" + /locus_tag="SPC42_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34515.1" + /db_xref="GOA:O86887" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:O86887" + /translation="MMKEQNTIEIDVFQLFKTLWKRKLMILIVALVTGAGAFAYSTFI + VKPEYTSTTRIYVVNRNQGDKPGLTNQDLQAGSYLVKDYREIILSQDALEKVATNLKL + DMPAKTLASKVQVTVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDV + 
TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIELLDTRVKRPEDVEDVLKI + PLLGLVPDFDKIK" + misc_feature 3621..3737 + /gene="wzd" + /locus_tag="SPC42_0006" + /note="Signal peptide predicted for SPC1885 by SignalP 2.0 + HMM (Signal peptide probability 0.625) with cleavage site + probability 0.411 between residues 39 and 40" + misc_feature 3642..4058 + /gene="wzd" + /locus_tag="SPC42_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 3.1e-55" + misc_feature 4164..4241 + /gene="wzd" + /locus_tag="SPC42_0006" + /note="PS00217 Sugar transport proteins signature 2." + gene 4326..5015 + /gene="wze" + /locus_tag="SPC42_0007" + CDS 4326..5015 + /gene="wze" + /locus_tag="SPC42_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34516.1" + /db_xref="GOA:Q4JZK1" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4JZK1" + /translation="MPTLEISQAKLDSVKKAEEYYNALCTNLQLSGDGLKVFSITSVK + IGEGKSTTSANIAWAFARAGYKTLLIDGDIRNSVMLGVFKARNKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFTTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRNCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGIVLNKFDTSVDKYGSY + GNYGDYGKNKK" + gene 5030..6397 + /gene="wchA" + /locus_tag="SPC42_0008" + CDS 5030..6397 + /gene="wchA" + /locus_tag="SPC42_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI34517.1" + /db_xref="GOA:Q4JYV7" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4JYV7" + /translation="MNGKILRSSLAIIQSFLVILLTYLLSAVRETEIVSTTAIALYIL + HYFVFYISDYGQDFFKRRYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYF + LTLHALLVYVLNLFIKWYWKRAYLNFKGSKKILLLTATSRVEKVLDRLIESNEVVGKL + VAVSVLDKPDFQHDCLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + IDVTVNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHIMAKRIIDIMGALVGLIL + 
CGLVSIVLVPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVLM + KDGAK" + misc_feature 5030..5116 + /gene="wchA" + /locus_tag="SPC42_0008" + /note="Signal peptide predicted for SPC1887 by SignalP 2.0 + HMM (Signal peptide probability 0.844) with cleavage site + probability 0.429 between residues 29 and 30" + misc_feature 5813..6394 + /gene="wchA" + /locus_tag="SPC42_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 4.8e-158" + gene 6384..7190 + /gene="wciB" + /locus_tag="SPC42_0009" + CDS 6384..7190 + /gene="wciB" + /locus_tag="SPC42_0009" + /note="member of homology group 16" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34518.1" + /db_xref="GOA:Q4JZB6" + /db_xref="UniProtKB/TrEMBL:Q4JZB6" + /translation="MERSRLIDVKIIVATHKEVKMPQDNSLYLPIHVGRDGKSDIGFI + GDNTGDNISSLNPYYCELTGLYWAWKNLDYNYLGLVHYRRYFTNKSQGYNENVNMDDV + ILSRSNVEILLEKSDVIVPKKRKYYIETLYSHYAHTLNGEHLDLARKIIEQNSSEYLS + SFDKVMKQRSGYMFNMFIMKKGLLDDYLPWLFSILDTMYEQMDLTDYTSFESRLFGRV + SELLFNVWLCKKGITPKEVPFMYMERVDLFEKGKSFLMAKFFGKKYGQSF" + gene 7199..8392 + /gene="wzy" + /locus_tag="SPC42_0010" + CDS 7199..8392 + /gene="wzy" + /locus_tag="SPC42_0010" + /note="member of homology group 45" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI34519.1" + /db_xref="UniProtKB/TrEMBL:Q4JYV5" + /translation="MKITIKRYSLPEILGLAALAIFLLFSLLSITLYAQYISIKVYFI + ALFGIILLIFLKELISESYNLKSVIGLFVIFTLCFIIGTVTNYAYFFILGLFLIYSLR + NLPFSDVAKVSFIISISVLLLVVLSSKLGIIPDYIEISPTRVRHYLGFRYSLLPSTLM + MNIIAISFFLKQENASYPRLLVLFLLSGWLYVETDSRLTFINSCLFLLVNLIMKLSPS + IIEKVGRLLKLFSFTYFINACLSYWIAKTYLNTSNVVLNQFFYQADQFLGGRIYYSNR + SLSLYGYKLLGQKIDWIGNGLSIQGERSTETYLYVDNLYIQILQHFGLIVSVIILSLL + TITLVKLLKKGQMVLGIILVILSFHALIDDLILNLYYNIFWVLIGMLIYKKYQFYDKK + QLTIE" + misc_feature 7199..7300 + /gene="wzy" + 
/locus_tag="SPC42_0010" + /note="Signal peptide predicted for SPC1889 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.778 between residues 34 and 35" + gene 8547..9542 + /gene="wcrI" + /locus_tag="SPC42_0011" + CDS 8547..9542 + /gene="wcrI" + /locus_tag="SPC42_0011" + /note="member of homology group 128" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34520.1" + /db_xref="GOA:Q4JYV4" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JYV4" + /translation="MNKINLTDNLPLISVVLPVYNVENYLEKCLNSVVRQTYKNIEII + IVNDGSLDSSIDICNKYANKDSRIKVFTKPNGGLSDARNFGVKKSMGEFITFVDSDDY + VTDDYVEYLYSLVKKYNCKMSMCSIFVHYISNDKMINNGTGRELMMTAERCIEKMCYH + DEVDTCAYAKLYHRSLFSEICFPKGRIFEDIGTIYRFFGTAGQIACGFNAKYYYEIRE + NSIVTSSFSEKKFDLLFMTDQMRNFVDQRYPSLKAATKRRAVYARFSTLNQLLDVQGY + NEEKKEIIRFIQDNKEALLENPKTPKRDRLAVRALSLGFCIYKLLWKQYLKIQRG" + misc_feature 8586..9089 + /gene="wcrI" + /locus_tag="SPC42_0011" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 6.1e-48" + gene 9544..10695 + /gene="wcrJ" + /locus_tag="SPC42_0012" + CDS 9544..10695 + /gene="wcrJ" + /locus_tag="SPC42_0012" + /note="member of homology group 129" + /codon_start=1 + /transl_table=11 + /product="putative glycerol phosphotransferase" + /protein_id="CAI34521.1" + /db_xref="GOA:Q4JYV3" + /db_xref="InterPro:IPR007554" + /db_xref="UniProtKB/TrEMBL:Q4JYV3" + /translation="MNKEFLKYIYIRLLRNLRRIFFIIPIIRNRVVFESFSGDAYSCN + PKYISEELRKQYGDSVEIIWAFNDPNKFKKELPKEIVTCRYRSFNHLIYRITSKVYVC + NFLQAIEIPKRKGQLEIQTWHGGGCYKKVGVAEKGRQAAYVKRQRMHVEETDLFITSS + KYFENEVVKKQFGYKGEILSIGMPRNDILINLPISSQVEKLKEKLGLPNNKLIALYAP + TWRSGTKQYETLDIKKLTQAVDKKFGKKCIVLFRSHLYGNQSYDDVVDVSQYSDMQEL + LLLSDILITDYSSSMWDFSLSFKPCFLYTPDLKDYLDERGFDEDIHSWGFSVSESNKE + LVENILQFDNEEYRQKMKNHHQFLESYEQGDAAKRVVAKIAEYCNLYRG" + misc_feature 10144..10671 + /gene="wcrJ" + /locus_tag="SPC42_0012" + /note="HMMPfam hit to PF04464, + CDP-Glycerol:Poly(glycerophosphate) gl, score 5.1e-37" 
+ gene 10699..11604 + /gene="wcrK" + /locus_tag="SPC42_0013" + CDS 10699..11604 + /gene="wcrK" + /locus_tag="SPC42_0013" + /note="member of homology group 130" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34522.1" + /db_xref="GOA:Q4JYV2" + /db_xref="InterPro:IPR008441" + /db_xref="UniProtKB/TrEMBL:Q4JYV2" + /translation="MKKIAYLIKRYGVKNVVLRAINDVLPVNLIFPSQQLRRLNWQEK + VKKKLKKYVVISDSIKSEEECDIIWWLWFQGLDNAPAIVKKCRESVDKYAKRSGKRVI + ELTSQNLFEYIEVPNELYVKYKSGSLPLALFSDFCRISLLSNYGGLWIDSTVLITGEI + EDEILNQDIFMFQASPLDYSVTKISNWMLYSKYPGHPFISSIRDTLISFYNKNNTIPD + YFLFHLLVSCLIDDNRINQSFYDMDYYTNTYPHLLGRVLSEPYDTLKFENILRKTSIH + KLSYKNLDNVAEDSFYNAILGLDFS" + misc_feature 10753..11583 + /gene="wcrK" + /locus_tag="SPC42_0013" + /note="HMMPfam hit to PF05704, Capsular polysaccharide + synthesis protein, score 4.7e-51" + gene 11622..12338 + /gene="mnp1" + /locus_tag="SPC42_0014" + CDS 11622..12338 + /gene="mnp1" + /locus_tag="SPC42_0014" + /note="member of homology group 131" + /codon_start=1 + /transl_table=11 + /product="putative IspD-family transferase (mannitol)" + /protein_id="CAI34523.1" + /db_xref="GOA:Q4JYV1" + /db_xref="InterPro:IPR001228" + /db_xref="InterPro:IPR018294" + /db_xref="UniProtKB/TrEMBL:Q4JYV1" + /translation="MNLAVIFAGGSGTRMNAKDRPKQFLLVHGKPIIVHTIELFENHP + EIDGIIVVCIEDWIPYMEEMKYCYRLDKIAKIVPGGATGQLSIYNGLVAAEQLYGIED + NVVLIHDGVRPLITADTISDNIQSVKEKGNAITCTVAKETVILVDDENKVDEVPSREH + SRFAKAPQSFWLKDILGAHRASVDNGRNNFIDSCTMMRYYGHDLHVVVGPYENIKITT + PDDFYTFRALYDLRENKQLK" + misc_feature 11628..12320 + /gene="mnp1" + /locus_tag="SPC42_0014" + /note="HMMPfam hit to PF01128, Uncharacterized protein + family UPF000, score 3.9e-23" + misc_feature 11628..12317 + /gene="mnp1" + /locus_tag="SPC42_0014" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 6.5e-05" + gene 12349..13419 + /gene="wcrH" + /locus_tag="SPC42_0015" + CDS 12349..13419 + /gene="wcrH" + /locus_tag="SPC42_0015" + /note="member of homology group 51" + 
/codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34524.1" + /db_xref="GOA:Q4JYV0" + /db_xref="InterPro:IPR016503" + /db_xref="UniProtKB/TrEMBL:Q4JYV0" + /translation="MKYFVEETLLDEQDKKNAGGKARQDVTDILESIGYQKLIAESEM + NERQELNAVQRLVHHYKVKKMWKKTLSVVGKGDEVIIQFPLLNHSLFFNQVIKQLSKN + GVKVYFLIHDLESLRWSQSKSISLKSRIRLNIEEHSVLRLSEGIIAHNKKMKSYIKTY + SVESSKIIPLETFDYIIPSYHERKNLDNFQLNAPIVIAGNLKQHKAGYVYHLPSNVEF + NLYGIGYEQTDDKSVHYCGSFMPEELPFVLKGSFGLVWDGPSSESCIETYGEYLRVNN + PHKTSLYLASGIPVVVWSEAAIASFIKENNCGILVSNLSELPELLSMITVDEYELMKK + NTEIIGERLRQGFYTKQAVKGF" + gene 13435..14514 + /gene="mnp2" + /locus_tag="SPC42_0016" + CDS 13435..14514 + /gene="mnp2" + /locus_tag="SPC42_0016" + /note="member of homology group 132" + /codon_start=1 + /transl_table=11 + /product="putative dehydratase/epimerase (mannitol)" + /protein_id="CAI34525.1" + /db_xref="GOA:Q4JZA9" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JZA9" + /translation="MIESFNDKVLQEDLEIIAKEELPFRKFRNSTVFITGVTGLVGLQ + LFKALACINRVHQLNMKIIGLVRNLDKAEKIFGDLLKRKDIQIVLGDVSEDFHSYIPD + GLVIDYIIHGASVTTSKLMIEFPVDTIRVAFNGTYQMLELAKEKKVKSFVYLSSMEVY + GSFQSDRTTVVNENMLGYLDLTSVRTNYPECKRICENMCIAFLSQYQVPAKIARLSQT + FGAGTLPGENRVFAQFARSVMQGKDIVLHTLGQSEGNYCYTADTVVALLTILLRGENG + EAYNIANEESHTTIADMAKMVTSQFSQTSQVVFDIPKKNIFGYAVDTKMKLSTHKIQQ + LGWKPRVSLVDAYDRMMRSMNETGV" + misc_feature 13528..14280 + /gene="mnp2" + /locus_tag="SPC42_0016" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 9.2e-23" + misc_feature 13531..14373 + /gene="mnp2" + /locus_tag="SPC42_0016" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/iso, score 0.00013" + gene 14523..15938 + /gene="wzx" + /locus_tag="SPC42_0017" + CDS 14523..15938 + /gene="wzx" + /locus_tag="SPC42_0017" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI34526.1" + /db_xref="GOA:Q4JZA8" + 
/db_xref="InterPro:IPR002528" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4JZA8" + /translation="MKVLKNYLYNLSYQLLVIILPIITTPYVTRIFSSDDLGTYGYFN + SIVTYFILLATLGIANYGTKEISGNRKSIQKNFWGIYTLQFGATTFSIFLYILACLFI + PGMKNLVAYILGLGLVSKGLDISWLFQGLEDFRKITVRNITVKLVGVSAIFLFVKSAS + DLYLYVFLLTAFELLGQLSMWFPAREYIGKPHFDIEYARHHLKPVILLFLPQIAISLY + VTLDRTMLGALASTKDVGIYDQALKLVNILLTLVTSLGSVMLPRVAHLLATGDHKVVN + KMHEVSFLIYNLVIFPIMAGMLIVNDDFVQFFLGQDFQDARYAISIMIFRMFFIGWTN + IMGIQILIPHNQNKEFMISTTTPAIISVGLNLLFLPKLGYIGAAIVSVLTEALVWAIQ + LFYTRRYLKEVPIIGSMSKIILASAIMYGLLLSSKTVIHFSPTLNVLAFVALGGIIYL + FAILSLKVVDVKELKQIIRKN" + misc_feature 14529..15323 + /gene="wzx" + /locus_tag="SPC42_0017" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 1.5e-65" + gene 15940..16938 + /gene="wciG" + /locus_tag="SPC42_0018" + CDS 15940..16938 + /gene="wciG" + /locus_tag="SPC42_0018" + /note="member of homology group 21" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI34527.1" + /db_xref="GOA:Q4JYU7" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q4JYU7" + /translation="MRKNRNINLDLLKVLACVGVVLLHTTMGGFKETGSWNLLAYLYY + LGTYSIPLFFMINGYLLLGKREITYLYILQKVKWILITVSSWSFIVWLFKRDFTTNPI + KKIVGSLIQRGYFFQFWFFGALILIYLCLPILRQFLNSKRSYLYSLSLLMTIGLIFEL + SNILLQMPIQTYVIQTFRLWTWFFYYLLGGYIAQFTIEEIESRFKNWMKIVSILLLLI + SPIILFFIAKTIYHNLFAEYFYDTLFVKVSTLGIFLTILMLTLNENRRESIVSLSNQT + MGVFIIHTYIMKVWEKVLGFNFVGAYLLFALFTLSVSFIIVGMLMKIPYFNRIVKL" + gene 16952..18061 + /gene="glf" + /locus_tag="SPC42_0019" + CDS 16952..18061 + /gene="glf" + /locus_tag="SPC42_0019" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI34528.1" + /db_xref="GOA:Q4JYU6" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR006076" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JYU6" + 
/translation="MYDYLIVGAGLSGAIFAYEATKRGKKVKVIDKRNHIGGNIYCEN + VEGVNVHKYGAHIFHTSNKKVWDYVNQFAEFNNYVNSPVANYKGSLYNLPFNMNTFYA + MWGTKTPQEVKDKITEQTADMKDVEPKNLEEQAIKLIGPDVYEKLIKGYTEKQWGRSA + TELPPFIIKRLPVRLTFDNNYFNDRYQGIPIGGYNVIIENMLKDVEVELGVDFFAHRE + ELEASAEKVVFTGMIDQYFDYKHGELEYRSLRFDHEILDEENYQGNAVVNYTEREIPY + TRIIEHKHFEYGTQAKTVITREYPADWKRGDEPYYPINDEKNNAMFAKYQEEASKNDK + VIFCGRLADYKYYDMHVVIERALEVVEKEFGYDKK" + misc_feature 17387..17989 + /gene="glf" + /locus_tag="SPC42_0019" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 1.2e-137" + gene 18042..19076 + /gene="wcjE" + /locus_tag="SPC42_0020" + CDS 18042..19076 + /gene="wcjE" + /locus_tag="SPC42_0020" + /note="member of homology group 18" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI34529.1" + /db_xref="GOA:Q4JYU5" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q4JYU5" + /translation="MDMTKSRINWIDFGKGFSIFLVLAGHVLLGLYQSEKFPTANNIL + SLLIAQVYIFHIPVFFALSGYFFKPVSDLKEFWQYAKKKTIVFGLPYIFYSIIHFGLQ + KVAGASVRVPTTISDLLNIYKHPLGVSWYLYILWSILIIYGLLSILVKNRRMLFLISV + FAYCLTLFVQTDIYIIQRTLVWGICFFLGSVLSEIHFDKINLKKFLFFFVLFDFIYMF + AWFLFYEVGSKKDYVSYINPGLWGIAFIVCVLVAFAIFPKMEKNFPKTFLYFTKYGKD + SLGIYILHAPICSMIRILMLKVGINSVFLHVVVGIVLGWYLSILATYILKKIPFLNIV + LLPQKYIKLK" + gene 19251..>19403 + /gene="aliA" + /locus_tag="SPC42_0021" + CDS 19251..>19403 + /gene="aliA" + /locus_tag="SPC42_0021" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34530.1" + /db_xref="UniProtKB/TrEMBL:Q4K0S2" + /translation="MMKSSKLFALAGVTLLAATTLAACSGSGSSTKGEKTFSYIYETD + PDNLNYL" + misc_feature 19251..19337 + /gene="aliA" + /locus_tag="SPC42_0021" + /note="Signal peptide predicted for SPC1900 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.277 between residues 29 and 30" +ORIGIN + 1 ccatgggatg ctttctgtgt ggaattacta taaatatttt ttgcagaaaa atttaaaatt + 61 gaaatcgtat aaaaacaagg gaggactgta taaaagacag aaatcctttg ttttttataa + 121 ccaaggttta taaactttca 
ttctcgaaat tcaattaact ttacaaattc ccactattaa + 181 ggagaaagaa gatgaacata aagaagcgtg tccttagtgc aggcctgact tttgcatctg + 241 ctttgctttt agctgcttgc ggccaatcag gttcagatac aaaaacttac tcagcaacct + 301 ttagtggaaa tccaactaca tttaactatc tattagacta ttacgctgat aatatagtca + 361 attgaaacaa gaacaagaca aaagcagctc aaaaaggtat tgcaacttgg taataccttt + 421 ttgaggttct ttttgatata agcccatgtt ttctcaatag gattgtactc aggtgagtag + 481 ggaggaagag gtaaaagttt atgcccaaac tcctcgcata aaagttctaa cttacccatt + 541 ctatggaatc ttgcattatc cataataata accgatggtg tggttaatgt tggtaagaga + 601 aacttctgaa accaagcttc aaaaaagtcg ctcgtcacca tctcttcgta agtcattgga + 661 gcgattaact caccatttgt tagacctgca accaaagaaa tcctctgata tcttcttcca + 721 gatactttac ctcttattaa ctgacctttt aatgagcgac catattctcg ataaaaataa + 781 gtatcgaatc ctgtttcatc aatctaaaca ggtgctaggt gctttaaact attaaaattt + 841 ttaagaaata aggctacttt ttctgggtct tgttcatagt aggtgtggtt ctttttttcg + 901 agtgtagccc atagctttga gcgcatagtg gatggtagtt ggatgacagg caaattcaga + 961 agctatttca gtcaaataag cgtctggatt gtcagtaaga tagtttttaa gtctatctct + 1021 atcaaccttt cttggttttg ttccttttac ttggtggttt agctctcctg ttttctcttt + 1081 tagctttaac cagccataaa tggtattacg tgagatttgg aaaacgtgtg acgcttctgt + 1141 tatactacct gttcgctcac aataagagag aactttttta cgaaaatcta ttgaatatgc + 1201 cataaaaaga ttataccaca ttgtgtacta tattagattg aaactagaat agtacacatc + 1261 tgcttctaaa acattgttag aaatcgattt gactgtcctt atttcatttt attatatttt + 1321 tggttcgcgg gaagtctact aagatactta aagatgcaga tagtgaaaat aaaggtgtag + 1381 acattaccgt aaaaaagtga tataatcgta tgatgttcaa tgtataggtg ttaatcatga + 1441 gtagacgttt taaaaaatca cgttcacaga aagtgaagcg aagtgttaat atagttttgc + 1501 tgactattta tttattgtta gtttgttttt tattgttctt aatctttaag tacaatatcc + 1561 ttgcttttag atatcttaat ctagtggtaa ctgcgttagt cctactagtt gccttggtag + 1621 ggctactctt gattatctat aaaaaagctg aaaaatttac tatttttctg ttgctgttct + 1681 ctatccttgt cagctctgtg tcgctctttg cagtacagca gtttgttgga ctgaccaatc + 1741 gtttaaatgc gacttctaat tactcagaat attcaatcag tgtcgctgtt 
ttagcagata + 1801 gtgatatcga aaatgttacg caactgacga gtgtgacagc accgactggg actgataatg + 1861 aaaatattca aaaactacta gctgatatca agtcaagtca gaataccgat ttgacggtca + 1921 accagagttc gtcttacttg gcagcttaca agagtttgat tgcaggggag actaaggcca + 1981 ttgtcctaaa tagtgtcttt gaaaatatca tcgagtcaga gtatccagac tacgcatcga + 2041 agataaaaaa gatttatacc aagggattca ctaaaaaagt agaagctcct aagacgtcta + 2101 agaatcagtc tttcaatatc tatgttagtg gaattgacac ctatggccct attagttcgg + 2161 tgtcgcgatc agatgtcaat atcctgatga ctgtcaatcg agataccaag aaaatcctct + 2221 tgaccacaac gccacgtgat gcctatgtac caatcgcaga tggtggaaat aatcaaaaag + 2281 ataaattaac ccatgcgggc atttatggag ttgattcgtc cattcacacc ttagaaaatc + 2341 tctatggagt ggatatcaat tactatgtgc gattgaactt cacttcgttt ttgaaattga + 2401 ttgatttgtt gggtggaatt gatgtttata atgatcaaga atttactgcc catacgaatg + 2461 gaaagtatta ccctgcaggc aatgttcatc ttgattcaga acaggctctc ggttttgttc + 2521 gtgagcgcta ctcactagca gatggcgatc gtgaccgcgg gcgcaatcaa caaaaggtga + 2581 ttgtggctat ccttcaaaaa ttaacgtcaa ccgaagcact gaaaaattat agcacgatca + 2641 ttaatagctt gcaagattct atccaaacaa atatgccact tgagactatg ataaatttgg + 2701 tcaatgctca gttagaaagt ggagggaatt ataaagtaaa ttctcaagat ttaaaaggta + 2761 caggtcggac ggatcttcct tcttatgcaa tgccagacag taacctctat gtgatggaaa + 2821 tagatgatag tagtttagct gtagttaaag cagctataca ggatgtgatg gagggtagat + 2881 gaaatgatag acatccattc gcatatcgtt tttgatgtag atgacggtcc caagtcaaga + 2941 gaggaaagca aggctctctt gacagaatcc tacaggcagg gggtgagaac cattgtctct + 3001 acctctcacc gtcgcaaggg catgtttgaa actccggaag agaagatagc agaaaacttt + 3061 cttcaggttc gggaaatagc taaggaagtg gcgagtgact tggtcattgc ttacggggct + 3121 gaaatttact acacaccaga tgttctggat aagctggaaa aaaagcggat tccgaccctc + 3181 aatgatagtc gttatgcctt gatagagttc agtatgaaca ctccttatcg cgatattcat + 3241 agcgccttga gcaagatctt gatgttggga attactccag tcattgccca cattgagcgc + 3301 tatgatgctc ttgaaaataa tgaaaaacgc gttcgagagc tgatcgatat gggctgttac + 3361 acgcaagtaa atagttcaca tgtcctcaaa cccaaacttt ttggagaacc tgataaattc + 3421 atgaaaaaaa 
gagcgcagta tttcttggag cgtgatttgg ttcatgtgat tgcaagtgat + 3481 atgcacaatc tagacggtag acctcctcat atggcagaag catatgacct tgttacccaa + 3541 aaatacggag aagcgaaggc tcaggaactt tttatagaca atcctcgaaa aattgtaatg + 3601 gatcaactaa tttaggagaa atgatgaaag aacaaaacac gatagaaatc gatgtatttc + 3661 aattatttaa aaccttgtgg aaacgcaagc taatgatttt aatagtggca cttgtgacag + 3721 gtgcgggggc ttttgcatat agcactttta ttgttaagcc agaatatacg agtaccacgc + 3781 gaatttacgt agtgaatcgc aatcaaggag acaagccggg gctgacaaat caggatttgc + 3841 aggcaggatc ttatctggta aaagactacc gtgagattat cctttcgcag gatgcattgg + 3901 aaaaagtagc gacaaatttg aagttggata tgccagcaaa aacgttagcc agcaaagttc + 3961 aagtgactgt accagctgac actcgtatcg tctcaatctc tgtcaaggat aaacagccag + 4021 aggaagccag tcgtatcgct aattctctac gagaagttgc tgcagaaaag atcgtcgctg + 4081 taacgcgagt atctgatgta acgacacttg aagaagcgcg accagctacg actccctctt + 4141 ctccaaatgt tcgacgcaat tccttgtttg gttttcttgg aggagcagtc gtaacagtaa + 4201 ttgctgttct tttgattgag ttgctggaca cccgtgtgaa acgtcctgaa gatgttgaag + 4261 atgtactgaa aattccactt ttagggctcg ttccagattt tgacaaaata aaataggagg + 4321 aagttatgcc aacattagaa atctcacagg caaaattgga ttctgtaaaa aaggcagagg + 4381 aatattataa cgctttgtgc acgaacctac agttaagtgg agatggtttg aaagtatttt + 4441 ctatcacttc tgtgaaaata ggagaaggaa aatcaacgac ttccgccaat atcgcttggg + 4501 cttttgcgcg tgcaggttac aaaacgctgc tgattgatgg agatattcgc aattctgtta + 4561 tgttaggtgt ctttaaagca aggaataaga ttacaggcct gacagaattt ttatcaggaa + 4621 ctacagactt atcacaaggg ctttgtgata ccaatatcga aaatctcttt gtaattcagg + 4681 ctggctctgt gtcaccgaat ccgacagctc ttcttcaaag taagaatttc actacaatgc + 4741 ttgaaacctt gcgtaaatat tttgactaca tcattgtaga tactgctcct gttggtgtcg + 4801 tgattgatgc ggctattatt acgcgaaact gcgatgcttc tattttagtg acggaggcag + 4861 gtgaaataaa tcgtcgggat attcaaaaag caaaagaaca gttggaacac acaggaaagc + 4921 cgtttttggg aattgtgttg aataaattcg atacttcagt agacaaatac ggttcttatg + 4981 gaaattatgg agattacggg aaaaataaaa aataggtcgg gggatagaga tgaatggaaa + 5041 aatattaagg tcttcattgg ccataatcca 
gagttttctt gttattttat tgacttatct + 5101 acttagtgct gtgagagaaa cggagattgt ttcaacaaca gctattgcac tttatatcct + 5161 ccattatttt gtcttttata tcagtgatta tggacaggat ttctttaaaa ggagatattt + 5221 gattgaactt gtccagacat tgaaatatat cctattcttt gcactagcga ttagtatttc + 5281 taattttttc ttagaggatc gatttagtat ttccagacga ggcatgattt acttcctcac + 5341 attacatgct ctcttagtct atgtgctaaa cctatttatc aagtggtatt ggaagcgggc + 5401 ttatctcaac tttaaaggaa gtaagaagat tctcctactt acagcaactt ctcgtgtcga + 5461 aaaggtactg gatagattaa tagaatcaaa tgaggttgtt gggaagttgg tagccgtcag + 5521 tgtcttagat aaaccagatt ttcagcatga ttgtttaaag gtagtagcag agggggagat + 5581 agtaaacttt gcgactcatg aggtggtcga tgaagtcttt atcaatcttc caagtgaaaa + 5641 atacaatatt ggagagcttg tttctcagtt tgaaacgatg ggaattgatg taacagttaa + 5701 tctaaatgct tttgatcgta gtttggcacg taacaagcaa attcgtgaga tggcaggatt + 5761 aaacgttgtg actttttcta caacatttta taagactagt catataatgg ctaagcggat + 5821 tattgatatc atgggtgcat tggtagggct gatactatgt ggtttagtca gtattgtact + 5881 ggttcctttg attcgaaagg atgggggttc tgctattttt gctcagacgc gtataggaaa + 5941 aaatggtcgt cagttcactt tttataagtt tcgctctatg tgtgtagatg ccgaggcgaa + 6001 aaaaagagaa ctcatggaac aaaataccat gcagggtgga atgtttaagg tggacgatga + 6061 tcctcgtatc acgaaaattg gtcgttttat acggaagact agcttggacg agctaccaca + 6121 gttttataat gttctaaagg gagatatgag tttggttggc acacggccac caacagtgga + 6181 cgagtatgaa cactataccc cagaacaaaa acgtcggcta agttttaaac ctggtataac + 6241 aggcttatgg caggtcagtg gacgaagtga gattaagaat tttgatgaag ttgtcaaatt + 6301 agatgtagcc tatatagacg attggacaat ttggaaagat attgagattt tattgaagac + 6361 agttaaagtt gtattgatga aggatggagc gaagtagatt gatagatgta aaaatcattg + 6421 tggcaacaca taaagaggtt aaaatgcctc aagacaatag tctttacctt ccaatacatg + 6481 ttggaagaga cggtaaatca gatattggtt ttatcggtga taatactggc gataatatat + 6541 cctctctaaa tccatattat tgtgagttga cgggacttta ttgggcatgg aagaatcttg + 6601 attataatta cttaggtcta gttcattacc gtcgttattt tacaaataaa tctcaagggt + 6661 ataatgaaaa tgtcaatatg gatgacgtca ttttgtctcg atctaatgtt 
gaaatattat + 6721 tagagaaatc tgacgtaata gttccaaaga agcgaaagta ttatattgaa actctttatt + 6781 cacattatgc ccataccctt aacggagaac atctggatct tgctaggaaa attattgagc + 6841 aaaatagttc agagtatctt tcatcctttg ataaagtgat gaaacaaaga agcggttata + 6901 tgttcaatat gtttatcatg aaaaaaggac tattagatga ttatttaccg tggctttttt + 6961 ctattctgga tactatgtac gaacagatgg acttgaccga ctatacttca tttgagtcac + 7021 gtttattcgg gcgagttagt gagttgttgt ttaatgtttg gttatgtaaa aaaggaataa + 7081 cgcctaaaga ggtaccattt atgtacatgg agagagtgga tttgtttgaa aaaggaaaat + 7141 cttttttaat ggctaaattt tttggaaaga agtatggaca gagtttctag gagggaatat + 7201 gaaaatcact atcaaaaggt attcactgcc agaaatttta ggattagcag cattagctat + 7261 attcctacta ttttcgttat taagtataac tctttatgcc caatatatat ctattaaagt + 7321 atattttatt gcactttttg gcattatttt attaatattt ctgaaggaac ttatatctga + 7381 gagttataat cttaaatctg tgattggatt attcgtgatt tttactctct gcttcatcat + 7441 aggtaccgtc acgaattacg catacttttt tattttaggt ctgtttttga tttatagtct + 7501 tagaaatctc cctttttcag acgtagccaa agtctccttt atcattagta ttagtgtatt + 7561 gctcctagta gtattgagta gtaagcttgg tattattcct gattatattg agatttcgcc + 7621 taccagagtt agacactatc ttggtttccg atattcatta cttccatcaa cgcttatgat + 7681 gaatatcata gctatatcat tttttttaaa gcaagaaaac gcttcatatc cgcgtcttct + 7741 tgtattgttt ttactttcag gatggttata cgtagaaaca gattcacgtt tgacttttat + 7801 taattcgtgt ttgtttctac tggttaattt aataatgaaa ttgtcacctt ccatcattga + 7861 aaaggtaggg agactgttaa aacttttttc gttcacctac tttattaatg cctgtttgag + 7921 ttactggatt gcgaagactt acttaaacac ctcaaatgtt gttttgaatc aattctttta + 7981 ccaagcggat caatttcttg gaggacgtat ttattattct aatcgttcgt tatctttata + 8041 tggatataag ttgttaggtc aaaagattga ttggattgga aatggcttga gcatacaagg + 8101 ggagcgtagc acagaaacat atttgtatgt ggataattta tatatccaga ttcttcaaca + 8161 ttttggtttg atagtttcgg taattatttt aagtctatta actataactt tagtaaagct + 8221 tttgaaaaag gggcagatgg tattaggaat tattttagtt attttgagtt ttcatgcttt + 8281 aattgatgat ttgatactaa atctatatta taatatcttt tgggttttga taggaatgtt + 8341 gatatataaa 
aagtatcaat tttatgataa aaagcagttg acaatagaat aagaagcaag + 8401 cattggaaat agacattcag atatgtacaa gaaaactcga tttaagtttt ttggtaaaat + 8461 ttttaaaatt aagttgtaaa atggatatca aaatctcacc ttttttgtag gtgtgattaa + 8521 acagagggat attagatagg aaaataatga ataagattaa tttaactgat aatttaccgt + 8581 taatttcagt tgttttacca gtatacaacg tagagaatta tttagaaaag tgtttgaatt + 8641 ctgttgtgag acagacgtat aaaaacatag aaattataat agtaaatgat ggcagcttag + 8701 attcttcaat agatatttgt aataagtatg caaataaaga tagtcgaatt aaagtattta + 8761 caaaacctaa tggaggtttg tctgatgcta gaaatttcgg tgtcaaaaaa tctatgggtg + 8821 agtttataac attcgttgat tcagatgact atgttacaga tgattatgta gaatatttgt + 8881 atagcttagt caaaaaatat aattgtaaaa tgtcaatgtg ttcaatattt gtccattata + 8941 tttctaatga taaaatgatc aataatggga caggaagaga attgatgatg acagcagagc + 9001 ggtgtattga aaaaatgtgc tatcatgatg aggtggatac atgtgcttat gcaaaattat + 9061 atcatagaag tctatttagt gaaatatgct tccctaaagg aaggatattc gaagatattg + 9121 gaacaattta tcgctttttt ggtactgctg ggcagattgc ctgtggtttt aacgcaaaat + 9181 attattatga gattcgggaa aattcgattg ttacatcatc atttagtgaa aaaaaatttg + 9241 atttgttatt tatgacagat caaatgcgaa attttgttga tcaacgttat ccatctttga + 9301 aagctgcaac aaaacgtcga gctgtctatg caagatttag tacccttaac caattattag + 9361 atgtacaagg atataatgaa gaaaaaaaag aaataattcg ttttatccaa gacaacaagg + 9421 aagcgttact tgaaaatcct aagactccta agcgggatag attagctgtt agagctctct + 9481 cccttggatt ttgcatttat aaattgttat ggaagcaata tctaaaaatt caaagaggtt + 9541 agtatgaata aagaattttt gaagtatatt tatattcgat tattaagaaa tttaaggaga + 9601 attttcttta ttatcccgat aataaggaat agagttgttt ttgaatcttt ctcaggagat + 9661 gcttatagtt gcaatcctaa atatatttct gaagaattaa gaaaacagta tggtgattct + 9721 gttgaaatta tctgggcttt taatgatcca aacaaattca aaaaagaatt accaaaggag + 9781 attgtgactt gtcgttaccg tagtttcaat catctgatct atagaatcac ttcaaaagtt + 9841 tatgtttgta atttcctgca agcaattgaa attccaaagc gtaaaggaca actagagatt + 9901 caaacttggc atggaggagg ttgctataaa aaagttgggg tggctgaaaa aggacgccag + 9961 gctgcttatg ttaaacgaca acggatgcac 
gttgaagaaa cagatctctt tattacaagt + 10021 agtaaatatt ttgaaaatga ggtagtaaaa aaacaatttg ggtataaggg agaaatttta + 10081 tctattggta tgcctcgaaa tgatatttta ataaatttac caatttcaag tcaagttgag + 10141 aaattaaagg agaaattggg attaccaaac aataaattga tagcacttta tgctccgacc + 10201 tggagatcag gtactaaaca gtatgaaaca cttgatataa aaaaacttac tcaagccgtt + 10261 gataaaaaat ttggtaaaaa atgtatcgtt cttttcagat cgcatctata tggaaatcaa + 10321 tcttatgatg atgttgtgga tgtctctcag tatagtgata tgcaagaatt attgttgctt + 10381 tcagatatac tgattactga ctattcttcg tctatgtggg atttctctct ctcttttaaa + 10441 ccgtgttttt tatatacccc cgatttgaag gattatctag atgaaagagg ttttgatgaa + 10501 gatatacatt catggggatt ttcagtttct gaatcaaata aggaactagt tgaaaatatt + 10561 ttacagtttg ataatgaaga atatagacaa aaaatgaaga atcatcatca gtttttagaa + 10621 tcttatgaac aaggagatgc agcgaaaaga gtcgtggcga agattgctga atattgtaat + 10681 ttatatagag gatagataat gaaaaaaatt gcttatttga tcaaaagata tggtgtgaaa + 10741 aatgtggttt tacgtgctat taatgatgtt ctaccagtca atctcatctt tcccagtcaa + 10801 caactcagac gtttgaattg gcaagaaaaa gtcaaaaaga agttaaaaaa atatgtagtt + 10861 atttcggatt caatcaagag tgaggaggaa tgcgatatta tctggtggct atggtttcaa + 10921 ggacttgata atgcaccagc tattgtgaaa aaatgtagag agtcggtaga taaatatgct + 10981 aaacgcagtg gcaaaagggt tattgagtta acatctcaaa atttatttga atatattgag + 11041 gtacctaacg aactctatgt gaaatataag tcaggtagtt tgccactagc tttattttca + 11101 gatttttgtc gaattagcct tctttctaac tatggaggat tatggattga ttcaactgtt + 11161 ctaattacgg gggaaattga agatgagata ttgaaccaag atatttttat gtttcaagct + 11221 tctcctttag actattcagt tactaaaatc agtaattgga tgttatattc aaaatatcca + 11281 ggacacccgt tcatatcatc gatacgtgat actttgattt cattttataa taagaataat + 11341 acgatcccag attatttttt atttcattta cttgtttcct gtttaataga tgataatagg + 11401 ataaatcaaa gtttttatga tatggattat tataccaata cctatcctca cttattaggg + 11461 agagttttga gcgaaccata tgatactttg aaatttgaaa atattttaag gaaaacgtct + 11521 attcataaat tatcatataa aaatttagat aatgttgctg aagatagctt ttataatgct + 11581 attttaggtt tagattttag ttagtaataa 
agaggagaga aatgaattta gcagttattt + 11641 ttgctggagg ctccggtacg cgaatgaatg caaaggatag acctaagcag tttcttttgg + 11701 tacatggtaa gccaattatt gttcacacta ttgagctatt tgagaaccat ccagagattg + 11761 atggaattat cgttgtttgt attgaagatt ggattccgta tatggaggag atgaaatatt + 11821 gctatagatt agataagatt gctaagattg ttccaggggg ggcaactggt caattatcta + 11881 tttataatgg tttagtcgcg gctgaacaac tttatggaat agaggataat gttgtgttaa + 11941 tccatgatgg agtccgtcct ttaattacag cagacactat ttcagataac atccaatccg + 12001 taaaagaaaa gggaaatgct attacttgta cagtggccaa agaaacagtt atcttagtag + 12061 atgatgaaaa taaggtagac gaagtgccta gtcgtgaaca ttcgcgattt gccaaggctc + 12121 ctcagagttt ttggctaaaa gatattctag gtgcacatcg agcctctgta gataatggta + 12181 gaaataattt tattgattca tgcaccatga tgagatatta tggtcatgat ttacatgttg + 12241 ttgttggtcc gtatgagaat attaagatta caacgcctga tgatttttat acatttaggg + 12301 ctttgtacga tcttcgtgag aataagcaac taaaataatg aggaaaagat gaagtatttt + 12361 gttgaagaaa cgttacttga tgaacaggat aaaaaaaatg cgggtggaaa ggctagacaa + 12421 gacgtcactg atattttaga gtccataggt tatcagaagt taatagctga gtccgaaatg + 12481 aatgaacgtc aggaattaaa tgctgttcaa agattggttc atcattataa agttaagaaa + 12541 atgtggaaga aaactctttc agttgttggt aagggtgatg aagttattat tcaatttcct + 12601 ttactaaatc atagtttatt ctttaatcag gttattaagc aacttagtaa gaatggagtt + 12661 aaagtttatt ttttgattca tgatttagaa tcgttgcgat ggtcgcagtc aaaatcgata + 12721 tcattaaaaa gtaggattcg attaaacatt gaagaacata gtgttttaag gttatcagaa + 12781 ggcattattg ctcataataa aaaaatgaaa tcttatatta agacctactc tgttgaaagt + 12841 tctaaaatta ttcctcttga aacttttgat tatattattc catcttatca tgaaagaaaa + 12901 aatctggata actttcagtt aaatgctcca attgttattg ctggaaattt aaagcaacat + 12961 aaagctggat atgtctatca tttaccaagc aatgtggagt ttaatcttta tggaattgga + 13021 tatgaacaga cagatgacaa aagtgtgcac tactgtggtt cttttatgcc agaagaatta + 13081 ccattcgttt taaaaggaag ttttggattg gtatgggatg gtccgtcatc agagtcttgt + 13141 atagaaactt atggagagta tcttcgtgta aacaaccctc acaagacttc actatattta + 13201 gcttcaggca taccagtagt tgtatggtca 
gaggcagcaa tagctagttt cattaaggag + 13261 aataattgtg gtattcttgt atccaatctg agtgaactac ctgagttact ttctatgatt + 13321 accgttgatg aatatgaatt gatgaaaaag aatactgaga ttattggaga aaggcttcga + 13381 caaggttttt atactaaaca agcagttaaa ggtttctaga ctggaggaag tgtaatgatt + 13441 gaaagtttta atgataaagt gttgcaggaa gatttagaga taattgcaaa agaagagctc + 13501 ccatttcgaa aatttagaaa ttcaactgtt tttatcacgg gagtaacagg tttagtaggc + 13561 cttcaattat ttaaggcttt ggcttgtatc aatagagtcc atcagttgaa tatgaaaatt + 13621 attggtctag tcagaaattt ggataaagca gaaaaaattt ttggagattt attgaaacgg + 13681 aaggatatac aaatagtttt aggagatgtt tcggaagatt tccactcgta tatccctgat + 13741 ggtttagtta ttgactatat cattcacgga gcaagcgtga ctacctctaa actcatgatt + 13801 gaatttccag tagatacaat tcgagtagct tttaatggaa cgtatcaaat gttagaattg + 13861 gcaaaagaaa aaaaagtgaa aagttttgta tatctttctt caatggaggt atatggtagc + 13921 tttcagtcag atagaacaac tgttgtaaac gagaatatgt tagggtatct tgatttgaca + 13981 tctgttcgaa caaattaccc agaatgcaaa agaatttgtg aaaatatgtg cattgcattt + 14041 ctaagtcagt atcaagtccc ggctaagatt gctcgtctat cccagacctt tggtgcaggc + 14101 actctaccgg gtgaaaatag agtatttgct caatttgctc gtagtgttat gcaagggaaa + 14161 gatattgttt tacatacgtt agggcaatca gaaggaaatt actgctacac agctgatact + 14221 gttgttgcat tattaacaat tctattgaga ggagaaaatg gggaggctta taatattgct + 14281 aatgaagaga gtcatacaac aatagcagat atggcaaaaa tggtaacttc gcaattctct + 14341 caaacgagtc aagtggtttt tgatattccg aagaaaaata tatttggtta tgctgtagat + 14401 actaaaatga agttatcaac acacaaaatt caacaattgg gttggaagcc gagggtctct + 14461 cttgtagatg cttatgatcg aatgatgaga agtatgaatg aaactggggt atagataact + 14521 atatgaaggt attaaaaaac tacttatata atctctctta tcaactatta gttattattc + 14581 ttcctatcat tacgactcct tatgtgacgc gcatattttc ttcagatgat ttagggacat + 14641 acggttactt caattccatt gttacctact tcattttact tgctactctg ggtattgcta + 14701 actatggaac gaaggagata tctgggaata ggaagagtat tcagaaaaat ttctggggaa + 14761 tatatacttt acagtttgga gcgactactt tttccatttt tctctatata ctagcctgtc + 14821 ttttcatccc agggatgaaa aacctagttg 
catatatctt gggattgggt ttagtctcta + 14881 aaggactaga tatttcatgg ttgtttcaag ggttagaaga ttttcgtaaa attacggtca + 14941 gaaatatcac agtgaagctt gttggtgtaa gtgccatttt cttgtttgta aaatcagcga + 15001 gtgatctata cttgtatgtt tttcttctaa cagcatttga attgttgggt cagttaagta + 15061 tgtggtttcc agcccgtgaa tatattggaa aaccacattt tgatatagaa tatgctaggc + 15121 atcatctgaa gccagttatc ttgctattct taccacaaat tgctatctcg ctttatgtga + 15181 ctttagatcg tacaatgtta ggggcgctag cttctacaaa agatgtcggc atttatgatc + 15241 aggctttgaa gctggttaat attttactga ccttggtaac ttccttggga agtgttatgc + 15301 tgccacgcgt tgcgcatttg ttagcgacag gtgatcataa ggtagtcaat aagatgcatg + 15361 aggtatcctt cttaatttat aatttggtta tttttccgat tatggcaggg atgttgattg + 15421 tgaatgatga ttttgttcaa tttttccttg ggcaagactt tcaagatgca cgctatgcaa + 15481 tttccattat gatcttccgt atgttcttta tcggttggac taatataatg ggaattcaga + 15541 tactgatacc tcataatcaa aataaagaat tcatgatttc aacaacaact cccgcaatta + 15601 tcagtgtagg tttgaactta ctattccttc ctaaactggg atatatcggg gcagccattg + 15661 tctctgtttt aacagaggca cttgtatggg caatccaatt attctatact cgcagatatt + 15721 taaaagaagt tcctataatc ggatcaatgt caaaaattat actagcatct gccattatgt + 15781 atggcctttt actaagttca aaaacagtta tacatttttc accgacctta aatgttctag + 15841 catttgtagc gcttggtgga atcatttatc tttttgcaat tctatctctg aaagtggtag + 15901 atgtgaaaga attaaaacaa attattagga aaaactagaa tgagaaaaaa tcgaaatatc + 15961 aacctagatt tactaaaagt gcttgcatgt gttggagttg ttttacttca tacaacaatg + 16021 ggcggattta aagagacagg ttcatggaat cttttggcat atttatatta tttaggtact + 16081 tactctattc ccttgttttt tatgatcaat ggttatttgt tgttaggcaa gagggagata + 16141 acttatcttt acatactcca gaaagtaaaa tggattttaa taacagtgtc atcatggtca + 16201 tttatcgtat ggctttttaa gcgtgatttt acaactaatc ctattaaaaa aattgtaggt + 16261 tctttgatac aaagaggtta tttctttcag ttttggtttt tcggtgcact catacttatc + 16321 tatttatgtt tgccaatttt gagacaattt ctaaattcaa aaagaagcta tttatacagt + 16381 ttatctttat tgatgactat tggtttgatt tttgagttat caaatatcct acttcaaatg + 16441 ccaatacaaa catatgtaat acaaactttt 
agattatgga cgtggttttt ttactatctt + 16501 ttaggtggtt atatagcgca attcactata gaagaaattg aatcaaggtt taagaattgg + 16561 atgaaaatag ttagcatact tttgttattg atttcaccaa taatattatt tttcatagcg + 16621 aagactatat accataatct atttgctgaa tacttttatg atactttatt tgtaaaagtc + 16681 agtactttag gaatttttct aactatcctc atgcttactt tgaatgaaaa ccgaagagaa + 16741 tcgattgttt ccctttctaa tcaaacaatg ggggttttca taatacatac ttatattatg + 16801 aaagtgtggg aaaaagtgct tggttttaat tttgtaggag catatttact ttttgctcta + 16861 tttactttaa gtgttagttt tattattgtt gggatgttaa tgaagattcc ttacttcaat + 16921 cgaatcgtca aattataaaa aggagaacaa gatgtacgat tatcttattg tcggtgctgg + 16981 tttgtcagga gcaatttttg cttatgaggc gaccaagcgt ggaaaaaaag taaaagtgat + 17041 tgataaacgt aaccacattg gtgggaatat ctactgtgag aatgtagaag gagttaatgt + 17101 tcataaatat ggtgcccata tctttcatac ttctaataag aaagtttggg attatgttaa + 17161 tcaatttgct gaatttaaca actacgtcaa ctcgcctgta gctaattaca agggtagcct + 17221 ctataatcta cctttcaata tgaatacctt ctatgctatg tgggggacaa aaactcctca + 17281 agaagtcaaa gataagatta ctgagcagac agctgatatg aaggatgttg agccgaaaaa + 17341 tctggaagaa caggctatca agttgattgg tccagatgtc tatgaaaagt taatcaaggg + 17401 ttatactgaa aagcagtggg gacgctcagc aacggaactt cctccattta tcattaaacg + 17461 tcttccagtt cgtttaacat ttgataataa ctattttaac gaccgttacc aaggaattcc + 17521 tattggtggt tacaatgtca tcatcgaaaa tatgcttaaa gacgttgaag ttgagcttgg + 17581 tgttgatttc tttgctcatc gtgaagagtt agaagcatca gctgaaaaag ttgtctttac + 17641 agggatgatc gaccagtatt ttgactacaa gcacggagag ttagaatacc gtagccttcg + 17701 ctttgatcat gaaattttgg acgaggaaaa ttatcaagga aatgctgtag tgaactatac + 17761 ggagcgtgag attccttata ctcgtattat cgaacacaag cattttgaat atggaacaca + 17821 ggcaaagaca gttatcacgc gtgaatatcc agctgactgg aagcgtgggg acgagcctta + 17881 ctatccgatc aacgatgaga aaaataatgc tatgtttgct aagtaccaag aggaagcttc + 17941 aaagaatgat aaggttattt tctgtggacg tttagcagat tataaatatt acgatatgca + 18001 tgtggtgatt gaacgggcgc ttgaggttgt ggagaaagag tttggatatg acaaaaagta + 18061 gaatcaattg gatagatttt ggaaaaggct 
tttccatatt tttagtctta gcaggacatg + 18121 tgttgcttgg actgtatcaa tcggaaaaat ttcccacagc aaataacata ctatcgttgt + 18181 tgatagcaca agtctacata tttcatatac cagtattttt tgccttatca ggatactttt + 18241 tcaaacctgt gtcggatttg aaggagttct ggcaatatgc taaaaagaag acaattgttt + 18301 ttggtctgcc atatattttc tattcgatca ttcactttgg tcttcaaaaa gttgcagggg + 18361 catctgttcg tgttcctaca accatatctg atttgctaaa tatctataaa catcctcttg + 18421 gagtttcatg gtatttatat atactctggt cgattttgat aatctatgga ttattgtcta + 18481 ttttagtcaa aaatcgtaga atgttatttt tgataagtgt tttcgcttat tgtttaaccc + 18541 tatttgttca aacagatatt tatattattc aaagaacgct agtttggggg atttgtttct + 18601 ttcttggcag tgtattgagt gaaattcact ttgataaaat taatttgaaa aaatttcttt + 18661 ttttctttgt gttatttgat tttatttata tgttcgcttg gttcttgttt tatgaagtag + 18721 ggtctaagaa ggattatgta agctatatta acccaggttt gtgggggatt gcttttattg + 18781 tctgtgtatt agttgctttt gcgatttttc ctaaaatgga gaaaaatttt cctaaaactt + 18841 tcctatattt cactaaatac gggaaagata gtttagggat ctatattctt catgcaccaa + 18901 tttgtagcat gattcggatt ctaatgttga aagtgggaat aaactcagtt tttcttcacg + 18961 ttgttgttgg gattgtgcta ggctggtatt tatccatact agcaacttat atattgaaaa + 19021 aaattccatt tttgaatatt gttttattac cacaaaagta tattaaatta aaataaatta + 19081 ttttagattt ataatgtggc tctttgtcaa ctaacatctg gagaggacaa tcactgtctt + 19141 ctcttttttt gtcttttcag aatataccaa attaacacaa aaattctgaa aattctgttg + 19201 acatctttct gaaaagagtt tataatggag agaaagtttt aaaggagaaa atgatgaaaa + 19261 gttcaaaact atttgccctt gcgggcgtga cattattggc ggcgactact ttagctgcat + 19321 gctctggatc aggttcaagc actaaaggtg agaagacatt ctcatacatt tatgagacag + 19381 accctgataa cctcaactat ttg +// + diff --git a/public/res/serotype_genbank/serotype_43.gb b/public/res/serotype_genbank/serotype_43.gb new file mode 100644 index 0000000..b20c227 --- /dev/null +++ b/public/res/serotype_genbank/serotype_43.gb @@ -0,0 +1,984 @@ +LOCUS CR931716 22097 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 2427/48 (serotype 43). 
+ACCESSION CR931716 +VERSION CR931716.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 22097) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 22097) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..22097 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="2427/48" + /db_xref="taxon:1313" + gene <1..163 + /gene="dexB" + /locus_tag="SPC43_0001" + CDS <1..163 + /gene="dexB" + /locus_tag="SPC43_0001" + /codon_start=2 + /transl_table=11 + /protein_id="CAI34531.1" + /db_xref="GOA:Q4K2R1" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K2R1" + /translation="DRRFLVVANLSNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVP + WDAFCVELL" + gene complement(307..825) + /gene="tnp" + /locus_tag="SPC43_0002" + /pseudo + CDS complement(307..825) + /gene="tnp" + /locus_tag="SPC43_0002" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + gene 322..378 + /gene="aliB" + /locus_tag="SPC43_0003" + /pseudo + CDS 322..378 + /gene="aliB" + /locus_tag="SPC43_0003" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene 1048..2493 + /gene="wzg" + /locus_tag="SPC43_0004" + CDS 1048..2493 + /gene="wzg" + /locus_tag="SPC43_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI34534.1" + /db_xref="GOA:Q4JYU2" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4JYU2" + /translation="MSRRFKKSRSQKVKRSVNIVLLAIYLLLVGFLLFLIFKYNILAF + RYLNLVVTALVLLVAFVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTNLM + VDQSSSYLAAYKSLIAGDTKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVSIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGIDVYNDQ + EFTAHTNGKYYPAGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIIDSLQNSIQTNMPLETMINLVNAQLESGGTYKVNSQDLKGTGRIDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1048..1164 + /gene="wzg" + /locus_tag="SPC43_0004" + 
/note="Signal peptide predicted for SPC1904 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 39 and 40" + misc_feature 1252..1599 + /gene="wzg" + /locus_tag="SPC43_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 1.1e-62" + misc_feature 1777..2220 + /gene="wzg" + /locus_tag="SPC43_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 2.6e-68" + gene 2495..3226 + /gene="wzh" + /locus_tag="SPC43_0005" + CDS 2495..3226 + /gene="wzh" + /locus_tag="SPC43_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34535.1" + /db_xref="GOA:Q4JYU1" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4JYU1" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTLDALEKLEKKEIPTLNDS + RYALIEFSMHTSYREIHTGLSNILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QINSYHVLKSKLFGERYKFMKKRARYFLERDLVHVVASDMHNLNKRPPYMKEAYELIS + KQYGERRARELFIENPRLILSDQII" + misc_feature 2498..3106 + /gene="wzh" + /locus_tag="SPC43_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 8.1e-37" + gene 3235..3927 + /gene="wzd" + /locus_tag="SPC43_0006" + CDS 3235..3927 + /gene="wzd" + /locus_tag="SPC43_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34536.1" + /db_xref="GOA:Q4JYU0" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4JYU0" + /translation="MKENKEITIDVFQLFKVLWKKKTSIILTAIVAAVLAFAVSSFVL + TPEYSSTTRIYVVNRNQSEKAGLTNQDLQAGTYLVKDYKEIILSQDVLEKVISNLKLE + KTVKELSKKIQVTVPVDTRIVSITVKNAQPEEASRIANALREVAAEKIISVTRVSDVT + TLEEARAALSPSSPNIRRNTLLAFLAGGAVMVVSVLLLELLDDRVKRPEDVEEVMQIA + LLGVVLDLNKLK" + misc_feature 3235..3381 + /gene="wzd" + 
/locus_tag="SPC43_0006" + /note="Signal peptide predicted for SPC1906 by SignalP 2.0 + HMM (Signal peptide probability 0.987) with cleavage site + probability 0.704 between residues 49 and 50" + misc_feature 3253..3669 + /gene="wzd" + /locus_tag="SPC43_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 6.4e-48" + gene 3938..4639 + /gene="wze" + /locus_tag="SPC43_0007" + CDS 3938..4639 + /gene="wze" + /locus_tag="SPC43_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34537.1" + /db_xref="GOA:Q4JYT9" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4JYT9" + /translation="MPTLAIEQKRLDFAKKAEENYNALRTNIQLSGDNLRVLSISSVK + PGEGKSTTSINIAWAFARAGYKALLVDADIRNSIMSGVFKSREKITGLTDFLAGTTDL + SHGLCDTNIENLFVIQAGPVSPNPTALLQSENFATMIDTMRKYFDYVIVDTAPIGMVI + DAAIITQKCDASILVTAARETKRRDILKAKEQLEQTGVPFLGVVLNKFNTEVEKYGAY + GGYGTYGFYGNYRKG" + gene 4648..5289 + /gene="wcjH" + /locus_tag="SPC43_0008" + CDS 4648..5289 + /gene="wcjH" + /locus_tag="SPC43_0008" + /note="member of homology group 61" + /codon_start=1 + /transl_table=11 + /product="putative initial sugar transferase" + /protein_id="CAI34538.1" + /db_xref="GOA:Q4JYT8" + /db_xref="InterPro:IPR003362" + /db_xref="UniProtKB/TrEMBL:Q4JYT8" + /translation="MIKIYFVFKNILDRFLAFFLFITLIIIPIIPITILAIWIEDPGD + VFYLQDRVGLNGKKFKVIKFRSMYKDADQRIKKSINSGKTERLNFKEHSQSMTTKVGK + VIRKLSIDELPQLLNIIKGDMSIVGPRPLQQFEITHHILTHKEMGIALKMSKRLSVKP + GLLCYWQVTPNKNDMPFADRMDLDLLYIDNVSFKTDFLLILKGFFTVLMGNNS" + misc_feature 4648..4755 + /gene="wcjH" + /locus_tag="SPC43_0008" + /note="Signal peptide predicted for SPC1908 by SignalP 2.0 + HMM (Signal peptide probability 0.806) with cleavage site + probability 0.797 between residues 36 and 37" + misc_feature 4672..5280 + /gene="wcjH" + /locus_tag="SPC43_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 1.3e-24" + gene 
5291..6082 + /gene="wciB" + /locus_tag="SPC43_0009" + CDS 5291..6082 + /gene="wciB" + /locus_tag="SPC43_0009" + /note="member of homology group 16" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34539.1" + /db_xref="GOA:Q4JYT7" + /db_xref="UniProtKB/TrEMBL:Q4JYT7" + /translation="MKNIKILVATHKKYKMPSDTNMYLPIHVGCEGKEKLGFQGDNSG + ENISFLNPYYCELTGLYWAWKNLECDYLGLVHYRRYFTKMTKGYNESINIDDVILNRF + EVEKLLENSEVIVPKKRKYYIETLYSHYAHTLDASHLDLARKMIEQKNSEYLASFDKV + MKQRSGYMFNMFIMKKELADDYFTWLFPILDSMYECMDLSDLTPFEARLFGRVSELLF + NVWLSKNNLTPTEAHFMYMEKVNLFKKGLSFLQAKFFKKKYKESF" + gene 6093..6914 + /gene="whaI" + /locus_tag="SPC43_0010" + CDS 6093..6914 + /gene="whaI" + /locus_tag="SPC43_0010" + /note="member of homology group 149" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="CAI34540.1" + /db_xref="GOA:Q4JYT6" + /db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4JYT6" + /translation="MSEIKIIQNKILEILKIFIETCEENNLTYYALGGTLLGAVRHGG + FIPWDDDIDIGMPREDYEKFKKIASKKFNDRYLFLSEDTPGYKKAFSVIRDTSTKIVM + NYSNIEQEESLWIDIFPIDGLPEKGVKRKLHEKQYLFRRMMVQLSQFNSIVNQNKTNR + PWQEKVIIKIAGILKIENLLSFEKAQQKYLATIKKYSITEGYAGNFTGAYKLRELVPS + CYFGEPVKLDFEGIKLNCPNKYKDYLKAIYGDNYMTLPPIEQRLPHQYEIVSLGE" + misc_feature 6156..6839 + /gene="whaI" + /locus_tag="SPC43_0010" + /note="HMMPfam hit to PF04991, LICD Protein Family, score + 2e-53" + gene 6921..7889 + /gene="wciE" + /locus_tag="SPC43_0011" + CDS 6921..7889 + /gene="wciE" + /locus_tag="SPC43_0011" + /note="member of homology group 44" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34541.1" + /db_xref="GOA:Q4JYT5" + /db_xref="InterPro:IPR008441" + /db_xref="UniProtKB/TrEMBL:Q4JYT5" + /translation="MNKLRKALNYYQDISKKRSYFPNNVLNWQLLGKFLGQIPYLIGE + NNARKICEKRHNVTRGFLEKEFYEFIINYEFNTCNQKNSKIIWTLWMQGYENAPELVK + STIDSIRKFAELNNFQFILLEENTIEKYIVFPKLIKEKMDLGVIDYTKISDILRVSLL + 
AKYGGTWVDATIYMKEEFDSSLLLQNYYTIKTGGIEDYSPNISNNRWKGFFLSGNSSL + FSFTRDFFFEYYSRYDIAVDYLLIDYIFDIAYKYDEKIKNQMLELEKSNHNLFWLESH + LGDEFDQKVWDNITETTKIFKTTYKLSEEIKSNKNNFYSKLIDRKL" + misc_feature 7029..7871 + /gene="wciE" + /locus_tag="SPC43_0011" + /note="HMMPfam hit to PF05704, Capsular polysaccharide + synthesis protein, score 1e-61" + gene 7899..9008 + /gene="wcrC" + /locus_tag="SPC43_0012" + CDS 7899..9008 + /gene="wcrC" + /locus_tag="SPC43_0012" + /note="member of homology group 24" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34542.1" + /db_xref="GOA:Q4JYT4" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4JYT4" + /translation="MKKIALVKWILDDSGGGERVAVSLANELTKKYEVYLIGITTKQS + DLFFEINSQVKYSNFFDHRVRLSKNILKISKMLKKYFVDNEIDIAFGIGITANIFLSL + AGIGISTQIVLCDHTNSITDNREFSQKVQRYVGAKCADKIITLTQEDRRSYIKKYGIS + EEKIDYVYNWKEDGLSNVPYNDESMKIVTVGRLDYQKGYDYLVQVAKKVLKEKTGWTW + EIYGSGNQDEVDKIKDLIIKNDLQDKLVIKGLEKNQAMIYGDKGIYVMTSRYEGLPLV + LLEAQQYNLPIVSFRCPTGPNEIVEDGVNGHLIDCYDTDKMSERLLELMEDSNLRTSF + ANHAKDNMDKFDKDKIIQQWIDLIEEMTGGNNFES" + misc_feature 8409..8921 + /gene="wcrC" + /locus_tag="SPC43_0012" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 3.6e-35" + gene 8998..10122 + /gene="wcyM" + /locus_tag="SPC43_0013" + CDS 8998..10122 + /gene="wcyM" + /locus_tag="SPC43_0013" + /note="member of homology group 181" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34543.1" + /db_xref="GOA:Q4JYT3" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4JYT3" + /translation="MKAKMLICITSLTGGGAEKSLVNFIQEFESMFEISILVYTEKNN + FYGSKLSHLRIDYFIRKNTPAIIEKIVNKLVKLLPPSFVNRWIIQRSIFKNEKFDYEF + AYMEGKPTKIIAGSSNEDSLKLAYIHCDFSKNWYSKRSFKNFKEELTCYQKFNSILAV + STPQKESFEEIFPKTNLEVIPNLLNIDEIKNLSKEEIELENIPYFCAIGRLELVKNFE + LLINAFHLFRKKYSQYHLIILGDGSLYDHLKNQINNLGESQYIKLLGFQSNPYKYIKN + SVGLIQSSVSESFSYVLAEAAALGIPSISTKTQGSEVMSEYFEVIQVEHTSNELAKGL + EKVIANNFVNVHFNFNEEAYYKFLEIFKKGSRSFEIRREI" 
+ misc_feature 9565..10059 + /gene="wcyM" + /locus_tag="SPC43_0013" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 1.3e-21" + gene 10100..11197 + /gene="wzy" + /locus_tag="SPC43_0014" + CDS 10100..11197 + /gene="wzy" + /locus_tag="SPC43_0014" + /note="member of homology group 182" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI34544.1" + /db_xref="UniProtKB/TrEMBL:Q4JYT2" + /translation="MKFEEKYNTLFNIIFSLLTILYLLKFVNIDRIDGISIVILICIL + FLFVMHSLKYGINRLKLTSLILFFLTFILNLFNGSTFLEITYFFLLYTIILKDNKKFF + KIHFITLTVFVLTIILLSHIGYISNFVIYRSNGGIRNSLGFVHPNSLGLMIYSLTVCS + LNLFEIKRFKFFFYLFLLLMNLWILQLADSRTSGYISILVIVFCYFFDKIGKLNRPLS + SFFINLAITMSVLFITLMSINFEASHIFQFLNKLFTNRIFSSYVFFREYGVTLFGKRI + DGIVSLVQGTVIIDSGYIGLLLQKGIIFFVLFLLFIFSRIKEYSFTLREGILLISVFI + SLMFESYGYTVFLFPILFFDYLGKRKESINE" + gene 11190..12068 + /gene="wcyN" + /locus_tag="SPC43_0015" + CDS 11190..12068 + /gene="wcyN" + /locus_tag="SPC43_0015" + /note="member of homology group 204" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34545.1" + /db_xref="GOA:Q4JYT1" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JYT1" + /translation="MNKITVFTPTFNRGYLMNKLFHSLNSQTNKHFEWLIVDDGSIDQ + TGELVETFKEQANFEIRYFYQQNGGKHRAINHGLDLARGELFFIVDSDDSLTDDAIEK + IFNNYSGIAFNHSFAGIAFNRGFSKKRIVGETFEGTYIDCDNLHRAKHNILGDKAEVY + RTDILKSIKFPVVDGENFMSEVVLWNEVARRGYKLRWFNDIIYFCDYLEDGLTKNSEK + ILFNNPVAHQMMTKELLQIDFTLKRKFGMIYNYHKIRNQSIKQTAINLEQPLILVYMV + VMMARIRKIVKGVKNE" + misc_feature 11202..11696 + /gene="wcyN" + /locus_tag="SPC43_0015" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 2.7e-25" + gene 12061..13125 + /gene="wcrH" + /locus_tag="SPC43_0016" + CDS 12061..13125 + /gene="wcrH" + /locus_tag="SPC43_0016" + /note="member of homology group 51" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34546.1" + /db_xref="GOA:Q4JYT0" + 
/db_xref="InterPro:IPR016503" + /db_xref="UniProtKB/TrEMBL:Q4JYT0" + /translation="MSNLYYIHEEFGSDSTAATKAPNDLQKIFQDCKFKPLVTLKKNS + KIVRIFDYAFKLLLCLIRIRSNDIVIFQFPFATHGKLKNFLMKLLQYKKAKMIFLIND + LESLRYSGNKKNLISKEQYIKNADVIICHNQRMKEFLIENKIDSEKIVVLGVFDYLLD + KFNKEKASFDKTVVIAGNLSPQKSGYLTELLKNENRIKFNLYGPNFTSSTNNNDCVSY + KGSFSPEKIPFILEGDFGLVWDGDSILTCSGITGEYLKYNNPHKVSLFIASKIPVIIW + KQSALSDFVKENNIGIVVNDLIEMQEIITNMTEEQYEIFRENIEQLSKKVRQGYFTNL + AIEKSLSIIKNNLNNYFEED" + gene 13127..14182 + /gene="wcyO" + /locus_tag="SPC43_0017" + CDS 13127..14182 + /gene="wcyO" + /locus_tag="SPC43_0017" + /note="member of homology group 80" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI34547.1" + /db_xref="GOA:Q4JYS9" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q4JYS9" + /translation="MKKEEYNFLKVLTILLVVLGHSTYYIIKMNFGGIDYYHYINNND + SIIVINFFKKITEIIYYFHMPLFMAISGAFFRIQVEKNKWQSPLELFQNKFRRLLIPF + IIFTILYTIPMKYISNYFIQTSIFNAIIGQLFLFGNTHLWYLYALFIIFMIAYFVLKK + DTGFGMLLFLFALHLMSYKINITLIKSAFQFLFYFAIGFKFEQKREVYNHLLNHTKKF + VYFLLIGFVVLIFMNLGIKRYSIIFSKLLEEILALYGSLVTYTIAYYLSRNTKWMNTR + IYQFILVNGLGIYIFSDTLNYLILKWGFIVAEDLMITPHGIILMVIFRFLVTLILSLL + ITLAFKKLFPKYKWLVN" + misc_feature 13145..14164 + /gene="wcyO" + /locus_tag="SPC43_0017" + /note="HMMPfam hit to PF01757, Acyltransferase family, + score 9e-05" + gene 14220..15185 + /gene="wcyP" + /locus_tag="SPC43_0018" + CDS 14220..15185 + /gene="wcyP" + /locus_tag="SPC43_0018" + /note="member of homology group 201" + /codon_start=1 + /transl_table=11 + /product="hypothetical protein" + /protein_id="CAI34548.1" + /db_xref="UniProtKB/TrEMBL:Q4JYS8" + /translation="MCIKKFLKKSHLTKGIYQQLQRKKNQYRLEKKFKYTGKFIDRKK + DSKDLCIILAGYKEFLYDDVLGRVKTFAPETMDICVLSSGIYSEKLNQICEENNWSYL + STEQNNISLIQNVAINLHPQAKYIYKIDEDIFITEHYFENLKEAYIFAQEGDYAPGVV + APLIPVNGYGHKRILQKLGLEDVYYEKFGEKSKYIAGQPRFIESNPEVAKFFWSDGEV + IPTIDTMNAQFSKEEKKVNPCAIRFSIGAILFERSLWELMDYFNVEFEGAGLGVDEVQ + ICNFCILNSKPLMVSENVVVGHLSFGPQNKAMFEYYKEHPEKFSI" + gene 
15198..16655 + /gene="wzx" + /locus_tag="SPC43_0019" + CDS 15198..16655 + /gene="wzx" + /locus_tag="SPC43_0019" + /note="member of homology group 47" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI34549.1" + /db_xref="GOA:Q4JYS7" + /db_xref="InterPro:IPR002528" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4JYS7" + /translation="MTSYKVKSIRYNFIMNFILTVSNFIFPLLTFPYVSRVLQVEANG + TVAYVSSIVSYFMMIASLGIPTYGIRAAAKVRDDKRKLSTIVQELLIINVILVFLVLI + AYFIMLFTLQSMYVYKELFYINAIGILLNVIGVGWFFQAIEQYDYITLRSIFFRLLSL + AMIFLLIHSPEDYIMYAGISVFASVGSNILNFKRLFEYISFKKTETYHFKPHIKPILI + LFAQTLVVSIYTNLDTVMLGSMKGTYDVGLYTAATKLKGILLSVVTSLGNVLLPRMSY + YANNQMKDRFLEIITKALNFTLFLSLPLSVFFISVSKESILLLAGEGYLGAVIGMQFL + MFAVIPNALTGLLGIQVLTPLEKEKYVLLSVTSGALIDLLLNFILIPAYGVSGAAFAT + MIAEFVVLCVQIYYTRDLLLKRLHQIVGIRYLCSVGVSTIGIVLVKKLQLSDFLLLCV + EGIIFFGSYGVILVLLKDDFILDFFKIFYKKLKKI" + misc_feature 15198..15323 + /gene="wzx" + /locus_tag="SPC43_0019" + /note="Signal peptide predicted for SPC1919 by SignalP 2.0 + HMM (Signal peptide probability 0.679) with cleavage site + probability 0.496 between residues 42 and 43" + misc_feature 15222..16031 + /gene="wzx" + /locus_tag="SPC43_0019" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 2.5e-57" + gene 16694..17797 + /gene="glf" + /locus_tag="SPC43_0020" + CDS 16694..17797 + /gene="glf" + /locus_tag="SPC43_0020" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI34550.1" + /db_xref="GOA:Q4JYS6" + /db_xref="InterPro:IPR003953" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JYS6" + /translation="MYDYLIVGAGLSGAIFAHEATKQGKKVKVIDKRDHIGGNIYCEN + VEGINIHKYGAHIFHTSNKKVWDYVNQFAEFNNYVNSPVANYKGSLYNLPFNMNTFYA + MWGTKTPQEVKDKIADQTAHMKDVEPKNLEEQAIKLIGPDIYEKLIKGYTEKQWGRSA + 
TDLPPFIIKRLPVRLTFDNNYFNDRYQGIPIGGYNVIIENMLKDVEVELGVDFFANRQ + ELEASAEKVVFTGMIDQYFDYKHGELEYRSLRFEHEVLDEENYQGNAVVNYTEREIPY + TRIIEHKHFEYGTQDKTVITREYPADWKRGDEPYYPINDAKNNEMYQRYLEEAKGKDV + IFCGRLADYKYYDMHVVIERALNVVREELGNND" + misc_feature 17129..17728 + /gene="glf" + /locus_tag="SPC43_0020" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 9.6e-133" + gene 17790..18815 + /gene="wcjE" + /locus_tag="SPC43_0021" + CDS 17790..18815 + /gene="wcjE" + /locus_tag="SPC43_0021" + /note="member of homology group 18" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI34551.1" + /db_xref="GOA:Q4JYS5" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q4JYS5" + /translation="MTKNRINWIDFGKGFAIFLVVIGHVFTGLFDSGKFTSDAKWLSI + VIAFIYIFHIPVFFALSGYFFKSVENFKEYYYYMKKKTIVLGLPYIFYSIIHYVLQKI + AGGSVRVPTTLFNLINIYKEPLGVVWYLYTLWALYLVYGFLSIFIKNKNYLFMISILG + YIITLVYMSEIFFIKKVLAWGVIFMLGSVLKTVKFNDIRFRNIILLGIIFNIVYIYIV + YILFNVYGKIITDYNYPRWWIIGYTGNVILSFIIFPKIEKTSQNIFRYFSKYGEISIG + ILIFHSPICSMIRILMLKMGIGSVFLHIVIGIVLGWYLSILATNVLKKIPLLNIVLLP + QRYIKLK" + misc_feature 17805..18776 + /gene="wcjE" + /locus_tag="SPC43_0021" + /note="HMMPfam hit to PF01757, Acyltransferase family, + score 7.4e-05" + gene complement(18856..19017) + /gene="tnp" + /locus_tag="SPC43_0022" + /pseudo + CDS complement(18856..19017) + /gene="tnp" + /locus_tag="SPC43_0022" + /note="Lone member of homology group 0255" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1167 transposase (fragment)" + gene complement(order(19073..19670,19675..20676)) + /gene="tnp" + /locus_tag="SPC43_0023" + /pseudo + CDS complement(join(19073..19384,19410..19670,19675..20676)) + /gene="tnp" + /locus_tag="SPC43_0023" + /note="member of homology group 12" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1670 transposase" + misc_feature complement(19918..20502) + /gene="tnp" + /locus_tag="SPC43_0023" + /note="HMMPfam hit to PF03050, Transposase IS66 
family, + score 1.1e-08" + /pseudo + gene complement(20892..21594) + /gene="tnp" + /locus_tag="SPC43_0024" + /pseudo + CDS complement(join(20892..21344,21325..21594)) + /gene="tnp" + /locus_tag="SPC43_0024" + /note="member of homology group 31" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1671 transposase" + misc_feature complement(order(21009..21344,21325..21329)) + /gene="tnp" + /locus_tag="SPC43_0024" + /note="HMMPfam hit to PF05717, IS66 Orf2 like protein, + score 4.3e-56" + /pseudo + gene 21738..>22097 + /gene="aliA" + /locus_tag="SPC43_0025" + CDS 21738..>22097 + /gene="aliA" + /locus_tag="SPC43_0025" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34555.1" + /db_xref="GOA:Q4K2T2" + /db_xref="InterPro:IPR000914" + /db_xref="UniProtKB/TrEMBL:Q4K2T2" + /translation="MMKSSKLFALAGVTLLAATTLAACSGSGSSTKGEKTFSYIYETD + PDNLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKD + AKWYTSEGEEYAAVKAQD" + misc_feature 21738..21824 + /gene="aliA" + /locus_tag="SPC43_0025" + /note="Signal peptide predicted for SPC1931 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.277 between residues 29 and 30" + misc_feature 21984..22052 + /gene="aliA" + /locus_tag="SPC43_0025" + /note="PS01040 Bacterial extracellular solute-binding + proteins, family 5 signature." 
+ORIGIN + 1 cgaccgtcgc ttcctagttg tggctaactt gtccaatgaa gagcaagact tgacagtaga + 61 aggaaaagtc aaatctgtct tgattgaaaa caccctagct caagaagtct ttgaaaaaca + 121 aatcttagtt ccatgggatg ctttctgtgt ggaattacta taaatatttt ttgcagaaaa + 181 atttaaaatt gaaatcatat aaaaacaagg gaggactgta taaaagacag aaatcctttg + 241 ttttttataa ccaaggttta taaactttca ttctcgaaat tcaattaact ttacaaattc + 301 ccactattaa ggagaaagaa gatgaacata aagaagcgtg tccttagtgc aggtctgact + 361 tttgcatctg ctttgctttt tgatatgagc ccatgttttc tcaataggat tgtactcagg + 421 tgagtaggga ggaagaggta aaagtttatg cccaaactcc tcgcataaaa gttctaactt + 481 acctattcta tggaatctta cattatccat aataataacc gatggtgtgg ttaatgttgg + 541 taagaaaaac ttctgaaacc atacttcaaa aaagtcgctc gtcatcgtct cttcgcaagt + 601 cattggagcg attaactcac catttgttag acctgcaacc aaagaaatcc tctgatatct + 661 tcttccagat actttgcctc ttattaactg accttttaaa gagcgaccat attctcgata + 721 aaaataaata tcgaatcctg tttcgtcaat ctaaacaggt gctaggtgct ttaaactatt + 781 aaaattctta agaaataagg ctactttttc tgggtcttgt tcataattag attgaaacta + 841 gagtagtaca cctctgcttc taaaacattg ttagaaatcg atttaactgt cctgatcgat + 901 ttatcctatt cttgtttcaa tctactatat ttttgtttcg cgggaagtct acttaagata + 961 cttaaagatg cagatagtaa aaaagatgta gacattaccg taaaaaagtg atataatcgt + 1021 atgatattga atgtataggt gttaatcatg agtagacgtt ttaaaaaatc acgttcacag + 1081 aaagtgaagc gaagtgttaa tatagttttg ctggctattt atttattgtt agttggtttt + 1141 ttattgttct taatctttaa gtacaatatc cttgctttta gatatcttaa tctagtggta + 1201 actgcgttag tcctactagt tgcctttgta gggctactct tgattatcta taaaaaagct + 1261 gaaaaattta ctatttttct gttggtgttc tctatccttg tcagctctgt gtcgctcttt + 1321 gcagtacagc agtttgttgg actgaccaat cgtttaaatg cgacttctaa ttactcagaa + 1381 tattcgatca gtgtcgctgt tttagcagat agtgagatcg aaaatgttac gcaactgacg + 1441 agtgtgacag caccgactgg gactgataat gaaaatattc aaaaactact agctgatatc + 1501 aagtcaagtc agaataccaa tttgatggtc gaccagagtt cgtcttactt ggctgcttac + 1561 aagagtctga ttgcaggtga caccaaggcc attgtcttaa atagtgtctt tgaaaatatc + 1621 atcgagtcag agtatccaga ctacgcatcg 
aagataaaaa agatttatac caagggattc + 1681 actaaaaaag tagaagctcc taagacgtct aagaatcagt ctttcaatat ctatgttagt + 1741 ggaattgaca cctatggtcc tattagttcg gtgtcgcgat cagatgtcaa tatcctgatg + 1801 actgtcaatc gagataccaa gaaaattctc ttgaccacaa cgccgcgtga tgcctatgta + 1861 tcaatcgcag atggtggaaa taatcaaaaa gataaattga ctcatgcggg catttatgga + 1921 gttgattcgt ccattcacac cttagaaaat ctctatggag tggatatcaa ttactatgtg + 1981 cgattgaact tcacttcgtt tttgaaattg attgatttat tgggtggaat tgatgtttat + 2041 aatgatcaag aatttactgc ccatacgaat ggaaagtatt accctgcagg caatgttcat + 2101 cttgattcag aacaggctct cggttttgta cgtgaacgct actcactagc cgatggagac + 2161 cgtgaccgtg gtcgcaacca gcaaaaggtc attgtggcta tccttcaaaa attaacgtca + 2221 accgaagcac tgaaaaatta tagcacgatc attgatagct tgcaaaattc tatccaaaca + 2281 aatatgccac ttgagaccat gataaatttg gtcaatgctc agttagaaag tggtggaact + 2341 tacaaagtga attcgcaaga cttaaaaggt acaggtcgga ttgatcttcc ttcttatgca + 2401 atgccagaca gtaacctcta tgtgatggaa atagatgata gtagtttagc tgtagttaaa + 2461 gcagctatac aggatgtgat ggagggtaga tgaaatgata gacatccatt cgcacatcgt + 2521 ctttgatgta gatgatggtc ccaagtcaag agaggaaagc aaggctctct tggcagaatc + 2581 ctacaggcag ggggtgcgaa ccattgtctc tacctctcat cgtcgcaagg gcatgtttga + 2641 aactccggaa gagaagatag cagaaaattt tcttcaggtt cgggaaattg caaaagaagt + 2701 agcagatgat ttagtcattg cttatggcgc agagatatac tatactctgg atgctctaga + 2761 aaagctagaa aaaaaagaaa ttcctaccct taatgatagt cgttatgcct tgattgagtt + 2821 tagcatgcat acttcctatc gtgagattca tacgggattg agcaatattt tgatgttggg + 2881 aatcacgcca gtcattgccc acatcgagcg ttatgatgct ctagagaata acgaaaaacg + 2941 tgttcgtgag ctgattgata tggggtgcta tactcagata aatagttatc atgttttaaa + 3001 atctaagctc tttggtgaaa gatataaatt tatgaaaaag agagctcggt attttttgga + 3061 acgtgattta gttcatgtag ttgcaagtga catgcacaat ttgaacaaac gtccccctta + 3121 tatgaaagaa gcctatgaac ttatctcaaa acaatacggt gaaagaagag cgagagaatt + 3181 atttattgaa aatcctcgct taatcttatc tgatcaaatt atttaggagt tgacatgaaa + 3241 gaaaataaag aaattacgat tgatgttttt caattgttta aagtcctttg 
gaagaagaaa + 3301 acctctatta tactaactgc gattgtagca gctgtcctag cttttgctgt aagtagtttt + 3361 gtactgacac ctgagtattc tagtacgaca cgtatttatg tggtcaatcg aaatcaatcg + 3421 gaaaaagcag ggttgacgaa ccaggatttg caggctggaa cctatctggt aaaggactat + 3481 aaggaaatca tcctctctca agatgtactt gagaaagtca tttcaaatct taaactagag + 3541 aaaacagtta aggaattaag caagaagatt caggtaacag tacctgtgga tactcgtatc + 3601 gtatcaatta ctgtaaaaaa tgcacaacca gaagaagcta gccgtatcgc aaatgctctt + 3661 cgtgaagtgg ctgctgaaaa aatcatttct gtaactcgtg tatctgatgt gacaacattg + 3721 gaagaagcca gggcagccct aagtccttca tcacctaata ttcgtcgtaa taccctgtta + 3781 gcttttttag cgggaggagc agtgatggta gtttcagtct tgttacttga gttgttggat + 3841 gatcgtgtta aacgaccaga agatgtggaa gaagtaatgc agattgcact tctaggggtt + 3901 gttctagatt tgaataagtt aaaataaggg agaaaatatg ccaacattag caatagaaca + 3961 aaaacgttta gattttgcga aaaaagcaga agagaattac aatgctttgc gaacaaatat + 4021 tcaattgagt ggtgataatc tgagagttct ttccatctcg tctgttaaac ctggtgaggg + 4081 gaaatcgaca acatcaataa atattgcttg ggcctttgcg cgtgcaggct ataaagcttt + 4141 attggtggat gcggatattc gtaattctat catgtcagga gtctttaaat caagagaaaa + 4201 aattactggg ctaacggatt ttctggcagg taccactgac ctttctcatg gactttgtga + 4261 tacaaatatt gaaaatttat ttgttattca ggcaggacct gtatccccta acccaacagc + 4321 acttttacag agtgaaaact ttgccactat gattgatact atgcgtaagt attttgatta + 4381 tgtcattgtc gatactgcac cgattgggat ggtcattgat gctgctatta tcacacaaaa + 4441 atgtgatgct tctattttgg taacagcagc gagggaaaca aagcgtcgtg atattttgaa + 4501 agcaaaggaa cagttagaac agacaggagt acctttttta ggagttgttc taaataaatt + 4561 caatacagaa gttgaaaaat atggagctta tggtggctat ggaacttatg gtttctatgg + 4621 aaattatagg aagggatgac ggagtaattg ataaaaatat attttgtttt taaaaatatt + 4681 ttagatagat ttttggcgtt tttcctattt attactttga taatcatacc gattattcct + 4741 ataacaattt tggctatttg gatagaagat ccaggagatg ttttctattt acaagataga + 4801 gttggtttaa atggaaaaaa attcaaagta ataaagttcc ggagcatgta taaagatgcc + 4861 gatcagagaa taaagaaaag tattaatagt ggtaaaactg agcgtctaaa ttttaaagaa + 4921 cattctcaaa 
gtatgactac aaaagtcggt aaagtgatac gcaaactttc aattgatgaa + 4981 ttacctcaat tattgaatat tataaaaggt gatatgtcta tagtcggacc tcgtccatta + 5041 caacagtttg aaatcactca tcatattctt acccataaag aaatgggtat tgctttaaag + 5101 atgtctaaaa gattgtctgt gaaacctggt ttgctttgtt attggcaagt tacgccaaat + 5161 aaaaatgaca tgccttttgc tgacagaatg gatctcgatt tattatatat tgataatgta + 5221 tctttcaaga ctgatttctt gcttatttta aagggttttt ttacagtttt aatgggtaat + 5281 aatagttaac atgaagaata taaaaatatt agtagcgaca cataaaaaat ataaaatgcc + 5341 cagtgataca aatatgtatc taccaattca tgtaggatgt gaaggaaagg aaaaattagg + 5401 atttcaaggt gataattctg gcgaaaatat ttctttttta aatccttact actgtgaact + 5461 tactggtctc tattgggcat ggaaaaattt agagtgcgac tatttaggtt tggtacacta + 5521 tcgtcgttat tttactaaaa tgactaaagg gtacaatgaa tcaataaata ttgatgatgt + 5581 aattttaaat aggtttgaag tggagaaatt gttagagaac tcagaagtca tcgttcctaa + 5641 aaaaagaaag tactatatag aaaccctcta ttctcactat gctcatacct tggatgctag + 5701 ccacttagac ctagctagaa aaatgattga acagaaaaat tctgaatatc tagcaagttt + 5761 tgataaggta atgaagcaga gaagtggcta tatgttcaat atgtttatta tgaaaaaaga + 5821 actagccgat gattatttca cttggctatt tccaatttta gatagcatgt atgaatgtat + 5881 ggatttatca gacttaactc cttttgaagc ccgtcttttt ggaagagtaa gtgagttgtt + 5941 atttaatgta tggttgtcga agaataactt gactcctacg gaagcacatt ttatgtatat + 6001 ggaaaaagta aatctattta agaaaggttt atcattccta caagcgaagt ttttcaaaaa + 6061 gaaatataaa gaaagtttct agaggaggaa atatgtctga gataaaaata attcaaaata + 6121 aaattttaga aatacttaaa atttttatcg aaacatgcga agaaaataac ttgacgtatt + 6181 atgcactagg tggaacatta ttaggagccg ttaggcatgg tggattcatt ccttgggatg + 6241 atgatataga cattggtatg cccagagaag attatgagaa atttaaaaaa atagctagca + 6301 aaaaatttaa tgatagatat ctatttttga gtgaagatac tccaggttat aaaaaagctt + 6361 tttctgtaat tcgagatact tcaacaaaga ttgttatgaa ttatagtaat atagagcaag + 6421 aggagagttt gtggatagat atatttccta ttgatggtct acctgaaaaa ggtgtgaaga + 6481 gaaaactaca cgagaaacag tacctattta gaagaatgat ggtacagtta tctcaattca + 6541 attcaatagt gaatcaaaat aaaaccaaca 
gaccttggca agagaaagta ataattaaaa + 6601 ttgcagggat tttaaaaatt gaaaatttac tgtcttttga aaaagcgcaa caaaagtatc + 6661 tagctactat aaagaaatac agtataacag agggttatgc aggtaatttt acaggggcat + 6721 ataaacttcg tgagttagtg ccaagttgtt attttggtga acctgttaaa ttagattttg + 6781 aaggaataaa actgaactgt ccaaataaat ataaagatta tctcaaagca atatatggtg + 6841 ataattatat gacattacct ccaattgaac aaagacttcc ccatcaatat gaaattgtta + 6901 gtttaggaga atgatgataa atgaataaat taagaaaagc tttaaattat tatcaagaca + 6961 taagcaaaaa aagatcatat tttcctaata atgtactaaa ttggcaattg ttaggaaagt + 7021 ttcttggaca aataccatat cttataggag aaaataatgc gagaaaaatt tgtgaaaaaa + 7081 ggcacaatgt aacaagagga tttttggaaa aagaatttta tgaatttata ataaattatg + 7141 aatttaacac ttgtaatcaa aaaaatagta aaattatttg gacattgtgg atgcaaggat + 7201 atgaaaatgc gccagaatta gtaaaaagta caatcgatag tataagaaaa tttgctgaat + 7261 taaataattt tcagtttata ttgttagaag agaatacgat agaaaaatat atagtatttc + 7321 ctaagctgat aaaggagaaa atggatttag gtgttataga ttatactaaa atttcggata + 7381 tattaagagt ttcattgctg gcaaaatatg gagggacatg ggtagatgcg actatatata + 7441 tgaaagaaga gtttgattca tcattattat tacagaatta ttatactata aaaacaggag + 7501 gaatagagga ttattctcct aatatttcga ataataggtg gaaaggtttt tttttatcag + 7561 gtaatagttc attatttagc tttactcgtg attttttctt tgaatattat agcagatacg + 7621 atatcgctgt agattattta ttgatagatt atatttttga tatagcttac aaatacgatg + 7681 agaagattaa aaatcaaatg cttgaattag aaaaatctaa tcataattta ttttggttag + 7741 aaagtcattt aggagatgag tttgatcaaa aagtgtggga taatattaca gaaactacta + 7801 aaatattcaa aacaacgtat aaattatctg aagaaattaa atcaaataag aataattttt + 7861 attccaaact aatagataga aagttataga acgagaaaat gaagaaaata gctttagtga + 7921 aatggatttt ggatgattct ggtggtggtg agcgagttgc tgtatctttg gcaaacgaac + 7981 ttacaaaaaa gtatgaagtt tatttaattg gaattacaac aaagcaatcg gatttattct + 8041 ttgaaatcaa ttctcaagta aaatactcca atttttttga ccatcgagta cgcttgtcta + 8101 agaatattct aaagatctca aaaatgttaa aaaaatattt tgtagataat gagatagata + 8161 ttgcctttgg aatagggata actgctaata tatttttatc tttggcagga 
ataggaatat + 8221 ccacccaaat agttttgtgt gaccatacaa attcaattac agacaataga gaattttctc + 8281 agaaagtcca aagatatgtt ggagcaaaat gtgcagacaa gattatcact ctcacacaag + 8341 aagatcgtag aagttatata aaaaaatatg gtatttctga agaaaaaatt gattatgtct + 8401 ataattggaa agaagatggt ctttccaatg taccttataa tgatgagtca atgaaaattg + 8461 ttacagtagg tcgtttggat tatcaaaaag gctatgatta tcttgttcaa gttgctaaga + 8521 aagtactgaa agaaaagact ggctggactt gggaaattta tggttctggt aatcaagatg + 8581 aggtagataa aatcaaggat ttaatcatca aaaatgattt gcaagataag ttagtcatta + 8641 aaggtcttga aaaaaatcag gctatgattt atggagataa aggaatttat gtcatgactt + 8701 ctcgttatga aggattaccc ttggtattgt tagaagctca acaatacaat cttcctattg + 8761 ttagcttcag gtgtccaacg ggacctaatg agattgttga agatggggtc aatggtcatc + 8821 taatagattg ttatgatacc gataagatga gtgagagact acttgaattg atggaagatt + 8881 cgaacttgcg aacttccttc gccaatcatg ccaaggataa tatggataaa tttgataaag + 8941 ataaaataat tcaacagtgg attgatttaa ttgaggaaat gactggaggg aataattttg + 9001 aaagctaaaa tgttaatttg tataactagt ttaacaggtg gaggagctga aaaatcactt + 9061 gttaacttta ttcaagaatt tgaaagtatg tttgaaatta gcattctagt atatacggaa + 9121 aaaaataatt tttatggctc aaaattaagt catttaagga ttgattattt tattagaaag + 9181 aatacaccag ctattattga aaaaatagtg aataagcttg ttaagttatt accaccgtca + 9241 tttgtgaata gatggattat acagagaagt atttttaaaa atgaaaaatt tgattatgaa + 9301 tttgcatata tggaaggaaa acctacaaaa atcatagcgg gatcatcgaa tgaagatagc + 9361 ttaaaactgg cttatatcca ttgcgatttc tcaaaaaatt ggtattcaaa acgatcgttt + 9421 aaaaatttta aagaggaatt gacttgttat caaaagttta attcaatctt agctgtttct + 9481 actccacaaa aagaatcctt tgaggagatt tttccaaaga caaatttaga agtaatccct + 9541 aacttgctta acattgatga aataaaaaat ttaagtaaag aggaaataga attagaaaat + 9601 attccttatt tttgtgcgat aggaagatta gaacttgtta aaaattttga attattaata + 9661 aatgcttttc atttatttag aaaaaagtat tcacaatatc atttaattat tttgggagat + 9721 ggtagtttat atgatcattt aaagaatcaa attaacaatc taggagagag ccaatatata + 9781 aaattattag gttttcaatc taatccatat aaatatataa agaatagtgt gggattaatt + 9841 caaagttcag 
tatcagagtc ttttagttat gtattagcag aagcagctgc tttaggcatt + 9901 cctagtattt caacaaaaac tcaaggttct gaggttatgt cagaatattt cgaagtaatc + 9961 caggtagagc atacgagtaa cgaattagca aaagggctag agaaagtcat tgcgaacaac + 10021 tttgttaacg ttcattttaa ttttaatgaa gaagcttatt acaaattttt agagatattt + 10081 aagaaaggaa gtagaagttt tgaaattcga agagaaatat aacacattgt tcaatataat + 10141 tttttctctg ttaacaatat tgtatctact gaaatttgta aatattgaca gaattgatgg + 10201 aatttctatt gtaatcctta tatgtatatt attcctgttt gtgatgcata gtcttaaata + 10261 tggaataaat agattaaaac taacttcctt aatattgttt tttttaacat ttattttgaa + 10321 tctttttaat ggttctacat ttctagaaat aacgtacttc ttcttattat atacaattat + 10381 attaaaagat aataaaaaat ttttcaaaat acattttatt acacttacag tattcgtgtt + 10441 aacaattata ttattgtccc atattggcta tattagtaat tttgtgatat atagatcaaa + 10501 tggtggtatt aggaatagtt taggatttgt acacccgaat tcattagggt taatgatcta + 10561 ttccttaacc gtttgtagtt taaatctttt tgaaataaaa agattcaaat tcttcttcta + 10621 tttattttta ttattgatga atttatggat attacagtta gcagactcta gaacatcagg + 10681 atatataagt attttagtaa ttgtcttttg ttactttttt gataaaatag gtaagttaaa + 10741 tagaccgttg agtagttttt ttattaattt ggctattaca atgtctgttt tgtttataac + 10801 tttaatgtca attaattttg aagccagtca tattttccaa ttcttaaata aattgttcac + 10861 taatcgaatt tttagtagtt atgtattttt tagagaatat ggggttactc tatttggcaa + 10921 aagaattgat ggaattgtct cattagttca aggaacagtc ataattgaca gtggttatat + 10981 aggattgcta ttacaaaaag gaattatttt ttttgtgtta tttttgctat ttattttttc + 11041 tagaataaaa gaatactcat ttacactaag agaaggtatt ctactgatta gtgtatttat + 11101 ttctcttatg tttgagagct atggttacac cgtatttcta ttcccaatat tattttttga + 11161 ttatttagga aaaaggaagg aaagtattaa tgaataaaat taccgtattt acaccaactt + 11221 ttaatagagg gtatttaatg aataagttgt ttcattcatt aaacagtcaa acaaataaac + 11281 attttgaatg gcttattgta gatgatggtt caatagatca gactggtgag cttgttgaaa + 11341 catttaagga acaggcaaat tttgaaatac gatattttta tcaacaaaat ggtggtaagc + 11401 atagagcaat taatcatggt ttggatttag ctagagggga gttattcttc atcgttgatt + 11461 ccgatgattc 
attgacagat gatgctattg agaaaatttt taataactat tctggaattg + 11521 cctttaatca tagttttgca ggcatagcat ttaatagagg tttctctaaa aaaagaatag + 11581 ttggagagac ttttgaagga acatatatag attgtgacaa tttacatcga gctaaacata + 11641 atattttagg agataaggca gaagtatatc gaacagatat tttaaagagt attaagtttc + 11701 cagtggtaga tggagaaaac tttatgagtg aagttgtctt atggaatgaa gttgcaagaa + 11761 ggggttataa attacgttgg tttaatgaca taatttattt ttgtgactat ttagaagacg + 11821 gattaaccaa aaatagtgaa aaaattttat ttaataaccc agttgcacat caaatgatga + 11881 ccaaggaatt gttacaaatt gattttacat taaagagaaa atttgggatg atctataatt + 11941 atcataaaat tagaaaccaa agtattaagc aaactgctat taatcttgaa cagcctctaa + 12001 ttttagtata tatggtagta atgatggcta gaattagaaa aattgttaag ggggtgaaaa + 12061 atgagtaact tatattatat tcatgaagag tttggtagtg attcaacggc ggctacaaaa + 12121 gcaccaaatg atttacagaa aatatttcaa gactgtaaat ttaaaccatt agtaacatta + 12181 aaaaaaaata gtaaaatagt aagaatattt gattacgcgt ttaaactttt gttgtgtctt + 12241 attagaatta gaagtaatga tattgtgata tttcaatttc cttttgctac tcatgggaaa + 12301 ctaaaaaatt ttttaatgaa attactacaa tataaaaaag ctaaaatgat ctttttaata + 12361 aacgatttag agtcgttaag atattcggga aataaaaaaa atctaatttc taaggaacag + 12421 tatattaaaa atgctgatgt gattatttgt cataaccaac gaatgaagga gtttttaata + 12481 gaaaataaga ttgacagtga aaaaatagtt gtactcggtg tttttgatta tttactggat + 12541 aagtttaata aagaaaaagc atcttttgat aaaacagttg taattgcagg gaatctttcg + 12601 cctcaaaaaa gtggttattt aactgagtta ttaaaaaatg aaaatagaat aaaatttaat + 12661 ttatatggac ctaattttac ttcatcgact aacaataatg attgtgtatc atataaagga + 12721 agtttttcgc ctgaaaaaat tccttttata cttgaaggtg attttggatt agtttgggat + 12781 ggcgattcta tattaacttg ttcagggatt actggggagt atttgaaata caataatcct + 12841 cataaagtgt cgttatttat agcttcaaaa ataccagtta ttatttggaa acaatctgcc + 12901 ttgagtgatt ttgttaaaga aaataatatt ggaattgtag taaatgattt aattgaaatg + 12961 caagagatta ttactaatat gactgaagag caatatgaga tttttagaga aaatattgaa + 13021 cagttgtcca aaaaggtaag gcaaggctat tttacgaatt tagcgattga aaaatcttta + 13081 agcataataa 
aaaataatct caataattat tttgaggaag attgatatga aaaaagaaga + 13141 atataatttt ttaaaagtcc tcacaatatt attagtagta ttaggacata gtacgtatta + 13201 tattattaag atgaattttg gtgggattga ttattatcac tatataaata ataatgattc + 13261 aattatagta ataaattttt tcaaaaaaat aacagagatt atctattact ttcatatgcc + 13321 tttatttatg gcaatatctg gagcattttt cagaattcaa gttgaaaaaa ataagtggca + 13381 aagtccttta gagttattcc agaacaaatt tagaagacta ttaatcccat ttattatttt + 13441 tacgattttg tatactattc ctatgaaata tatttcaaac tattttatac aaacgagtat + 13501 ctttaatgcg attattggtc aactgttttt atttgggaac actcatctgt ggtatttata + 13561 tgcattgttc attattttta tgattgccta cttcgttttg aaaaaagata cgggttttgg + 13621 aatgttactg ttcctatttg cacttcattt aatgagttac aaaattaata ttacgttaat + 13681 aaaaagtgcg tttcaatttt tattttattt tgcgattggt tttaaatttg aacaaaaaag + 13741 agaagtatac aatcatttat tgaatcatac caagaaattt gtatattttc ttttaatcgg + 13801 atttgttgtg ttaattttca tgaatttggg tattaagaga tactcaatta ttttttcaaa + 13861 gctacttgaa gaaattttag cattgtatgg aagtttggta acttatacta ttgcttatta + 13921 tttatcaaga aacacgaaat ggatgaatac cagaatatac cagtttattt tagtcaatgg + 13981 tctaggaatt tatatttttt cggatactct taattatttg atattaaagt ggggctttat + 14041 tgttgctgag gatttaatga ttacacctca tggaattatt ttgatggtaa tttttcgatt + 14101 tttggtaaca ttaattttaa gtttgctgat tactttagca tttaaaaaac tatttccgaa + 14161 gtataaatgg ttagtgaatt aaaaaatttt atagagcgta aaaacgtaaa ggagaaaaaa + 14221 tgtgtattaa aaagtttctt aaaaagagtc atctgaccaa aggaatttat caacaattac + 14281 aaagaaaaaa gaatcaatat cgcttagaaa aaaaatttaa atatacaggg aaatttattg + 14341 accgtaaaaa agatagtaaa gatttatgta tcatattagc ggggtataaa gaatttttat + 14401 atgacgatgt gctaggaaga gtaaagacat ttgcaccaga aacaatggat atttgtgtcc + 14461 tatcttctgg catctattca gaaaaattaa accaaatttg tgaagaaaat aattggtcgt + 14521 atttgagtac ggaacagaac aatatatctt taattcaaaa cgtagctatt aatctacatc + 14581 ctcaagcaaa atatatttat aaaattgatg aagatatttt tattacagaa cattattttg + 14641 aaaatttaaa agaagcatat atttttgcac aagaagggga ttatgcaccc ggtgtagtag + 14701 caccactcat 
tccggttaat ggttatggac ataaaagaat cttacaaaaa ttaggcttgg + 14761 aagatgttta ttatgaaaaa tttggagaaa aatcgaaata tatagctgga cagcctcgtt + 14821 ttatagagag taatcccgaa gtagcgaagt ttttctggag cgatggagaa gtaattccta + 14881 ctatagatac aatgaatgca caattttcaa aagaagagaa aaaagtgaat ccgtgtgcaa + 14941 ttcgcttcag tatcggtgca attttatttg agagaagctt atgggaactg atggattatt + 15001 ttaatgttga gtttgaggga gctggacttg gagtggatga agtccaaatt tgtaattttt + 15061 gcatcttaaa ttcaaaacca ttgatggtca gtgaaaatgt ggttgtggga catttatcgt + 15121 ttggtcctca gaataaggct atgttcgaat attataaaga acatccagaa aaattttcta + 15181 tttagatgag ggataatatg acaagttata aagttaaatc tatcaggtat aattttataa + 15241 tgaattttat tttgactgtt tcaaatttca tctttccatt gttaactttt ccctatgttt + 15301 ctagagtact tcaagttgag gcgaatggta ctgtagcata tgtatcatct attgtatctt + 15361 attttatgat gattgcttca cttggtattc caacgtatgg catacgtgct gcagcaaaag + 15421 tacgtgatga taaaagaaaa ttatctacca ttgtccaaga actattgatt attaatgtaa + 15481 ttcttgtatt cttagtactc attgcatatt ttataatgtt gtttacttta cagtcaatgt + 15541 acgtctataa agaattattc tatatcaatg caataggtat actattaaat gtcataggag + 15601 ttggttggtt ttttcaagca attgaacaat atgattatat tactcttaga tcgattttct + 15661 tcagactttt atcattagct atgattttct tacttatcca tagtcctgag gattatatta + 15721 tgtatgcagg aatttctgtt tttgctagtg tgggatcaaa tattttaaat tttaaacgat + 15781 tatttgaata tatatcattt aaaaagacag aaacttatca ttttaaacca catataaagc + 15841 cgattttgat tttatttgct cagacattgg tagtgtcgat ttatacgaat cttgataccg + 15901 ttatgctagg aagtatgaaa ggaacatatg atgtgggatt atatactgca gcaacaaaac + 15961 taaaggggat tctcttgagt gttgttactt cattaggaaa tgttttgctt ccaagaatgt + 16021 cctactatgc taataatcaa atgaaagatc ggtttttgga aatcataaca aaagctttga + 16081 actttacgtt attcttatcg cttccattgt cagtattctt tatttcagta tcaaaggaaa + 16141 gtattttgct acttgctggg gaaggatatt taggtgctgt tataggaatg caatttttaa + 16201 tgtttgcagt tattcctaat gcacttacgg gtttattagg tattcaagta ttaacacctt + 16261 tagaaaaaga aaagtacgta ttactttcag tgacttcagg agcgttaata gatttactac + 16321 taaacttcat 
tttaattcca gcttatggtg taagtggagc agcatttgcc actatgattg + 16381 cagaattcgt tgtattatgc gttcagattt actatacgag agatttgcta ttaaagaggc + 16441 tacatcaaat agttggcatt agatatctat gctcggtagg ggtgagtact attggaattg + 16501 ttcttgtaaa gaaattacaa ttaagtgatt ttttgttatt atgtgtggaa ggaatcattt + 16561 tctttggaag ttacggtgtg attctagtgt tgttaaagga tgatttcatt cttgattttt + 16621 ttaaaatttt ctataagaaa ttaaagaaaa tttaactaat taattttgaa aatttaattt + 16681 taaaggagaa aaaatgtacg attatcttat tgtcggagct ggattgtcag gtgcaatctt + 16741 tgctcatgaa gcaacaaaac aaggaaaaaa agtaaaagta atagataaac gtgaccacat + 16801 tggtgggaac atctattgtg agaacgttga aggaatcaat atccataagt atggtgccca + 16861 tatcttccat acctctaata aaaaagtttg ggactatgtc aatcaattcg ctgagtttaa + 16921 caactatgtc aactcacctg tcgcaaacta caaaggaagt ctttataatc ttcctttcaa + 16981 tatgaatacc ttctatgcga tgtgggggac aaaaactcct caagaagtca aggataagat + 17041 tgctgatcaa acggctcaca tgaaggacgt tgaacctaaa aacttggaag aacaggctat + 17101 caagttgatc ggtccagata tctatgaaaa gttgatcaaa ggctacactg aaaagcaatg + 17161 gggacgttct gcgactgacc ttccaccgtt tatcatcaaa cgtctaccag ttcgtttgac + 17221 ttttgataat aactacttca atgaccgtta ccaaggaatt ccaatcggtg gttataatgt + 17281 cattatcgaa aatatgttga aggatgtgga agtagaactt ggagttgact tttttgccaa + 17341 tcgtcaagaa ttagaggctt ctgctgaaaa ggttgtcttt acaggaatga ttgaccaata + 17401 ctttgattat aaacatggtg agttagaata ccgtagtctt cgttttgagc atgaagttct + 17461 tgatgaagag aactatcaag gaaatgcagt tgtaaactat acagaacgag aaattcctta + 17521 tactcgcatt attgagcata aacattttga gtatggtacg caagataaaa cggttattac + 17581 tcgtgaatac ccagctgatt ggaaacgtgg agatgaacca tactacccaa tcaacgacgc + 17641 taaaaataat gaaatgtatc aaagatattt agaagaagca aaaggtaaag atgttatctt + 17701 ctgtggtcgt cttgcagatt ataaatatta tgatatgcac gtagtaatcg aaagagctct + 17761 taatgtagta agagaggaat taggtaataa tgactaaaaa tagaataaac tggatagatt + 17821 ttgggaaagg gttcgcaata tttctagtag tcataggtca tgtgtttact ggtttatttg + 17881 attctgggaa atttacaagt gatgccaaat ggttatccat agttattgca tttatatata + 17941 tattccatat 
tccagtattc tttgctttat caggatattt tttcaaatct gtagagaatt + 18001 ttaaagagta ttattattat atgaagaaga aaacgatagt attaggatta ccgtatatat + 18061 tttattctat aattcattat gtattacaga aaatagcggg aggatcggta cgtgttccca + 18121 ctacattgtt taatttgata aatatttata aagaaccatt aggagttgta tggtatttgt + 18181 atacattatg ggcactatat ttagtatacg gatttttatc aatatttata aagaacaaaa + 18241 actatctttt tatgattagt atactcggat atataattac attagtatat atgtcagaaa + 18301 tattttttat aaaaaaagtt ctagcatggg gagtaatttt catgttgggt tctgtattaa + 18361 aaacagttaa atttaatgat attagattta gaaacataat tctactagga atcatattta + 18421 atatcgtata tatttatata gtgtatattt tatttaatgt atatggtaaa ataataacgg + 18481 actataacta tcctagatgg tggattattg gatacacagg taatgttatc ttatcattta + 18541 taatttttcc aaaaatagaa aaaacatccc aaaatatttt taggtatttt agtaaatatg + 18601 gggaaattag tatagggatt ctaattttcc attcaccaat ttgtagtatg attcgaattc + 18661 taatgttaaa aatgggaatt ggttctgttt ttcttcatat tgttattggt attgtcttgg + 18721 gctggtattt atcaatactt gcaaccaatg tattgaagaa aattccatta ttgaatattg + 18781 ttttactacc acagagatat attaaactaa aataaaaagg ctctttgtca actgtagtgg + 18841 gttgaagaaa agctaagctc gagaaaggac aaattttgtc ctttcttttt tgatattcag + 18901 agcgataaaa atccgttttt tgaagttttc aaagttccga aaaccaaagg cgttgcgttt + 18961 gaggaattta atgagattat tagtcgcttc taatgtaacc gcccaataac gaagtctatt + 19021 gaaaaatctc cagactagag aactcatata tagttcctaa tctggagatt tcttatttgc + 19081 acttttcttg tacaacttta gtccatggta aataagcctc taaaacctct ttgtttacga + 19141 gagtttcctc gtttggaaga cattctagaa gataggatag atatttctcg ctatttataa + 19201 tggattgaaa taagatatga acaaattgat taggaaagga aaattgattt atagaaatgt + 19261 tttagcagtc gatgcgtact gttatagatt caacgcacta taattgatga cgtttagctg + 19321 tttccaacaa gctcataata atagctcttg ctttagctcc ttcaaaactt tgagaaaata + 19381 accaccctcg cttttttaaa ctgagctcag gctaaaagag tccactggac tcttttactc + 19441 cgtcccataa ccaatgattt aatggcgcgt tcagctagat tattggaaag gaccagatgt + 19501 ccgtctttta aaatagtctt aaaggtttct ttatacttga ggctgtattc aattgccctt + 19561 cctagttttg 
aacctgctaa aactgactga cgacggcacc aagcaaagaa gtcttccatt + 19621 aggggttgga gctcttcttg acgtttctgt agtcgttcat cagctgacaa tgtcctccca + 19681 gtctctttcc aaggcaaata actgatcaca ataagctaaa cctttagctc ctaaggatga + 19741 tttatctgct tgcttggggg tcgcttcaaa aaatttcctt ctcacatgcg cccaacatcc + 19801 aacaagttca gcttcttcca gttgacgata agcttctagc ggttcgcagt ttaccaagct + 19861 tagcgtcgcc ttgctcctaa accttggact gctatcgcat aggcagaact agaggactaa + 19921 agtcctaagt tactgccgca acatatcaca atgaacatag ccagaataat ctcctaggaa + 19981 ttcttgtact accgaaccac tccgactctg atcatgatgg tacagcgtga ttgcttgatt + 20041 ctcaactttc ccagacaaaa aggtccaata gtaggtcaga tggctatgac tctctagaac + 20101 ccgataagag gtttcatctg catgaagaag agcttgttct aacaactttt ctcgtaaaag + 20161 attataaagg ggctccaaat aatagtgact cgtcttgata tgccaattag aaatttcctt + 20221 acgtgtgatt ggtaaaccca tcttagccca atcttcttct tagtgataat tgggtacctt + 20281 cagaataaac ttctgatgga tggtgtgagc gataatagaa gctgagccaa ggctatgcgc + 20341 caaaggggct ttaggaatag gagctttcac gattttatca ctccgatttt tatcactgca + 20401 tgcttggcac ttataagcgt gttggatatg atctattcgt tttaattgcg caggaataaa + 20461 gactaattct tgtcgttgaa gggttgctcc aatctctttt agatcatcct gacaatcagg + 20521 gcaaatgctc tcttctactt gatgatgaac tttttctgaa tcaaattggg caagaagagc + 20581 ttggcgtttc cctttagatt tcttacgttt gtaggtaatt tcctctgttt caactgggaa + 20641 catctccatc tttctcagat ggagactctt cctcaaaaag gttgagttgt ccagaagggc + 20701 aaacactttt ctcagaggat tttccataga gcttttgcgt tagataagcc acttgttcac + 20761 gcagaaggga aagttcatta gtgagactat caattatagc actctgttgt tgaatgattt + 20821 tcaatcttct tccatgagct tccctctcta ttttctaact ttattatact aaaaagaaag + 20881 tcctcatttc aatagaaatc acgactttct gatgaattta tagtaaaatg aaataataac + 20941 aggacaaatc gatcaggaca gtcaaatcga tttctaacaa tgttttagaa gcagaggtgt + 21001 actattctag tttcaattta ctatattttt ggagtgatag aaaagccctt cataagccag + 21061 tctacttgtt ctggtgtgag agctttgaca tccttttctg tactgggcca agtcagtctg + 21121 ccgttctcaa agcgtttata tagtagccaa aatccttgac catcccagta aagggcttta + 21181 aagcggtctt 
tacgtccacc acaaaagaga aaaacttgac ctgagaaagg atctaattca + 21241 aagtgggttt taaccagata agccagtgaa tcaatgcctt gcctcatatc cgttttccca + 21301 cacacgagat agacctgccc taggctaaat agatgaattg tcatagagca acaccttatc + 21361 caaaagctgt tctatcattt cgagattgag agattgaaaa aaacttactt caagcttgcc + 21421 aatacgaatt ttaagcagaa tatcatttct ctttttagaa tcaaaacgac gagattgtgg + 21481 aatctctaca ggaacaatag gttgtggcat taaaatatcc tccaatagtt ttactttact + 21541 aatagtatac aggaggagct ccatgaatga tagatacctt gttatgacgc gcttacgata + 21601 tagttgaggg atttttaaat gatattcata ttttttgcaa agatgttgtt tgaaaaataa + 21661 ttttcaaaaa ttctgaaaat tctgttgaca actttctgaa aagagtctat aatggagaga + 21721 aagttttaaa ggagaaaatg atgaaaagtt caaaactatt tgcccttgcg ggcgtgacat + 21781 tattggcggc gactacttta gctgcatgct ctggatcagg ttcaagcact aaaggtgaga + 21841 agacattctc atacatttat gagacagacc ctgataacct caactatttg acaactgcta + 21901 aggctgcgac agcaaatatt accagtaacg tggttgatgg tttgctagaa aatgatcgct + 21961 acgggaactt tgtgccgtct atggctgagg attggtctgt atccaaggat ggattgactt + 22021 acacttatac tatccgtaag gatgcaaaat ggtatacttc tgaaggtgaa gaatacgcgg + 22081 cagtcaaagc tcaagac +// + diff --git a/public/res/serotype_genbank/serotype_44.gb b/public/res/serotype_genbank/serotype_44.gb new file mode 100644 index 0000000..5a92022 --- /dev/null +++ b/public/res/serotype_genbank/serotype_44.gb @@ -0,0 +1,1097 @@ +LOCUS CR931717 24095 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain Hammer (serotype 44). +ACCESSION CR931717 +VERSION CR931717.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 24095) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. 
+ TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 24095) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..24095 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="Hammer" + /db_xref="taxon:1313" + gene <1..163 + /gene="dexB" + /locus_tag="SPC44_0001" + CDS <1..163 + /gene="dexB" + /locus_tag="SPC44_0001" + /codon_start=2 + /transl_table=11 + /protein_id="CAI34743.1" + /db_xref="GOA:Q4K2R1" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K2R1" + /translation="DRRFLVVANLSNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVP + WDAFCVELL" + gene 322..490 + /gene="aliB" + /locus_tag="SPC44_0002" + /pseudo + CDS 322..490 + /gene="aliB" + /locus_tag="SPC44_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(488..1009) + /gene="tnp" + /locus_tag="SPC44_0003" + /pseudo + CDS complement(488..1009) + /gene="tnp" + /locus_tag="SPC44_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase (fragment)" + gene 1222..2676 + /gene="wzg" + /locus_tag="SPC44_0004" + CDS 1222..2676 + /gene="wzg" + /locus_tag="SPC44_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI34746.1" + 
/db_xref="GOA:Q4JYS2" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4JYS2" + /translation="MLIMSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNI + LAFRYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLLFSILVSSVSLFAVQQFVGL + TNRLNATSNYSEYSISVVVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNT + DLTVNQSSSYLAAYKSLIAGETKAIVLNSVFENIIELEYPDYASKIKKIYTKGFTKKV + EAPKTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPI + ADGGNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVH + NDQEFSALHGKFYFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKL + TSTEALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDL + PSYAMPDSNLYVLEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1222..1347 + /gene="wzg" + /locus_tag="SPC44_0004" + /note="Signal peptide predicted for SPC1935 by SignalP 2.0 + HMM (Signal peptide probability 0.991) with cleavage site + probability 0.537 between residues 42 and 43" + misc_feature 1435..1782 + /gene="wzg" + /locus_tag="SPC44_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 1.8e-63" + misc_feature 1960..2403 + /gene="wzg" + /locus_tag="SPC44_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 1.5e-69" + gene 2678..3409 + /gene="wzh" + /locus_tag="SPC44_0005" + CDS 2678..3409 + /gene="wzh" + /locus_tag="SPC44_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34747.1" + /db_xref="GOA:Q4JYS1" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4JYS1" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRIIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKSKLFGERYKFMKKRAQYFLEQDLVHVIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 2681..3289 + /gene="wzh" + /locus_tag="SPC44_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 
1.3e-36" + gene 3415..4110 + /gene="wzd" + /locus_tag="SPC44_0006" + CDS 3415..4110 + /gene="wzd" + /locus_tag="SPC44_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34748.1" + /db_xref="GOA:Q4K1W4" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K1W4" + /translation="MMKEQNTIEIDVFQLFKTLWKRKLMILLVALVTGAGAFAYSAFI + VKPEYTSTTRIYVVNRDQGDKSGLTNQDLQAGSYLVKDYREIILSQNVLEKVATNLKL + DIPAKTLARKVQVTVPVDTRIVSISVKDKQPEEASRIANSLREVAAEKIIAVTRVSDV + TTLEEARPATTPSSPNVGRNSLFGFFGGAVVTVIAVLLIELFDIRVKRPEDVEDVLQI + PLLGVVPDLDKMK" + misc_feature 3415..3531 + /gene="wzd" + /locus_tag="SPC44_0006" + /note="Signal peptide predicted for SPC1937 by SignalP 2.0 + HMM (Signal peptide probability 0.729) with cleavage site + probability 0.460 between residues 39 and 40" + misc_feature 3436..3852 + /gene="wzd" + /locus_tag="SPC44_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 1.4e-54" + misc_feature 3958..4035 + /gene="wzd" + /locus_tag="SPC44_0006" + /note="PS00217 Sugar transport proteins signature 2." 
+ gene 4120..4794 + /gene="wze" + /locus_tag="SPC44_0007" + CDS 4120..4794 + /gene="wze" + /locus_tag="SPC44_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34749.1" + /db_xref="GOA:Q4JYR9" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4JYR9" + /translation="MPTLEISQAKLDFVKKAEENYNALCTNLQLSGDDLKVFSITSVK + QGEGKSTTSINIAWAFARAGYKTLLIDGDIRNSVMLGVFKARDKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVI + DAAIITQKCDASILVTKAGEINRRDIQKAKEQLEHTGKPFLGVVLNKFDTSVDKYGSY + GNYGKK" + gene 5141..5740 + /gene="wciI" + /locus_tag="SPC44_0008" + CDS 5141..5740 + /gene="wciI" + /locus_tag="SPC44_0008" + /note="member of homology group 29" + /codon_start=1 + /transl_table=11 + /product="putative initial sugar transferase" + /protein_id="CAI34750.1" + /db_xref="GOA:Q4JYR8" + /db_xref="InterPro:IPR003362" + /db_xref="UniProtKB/TrEMBL:Q4JYR8" + /translation="MYRVTKRLGDILLSLIGIIVLFPVFIVIAIAINTDSEGPIIFKQ + KRFRIYKEPFYILKFRSMKIGAPKNVAPRNLDNPEQWITKVGAFLRKTSLDELPQLWN + ILIGNMSIVGPRPAGINELDLLTEREKFGANDVLPGLTGWAQINGRDTLSIEMKAEAD + GYYVKHMSLSMDLRCIIRTIPYVLKRKGIVEGSGKKELD" + misc_feature 5141..5233 + /gene="wciI" + /locus_tag="SPC44_0008" + /note="Signal peptide predicted for SPC1939 by SignalP 2.0 + HMM (Signal peptide probability 0.994) with cleavage site + probability 0.844 between residues 31 and 32" + misc_feature 5156..5710 + /gene="wciI" + /locus_tag="SPC44_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 4.6e-30" + gene 5706..6971 + /gene="wciJ" + /locus_tag="SPC44_0009" + CDS 5706..6971 + /gene="wciJ" + /locus_tag="SPC44_0009" + /note="member of homology group 35" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34751.1" + /db_xref="GOA:Q4JYR7" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4JYR7" + 
/translation="MWRAVVRKSWIDAMKILFVCQHYKPEPFRLSDICEDLVQRGHEV + AVLTGIPNYPEGEIYADYRKRKKRRETINGVAIFRSYTIARRQNTLYRILNYFSFALS + STIGVIFGRYKAKDGSDFDCVFVNQLSPVMMAWAGIAYKNKYNKPMFLYCMDVWPDSL + IVGGVKENGLIYKIFEFVSKKVYQASDYIFVTSLSFKDYFVKKFNIPLHKITYLPQYA + EDLFVPNELKTNKNTIDLTFAGNIGKAQNLETILKAASAIEQIPDLAKRVHFHFVGDG + TELLNMQKLACELELENTSFYGRRPLEEMPDFYTKSDAMLVSLIGDSIISRTLPGKVQ + SYMAAGKPIIGAISGDTQRVVKEAKCGFISPEGNVDQLVRNIRKFCLLSVEEREKLGR + QARCYYEEQFSKEWFMTYLENHLKEGFLS" + misc_feature 6363..6896 + /gene="wciJ" + /locus_tag="SPC44_0009" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 3.8e-16" + gene 6920..8137 + /gene="wcxB" + /locus_tag="SPC44_0010" + CDS 6920..8137 + /gene="wcxB" + /locus_tag="SPC44_0010" + /note="member of homology group 55" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34752.1" + /db_xref="GOA:Q4JYR6" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4JYR6" + /translation="MVYDILRKSFKRGVSIMKVLMINSVCGIRSTGRICADLATALTE + EGYEVKIAYGREYVPKQFQQYAVKIGTKSDIRFHAIRSRLFDESGFGSRQATVNFIKW + MKEFDPDIIHLHNLHGYYINVELLFDYLRICGKKIIWTLHDCWAFTGHSAYFDCLECE + SKGVCDHPSQKNDYPKSFVNFSKRNYQRKKKCFTHIPNLTIVTPSQWLANLVRQSFLK + EYPVKVIHNGIDTTVFQPRLIAAQKLRKRHHLEGKQVLLGVAAIWDNRKGFSDMLALA + NDLTDNQRIVLIGLKDRQLKELPKGIIGLTETNSPEELVAWYTLADVFLNPTYQDNYP + TTNLEAISCGTPVISYPTGGSVESAKLYGLVCQDRNVASILSSLEKVSQLSKTEKLDF + SIASFIKQMKYLY" + misc_feature 7640..8122 + /gene="wcxB" + /locus_tag="SPC44_0010" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 4.2e-12" + gene 8175..9386 + /gene="wzy" + /locus_tag="SPC44_0011" + CDS 8175..9386 + /gene="wzy" + /locus_tag="SPC44_0011" + /note="member of homology group 71" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI34753.1" + /db_xref="InterPro:IPR007016" + /db_xref="UniProtKB/TrEMBL:Q4K1V9" + /translation="MMKRIYYHLLAIWAWTLPNSYAFIDSLKVFFPNISLQIAGSLLA + 
VVSIGIFITRIYYTRYEVFISLLVCISILIFYSTRFFYSTNVELYQSFFNSFLIRPVP + AILVAMLLAKNNHIKGFIKWSEPMMLFYTLTSFLAALSPRNSIITYQSLSYYAMTAYM + INVFNIIYKEKILEEQLTYFRFSAWNFIRYFLLLIQAFNALSGGGRGAFILLIIFTGI + LLIRTAMKFKFLFSFIGGLSAIALVVFFTKGLDLTWLLNMDGGERLLNFFGRPEHIST + DNRLLIYDTVWSAIQEKPFLGWGVGSTFLKFNGYSHNIVLDLLHDMGSFGLLIILSAF + FASSVILYKLRKIDWKVNLFILMFLEVYVHMSFSGSYLADGRLWFLVIFTYCYYRWKV + QEKDEVSNFII" + misc_feature 8991..9158 + /gene="wzy" + /locus_tag="SPC44_0011" + /note="HMMPfam hit to PF04932, O-Antigen Polymerase, score + 9.9e-08" + gene 9361..10437 + /gene="wcxD" + /locus_tag="SPC44_0012" + CDS 9361..10437 + /gene="wcxD" + /locus_tag="SPC44_0012" + /note="member of homology group 72" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34754.1" + /db_xref="GOA:Q4K1V8" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K1V8" + /translation="MKLAILLSDISKIGGVQRVTTALVNELCQNIDVTIISIFSENEL + PAFGLSDRVQVSYLLKEHVNLKKNFFKVSGALRKVLKKQQFDVVLSSGTGLVSFLWFA + SLGIPTRLLAWEHQCFYFGRSFGLEWLGRKLACRFAESIVVLTKKDEGFYKENRPKAH + IEQIYNILDMDSQTAKCQLSSKKIISVGSLVRQKGFDLALEVASQIQLSYPDWQWDIY + GDGPDREKLEEKVREYQLEGFINLKGLVQNVRELYPDYSIYALTSRYEGLSMVLLEAK + NCQMPAISFDCNCGPSDIISDGRNGFLIDCFDVNIYAKTLSKLMTSLELREQVAKSSV + IPAEELSTTYILDKWNNLLKIERR" + misc_feature 9862..10368 + /gene="wcxD" + /locus_tag="SPC44_0012" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 1.2e-33" + gene 10439..11617 + /gene="wcxE" + /locus_tag="SPC44_0013" + CDS 10439..11617 + /gene="wcxE" + /locus_tag="SPC44_0013" + /note="member of homology group 73" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34755.1" + /db_xref="GOA:Q4K1X6" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K1X6" + /translation="MKIVHVEDFFHPDAGYQINVLPKYLAKFGHEQVIITSEMDKIPD + NLTQFFGRENIEERDRSYEEKHHVKIIRLPLHGFVSGRAIFSGKLISAIKGLSPEVLY + IHGNDTLTGIRLLLARKKLNCRIVTDSHMLEMASRNPFNNYFRRFYKTLITPILIKEQ + 
IPIIRTQDDNYVEKHLGIPLSQAPWISYGSDTAFFHADSQIKEDFRSQYQIASDALIC + VYAGKLDEHKGGMFLAESLSKKLNTEQPIVFIIVGNTNGEYGEAVEKSFSQSENQILR + FPTQKYQKLAQFFQVADFALFPKQCSLSFYDAQACGLPVLLEDNNINLDRTSHYNGWT + FKANSKLSLRDSLKMIASLDKEKRQEYSQNALHYILEHYNYEDKAREYEKILIGERTK + " + misc_feature 11042..11542 + /gene="wcxE" + /locus_tag="SPC44_0013" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 0.00013" + gene 11650..12846 + /gene="wcxF" + /locus_tag="SPC44_0014" + CDS 11650..12846 + /gene="wcxF" + /locus_tag="SPC44_0014" + /note="member of homology group 74" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34756.1" + /db_xref="GOA:Q4JYR2" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4JYR2" + /translation="MDLMKICIVSVGVGGLPIPAVKGGAVENLIDNYLSYNEKYNHDE + ITVVSCDHKEAREASKKYKYAQFVYIDIHSLKYKINKTIRYAINKYSPFFVGNAYISQ + LPDLSGFDTVLIENRPEYGYYIRKKFKGNLVLHLHNDLLMDNEYSVDYSVYDKIITVS + DYIRNRSEVVTSGVPIQTVYNGIDTEPFLQNFSEVDLSDLKNQLEILSDDFVIVFFGR + INKNKGIKELLEAFLLLPKNLNIKLLAVGSSIFGQTELDTFTTEIRQLAKQASDKVVF + TGYVNYKDIPKYHHIADCIVVPSIWEEPAALTVCEALISGKYVITTDTGGTPELVAGS + DALVVANDECIVEHLKTALLSVYQKGKCSSVITSNRDRGTYFSIEKYGRNLRKELTQN + ERIINI" + misc_feature 11650..11724 + /gene="wcxF" + /locus_tag="SPC44_0014" + /note="Signal peptide predicted for SPC1945 by SignalP 2.0 + HMM (Signal peptide probability 0.653) with cleavage site + probability 0.406 between residues 25 and 26" + misc_feature 12238..12765 + /gene="wcxF" + /locus_tag="SPC44_0014" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 2.6e-25" + gene 12843..14387 + /gene="wzx" + /locus_tag="SPC44_0015" + CDS 12843..14387 + /gene="wzx" + /locus_tag="SPC44_0015" + /note="member of homology group 56" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI34757.1" + /db_xref="GOA:Q4JYR1" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4JYR1" + /translation="MSRVKNSFFNILAGIVGTIISSVLAFIVRTVFIRVLGETYLGFN + 
GLYTNILTVLSLTELGIGSSIAYLMYKPLAEKDGDKLAQVVQFYKKIYRVIGIIILIL + GLCLVPFLPVIVNLKNAEDLNYTALYLLYLADTVSTYLFFAYKRGVLAADQKIYVANI + FDIIITTILSIFQIITLMIFKDFYLYIILKIAKNLTLNLVISLKVDKMYPSIHKFKGI + APLPKMERRLVWKNVYATSVRQIFNELMNSTDSIVISIVLGIVMVGKYSNYAYILSIV + YIFFGGIFNPIQASIGNLSLLASIEKKNEIFNRLRFINFFFLSFCSSCLLVLVNPFIT + IWIGENYTLSFTGVIAIVGMLFVRQTGNCTTIFRLGEGYFRDYHFSPLIAGILNLVVS + VILVNYIGIAGVFVGTMLGFGFQFILVDTIVTYKKVLSRPLSEFYLRWLQTILLTVGL + CIASYYLSRLVRVNSIYDLILLFVVVIGFNFFALCFIYWRNDDFQYFIQLVKNFMKNL + EEKNHD" + misc_feature 12843..12917 + /gene="wzx" + /locus_tag="SPC44_0015" + /note="Signal peptide predicted for SPC1946 by SignalP 2.0 + HMM (Signal peptide probability 0.819) with cleavage site + probability 0.398 between residues 25 and 26" + gene 14380..15603 + /gene="mnaB" + /locus_tag="SPC44_0016" + CDS 14380..15603 + /gene="mnaB" + /locus_tag="SPC44_0016" + /note="member of homology group 75" + /codon_start=1 + /transl_table=11 + /product="UDP-N-acetylmannosamine dehydrogenase MnaB" + /protein_id="CAI34758.1" + /db_xref="GOA:Q4K1X3" + /db_xref="InterPro:IPR001732" + /db_xref="InterPro:IPR008927" + /db_xref="InterPro:IPR014026" + /db_xref="InterPro:IPR014027" + /db_xref="InterPro:IPR014028" + /db_xref="InterPro:IPR016040" + /db_xref="InterPro:IPR017476" + /db_xref="UniProtKB/TrEMBL:Q4K1X3" + /translation="MINVIGLGYIGLPTILMLATNGVKVVGTDYNQDLVRTLNEGQTT + FKEDGLDELFHKAVESGVDFTTEYQQTDTYIISVPTPYDSFSKKIDPSYVIEATKTVL + DNCNKGAVIIIESTVSPGTVDKFIRPVVEEKGFVIGSDIHLVHAPERIIPGNMVYELV + NNNRTIGADDLEIGYKVKELYASFCKGDIVVTDIRTAEMTKVVENTFRAVNIAFANEL + AQICSYDNMNVYEIIRICNMHPRVNILQPGPGVGGHCISVDPWFLVGDYPELTNVIEH + SMRTNAAMPEFVLNRIYTIMNEHHLTDISRVGLYGLTYKENVDDMRESPTLQLLESMS + RHLATPAIKVYDPFIEKDVVANQSHDLDEFLSNVDIVVLLVGHDEILQNMDKLKDKIV + LDTRYICHLDGTYRL" + misc_feature 14383..14937 + /gene="mnaB" + /locus_tag="SPC44_0016" + /note="HMMPfam hit to PF03721, UDP-glucose/GDP-mannose + dehydrogenase, score 1.4e-45" + misc_feature 14959..15219 + /gene="mnaB" + /locus_tag="SPC44_0016" + /note="HMMPfam hit to 
PF00984, UDP-glucose/GDP-mannose + dehydrogenase, score 4.5e-33" + misc_feature 15301..15564 + /gene="mnaB" + /locus_tag="SPC44_0016" + /note="HMMPfam hit to PF03720, UDP-glucose/GDP-mannose + dehydrogenase, score 2.5e-15" + gene 15626..16729 + /gene="mnaA" + /locus_tag="SPC44_0017" + CDS 15626..16729 + /gene="mnaA" + /locus_tag="SPC44_0017" + /EC_number="5.1.3.14" + /note="member of homology group 23" + /codon_start=1 + /transl_table=11 + /product="UDP-N-acetylglucosamine-2-epimerase MnaA" + /protein_id="CAI34759.1" + /db_xref="GOA:Q4K1V3" + /db_xref="InterPro:IPR003331" + /db_xref="UniProtKB/TrEMBL:Q4K1V3" + /translation="MTMKKIVVIFGTRPEAIKMCPLVKELRTRENLETLVCVTGQHRQ + MLDQVLDTFRITPDFDLSIMKDKQTLFDVTIGILEGMKTVLESVNPDLILVHGDTSTT + FASSLAAFYLQIPIGHVEAGLRTYDIYSPYPEEFNRQAVGALAQYHFTPTQLSKDNLL + REGKNSEAIFITGNTAIDALQTTIQEDYTHPELNWVGDSKLILITAHRRENIGDPMRH + MFRAIRRIIEEHSDIKALYPIHMNPLVRQIAEEELSGCERIKMIDPLEVLDFHNFLSR + SYLILTDSGGIQEEAPSLGKPVLVMRDTTERPEGIKAGTLKLVGTDEDNIYRHFKELL + ENDLVYQAMSQASNPYGDGTACKKIADILEGEV" + misc_feature 15695..16717 + /gene="mnaA" + /locus_tag="SPC44_0017" + /note="HMMPfam hit to PF02350, UDP-N-acetylglucosamine + 2-epimerase, score 2.5e-174" + gene order(16733..17173,17175..17786) + /gene="fnlA" + /locus_tag="SPC44_0018" + CDS join(16733..17173,17175..17786) + /gene="fnlA" + /locus_tag="SPC44_0018" + /note="member of homology group 36" + /codon_start=1 + /transl_table=11 + /product="FnlA" + /protein_id="CAI34760.1" + /db_xref="GOA:Q4JYQ8" + /db_xref="InterPro:IPR003869" + /db_xref="InterPro:IPR013692" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JYQ8" + /translation="MSQFTGKTLLITGGTGSFGNAVLNRFLQTDIGEIRIFSRDEKKQ + DDMRHEFQVKVPEVAGKIRFYLGDVRDLASVKNAMHGVDYVFHAAALKQVPSCEFFPV + EAVKTNILGTENVLTAAIEAGVKQVICLSTDKAAYPVNAMGTSKAMEKIAVAKSRTVN + PEHTKICVTRYGNVLCSRGSVVPLWIEQIKQGNALTITEPSMTRFVMTLEEAVDLVLF + AFEEGKSGDILVQKAPACTIEVLAKAVSEIFASEQDIKIIGIRHGEKRYETLLTNEEC + ANAIDLGDFYRVPSDNRNLNYDKYFKDGSTNRNLLTEFNSNNTDLMDVEQVKRKLLEL + DEIQTAIRDMVADEEM" + 
misc_feature order(16754..17173,17175..17606) + /gene="fnlA" + /locus_tag="SPC44_0018" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.0046" + misc_feature order(16757..17173,17175..17603) + /gene="fnlA" + /locus_tag="SPC44_0018" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 2.7e-158" + misc_feature order(16757..17173,17175..17426) + /gene="fnlA" + /locus_tag="SPC44_0018" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 3.1e-08" + misc_feature order(16760..17173,17175..17393) + /gene="fnlA" + /locus_tag="SPC44_0018" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 2e-08" + misc_feature 17604..17747 + /gene="fnlA" + /locus_tag="SPC44_0018" + /note="HMMPfam hit to PF08485, Polysaccharide biosynthesis + protein C, score 2e-23" + gene 17886..19115 + /gene="fnlB" + /locus_tag="SPC44_0019" + CDS 17886..19115 + /gene="fnlB" + /locus_tag="SPC44_0019" + /note="member of homology group 37" + /codon_start=1 + /transl_table=11 + /product="FnlB" + /protein_id="CAI34761.1" + /db_xref="GOA:Q4K1V1" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K1V1" + /translation="MIKNILITGAKGFVGKNLICTLEALKDGRDRTRPNLEIGEIFQY + DRDTDPILLDEYCKKADFVFHLAGVNRPQNPDEFMEGNYGFSSRLLEILEKYENTCPV + LLSSSTQASLEGRFSNSIYGQSKLAGEELFFEYGKKTGAPVLVYRFPNLYGKWCRPNY + NSAVATFCHNLAHDLPIQVNDPSVELELLYIDDLIQECLTALEGNPHRCNLDGLQILP + SPSGNYCYVPTTHRATLGEIVSLLETFKKQPNSLVMPEIPQGSFKKKLYSTYLSYLPV + DKFRFPLKMNIDERGSFTELLKTENTGQFSVNISKPGITKGQHWHHSKWEFFMVVSGR + ALIQERRIGLDENGQEYPILNFEVSGDKIEAIHMIPGYAHNIINLSDTENLITVMWAN + ESFDPRHPDTFFEQVEK" + misc_feature 17898..18521 + /gene="fnlB" + /locus_tag="SPC44_0019" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 6.9e-09" + gene 19116..20300 + /gene="fnlC" + /locus_tag="SPC44_0020" + CDS 19116..20300 + /gene="fnlC" + 
/locus_tag="SPC44_0020" + /note="member of homology group 38" + /codon_start=1 + /transl_table=11 + /product="UDP-L-fucosamine FnlC" + /protein_id="CAI34762.1" + /db_xref="GOA:Q4JYQ6" + /db_xref="InterPro:IPR003331" + /db_xref="UniProtKB/TrEMBL:Q4JYQ6" + /translation="MKIKTDYSDIHFKDNGKLKLLIIVGTRPEIIRLSSVITKCRKYF + DVILAHTGQNYDYNLNGIFFDNLGLDTPDVYMDAVGDDLGATVGNIINTSYKLMNQIK + PDALLILGDTNSCLSAIAAKRLHIPIFHMEAGNRCKDECLPEETNRRIVDIISDVNLA + YSEHARKYLHECGLPKERTYVTGSPMAEVLHKNLPAIESSDIHERLGLKKGGYILLSA + HREENIDTDKNFISLFTAINQLAEKYNMPILYSCHPRSKKRLQESGFKLDKRVIQHEP + LGFHDYNCLQMNAFVVVSDSGTLPEESSFFTSQGYPFPAVCIRTSTERPESLDKAGFI + LAGIDENSLLQAVETAVSLAEDEDFGLPVPDYVEENVSTKVVKIIQSYTGIVDKIVWR + KS" + misc_feature 19227..20255 + /gene="fnlC" + /locus_tag="SPC44_0020" + /note="HMMPfam hit to PF02350, UDP-N-acetylglucosamine + 2-epimerase, score 9.7e-106" + gene complement(20498..20584) + /gene="tnp" + /locus_tag="SPC44_0021" + /pseudo + CDS complement(20498..20584) + /gene="tnp" + /locus_tag="SPC44_0021" + /note="Lone member of homology group 0256" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1167 transposase (fragment)" + gene complement(20663..21608) + /gene="tnp" + /locus_tag="SPC44_0022" + /pseudo + CDS complement(join(20663..20884,20895..21608)) + /gene="tnp" + /locus_tag="SPC44_0022" + /note="member of homology group 12" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1670 transposase (fragment)" + gene 21711..21899 + /gene="tnp" + /locus_tag="SPC44_0023" + /pseudo + CDS 21711..21899 + /gene="tnp" + /locus_tag="SPC44_0023" + /note="member of homology group 0047 7" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase (fragment)" + gene complement(21982..22684) + /gene="tnp" + /locus_tag="SPC44_0024" + /pseudo + CDS complement(join(21982..22434,22415..22684)) + /gene="tnp" + /locus_tag="SPC44_0024" + /note="member of homology group 31" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative 
IS1671 transposase" + misc_feature complement(order(22099..22434,22415..22419)) + /gene="tnp" + /locus_tag="SPC44_0024" + /note="HMMPfam hit to PF05717, IS66 Orf2 like protein, + score 8.3e-52" + /pseudo + gene order(22751..23060,23086..23475) + /gene="tnp" + /locus_tag="SPC44_0025" + /pseudo + CDS join(22751..22948,22947..23060,23086..23475) + /gene="tnp" + /locus_tag="SPC44_0025" + /note="member of homology group 19" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1381 transposase" + misc_feature order(22998..23060,23086..23463) + /gene="tnp" + /locus_tag="SPC44_0025" + /note="HMMPfam hit to PF01609, Transposase DDE domain, + score 2.7e-15" + /pseudo + gene 23736..>24095 + /gene="aliA" + /locus_tag="SPC44_0026" + CDS 23736..>24095 + /gene="aliA" + /locus_tag="SPC44_0026" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34768.1" + /db_xref="GOA:Q4K2T2" + /db_xref="InterPro:IPR000914" + /db_xref="UniProtKB/TrEMBL:Q4K2T2" + /translation="MMKSSKLFALAGVTLLAATTLAACSGSGSSTKGEKTFSYIYETD + PDNLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKD + AKWYTSEGEEYAAVKAQD" + misc_feature 23736..23822 + /gene="aliA" + /locus_tag="SPC44_0026" + /note="Signal peptide predicted for SPC1961 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.277 between residues 29 and 30" + misc_feature 23982..24050 + /gene="aliA" + /locus_tag="SPC44_0026" + /note="PS01040 Bacterial extracellular solute-binding + proteins, family 5 signature." 
+ORIGIN + 1 cgaccgtcgc ttcctagttg tggctaactt gtccaatgaa gagcaagact tgacagtaga + 61 aggaaaagtc aaatctgtct tgattgaaaa caccctagct caagaagtct ttgaaaaaca + 121 aatcttagtt ccatgggatg ctttctgtgt ggaattacta taaatatttt ttgcagaaaa + 181 atttaaaatt gaaatcgtat aaaaacaagg gaggactgta taaaaggcag aaatcctttg + 241 ttttttataa ccaaggttta taaaccttca ttctcgaaat tcaattaact ttacaaattc + 301 ccactattaa ggagaaagaa gacgaacata aagaagcgta tccttagtgc aggcctgact + 361 tttacatctg ctttgctttt agctacttgc ggccaatcag gttcagatat aaaaacttac + 421 tcatcaacct ttagtggaaa tccaactaca tttaactatc tattagacta ttacgctgat + 481 aatatagtca attgaaacaa gaacaagaca aaagagcctc ataaaaggta ttgcaacttg + 541 gtaatacctt tttgaggtgc tttttgatat gagcccatgt tttctcaata ggattgtact + 601 caggtgagta gggaggaaga ggtaaaagtt tatgcccaaa ctcttcgcat aaaagttcta + 661 gcttccccat tctatggaat cttgcattat ccataataat aaccgatggt gtgtttaatg + 721 ttggtaagaa aaacttctga aaccatactt caaaaaagtc gctcgtcatc gtctcttcgt + 781 aagtcattgg aacgattaat tcaccatttg ttagacctgc aaccaaagaa attctctgat + 841 atcttcttcc agatactttg cctcttctta actgaccttt taatgagcga ccatattctc + 901 gataaaaata agtatcgaat cctgtttcgt caatctaaac aggtgctagg tgctttaaac + 961 tattaaaatt cttaagaaat aaggctactt tttctgggtc ttgttcataa ttagattgaa + 1021 actagagtag tacacctctg cttctaaaaa atttttagaa atcgatttaa ctgtcctgat + 1081 cgatttgtca tgttcttatt tcattttatt atatttttgg ttcgcgggaa gtctactaag + 1141 atacttaaag atgcagatag taaaaaaaat gtagacatta ccgtaaaaaa gtgatataat + 1201 cgtatgatgt tcaaggtata ggtgttaatc atgagtagac gttttaaaaa atcaggttca + 1261 cagaaagtga agcgaagtgt taatatcgtt ttgctgacta tttatttatt gttagtttgt + 1321 tttttattgt tcttaatctt taagtacaat atccttgctt ttagatatct taacctagtg + 1381 gtaactgcgt tagtcctact agttgccttg gtagggctac tcttgattat ctataaaaaa + 1441 gctgaaaagt ttactatttt tctgttgctg ttctctatcc ttgtcagctc tgtgtcgctc + 1501 tttgcagtac agcagtttgt tggactgacc aatcgtttaa atgcgacttc taattactca + 1561 gaatattcaa tcagtgtcgt tgttttagca gatagtgata tcgaaaatgt tacgcaactg + 1621 acgagtgtga cagcaccgac tgggactgat 
aatgaaaata ttcaaaaact actagctgat + 1681 attaagtcaa gtcagaatac cgatttgacg gtcaaccaga gttcgtctta cttggcagct + 1741 tacaagagtt tgattgcagg ggagactaag gccattgtcc taaatagtgt ctttgaaaac + 1801 atcatcgagt tagagtatcc agactacgca tcgaagataa aaaagattta taccaaggga + 1861 ttcactaaaa aagtagaagc tcctaagacg tctaagaatc agtctttcaa tatctatgtt + 1921 agtggaattg acacctatgg tcctattagt tcggtgtcgc gatcagatgt caatatcctg + 1981 atgactgtca atcgagatac caagaaaatc ctcttgacca caacgccacg tgatgcctat + 2041 gtaccaatcg cagatggtgg aaataatcaa aaagataaat taacccatgc aggcatttat + 2101 ggagttgatt cgtccattca caccttagaa aatctctatg gagtggatat caattactat + 2161 gtgcgattga acttcacttc tttcttgaaa atgattgact tattgggagg ggtagatgtt + 2221 cataatgatc aagagttttc agctctacat gggaagttct atttcccagt agggaatgtc + 2281 catctagact ctgagcaggc tctaggtttt gtacgtgaac gctactcact agccgatgga + 2341 gaccgtgacc gtggtcgcaa ccaacaaaag gtgattgtgg ctatccttca aaaattaacg + 2401 tcaaccgaag cactgaaaaa ttatagtacg atcattaata gcttgcaaga ttctatccaa + 2461 acaaatatgc cacttgagac tatgataaat ttggtcaatg ctcagttaga aagtggaggg + 2521 aattataaag taaattctca agatttaaaa gggacaggtc ggacggatct tccttcttat + 2581 gcaatgccag acagtaacct ctatgtgttg gaaatagatg atagtagttt agctgtagtt + 2641 aaagcagcta tacaggatgt gatggagggt agatgaaatg atagacatcc attcgcatat + 2701 cgtttttgat gtagatgacg gtcccaagtc aagagaggaa agcaaggctc tcttggcaga + 2761 atcctacagg caaggggtac gaatcattgt ctctacctct caccgtcgca agggcatgtt + 2821 tgaaactccg gaagagaaga tagcagaaaa ctttcttcag gttcgggaaa tagctaagga + 2881 agtggcgagt gacttagtca tcgcttacgg ggctgaaatt tactacacac cagatgttct + 2941 ggataagcta gaaaaaaagc ggattccgac cctcaatgat agtcgttatg ccttgataga + 3001 gtttagtatg aacactcctt atcgcgatat tcatagcgcc ttgagcaaga tcttgatgtt + 3061 gggaattact ccagtcattg cccacattga gcgctatgat gctcttgaaa ataatgaaaa + 3121 acgcgttcga gaattgatcg atatgggctg ttacacgcaa gtaaatagtt cacatgtcct + 3181 caaatccaaa ctttttggcg aacgttataa attcatgaaa aaaagagctc agtatttttt + 3241 agagcaggat ttggtccatg tcattgcaag tgatatgcac aatctagacg 
gcagacctcc + 3301 tcatatggca gaagcatatg accttgttac ccaaaaatac ggagaagcga aggctcagga + 3361 actttttata gacaatcctc gaaaaattgt aatggatcaa ctaatttagg agaaatgatg + 3421 aaagaacaaa acacgataga aatcgatgta tttcaattat ttaaaacctt gtggaaacgc + 3481 aagctaatga ttttattagt ggcacttgtg acaggtgcgg gggcttttgc atatagcgct + 3541 tttattgtta agccagaata tacgagtacc acgcgaattt acgtagtgaa tcgcgatcaa + 3601 ggagacaagt cggggctgac aaatcaggat ttgcaggcag gatcttatct ggtaaaagac + 3661 taccgtgaga ttatcctttc gcagaatgta ttggaaaaag tagcgacaaa tttgaagttg + 3721 gatataccag ccaaaacgtt agctagaaaa gttcaagtga ctgtaccagt tgacactcgt + 3781 atcgtctcaa tctctgtcaa ggataaacag ccagaggaag ccagtcgtat cgctaattct + 3841 ctacgagaag ttgctgcaga aaagatcatc gctgtaacgc gagtatctga tgtgacgaca + 3901 cttgaagaag cgcgaccagc tacgactccc tcttctccaa atgttggacg caattccttg + 3961 tttggttttt ttggaggagc agtcgtaaca gtaattgctg ttcttttgat tgagttgttc + 4021 gacatccgtg tgaaacgtcc tgaagatgtc gaagatgtac tgcaaattcc acttttaggg + 4081 gtcgttccag atttggacaa aatgaaatag gaggaagtta tgccaacatt agaaatctca + 4141 caggcaaaat tggattttgt aaaaaaggca gaggaaaatt ataacgcttt gtgcacgaac + 4201 ctacagttaa gtggagatga tttgaaagta ttttctatca cttctgtgaa acaaggagaa + 4261 ggaaaatcaa cgacttccat caatatcgct tgggcttttg cgcgtgcagg ttacaaaacg + 4321 ctgctgattg atggagatat tcgcaattct gttatgttag gtgtctttaa agcaagagat + 4381 aagattacag gcctgacaga atttttatca ggaactacag acctatcaca agggctttgt + 4441 gataccaata tcgaaaatct ctttgtaatt caggctggct ctgtgtcacc gaatccgaca + 4501 gctcttcttc aaagtaagaa tttcagtaca atgcttgaaa ccttgcgtaa atattttgac + 4561 tacatcattg tagatactgc tcctgtcggt gtcgtgattg atgcggctat tattacgcaa + 4621 aaatgcgatg cttctatttt agtgacgaag gcaggtgaaa taaatcgacg ggatattcaa + 4681 aaagcaaaag aacagttgga acacacaggg aagccgtttt tgggagttgt gttgaataaa + 4741 ttcgatactt cagtagacaa atacggttct tatggaaatt acggaaaaaa ataagtcgtt + 4801 aagtatttgt gtaaggacat ttttagaact acaatcaaaa tctttggaat tgctggcttc + 4861 aaatcatatt gatttgaaat gaaacttgca aaagagtttt taaggtgagt ttcttaattt + 4921 gtgactgaaa 
tcaatcttct acttccatac cttggaaaaa cagggtaaac gagagatgtt + 4981 ttttccataa taaagttttg atatggctag tagagtagta atataatgaa ttgtaatcat + 5041 tagtgttcat accaagaaat atcaagtatc tatttttgaa aatcataaat atgagatagt + 5101 ttttaaatct ctaaggagag ctagttttga gaggtaattt atgtatagag taacaaaacg + 5161 attaggggat attttacttt ctttaatagg aataatagta ctgtttccag tgtttattgt + 5221 aattgcaatt gcgataaaca ctgattcgga gggtccgatt atatttaaac aaaaacgatt + 5281 taggatatac aaggaacctt tttatatcct gaaatttagg tccatgaaaa taggagcacc + 5341 gaaaaatgta gctccacgga acttggataa tccagaacag tggattacca aagtgggagc + 5401 tttcttaaga aaaacatctt tggacgaact gccacaatta tggaatattc ttattggtaa + 5461 tatgagcatt gtaggaccta ggccagcagg tataaatgag cttgatttgc tcaccgaaag + 5521 agaaaagttt ggtgcgaatg atgtcttacc tggattaact ggatgggcac aaattaatgg + 5581 gcgagatact ttgtcaatag agatgaaggc agaagcagat ggttattatg tgaaacatat + 5641 gtcgttaagc atggatctta gatgtatcat taggacaatc ccctacgtat taaaacgtaa + 5701 gggaattgtg gagggcagtg gtaagaaaga gttggattga tgcaatgaaa attctatttg + 5761 tttgtcaaca ttataagcca gaacctttta ggttgtcaga tatttgtgag gatctagttc + 5821 aaagagggca tgaggtggct gttttgacag ggattcctaa ctatcctgag ggggaaatat + 5881 atgctgatta tcgtaagaga aaaaaaagaa gagagactat aaatggtgtt gctatttttc + 5941 gttcatacac cattgctagg aggcaaaata ctttataccg tatattgaat tattttagtt + 6001 ttgctctttc ttctacgata ggtgttatat ttgggcgtta taaagcgaaa gatggctcag + 6061 attttgattg tgtctttgtc aatcaactat ctccagttat gatggcttgg gctggtatag + 6121 cttataagaa caagtacaat aaacctatgt ttttgtattg catggatgtt tggccggata + 6181 gtttaattgt aggtggggtg aaggaaaatg gattgattta caagatattt gaatttgttt + 6241 caaaaaaagt atatcaagcc agcgattata tatttgttac tagtctatct tttaaagatt + 6301 attttgtaaa aaaatttaat attcctctcc acaaaattac ttacttacca caatatgcag + 6361 aggatttatt tgtaccaaat gaattaaaaa cgaacaaaaa tactattgac ttaacttttg + 6421 ctggaaatat tggaaaagct cagaatttag agactatttt gaaagcagcc agtgcaatag + 6481 aacagattcc cgatttagca aagagagttc attttcattt tgttggagat ggtacggaac + 6541 tattaaatat gcaaaaatta gcatgtgaac 
tagaattaga gaacacttca ttttatggta + 6601 gacgtccatt agaagagatg ccggattttt atacaaaatc agatgcgatg ctagtttctt + 6661 taataggcga ctctataatt tctcgcacct taccaggcaa ggtacaatct tatatggcgg + 6721 caggaaaacc aattatagga gcgatttcag gagatactca gagagttgta aaagaagcaa + 6781 aatgtggttt cataagtccg gaagggaatg ttgatcagtt agtgagaaat attcgtaagt + 6841 tctgtttgct ttctgtagag gaaagagaga aactaggaag gcaagctcgt tgttattatg + 6901 aagaacagtt ttcgaaagag tggtttatga catacttaga aaatcattta aaagaggggt + 6961 ttctatcatg aaggttttaa tgattaattc cgtttgtggt attaggagca ctgggagaat + 7021 ttgtgcagat ctcgcaactg ctttgacaga agaaggatat gaggttaaaa tcgcctatgg + 7081 tcgtgagtat gttccgaaac aatttcaaca gtatgcagtg aaaattggta caaagtctga + 7141 tattcgtttt catgcgattc gttctcgatt atttgacgaa tctggctttg gaagtagaca + 7201 ggcaactgtt aattttatta aatggatgaa agagtttgat cctgatatta ttcatctcca + 7261 taaccttcat gggtattata tcaatgttga actgttattt gattatctcc gaatatgcgg + 7321 taaaaagatt atatggactt tgcatgattg ttgggcattt acaggacact cggcttattt + 7381 tgattgtttg gaatgtgagt caaagggagt ttgtgaccat ccatctcaga aaaatgatta + 7441 tcccaagtcg ttcgtgaatt tttcaaagcg aaattatcaa agaaagaaaa aatgttttac + 7501 tcatattcct aatctcacta ttgttactcc gtctcaatgg ctagctaatt tagtaagaca + 7561 gtcattttta aaagaatatc cagtgaaagt aattcataat ggtattgata ctactgtctt + 7621 tcaaccgagg ctaatagccg ctcaaaaatt gagaaaaaga caccatcttg aaggaaagca + 7681 ggtactgctt ggtgtggctg ctatctggga taatagaaag ggattttctg atatgttagc + 7741 gctcgcgaat gatctaactg ataatcagag aatagttttg atagggttaa aagataggca + 7801 actcaaagaa ctacccaaag ggatcattgg gttaacagaa actaatagcc cagaagagtt + 7861 ggtagcatgg tatacactag cggatgtatt tctaaatcct acttatcaag ataattaccc + 7921 gacaactaat ttagaagcta tttcttgtgg gacaccagtt atcagctatc cgacaggtgg + 7981 tagtgtagaa agtgctaaac tttatggtct cgtttgtcag gatagaaacg tagcttctat + 8041 tttatcttcg ttagaaaaag tctctcagct atctaaaaca gaaaaattgg atttttcaat + 8101 tgcaagtttt attaaacaaa tgaaatattt atattagaac ttgaattata ggaaaatgag + 8161 gaatttgcat taaaatgatg aaaagaattt attatcacct tttggctatt 
tgggcttgga + 8221 ctcttccaaa ttcttatgct tttattgatt cgttaaaggt gttttttccg aatattagct + 8281 tacaaattgc aggttctctt ttggctgttg tctcaatagg aatttttatc actagaatat + 8341 attatacaag atatgaagtt tttatatctc tattggtttg tatttctatt ttaatttttt + 8401 attcaactcg ctttttttat tcgactaacg tagagttgta tcagtctttc ttcaattcct + 8461 ttctgattcg tccagttcct gcgatattag tagcgatgct gttagctaag aataatcata + 8521 taaaaggttt cataaaatgg tcagaaccta tgatgctttt ctatacattg acatcatttt + 8581 tagcagccct atctcctaga aacagcatta ttacttacca atctttatct tattatgcca + 8641 tgacagctta tatgattaat gtgtttaata ttatatacaa agagaaaata ttggaggagc + 8701 aactgacgta tttcagattc tcagcgtgga attttattag atatttttta cttttgattc + 8761 aagcttttaa tgcactctca ggaggtggga gaggtgcctt tattttatta attattttta + 8821 caggaatatt attaataaga actgctatga aatttaagtt ccttttctca tttattggag + 8881 gcctgtctgc tatagctcta gttgtttttt ttacaaaagg tttggatttg acatggctct + 8941 tgaatatgga cggtggagag cgattgttga acttcttcgg cagacctgaa catatatcta + 9001 cagataatag actattgatt tatgatactg tttggtctgc aatacaggaa aaaccctttt + 9061 taggatgggg agttggttca acttttttaa aatttaatgg atattcacat aatattgtat + 9121 tggatttatt gcatgatatg ggaagttttg gtttattaat tattctttcg gctttctttg + 9181 cttcttcagt aatattgtac aaattacgta aaatagattg gaaagtgaat ttatttattc + 9241 tgatgtttct agaagtatat gttcacatga gtttcagtgg aagctatctt gcagatggta + 9301 gactatggtt tttggtgatc tttacttatt gttactacag gtggaaagtg caggaaaagg + 9361 atgaagttag caattttatt atctgatatt tcaaaaatag gaggagtgca gcgtgtcacg + 9421 acagctcttg ttaatgaact ttgtcaaaat atagacgtta caattatcag catcttttcg + 9481 gaaaatgagc taccagcttt tggactttca gatagagttc aggtgagcta tcttttgaaa + 9541 gaacatgtta atttgaagaa gaattttttt aaagttagtg gagctttgcg aaaagtgttg + 9601 aaaaaacagc agtttgatgt tgttttatcg tcaggaactg gtctagtatc ctttctttgg + 9661 tttgctagtt tgggaattcc taccagactt ttggcatggg aacatcagtg tttttacttt + 9721 gggagatcgt ttggtctaga gtggttgggg cgaaagctag cctgtcgttt tgctgagagt + 9781 attgttgtct tgactaaaaa agatgaagga ttttacaaag agaatcgtcc taaggctcat + 9841 attgaacaaa 
tctataatat cctagacatg gattcacaaa cagctaagtg tcagctctct + 9901 tctaaaaaaa ttatcagtgt tggatcttta gtacgacaaa aaggttttga tctggctctt + 9961 gaggtagcta gtcaaataca attaagttat ccagattggc agtgggacat ttatggtgat + 10021 ggccccgata gagaaaaatt agaggagaaa gtcagggaat accaattaga aggctttata + 10081 aatttgaaag ggcttgttca gaatgttcgg gagctctatc ctgactactc tatctacgcc + 10141 ttgacatcac gatatgaagg attatcaatg gtattattag aagctaaaaa ctgccagatg + 10201 cctgctattt catttgattg taactgtgga ccctctgata ttatttcaga tggaagaaat + 10261 ggttttttga ttgattgttt tgatgtaaat atctatgcaa aaactttatc taaattaatg + 10321 actagtttag agttgcgaga acaagttgca aaatcgagtg ttattccagc agaagaattg + 10381 tcaacaactt atatcctaga taagtggaac aatctattaa agatagaaag aagataatat + 10441 gaaaatagtc catgtagaag atttttttca tccagatgca ggttaccaga ttaatgtttt + 10501 accaaaatat ctagcaaagt ttggtcatga acaagtgatt atcacttcag aaatggataa + 10561 aatccccgat aatcttaccc aattttttgg acgagaaaat atagaagaga gagatagaag + 10621 ttacgaagag aagcatcatg tgaagattat tcgcttgcct cttcatggat ttgtaagcgg + 10681 acgtgcgatt ttttctggaa agcttatttc ggctattaag ggtctttctc cagaggtatt + 10741 gtatattcat gggaatgaca ctttaacagg gattcgtctc cttttagctc gaaagaaact + 10801 taattgcaga atcgtcaccg atagtcatat gcttgaaatg gcatcaagaa atcctttcaa + 10861 caactacttt aggagatttt ataaaacctt gattactccc attttgataa aagaacagat + 10921 accaattatt cggacgcaag atgataatta tgttgaaaaa cacttgggaa ttcctttatc + 10981 gcaagctcca tggatttctt atgggtcgga tacagcgttc tttcacgcag atagccagat + 11041 taaggaagat tttcgttctc agtatcaaat cgcttcagat gctcttattt gtgtttacgc + 11101 aggaaagtta gatgagcata agggtgggat gtttttagca gagtctctaa gtaaaaagtt + 11161 aaatacggag caaccaattg ttttcattat agtgggtaat acaaatggag agtatggaga + 11221 agctgtcgag aaaagtttct cccaatctga aaaccaaatt ttgcgctttc cgactcaaaa + 11281 atatcaaaaa ttagcacagt tttttcaggt agcagatttt gctttatttc ctaaacaatg + 11341 tagtttaagt ttttatgatg cacaggcctg tggtttacca gttttattgg aagataataa + 11401 tatcaacctc gatagaactt ctcattataa tggttggacg ttcaaggcta acagcaaatt + 11461 aagtttgaga 
gattcattaa aaatgattgc gagtctagat aaagagaaga gacaagagta + 11521 ctctcagaat gcactgcact atatccttga acattataat tatgaagata aagcaagaga + 11581 atatgaaaag attcttatag gggaacgtac gaaatgagat agttaatatt tcgttatttt + 11641 ataggaaagg tggatttaat gaaaatttgc attgtttcag tcggagtggg cggactaccg + 11701 attccagctg taaaaggggg agcagtagaa aatctcattg ataattattt aagttacaat + 11761 gagaaatata atcatgatga aattacggtc gttagttgtg accataagga ggcgcgtgag + 11821 gcttcaaaaa aatacaagta tgcccaattt gtctatatag atattcattc acttaaatat + 11881 aaaataaaca aaacaatacg ttatgccatt aataaatatt cacctttctt cgtagggaac + 11941 gcttatatca gtcaattgcc agacttgtct ggttttgata cagttttgat tgaaaatcgc + 12001 cctgaatacg gttattatat tcgtaaaaag tttaaaggaa atcttgtttt acatcttcac + 12061 aatgatttat taatggacaa tgagtattct gtagattata gcgtttatga taaaattatc + 12121 acagtatctg actatattag gaataggtca gaagtagtaa cgtcaggtgt tccgatacag + 12181 actgtctata atggtattga cacagaacct tttttgcaga atttctctga agttgattta + 12241 tcagatctta aaaatcagtt ggaaattttg tcggatgatt ttgtgattgt tttttttgga + 12301 cgtatcaaca aaaataaagg tatcaaagaa ctgcttgaag ccttcttgtt gctaccaaag + 12361 aatttgaata taaaattact agctgttggt agttctatat ttggtcagac ggagttggat + 12421 actttcacaa cagagatacg gcaattggca aaacaagcat cagataaagt tgtttttaca + 12481 ggctatgtta attacaaaga cattcctaag tatcatcata ttgcagattg cattgttgtt + 12541 ccatctattt gggaggaacc agcggctttg acggtctgtg aagctttgat atcagggaaa + 12601 tatgttatta caacagatac tggagggaca ccagagcttg tagctggcag tgatgccctt + 12661 gtggtagcaa atgatgagtg tatagttgaa cacctcaaaa cagccctatt gagtgtctac + 12721 caaaaaggga aatgctcttc ggttattact tctaatagag atagaggaac ctatttttct + 12781 attgaaaaat atggaagaaa cttacgaaaa gagctcacac aaaatgaaag aattattaac + 12841 atatgagtcg tgtaaaaaat agttttttta atattttagc tggaatagtt ggtactatca + 12901 tatcgagtgt tttagctttc atagttagaa cagtgtttat ccgagttttg ggagagactt + 12961 atctaggttt caatggtcta tacaccaata tcttaacagt tttatcccta actgaattag + 13021 ggatcggatc atcaattgct tatttgatgt acaaaccttt agcagaaaaa gatggggaca + 13081 aattagctca 
agtagttcaa ttctataaaa aaatatatcg agtgattggt atcattattc + 13141 ttattttagg tttgtgtctc gttccttttt taccagtcat tgtaaattta aaaaatgcag + 13201 aagatttgaa ctatacagca ttgtatttgc tttatttagc agatacagtt tctacttatc + 13261 tattctttgc atataaaaga ggggtattgg ctgctgatca aaagatctat gttgcgaata + 13321 tctttgatat aattataacg acaattttat ctattttcca aattatcact ttgatgattt + 13381 ttaaagactt ttatctatat attattttaa aaattgctaa aaatcttact ttgaacctag + 13441 taattagttt aaaagtagat aaaatgtatc caagtattca taaatttaaa gggatagctc + 13501 cgcttccaaa aatggaaaga cgactagttt ggaaaaatgt atatgctacc tctgttcgac + 13561 aaatctttaa cgaattaatg aattcaacag atagtatagt tatttccatt gtcttaggaa + 13621 tagttatggt tggtaagtat tcgaactatg cttatatttt atcaatcgta tatattttct + 13681 ttggaggaat ttttaatccg attcaggctt ctattggaaa cctatctctg ttagcttcta + 13741 tagagaaaaa aaatgaaatc ttcaatagat tacgttttat aaattttttc tttttatcat + 13801 tttgctcaag ttgtcttcta gtattggtaa atccttttat cactatttgg attggagaaa + 13861 attacacttt atcatttaca ggtgtgattg caatagttgg tatgttattc gttagacaaa + 13921 ctggaaattg tacaaccatt tttcgtttgg gagaaggata ttttagagat tatcattttt + 13981 ctcctttaat cgcgggcatt ttaaatttag ttgtttcagt aattttagtg aattatatag + 14041 gtattgcagg tgtttttgtt ggaacaatgt taggatttgg tttccaattt atactggtgg + 14101 atacaattgt tacttataaa aaagtactta gtcgtccact atcagagttt tatttaagat + 14161 ggttgcagac gatcttatta actgtaggtt tatgtattgc gagttactat ttatctcgat + 14221 tggttagagt gaatagtata tatgatttga tactgttgtt tgtagtggtt attggattta + 14281 atttttttgc tttatgtttt atttattggc gaaatgatga ttttcaatat tttattcaat + 14341 tggttaaaaa ttttatgaaa aatttggagg aaaaaaatca tgattaatgt aatcggatta + 14401 ggttatattg gattgccaac aattttaatg ttggcaacaa acggcgtgaa agtagttgga + 14461 actgactaca atcaggattt ggtgagaact ttaaatgaag gtcaaacaac ctttaaagaa + 14521 gatggattgg atgaactatt ccataaagca gtggagtcgg gtgtggactt tacaaccgaa + 14581 tatcaacaaa cggataccta tattatttcc gttccaacac catatgactc cttctctaaa + 14641 aaaattgatc caagctatgt gattgaagct acgaaaacgg tacttgataa ttgcaataaa + 14701 ggagcggtta 
ttattattga atcgaccgta tcaccaggaa cggttgataa atttattcga + 14761 cctgttgtag aagaaaaagg ttttgttatt ggtagtgata ttcatcttgt ccatgctcca + 14821 gaacgtatta ttccagggaa tatggtctat gaattggtga ataataaccg tacaattgga + 14881 gctgatgacc tagaaatcgg ctataaagtg aaagagcttt atgcttcatt ttgtaagggc + 14941 gatattgttg ttacagatat tagaactgcg gagatgacca aggtagtaga aaatacattt + 15001 agagctgtaa atattgcttt cgctaacgaa ttagcacaga tctgtagtta tgataatatg + 15061 aatgtttatg aaattatccg gatctgtaat atgcacccac gggtaaatat tctacaacct + 15121 ggacctggtg ttggtgggca ttgtatttct gtggatcctt ggttcttagt tggagattat + 15181 cctgagttga caaatgttat tgaacattct atgcgaacaa atgctgccat gccagaattt + 15241 gtattaaatc gtatctatac cattatgaac gaacatcatc taacagatat tagtcgggtt + 15301 ggtctatatg gtcttaccta caaagagaat gtagatgata tgcgtgaatc tccaacgctt + 15361 cagttattag aatctatgag ccgccatctg gcaacacctg ctattaaagt atatgatcca + 15421 tttatagaaa aagatgttgt ggcgaatcag tcacatgatt tagatgaatt tttatctaat + 15481 gttgatattg ttgtactgtt ggttggtcat gatgagattt tacaaaatat ggataaacta + 15541 aaagataaga tagtgttaga tacacgttat atctgtcatc ttgatggaac ttacagatta + 15601 taattagtga taaataaagt aaggattgac tatgaaaaaa atagttgtaa ttttcggaac + 15661 tcgtcccgaa gctatcaaga tgtgtccctt ggttaaagag ctaagaacac gtgagaatct + 15721 tgaaacattg gtctgtgtta cgggtcaaca tcgtcaaatg ctggatcaag ttttggatac + 15781 ttttaggatt acgcctgatt ttgatttatc tattatgaag gacaaacaaa ctctctttga + 15841 tgtcacaatt ggcattttgg aaggcatgaa gactgtctta gagtcagtta atcctgattt + 15901 aatattagtt catggggata cgagtacaac atttgccagt tcactggccg ccttttatct + 15961 acagattcca attggacatg tagaggctgg tttgcgtact tatgatattt attcacctta + 16021 tcctgaagaa tttaatcgtc aagcagtagg tgctttggct cagtatcatt ttacaccaac + 16081 acaactctca aaagacaatc tcttgagaga aggaaaaaat tctgaagcta tatttatcac + 16141 aggtaacaca gcaattgatg ctttacaaac tacaattcaa gaggattata ctcatcctga + 16201 gttaaattgg gttggggata gcaaactaat attaattact gctcatcgtc gtgaaaatat + 16261 tggtgacccg atgaggcaca tgtttagagc aatccgacgt atcattgaag aacattcgga + 16321 tataaaggct 
ctttacccca ttcatatgaa tcctctagtt cgtcagattg ctgaggaaga + 16381 actaagcgga tgtgaacgta tcaaaatgat cgatccgttg gaagtattag attttcataa + 16441 ctttttatca cggagttatc tcattttaac agatagtggt ggtatccaag aagaggcacc + 16501 tagtttagga aaacctgttt tagttatgag agatacaact gaacgtccgg agggaattaa + 16561 agcaggaact ttgaagcttg taggtactga tgaggacaat atttatagac attttaaaga + 16621 attgttagaa aatgatttag tttatcaagc gatgagccaa gcttcaaatc cgtatggaga + 16681 tggaacagct tgcaagaaaa ttgcagacat actagaagga gaagtataat atatgtcaca + 16741 atttacagga aaaactctcc taattacagg aggaacaggt tcatttggta atgctgtcct + 16801 taatcgtttt ttacagactg atattggtga aattcgtatt ttttcccgtg atgaaaaaaa + 16861 acaggatgat atgcgtcatg agtttcaggt aaaagtacca gaagtagctg ggaaaatccg + 16921 tttttacctt ggagatgtgc gtgacttagc ttcggtaaaa aatgctatgc atggtgtgga + 16981 ttatgttttt catgctgctg ctcttaaaca agtaccttcg tgtgaatttt tccctgtaga + 17041 agcggtaaaa actaacattt tgggaacgga gaatgtcctc actgcggcta tcgaagctgg + 17101 tgtaaagcaa gttatctgtc tttctacaga taaggcggct tatcccgtca atgctatggg + 17161 aacatccaag gctgatggaa aagattgctg ttgctaagtc caggacggta aatcctgagc + 17221 atacaaagat atgtgtgact cgctatggga atgttctgtg tagccgtgga tctgtcgttc + 17281 ctctttggat tgagcaaatt aagcaaggaa atgctcttac aattactgaa cctagcatga + 17341 cacgttttgt gatgacatta gaagaagcag tagacttggt tttatttgca tttgaagaag + 17401 ggaaatctgg agatatacta gttcagaaag caccagcatg tacgattgaa gtgttggcta + 17461 aggctgtatc agaaattttt gcctcagaac aagatattaa gattataggt attagacacg + 17521 gagaaaaaag gtatgaaaca ctattaacta atgaagagtg cgcaaatgca attgatttgg + 17581 gtgattttta tagagttcct agtgataatc gtaatcttaa ctatgataag tatttcaaag + 17641 atggtagtac gaatagaaat ttgttgacag aattcaatag taataatacc gatttgatgg + 17701 atgtagagca agttaaaaga aagttgctag aattagatga aatacagaca gcaattcgtg + 17761 atatggtagc agatgaagag atgtaaaatc ttttaagata cattaaaatt atcaaggata + 17821 tataatgtat catgtattgt cgagagagtt gactattaaa acagcatata aaacaaggag + 17881 ggggcatgat taaaaatatt ttaatcacag gagcgaaagg atttgtagga aaaaatctta + 17941 tctgtactct 
ggaagctttg aaagatgggc gagataggac tcgtcctaat ttagagattg + 18001 gagagatttt tcagtatgat cgtgatacag atccgatttt attagatgaa tattgtaaga + 18061 aggccgattt cgtattccat ttagctggtg tcaatcgtcc acagaatcct gatgaattca + 18121 tggagggaaa ttacggtttt tcaagtagat tattggagat tttagaaaag tatgaaaaca + 18181 cttgtcctgt tctactctca agttctactc aagctagttt agaaggccga ttttcaaact + 18241 ctatatatgg acaatctaag ctagcagggg aagaactctt ctttgaatat ggaaagaaaa + 18301 cgggagcacc tgtcttagtt taccgtttcc cgaatcttta tgggaagtgg tgccgtccta + 18361 actacaattc tgctgtagca actttctgtc ataatctagc tcacgattta cctattcaag + 18421 taaatgatcc aagtgtagaa ttggagttgc tgtatattga tgatttgata caagagtgtc + 18481 taactgcatt ggaaggaaat cctcatcgtt gtaatctaga tggattacaa atcttaccta + 18541 gcccatcagg aaactactgc tacgtaccaa cgactcatcg tgcaacctta ggagagattg + 18601 tctctctatt agaaacattt aaaaaacagc ctaatagttt agttatgcct gaaattcctc + 18661 aaggatcgtt taaaaagaaa ttgtattcta cctacctatc ttatttacca gtagataagt + 18721 ttaggtttcc tctaaaaatg aatatagatg aacgaggtag ttttacggaa ttattaaaaa + 18781 cagaaaatac gggtcaattt tctgttaata tttctaaacc tggcattacc aaagggcaac + 18841 attggcatca ttctaagtgg gaatttttca tggttgtttc tggtcgtgct ttaatacaag + 18901 agcgtaggat agggctggat gaaaacggtc aagagtatcc tattctgaac tttgaagtgt + 18961 cgggcgataa gattgaagca atacatatga taccgggcta tgcacataat attattaatc + 19021 tttctgatac agaaaatcta attactgtca tgtgggctaa tgagtcattt gatcctagac + 19081 atccagatac tttttttgaa caagtggaga aataaatgaa aattaagaca gattatagtg + 19141 atattcattt taaagataat ggcaaactta agttattgat tattgtggga acacgtccag + 19201 agattatacg tctaagtagt gttatcacta aatgtcgaaa gtattttgat gttattttgg + 19261 cacatactgg acaaaactat gattacaatt taaatggtat tttctttgat aatttagggt + 19321 tagacactcc ggacgtatac atggatgctg ttggagatga tcttggtgct actgtaggga + 19381 atattattaa tacttcatac aaattgatga atcaaattaa accagatgct ttattgattt + 19441 taggggatac aaattcttgt ttatcagcta ttgctgccaa gcgtttacat attccaattt + 19501 ttcatatgga ggctggcaat cgctgtaaag atgagtgcct gccggaagag actaatcgtc + 19561 ggattgttga 
tattatttca gatgttaact tagcatactc tgaacatgca cgtaagtatt + 19621 tacatgagtg tggtttacct aaagagcgca catatgtaac tggttctcct atggcagaag + 19681 tgttacataa aaatttacct gccattgagt cttcagatat ccatgaacgt ttgggattga + 19741 aaaaaggagg ttatatctta ctttcagctc accgtgagga aaatattgat acagataaaa + 19801 attttatttc tctctttaca gcaattaatc aattagctga aaagtataat atgccaatct + 19861 tatattcttg ccatcctaga tcaaagaaaa ggctacaaga gagcggtttt aaactagata + 19921 aacgtgtgat tcagcatgag ccactaggat tccatgacta taattgttta cagatgaatg + 19981 catttgttgt agtatctgat tcgggaactt taccggaaga aagtagtttc tttactagtc + 20041 aaggttatcc ttttcccgct gtatgtattc gtacaagtac agaacgtcct gagtccttag + 20101 ataaggcagg atttattttg gcaggcattg atgaaaattc tcttcttcaa gcagttgaaa + 20161 ctgctgttag cttggcagaa gatgaggatt ttggattacc ggttccagat tatgttgagg + 20221 aaaatgtctc tactaaagtt gttaagataa tacagagcta tacagggata gtggataaaa + 20281 tagtttggag gaaaagctga attgtatatt tttaataaat caaaacgaga tgattaattc + 20341 ttagtagaac aagagtaaaa ttgaacgtat ttgatggaaa tgtcttactt gatagtcgag + 20401 ggatagccat tctatcggat ttttggcttg tttttgcgct tcatgtttga tagaataaag + 20461 ggctctttgt caactgtagt gggttgaaga aaagctaagc ttgagaaagg acaaatttcg + 20521 tcctttcttt tttgatgttc agagcgataa aaatccgttt tttgaagttt tcaaagtttc + 20581 gaaagtaacc gcccaataac gaagtatatt gaaaaatctc cagactagag aactcacgga + 20641 tagttcctaa tctggagatt tcttatttgc acttttcttg tacaacttta gtccatggta + 20701 aataagcctc taaaacctct ttgtttacga gagtttcctc gtttggaaga cattctagaa + 20761 gataggatag atatttctca ctatttagtt gatgacgttt agctgtttcc aacaagctca + 20821 taataatagc tcttgcttta gctccttcaa aactttgaga aaataaccac cctcgctttt + 20881 ttaaactgag ctcaggctaa aagagtccac tggactcttt tactccgtcc cataaccaat + 20941 gatttaatgg cgcgttcagc tagattattg gaaaggacca gatgtccgtc tttcaaaata + 21001 gtcttaaagg tttcttcata cttgaggctg tattcaattg cccttcctag ttttgaacct + 21061 gctaaaactg actgacggcg gcaccaagca aagaagtctt ccattagggg ctggagatgt + 21121 tcttgacgtt tctgtagtcg ttcatcagct ggcaaagcct cccagtctct ttccaaggaa + 21181 aataactgat 
cacaataagc taaaccttta gctcctaagg atgatttatc tgcttgcttg + 21241 ggggtcgctt caaaaaattt ccttctcaca tgcgcccaac atccaacaag ttcagcttct + 21301 tccagttgac gataagcttc tagcggttcg tagtttacca agcttagcgt cgccttgctc + 21361 ctaaaccttg gactgctatc gcataggcag aactagagga ctaaagtcct aagttactgc + 21421 cgcaacatat cacaatgaac atagccagaa taatctccta ggaattcttg tactaccgaa + 21481 ccactccgac tctgatcatg atggtacagc gtgattgctt gattctcaac tttcccagac + 21541 aaaaaggtcc aatagtaggt cagatggcta tgactctcta gaacccgata agaagtttca + 21601 tccgcatgaa gtaagggctg agtcaatagt ctctctcgca agaggttata aaggggcttt + 21661 aggaatagga gctttcacaa gcttatccag atgattatct tttactcgtt atggacaatg + 21721 ctatatggca taaatcaagt accttaaaga ttccgactaa tattggtttt gcatttattc + 21781 ctccatacac accagagatg aaccccattg aacaagtgtg gaaagagatt cgtaaacgtg + 21841 gatttaagaa taaagccttt cgaactttgg aagatgtcat acaaggactg gagaaggagg + 21901 tgataaagtc catcgttaat cggagatgga ctagaatgct ttttgaaagc agatgagtgt + 21961 aaaaagaaag tcctcatttc aatagaaatc acgactttct gatgaattta tagtgaaatg + 22021 aaataagacc aggacaaatc gatcaggaca gtcaaatcga tttctaacaa tgttttagaa + 22081 acagaggtgt actattctag tttcaatcta ctatattttt ggagtgatag aaaagccctt + 22141 catcagccaa tctacttgtt caggtgcgag agctttgaca tccttttctg tactgggcca + 22201 agtcagtctg ccgttctcaa agcgtttata tagtagccaa aatccttgac catcccagta + 22261 aagggcttta aagcggtctt tacgtccacc acaaaagaga aaaacttgac ctgagaaaga + 22321 atccaattca aagtgggttt taaccagata agccagtgaa tcgattcctt gtctcatatc + 22381 cgttttccca catacgagat agacctgccc taggctagat agatgaattg tcatagagca + 22441 acaccttatc caaaagctgt tctatcattt cgagattgag agattgaaaa aaacttactt + 22501 caagcttgcc aatacgaatt ttaagcagaa tatcatttct ctttttagaa tcaaaaggac + 22561 gagattgtgg aatctctaca ggaacaatag gttgtagcat taaaatatcc tccaatagtt + 22621 ttactttact aatagtatac aggaggagct ccatgaatga tagatacctt gttatgacgc + 22681 gcttactaaa caactaactg atgcacgatt taagcgcctt gttggtgttc agcgcacgac + 22741 ttttgaagag atgttagctg tattaaaaac agcttatcaa cttaaacacg caaaaggtgg + 22801 acgaaaacct 
aaattaagcc tagaagacct tcttatggcc actcttcaat atgtgcgaga + 22861 atatcgaact tatgaagaaa ttgcggctga ttttggtatc cacgaaagca acttaatccg + 22921 tcggagccaa tgggttgaag taactcttgt tcaaaggtgg tgttacgatt tcaagaactc + 22981 ctctcagttc tgaggacacg gtaatgattg atgcgacgga agtaaaaatc aatcgcccta + 23041 aaaaaagaat tagcgaatga ttctggtaaa aagaaatgcc acgctatgaa ggctcaagcg + 23101 attgtcacaa gtcaagggag aattgtttct ttggatatca ctgtgaacta ttgtcatgat + 23161 atgaagttgt tcaaaatgag ttgcagaaat atcggacaag ctggaaaaat cttggctgac + 23221 agtggttatc aagggctcat gaagatatat cctcaagcac aaactccacg taaatccagc + 23281 aaactcaatc cgctaacagc taaagataaa gcctgtaacc atgcactatc taaggataga + 23341 agcaaggttg agaacatctt tgccaaagta aaaacgttta aaatgttttc aacaacctat + 23401 cgaaatcatc gtaaacgctt cggattacga atgaatttga ttgctggtat tatcaatcat + 23461 gaactaggat tctagttttg caggaagtct attgaaggat cttttgcttt agttccttgg + 23521 tcaaggttga ttattttcac ggagcgcttc cgattgtttt cataaaccat ttgcgcatag + 23581 tcagcagaat aaatcttttt gaaacgtccc tttcctagac attatagaac tttcagattc + 23641 atctgaattt accaaattaa cacaaaaatt ctgaaaattc tgttgacatc tttctgaaaa + 23701 gagtttataa tggagagaaa gttttaaagg agaaaatgat gaaaagttca aaactatttg + 23761 cccttgcggg cgtgacatta ttggcggcga ctactttagc tgcatgctct ggatcaggtt + 23821 caagcactaa aggtgagaag acattctcat acatttatga gacagaccct gataacctca + 23881 actatttgac aactgctaag gctgcgacag caaatattac cagtaacgtg gttgatggtt + 23941 tgctagaaaa tgatcgctac gggaactttg tgccgtctat ggctgaggat tggtctgtat + 24001 ccaaggatgg attgacttac acttatacta tccgtaagga tgcaaaatgg tatacttctg + 24061 aaggtgaaga atacgcggca gtcaaagctc aagac +// + diff --git a/public/res/serotype_genbank/serotype_45.gb b/public/res/serotype_genbank/serotype_45.gb new file mode 100644 index 0000000..e34f894 --- /dev/null +++ b/public/res/serotype_genbank/serotype_45.gb @@ -0,0 +1,1249 @@ +LOCUS CR931718 27591 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain Eddy nr. 72 (serotype 45). +ACCESSION CR931718 +VERSION CR931718.1 +KEYWORDS . 
+SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 27591) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 27591) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..27591 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="Eddy nr. 
72" + /db_xref="taxon:1313" + gene <1..163 + /gene="dexB" + /locus_tag="SPC45_0001" + CDS <1..163 + /gene="dexB" + /locus_tag="SPC45_0001" + /codon_start=2 + /transl_table=11 + /protein_id="CAI34573.1" + /db_xref="GOA:Q4K2R1" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K2R1" + /translation="DRRFLVVANLSNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVP + WDAFCVELL" + gene 322..490 + /gene="aliB" + /locus_tag="SPC45_0002" + /pseudo + CDS 322..490 + /gene="aliB" + /locus_tag="SPC45_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(order(488..808,810..1355)) + /gene="tnp" + /locus_tag="SPC45_0003" + /pseudo + CDS complement(join(488..808,810..1355)) + /gene="tnp" + /locus_tag="SPC45_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(966..1337) + /gene="tnp" + /locus_tag="SPC45_0003" + /note="HMMPfam hit to PF01710, Transposase, score 7.2e-22" + /pseudo + gene 1581..3035 + /gene="wzg" + /locus_tag="SPC45_0004" + CDS 1581..3035 + /gene="wzg" + /locus_tag="SPC45_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI34576.1" + /db_xref="GOA:Q4JYP2" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4JYP2" + /translation="MLIMSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNI + LAFRYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGL + TNRLNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNT + DLTVNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKV + GAPKTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPI + ADGGNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGVDVH + NDQEFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKL + TSTEALKNYSTIINSLQDSIQTNMPIETMIDLVNTQLESGGNYKVNSQDLKGTGRMDL + PSYAMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 
1581..1706 + /gene="wzg" + /locus_tag="SPC45_0004" + /note="Signal peptide predicted for SPC1965 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 42 and 43" + misc_feature 1794..2141 + /gene="wzg" + /locus_tag="SPC45_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 2.3e-64" + misc_feature 2319..2762 + /gene="wzg" + /locus_tag="SPC45_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 8.4e-70" + gene 3037..3768 + /gene="wzh" + /locus_tag="SPC45_0005" + CDS 3037..3768 + /gene="wzh" + /locus_tag="SPC45_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34577.1" + /db_xref="GOA:Q4JYP1" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4JYP1" + /translation="MIDIHSHIVFDVDDGPKSREESKALLVESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHNALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKSKLFGERYKFMKKRAQYFLEQDLVHVIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 3040..3648 + /gene="wzh" + /locus_tag="SPC45_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 8.2e-36" + gene 3774..4469 + /gene="wzd" + /locus_tag="SPC45_0006" + CDS 3774..4469 + /gene="wzd" + /locus_tag="SPC45_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34578.1" + /db_xref="GOA:Q4JYP0" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4JYP0" + /translation="MMKEQNTIEIDVFQLVKSLWKRKLMILIVALVTGAGAFAYSTFI + VKPKYTSTTRIYVVNRNQGDKSGLTNQDLQAGSYLVKDYREIILSQDVLEEVVSDLKL + DLTPKGLANKIKVTVPVDTRIVSVSVNDRVPEEASRIANSLREVAAQKIISITRVSDV + TTLEEARPAISPSSPDIKRNTLIGFLAGVIGTSVIVLLLELLDTRVKRPEDIEDTLQM + 
TLLGVVPNLDKLK" + misc_feature 3795..4211 + /gene="wzd" + /locus_tag="SPC45_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 1.5e-56" + misc_feature 4317..4394 + /gene="wzd" + /locus_tag="SPC45_0006" + /note="PS00217 Sugar transport proteins signature 2." + gene 4479..5162 + /gene="wze" + /locus_tag="SPC45_0007" + CDS 4479..5162 + /gene="wze" + /locus_tag="SPC45_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34579.1" + /db_xref="GOA:Q4JYN9" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4JYN9" + /translation="MPTLEIAQKKLEFVKKAEEYYNALCTNIQLSGDKLKVISVTSVN + PGEGKTTTSVNIAISFACAGYKTLLIDGDTRNSVMSGFFKSREKITGLTEFLSGTADL + SHGLCDTNIENLFVVQSGTVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTAPIGIVI + DAAIITQKCDASILVTATGEVNKRDIQKAKQQLKQTKKLFLGVVLNKLDISVDKYGIY + GSYGNYGKR" + gene 5485..6138 + /gene="wciI" + /locus_tag="SPC45_0008" + CDS 5485..6138 + /gene="wciI" + /locus_tag="SPC45_0008" + /note="member of homology group 29" + /codon_start=1 + /transl_table=11 + /product="putative initial sugar transferase" + /protein_id="CAI34580.1" + /db_xref="GOA:Q4JYN8" + /db_xref="InterPro:IPR003362" + /db_xref="UniProtKB/TrEMBL:Q4JYN8" + /translation="MSNGNRMKNGNRIYSWRLFMYSIIKRLGDILLSLIGIIILCPVF + MIIAIAIKLDSEGPVIFKQKRFGIHKEYFYILKFRSMKIDAPKNVAPRNLYNPEQWIT + KVGAFLRKTSLDELPQLFNILVGNMSIVGPRPAGINELDLIAERDKYGANDILPGLTG + WAQINGRDTLSVEMKTELDGYYVKHLSLIMDIRCIVKTIPYVLKRKGIVEGSGKKES" + misc_feature 5485..5634 + /gene="wciI" + /locus_tag="SPC45_0008" + /note="Signal peptide predicted for SPC1969 by SignalP 2.0 + HMM (Signal peptide probability 0.907) with cleavage site + probability 0.634 between residues 50 and 51" + misc_feature 5557..6111 + /gene="wciI" + /locus_tag="SPC45_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 4.3e-37" + gene 6147..7373 + /gene="wciJ" + /locus_tag="SPC45_0009" + CDS 
6147..7373 + /gene="wciJ" + /locus_tag="SPC45_0009" + /note="member of homology group 35" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34581.1" + /db_xref="GOA:Q4JYN7" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4JYN7" + /translation="MKILFVCQHYKPEPFRLSDICEDLVRKGHEVSVLAGIPNYPEGK + IYADYRHNKKRREIIEGVTIYRSYTIPRKKSVVFRLLNYFSFAISSTLGVLLGRYKTK + DGSNFDCVFVNQLSPVMMAWAGMAYKKKYKKPMFLYCMDVWPDSLTVGGVKQDGLIFK + LFKFISKKVYRASDYIFVTSPSFKNYFVKQFDISEQKITYLPQYAEDLFIPDESIVNK + ESVDLTFAGNIGKAQNLETILKAASLIEKNTNLPKKIHFHFVGDGTELLSMKALAHEL + ELKNISFYGRRSLEEMPSFYKKSDAMLVSLIGDSIVSRTIPGKVQSYMAAGKPIIGAI + SGDAKIIVEEANCGYVSPERDVKQLAKNICKFSMLSIKRQRELGKKARCYYENHFSKE + QFMTQLEKYLREEFSS" + misc_feature 6765..7298 + /gene="wciJ" + /locus_tag="SPC45_0009" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 2.1e-12" + gene 7370..8539 + /gene="wcxB" + /locus_tag="SPC45_0010" + CDS 7370..8539 + /gene="wcxB" + /locus_tag="SPC45_0010" + /note="member of homology group 55" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34582.1" + /db_xref="GOA:Q4JYQ4" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4JYQ4" + /translation="MKILMINTVCGIRSTGRICTDIATALTKKGHEVKIAYGREYVPT + QYRNYAVKIGSRVDVNRHVLQARIFDNAGFVGRAATRKFITWVKEYDPDIIHLHNLHG + YYIHVGELFSYLKTCGKKILWTLHDCWAFTGHGAYFDTLECEKIGQCHHSSQKNDYPK + SLIDFSSRNFKRKKNLFTGVPNLTLITPSEWLANLVRNSFLKEYPVTVIHNGIDTTIF + KPRVLEAKKLRKKFRLEGKQVLLGVASIWDQRKGLDDLLELSVQLKSYQQLVLIGLSK + EQLNKLPKEIIGLTTTDSVEELSAWYTLADVFINPTTQDNYPTTNLEAIACGTPVVTY + PTGGSIESTYMYGIVCSDRTVVSILESLKEVSQCKRSPNFNLSKEYFVENILNLY" + misc_feature 8042..8533 + /gene="wcxB" + /locus_tag="SPC45_0010" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 1.3e-10" + gene 8511..9650 + /gene="wciL" + /locus_tag="SPC45_0011" + CDS 8511..9650 + /gene="wciL" + /locus_tag="SPC45_0011" + /note="member of homology group 30" + /codon_start=1 + /transl_table=11 + 
/product="putative glycosyl transferase" + /protein_id="CAI34583.1" + /db_xref="GOA:Q4JYQ3" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4JYQ3" + /translation="MWKIYSIYTSGTGVDMIKILYVNGGTMDRGGVSTFMMNVYEKMH + SEKIQIDFLVHTLSEGVRDEDILNLGGKIFRVPARGKNPLKNYRQIKQIMLNGNYDVV + HAHADAGNRTILSIAKECDIPIRISHCHNTNYTNKSLLKKFLNEQFKKQIPRYATHLW + ACSEKAGEWLYGNHSFEVIPNAIDVQKFIYSPQLSKDLRKELNLENKFVIGHVGRFDY + QKNHDFLLKVFTEFINEREDAHLVLIGKGELEEVIKKQANHLGILDKISFLGESSNVN + ELINVFDVGVFPSLFEGFSIAMVEMQVNGLPLVVSDNVPSEINLTDNIRFLSLDETVK + YWCKTILETKGRDTGAVDKIIAKGYNLSDMVHKLTKTYERIVDKS" + misc_feature 9093..9593 + /gene="wciL" + /locus_tag="SPC45_0011" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 6.2e-25" + gene 9647..10756 + /gene="wcyQ" + /locus_tag="SPC45_0012" + CDS 9647..10756 + /gene="wcyQ" + /locus_tag="SPC45_0012" + /note="member of homology group 202" + /codon_start=1 + /transl_table=11 + /product="putative transferase" + /protein_id="CAI34584.1" + /db_xref="GOA:Q4JYQ2" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4JYQ2" + /translation="MKKVLFVTNIPSPYRVDFYNQLGKFVDLTVVFEATGAQDIRFDY + REIFKNFTAIFLSEGNIDEKKLNSAIFQYLIPKKYDYIFLTNYSYRTELFGYLKCVFS + KIPFVLEIDGGKIPESENFLKYQFKKFILTKPYYYFSPSQSSDDFLAHYHVNKENIYR + YSFTSLSEKDIRYQIVDEKEKQFLRKKLGFSPTKKTILFVGRIIPGKGVDVLIKAVQN + LSDDVQCLIVGPSPDSEYKQYLLDLIGQDSRFHFIDFLQTSELKQYYKLSDIFVLPTK + SDVWGLVVNEAMSQGLPVISTSACVAAIELVSNGNNGYIIDRVDDWKAIFQKLSKVLQ + DDSLRVQLSQNALSTIKHYTIETMVKEHLKFMEEK" + misc_feature 10187..10693 + /gene="wcyQ" + /locus_tag="SPC45_0012" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 3.2e-35" + gene 10753..11673 + /gene="wcxS" + /locus_tag="SPC45_0013" + CDS 10753..11673 + /gene="wcxS" + /locus_tag="SPC45_0013" + /note="member of homology group 104" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34585.1" + /db_xref="GOA:Q4JYQ1" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JYQ1" + 
/translation="MRISVAMTTYNGADYLLEQLESLRTQSLMADEVIIVDDCSTDNT + VELLDMYIQKYHLDNWVLIRNSSNIGWRKNFRKALQETTGDIVFLCDQDDIWNKDKIS + LMVKEFHKSPSIELLASNYEILDFGRNDKIKIRDVELDNGAVVPFSLKNKSISVMRPG + CTFAVKRELIVLLEKYDIDRFGHDNILWNLAMIRGTLYLYLKRLIHFRRHETSASAPN + QSLNRDRRVVEVDTSHQITVFLLDAARREHLDIKIISQLENMEMVLERRRDILKYGTL + MQIVHFQLKYHTYYPTFRNLLSDILVFLKK" + misc_feature 10762..11271 + /gene="wcxS" + /locus_tag="SPC45_0013" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 9.4e-34" + gene 11689..13128 + /gene="wzx" + /locus_tag="SPC45_0014" + CDS 11689..13128 + /gene="wzx" + /locus_tag="SPC45_0014" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI34586.1" + /db_xref="GOA:Q4JYQ0" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4JYQ0" + /translation="MSKISKNYLYNLIYQVVVLILPLLITPYVARILGAHQLGIYDYV + NSIVTLIYTLGLLGIGHYGNRECAYTRDDKEELSETFWSILAIQIILGFFSLLFLYIF + SNINSNYQVYFQLFSIWLFGSILDCTWLYRGLEEMQYVVLKNIIAKLLFTIATFLFVK + SETDLTLYVLIYGLSVLVANLSTYSQLRMFISRPKININRFTEIILGSLKLFLPSIIT + QIMLSADKIVLGSLSSGISNVSYYSNAEKIIQIPLSLIVVLNSVMMPRIANEFRNRRL + ENMKKYLTTAAEFSLFLAVPLSIGLYAIADTFVPWFLGESFMPSMDALKWLAPIAVGN + ALLGVSGSQYFVAVNKTKVLFFSNTLAAILNILLDLLLAPMFGVVGVCLATIVSLTSS + VIVQYYIMSKDIPIIPILKSLFKYLIYSMIMGMIIIVSFRGYPANYRTTIKQIVLGIV + VYFGLNLLTRDVFVFQTLDFVKKGFKKSR" + misc_feature 11698..12501 + /gene="wzx" + /locus_tag="SPC45_0014" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 2.1e-49" + gene 13125..14213 + /gene="wzy" + /locus_tag="SPC45_0015" + CDS 13125..14213 + /gene="wzy" + /locus_tag="SPC45_0015" + /note="member of homology group 257" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI34587.1" + /db_xref="UniProtKB/TrEMBL:Q4JYP9" + /translation="MISALFYISFLTNLLVVVNRMRINSLAFLSWLILFFIYAGNIRE + GFSDLIHYRARYAVGKSSLYFSDHAYNFFADWFSHHSISFQVFLACIFLFSSACFYFV + AKKLHCNYNLLILLLSLFYFFYTLEVLRFFLATSVALIAHYYLSQNHRFIFIGLMFIA + 
FLFHGSIIYFLPFIIFYRQKNTSKMLWALVFISMVLIVTNLLVGNNSSYLTKIFELLG + SEVTKSRVMYYTAKSTRLGFILYDSYYIFNLLISINLKKIAKTVSNAPQEVTNFINLV + YQHSFFSTIFLPLIMFSTAFTRYLIFTVVLNFIAIAALQPFMQQSFIKLKSGLYIIFG + VLGATCFWWYLRENVLYFYEALLPNLFN" + gene 14321..15175 + /gene="wcyR" + /locus_tag="SPC45_0016" + CDS 14321..15175 + /gene="wcyR" + /locus_tag="SPC45_0016" + /note="member of homology group 203" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="CAI34588.1" + /db_xref="GOA:Q4JYP8" + /db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4JYP8" + /translation="MINYSADELDMIQKLELKILKEIIRICKKEKIEYFLIGGSALGA + IRHEGFIPWDDDIDVGMTRENYDNFLRVAEQYLGEEFYLQSPSSDRKSPYSYSKLMLK + ETLFLEYAQRNLKTQSGIYVDIFPFDEVPDNESENERQFKAVQFYKKLYVMRMLPTVS + KAPENLIQGLKAILRRCIHYSLRLIPKSLILKKIDQFSRLYNGTNQSALACLDFPVRN + VEYVLKTTLYPLIEHKFEEITILLPGDFHQYLTTHYGEYMKLPPLEERVGHRPYLIDL + GTYGKEEK" + misc_feature 14399..15085 + /gene="wcyR" + /locus_tag="SPC45_0016" + /note="HMMPfam hit to PF04991, LICD Protein Family, score + 2.1e-48" + gene 15172..15576 + /gene="gct" + /locus_tag="SPC45_0017" + CDS 15172..15576 + /gene="gct" + /locus_tag="SPC45_0017" + /note="member of homology group 28" + /codon_start=1 + /transl_table=11 + /product="CDP-glycerol-1-phosphate biosynthetic protein + Gct" + /protein_id="CAI34589.1" + /db_xref="GOA:Q4JYP7" + /db_xref="InterPro:IPR004820" + /db_xref="InterPro:IPR004821" + /db_xref="InterPro:IPR006409" + /db_xref="InterPro:IPR014729" + /db_xref="UniProtKB/TrEMBL:Q4JYP7" + /translation="MKRVITYGTFDLLHYGHINLLKRAKDLGDYLIVALSTDEFNLQK + DKISYFNYQQRKILLESIRYVDLVIPEISWEQKREDVKKYYADIFVIGDDWEGKFDFL + KDEGVEVVYLPRTKEISTTQIKEDLNKTKGGK" + misc_feature 15184..15549 + /gene="gct" + /locus_tag="SPC45_0017" + /note="HMMPfam hit to PF01467, Cytidylyltransferase, score + 1.4e-22" + gene 15566..16633 + /gene="fnlA" + /locus_tag="SPC45_0018" + CDS 15566..16633 + /gene="fnlA" + /locus_tag="SPC45_0018" + /note="member of homology group 36" + /codon_start=1 + 
/transl_table=11 + /product="FnlA" + /protein_id="CAI34590.1" + /db_xref="GOA:Q4JYP6" + /db_xref="InterPro:IPR003869" + /db_xref="InterPro:IPR013692" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JYP6" + /translation="MENNMSQFTGKTLLITGGTGSFGNAVLKRFLETDISEIRIFSRD + EKKQDDMRHEFQVKVPEVAGKIRFYLGDVRDLASVKNAMHGVDYVFHAAALKQVPSCE + FFPVEAVKTNILGTENVLAAAIEADVKQVICLSTDKAAYPVNAMGTSKAMMEKIAVAK + SRAVNPEHTKICVTRYGNVLCSRGSVVPLWIEQIKQGNALTITEPSMTRFVMTLEEAV + DLVLFAFEEGKSGDILVQKAPACTIEVLAKAVSEIFASEQDIKIIGIRHGEKMYETLL + TNEECANAIDLGNFYRVPSDNRNLNYDKYFKDGSTNRNLLTEFNSNNTDLMDVEQVKR + KLLELDEIQTAIRDMVADEEM" + misc_feature 15599..16453 + /gene="fnlA" + /locus_tag="SPC45_0018" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.0019" + misc_feature 15602..16450 + /gene="fnlA" + /locus_tag="SPC45_0018" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 4.2e-163" + misc_feature 15602..16273 + /gene="fnlA" + /locus_tag="SPC45_0018" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 6.6e-09" + misc_feature 15605..16240 + /gene="fnlA" + /locus_tag="SPC45_0018" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 9.6e-09" + misc_feature 16451..16594 + /gene="fnlA" + /locus_tag="SPC45_0018" + /note="HMMPfam hit to PF08485, Polysaccharide biosynthesis + protein C, score 2e-23" + gene 16733..17962 + /gene="fnlB" + /locus_tag="SPC45_0019" + CDS 16733..17962 + /gene="fnlB" + /locus_tag="SPC45_0019" + /note="member of homology group 37" + /codon_start=1 + /transl_table=11 + /product="FnlB" + /protein_id="CAI34591.1" + /db_xref="GOA:Q4JYP5" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JYP5" + /translation="MIKNILITGAKGFVGKNLICTLEALKDGRDRTRPNLEIGEIFQY + DRDTDPILLDEYCKKADFVFHLAGVNRPQNPDEFMEGNYGFSSRLLEILEKYENTCPV + LLSSSTQASLEGRFSNSIYGQSKLAGEELFFEYGKKTGAPVLVYRFPNLYGKWCRPNY 
+ NSAVATFCHNLAHDLPIQVNDPSVELELLYIDDLIQECLTALEGNPHRCNLDGLQILP + SPSGNYCYVPTTHRATLGEIVSLLETFKKQPDSLVMPEIPQGSFKKKLYSTYLSYLPV + DKFKFPLKMNIDERGSFTELLKTENTGQFSVNISKPGITKGQHWHHSKWEFFMVVSGR + ALIQERRIGLDKNGQEYPILNFEVSGDKIEAIHMIPGYAHNIINLSDTENLVTVMWAN + ESFDPRHPDTFFEQVEK" + misc_feature 16745..17368 + /gene="fnlB" + /locus_tag="SPC45_0019" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 6.9e-09" + gene 17963..19147 + /gene="fnlC" + /locus_tag="SPC45_0020" + CDS 17963..19147 + /gene="fnlC" + /locus_tag="SPC45_0020" + /note="member of homology group 38" + /codon_start=1 + /transl_table=11 + /product="UDP-L-fucosamine FnlC" + /protein_id="CAI34592.1" + /db_xref="GOA:Q4JYP4" + /db_xref="InterPro:IPR003331" + /db_xref="UniProtKB/TrEMBL:Q4JYP4" + /translation="MKIKTNYSDIHFKDNGKLKLLIIVGTRPEIIRLSSVITKCRKYF + DVILAHTGQNYDYNLNGIFFDDLGLDTPDVYMDAVGDDLGATVGNIINTSYKLMNQIK + PDALLILGDTNSCLSAIAAKRLHIPIFHMEAGNRCKDECLPEETNRRIVDIISDVNLA + YSEHARKYLHECGLPKERTYVTGSPMAEVLHKNLSAIESSDIHERLGLKKGGYILLSA + HREENIDTDKNFISLFTAINQLAEKYNMPILYSCHPRSKKRLQESGFKLDKRVIQHEP + LGFHDYNCLQMNAFVVVSDSGTLPEESSFFTSQGYPFPTVCIRTSTERPESLDKAGFI + LAGIDENSLLQAVETAVSLAEDEDFGLPVPDYVEENVSTKVVKIIQSYTGIVDKIVWR + KS" + misc_feature 18074..19102 + /gene="fnlC" + /locus_tag="SPC45_0020" + /note="HMMPfam hit to PF02350, UDP-N-acetylglucosamine + 2-epimerase, score 1.8e-106" + gene complement(19693..20637) + /gene="tnp" + /locus_tag="SPC45_0021" + /pseudo + CDS complement(join(19693..19848,19845..20243,20245..20637)) + /gene="tnp" + /locus_tag="SPC45_0021" + /note="member of homology group 258" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1672 transposase" + /db_xref="PSEUDO:CAI34593.1" + gene 20864..21118 + /gene="HG273" + /locus_tag="SPC45_0022" + /pseudo + CDS 20864..21118 + /gene="HG273" + /locus_tag="SPC45_0022" + /note="member of homology group 273" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase (fragment)" + gene 
order(21210..21518,21544..21933) + /gene="tnp" + /locus_tag="SPC45_0023" + /pseudo + CDS join(21210..21518,21544..21933) + /gene="tnp" + /locus_tag="SPC45_0023" + /note="member of homology group 19; + member of homology group 19" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1381 transposase" + misc_feature join(21456..21518,21544..21921) + /gene="tnp" + /locus_tag="SPC45_0023" + /note="HMMPfam hit to PF01609, Transposase DDE domain, + score 3.7e-15" + /pseudo + gene 22226..23095 + /gene="rmlA" + /locus_tag="SPC45_0024" + CDS 22226..23095 + /gene="rmlA" + /locus_tag="SPC45_0024" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI34596.1" + /db_xref="GOA:Q8RSF0" + /db_xref="HSSP:1FXO" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q8RSF0" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLPRFKELLQDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFIGDDSV + ALILGDNIYHGPGLSKMLQKAAKKEKGATVFGYQVKDPERFGVVEFDTDMNAISIEEK + PEYPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLALAQPLKKN + EYGQYLLRLIGEA" + misc_feature 22229..22945 + /gene="rmlA" + /locus_tag="SPC45_0024" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 3.3e-120" + gene 23096..23689 + /gene="rmlC" + /locus_tag="SPC45_0025" + CDS 23096..23689 + /gene="rmlC" + /locus_tag="SPC45_0025" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI34597.1" + /db_xref="GOA:Q9AHA9" + /db_xref="HSSP:1NXM" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:Q9AHA9" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + 
MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKNHPLLKDVKPLKKEDL" + misc_feature 23132..23662 + /gene="rmlC" + /locus_tag="SPC45_0025" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 4.5e-16" + gene 23702..24751 + /gene="rmlB" + /locus_tag="SPC45_0026" + CDS 23702..24751 + /gene="rmlB" + /locus_tag="SPC45_0026" + /EC_number="4.2.1.46" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI34598.1" + /db_xref="GOA:Q4JYN4" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JYN4" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPDVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLVAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAVD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 23717..24673 + /gene="rmlB" + /locus_tag="SPC45_0026" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 4e-05" + misc_feature 23720..24586 + /gene="rmlB" + /locus_tag="SPC45_0026" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.0044" + misc_feature 23720..24460 + /gene="rmlB" + /locus_tag="SPC45_0026" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 9e-78" + misc_feature 23723..24535 + /gene="rmlB" + /locus_tag="SPC45_0026" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 1e-05" + gene 24817..25668 + /gene="rmlD" + /locus_tag="SPC45_0027" + CDS 24817..25668 + /gene="rmlD" + /locus_tag="SPC45_0027" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + 
/product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI34599.1" + /db_xref="GOA:Q9RQL5" + /db_xref="HSSP:1N2S" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q9RQL5" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITDAEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGRELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 24817..25665 + /gene="rmlD" + /locus_tag="SPC45_0027" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 1.1e-148" + misc_feature 24820..25461 + /gene="rmlD" + /locus_tag="SPC45_0027" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 9.3e-05" + misc_feature 24820..25449 + /gene="rmlD" + /locus_tag="SPC45_0027" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 1.4e-19" + misc_feature 24823..25551 + /gene="rmlD" + /locus_tag="SPC45_0027" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 1.4e-08" + gene order(25744..26695,26712..26927) + /gene="tnp" + /locus_tag="SPC45_0028" + /pseudo + CDS join(25744..26484,26483..26695,26712..26927) + /gene="tnp" + /locus_tag="SPC45_0028" + /note="member of homology group 12" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1670 transposase" + misc_feature 25750..26193 + /gene="tnp" + /locus_tag="SPC45_0028" + /note="HMMPfam hit to PF03050, Transposase IS66 family, + score 2.1e-05" + /pseudo + gene 27226..>27591 + /gene="aliA" + /locus_tag="SPC45_0029" + CDS 27226..>27591 + /gene="aliA" + /locus_tag="SPC45_0029" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34601.1" + /db_xref="GOA:Q4JYN2" + /db_xref="InterPro:IPR000914" + /db_xref="UniProtKB/TrEMBL:Q4JYN2" + /translation="MMKSSKLFALAGVTLLAATTLAACSGSGSSSSTKGEKTFSYIYE + 
TDPDNLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIR + KDAKWYTSEGEEYAAVKAQD" + misc_feature 27226..27318 + /gene="aliA" + /locus_tag="SPC45_0029" + /note="Signal peptide predicted for SPC1993 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.703 between residues 31 and 32" + misc_feature 27478..27546 + /gene="aliA" + /locus_tag="SPC45_0029" + /note="PS01040 Bacterial extracellular solute-binding + proteins, family 5 signature." +ORIGIN + 1 cgaccgtcgc ttcctagttg tggctaactt gtccaatgaa gagcaagact tgacagtaga + 61 aggaaaagtc aaatctgtct tgattgaaaa caccctagct caagaagtct ttgaaaaaca + 121 aatcttagtt ccatgggatg ctttctgtgt ggaattacta taaatatttt ttgcagaaaa + 181 atttaaaatt gaaatcatat aaaaacaagg gaggactgta taaaaagcag aaatcctttg + 241 ttttttataa ccaaggttta taaactttca ttctcgaaat tcaattaact ttacaaattc + 301 ccactattaa ggagaaagaa gatgaacata aagaagcgtg tccttagtgc aggcctgact + 361 tttgcatctg ctttgctttt agctgcttgc ggccaatcag gttcagatac aaaaacttac + 421 tcatcaacct ttagtggaaa tccaactaca tttaactatc tattagacta ttacgctgat + 481 aatatagtca attgaaacaa gaacaagaca aaagagcctc ataaaaggta ttgcaacttg + 541 gtaatacctt tttgaggtgc tttttgatat gagcccatgt tttctcaata ggattgtact + 601 caggtgagta gggaggaaga ggtaaaagtt tacgcctaaa ctcttcacac aagagttcta + 661 gcttccccat tctatggaat cttgcattat ccataataat aaccgatggt gtgtttaatg + 721 ttggtaagag aaacttctga aaccaagctt caaaaaagtc gctcgtcatc gtctcttcgt + 781 aagtcattgg agcgattaac tcaccattca tttgttagac ctgcaaccaa agaaatcctc + 841 tgatatcttc ttccagatac tttgcctctt attaactgac tttttaatga gcgaccatat + 901 tctcgataaa aataagtatc gaatcctgtt tcatcaatct aaacaggtgc taggtgcttt + 961 aaactattaa aattcttaag aaataaggct actttttctg ggtcttgttc atagtaggtg + 1021 tggttctttt ttcgagtgta gcccatagct ttgagcgcat agtggatggt agttggatga + 1081 cagccaaatt cagaagctat ttcagtcaaa taagcatctg gattgtcagt aagatagttt + 1141 ttaagtctat ctctatcaac ttttcttggt tttgttcctt ttacttggtg gtttagctct + 1201 cctgttttct cttttagctt taaccagcca taaatggtat tacgtgagat ttggaaaacg 
+ 1261 tgtgatgctt ctgttatact acctgttcgc tcacaataag agagaacttt tttacgaaaa + 1321 tctattgaat atcccataag aagattatac cacattgtgt actatagtag attgaaacta + 1381 gaatagtaca cctctacttc taaaacattg ttagaaatcg atttgactgt cctgatcgat + 1441 ttgtcatgtt cttatttcat tttactatat ttttggttcg cgggaagtct actaagatac + 1501 ttaaagatgc agatagtgaa aataaaggtg tagacattac cgtaaaaaag tgatataatc + 1561 gtatgatgtt gaatgtatag gtgttaatca tgagtagacg ttttaaaaaa tcacgttcac + 1621 agaaagtgaa gcgaagtgtt aatatagttt tgctgactat ttatttattg ttagtttgtt + 1681 ttttattgtt cttaatcttt aagtacaata tccttgcttt tagatatctt aatctagtgg + 1741 taactgcgtt agtcctacta gttgccttgg tagggctact cttgattatc tataaaaaag + 1801 ctgaaaaatt tactattttt ctgttggtgt tctctatcct tgtcagctct gtgtcgctct + 1861 ttgcagtaca gcagtttgtt ggactgacca atcgtttaaa tgcgacttct aattactcag + 1921 aatattcaat cagtgtcgct gttttagcag atagtgagat cgaaaatgtt acgcaactga + 1981 cgagtgtgac agcaccgact gggactgata atgaaaatat tcaaaaacta ctagctgata + 2041 tcaagtcaag tcagaatacc gatttgacgg tcaaccagag ttcgtcttac ttggcagctt + 2101 acaagagttt gattgcaggg gagactaagg ccattgtcct aaatagtgtc tttgaaaaca + 2161 tcatcgagtc agagtatcca gactacgcat cgaagataaa gaagatttat accaagggat + 2221 tcactaaaaa agtaggagct cctaagacgt ctaagaatca gtctttcaat atctatgtta + 2281 gtggaattga cacctatggt cctattagtt cggtgtcgcg atcagatgtc aatatcttga + 2341 tgactgtcaa tcgagatacc aagaaaatcc tcttgaccac aacgccacgt gatgcctatg + 2401 taccaatcgc agatggtgga aataatcaaa aagataaatt gactcatgcg ggcatttatg + 2461 gagttgattc gtccattcac accttggaaa atctctatgg agtggatatc aattactatg + 2521 tgcgattgaa cttcacttcg tttttgaaat tgattgactt attgggaggg gtagatgttc + 2581 ataatgatca agagttttca gctctacatg ggaagttcca tttcccagta gggaatgtcc + 2641 atctagactc tgagcaggct ctaggttttg tacgtgaacg ctactcacta gccgatggag + 2701 accgtgaccg tggtcgcaac caacaaaagg tgattgtggc tatccttcaa aaattaacgt + 2761 caaccgaagc actgaaaaat tatagtacga tcattaatag cttgcaagat tctatccaaa + 2821 caaatatgcc gattgagact atgatagatt tggtgaatac tcagttggaa agtggaggga + 2881 attataaagt aaattctcaa 
gatttaaaag ggacaggtcg gatggatctt ccttcttatg + 2941 caatgccaga cagtaatctc tatgtgatgg aaatagatga tagtagttta gctgtagtta + 3001 aagcagctat acaggatgtg atggagggca gatgaaatga tagacatcca ttcgcacatc + 3061 gtctttgatg tagatgatgg tcccaagtca agagaggaaa gcaaggctct cttggtagaa + 3121 tcctacaggc agggggtgcg aaccattgtc tctacctctc accgtcgcaa gggcatgttt + 3181 gaaactccgg aagagaagat agcagaaaac tttcttcagg ttcgggaaat agctaaggaa + 3241 gtggcgagtg acttggtcat tgcttacggg gctgaaattt actacacacc agatgttctg + 3301 gataagctag aaaaaaagcg gattccgacc ctcaatgata gtcgttatgc cttgatagag + 3361 tttagtatga acactcctta tcgcgatatt cataacgcct tgagcaagat cttgatgtta + 3421 ggaattactc cagttatcgc ccacattgag cgctatgatg ctcttgaaaa taatgaaaaa + 3481 cgcgttcgag aactgatcga tatgggctgt tacacgcaag taaatagttc acatgtcctc + 3541 aaatccaaac tttttggcga acgttataaa ttcatgaaaa aaagagctca gtatttttta + 3601 gagcaggatt tggtccatgt cattgcaagt gatatgcaca atctagacgg cagacctcct + 3661 catatggcag aagcatatga ccttgttacc caaaaatacg gagaagcgaa ggctcaggaa + 3721 ctttttatag acaatcctcg aaaaattgta atggatcaac taatttagga gaaatgatga + 3781 aagaacaaaa cacgatagaa atcgatgtat ttcaattagt taaaagcttg tggaaacgca + 3841 agctaatgat tttaatagtg gcacttgtga caggtgcggg ggcttttgca tatagcactt + 3901 ttattgttaa gccaaaatat acgagtacca cgcgaattta cgtagtgaat cgcaatcaag + 3961 gagacaagtc ggggttgaca aatcaggatt tgcaggcagg atcttatctg gtaaaagact + 4021 accgtgagat tatcctttcg caggatgttt tggaggaagt tgtttctgat ttaaaactag + 4081 atttgacgcc aaaaggtttg gctaataaaa ttaaagtgac agtaccagtt gatacccgta + 4141 ttgtctctgt ttcagttaat gatcgagttc ctgaagaggc aagccgtatc gctaactctt + 4201 tgagagaagt agctgctcaa aaaattatca gtattactcg tgtttctgat gtgacaacac + 4261 tggaggaggc aagaccggcg atatcaccgt cttcgccaga tattaaacgc aatacactaa + 4321 ttggtttttt ggcaggggtg attggaacta gtgttatagt tcttcttctt gaacttttgg + 4381 acactcgtgt gaaacgtccg gaagatatcg aagatacact gcagatgaca cttttgggag + 4441 ttgtaccaaa cttggataag ttgaaatagg agagaggaat gccgacatta gaaatagcac + 4501 aaaaaaaact ggagttcgtt aagaaggcag aagaatatta 
caatgccttg tgtacaaata + 4561 tacagttgag cggagataaa ctaaaagtaa tttccgttac ttctgttaac cctggggaag + 4621 gaaaaacaac tacttccgta aatatagcaa tatcgtttgc gtgtgcaggc tataaaactc + 4681 ttttgatcga tggtgatact cgaaattcag ttatgtcagg attttttaaa tctcgtgaaa + 4741 aaattacagg gctaacagaa tttttatctg ggacagctga tttatctcac ggtttatgtg + 4801 atacaaatat tgaaaattta tttgtagttc aatcgggaac tgtatcacca aaccctacag + 4861 ccttgttaca aagtaaaaat tttaatgata tgattgaaac attgcgtaaa tattttgatt + 4921 atatcattgt tgatacagca cctattggaa ttgttattga tgcggcaatt atcactcaaa + 4981 agtgtgatgc gtccatcttg gtaacagcaa caggtgaggt gaataaacgt gatatccaaa + 5041 aagcgaaaca acaattaaaa caaacaaaga aactgttcct aggagttgtt ttaaataaat + 5101 tggatatctc ggttgataag tatggaattt acggttccta tggaaattat ggtaaaagat + 5161 aaaatgaata tagtatggaa ggggactaca gtataactct ggcattctta cagagcatac + 5221 ttatcagttt attagcttat gtactgattg caatttcaga aaccgatatg tcttcaaata + 5281 atattcggtc tatttggaag aacaattgaa ctgaaccttc taattcatta ttgagaactc + 5341 atatattact gaaacaaata aattttgttt agatggagaa aagttttatc tgacgtagag + 5401 gataaaagaa ttatatttct gaaaatcatt gagtgaccaa atatatattg agtttctgta + 5461 gttgcatgta ctgcctgatt taatttgtca aatggaaata gaatgaaaaa tggaaataga + 5521 atttatagtt ggaggttgtt tatgtacagt ataataaaac gattaggtga tatattatta + 5581 tctttaatag ggataataat attgtgtccg gtttttatga taattgcaat tgcgattaaa + 5641 cttgattcag aaggtccggt tatatttaag caaaaacgct ttggtattca taaagaatac + 5701 ttctatattt tgaaatttag gtctatgaaa atagatgcac ctaaaaatgt ggcgcctcga + 5761 aacttatata atccagagca atggattaca aaagtagggg ctttcttgcg aaaaacatct + 5821 ttggatgaac taccacaatt gtttaatatt cttgttggta atatgagtat tgtaggtcct + 5881 agaccagcgg gtataaatga actagatttg attgcagaga gagataagta tggagcaaat + 5941 gatatcttgc cagggttaac tggatgggca caaattaacg ggcgtgatac tttgtctgtt + 6001 gagatgaaga cggagttaga tggctactat gttaaacatc tgtctttgat aatggatatt + 6061 agatgtatag ttaagacaat accttacgta ctgaaacgaa aaggtattgt agagggtagt + 6121 ggtaagaaag aaagttaaat tggacaatga aaatactatt tgtttgccaa cattataagc + 6181 
cagaaccatt caggttgtca gatatttgtg aagatttagt tcgaaaaggg catgaagtct + 6241 ctgttttggc tgggattcct aattaccctg aagggaagat atatgcagat tatcgtcata + 6301 ataaaaaaag acgtgagatt atagaaggtg ttacgatata tcgttcttat acaatcccta + 6361 gaaaaaaaag tgttgtattt cgattgttga attattttag ctttgcaatt agttctactt + 6421 taggagtttt attggggagg tataaaacga aagatggatc gaattttgac tgtgtattcg + 6481 ttaaccaatt gtctccagtt atgatggcat gggctggtat ggcttataaa aaaaaatata + 6541 agaaaccgat gtttctatat tgtatggatg tttggccaga tagtttaacc gtaggtggag + 6601 tgaaacaaga tggcttgatt ttcaagctgt ttaaatttat ctcaaaaaaa gtttaccgag + 6661 ctagtgatta tatatttgtc actagtccat catttaaaaa ttattttgtg aagcaatttg + 6721 acatatccga acaaaagatt acatatttgc cacaatatgc agaagatctt tttatccctg + 6781 atgaatctat agttaataaa gaaagtgttg acctaacttt tgctggtaat attggcaaag + 6841 cacaaaattt ggaaactatt ttgaaagctg ccagtttgat agagaagaat accaatttac + 6901 ccaagaaaat tcattttcat tttgttggag atggtacgga attgttaagc atgaaagcat + 6961 tagctcatga attggagtta aagaatattt ccttctatgg aagacgttct ttggaggaaa + 7021 tgccatcctt ctataaaaaa tcagatgcta tgttagtttc tttaatagga gactcgatag + 7081 tttctcgtac tatacctggg aaggtacaat cttatatggc ggcaggcaaa ccaattatag + 7141 gtgcaatttc aggagatgct aaaataattg tagaagaagc aaattgtgga tatgttagtc + 7201 ccgaacgaga tgtaaaacaa ttggcaaaaa atatttgtaa atttagtatg ttatctatta + 7261 agagacaaag agagttagga aagaaagctc gttgttacta tgaaaatcac ttttcaaaag + 7321 agcagtttat gacacagtta gaaaagtatt tgagagagga attttcctca tgaaaatttt + 7381 gatgattaat actgtttgtg gtattaggag tacaggaaga atttgtacgg atatcgcaac + 7441 cgctttaaca aagaagggtc atgaagttaa gattgcatat ggacgtgagt atgttcctac + 7501 acagtatcga aattacgcgg ttaagatagg gtctagagtg gatgtaaata ggcatgtctt + 7561 acaagctcga atttttgata atgctggttt tgtaggtaga gcagcaacta gaaaatttat + 7621 cacttgggtg aaagaatatg atcctgatat tattcatctg cataatttac atggatacta + 7681 tattcatgta ggagagttat tttcctattt gaaaacttgc ggaaagaaaa ttttatggac + 7741 tttacatgat tgttgggctt ttactggaca tggtgcttac tttgatactt tagaatgtga + 7801 aaaaattgga cagtgccatc 
attcgagtca aaaaaatgat tatccaaagt cattaattga + 7861 tttttcatct agaaatttta aacgtaaaaa aaatttgttt acaggtgttc caaacttgac + 7921 acttattaca ccatcagagt ggttggcaaa tttggtaaga aattcatttt tgaaagaata + 7981 tcccgtaaca gtcattcata atggtattga tactacgata tttaaaccaa gggtattaga + 8041 ggctaagaaa ctgagaaaaa aatttcgctt agaaggaaaa caggtattgc ttggtgtggc + 8101 ttctatctgg gatcagcgta aaggattgga tgatctatta gaattatctg tacagctaaa + 8161 atcttatcaa caattagttt tgataggatt atcaaaagaa caattgaata aacttcctaa + 8221 agagattatt ggtctgacca caacagatag tgtagaagaa ctttctgctt ggtacacgtt + 8281 ggcagatgta tttatcaacc caacaacaca ggataattat cctacaacta acttagaagc + 8341 tattgcctgt ggaacaccag ttgtgaccta cccaactggt gggagtatag aaagtacata + 8401 tatgtatggt atagtgtgta gtgatagaac agttgtttct atattagagt ccctaaaaga + 8461 agtgagtcaa tgtaaaagga gtcctaattt taatttgtca aaagagtatt ttgtggaaaa + 8521 tatactcaat ttatactagt ggaactggag ttgatatgat aaaaatttta tatgttaacg + 8581 gcgggactat ggatagaggt ggtgtatcta cttttatgat gaatgtttat gaaaaaatgc + 8641 attctgaaaa aattcaaatt gattttttag tccatacctt atccgaaggt gtacgcgatg + 8701 aggatatttt aaatcttgga ggtaaaatct ttagagttcc tgctagagga aagaatcctc + 8761 taaaaaatta tcgccaaatt aaacaaatta tgttgaatgg aaattatgat gtagttcatg + 8821 cgcatgctga tgcaggaaat aggacaattt tatctattgc aaaagagtgt gatattccta + 8881 ttcgtatttc acattgccat aatacaaact atacaaacaa aagtttatta aagaagtttt + 8941 tgaatgagca attcaagaag caaattccga gatatgctac tcatctatgg gcttgttcag + 9001 aaaaagcagg agagtggttg tatgggaatc actcttttga agttattcct aatgctattg + 9061 atgttcaaaa gttcatctat agtccacaat tatctaaaga tttacgtaag gaattaaatt + 9121 tagaaaataa gtttgttatt ggtcatgtag gacgatttga ttatcagaaa aatcatgatt + 9181 ttcttcttaa agtttttacg gaatttatca atgaaagaga agatgctcat cttgttctca + 9241 taggtaaggg agaattggaa gaggttatta aaaagcaagc aaatcactta ggaatattgg + 9301 ataagattag ttttttaggc gagtcttcta atgtgaatga actgattaat gtgtttgatg + 9361 taggtgtttt cccatctctt tttgaaggtt ttagtatagc tatggtagag atgcaagtca + 9421 acggtttacc attagtggtt tctgataatg ttccaagtga 
gattaattta actgataata + 9481 tacgtttttt atcactggat gaaacagtta aatattggtg taaaacgatt ttggagacca + 9541 aaggacggga tactggggca gttgataaaa ttattgctaa gggttataac ctgtctgata + 9601 tggttcataa gttaacaaaa acttatgaaa gaattgtaga taaatcatga aaaaagtatt + 9661 atttgtaact aatattccat caccttatcg tgtggatttc tataatcaac ttgggaaatt + 9721 tgtagattta actgttgttt ttgaagcaac aggagctcaa gatattagat ttgattaccg + 9781 agagattttt aaaaatttta ccgccatttt tttaagtgaa ggtaatattg atgagaagaa + 9841 attaaattca gctatatttc agtatttaat tcctaaaaaa tatgactata tttttttgac + 9901 taactattct tatcgaacag aattatttgg ttatttaaag tgtgtttttt ctaagatacc + 9961 gtttgtatta gaaattgatg gtggtaagat accagaaagc gagaattttt taaaatacca + 10021 gtttaaaaaa tttattctta cgaaacccta ctattatttt agcccaagtc agtccagtga + 10081 tgatttctta gcgcattatc atgtgaataa agaaaatatt tatcggtatt catttacttc + 10141 cttatcagag aaagacatac gatatcaaat tgtcgatgag aaagaaaaac aatttttaag + 10201 aaagaaactg ggattcagtc caactaagaa aacaatttta tttgttggta gaatcatccc + 10261 tggtaaaggt gtggatgttc taatcaaggc tgttcagaat ttatcagacg atgtacaatg + 10321 tttaattgta ggcccaagtc ccgatagtga atacaaacaa tacttgcttg atcttattgg + 10381 acaagatagc cgttttcatt ttattgattt tttacagaca tctgaactga aacaatacta + 10441 caagctatct gatatatttg ttttaccaac aaagtcggat gtttggggac ttgttgtaaa + 10501 cgaggcaatg tctcagggac ttcctgttat ttctacatct gcatgtgttg ctgcaattga + 10561 gcttgtttcg aatggtaaca atggatatat tattgatagg gttgatgact ggaaagctat + 10621 ttttcaaaag ttaagcaaag tattacagga tgactcgtta cgagttcaat tatctcaaaa + 10681 tgctttatct actattaaac actacactat tgaaacaatg gttaaagagc atttgaaatt + 10741 tatggaggaa aaatgaggat atctgttgcg atgacaacct ataatggagc agattatttg + 10801 ctagagcagc tagaatcgct tcgcactcag agtttaatgg ctgatgaagt tattattgtt + 10861 gatgattgtt caacggataa tacagttgag ctacttgata tgtatattca gaagtatcat + 10921 ctcgataatt gggtattgat tagaaactca tctaatatag gttggagaaa aaactttaga + 10981 aaagctcttc aagagacaac aggagatata gtttttcttt gtgatcaaga tgatatttgg + 11041 aacaaagata aaatttcact gatggtaaaa gagtttcata aatcgccgtc 
aatagaacta + 11101 ttggctagta actatgagat tctcgatttt ggcagaaatg ataaaatcaa gattagggat + 11161 gttgagttag ataatggtgc tgtagttccg ttttcgttaa aaaacaagag tatttctgtt + 11221 atgagaccag gatgtacttt tgcagttaag cgtgagttaa tagttctgtt agaaaagtat + 11281 gatatagata gatttggcca tgataatatt ttatggaatc tagctatgat aagaggaact + 11341 ctatatctat acttaaaacg cttaatacat tttcgtcgcc acgagacaag tgcttctgct + 11401 cctaaccaat ctcttaatcg tgaccggcga gttgttgaag tggatacgag tcatcaaatt + 11461 acagttttct tacttgatgc ggctcgtaga gaacatttag acataaaaat aatttctcag + 11521 cttgaaaata tggaaatggt tcttgagaga cgtagagata ttttaaaata tggtactctt + 11581 atgcaaatag ttcatttcca actgaagtat catacttatt atcctacatt ccgcaattta + 11641 ttatcggata tattagtgtt tttgaaaaaa taatgagaga gaagagtttt gagcaaaatt + 11701 tctaaaaatt atctatataa cttaatttat caagtggtag ttttaatatt gccactattg + 11761 attactccat atgttgctag aatattaggc gcacaccagt taggaattta tgattatgtc + 11821 aattcaatcg ttactttgat ttacacttta ggtttattag gtattggtca ctatggaaat + 11881 cgcgaatgtg cctatactag agatgataaa gaggaactat cagagacatt ttggagtatt + 11941 ttagctattc agattattct aggatttttt tcactgttat tcttgtatat tttttctaac + 12001 ataaattcaa attatcaagt ttactttcag cttttctcta tttggctttt tgggtctatt + 12061 cttgattgta cttggctcta tcgtggctta gaggaaatgc agtatgttgt gttaaaaaat + 12121 attattgcta agttattatt tacgatagcg accttcttat ttgtaaaaag tgaaacagat + 12181 ttaactctat atgtgctcat atatggtctc tctgttttag tagccaattt atcaacttat + 12241 agtcaactaa ggatgtttat tagtagacca aagataaata ttaatcgttt tacggagatt + 12301 attttaggga gtctcaaact atttttacca agtatcatca cgcaaattat gttatctgct + 12361 gataaaattg ttctagggtc tttaagttct ggaatcagca atgtttctta ctatagtaat + 12421 gcagagaaga ttatacagat accactctct ttaatagtag tattaaattc tgttatgatg + 12481 ccccgaatag caaatgaatt tcgtaataga cggttagaaa atatgaaaaa gtatctgaca + 12541 actgcagctg aattttcttt gttcttagct gttccattgt cgattggcct ttatgctatt + 12601 gcagatactt ttgttccgtg gtttttaggc gaaagtttta tgccatctat ggatgctctt + 12661 aaatggcttg ctcctattgc tgttggcaat gctttgctag gagtctcagg 
tagtcagtat + 12721 tttgttgcag ttaataaaac aaaagtctta tttttttcta atactttagc tgcaatttta + 12781 aatattctat tagatttgtt acttgctcca atgtttggag tagtaggggt ttgtttagca + 12841 actatagtat cacttacctc ttctgttata gtgcaatact atataatgtc aaaggatata + 12901 cctattatac ctattttgaa gtcattattt aaatatctca tttattctat gataatggga + 12961 atgattatta ttgtttcatt cagaggatat ccagcaaatt atagaacaac tattaagcaa + 13021 atcgttcttg ggatagtagt ttactttggt ttgaacttgt tgacacgaga tgtatttgtt + 13081 tttcaaacat tagattttgt aaagaaagga ttcaaaaaaa gtagatgatt tcagctttat + 13141 tttatataag ttttttaaca aatctattag tcgttgtcaa taggatgcgt ataaattccc + 13201 tagcattttt atcttggtta attttgtttt ttatctatgc aggaaatatc cgagaaggat + 13261 tttcagattt aattcattat cgtgcaagat atgctgtagg gaaaagtagt ctgtattttt + 13321 cagaccatgc gtataatttt tttgcagatt ggttttcaca tcactccatc tcttttcaag + 13381 tttttttagc atgtattttt ctattctcct cagcatgttt ctattttgtt gctaaaaaat + 13441 tgcattgtaa ttataatctt ctgattttat tattatctct tttttatttc ttttatactt + 13501 tagaagttct aaggttcttt ttagcaacta gtgtagcact tatagcacac tattatcttt + 13561 cacaaaatca tcgattcata ttcataggat tgatgttcat agcgtttctg tttcacggat + 13621 ctatcattta tttcttacca tttattattt tttatagaca aaaaaatact agtaagatgc + 13681 tatgggcatt ggtatttata tctatggtgt taattgtgac aaatctattg gtaggtaata + 13741 attctagcta cttgactaaa atatttgaac tgctagggag cgaggtcact aaaagtcgtg + 13801 ttatgtatta tacagcgaaa tcgactcgtc ttggttttat attgtatgat agttactata + 13861 ttttcaacct actaattagt attaacctta aaaagattgc aaaaacagtt tcaaatgcac + 13921 ctcaggaagt gaccaatttt ataaatctgg tgtatcaaca tagttttttt agtacaattt + 13981 ttttaccact aattatgttt agtacagcat ttactcgcta tttaattttt actgttgttt + 14041 taaattttat agctattgca gctttacaac catttatgca acaatcattt ataaaattaa + 14101 agagtgggct ttatattatt ttcggagttt taggtgctac ttgtttttgg tggtatctaa + 14161 gagaaaatgt cctttatttt tatgaggcac ttttgccaaa tttatttaac tgattttata + 14221 ttctttatgt ctgtactttg caaacattac aagagtggtc tataatataa aaatataaag + 14281 aaatacggta tagctatttc tttagaaagt ggaaatttaa atgattaatt 
acagcgcaga + 14341 tgaattagac atgattcaga agcttgaact caaaatatta aaagaaatta ttcgaatatg + 14401 taaaaaagaa aagatagagt attttttaat tggtggaagt gctcttggag caatacgtca + 14461 tgaaggattt ataccatggg atgacgatat tgatgttggt atgacacgtg agaattatga + 14521 taactttttg agagtagctg aacagtattt aggagaagag ttttatttac aatcaccctc + 14581 ctctgataga aaatcaccct attcttacag taaactaatg ttaaaagaga ctttgttctt + 14641 agagtatgcc caaaggaatt taaaaacaca aagtggtatt tatgtagata tttttccatt + 14701 tgatgaggtt ccagataatg agtcagaaaa tgagagacag tttaaagcgg tacagtttta + 14761 taaaaagtta tatgtgatga ggatgttgcc aactgtttct aaggctcctg agaatttgat + 14821 tcaaggttta aaagctattc taaggagatg cattcattat agtttaagat taatccctaa + 14881 aagtttaata ctcaaaaaaa ttgatcaatt ttctagatta tataatggaa caaatcaatc + 14941 tgcattggct tgtttagatt ttccggtaag aaatgtagag tatgttctaa aaacaacact + 15001 atatccctta attgaacata aatttgaaga aatcacaatt ttattacctg gtgattttca + 15061 tcaatacttg actacacatt atggtgagta catgaagttg ccacctttag aagaacgtgt + 15121 tgggcataga ccatatttga ttgatttagg aacatatgga aaggaagaaa aatgaagaga + 15181 gtgattactt acgggacttt tgatttgctt cattacggtc atatcaattt attgaagcgt + 15241 gctaaagatt tgggagatta tttaatagta gctctatcta ctgatgaatt taatcttcaa + 15301 aaagataaga tttcatattt caattatcaa cagcgtaaaa ttttgcttga atctattcgt + 15361 tatgtagatc tggtaattcc tgagatttca tgggaacaaa aacgagaaga tgtaaagaaa + 15421 tattatgctg atatctttgt tattggtgat gattgggaag gtaagtttga ttttttgaaa + 15481 gatgaggggg tagaagtagt atatttacct cgtactaaag aaatttctac tacacagata + 15541 aaagaagact taaacaagac caaaggtgga aaataatatg tcacaattta caggaaaaac + 15601 tcttctaatt acaggaggga caggttcatt tgggaatgcg gttctcaagc gttttttaga + 15661 aacagatatc tcagagattc gtatcttttc gcgagatgaa aagaaacaag atgatatgcg + 15721 tcatgagttt caggtaaaag taccagaagt ggctgggaaa atccgttttt acctcggaga + 15781 tgtgcgtgac ttagcttcgg taaaaaatgc tatgcatggt gtggattatg tttttcatgc + 15841 tgctgctctg aaacaggtac cttcttgtga atttttccct gtagaagcgg taaaaactaa + 15901 cattttggga acggagaatg ttctcgctgc agctatcgaa gctgatgtaa 
agcaagttat + 15961 ctgtctttct acagataagg cggcttatcc tgttaatgct atgggaacgt ccaaggctat + 16021 gatggaaaag attgctgttg ctaagtcccg ggcggtaaat cctgagcata caaagatatg + 16081 tgtgactcgc tatgggaatg ttctatgtag ccgaggatct gtagttcctc tttggattga + 16141 gcaaattaag caaggaaatg ctcttacaat tactgaacct agcatgacac gttttgtgat + 16201 gacattggaa gaagcagtag atttagtttt atttgcattt gaagaaggga aatctggcga + 16261 tatactagtt cagaaagcac cagcatgtac gattgaagtt ttggctaagg ctgtatcaga + 16321 aatttttgcc tcagaacaag atattaagat tataggtatt agacacggag aaaaaatgta + 16381 tgaaacacta ctaactaatg aagagtgtgc aaatgcaatt gatttgggta atttttatag + 16441 agttcctagt gataatcgta atcttaacta tgataagtat ttcaaagatg gtagtacgaa + 16501 tagaaatttg ttgacagaat tcaatagtaa taataccgat ttgatggatg tagagcaagt + 16561 taaaagaaag ttgctagaat tagatgaaat acagacagca attcgtgata tggtagcaga + 16621 tgaagagatg taaaatcttt taagttacat taaaattatc aagtatatat aatgtatcat + 16681 gtattgtcga gagagttgat tattaaaaca gcatataaaa caaggagggg gcatgattaa + 16741 aaatatttta atcacaggag caaaaggatt tgtaggaaaa aatcttatct gtactctgga + 16801 agctttgaaa gatggacgag ataggactcg tcctaattta gagattggag agatttttca + 16861 gtatgatcgt gatacagatc cgattttatt agatgaatat tgtaagaagg ccgatttcgt + 16921 attccattta gctggtgtca atcgtccaca gaatcctgat gaattcatgg agggaaatta + 16981 cggtttttca agtagattat tggagatttt agaaaagtat gaaaacactt gtcctgttct + 17041 actctcaagt tctactcaag ctagtttaga aggccgattt tcaaactcta tatatggaca + 17101 atctaagcta gcaggggaag aactcttctt tgaatatgga aagaaaacgg gagcacctgt + 17161 cttagtttac cgtttcccga atctttatgg gaagtggtgc cgtcctaact acaattctgc + 17221 tgtagcaact ttctgtcata atctagctca cgatttacct attcaagtaa atgatccaag + 17281 tgtagaattg gagttgctgt atattgatga tttgatacaa gagtgtctaa ctgcattgga + 17341 aggaaatcct catcgttgta atctagatgg attacaaatc ttacctagcc cgtcaggaaa + 17401 ctactgctac gtaccaacga ctcatcgtgc aaccttagga gagattgtct ctctattaga + 17461 aacatttaaa aaacagcctg atagtttagt tatgcctgaa attcctcaag gatcgtttaa + 17521 aaagaaattg tattctacct acctatctta tttaccagta gataagttta 
agtttcctct + 17581 aaaaatgaat atagatgaac gaggtagttt tacggaatta ttaaaaacag aaaatacggg + 17641 tcaattttct gttaatattt ctaaacctgg cattaccaaa gggcaacatt ggcatcattc + 17701 taagtgggaa tttttcatgg ttgtttctgg tcgtgcttta atacaagagc gtaggatagg + 17761 gctggataaa aatggtcaag agtatcctat tctgaacttt gaagtgtcgg gcgataagat + 17821 tgaagcaata catatgatac cgggctatgc acataatatt attaatcttt ctgatacaga + 17881 aaatctagtt actgtcatgt gggctaatga gtcatttgat cctagacatc cagatacttt + 17941 ttttgaacaa gtggagaaat aaatgaaaat taagacaaat tatagtgata ttcactttaa + 18001 agataatggc aaacttaagt tattgattat tgtgggaaca cgtccagaga ttatacgtct + 18061 aagtagtgtt atcactaaat gtcgaaagta ttttgatgtt attttggcac atactggaca + 18121 aaactatgat tacaatttaa atggtatttt ctttgatgat ttagggttag acactccgga + 18181 cgtatacatg gatgctgttg gagatgatct tggtgctact gtagggaata ttattaatac + 18241 ttcatacaaa ttgatgaatc aaattaaacc agatgcttta ttgattttag gggatacaaa + 18301 ttcttgttta tcagctattg ctgccaagcg tttacatatt ccaatttttc atatggaggc + 18361 tggcaatcgc tgtaaggatg agtgcctgcc ggaagagact aatcgtcgga ttgttgatat + 18421 tatttcagat gttaacttag catactctga acatgcacgt aagtatttac atgagtgtgg + 18481 tttacctaaa gagcgcacat atgtaactgg ttctcctatg gcagaagtgt tacataaaaa + 18541 tttatctgcc attgagtctt cagatatcca tgaacgtttg ggattgaaaa aaggaggtta + 18601 tatcttactt tcagctcacc gtgaggaaaa tattgataca gataaaaatt ttatctctct + 18661 ctttacggca attaatcaat tagctgaaaa atataatatg ccaatcttat attcttgcca + 18721 tcctagatca aagaaaaggc tacaagagag cggttttaaa ctagataaac gtgtgattca + 18781 gcatgagcca ctaggattcc atgactataa ttgtttacag atgaatgcat ttgttgtagt + 18841 atctgattcg ggaactttac cggaagaaag tagtttcttt actagtcaag gttatccttt + 18901 tcccactgta tgtattcgta caagtacaga acgtcctgag tccttagata aggcaggatt + 18961 tattttggca ggcattgatg aaaattctct tcttcaagca gttgaaactg ctgttagctt + 19021 ggcagaagat gaggattttg gattaccggt tccagattat gttgaggaaa atgtctctac + 19081 taaagttgtt aagataatac agagctatac agggatagtg gataaaatag tttggcggaa + 19141 aagctgaatt gtatattttt aataaatcaa aatgagatga ttaattctta 
gtagaacaag + 19201 agtaaaattg aacgtatttg atggaaatgt cttacttgat attcgaggga tagccattct + 19261 atcggatttt tggcttgttt ttgcgcttca tatttgatag aataaagtga cgacacttta + 19321 accatcgaag cgaggtgaga ataatggcag taatttttaa agatgtactt attgaagaga + 19381 agactgaaga agaaaaacaa catattttat ctattttaaa tggtgagtat aacttatctg + 19441 atgatgtaag tcgtagatta agacgactga atgaggaaag taaacgcttg aaagtgttta + 19501 gtaaggagac gcactaattg cctgtcttgt attttattga tgaattgaaa ttaatcagta + 19561 cttcatcatc tattttaaat gatgggaatg ttagaacttt tgattgtgga tatcaagaat + 19621 tgaatgacat ttttttagat atttacaaca aatacaatga agaatcaggc tatgtattgg + 19681 ctattgtaat actcatctgt tttcaaaaag cattctagtc catctccgat taacgatgaa + 19741 ctttatcacc tccttctcca atccttgtat gacatcttga agttgattca tgacatcttc + 19801 cacagtttga aagactttat tcttaaatcc acgtttacga atctctttcc acacttgttc + 19861 aatgggttca tctctggtgt gtatggagga gtaaatgcaa agccaatatt agtcggaatc + 19921 tttaaggtac ttgatttatg ccatatagca ttgtccataa cgagtaaaaa ataatcatat + 19981 ggataagctt gtgaaagctc ttctaaaaag gcgttcatcc actcagtatt acatccacca + 20041 gctattaaga aaaatgattc gcctgtatgg gcatcaacag ctccataaca atagcgaaat + 20101 tctcgtatat agtgactatg gacatgtgga cctactccta ttggagacca acaagatccc + 20161 agtttactga ttctaccgaa accagcctca tcttggtaca tcaagcgaac cttatgaaaa + 20221 cgtctactgg ttttaaaacg ctttcttgtc ttcttgaatt gagattttat ttttagacgc + 20281 gacaatggtt tgagcgtctg ctttcttagg atgttctgga cgtggcataa tatttcgcca + 20341 accatggcgc ttcaacagtt gatagaaggc attacgtgtg taggaacgac ctaactcctt + 20401 tttataagcc tgaaataagg catcaattgt aacaaattct cctgcctctg cagccttcaa + 20461 atggcgagca agaaaggctt tctcttcctc aatcgtcata tatgcatggt tacgaccacc + 20521 acgtgttttt tgaaggagag aatcgagtcc gaactcgtca tattttttta cagttcgcca + 20581 aatcattgtt tgattacagt ctaaaagctc tataatctct ttataagatt tgcccatcag + 20641 acgaaataga acgatttgaa ggcgtttatg atatttagct gtacgagagt cttttaaaag + 20701 tgttttgatg gtttggattt cttctttagt tgatttcata ttactattat acaatgcttt + 20761 tttattttga tctagtataa atcaaaattt tgaattatta ggttttattt 
cttgtagact + 20821 agtgtcattt tctcttctag ctcagggtaa agagatggga attagcatag attatcttgg + 20881 tgttcacaag gatatccaga aaaagaggat aggttcgctt ttggtgacct ttgcacttcg + 20941 attatcttta actattgact gttggttacc aataaaaggt gttagagttc atgctttaga + 21001 ggatgctgtg gaattctatg aaaaactggg ttttattgtt cctagagata tggtgattaa + 21061 taatagcaaa ccggttacta tgtattttag tagacttcct gcgaaacaaa atatggtata + 21121 gtagttctat gaatgatgaa gcaagtaaac aactaactga tgcatgattt aagcgtcttg + 21181 ttggtgttca gcgtaccact tttgaagaga tgttagctgg attaaaaaca gcttatcaac + 21241 ttaaacacgc aaaaggtgga cgaaaaccta aattaagcct agaagacctt cttatggcca + 21301 ctcttcaata tgtgcgagaa taccgcactt atgaagaaat tgcggctgac tttggtatcc + 21361 acgaaagcaa cttaatccgt cgaagccaat gggttgaagt aactcttgtt caaagtagtt + 21421 ttacgatttc aagaactcct ctcagttctg aggacacgat aatgattgat gcgacggaag + 21481 taaaaatcaa tcgccctaaa aaaagaatta gcgaatgatt ctggtaaaaa gaaatgccac + 21541 gctatgaagg ctcaagcgat tgtcacaagt caagggagaa ttgtttcttt ggatatcact + 21601 gtgaactatt gtcatgatat gaagttgttc aaaatgagtc gcagaaatat cggacaagct + 21661 ggtaaaatct tggctgacag tggttatcaa gggctcatga agatatatcc tcaagcacaa + 21721 actccacgta aatccagcaa actcaagccg ctaacagttg aagataaagc ctgtaaccat + 21781 gcgctatcca aggagagaag caaggttgag aacatctttg ccaaagtaaa aacgtttaaa + 21841 atgttttcaa caacctatcg aaatcatcgt aaacgcttcg gattacgaat gaatttgatt + 21901 gctggtatta tcaatcatga actaggattc tagttttgca ggaagtctag tattgaaaac + 21961 ctaagaaatg gtggaattat gcctcttaca cagttatttg aaacaccctt aggaaatgat + 22021 ttttaattgt atgcaaacaa agtagaattt gcttatttca ttttatgcta aatataatat + 22081 gaaataagtg aatttttata gataaagaag agtttttcta tgtttttaga taataatttg + 22141 aaaaactgtg acgattattt tgcttttaga gcagtataca attaatagga attgaatcta + 22201 aaacaacaaa gaaaggtacc ctactatgaa aggtattatt ctagcaggtg gttcggggac + 22261 acgtttatat cctttgactc gggctgcatc aaaacaactt atgccggttt atgataaacc + 22321 gatgatttac tatccacttt caacattgat gttggctggg attagggata ttttgataat + 22381 ctcaactcct caagatttgc ctcgttttaa agagcttctt caagacggat 
ctgagtttgg + 22441 gattaaactt tcttatgcag agcaaccaag tccagatggt ttggcacaag cctttatcat + 22501 tggggaagag tttattggtg atgatagtgt tgctttgatc ttgggggaca atatctatca + 22561 cggccctggt ttgagcaaaa tgcttcaaaa agcagccaag aaagagaaag gtgcgactgt + 22621 ttttggctac caagtgaagg atccagagcg ttttggtgtg gttgagtttg atacagacat + 22681 gaatgctatc tccatcgaag aaaagccaga ataccctcgt tcaaactatg cagtgacagg + 22741 actctatttc tatgataatg atgttgtcga aattgccaag agtatcaaac caagtcctcg + 22801 cggagaatta gaaatcacag atgtcaacaa ggcttacttg gatcgtggag acttatccgt + 22861 tgagcttatg ggacgtggct ttgcttggct ggatactgga actcatgaaa gtttactaga + 22921 ggcttcacag tacatcgaaa cagtgcaacg gatgcaaaat gttcaggtag caaacttaga + 22981 agaaattgct taccgtatgg gctatatcag tcgagaagat gtattggctt tagcccaacc + 23041 acttaagaaa aatgaatacg gacagtatct gctccgtttg attggagaag catagatgac + 23101 agataatttt ttcggtaaga cgcttgcggc acgcaaggtt gaagctattc caggcatgtt + 23161 ggagtttgat atccccgttc atggagataa tcgtggctgg tttaaagaaa atttccaaaa + 23221 ggaaaaaatg cttccacttg gatttccaga gtctttcttt gcagaaggaa aattgcaaaa + 23281 caatgtatcc ttctcacgta aaaatgtcct tcgaggcctc cacgcagagc cttgggataa + 23341 gtacatctct gtagcagatg gagggaaagt tctgggttct tgggttgatc tacgcgaggg + 23401 tgaaaccttt gggaatacct atcagacagt gattgatgcg agtaagggaa tctttgttcc + 23461 tcgaggcgta gctaatggct tccaagtttt atcagataca gtgtcatata gctatctggt + 23521 caatgattac tgggctcttg aactcaaacc caagtatgcc tttgtgaact acgctgatcc + 23581 aagccttggt attgaatggg aaaatattgc agaagcagag gtttcagaag cagataaaaa + 23641 tcatccacta cttaaggatg taaaaccttt gaaaaaagaa gatttgtaaa aaggaaagaa + 23701 tatgactgaa tacaaaaata ttatcgtgac aggtggagct ggctttatcg gttctaactt + 23761 tgtccattat gtttacgaga actttccaga tgttcatgtg acagtcctag ataagttgac + 23821 ttatgctgga aaccgcgcga atattgagga aattttaggt aatcgtgttg agttagttgt + 23881 tggtgacatt gctgatgcgg agttggtaga caagttggtt gctcaagcag atgctatcgt + 23941 tcattatgca gcggaaagcc acaatgataa ttcgctcaat gatccatcgc catttattca + 24001 tactaacttc atcggaacct atactctttt agaagctgct cgtaagtatg 
atattcgctt + 24061 ccaccatgta tcgacagatg aagtttatgg ggatctccct ttacgcgaag atttgccagg + 24121 tcatggtgaa ggaccaggtg agaaatttac tgctgaaaca aaatacaacc caagctctcc + 24181 gtactcatca accaaggcag cctcagattt gattgtcaaa gcctgggtgc gttcttttgg + 24241 agtcaaggca acgatttcca actgttcaaa taactacggt ccttatcaac atattgagaa + 24301 gtttattcca cgacaaatca ccaatatctt gagcggtatc aagccaaaac tttacggtga + 24361 aggtaagaac gttcgtgact ggattcatac caatgaccat tcttcaggag tttggacaat + 24421 cttgacaaaa gggcaaatcg gtgaaaccta cttgattggg gctgatggtg agaagaacaa + 24481 taaggaagtt ttggaactta tccttaagga aatgggacaa gctgtggatg cctatgatca + 24541 tgtgactgac cgtgcaggac atgaccttcg ctatgcgatt gatgctagca agctccgtga + 24601 tgagttgggg tggaaacctg aatttaccaa ctttgaagct gggctcaagg caacaatcaa + 24661 gtggtataca gataaccaag aatggtggaa agcagaaaaa gaagctgttg aagccaatta + 24721 tgctaagact caggagatta ttacagtata aaaagcagga aatagctgct ttttattgct + 24781 atattgggaa gagttacata ttagaaaggt ctagagatga ttttaattac aggggcaaat + 24841 ggccaattag gaacggaact tcgctattta ttggatgaac gtaatgaaga atacgtggca + 24901 gtagatgtgg ctgagatgga cattaccgat gcagaaatgg ttgagaaagt ttttgaagag + 24961 gtgaaaccga ctttagtcta ccactgtgca gcctacaccg ctgttgatgc agcagaggat + 25021 gaaggaagag agttggactt cgccatcaat gtgacgggga caaaaaatgt cgcaaaagca + 25081 tctgaaaagc atggtgcaac tctagtttat atttctacgg actatgtctt tgatggtaag + 25141 aaaccagttg gacaagagtg ggaagttgat gaccgaccag atccacagac agaatatggc + 25201 cgtactaagc gtatggggga agagttagtt gagaagcatg tgtctaattt ctatattatc + 25261 cgtactgcct gggtatttgg aaattatggc aaaaacttcg tttttaccat gcaaaatctt + 25321 gcgaaaactc ataagacttt aacagttgta aatgaccagt acggtcgtcc gacttggact + 25381 cgtaccttgg ctgagttcat gacctaccta gctgaaaatc gtaaggaatt tggttattat + 25441 catttgtcaa atgatgcgac agaagacaca acatggtatg attttgcagt tgaaattttg + 25501 aaagatacag atgtcgaagt caagccagta gattccagtc aatttccagc caaagctaaa + 25561 cgtccgctaa actcaacgat gagcctggcc aaagccaaag ctactggatt tgttattcca + 25621 acttggcaag atgcattgca agaattttac aaacaagaag tgagataagt 
agtagaatga + 25681 ttttctagtc taataaaaga ggcagataat gaactccaaa ggagcttaag atgtacgatt + 25741 atcttgttgt tggtgctggt ctctttggcg catagctttg gctcagtttc tattatcgct + 25801 cacaccatcc atcagaagtt taatctgaag gtacccaatt atcgccaaga agaagattgg + 25861 gctaggatgg gtttaccaat cacacgtaag gaaatctcta attggcatat caaggcaagt + 25921 caatactatt tagagtccct ttataacctt ttacgagaaa agttgttaga acaacctctt + 25981 cttcatgcgg atgaaacctc ttatcgggtt ctagagagtg atagccatct gacctactat + 26041 tggacctttt tgtctgggaa agctgagaat caagcaatca cgctgtacca tcatgatcag + 26101 agtcggagtg gttcggtagt acaagaattc ctaggagatt attctggcta tgttcattgt + 26161 gatatgttgc ggcagtaact taggacttta gtcctctagt tctgcctatg cgatagcagt + 26221 ccaaggttta ggagcaaggc gacgctaagc ttggtaaact gcgaaccgct agaagcttat + 26281 cgtcaactgg aagaagctgc acttgttgga tgttgggcac atgtgagaag gaagtttttt + 26341 gaagcgaccc ccaagcaagc ggataaatca tcgttaggag ctaaaggttt agcttattgt + 26401 aatcagttat tttccttgga aagagactgg gaggctttgc cagctgatga acgactacag + 26461 aaacgtcaag aagagctcca acctaatgga agacttcttt gcttggtgcc ggcgtcagtc + 26521 agttttatcg ggttcaaaac taggaagggc aattgaatac agcctcaagt atgaagaaac + 26581 ctttaagact attttgaaag acggacatct ggtcctttcc aataatctag ctgaacgcgc + 26641 cattaaatca ttggttatgg gacggagtaa aagagtccag tggactcttt tagcctaagc + 26701 taaattttaa aaagcgaggg tggttatttt ctcaaagttt tgaaggagct aaagcaagaa + 26761 ctattattat gagtttgttg gaaacagcta aacgtcatca attaaatagc gagaaatatc + 26821 tattctatct tctagaatgt cttccaaacg aggaaactct cgtaaacaaa gaggttttag + 26881 aggcttattt accatggact aaagttgtac aagaaaaatg caaataagaa atctccagat + 26941 taggaactat ccgtgagttc tctagtctgg agatttttcg gctctttgtc aactgtagtg + 27001 ggttgaaaaa aagctaagct cgagaaagga caaattttgt cctttctttt tttagaaata + 27061 gtattaaaaa ttccttgact atgtgatata gttgagggat ttttaaatga tattcatatt + 27121 ttttgcaaag atgttgtttg aaaaataatt ttcaaaaatt ctgaaaattc tgttgacaac + 27181 tttctgaaaa gagtctataa tggagagaaa gttttaaagg agaaaatgat gaaaagttca + 27241 aaactatttg cccttgcggg cgtgacatta ttggcggcga ctactttagc 
tgcatgctct + 27301 ggatcaggtt caagttcaag cactaaaggt gagaagacat tctcatacat ttatgagaca + 27361 gaccctgata acctcaacta tttgacaact gctaaggctg cgacagcaaa tattaccagt + 27421 aacgtggttg atggtttgct agaaaatgat cgctacggga actttgtgcc gtctatggct + 27481 gaggattggt ctgtatccaa ggatggattg acttacactt atactatccg taaggatgca + 27541 aaatggtata cttctgaagg tgaagaatac gcggcagtca aagctcaaga c +// + diff --git a/public/res/serotype_genbank/serotype_46.gb b/public/res/serotype_genbank/serotype_46.gb new file mode 100644 index 0000000..f370334 --- /dev/null +++ b/public/res/serotype_genbank/serotype_46.gb @@ -0,0 +1,1131 @@ +LOCUS CR931719 25070 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain Eddy nr. 73 (serotype 46). +ACCESSION CR931719 +VERSION CR931719.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 25070) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 25070) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..25070 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="Eddy nr. 73" + /db_xref="taxon:1313" + gene <1..163 + /gene="dexB" + /locus_tag="SCP46_0001" + CDS <1..163 + /gene="dexB" + /locus_tag="SCP46_0001" + /codon_start=2 + /transl_table=11 + /protein_id="CAI34602.1" + /db_xref="GOA:Q4K2R1" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K2R1" + /translation="DRRFLVVANLSNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVP + WDAFCVELL" + gene 322..490 + /gene="aliB" + /locus_tag="SCP46_0002" + /pseudo + CDS 322..490 + /gene="aliB" + /locus_tag="SCP46_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(order(488..808,810..1013)) + /gene="tnp" + /locus_tag="SCP46_0003" + /pseudo + CDS complement(join(488..808,810..1013)) + /gene="tnp" + /locus_tag="SCP46_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase (fragment)" + gene 1227..2681 + /gene="wzg" + /locus_tag="SCP46_0004" + CDS 1227..2681 + /gene="wzg" + /locus_tag="SCP46_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI34605.1" + /db_xref="GOA:Q4JYN0" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4JYN0" + /translation="MLIMSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNI + FAFRYLNLVVTVLVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGL + TNRLNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNT + DLTVNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKV + EAPKTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPI + ADGGNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVH + NDQEFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKL + TSTEALKNYSTIIDSLQNSIQTNMPLETMINLVNAQLESGGSYKVNSQDLKGTGRMDL + PSYAMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 
1227..1364 + /gene="wzg" + /locus_tag="SCP46_0004" + /note="Signal peptide predicted for SPC1997 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 46 and 47" + misc_feature 1440..1787 + /gene="wzg" + /locus_tag="SCP46_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 2.3e-64" + misc_feature 1965..2408 + /gene="wzg" + /locus_tag="SCP46_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 5.7e-70" + gene 2683..3414 + /gene="wzh" + /locus_tag="SCP46_0005" + CDS 2683..3414 + /gene="wzh" + /locus_tag="SCP46_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34606.1" + /db_xref="GOA:Q4JYM9" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4JYM9" + /translation="MIDIHSHIVFDVDDGPKSREESKALLVEAYRQGVRTIVSTSHRR + KGMFETPEEKIEENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKSKLFGERYKFMKKRAQYFLEQDLVHAIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 2686..3294 + /gene="wzh" + /locus_tag="SCP46_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 7.8e-36" + gene 3420..4115 + /gene="wzd" + /locus_tag="SCP46_0006" + CDS 3420..4115 + /gene="wzd" + /locus_tag="SCP46_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34607.1" + /db_xref="GOA:Q4JYM8" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4JYM8" + /translation="MMKEQNTIEIDVFQLFKTLWKRKLMILLVALVTGAGAFAYSAFI + VKPEYTSTTRIYVVNRDQGDKSGLTNQDLQAGTYLVKDYREIILSQNVLEKVATNLKL + DIPAKTLARKVQVTVPVDTRIVSISVKDKQPEEASRIANSLREVAAEKIIAVTRVSDV + TTLEEARPATTPSSPNVRLNSLFGFFGGAVVTVIAVLLIELFDIRVKRPEDVEDVLQI + 
PLLGVVPDLNKMK" + misc_feature 3420..3536 + /gene="wzd" + /locus_tag="SCP46_0006" + /note="Signal peptide predicted for SPC1999 by SignalP 2.0 + HMM (Signal peptide probability 0.729) with cleavage site + probability 0.460 between residues 39 and 40" + misc_feature 3441..3857 + /gene="wzd" + /locus_tag="SCP46_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 1.5e-54" + misc_feature 3963..4040 + /gene="wzd" + /locus_tag="SCP46_0006" + /note="PS00217 Sugar transport proteins signature 2." + gene 4125..4799 + /gene="wze" + /locus_tag="SCP46_0007" + CDS 4125..4799 + /gene="wze" + /locus_tag="SCP46_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34608.1" + /db_xref="GOA:Q4K1Y2" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K1Y2" + /translation="MPTLEISQAKLDFVKKAEENYNALCTNLQLSGDDLKVFSITSVK + QGEGKSTTSTNIAWAFARAGYKTLLIDGDIRNSVMLGVFKARDKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVI + DAAIITQKCDASILVTKAGEINRRDIQKAKEQLEHTGKPFLGVVLNKFDTSVDKYGSY + GNYGKK" + gene order(5073..5498,5510..5887) + /gene="tnp" + /locus_tag="SCP46_0008" + /pseudo + CDS join(5073..5498,5510..5887) + /gene="tnp" + /locus_tag="SCP46_0008" + /note="member of homology group 148" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1381 transposase" + misc_feature order(5406..5498,5510..5878) + /gene="tnp" + /locus_tag="SCP46_0008" + /note="HMMPfam hit to PF01609, Transposase DDE domain, + score 1.1e-10" + /pseudo + gene 6019..6618 + /gene="wciI" + /locus_tag="SCP46_0009" + CDS 6019..6618 + /gene="wciI" + /locus_tag="SCP46_0009" + /note="member of homology group 29" + /codon_start=1 + /transl_table=11 + /product="putative initial sugar transferase" + /protein_id="CAI34610.1" + /db_xref="GOA:Q4JYM6" + /db_xref="InterPro:IPR003362" + /db_xref="UniProtKB/TrEMBL:Q4JYM6" + 
/translation="MYREIKRLGDILLSFIGIIVLFPVFIIIAIAIKLDSKGPVIFKQ + KRFGLHKKSFYVLKFRTMKVESPKYVATRDLDKPEQWITKVGACLRKTSLDELPQLWN + ILVGDMSVVGPRPVAINELDLIKEREQYGANDILPGLTGWAQINGRDNLSTEMKAEID + GYYVKHMSLRMDLRCILRTIPYVLKRKGIVEGSGKKELE" + misc_feature 6019..6111 + /gene="wciI" + /locus_tag="SCP46_0009" + /note="Signal peptide predicted for SPC2003 by SignalP 2.0 + HMM (Signal peptide probability 0.855) with cleavage site + probability 0.449 between residues 31 and 32" + misc_feature 6034..6588 + /gene="wciI" + /locus_tag="SCP46_0009" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 1.4e-36" + gene 6584..7849 + /gene="wciJ" + /locus_tag="SCP46_0010" + CDS 6584..7849 + /gene="wciJ" + /locus_tag="SCP46_0010" + /note="member of homology group 35" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34611.1" + /db_xref="GOA:Q4JYM5" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4JYM5" + /translation="MWRVVVRKSWSDAMKILFVCQHYKPEPFRLSDICEDLVQRGHEV + AVLTGIPNYPEGEIYADYRKRKKRRETINGVAIFRSYTIARRQNTLYRILNYFSFALS + STIGVIFGRYKAKDGSDFDCVFVNQLSPVMMAWAGIAYKNKYNKPMFLYCMDVWPDSL + IVGGVKENGLIYKIFEFVSKKVYQASDYIFVTSLSFKDYFVKKFNIPLHKITYLPQYA + EDLFVPNELKTNKNTIDLTFAGNIGKAQNLETILKAASAIEQIPDLAKRVHFHFVGDG + TELLNMQKLACELELENTSFYGRRPLEEMPDFYTKSDAMLVSLIGDSIISRTLPGKVQ + SYMAAGKPIIGAISGDTQRVVKEAKCGFISPEGNVDQLVRNIRKFCLLSVEEREKLGR + QARCCYEEQFSKEWFMTYLENHLKEGFLS" + misc_feature 7241..7774 + /gene="wciJ" + /locus_tag="SCP46_0010" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 1.7e-14" + gene 7798..9015 + /gene="wcxB" + /locus_tag="SCP46_0011" + CDS 7798..9015 + /gene="wcxB" + /locus_tag="SCP46_0011" + /note="member of homology group 55" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34612.1" + /db_xref="GOA:Q4JYM4" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4JYM4" + /translation="MVYDILRKSFKRGVSIMKVLMINSVCGIRSTGRICTDLATALTE + 
EGYEVKIAYGREYVPKQFQQYAVKIGTKSDIRFHAIRSRLFDESGFGSRQATVNFIKW + IKEFDPDVIHLHNLHGYYINIELLFDYLRICGKKIIWTLHDCWAFTGHSAHFDCLECE + SKGVCDHPSQKNDYPKSFVNFSRRNYQRKKKCFTHIPNLTIVTPSQWLANLVGQSFLK + EYPVKVIHNGIDTTVFQPRLIAAQKLKKRYHLEGKQVLLGVAAIWTDKKGFSDMLVLA + SHLADNQRIVLIGLKDRQLKKLPKGIIGLTETNSPEELAAWYTLADVFLNPTYQDSYP + TTNLEAISCGTPVISYPTGGSVESAKLYGLVCQDRNVASILSSLEKVSQLSKTEKLDF + SIASFIKQMKYLY" + misc_feature 8518..9000 + /gene="wcxB" + /locus_tag="SCP46_0011" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 3.6e-12" + gene 9053..10264 + /gene="wzy" + /locus_tag="SCP46_0012" + CDS 9053..10264 + /gene="wzy" + /locus_tag="SCP46_0012" + /note="member of homology group 71" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI34613.1" + /db_xref="InterPro:IPR007016" + /db_xref="UniProtKB/TrEMBL:Q4JYM3" + /translation="MMKRIYYHLLAILAWTLPNSYAFIDSLKVFFPNISLQIAGSLLA + VISIGIFITRIYYTGYEVFISLLVCIFILIFYSTRFFYSTNVELYHSFFNSFLIRPVP + GILVAMLLAKNNHIKGFIKWSEPMMLFYTLTSFLAALSPRNSIIIYQSLSYYAMTAYM + INVFNIIYKEKILEEQLTYFRFSAWNFIRYFLLLIQAFNALSGGGRGAFILLIIFTGI + LLIRIAMNFKFLFSFIGGLSAIALVVFCIKDLDFTWLLNMDGGERLLNFFGRPERIST + DNRLLIYDTVWSAIQEKPFLGWGVGSTFLKFNGYSHNIVLDLLHDMGSFGLLIILSAF + FASSVILYKLRKIDWKVNLFILMFLEVYVHMSFSGSYLADGRLWFLVIFTYCYYRWKV + QEKDEVSNFII" + misc_feature 9869..10036 + /gene="wzy" + /locus_tag="SCP46_0012" + /note="HMMPfam hit to PF04932, O-Antigen Polymerase, score + 1.1e-08" + gene 10239..11315 + /gene="wcxD" + /locus_tag="SCP46_0013" + CDS 10239..11315 + /gene="wcxD" + /locus_tag="SCP46_0013" + /note="member of homology group 72" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34614.1" + /db_xref="GOA:Q4JYM2" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4JYM2" + /translation="MKLAILLSDISKIGGVQRVTTALVNELCQNIDVTIISIFSENEL + PAFGLSDRVQVSYLLKEHVNLKKNFFKVSGALRKVLKKQQFDVVLSSGTGLVSFLWFA + SLGIPTRLLAWEHQCFYFGRSFGLEWLGRKLACRFAESIVVLTKKDEGFYKENRPKAH + 
IEQIYNILDMDSQTAKCQLSSKKIISVGSLGRQKGFDLALEVASQIQLSYPDWQWDIY + GDGPDREKLEEKVREYQLEGFINLKGLVQNVRELYPDYSIYAMTSRHEGLPTVLLEAK + NCQMPVISFDCNCGPSDIISDGRNGFLIDCFDVNIYAKTLSKLMTSLELREQVAKSSV + IPAEELSTTYILDKWNNLLKIERR" + misc_feature 10740..11246 + /gene="wcxD" + /locus_tag="SCP46_0013" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 2.8e-33" + gene 11317..12495 + /gene="wcxE" + /locus_tag="SCP46_0014" + CDS 11317..12495 + /gene="wcxE" + /locus_tag="SCP46_0014" + /note="member of homology group 73" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34615.1" + /db_xref="GOA:Q4JYM1" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4JYM1" + /translation="MKIVHVEDFFHPDAGYQINVLPKYLAKFGHEQVIITSEMDKIPD + NLTQFFGRENIEERDRSYEEKHHVKIIRLPLHGFVSGRAIFSGKLISAIKGLSPEVLY + IHGNDTLTGIRLLLARKKLNCRIATDSHMLEMASRNPFNNYFRRFYKTLITPILIKEQ + IPIIRTQDDNYVEKHLGIPLSQAPWISYGSDTAFFHADSQIKEDFRSQYQIPSDALIC + VYAGKLDEHKGGMFLAESLSKKLNTEQPIVFIIVGNTNGEYGEAVEKSFSQSENQILR + FPTQKYQKLAQFFQVADFALFPKQCSLSFYDAQACGLPVLLEDNNINLDRTSHYNGWT + FKANSKLSLRDSLKMIASLDKEKRQEYSQNALHYILEHYNYEDKAREYEKILIGERTK + " + misc_feature 11920..12420 + /gene="wcxE" + /locus_tag="SCP46_0014" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 9.8e-05" + gene 12528..13724 + /gene="wcxF" + /locus_tag="SCP46_0015" + CDS 12528..13724 + /gene="wcxF" + /locus_tag="SCP46_0015" + /note="member of homology group 74" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34616.1" + /db_xref="GOA:Q4JYM0" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4JYM0" + /translation="MDLMKICIVSVGVSGLPIPAVKGGAVENLIDNYLSYNEKYNHDE + ITVVSCDHKEAREASKKYKYAQFVYIDIHSLKYKINKTIRYTINKYSPFFVGNAYISQ + LPDLSGFDTVLIENRPEYGYYIRKKFKGNLVLHLHNDLLMDNEYSVDYSVYDKIITVS + DYIRNRSEVVTSGVPIQTVYNGIDTELFLQNFSEVDLSDLKNQLEILSDDFVIVFFGR + INKNKGIKELLEAFLLLPKNLNIKLLAVGSSIFGQTELDTFTTELRQLAKQASDKVVF + 
TGYVNYKDIPKYHHIADCIVIPSIWEEPASLTVCEALISGKYVITTDTGGTPELVAGS + DALVVANDECIVEHLKTALLSVYQKGKCSSVITSNRDRGAYFSIEKYGRNLRKELTQN + ERIINI" + misc_feature 12528..12602 + /gene="wcxF" + /locus_tag="SCP46_0015" + /note="Signal peptide predicted for SPC2009 by SignalP 2.0 + HMM (Signal peptide probability 0.717) with cleavage site + probability 0.447 between residues 25 and 26" + misc_feature 13116..13643 + /gene="wcxF" + /locus_tag="SCP46_0015" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 1.1e-25" + gene 13721..15265 + /gene="wzx" + /locus_tag="SCP46_0016" + CDS 13721..15265 + /gene="wzx" + /locus_tag="SCP46_0016" + /note="member of homology group 56" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI34617.1" + /db_xref="GOA:Q4JYL9" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4JYL9" + /translation="MSRVKNSFFNILAGIVGTIISSVLAFIVRTVFIRVLGETYLGFN + GLYTNILTVLSLTELGIGSSIAYLMYKPLAEKDGDKLAQVVQFYKKIYRVIGIIILIL + GLCLVPFLPVIVNLKNAEDLNYTALYLLYLADTVSTYLFFAYKRGVLAADQKIYVANI + FDIIITTILSIFQIITLMIFKDFYLYIILKIAKNLTLNLVISLKVDKMYPSIHKFKGI + APLPKMERRLVWKNVYATSVRQIFNELMNSTDSIVISIVLGIVMVGKYSNYAYILSIV + YIFFGGIFNPIQASIGNLSLSASIEKKNEIFNRLRFINFFFLSFCSSCLLVLVNPFIT + IWIGENYTLSFTGVIAIVGMLFVRQTGNCTTIFRLGEGYFRDYHFSPLIAGILNLVVS + VILVNYIGIAGVFVGTMLGFGFQFILVDTIVTYKKVLSRPLSEFYLRWLQTILLTVGL + CIASYYLSRLVRVNSIYDLILLFVVVIGFNFFALCFIYWRNDDFQYFIQLVKNFMKNL + EEKNHD" + misc_feature 13721..13795 + /gene="wzx" + /locus_tag="SCP46_0016" + /note="Signal peptide predicted for SPC2010 by SignalP 2.0 + HMM (Signal peptide probability 0.819) with cleavage site + probability 0.398 between residues 25 and 26" + gene 15258..16481 + /gene="mnaB" + /locus_tag="SCP46_0017" + CDS 15258..16481 + /gene="mnaB" + /locus_tag="SCP46_0017" + /note="member of homology group 75" + /codon_start=1 + /transl_table=11 + /product="UDP-N-acetylmannosamine dehydrogenase MnaB" + /protein_id="CAI34618.1" + /db_xref="GOA:Q4K1X3" + /db_xref="InterPro:IPR001732" + 
/db_xref="InterPro:IPR008927" + /db_xref="InterPro:IPR014026" + /db_xref="InterPro:IPR014027" + /db_xref="InterPro:IPR014028" + /db_xref="InterPro:IPR016040" + /db_xref="InterPro:IPR017476" + /db_xref="UniProtKB/TrEMBL:Q4K1X3" + /translation="MINVIGLGYIGLPTILMLATNGVKVVGTDYNQDLVRTLNEGQTT + FKEDGLDELFHKAVESGVDFTTEYQQTDTYIISVPTPYDSFSKKIDPSYVIEATKTVL + DNCNKGAVIIIESTVSPGTVDKFIRPVVEEKGFVIGSDIHLVHAPERIIPGNMVYELV + NNNRTIGADDLEIGYKVKELYASFCKGDIVVTDIRTAEMTKVVENTFRAVNIAFANEL + AQICSYDNMNVYEIIRICNMHPRVNILQPGPGVGGHCISVDPWFLVGDYPELTNVIEH + SMRTNAAMPEFVLNRIYTIMNEHHLTDISRVGLYGLTYKENVDDMRESPTLQLLESMS + RHLATPAIKVYDPFIEKDVVANQSHDLDEFLSNVDIVVLLVGHDEILQNMDKLKDKIV + LDTRYICHLDGTYRL" + misc_feature 15261..15815 + /gene="mnaB" + /locus_tag="SCP46_0017" + /note="HMMPfam hit to PF03721, UDP-glucose/GDP-mannose + dehydrogenase, score 1.4e-45" + misc_feature 15837..16097 + /gene="mnaB" + /locus_tag="SCP46_0017" + /note="HMMPfam hit to PF00984, UDP-glucose/GDP-mannose + dehydrogenase, score 4.5e-33" + misc_feature 16179..16442 + /gene="mnaB" + /locus_tag="SCP46_0017" + /note="HMMPfam hit to PF03720, UDP-glucose/GDP-mannose + dehydrogenase, score 2.5e-15" + gene 16504..17607 + /gene="mnaA" + /locus_tag="SCP46_0018" + CDS 16504..17607 + /gene="mnaA" + /locus_tag="SCP46_0018" + /EC_number="5.1.3.14" + /note="member of homology group 23" + /codon_start=1 + /transl_table=11 + /product="UDP-N-acetylglucosamine-2-epimerase MnaA" + /protein_id="CAI34619.1" + /db_xref="GOA:Q4K1V3" + /db_xref="InterPro:IPR003331" + /db_xref="UniProtKB/TrEMBL:Q4K1V3" + /translation="MTMKKIVVIFGTRPEAIKMCPLVKELRTRENLETLVCVTGQHRQ + MLDQVLDTFRITPDFDLSIMKDKQTLFDVTIGILEGMKTVLESVNPDLILVHGDTSTT + FASSLAAFYLQIPIGHVEAGLRTYDIYSPYPEEFNRQAVGALAQYHFTPTQLSKDNLL + REGKNSEAIFITGNTAIDALQTTIQEDYTHPELNWVGDSKLILITAHRRENIGDPMRH + MFRAIRRIIEEHSDIKALYPIHMNPLVRQIAEEELSGCERIKMIDPLEVLDFHNFLSR + SYLILTDSGGIQEEAPSLGKPVLVMRDTTERPEGIKAGTLKLVGTDEDNIYRHFKELL + ENDLVYQAMSQASNPYGDGTACKKIADILEGEV" + misc_feature 16573..17595 + /gene="mnaA" + 
/locus_tag="SCP46_0018" + /note="HMMPfam hit to PF02350, UDP-N-acetylglucosamine + 2-epimerase, score 2.5e-174" + gene 17611..18666 + /gene="fnlA" + /locus_tag="SCP46_0019" + CDS 17611..18666 + /gene="fnlA" + /locus_tag="SCP46_0019" + /note="member of homology group 36" + /codon_start=1 + /transl_table=11 + /product="FnlA" + /protein_id="CAI34620.1" + /db_xref="GOA:Q4JYL6" + /db_xref="InterPro:IPR003869" + /db_xref="InterPro:IPR013692" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JYL6" + /translation="MSQFTGKTLLITGGTGSFGNAVLNRFLQTDIGEIRIFSRDEKKQ + DDMRHEFQVKVPEVAGKIRFYLGDVRDLASVKNAMHGVDYVFHAAALKQVPSCEFFPV + EAVKTNILGTENVLTAAIEAGVKQVICLSTDKAAYPVNAMGTSKAMMEKIAVAKSRTV + NPEHTKICVTRYGNVLCSRGSVVPLWIEQIKQGNALTITEPSMTRFVMTLEEAVDLVL + FAFEEGKSGDILVQKAPACTIEVLAKAVSEIFASEQDIKIIGIRHGEKRYETLLTNEE + CANAIDLGDFYRVPSDNRNLNYDKYFKDGSTNRNLLTEFNSNNTDLMDVEQVKRKLLE + LDEIQTAIRDMVADEEM" + misc_feature 17632..18486 + /gene="fnlA" + /locus_tag="SCP46_0019" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.0018" + misc_feature 17635..18483 + /gene="fnlA" + /locus_tag="SCP46_0019" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 3.1e-162" + misc_feature 17635..18306 + /gene="fnlA" + /locus_tag="SCP46_0019" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 8.3e-09" + misc_feature 17638..18273 + /gene="fnlA" + /locus_tag="SCP46_0019" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 8.4e-09" + misc_feature 18484..18627 + /gene="fnlA" + /locus_tag="SCP46_0019" + /note="HMMPfam hit to PF08485, Polysaccharide biosynthesis + protein C, score 2e-23" + gene 18766..19995 + /gene="fnlB" + /locus_tag="SCP46_0020" + CDS 18766..19995 + /gene="fnlB" + /locus_tag="SCP46_0020" + /note="member of homology group 37" + /codon_start=1 + /transl_table=11 + /product="FnlB" + /protein_id="CAI34621.1" + /db_xref="GOA:Q4JYL5" + /db_xref="InterPro:IPR001509" + 
/db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JYL5" + /translation="MIKNILITGAKGFVGKNLICTLEALKDGRDRTRPNLEIGEIFQY + DRDTDPILLDEYCKKADFVFHLAGVNRPQNPDEFMEGNYGFSSRLLEILDKYENTCPV + LLSSSTQASLEGRFSNSIYGQSKLAGEELFFEYGKKTGAPVLVYRFPNLYGKWCRPNY + NSAVATFCHNIAHDLPIQVNDPSVELELLYIDDLIQECLTALEGNPHRCNLDGLQILP + SPSGNYCYVPTTHRATLGEIVSLLETFKKQPNSLVMPEIPQGSFKKKLYSTYLSYLPV + DKFRFPLKMNIDERGSFTELLKTENTGQFSVNISKPGITKGQHWHHSKWEFFMVVSGR + ALIQERRIGLDENGQEYPILNFEVSGDKIEAIHMIPGYAHNIINLSDTENLITVMWAN + ESFDPRHPDTFFEQVEK" + misc_feature 18778..19401 + /gene="fnlB" + /locus_tag="SCP46_0020" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 2.9e-09" + gene 19996..21180 + /gene="fnlC" + /locus_tag="SCP46_0021" + CDS 19996..21180 + /gene="fnlC" + /locus_tag="SCP46_0021" + /note="member of homology group 38" + /codon_start=1 + /transl_table=11 + /product="UDP-L-fucosamine FnlC" + /protein_id="CAI34622.1" + /db_xref="GOA:Q4K1W9" + /db_xref="InterPro:IPR003331" + /db_xref="UniProtKB/TrEMBL:Q4K1W9" + /translation="MKIKTDYSDIHFKDNGKLKLLIIVGTRPEIIRLSSVITKCRKYF + DVILAHTGQNYDYNLNGIFFDNLGLDTPDVYMDAVGDDLGATVGNIINTSYKLMNQIK + PDALLILGDTNSCLSAIAAKRLHIPIFHMEAGNRCKDECLPEETNRRIVDIISDVNLA + YSEHARKYLHECGLPKERTYVTGSPMAEVLHKNLSAIESSDIHERLGLKKGGYILLSA + HREENIDTDKNFISLFTAINQLAEKYNMPILYSCHPRSKKRLQESGFKLDKRVIQHEP + LGFHDYNCLQMNAFVVVSDSGTLPEESSFFTSQGYPFPAVCIRTSTERPESLDKAGFI + LAGIDENSLLQAVETAVSLAEDEDFGLPVPDYVEENVSTKVVKIIQSYTGIVDKIVWR + KS" + misc_feature 20107..21135 + /gene="fnlC" + /locus_tag="SCP46_0021" + /note="HMMPfam hit to PF02350, UDP-N-acetylglucosamine + 2-epimerase, score 4.8e-105" + gene complement(21378..21464) + /gene="tnp" + /locus_tag="SCP46_0022" + /pseudo + CDS complement(21378..21464) + /gene="tnp" + /locus_tag="SCP46_0022" + /note="Lone member of homology group 0259" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1167 transposase (fragment)" + gene 
complement(21546..22605) + /gene="tnp" + /locus_tag="SCP46_0023" + /pseudo + CDS complement(join(21546..21731,21877..22605)) + /gene="tnp" + /locus_tag="SCP46_0023" + /note="member of homology group 12" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1670 transposase (fragment)" + gene 22686..22874 + /gene="tnp" + /locus_tag="SCP46_0024" + /pseudo + CDS 22686..22874 + /gene="tnp" + /locus_tag="SCP46_0024" + /note="member of homology group 0047 7" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase (fragment)" + gene complement(23086..23659) + /gene="tnp" + /locus_tag="SCP46_0025" + /pseudo + CDS complement(join(23086..23409,23390..23659)) + /gene="tnp" + /locus_tag="SCP46_0025" + /note="member of homology group 31" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1671 transposase" + misc_feature complement(order(23092..23409,23390..23394)) + /gene="tnp" + /locus_tag="SCP46_0025" + /note="HMMPfam hit to PF05717, IS66 Orf2 like protein, + score 1.7e-52" + /pseudo + gene order(23726..24044,24061..24450) + /gene="tnp" + /locus_tag="SCP46_0026" + /pseudo + CDS join(23726..23923,23922..24044,24061..24450) + /gene="tnp" + /locus_tag="SCP46_0026" + /note="member of homology group 19" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1381 transposase" + misc_feature order(23973..24044,24061..24438) + /gene="tnp" + /locus_tag="SCP46_0026" + /note="HMMPfam hit to PF01609, Transposase DDE domain, + score 7.6e-14" + /pseudo + gene 24711..>25070 + /gene="aliA" + /locus_tag="SCP46_0027" + CDS 24711..>25070 + /gene="aliA" + /locus_tag="SCP46_0027" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34628.1" + /db_xref="GOA:Q4K2T2" + /db_xref="InterPro:IPR000914" + /db_xref="UniProtKB/TrEMBL:Q4K2T2" + /translation="MMKSSKLFALAGVTLLAATTLAACSGSGSSTKGEKTFSYIYETD + PDNLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKD + AKWYTSEGEEYAAVKAQD" + misc_feature 24711..24797 + /gene="aliA" 
+ /locus_tag="SCP46_0027" + /note="Signal peptide predicted for SPC2025 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.277 between residues 29 and 30" + misc_feature 24957..25025 + /gene="aliA" + /locus_tag="SCP46_0027" + /note="PS01040 Bacterial extracellular solute-binding + proteins, family 5 signature." +ORIGIN + 1 cgaccgtcgc ttcctagttg tggctaactt gtccaatgaa gagcaagact tgacagtaga + 61 aggaaaagtc aaatctgtct tgattgaaaa caccctagct caagaagtct ttgaaaaaca + 121 aatcttagtt ccatgggatg ctttctgtgt ggaattacta taaatatttt ttgcagaaaa + 181 atttaaaatt gaaatcgtat aaaaacaagg gaggactgta taaaaggcag aaatcctttg + 241 ttttttataa ccaaggttta taaaccttca ttctcgaaat tcaattaact ttacaaattc + 301 ccactattaa ggagaaagaa gacgaacata aagaagcgta tccttagtgc aggcctgact + 361 tttacatctg ctttgctttt agctgcttgc gaccaatcag gttcagatac aaaaacttac + 421 tcatcaacct ttagtggaaa tccaactaca tttaactatc tattagacta ttacgctgat + 481 aatatagtca attgaaacaa gaacaagaca aaagagcctc ataaaaggta ttgcaacttg + 541 gtaatacctt tttgaggtgc tttttgatat gagcccatgt tttctcaata ggattgtact + 601 caggtgagta gggaggaaga ggtaaaagtt tatgcccaaa ctcttcgcat aaaagttcta + 661 gcttccccat tctatggaat cttgcattat ccataataat aaccgatggt gtggttaatg + 721 ttggtaagag aaatttctga aaccaagctt caaaaaagtc gctcgtcatc gtctcttcgt + 781 aagtcattgg agcgattaac tcaccattca tttgttagac ctgcaatcaa agaaatcctc + 841 tgatatcttc ttccagatac tttacctctt attaactgac cttttaatga gcgaccatat + 901 tctcgataaa aataagtatc gaatcctgtt tcgtcaatct aaacaggtgc taggtgcttt + 961 aaactattaa aattcttaag aaataaggct actttttcta ggtcttgttc ataattagat + 1021 tgaaactaga atagtacacc tctgcttcta aaacattgtt agaaatcgat ttgactgtcc + 1081 tgatcgtttt gtcatgttct tatttcattt tactatattt ttggttcgcg ggaagtctac + 1141 taagatactt aaagatgcag atagtaaaaa aagatgtaga cattaccgta aaaaagtgat + 1201 ataattgtat gatgttcaag gtataggtgt taatcatgag tagacgtttt aaaaaatcac + 1261 gttcacagaa agtgaagcga agtgttaata tcgttttgct gactatttat ttattattag + 1321 tttgtttttt attgttctta atctttaagt ataatatctt 
tgcttttaga tatcttaatc + 1381 tagtggtaac tgtgttagtc ctactagttg ccttggtagg gctactcttg attatctata + 1441 aaaaggctga aaagtttact atttttctgt tggtgttctc tatccttgtc agctctgtgt + 1501 cgctctttgc agtacagcag tttgttggac tgaccaatcg tttaaatgcg acttctaatt + 1561 actcagaata ttcaatcagt gtcgctgttt tagcagatag tgagatcgaa aatgttacgc + 1621 aactgacgag tgtgacagca ccgactggga ctgataatga aaatattcaa aaactactag + 1681 ctgatatcaa gtcaagtcag aataccgatt tgacggtcaa ccagagttcg tcttacttgg + 1741 cagcttacaa gagtttgatt gcaggggaga ctaaggccat tgtcctaaat agtgtctttg + 1801 aaaatatcat cgagtcagag tatccagact acgcatcgaa gataaaaaag atttatacca + 1861 agggattcac taaaaaagta gaagctccta agacgtctaa gaatcagtct ttcaatatct + 1921 atgttagtgg aattgacacc tatggtccta ttagttcggt gtcgcgatca gatgtcaata + 1981 tcctgatgac tgtcaatcga gataccaaga aaatcctctt gaccacaacg ccgcgtgatg + 2041 cctatgtacc aatcgcagat ggtggaaata atcaaaaaga taaattaacc catgcgggca + 2101 tttatggagt tgattcgtcc attcacacct tagaaaatct ctatggagtg gatatcaatt + 2161 actatgtgcg attgaacttc acttctttct tgaaaatgat tgacttattg ggaggggtag + 2221 atgttcataa tgatcaagag ttttcagctc tacatgggaa gttccatttc ccagtaggga + 2281 atgtccatct agactctgag caggctctag gttttgtacg tgaacgctac tccctagcag + 2341 atggcgatcg tgaccgtggt cgcaaccaac aaaaggtgat tgtggctatc cttcaaaaat + 2401 taacgtcaac cgaagcactg aaaaattata gtacgatcat tgatagcttg caaaattcta + 2461 tccaaacaaa tatgccactt gagaccatga taaatttggt caatgctcag ttagaaagtg + 2521 gagggagtta taaagtaaat tctcaagatt taaaagggac aggtcggatg gatcttcctt + 2581 cttatgcaat gccagacagt aacctctatg tgatggaaat agatgatagt agtttagctg + 2641 tagttaaagc agctatacag gatgtgatgg agggtagatg agatgataga catccattcg + 2701 catatcgttt ttgatgtaga tgacggtccc aagtcaagag aggaaagcaa ggctctcttg + 2761 gtagaagcct acagacaggg ggtgcgaacc attgtctcta cctctcaccg tcgcaaggga + 2821 atgtttgaaa ctccggaaga gaagatagaa gaaaactttc ttcaggttcg ggaaatagct + 2881 aaggaagtgg cgagtgattt agtcatcgct tacggggctg aaatttacta cacaccagat + 2941 gttctggata agctagaaaa aaagcggatt ccgaccctca atgatagtcg ttatgccttg + 3001 
atagagttta gtatgaacac tccttatcgc gatattcata gcgccttgag caagatcttg + 3061 atgttgggaa ttactccagt cattgcccac attgagcgct atgatgctct tgaaaataat + 3121 gaaaaacgcg ttcgagaatt gatcgatatg ggctgttaca cgcaagtaaa tagttcacat + 3181 gtcctcaaat ccaaactttt tggcgaacgt tataaattca tgaaaaaaag agctcagtat + 3241 tttttagagc aggatttggt ccatgccatt gcaagtgata tgcacaatct agacggcaga + 3301 cctcctcata tggcagaagc atatgacctt gttacccaaa aatacggaga agcgaaggct + 3361 caggaacttt ttatagacaa tcctcgaaaa attgtaatgg atcaactaat ttaggagaaa + 3421 tgatgaaaga acaaaacacg atagaaatcg atgtatttca attatttaaa accttgtgga + 3481 aacgcaagct aatgatttta ttagtggcac ttgtgacagg tgcgggggct tttgcatata + 3541 gcgcttttat tgttaagcca gaatatacga gtaccacgcg aatttacgta gtgaatcgcg + 3601 atcaaggaga caagtcgggg ctgacaaatc aggatttgca ggcaggaact tatctggtaa + 3661 aagactaccg tgagattatc ctttcgcaga atgtattgga aaaagtagcg acaaatttga + 3721 agttggatat accagccaaa acgttagcta gaaaagttca agtgactgta ccagttgaca + 3781 ctcgtatcgt ctcaatctct gtcaaggata aacagccaga ggaagccagt cgtatcgcta + 3841 attctctacg agaagttgct gcagaaaaga tcatcgctgt aacgcgagta tctgatgtaa + 3901 cgacacttga agaagcgcga ccagctacga ctccctcttc tccaaatgtt cgtctcaatt + 3961 ccttgtttgg tttttttgga ggagcagtcg taacagtaat tgctgttctt ttgattgagt + 4021 tgttcgacat ccgtgtgaaa cgtcctgaag atgtcgaaga tgtactgcaa attccacttt + 4081 taggggtcgt tccagatttg aacaaaatga aataggagga agttatgcca acattagaaa + 4141 tctcacaggc aaaattggat tttgtaaaaa aggcagagga aaattataac gctttgtgca + 4201 cgaacctaca gttaagtgga gatgatttga aagtattttc tatcacttct gtgaaacaag + 4261 gagaaggaaa atcaacgact tccaccaata ttgcttgggc ttttgcgcgt gcaggttaca + 4321 aaacgctgct gattgatgga gatattcgca attctgttat gttaggtgtc tttaaagcaa + 4381 gagataagat tacaggcctg acagaatttt tatcaggaac tacagaccta tcacaagggc + 4441 tttgtgatac caatatcgaa aatctctttg taattcaggc tggctctgtg tcaccgaatc + 4501 cgacagctct tcttcaaagt aagaatttca gtacaatgct tgaaaccttg cgtaaatatt + 4561 ttgactatat cattgtagat actgctcctg tcggtgtcgt gattgatgcg gctattatta + 4621 cgcaaaaatg cgatgcttct 
attttagtga cgaaggcagg tgaaataaat cgacgggata + 4681 ttcaaaaagc aaaagaacag ttggaacaca cagggaagcc gtttttggga gttgtgttga + 4741 ataaattcga tacttcagta gacaaatacg gttcttatgg aaattacgga aaaaaataag + 4801 tcgttaagta tttgtgtaag gacattttta gaactacaat caaaatcttt ggaattgctg + 4861 gcttcaaatc atattgattt gaaatgaaac ttgcaaaaga gttttttagg tgagtttctt + 4921 aatttgtgac tgaaatcaat cttctacttc cataccttgg aaaaataggg taaacgagaa + 4981 atgttttttc cataataaag ttttgatatg gctagtagag tagtaatata atagacttgt + 5041 tcggtaactg taaaaagtgt tatactattt ttatggaaac agtatacgac aaagcacaaa + 5101 aacttaactc aaaaaacttc aaactattga ttggtgtcaa aaaggaaacc tttcaactca + 5161 tgctagaaca cctgaattca gcctatcaga ttcagcaccg aaaaggtgga cgtccacgta + 5221 gtctgcccat ggaagaccag ctcattatgc ccctccgtta cttgcgatat tatcccactc + 5281 agcgtctgct ggcctttgat tttggcgtcg gtgtagctac ggtaaatgcc atcatcactt + 5341 gggtggagga tacacttcgt gcgtcaggta gctttgattt ggaccattta gaagccccga + 5401 gtgctgctgt ggctattgac gtgaccgaaa gtccgattca gcgtccaaaa aaaaccaaag + 5461 caaaaattat tctggtaaaa agaaacgaca caccttaaaa actcaaatta tgctggattt + 5521 gacgacacat aaagtctgtc aaatggcctt ttctgacgga catacgcatg attttactct + 5581 cttcaaagaa agtattggac aaagtttgcc tgaaacgacg cttgcctttg ttgacctagg + 5641 ttatttaggc atcttgaaat ttcatgagaa tactttcatt cctgctaaaa attccaaaaa + 5701 tcgccgcctg agtgaggatg ataagcagtt aaataaagag atgtcagcga tacgaattga + 5761 aattgaacat tttaacgcta aattcaagac cttccaaatc atgtcagtcc cttatcgtaa + 5821 ccgcagaaaa cgtttcgagt tacgggcgga attaatttgt gccatcatca attatgaagt + 5881 gaactagatt ccgaacaagt ctaatgaatt gtaatcatta gtgttcatac caagaaatat + 5941 caagtaccta tttttggaaa ttataaatgt tagatagtgt ttaaattttt acggagagat + 6001 tgttttgaga ggtaatttat gtatagggaa ataaaacgat taggtgatat tttactttct + 6061 ttcataggaa taatagtact gtttccagtg tttattataa ttgcaatcgc aataaagctt + 6121 gattcaaaag gtccagtaat atttaagcaa aagcgatttg gacttcataa gaaatcgttc + 6181 tatgtcttga agtttcgaac tatgaaggtt gaatcgccaa aatatgtggc gactcgagac + 6241 ttagataaac cagaacagtg gattaccaaa gtaggagctt 
gtttgcggaa aacatcttta + 6301 gatgaactgc ctcaactgtg gaacattctt gttggtgata tgagtgttgt aggacctagg + 6361 cctgtagcta taaatgaact tgatttgata aaagaaagag aacagtatgg tgccaatgat + 6421 atcttaccag gattaactgg atgggcacaa attaatggac gtgataattt gtcaacagag + 6481 atgaaggcag agatagatgg ttattatgta aaacatatgt cgttaagaat ggatcttaga + 6541 tgtatcctta gaacaatccc ctacgtatta aaacgtaagg gaattgtgga gggtagtggt + 6601 aagaaagagt tggagtgatg caatgaaaat tctatttgtt tgtcaacatt ataagccaga + 6661 accttttaga ttgtcagata tttgtgagga tctagttcaa agagggcacg aggtggctgt + 6721 tttgacaggg attcctaact atcccgaggg ggaaatatat gctgattatc gtaagagaaa + 6781 aaaaagaaga gagactataa atggtgttgc tatttttcgt tcatacacca ttgctaggag + 6841 gcaaaatact ttataccgta tattgaatta ttttagtttt gctctttctt ctacgatagg + 6901 tgttatattt gggcgttata aagcgaaaga tggctcagat tttgattgtg tctttgttaa + 6961 tcaactatct ccagttatga tggcttgggc tggtatagct tataagaaca agtacaataa + 7021 acctatgttt ttgtattgca tggatgtttg gccggatagt ttaattgtag gtggggtgaa + 7081 ggaaaatgga ttgatttaca agatatttga atttgtttca aaaaaagtat atcaagccag + 7141 cgattatata tttgttacta gtctatcttt taaagattat tttgtaaaaa aatttaatat + 7201 tcctctccac aaaattactt acttaccaca atatgcagag gatttatttg taccaaatga + 7261 attaaaaacg aacaaaaata ctattgactt aacttttgct ggaaatattg gaaaagctca + 7321 gaatttagag actattttga aagcagccag tgcaatagaa cagattcccg atttagcaaa + 7381 gagagttcat tttcattttg ttggagatgg tacggaacta ttaaacatgc aaaaattagc + 7441 atgtgaacta gaattagaga acacttcatt ttatggtaga cgtccattag aagagatgcc + 7501 ggatttttat acaaaatcag atgcgatgct agtttcttta ataggcgact ctataatttc + 7561 tcgcacctta ccaggtaagg tacaatctta tatggcggca ggaaaaccaa ttataggagc + 7621 gatttcagga gatactcaga gagttgtaaa agaagcaaaa tgtggtttca taagtccgga + 7681 agggaatgtt gatcagttag tgagaaatat tcgtaagttc tgtttgcttt ctgtagagga + 7741 aagagagaaa ctaggaaggc aagctcgttg ttgttatgaa gaacagtttt cgaaagagtg + 7801 gtttatgaca tacttagaaa atcatttaaa agaggggttt ctatcatgaa ggttttaatg + 7861 attaattccg tttgtggtat taggagcact gggagaattt gtacggatct cgcaactgct + 7921 
ttgacagaag aaggatatga ggttaaaatc gcctatggtc gtgagtatgt tccgaaacaa + 7981 tttcaacagt atgcagtgaa aattggtaca aagtctgata ttcgttttca tgcgattcgt + 8041 tctcgattat ttgacgaatc tggctttgga agtagacagg caactgttaa ttttattaaa + 8101 tggataaaag agtttgaccc tgatgttatt catcttcata atcttcatgg atattatatc + 8161 aatattgaac tgttatttga ttatctccgt atatgcggta aaaagattat atggactttg + 8221 catgattgtt gggcatttac aggacactcg gctcactttg attgtttgga atgtgagtca + 8281 aagggggttt gtgaccatcc atctcagaaa aatgattatc ctaagtcgtt cgtgaatttt + 8341 tcaaggcgaa attatcaaag gaagaaaaaa tgttttacac atattcctaa tctcactatt + 8401 gttactcctt cgcaatggct agctaacttg gtaggacagt catttttaaa agaatatcca + 8461 gtgaaagtaa ttcataatgg cattgatact actgtctttc aaccgaggct aatagccgct + 8521 caaaagttga aaaaaagata ccatcttgaa ggaaagcagg tattgcttgg tgtggctgct + 8581 atctggactg ataaaaaggg attttctgat atgttagtcc ttgcgagtca tctagctgat + 8641 aatcagagaa tagttttgat agggttaaaa gataggcaac tcaaaaaatt acccaaaggt + 8701 attattgggc taacagagac taatagtcca gaagagttgg cagcatggta tacactagcg + 8761 gatgtattct taaatcctac ttatcaagat agttacccga caactaattt agaagctatt + 8821 tcttgtggga caccagttat cagctatccg acaggtggta gtgtagaaag tgctaaactt + 8881 tatggtctcg tttgtcagga tagaaacgta gcttctattt tatcttcgtt agaaaaagtc + 8941 tctcagctat ctaaaacaga aaaattagat ttttcaattg caagttttat taaacaaatg + 9001 aaatatttat actagaactt gaattatagg aaaatgagga atttgcatta aaatgatgaa + 9061 aagaatttat tatcaccttt tggctatttt ggcttggact cttccaaatt cttatgcttt + 9121 tattgattcg ttaaaggtgt tttttccgaa tattagttta caaattgcag gttctctttt + 9181 ggctgttatc tcgataggaa tttttatcac tagaatatat tatacaggat acgaagtttt + 9241 tatatctcta ttggtttgta tttttatttt aattttttat tcaactcgct ttttttattc + 9301 gactaatgta gagttgtatc attctttctt caattccttt ctgattcgtc cagttcctgg + 9361 gatattagta gcgatgctgt tagctaagaa taatcatata aaaggtttca taaaatggtc + 9421 agaacctatg atgcttttct atacattgac atcattttta gcagccctat ctcctagaaa + 9481 tagcattatt atttaccaat ctttatctta ttatgccatg acagcttata tgattaatgt + 9541 gtttaatatt atatacaaag 
agaaaatatt ggaggagcaa ctgacgtatt tcagattctc + 9601 agcgtggaat tttattagat attttttact tttgattcaa gcttttaatg cactctcagg + 9661 aggtgggaga ggtgccttta tcttattaat tatttttaca ggaatattat taataagaat + 9721 tgctatgaat tttaagttcc ttttctcatt cattggaggc ttatctgcta tagctctagt + 9781 tgttttttgt ataaaagatt tggatttcac atggctcttg aatatggacg gtggagagcg + 9841 attgttgaac ttcttcggca gacctgaacg tatatctaca gataatagac tattgattta + 9901 tgatactgtt tggtctgcaa tacaggaaaa acccttttta ggatggggag ttggttcaac + 9961 ttttttaaaa tttaatggat attcacataa tattgtattg gatttattgc atgatatggg + 10021 aagttttggt ttattaatta ttctttcggc tttctttgct tcttcagtaa tattgtacaa + 10081 attacgtaaa atagattgga aagtgaattt atttattctg atgtttctag aagtatatgt + 10141 tcacatgagt ttcagtggaa gctatcttgc agatggtaga ctatggtttt tggtgatctt + 10201 tacttattgt tactacaggt ggaaagtgca ggaaaaggat gaagttagca attttattat + 10261 ctgatatttc aaaaatagga ggagtgcagc gtgtcacgac agctcttgtt aatgaacttt + 10321 gtcaaaatat agacgttaca attatcagca tcttttcgga aaatgagcta ccagcttttg + 10381 gactttcaga tagagttcag gtgagctatc ttttgaaaga acatgttaat ttgaagaaga + 10441 atttttttaa agttagtgga gctttgcgaa aagtgttgaa aaaacagcag tttgatgttg + 10501 ttctatcgtc aggaactggt ctagtatcct ttctttggtt tgctagtttg ggaattccta + 10561 ccagactttt ggcatgggaa catcagtgtt tttactttgg gagatcgttt ggtctagagt + 10621 ggttggggcg aaagctagcc tgtcgttttg ctgagagtat tgttgtcttg actaaaaaag + 10681 atgaaggatt ttacaaagag aatcgtccta aggctcatat tgaacaaatc tataatatcc + 10741 tagacatgga ttcacaaaca gctaagtgtc agctctcttc taaaaaaatt atcagtgttg + 10801 gctctttagg acgacaaaaa ggttttgatc tggctcttga ggtagctagt caaatacaat + 10861 taagctatcc agattggcag tgggacattt atggtgatgg ccccgataga gaaaaattag + 10921 aggagaaagt cagggaatac caattagaag gctttataaa tttgaaaggg cttgttcaga + 10981 atgttcggga gctctatcct gactactcta tctacgccat gacatcacga catgaaggat + 11041 taccaactgt attattagaa gctaaaaact gccagatgcc tgttatttca tttgattgta + 11101 actgtggacc ctctgatatt atttcagatg gaagaaatgg ttttttgatt gattgttttg + 11161 atgtaaatat ctatgcaaaa 
actttatcta aattaatgac tagtttagag ttgcgagaac + 11221 aagttgcaaa atcgagtgtt attccagcag aagaattgtc aacaacttat atcctagata + 11281 agtggaacaa tctattaaag atagaaagaa gataatatga aaatagtcca tgtagaagat + 11341 ttttttcatc cagatgcagg ttaccagatt aatgttttac caaaatatct agcaaagttt + 11401 ggtcatgaac aggtgattat cacttcagaa atggataaaa tccccgataa tcttacccaa + 11461 ttttttggac gagaaaatat agaagagaga gatagaagtt acgaagagaa gcatcatgtg + 11521 aagattattc gcttacctct tcatggattt gtaagtggac gtgcgatttt ttctggaaag + 11581 cttatttcgg ctattaaggg tctttctcca gaggtattgt atattcatgg gaatgacacc + 11641 ttaacaggga ttcgtctcct tttagctcga aagaaactta attgcagaat cgccaccgat + 11701 agtcatatgc ttgaaatggc atcaagaaat cctttcaaca actactttag gagattttat + 11761 aaaaccttga ttactcccat tttgataaaa gaacagatac caattattcg gacgcaagat + 11821 gataattatg ttgaaaaaca cttgggaatt cctttatcgc aagctccatg gatttcttat + 11881 gggtcggata cagcgttctt tcacgcagat agccagatta aggaagattt tcgttctcaa + 11941 tatcaaatcc cttcagatgc tcttatttgt gtttacgcag gaaagttaga tgagcataag + 12001 ggtgggatgt ttttagcaga gtctctaagt aaaaagttaa atacggagca accaattgtt + 12061 ttcattatag tgggtaatac aaatggagag tatggagaag ctgtcgagaa aagtttctcc + 12121 caatctgaaa accaaatctt gcgctttccg actcaaaaat atcaaaaatt agcacagttt + 12181 tttcaggtag cagattttgc tttatttcct aaacaatgta gtttaagttt ttatgatgca + 12241 caggcctgtg gtttaccagt tttattggaa gataataata tcaacctcga tagaacttct + 12301 cattataatg gttggacgtt caaggctaac agcaaattaa gtttgagaga ttcattaaaa + 12361 atgattgcga gtctagataa agagaagaga caagagtact ctcagaatgc actgcactat + 12421 atccttgaac attataatta tgaagataaa gcaagagaat atgaaaagat tcttataggg + 12481 gaacgtacga aatgagatag ttaatatttc gttattttat aggaaaggtg gatttaatga + 12541 aaatttgcat tgtttcagtc ggagtgagcg gactaccgat tccagctgta aaagggggag + 12601 cagtagaaaa tctcattgat aattatttaa gttacaatga gaaatataat catgatgaaa + 12661 ttacggtcgt tagttgtgac cataaggagg cgcgtgaggc ttcaaaaaaa tacaagtatg + 12721 cccaatttgt ctatatagat attcattcac ttaaatataa aataaacaaa acaatacgtt + 12781 ataccatcaa taaatattca 
cctttcttcg tagggaacgc ttatatcagt caattgccag + 12841 acttgtctgg ttttgataca gttttgattg aaaatcgccc tgaatacggt tattatattc + 12901 gtaaaaagtt taaaggaaat cttgttttac atcttcacaa tgatttatta atggacaatg + 12961 agtattctgt agattatagc gtttatgata aaattatcac agtatctgac tatattagga + 13021 ataggtcaga agtagtaacg tcaggtgttc cgatacagac tgtctataat ggtattgaca + 13081 cagaactttt tttgcagaat ttctctgaag ttgatttatc agatcttaaa aatcagttgg + 13141 aaattttgtc ggatgatttt gtgattgttt tttttggacg tatcaacaaa aataaaggta + 13201 tcaaagaact gcttgaagcc ttcttgttgc taccaaagaa tttgaatata aaattactag + 13261 ctgttggtag ttctatattt ggtcagacgg agttggatac tttcacaaca gagctacggc + 13321 aattggcaaa acaagcatca gataaagttg tttttacagg ctatgttaat tacaaagaca + 13381 ttcctaagta tcatcatatt gcagattgca ttgttattcc atctatttgg gaggaaccag + 13441 cgagtttgac ggtctgtgaa gctttgatat cagggaaata tgttattaca acagatactg + 13501 gagggacacc agagcttgta gctggcagtg atgcccttgt ggtagcaaat gatgagtgta + 13561 tagttgaaca cctcaaaaca gccctattga gtgtctacca aaaagggaaa tgctcttcgg + 13621 ttattacttc taatagagat agaggagcct atttttctat tgaaaaatat ggaagaaact + 13681 tacgaaaaga gctcacacaa aatgaaagaa ttattaacat atgagtcgtg taaaaaatag + 13741 tttttttaat attttagctg gaatagttgg tactatcata tcgagtgttt tagctttcat + 13801 agttagaaca gtgtttatcc gagttttggg agagacttat ctaggtttca atggtctata + 13861 caccaatatc ttaacagttt tatccctaac tgaattaggg atcggatcat caattgctta + 13921 tttgatgtac aaacctttag cagaaaaaga tggggacaaa ttagctcaag tagttcaatt + 13981 ctataaaaaa atatatcgag tgattggtat cattattctt attttaggtt tgtgtctcgt + 14041 tcctttttta ccagtcattg taaatttaaa aaatgcagaa gatttgaact atacagcatt + 14101 gtatttgctt tatttagcag atacagtttc tacttatcta ttctttgcat ataaaagagg + 14161 ggtattggct gctgatcaaa agatctatgt tgcgaatatc tttgatataa ttataacgac + 14221 aattttatct attttccaaa ttatcacttt gatgattttt aaagactttt atctatatat + 14281 tattttaaaa attgctaaaa atcttacttt gaacctagta attagtttaa aagtagataa + 14341 aatgtatcca agtattcata aatttaaagg gatagctccg cttccaaaaa tggaaagacg + 14401 actagtttgg aaaaatgtat 
atgctacctc tgttcgacaa atctttaacg aattaatgaa + 14461 ttcaacagat agtatagtta tttccattgt cttaggaata gttatggttg gtaagtattc + 14521 gaactatgct tatattttat caatcgtata tattttcttt ggaggaattt ttaatccgat + 14581 tcaggcttct attggaaacc tatctctgtc agcttctata gagaaaaaaa atgaaatctt + 14641 caatagatta cgttttataa attttttctt tttatcattt tgctcaagtt gtcttctagt + 14701 attggtaaat ccttttatca ctatttggat tggagaaaat tacactttat catttacagg + 14761 tgtgattgca atagttggta tgttattcgt tagacaaact ggaaattgta caaccatttt + 14821 tcgtttggga gaaggatatt ttagagatta tcatttttct cctttaatcg cgggcatttt + 14881 aaatttagtt gtttcagtaa ttttagtgaa ttatataggt attgcaggtg tttttgttgg + 14941 aacaatgtta ggatttggtt tccaatttat actggtggat acaattgtta cttataaaaa + 15001 agtacttagt cgtccactat cagagtttta tttaagatgg ttgcagacga tcttattaac + 15061 tgtaggttta tgtattgcga gttactattt atctcgattg gttagagtga atagtatata + 15121 tgatttgata ctgttgtttg tagtggttat tggatttaat ttttttgctt tatgttttat + 15181 ttattggcga aatgatgatt ttcaatattt tattcaattg gttaaaaatt ttatgaaaaa + 15241 tttggaggaa aaaaatcatg attaatgtaa tcggattagg ttatattgga ttgccaacaa + 15301 ttttaatgtt ggcaacaaac ggcgtgaaag tagttggaac tgactacaat caggatttgg + 15361 tgagaacttt aaatgaaggt caaacaacct ttaaagaaga tggattggat gaactatttc + 15421 ataaagcagt ggagtcgggt gtggacttta caaccgaata tcaacaaacg gatacctata + 15481 ttatttccgt tccaacacca tatgactcct tctctaaaaa aattgatcca agctatgtga + 15541 ttgaagctac gaaaacggta cttgataatt gcaataaagg agcggttatt attattgaat + 15601 cgaccgtatc accaggaacg gttgataaat ttattcgacc tgttgtagaa gaaaaaggtt + 15661 ttgttattgg tagtgatatt catcttgtcc atgctccaga acgtattatt ccagggaata + 15721 tggtctatga attggtgaat aataaccgta caattggagc tgatgaccta gaaatcggct + 15781 ataaagtgaa agagctttat gcttcatttt gtaagggcga tattgttgtt acagatatta + 15841 gaactgcgga gatgaccaag gtagtagaaa atacatttag agctgtaaat attgctttcg + 15901 ctaacgaatt agcacagatc tgtagttatg ataatatgaa tgtttatgaa attatccgga + 15961 tctgtaatat gcacccacgg gtaaatattc tacaacctgg acctggtgtt ggtgggcatt + 16021 gtatttctgt ggatccttgg 
ttcttagttg gagattatcc tgagttgaca aatgttattg + 16081 aacattctat gcgaacaaat gctgccatgc cagaatttgt attaaatcgt atctatacca + 16141 ttatgaacga acatcatcta acagatatta gtcgggttgg tctatatggt cttacctaca + 16201 aagagaatgt agatgatatg cgtgaatctc caacgcttca gttattagaa tctatgagcc + 16261 gccatctggc aacacctgct attaaagtat atgatccatt tatagaaaaa gatgttgtgg + 16321 cgaatcagtc acatgattta gatgaatttt tatctaatgt tgatattgtt gtactgttgg + 16381 ttggtcatga tgagatttta caaaatatgg ataaactaaa agataagata gtgttagata + 16441 cacgttatat ctgtcatctt gatggaactt acagattata attagtgata aataaagtaa + 16501 ggattgacta tgaaaaaaat agttgtaatt ttcggaactc gtcccgaagc tatcaagatg + 16561 tgtcccttgg ttaaagagct aagaacacgt gagaatcttg aaacattggt ctgtgttacg + 16621 ggtcaacatc gtcaaatgct ggatcaagtt ttggatactt ttaggattac gcctgatttt + 16681 gatttatcta ttatgaagga caaacaaact ctctttgatg tcacaattgg cattttggaa + 16741 ggcatgaaga ctgtcttaga gtcagttaat cctgatttaa tattagttca tggggatacg + 16801 agtacaacat ttgccagttc actggccgcc ttttatctac agattccaat tggacatgta + 16861 gaggctggtt tgcgtactta tgatatttat tcaccttatc ctgaagaatt taatcgtcaa + 16921 gcagtaggtg ctttggctca gtatcatttt acaccaacac aactctcaaa agacaatctc + 16981 ttgagagaag gaaaaaattc tgaagctata tttatcacag gtaacacagc aattgatgct + 17041 ttacaaacta caattcaaga ggattatact catcctgagt taaattgggt tggggatagc + 17101 aaactaatat taattactgc tcatcgtcgt gaaaatattg gtgacccgat gaggcacatg + 17161 tttagagcaa tccgacgtat cattgaagaa cattcggata taaaggctct ttaccccatt + 17221 catatgaatc ctctagttcg tcagattgct gaggaagaac taagcggatg tgaacgtatc + 17281 aaaatgatcg atccgttgga agtattagat tttcataact ttttatcacg gagttatctc + 17341 attttaacag atagtggtgg tatccaagaa gaggcaccta gtttaggaaa acctgtttta + 17401 gttatgagag atacaactga acgtccggag ggaattaaag caggaacttt gaagcttgta + 17461 ggtactgatg aggacaatat ttatagacat tttaaagaat tgttagaaaa tgatttagtt + 17521 tatcaagcga tgagccaagc ttcaaatccg tatggagatg gaacagcttg caagaaaatt + 17581 gcagacatac tagaaggaga agtataatat atgtcacaat ttacaggaaa aactctccta + 17641 attacaggag gaacaggttc 
atttggtaat gctgtcctta atcgtttttt acagactgat + 17701 attggtgaaa ttcgtatttt ttcccgtgat gaaaaaaaac aggatgatat gcgtcatgag + 17761 tttcaggtaa aagtaccaga agtagctggg aaaatccgtt tttaccttgg agatgtgcgt + 17821 gacttagctt cggtaaaaaa tgctatgcat ggtgtggatt atgtttttca tgctgctgct + 17881 cttaaacaag taccttcgtg tgaatttttc cctgtagaag cggtaaaaac taacattttg + 17941 ggaacggaga atgtcctcac tgcggctatc gaagctggtg taaagcaagt tatctgtctt + 18001 tctacagata aggcggctta tcctgtcaat gctatgggaa catccaaggc tatgatggaa + 18061 aagattgctg ttgctaagtc caggacggta aatcctgagc atacaaagat atgtgtgact + 18121 cgctatggga atgttctgtg tagccgtgga tctgtcgttc ctctttggat tgagcaaatt + 18181 aagcaaggaa atgctcttac aattactgaa cctagcatga cacgttttgt gatgacatta + 18241 gaagaagcag tagacttggt tttatttgca tttgaagaag ggaaatctgg agatatacta + 18301 gttcagaaag caccagcatg tacgattgaa gtgttggcta aggctgtatc agaaattttt + 18361 gcctcagaac aagatattaa gattataggt attagacacg gagaaaaaag gtatgaaaca + 18421 ctattaacta atgaagagtg cgcaaatgca attgatttgg gtgattttta tagagttcct + 18481 agtgataatc gtaatcttaa ctatgataag tatttcaaag atggtagtac gaatagaaat + 18541 ttgttgacag aattcaatag taataatacc gatttgatgg atgtagagca agttaaaaga + 18601 aagttgctag aattagatga aatacagaca gcaattcgtg atatggtagc agatgaagag + 18661 atgtaaaatc ttttaagata cattaaaatt atcaaggata tataatgtat catgtattgt + 18721 cgagagagtt gactattaaa acagcatata aaacaaggag ggggcatgat taaaaatatt + 18781 ttaatcacag gagcgaaagg atttgtagga aaaaatctta tctgtactct ggaagctttg + 18841 aaagatggac gagataggac tcgtcctaat ttagagattg gagagatttt tcagtatgat + 18901 cgtgatacag atccgatttt attagatgaa tattgtaaga aggccgattt cgtattccat + 18961 ttagctggtg tcaatcgtcc acagaatcct gatgaattca tggagggaaa ttacggtttt + 19021 tcaagtagat tattggagat tttagacaag tatgaaaaca cttgtcctgt tctactctca + 19081 agttctactc aagctagttt agaaggccga ttttcaaact ctatatatgg acaatctaag + 19141 ctagcagggg aagaactctt ctttgaatat ggaaagaaaa cgggagcacc tgtcttagtt + 19201 taccgtttcc cgaatcttta tgggaagtgg tgccgtccta actacaattc tgctgtagca + 19261 actttctgtc ataatatagc 
tcacgattta cctattcaag taaatgatcc aagtgtagaa + 19321 ttggagttgc tgtatattga tgatttgata caagagtgtc taactgcatt ggaaggaaat + 19381 cctcatcgtt gtaatctaga tggattacaa atcttaccta gcccatcagg aaactactgc + 19441 tacgtaccaa cgactcatcg tgcaacctta ggagagattg tctctctatt agaaacattt + 19501 aaaaaacagc ctaatagttt agttatgcct gaaattcctc aaggatcgtt taaaaagaaa + 19561 ttgtattcta cctacctatc ttatttacca gtagataagt ttaggtttcc tctaaaaatg + 19621 aatatagatg aacgaggtag ttttacggaa ttattaaaaa cagaaaatac gggtcaattt + 19681 tctgttaata tttctaaacc tggcattacc aaagggcaac attggcatca ttctaagtgg + 19741 gaatttttca tggttgtttc tggtcgtgct ttaatacaag agcgtaggat agggctggat + 19801 gaaaacggtc aagagtatcc tattctgaac tttgaagtgt cgggcgataa gattgaagca + 19861 atacatatga taccgggcta tgcacataat attattaatc tttctgatac agaaaatcta + 19921 attactgtca tgtgggctaa tgagtcattt gatcctagac atccagatac tttttttgaa + 19981 caagtggaga aataaatgaa aattaagaca gattatagtg atattcattt taaagataat + 20041 ggcaaactta agttattgat tattgtggga acacgtccag agattatacg tctaagtagt + 20101 gttatcacta aatgtcgaaa gtattttgat gttattttgg cacatactgg acaaaactat + 20161 gattacaatt taaatggtat tttctttgat aatttagggt tagacactcc ggacgtatac + 20221 atggatgctg ttggagatga tcttggtgct actgtaggga atattattaa tacttcatac + 20281 aaattgatga atcaaattaa accagatgct ttattgattt taggggatac aaattcttgt + 20341 ttatcagcta ttgctgccaa gcgtttacat attccaattt ttcatatgga ggctggcaat + 20401 cgctgtaaag atgagtgcct gccggaagag actaatcgtc ggattgttga tattatttca + 20461 gatgttaact tagcatactc tgaacatgca cgtaagtatt tacatgagtg tggtttacct + 20521 aaagagcgca catatgtaac tggttctcct atggcagaag tgctacataa aaatttatct + 20581 gccattgagt cttcagatat ccatgaacgt ttgggattga aaaaaggagg ttatatctta + 20641 ctttcagctc accgtgagga aaatattgat acagataaaa attttatttc tctctttaca + 20701 gcaattaatc aattagctga aaagtataat atgccaatct tatattcttg ccatcctaga + 20761 tcaaagaaaa ggctacaaga gagcggtttt aaactagata aacgtgtgat tcagcatgag + 20821 ccactaggat tccatgacta taattgttta cagatgaatg catttgttgt agtatctgat + 20881 tcgggaactt taccggaaga 
aagtagtttc tttactagtc aaggttatcc ttttcccgct + 20941 gtatgtattc gtacaagtac agaacgtcct gagtccttag ataaggcagg atttattttg + 21001 gcaggcattg atgaaaattc tcttcttcaa gcagttgaaa ctgctgttag cttggcagaa + 21061 gatgaggatt ttggattacc ggttccagat tatgttgagg aaaatgtctc tactaaagtt + 21121 gttaagataa tacagagcta tacagggata gtggataaaa tagtttggag gaaaagctga + 21181 attgtatatt tttaataaat caaaacgaga tgattaattc ttagtagaac aagagtaaaa + 21241 ttgaacgtat ttgatggaaa tgtcttactt gatagtcgag ggatagccat tctatcggat + 21301 ttttggcttg tttttgcgct tcatgtttga tagaataaag ggctctttgt caactgtagt + 21361 gggttgaaga aaagctaagc ttgagaaagg acaaatttcg tcctttcttt tttgatgttc + 21421 agagcgataa aaatccgttt tttgaagttt tcaaagtttc gaaagtaacc gcccaataac + 21481 gaagtatatt gaaaaatctc cagactagag aactcacgga tagttcctaa tctggagatt + 21541 tcttatttgc acttttcttg tacaacttta gtccatggta aataagcctc taaaacctct + 21601 ttgtttacga gagtttcctc gtttggaaga cattctagaa gataggatag atatttctcg + 21661 ctatttataa tggattgaaa taagatatga acaaatcgat taggaaagga aaattgattt + 21721 atagaaatgt tttagcagtc gatgcgtact gttatagatt caacgcacta taattgatga + 21781 cgtttagctg tttccaacaa gctcataata atagctcttg ctttagctcc ttcaaaactt + 21841 tgagaaaata accaccctcg cttttttaaa ctgagctcag gctaaaagag tccactggac + 21901 tcttttactc cgtcccataa ccaatgattt aatggcgcgt tcagctagat tattggaaag + 21961 gaccagatgt ccgtctttca aaatagtctt aaaggtttct tcatacttga ggctgtattc + 22021 aattgccctt cctagttttg aacctgctaa aactgactga cggcggcacc aagcaaagaa + 22081 gtcttccatt aggggctgga gatgttcttg acgtttctgt agtcgttcat cagctggcaa + 22141 agcctcccag tctctttcca aggaaaataa ctgatcacaa taggctaaac ctttagctcc + 22201 taaggatgat ttatctgctt gcttgggggt cgcttcaaaa aacttccttc tcacatgtgc + 22261 ccaacatcca acaagtgcag cttcttccag ttgacgataa gcttctagcg gttcgcagtt + 22321 taccaagctt agcgtcgcct tgctcctaaa ccttggactg ctatcgcata ggcagaacta + 22381 gaggactaaa gtcctaagtt actgccgcaa catgtcacaa tgaacatagc cagaataatc + 22441 tcctaggaat tcttgtacta ctaaaccact ccgacgctga tcatggtggt acagcgtgat + 22501 tgcttgattc tcagctttcc 
cagacaaaaa ggtccaatag taagtcagct gactatcact + 22561 ctctagcacc ctataagaag tttcatctgc atgaagtaag ggcttgagtc aatagtctcg + 22621 ttataaaggg gctttaggaa taggagcttt cacaagctta tccagatgat tatcttttac + 22681 tcgttatgga caatgctata tggcataaat caagtacctt aaagattccg actaatattg + 22741 gttttacctt tattcctcca tacacaccag agatgaaccc cattgaacaa gtgtggaaag + 22801 agattcgtaa acgtggattt aagaataaag cctttcgaac tttggaagat gtcatacaag + 22861 gactggagaa ggaggtgata aagtccatcg ttaatcggag atggactaga atgctttttg + 22921 aaagcagatg agtataaaaa gaaagtcctc atttcaatag aaatcacgac tttctgatgg + 22981 atttatagta aaatgaaata agaacaggac aaatcgatca ggacagtcaa atcgatttct + 23041 aacaatgttt tagaagcaga tgtgtactat tctagtttca atctactata tttttggagt + 23101 gatagaaaag cccttcatca gccaatctac ttgttcaggt gcgagagctt tgacatcctt + 23161 ttctgtactg ggccaagtca gtctgccgtt ctcaaagcgt ttatatagta gccaaaatcc + 23221 ttgaccatcc cagtaaaggg ctttaaagcg gtctttacgt ccaccacaaa agagaaaaac + 23281 ttgacctgag aaaggatcta attcaaagtg ggttttaacc agataagcca gtgaatcaat + 23341 gccttgcctc atatccgttt tcccacatac gagatagacc tgccctaggc tagatagatg + 23401 aattgtcata gagcaacacc ttatccaaaa gctgttctat catttcgaga ttgagagatt + 23461 gaaaaaaact tacttcaagc ttgccaatac gaattttaag cagaatatca tttctctttt + 23521 tagaatcaaa aggacgagat tgtggaatct ctacaggaac aataggttgt ggcattaaaa + 23581 tatcctccaa tagttttact ttactaatag tatacaggag gagctccatg aatgatagat + 23641 accttgttat gacgcgctta ctaaacaact aactgatgca cgatttaagc gccttgttgg + 23701 tgttcagcgc acgacttttg aagagatatt agctgtatta aaaacagctt atcaacttaa + 23761 acacgcaaaa ggtggacgaa aacctaaatt aagcctagaa gaccttctta tggccactct + 23821 tcaatatatg cgagaatatc gcacttatga acaaattgcg gctgattttg gtatccacga + 23881 aagcaactta ctccgtcgga gccaatgggt tgaagtaact cttgttcaaa ggtggtgtta + 23941 cgatttcaag aactcctctc agttctgagg acacggtaat gattgatgcg acggaagtac + 24001 aaatcaatcg ccctaaaaaa acaattagcg aatcattctg gtaaaaagaa atttcacgct + 24061 atgaaggctc aagcgattgt cacaagtcaa gggagaattg tttctttgga tatcgctgtg + 24121 aactatagtc atgatatgaa 
gttgttcaaa atgagttgca gaaatatcgg acaagctggt + 24181 aaaatcttgg ccgacagtgg ttatcaaggg ctcatgaaga tatatcctca agcacaaact + 24241 ccacgtaaat ccagcaaact caagccgcta atagctgaag ataaagcctg taaccatgcg + 24301 ctatctaagg agagaagcaa ggttgagaac atctttgcca aagtaaaaac gtttaaaatg + 24361 ttttcaacaa cctatcgaaa tcatcgtaaa cgcttcggat tacgaatgaa tttgattgct + 24421 ggtattatca atcatgaact aggattctag ttttgcagga agtctattga aggatctttt + 24481 gctttagttc cttggtcaag gttgattatt ttcacggagc gcttccgatt gttttcataa + 24541 accatttgcg catagtcagc agaataaatc tttttgaaac gtccctttcc tagacattat + 24601 agaactttca gattcatctg aatttaccaa atcaacacaa aaattctgaa aattctgttg + 24661 acatctttct gaaaagagtc tataatggag agaaagtttt aaaggagaaa atgatgaaaa + 24721 gttcaaaact atttgccctt gcgggcgtga cattattggc ggcgactact ttagctgcat + 24781 gctctggatc aggttcaagc actaaaggtg agaagacatt ctcatacatt tatgagacag + 24841 accctgataa cctcaactat ttgacaactg ctaaggctgc gacagcaaat attaccagta + 24901 acgtggttga tggtttgcta gaaaatgatc gctacgggaa ctttgtgccg tctatggctg + 24961 aggattggtc tgtatccaag gatggattga cttacactta tactatacgt aaggatgcaa + 25021 aatggtatac ttctgaaggt gaagaatacg cggcagtcaa agctcaagac +// + diff --git a/public/res/serotype_genbank/serotype_47A.gb b/public/res/serotype_genbank/serotype_47A.gb new file mode 100644 index 0000000..d032a5e --- /dev/null +++ b/public/res/serotype_genbank/serotype_47A.gb @@ -0,0 +1,782 @@ +LOCUS CR931720 17250 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain L351 (serotype 47a). +ACCESSION CR931720 +VERSION CR931720.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 17250) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. 
+ TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 17250) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..17250 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="L351" + /db_xref="taxon:1313" + gene <1..163 + /gene="dexB" + /locus_tag="SPC47A_0001" + CDS <1..163 + /gene="dexB" + /locus_tag="SPC47A_0001" + /codon_start=2 + /transl_table=11 + /protein_id="CAI34629.1" + /db_xref="GOA:Q4K2R1" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K2R1" + /translation="DRRFLVVANLSNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVP + WDAFCVELL" + gene 322..490 + /gene="aliB" + /locus_tag="SPC47A_0002" + /pseudo + CDS 322..490 + /gene="aliB" + /locus_tag="SPC47A_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(order(491..1024,1026..1352)) + /gene="tnp" + /locus_tag="SPC47A_0003" + /pseudo + CDS complement(join(491..1024,1026..1352)) + /gene="tnp" + /locus_tag="SPC47A_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(join(962..1024,1026..1334)) + /gene="tnp" + /locus_tag="SPC47A_0003" + /note="HMMPfam hit to PF01710, Transposase, score 3.1e-23" + /pseudo + gene 1565..3010 + /gene="wzg" + /locus_tag="SPC47A_0004" + CDS 1565..3010 + 
/gene="wzg" + /locus_tag="SPC47A_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI34632.1" + /db_xref="GOA:Q4JYL1" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4JYL1" + /translation="MSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLLFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVVVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIELEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIIDSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1565..1681 + /gene="wzg" + /locus_tag="SPC47A_0004" + /note="Signal peptide predicted for SPC2029 by SignalP 2.0 + HMM (Signal peptide probability 0.993) with cleavage site + probability 0.538 between residues 39 and 40" + misc_feature 1769..2116 + /gene="wzg" + /locus_tag="SPC47A_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 1.8e-63" + misc_feature 2294..2737 + /gene="wzg" + /locus_tag="SPC47A_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 5.7e-70" + gene 3012..3743 + /gene="wzh" + /locus_tag="SPC47A_0005" + CDS 3012..3743 + /gene="wzh" + /locus_tag="SPC47A_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34633.1" + /db_xref="GOA:Q4JYL0" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4JYL0" + /translation="MIDIHSHIVFDVDDGPKSREESKALLIESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTLDALEKLEKKEIPTLNDS + RYALIEFSMHTSYRQIHTGLSNILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + 
QVNSSHVLKPKLFGERYKFMKKRAQYFLEQDLVHIIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 3015..3623 + /gene="wzh" + /locus_tag="SPC47A_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 2.1e-35" + gene 3749..4444 + /gene="wzd" + /locus_tag="SPC47A_0006" + CDS 3749..4444 + /gene="wzd" + /locus_tag="SPC47A_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34634.1" + /db_xref="GOA:Q4JYK9" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4JYK9" + /translation="MMKEQNMIEIDVFQLFKILWKRKLMILIVALVTGAGAFAYSTFI + VKPEYTSTTRIYVVNRNQGDKLGLTNQDLQAGSYLVKDYREIILSQDSLEKVATNLKL + DMPAKTLASKVQVAVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIELLDTRVKRPEDVEDVLQI + PLLGLVPDLDKMK" + misc_feature 3749..3865 + /gene="wzd" + /locus_tag="SPC47A_0006" + /note="Signal peptide predicted for SPC2031 by SignalP 2.0 + HMM (Signal peptide probability 0.709) with cleavage site + probability 0.459 between residues 39 and 40" + misc_feature 3770..4186 + /gene="wzd" + /locus_tag="SPC47A_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 4.5e-54" + misc_feature 4292..4369 + /gene="wzd" + /locus_tag="SPC47A_0006" + /note="PS00217 Sugar transport proteins signature 2." 
+ gene 4454..5137 + /gene="wze" + /locus_tag="SPC47A_0007" + CDS 4454..5137 + /gene="wze" + /locus_tag="SPC47A_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34635.1" + /db_xref="GOA:Q4JYK8" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4JYK8" + /translation="MPTLEISQAKLDFVKKAEEYYNALCTNLQLSGDDLKVFSITSVK + LGEGKSTTSTNIAWAFARAGYKTLLIDGDIRNSVMLGVFKARDKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRKCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGVVLNRFDTSVDKYGSY + GNYGNYGKE" + gene 5195..5830 + /gene="wcjG" + /locus_tag="SPC47A_0008" + CDS 5195..5830 + /gene="wcjG" + /locus_tag="SPC47A_0008" + /note="member of homology group 50" + /codon_start=1 + /transl_table=11 + /product="putative initial sugar transferase" + /protein_id="CAI34636.1" + /db_xref="GOA:Q4JYK7" + /db_xref="InterPro:IPR003362" + /db_xref="UniProtKB/TrEMBL:Q4JYK7" + /translation="MKQNGIIYIGFKRVMDVFIGLFGTIFIILPSSLIIYIIYKIKGY + KGSIFFTQYRVGLKGKKFKIIKFRSMVENAEEVLAANKALYEKYINNSYKLPPNEDPR + LTNIGDFIRKTSIDEIPQFINLLLGDMSLIGPRPILENELEEYSKEEQQVLLSVRPGI + TGMWQVSGRSEVYYPERCEMELYYPRNQSFLLDVKIFFLTIKKVLSGEGAH" + misc_feature 5228..5827 + /gene="wcjG" + /locus_tag="SPC47A_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 9.9e-58" + gene 6048..6842 + /gene="wciB" + /locus_tag="SPC47A_0009" + CDS 6048..6842 + /gene="wciB" + /locus_tag="SPC47A_0009" + /note="member of homology group 16" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34637.1" + /db_xref="GOA:Q4JYK6" + /db_xref="UniProtKB/TrEMBL:Q4JYK6" + /translation="MSKKYKIIVATHKRFQMPEDKDLYVPVQVGSEGKENLGYQRDNQ + GNHISHLNPYYCELTGLYWAWKNLDCDYLGLVHYRRYFTDKNRPYHDKINMNEVILSA + DQVKEFMSEADVVVPKKRKYYIETLYSHYAHTHDSSHLDTTREIIKEIAPEYLETFDK + VMDCRSGYMFNMFIMSKENVSSYCEWLFPIIDELYRRLDISRYSAFDARLFGRVSERL + 
FNVWLNYQNLRVKEVPFMYMEKVNLFEKGKSFLKAKYFGKKYGQSF" + gene 6951..7781 + /gene="whaI" + /locus_tag="SPC47A_0010" + CDS 6951..7781 + /gene="whaI" + /locus_tag="SPC47A_0010" + /note="member of homology group 149" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="CAI34638.1" + /db_xref="GOA:Q4JYK5" + /db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4JYK5" + /translation="MSDIKIIQDKILSILKEFINICEENNLTYYALGGTLLGAVRHKG + FIPWDDDIDIGMPREDYEKFKKVAPNFLPNNYKFLSEDTANYKKAFSVIRDDSTKIIM + NYSKEELVESLWIDIFPLDGMPAAPFKRKMHEYRYLYRRMMVQLSQFNSLVNQKKENR + PLSEKMIIGFANAVNIEKIISFNWAQKKYLQTLKKYSFKEAFAGNYTGAYKLREIVPS + DYFGEPVSLEFEGTDLSCPRKYKEYLIAIYGENYMQLPPEDKRNQHHYKIISLGDNEE + " + misc_feature 7014..7697 + /gene="whaI" + /locus_tag="SPC47A_0010" + /note="HMMPfam hit to PF04991, LICD Protein Family, score + 3e-53" + gene 7795..8898 + /gene="wcrC" + /locus_tag="SPC47A_0011" + CDS 7795..8898 + /gene="wcrC" + /locus_tag="SPC47A_0011" + /note="member of homology group 24" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34639.1" + /db_xref="GOA:Q4JYK4" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4JYK4" + /translation="MKKIALVKWILNDSGGGERVAISLANELTKKYEVHLIGITTKQS + DLFFKINSQVKYSNFFDHRVRLSKNLLKISKMLKNYFVDNEIDVAFGIGISANIFLSL + AGIGISTKIVLCDHTNSITDNREFSQKIQRYIGTKLADKIITLTQEDCQNYIKKYGIA + EGIIDYIYNWKENIPSDTLSYNKESTKIVTVGRFDYQKGYDYLVQVAKKVLSEKSGWS + WEIYGSGNQDEVDKIRDLINENDLQDRLVIKGLEKNQDVIYGDKGIYVMTSRYEGLPL + VLLEAQQYNLPIVSFRCPTGPSEIVEDGVNGFLIDCYDVYQMSEKLLELMKNDDLRQS + FSEHAKDNMDKFDKNKILNQWIYLIEEIGADNR" + misc_feature 8305..8820 + /gene="wcrC" + /locus_tag="SPC47A_0011" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 6.4e-37" + gene 8900..10000 + /gene="wcyM" + /locus_tag="SPC47A_0012" + CDS 8900..10000 + /gene="wcyM" + /locus_tag="SPC47A_0012" + /note="member of homology group 181" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl 
transferase" + /protein_id="CAI34640.1" + /db_xref="GOA:Q4JYK3" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4JYK3" + /translation="MKKMLICITSLTGGGAEKSLVNFIQQFKYKYDISLLVYSEKNNY + YAQKLEDIKIDYFIKKDTPYLIEKLLNKVVKFFPRTLVYKFILNKTRFKKEKYDIEFA + YIEGKPTKIISGSYNEDSLKLAYIHCDFSKNWYSRKSFRSIRDESVCYQKFHDVLAVS + LGQKESFEKIFPSCKLDIVPNLINQNEIERLSKESNVQKTFPYFCAVGRLAEVKNYSL + LINAFHQFRKKYPEFHLLILGEGELRQTLQNQIEILGEQNYIQLVGFQSNPYSYIRQS + KGLIQSSISESFSYVLAEASILGVPTISTRTQGSELMMKYFDVIEVDHDSAALAKGME + FILQKEIFEKNTDFNEEAINKFEAIFSKIKEK" + misc_feature 9461..9964 + /gene="wcyM" + /locus_tag="SPC47A_0012" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 1.1e-29" + gene 10004..11092 + /gene="wzy" + /locus_tag="SPC47A_0013" + CDS 10004..11092 + /gene="wzy" + /locus_tag="SPC47A_0013" + /note="member of homology group 182" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI34641.1" + /db_xref="UniProtKB/TrEMBL:Q4JYK2" + /translation="MKYDRVYNLIFNILFSVSTVLYMLKFVNIAKSGSLNILILASSV + FLLLLHTVIYGFNKLKLFCLSFVLFLCFLIYFQGLVYLELLNFFLIYSTLRVSNIQFN + KTHWSVFFIFFILVVLFANAGIIKSVFIFRTGGLVRGSLGFVHPNSLGLMAYAITLNT + LYVFNPNRYKIIFYCGLLIFNYFIFAITDSRTSFSISLLIILSCFIFDFRGILYKVVK + NSFIYIVIVVSSLFIILATTYFEVREPFIFLNKLFTNRIYSGNVFVAEYGYNLFGNFI + EGTLPTLAGDVIIDSGYVGLILRLGVLFFIGYLLFMLLRIKQNIFLLKEAILISSAFI + SLMFESYGFSGFIFPVLFVDFVGRRKEL" + gene 11092..11967 + /gene="wcyN" + /locus_tag="SPC47A_0014" + CDS 11092..11967 + /gene="wcyN" + /locus_tag="SPC47A_0014" + /note="member of homology group 204" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34642.1" + /db_xref="GOA:Q4JYK1" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JYK1" + /translation="MSLKVTVFTATYNRMNLLKKLYDSLVKQTSKDFEWIIVDDGSTD + DTSTVVQQFLSENKLDISYIYQENSGKHRAVNEGLDRAKGQLFFIVDSDDALLPKAIA + TVIDRFTTIQDNPKYAGIAFNRGYSETVIVGETFEGEFIDCDNLHRVKYNILGDKAEV + 
YRTEILKEIKFPEIEGENFMSEVVLWNEVARRGHKLRWFNEIIYISDYLEDGLTKNST + TIFKKNPIAHKMMTKELLQIDYPLKNKFGHIYKYHQIQQNSVQETARDLHISYIAVGI + IVAMGKVKDLLKKSK" + misc_feature 11107..11601 + /gene="wcyN" + /locus_tag="SPC47A_0014" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 6.7e-28" + gene 12109..13107 + /gene="whaM" + /locus_tag="SPC47A_0015" + CDS 12109..13107 + /gene="whaM" + /locus_tag="SPC47A_0015" + /note="member of homology group 205" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34643.1" + /db_xref="GOA:Q4JYK0" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JYK0" + /translation="MLKFSVIVPIYNVEKYIEECVYSVLRQTYNNFELILVNDASPDH + SLDIITKIAEKDSRIVIIDKEKNEGVALARSSGLANAKGDYVVYLDGDDQLIPEALKI + LATKIDSQNPDIVIFPKIKERNGVKHVNPYFSKEMLFEEDKKELYKGFLSYSYFVIGC + AAINRELAVQYDIAHELKEIWLGEDLLQSLPLLTHAKRILYIIEGIYIMVYNPDSATR + SKALRKDRYLQAIENHKVIDQYIQLWGEEELQNDFHEHIMNDVISYAFAGCRGASSVR + EGSEYLQTIGSDAGFRRAYSFGYPKKLLHKILAFFLKHESYVVAYYLIKMKERLSS" + misc_feature 12121..12624 + /gene="whaM" + /locus_tag="SPC47A_0015" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 2e-44" + gene 13104..14537 + /gene="wzx" + /locus_tag="SPC47A_0016" + CDS 13104..14537 + /gene="wzx" + /locus_tag="SPC47A_0016" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI34644.1" + /db_xref="GOA:Q4JYJ9" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4JYJ9" + /translation="MKVLKNFLYNFSYKILTMILPFVTVPYVTRVFNPTLMGEYNYTA + SIVAYFSTFGMLGIVIYGSNQIAKVSHKGKKEISHVFSSVYYFQLFSTTLTILVYLAY + IFLFPSQYQQYFIVQIFSLIAIMFDISWLFQGLEDFKRIVMRNTVVKLIGVVSIFTLI + KSQSDIYLYVFIISFSTLISQGIMWLSVKNYVNLVRVGVKEILSNFKPNLSFFLPQIS + ISIYNTLDKIILGSLGSVFDVGIYTQAVNINSVLVNLVVTLSAVLQPRMTNLHAQGKK + EEVRRVMSASMLFNSILTFPVVVGILLVSQEFVHMFLGKEYAETFIALNIVVFSLIPI + AFSEIVGRQTLIPTDNVRYFTISVMSGAVVSILLNFIVIPFGGYKGAALVHVLVEIIV + CALMSYYARKYLDILALLRIAIKPLVTSVVTVIIVHLMFSYIWPIYNSLLSLLLKIIV + 
YSVIYGILLLLTRTITQKEISMIRKTP" + misc_feature 13110..13916 + /gene="wzx" + /locus_tag="SPC47A_0016" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 4.3e-49" + gene 14592..15701 + /gene="glf" + /locus_tag="SPC47A_0017" + CDS 14592..15701 + /gene="glf" + /locus_tag="SPC47A_0017" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI34645.1" + /db_xref="GOA:Q4JYJ8" + /db_xref="InterPro:IPR003953" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JYJ8" + /translation="MYNYLIVGAGLSGAIFAHEATKCGKKVKVIDKRDHIGGNIYCEN + VEGINVHKYGAHIFHTSNKKVWDYVNQFAEFNNYINSPVANYKGSLYNLPFNMNTFYA + MWGTKTPQEVKDKIAEQTAGMKDVEPKNLEEQAIKLIGPDIYEKLIKGYTEKQWGRSA + TELPPFIIKRLPVRLTFDNNYFNDRYQGIPIGGYNVIIENMLKDVEVELGVDFFAHRE + ELEASANKVVFTGMIDQYFDYKHGELEYRSLRFEHEILDEENYQGNAVVNYTEREIPY + TRIIEHKHFEYGMQPKTVITHEYPADWKRGDEPYYPINDEKNNAMFAKYQEETAQNDK + VIFCGRLADYKYYDMHVVIERALEVVEKEFGYDKK" + misc_feature 15027..15629 + /gene="glf" + /locus_tag="SPC47A_0017" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 7.1e-137" + gene 15688..16716 + /gene="wcjE" + /locus_tag="SPC47A_0018" + CDS 15688..16716 + /gene="wcjE" + /locus_tag="SPC47A_0018" + /note="member of homology group 18" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI34646.1" + /db_xref="GOA:Q4JYJ7" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q4JYJ7" + /translation="MTKSRINWIDFGKGFSIFLVLVGHVLLGLYQSEKFPTANNILSL + LIAQVYIFHIPVFFALSGYFFKPVSDLKEFWQYAKKKTIVFGLPYIFYSIIHFGLQKV + AGASVRVSTTISDLLNIYKNPFGVSWYLYILWSILIIYGLLSILVKNRRMLFLISVFA + YCLTLFVQTDIYIIQRTLVWGLCFFLGSVLSEIHFDKINLKKFLFFFVLFDFIYMFAW + FLFYEVGSKKDYVSYINPGLWGIAFIVCVLVAFAIFPKMEKNFPKTFLYFTKYGKDSL + GIYILHAPICSMIRILMLKVGINSVFIHVVVGIVLGWYLSILATYILKKIPFLNIVLL + PQKYIKLK" + gene 16891..>17250 + /gene="aliA" + 
/locus_tag="SPC47A_0019" + CDS 16891..>17250 + /gene="aliA" + /locus_tag="SPC47A_0019" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34647.1" + /db_xref="GOA:Q4JYJ6" + /db_xref="InterPro:IPR000914" + /db_xref="UniProtKB/TrEMBL:Q4JYJ6" + /translation="MMKSSKLLALAGVTLLAATTLAACSGSGSSTKGEKTFSYIYETD + PDNLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKD + AKWYTSEGEEYAAVKAQD" + misc_feature 16891..16977 + /gene="aliA" + /locus_tag="SPC47A_0019" + /note="Signal peptide predicted for SPC2044 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.270 between residues 29 and 30" + misc_feature 17137..17205 + /gene="aliA" + /locus_tag="SPC47A_0019" + /note="PS01040 Bacterial extracellular solute-binding + proteins, family 5 signature." +ORIGIN + 1 cgaccgtcgc ttcctagttg tggctaactt gtccaatgaa gagcaagact tgacagtaga + 61 aggaaaagtc aaatctgtct tgattgaaaa caccctagct caagaagtct ttgaaaaaca + 121 aatcttagtt ccatgggatg ctttctgtgt ggaattacta taaatatttt ttgcagaaaa + 181 atttaaaatt gaaatcgtat aaaaacaagg gaggactgta taaaagacag aaatcctttg + 241 ttttttataa ccaaggttta taaactttca ttatcgaaat tcaattaact ttacaaattc + 301 ccactattaa ggagaaagaa aatgaacata aagaagcgtg tccttagtgc aggtctgact + 361 tttgcatctg ctttgctttt agctgcttgc gaccaatcag gttcagatac aaaaacttac + 421 tcatcaacct ttagtggaaa tccaactaca tttaattacc tgttagacta ttacgctgat + 481 aatatagtca attgaaacaa gagcaggaca aaagagcctc gtaaaaggta ttgcaacttg + 541 gtaatacctt ttacgaggct ttttgatatg agcccatgtt ttctcaatag gattgtactc + 601 aggtgagtag ggaggaagaa ggtaaaagtt tatgcctaaa ctcttcacac aagagttcta + 661 gcttccccat tctatggaat cttgcattat ccataataat aaccgatggt gtggttaatg + 721 ttggtaagag aaacttctga aaccaagctt caaaaaagtc gctcgtcatc gtctcttcgt + 781 aagtcattgg agcgattaac tcaccatttg ttagacctgc aaccaaagaa atcctctgat + 841 atcttcttcc agatactttg cctcttatta actgaccttt taatgagcga ccatattctc + 901 gataaaaata agtatcgaat cctgtttcgt caatctaaac aggtgttagg tgctttaaac + 961 tattaaaatt cttaagaaat aaggctactt tttctgggtc 
ttgttcatag taggtgtggt + 1021 tctttttttc gagtgtagcc catagctttg agcgcatagt ggatggtagt tggatgacag + 1081 ccaaattcag aagctatttc agtcaaataa gcatctggat tgtcagtaag atagttttta + 1141 agtctatctc tatcaacttt tcttggtttt gttcctttta cttggtggtt tagctctcct + 1201 gttttctctt ttagctttaa ccagccataa atggtattac gtgagatttg gaaaacgtgt + 1261 gatgcttctg ttatactacc tgttcgctca caataagaga gaactttttt acgaaaatct + 1321 attgaatatg ccataaaaag attataccac attgtgtact atattagatt gaaactagaa + 1381 tagtacacat ctgcttctaa aacattgtta gaaatcgatt tgactgtcct tatttcattt + 1441 tattatattt ttggttcgcg ggaagtctac taagatactt aaagatgcag atagtaaaaa + 1501 aaatgtagac attaccgtaa aaaagtgata taatcgtatg atgttcaagg tataggtgtt + 1561 aatcatgagt agacgtttta aaaaatcagg ttcacagaaa gtgaagcgaa gtgttaatat + 1621 cgttttgctg actatttatt tattgttagt ttgtttttta ttgttcttaa tctttaagta + 1681 caatatcctt gcttttagat atcttaacct agtggtaact gcgttagtcc tactagttgc + 1741 cttggtaggg ctactcttga ttatctataa aaaagctgaa aagtttacta tttttctgtt + 1801 gctgttctct atccttgtca gctctgtgtc gctctttgca gtacagcagt ttgttggact + 1861 gaccaatcgt ttaaatgcga cttctaatta ctcagaatat tcaatcagtg tcgttgtttt + 1921 agcagatagt gatatcgaaa atgttacgca actgacgagt gtgacagcac cgactgggac + 1981 tgataatgaa aatattcaaa aactactagc tgatattaag tcaagtcaga ataccgattt + 2041 gacggtcaac cagagttcgt cttacttggc agcttacaag agtttgattg caggggagac + 2101 taaggccatt gtcctaaata gtgtctttga aaacatcatc gagttagagt atccagacta + 2161 cgcatcgaag ataaaaaaga tttataccaa gggattcact aaaaaagtag aagctcctaa + 2221 gacgtctaag aatcagtctt tcaatatcta tgttagtgga attgacacct atggtcctat + 2281 tagttcggtg tcgcgatcag atgtcaatat cctgatgact gtcaatcgag ataccaagaa + 2341 aatcctcttg accacaacac cacgtgatgc ctatgtacca atcgcagatg gtggaaataa + 2401 tcaaaaagat aaattaaccc atgcgggcat ttatggagtt gattcgtcca ttcacacctt + 2461 agaaaatctc tatggagtgg atatcaatta ctatgtgcga ttgaacttca cttctttctt + 2521 gaaaatgatt gacttattgg gaggggtaga tgttcataat gatcaagagt tttcagctct + 2581 acatgggaag ttccatttcc cagtagggaa tgtccatcta gactctgagc aagctctcgg + 2641 
ttttgtacgt gaacgctact cactagccga tggagaccgt gaccgtggtc gcaaccaaca + 2701 aaaggtgatt gtggctatcc ttcaaaaatt aacgtcaacc gaagcactga aaaattatag + 2761 tacgatcatt gatagcttgc aagattctat ccaaacaaat atgccacttg agactatgat + 2821 aaatttggtc aatgctcagt tagaaagtgg agggaattat aaagtaaatt ctcaagattt + 2881 aaaaggtaca ggtcggacgg atcttccttc ttatgcaatg ccagacagta acctctatgt + 2941 gatggaaata gatgatagta gtttagctgt agttaaagca gctatacagg atgtgatgga + 3001 gggtagatga aatgatagac atccattcgc atatcgtttt tgatgtagat gacggtccca + 3061 agtcaagaga ggaaagcaag gctctcttga tagaatccta caggcagggg gtgcgaacca + 3121 ttgtctctac ctctcaccgt cgcaagggca tgtttgaaac tccggaagag aagatagcag + 3181 aaaactttct tcaggttcgg gaaattgcaa aagaagtagc agatgattta gtcattgctt + 3241 atggcgcaga gatatactat actctggatg ctctagaaaa gctagaaaaa aaagaaattc + 3301 ctacccttaa tgatagtcgt tatgccttga ttgagtttag catgcatact tcctatcgtc + 3361 agattcatac gggattgagc aatattttga tgttgggaat cacgccagta attgctcata + 3421 ttgaacgtta tgatgcttta gagaataacg aaaaacgtgt tcgtgaactg attgatatgg + 3481 ggtgttacac gcaagtaaat agttcacatg tcctcaaacc caaacttttt ggcgaacgtt + 3541 ataaattcat gaaaaaaaga gctcagtatt ttttagagca ggatttggtt catatcattg + 3601 caagtgatat gcacaatcta gacggtagac ctcctcatat ggcagaagca tatgaccttg + 3661 ttacccaaaa atacggagaa gcgaaggctc aggaactttt tatagacaat cctcgaaaaa + 3721 ttgtaatgga tcaactaatt taggagaaat gatgaaagaa caaaacatga tagaaatcga + 3781 tgtatttcaa ttatttaaaa tcttgtggaa acgcaagcta atgattttaa tagtggcact + 3841 tgtgacaggt gcgggggctt ttgcatatag cacttttatt gttaagccag aatatacgag + 3901 taccacgaga atttacgtag tgaatcgcaa tcaaggagac aagctagggt tgacaaatca + 3961 ggatttgcag gcaggatctt atctggtaaa agactaccgc gagattatcc tttcgcagga + 4021 ttcattggaa aaagtagcga caaatttgaa gttggatatg ccagcaaaaa cgttagccag + 4081 caaagttcaa gtggctgtac cagctgacac tcgtatcgtc tcaatctctg tcaaggataa + 4141 acagccagag gaagccagtc gtatcgctaa ttctctacga gaagttgctg cagaaaagat + 4201 cgtcgctgta acgcgagtat ctgatgtaac gacacttgaa gaagcgcgac cagctacgac + 4261 tccctcttct ccaaatgttc 
gacgcaattc cttgtttggt tttcttggag gagcagtcgt + 4321 aacagtaatt gctgttcttt tgattgagtt gctcgacacc cgtgtgaaac gtcctgaaga + 4381 tgttgaagat gtactgcaaa ttccactttt agggctcgtt ccagatttgg acaaaatgaa + 4441 ataggaggaa gttatgccaa cgttagaaat ctcacaggcg aaattggatt ttgtaaaaaa + 4501 ggcagaggaa tattataacg ctttgtgtac gaacctacag ttaagtggag atgatttgaa + 4561 agtattttct atcacttctg tgaaactagg agaaggaaaa tcaacgactt ccaccaatat + 4621 cgcttgggct tttgcgcgtg caggttacaa aacgctgctg attgatggag atattcgcaa + 4681 ttctgttatg ttaggtgtct ttaaagcaag ggataagatt acaggcctga cagaattttt + 4741 atcaggaact acagacctat cacaagggct ttgtgatacc aatatcgaaa atctctttgt + 4801 aattcaggct ggctctgtgt caccgaatcc gacagctctt cttcaaagta agaatttcag + 4861 tacaatgctt gaaacattgc gtaaatattt tgactacatc attgtagata ctgctcctgt + 4921 cggtgttgtg attgatgcgg ctattattac gcgaaaatgc gatgcttcta ttttagtgac + 4981 ggaggcaggt gaaataaatc gacgggatat tcaaaaagca aaagaacagt tggaacacac + 5041 agggaagccg tttttgggag ttgtgttgaa tagattcgat acttcagtag acaaatacgg + 5101 ttcttatggg aactatggga attatggaaa ggaataaata gtcttgtagt accaagatta + 5161 tttgagataa ctaccatggg agggggagtt taaggtgaaa cagaatggta tcatctatat + 5221 tggctttaaa agggttatgg atgtttttat tggcttattt ggaacaatat tcataatctt + 5281 acctagttct ttaataattt atattatcta taaaataaaa ggttacaaag gaagtatatt + 5341 cttcacacaa tatagagtgg ggctaaaggg gaaaaaattt aaaattatta aatttagatc + 5401 aatggttgaa aatgctgaag aagttttggc cgcaaataaa gcactctatg aaaaatatat + 5461 aaataacagt tataaattac ctccaaatga ggatcctcgt cttaccaata tcggagattt + 5521 tatcaggaaa acaagcattg atgaaattcc tcaatttata aacttattgc taggtgatat + 5581 gagtcttatt ggacctagac cgattttgga gaatgagtta gaggagtatt ctaaggaaga + 5641 acagcaagtt ttgttatctg tacggccagg tattacaggg atgtggcaag tttctggtag + 5701 gagtgaggta tattatcctg aacgctgtga aatggaactg tactatcctc ggaatcaatc + 5761 ctttttgttg gatgtcaaaa tcttcttttt gacaataaaa aaagttctgt ctggagaagg + 5821 ggctcattga tgtatgagct aaatcatcta gcaaaaaata gatagaaaga tgaagtggaa + 5881 tacgaataac gtttcttggg tattcgtatt cattttttca 
agtaaaggaa gcattatgaa + 5941 taagtggatt taatctagta ttttttgctt gaaaaaatga atgggaattc aatctaaaga + 6001 attgtccagt gaggcaagat tttaggaatt ggagttagga tgtataaatg tcaaaaaagt + 6061 ataaaattat agtagcgact cataaaagat ttcaaatgcc agaagataag gacttatatg + 6121 ttcctgttca ggttggcagt gaaggaaagg aaaatttagg ttaccaacga gataatcaag + 6181 gtaatcatat ctcacacctc aatccgtatt attgtgaatt gacaggatta tactgggctt + 6241 ggaaaaattt agactgtgat tacctaggat tagttcatta ccgacgttat tttacagata + 6301 agaaccgacc ttatcatgat aagattaaca tgaatgaagt tatcctatcg gcagatcaag + 6361 ttaaggaatt tatgtctgaa gcggacgtcg ttgttcctaa aaagagaaaa tattatatag + 6421 agactctcta ttcacattat gcacatactc atgattctag tcatttagat acaacgcgtg + 6481 aaatcataaa agaaatcgca ccagagtatc tagaaacatt tgataaggtg atggactgtc + 6541 gtagtggcta tatgttcaat atgtttatca tgtccaaaga aaatgtatca tcttattgcg + 6601 agtggttatt ccctatcatt gatgagttgt acagaagatt ggatatatca aggtactctg + 6661 cttttgatgc aagactattt ggacgtgtta gtgagcgtct ctttaatgtt tggttaaact + 6721 accaaaatct acgtgttaaa gaagttccgt ttatgtatat ggaaaaagtt aatttatttg + 6781 agaagggcaa atccttcttg aaagccaagt atttcggaaa aaaatatgga cagagttttt + 6841 agagtttact aagtaacttt caagttttaa actaatatta aaattattta atttaactat + 6901 cattgggcgt tgtgaaaaga agaactcacc cttagtttag gaggacaagt atgtcagata + 6961 taaaaattat tcaagataaa atcctgtcta tcttgaaaga atttattaat atttgtgaag + 7021 aaaataattt gacttactat gctctagggg gaacattgct tggagcagta cgtcacaaag + 7081 gatttatccc ttgggatgat gatattgata ttggcatgcc aagagaagat tacgaaaagt + 7141 ttaagaaagt agctcccaat tttctaccaa ataattataa atttttaagt gaagataccg + 7201 ctaattataa aaaagctttc tctgtaattc gggatgattc aacgaaaatc ataatgaatt + 7261 atagtaaaga ggaattggta gagagtttgt ggatagatat ttttccactt gatggaatgc + 7321 ctgctgcccc ctttaagaga aaaatgcatg agtatagata cttatataga cggatgatgg + 7381 ttcaactttc tcagtttaat agtttagtaa atcagaagaa agagaatcgt ccactatctg + 7441 aaaaaatgat tattggattt gcgaacgctg ttaatattga aaagattatt tcttttaact + 7501 gggcacagaa aaaatattta caaacgctaa aaaaatattc gtttaaggaa gcttttgcag + 7561 
gaaactatac aggagcatat aaactaagag aaatcgtacc ttcagattat tttggagagc + 7621 cagtatcatt agagtttgaa gggactgatt tgagttgtcc tcgtaagtat aaagaatatt + 7681 tgatagcaat ttatggagag aattatatgc agttacctcc agaagataag cgaaaccaac + 7741 atcactataa gataatatct cttggtgata atgaagaatg agagtagttg aaacatgaaa + 7801 aaaatcgctt tagtgaaatg gattttgaat gattctggcg gtggtgagcg agttgctata + 7861 tccttggcaa acgaacttac aaaaaagtat gaagtccatt tgattggaat tacaacaaag + 7921 caatcggatt tattctttaa aatcaattct caagtaaaat actccaattt ttttgaccat + 7981 cgagtacgct tgtctaagaa tcttctaaaa atttcaaaaa tgttaaaaaa ttattttgta + 8041 gataatgaga tagatgttgc ctttggaata ggaatatcag caaatatatt tttatcattg + 8101 gcaggaatag gtatatccac caaaatagtt ttgtgcgacc atacgaattc aattacagac + 8161 aatcgagagt tttctcagaa aattcaaaga tatattggaa caaaacttgc agacaagatt + 8221 attaccctta ctcaggaaga ttgtcaaaac tatataaaaa aatatggaat tgctgaagga + 8281 attatcgatt atatctataa ttggaaagaa aatatacctt cagacacgtt aagttataat + 8341 aaagaatcaa cgaaaattgt tacagtgggt cgtttcgatt atcaaaaggg ctatgattat + 8401 cttgttcaag ttgcgaaaaa ggttttgtct gagaagtcag gctggagttg ggaaatctat + 8461 ggatccggca atcaagatga agtagacaaa atcagagatt taatcaacga aaatgatttg + 8521 caagacaggt tagtcataaa aggactcgaa aaaaatcagg atgtgattta tggagataaa + 8581 ggaatttatg tcatgacttc tcgctatgag ggcttacctt tagtcctatt agaagcacaa + 8641 caatacaatc ttcctattgt tagcttcaga tgtccaacgg gacctagtga gattgttgaa + 8701 gatggagtca atggattttt gattgattgc tatgacgtgt atcagatgag tgagaaattg + 8761 cttgaattga tgaaaaatga tgatttgcga caatctttct cagaacatgc caaagacaat + 8821 atggataaat ttgataaaaa taaaattctt aatcagtgga tatatttaat agaagaaata + 8881 ggagcggata atcgttaaaa tgaaaaaaat gttaatttgc ataactagct taacaggagg + 8941 cggagctgaa aaatcactgg taaattttat acagcaattt aagtataagt atgatatctc + 9001 tttactcgta tatagcgaaa agaataatta ttatgcacaa aaacttgaag atattaaaat + 9061 agattatttc ataaaaaaag acacaccata tcttattgaa aaacttttga ataaggtagt + 9121 gaaatttttt cctaggacat tggtatataa atttattctt aataaaacta ggtttaaaaa + 9181 agaaaaatac gacatagaat 
ttgcgtatat agaaggaaag ccaactaaaa ttatttcagg + 9241 ctcatacaat gaagatagtc taaaattagc gtatattcat tgtgattttt ctaagaattg + 9301 gtactctcgt aaatcgttta gaagtattag agatgagagt gtgtgctatc aaaaatttca + 9361 tgatgtttta gctgtttctt taggtcagaa agaaagtttt gaaaaaatat ttccatcatg + 9421 taaattggat atagttccaa atttaatcaa tcaaaatgaa atagaaagat taagcaaaga + 9481 atcaaatgtg caaaagacat ttccttattt ttgtgcagta ggaagattgg cagaagtgaa + 9541 aaattattca ttattaataa atgcatttca ccaatttaga aaaaaatatc ctgaatttca + 9601 tttattaatt ttgggtgaag gagagctacg gcaaacactg caaaatcaga ttgagattct + 9661 aggtgagcaa aattacattc aattagtcgg ttttcaaagt aacccatact cctatataag + 9721 acaaagcaaa gggctgattc aaagctcaat ttcagaatca tttagttatg ttctagctga + 9781 agcgtcaata ttgggagttc ccacgatttc tactagaact caagggtcag aattaatgat + 9841 gaaatatttt gatgttatag aagttgatca tgatagtgcg gcactggcta agggaatgga + 9901 atttattctc cagaaggaaa tttttgagaa aaatacggat ttcaatgagg aagcaataaa + 9961 taagtttgaa gcaatatttt caaaaataaa ggagaaataa tttgtgaaat atgatagagt + 10021 atataatctg atttttaata tattgttctc cgtgtcaaca gttttgtata tgctgaaatt + 10081 tgtaaatatt gcgaaaagtg gtagtttaaa tatcttaatt ttagctagtt cagtattttt + 10141 attgctactt cacacagtga tttacggctt taataaattg aagctatttt gtctatcctt + 10201 cgtattattt ttatgttttc taatttattt tcaaggatta gtttatctgg aattgcttaa + 10261 tttttttctg atttactcaa ctctaagagt gagtaatatt caatttaaca agactcattg + 10321 gtcagtgttt tttatttttt ttatattagt agttttattt gctaatgcag gaattattaa + 10381 aagtgtattc atttttcgaa ctggagggtt agtaagagga tcattagggt ttgtccatcc + 10441 gaattcacta ggtctcatgg cttatgcaat tacattaaat acattgtacg tctttaaccc + 10501 caatagatac aaaattattt tctactgcgg tcttcttata tttaattatt ttatatttgc + 10561 cataacggac tctagaactt ctttctcaat aagtttattg attattttaa gttgttttat + 10621 ttttgatttt agaggtattc tatacaaggt tgttaaaaat tcatttattt atatagtaat + 10681 tgtagtaagt tcgctattta ttattttagc aactacctat tttgaagtga gggaaccttt + 10741 catttttttg aataaacttt ttaccaatag aatttacagt ggtaatgttt ttgtagctga + 10801 atatggatat aatctttttg ggaattttat 
agagggaaca ctacctactt tagcaggaga + 10861 tgtaattatt gatagtggtt atgtgggttt aattcttcgt ttaggtgtat tattttttat + 10921 aggctacttg ttgtttatgt tgttaagaat aaaacaaaat atttttttat tgaaggaagc + 10981 aatcttgatt agcagtgcct ttatttcatt aatgtttgaa tcctatgggt tttctggttt + 11041 tattttccca gttttatttg tggattttgt gggtagaaga aaggaattat aatgagttta + 11101 aaagttacag tatttacagc tacatataat aggatgaact tgttaaaaaa attgtatgac + 11161 tctctagtga agcaaactag taaagatttt gagtggataa ttgtagatga tggttcaacg + 11221 gatgatacct caacggtagt tcagcaattt ttatcagaaa ataaattgga tataagttat + 11281 atttatcaag aaaatagtgg gaagcataga gcggttaatg agggattgga cagagctaag + 11341 ggacagttgt tttttatagt cgactcagat gatgctctcc ttccgaaagc tatagccacc + 11401 gttattgata gattcacaac tattcaagat aatcccaaat atgcaggcat cgcttttaat + 11461 cgaggatatt cagagacagt aatcgttggg gaaacgtttg aaggggaatt tatagattgt + 11521 gataatttgc atcgagtaaa atataatatt cttggtgata aagctgaagt ctacagaaca + 11581 gaaattttaa aagaaataaa attcccagaa attgagggag aaaattttat gagtgaagta + 11641 gttttgtgga atgaagtagc aaggagagga cacaaattac gatggttcaa tgagattatt + 11701 tacatatctg attacctaga ggacggcttg acgaagaata gtacgactat ttttaaaaaa + 11761 aatccaattg ctcataaaat gatgacaaaa gagttattac agattgatta tcctttaaaa + 11821 aacaaatttg gacatattta taagtatcat cagatccaac agaattctgt tcaagagaca + 11881 gctagagatt tacatatttc atatatagca gtcggtatta ttgtagcaat gggaaaagta + 11941 aaagatttat taaaaaagag taaataaatc tatgttttat atgatgaaaa tgtctatgaa + 12001 attttcgtaa gaatgatctt catgaagttt tttagattta aggttgaact ttcagtttga + 12061 ttatccagta tatctatgaa acttaaacta ataaaatgga ggaagtaaat gctaaagttt + 12121 tctgtcattg tacctattta caatgttgaa aagtatattg aggaatgtgt atattctgta + 12181 ttgagacaga catataataa ttttgaactt attttggtga atgatgcctc tccagatcat + 12241 tcgcttgata ttattacaaa aatagctgaa aaggattcac gcattgtaat tatagacaaa + 12301 gagaagaatg aaggtgtggc gttagcaaga tcatctggct tagcaaatgc taaaggagat + 12361 tacgttgttt atttggatgg agatgatcaa ctaattccag aagcgttaaa aattttagct + 12421 actaaaattg attcacaaaa tccagacatt 
gtaatttttc ctaaaattaa ggagagaaac + 12481 ggtgtgaaac atgtgaatcc atacttctca aaggaaatgc tctttgagga agataaaaaa + 12541 gaactatata aaggcttttt aagttatagt tactttgtaa ttggatgcgc tgctattaat + 12601 agagagttag ctgtgcaata tgacattgct catgaattga aagagatttg gcttggtgag + 12661 gatttattgc aaagccttcc tttgttgaca catgcaaaaa ggattttata cattatagag + 12721 ggaatctata taatggttta caatcctgat tcagcaacaa ggagtaaagc attaagaaaa + 12781 gatagatatc tccaagcaat tgaaaatcat aaggtaattg accaatatat acaactatgg + 12841 ggtgaggaag aactacaaaa tgattttcat gaacatatta tgaatgatgt tatttcttat + 12901 gcattcgcag ggtgtagggg tgcaagctct gttagagagg gcagtgagta tcttcaaaca + 12961 attggtagtg atgcaggatt ccgcagagcc tactcattcg gatatcctaa aaaattgtta + 13021 cataaaatac tagcgttttt tctaaagcat gagtcatatg tcgttgcgta ttatttaatt + 13081 aaaatgaaag aaaggttatc atcatgaaag ttttgaaaaa ttttttatat aatttttcat + 13141 ataaaatctt aacgatgatt cttccttttg taacggttcc ctatgtaact agagttttta + 13201 atccaacatt gatgggtgaa tataattata ccgcctctat agtcgcctat ttttcaacat + 13261 ttggtatgtt aggaattgtt atttatggaa gtaaccaaat tgcaaaagta agtcataagg + 13321 gaaaaaaaga aatatctcat gttttttctt cagtctatta ttttcagtta ttttcaacaa + 13381 ctctaacgat actggtatat ctagcctata tttttctttt tccaagtcaa taccaacaat + 13441 attttatagt acaaatcttt tctctcattg caataatgtt tgatattagt tggctatttc + 13501 aaggattaga agattttaag cgaattgtta tgcgaaatac agtagtcaag ctaattggtg + 13561 tcgtttctat atttacattg ataaaatccc aatcagatat ctatttgtat gtatttatta + 13621 ttagtttttc tacgttaatt tcgcaaggca ttatgtggtt aagtgtaaag aactatgtca + 13681 atttggttcg agttggagta aaagagatac tatcaaactt taaacctaac ttatctttct + 13741 ttcttcccca aatttcaatt tcgatttaca atacgctaga taaaataatt ttgggctctt + 13801 taggtagtgt atttgatgtt ggaatttata cccaagctgt gaatataaac tctgttttag + 13861 ttaatttagt agtgactctc agtgctgtac ttcaacctag aatgaccaat ttgcatgctc + 13921 aaggtaaaaa ggaggaagtt cgcagggtaa tgtccgcatc aatgttattt aatagcatac + 13981 taacctttcc ggtagtagtt ggaatattac ttgttagcca agaatttgtt catatgtttt + 14041 tgggaaaaga gtatgctgaa acatttattg 
ctctcaacat tgttgttttc tctctaattc + 14101 cgattgcttt ttcagagatt gtggggcgtc aaactctgat tccgacggat aatgttcgat + 14161 actttacaat ttcagtaatg tcaggtgctg tagttagcat tttattaaat tttattgtca + 14221 tacctttcgg aggatataaa ggagcggcgc ttgtacatgt actcgttgag attattgtat + 14281 gcgcattaat gtcatattat gctcgtaaat atttagatat tttagcttta ctcagaatag + 14341 caattaaacc actggttacg agtgtagtga ctgttattat agtgcatttg atgttttctt + 14401 atatttggcc tatttataat agcttgctta gtttattatt aaagataata gtttattcag + 14461 taatatatgg tattctatta ttactgacaa gaacaataac tcagaaagag atttctatga + 14521 taagaaaaac cccctagttt ttctatgtaa tggtgagaat cattaaaaag taagggagat + 14581 ttaaaattaa aatgtacaac tatctaatcg tcggtgcggg tttgtctggt gcaatctttg + 14641 cgcacgaagc tacaaaatgt ggaaaaaaag taaaagtgat tgataaacgc gatcacattg + 14701 gagggaacat atactgtgag aatgtagaag gtatcaatgt tcataaatat ggtgcccata + 14761 tcttccatac ttctaataaa aaagtctggg actacgtcaa tcaatttgct gagtttaaca + 14821 actatatcaa ctcacctgtc gcaaactata agggaagtct ttataacctt cctttcaata + 14881 tgaatacctt ctatgctatg tggggcacaa aaactccaca agaagtgaag gataagattg + 14941 ctgagcagac agctggtatg aaggatgttg agccgaaaaa tctggaagaa caagctatca + 15001 agttgattgg tccggatatc tatgaaaagt tgatcaaggg ttatacagaa aagcaatggg + 15061 gacgctcagc gacagaactt cctccattta tcataaaacg ccttccagtt cgtttaacct + 15121 ttgataataa ctattttaat gaccgttacc aagggattcc tattggtggt tacaatgtca + 15181 tcatcgaaaa tatgctgaaa gatgtagaag ttgaacttgg agtagacttt tttgctcatc + 15241 gtgaagagtt ggaagcatct gctaacaaag ttgtcttcac aggaatgatc gaccaatatt + 15301 ttgactacaa gcacggagag ttagaatacc gtagccttcg ttttgagcat gagattttag + 15361 acgaggaaaa ttatcaaggg aatgctgtag tgaactatac agagcgtgag atcccttata + 15421 ctcgtatcat cgaacacaaa cattttgaat atggaatgca gccaaagaca gttatcacgc + 15481 atgaatatcc agctgactgg aagcgtgggg acgagcccta ctatcctatt aacgatgaga + 15541 aaaataatgc tatgtttgct aagtaccaag aggaaacagc gcagaatgat aaagttatct + 15601 tttgtgggcg tttagcagat tataaatatt acgatatgca tgtggtgatt gaacgggcgc + 15661 ttgaggttgt ggagaaagag tttggatatg 
acaaaaagta gaatcaattg gatagatttt + 15721 ggaaaaggct tttccatatt tttagtatta gtaggacatg tgttgcttgg actgtatcaa + 15781 tcggaaaaat ttcccacagc aaacaatata ctatcattgt tgatagcaca agtctacata + 15841 tttcatatac cagtattttt tgccttatca ggatactttt tcaaacctgt gtcggatttg + 15901 aaggagttct ggcaatatgc taaaaagaag acaattgttt ttggtctgcc atatattttc + 15961 tattcgatca ttcactttgg tcttcaaaaa gttgcagggg catctgttcg tgtttctaca + 16021 accatatctg atttgctaaa tatctataaa aatccttttg gggtttcgtg gtatttatat + 16081 atactctggt cgattttgat aatctatgga ttattgtcta ttttagtcaa aaatcgtaga + 16141 atgttatttt tgataagtgt tttcgcttat tgtttaaccc tatttgttca aacagatatt + 16201 tatattattc aaagaacgct agtttggggg ctttgtttct ttcttggcag tgtattgagt + 16261 gaaattcact ttgataaaat taatttgaaa aaatttcttt ttttctttgt gttatttgat + 16321 tttatttata tgttcgcttg gttcttgttt tatgaagtag ggtctaagaa ggattatgta + 16381 agctatatta acccaggttt gtgggggatt gcttttattg tctgtgtatt agttgctttt + 16441 gcgatttttc ctaaaatgga gaaaaatttt cctaaaactt tcctatattt cactaaatac + 16501 gggaaagata gtttagggat ctatattctt catgcaccaa tttgtagcat gattcggatt + 16561 ctaatgttga aagtgggaat aaactcagtt tttattcacg ttgttgttgg gattgtgcta + 16621 ggctggtatt tatccatact agcaacttat atattgaaaa aaattccatt tttgaatatt + 16681 gttttattac cacaaaagta tattaaatta aaataaatta ttttagattt ataatgtggc + 16741 tctttgtcaa ctaacatctg gagaggacaa tcactgtctt ctcttttttt gtcttttcag + 16801 aatataccaa attaacacaa aaattctgaa aattctgttg acaactttct gaaaagagtc + 16861 tataatggag agaaagtttt aaaggagaaa atgatgaaaa gttcaaaact acttgccctt + 16921 gcgggcgtga cattattggc ggcgactact ttagctgcat gctctggatc aggttcaagc + 16981 actaaaggtg agaagacatt ctcatacatt tatgagacag accctgataa cctcaactat + 17041 ttgacaactg ctaaggctgc gacagcaaat attaccagta acgtggttga tggtttgcta + 17101 gaaaatgatc gctacgggaa ctttgtgccg tctatggctg aggattggtc tgtatccaag + 17161 gatggattga cttacactta tactatccgt aaggatgcaa aatggtatac ttctgaaggt + 17221 gaagaatacg cggcagtcaa agctcaagac +// + diff --git a/public/res/serotype_genbank/serotype_47F.gb 
b/public/res/serotype_genbank/serotype_47F.gb new file mode 100644 index 0000000..d9c5165 --- /dev/null +++ b/public/res/serotype_genbank/serotype_47F.gb @@ -0,0 +1,733 @@ +LOCUS CR931721 16064 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain Eddy nr. 52 (serotype 47f). +ACCESSION CR931721 +VERSION CR931721.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 16064) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 16064) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..16064 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="Eddy nr. 
52" + /db_xref="taxon:1313" + gene <1..163 + /gene="dexB" + /locus_tag="SPC47F_0001" + CDS <1..163 + /gene="dexB" + /locus_tag="SPC47F_0001" + /codon_start=2 + /transl_table=11 + /protein_id="CAI34648.1" + /db_xref="GOA:Q4JZD8" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4JZD8" + /translation="DRRFLVVANLSNEEQDLTVEGKVKSVLIENTAAKEVLEKQVLAP + WDAFCVELL" + gene 323..491 + /gene="aliB" + /locus_tag="SPC47F_0002" + /pseudo + CDS 323..491 + /gene="aliB" + /locus_tag="SPC47F_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(order(512..1024,1026..1352)) + /gene="tnp" + /locus_tag="SPC47F_0003" + /pseudo + CDS complement(join(512..1024,1026..1352)) + /gene="tnp" + /locus_tag="SPC47F_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(join(962..1024,1026..1334)) + /gene="tnp" + /locus_tag="SPC47F_0003" + /note="HMMPfam hit to PF01710, Transposase, score 3.1e-23" + /pseudo + gene 1568..3013 + /gene="wzg" + /locus_tag="SPC47F_0004" + CDS 1568..3013 + /gene="wzg" + /locus_tag="SPC47F_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI34651.1" + /db_xref="GOA:Q4JYJ4" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4JYJ4" + /translation="MSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLLFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYEVDINYYVRLNFTSFLKLIDLLGGIDVYNDQ + EFTAHTNGKYYPAGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIINSLQDSIQTNMPLETMIDLVNTQLESGGKYKVNSQDLKGTGRMDLPSY + 
AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1568..1684 + /gene="wzg" + /locus_tag="SPC47F_0004" + /note="Signal peptide predicted for SPC2048 by SignalP 2.0 + HMM (Signal peptide probability 0.993) with cleavage site + probability 0.538 between residues 39 and 40" + misc_feature 1772..2119 + /gene="wzg" + /locus_tag="SPC47F_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 8.6e-63" + misc_feature 2297..2740 + /gene="wzg" + /locus_tag="SPC47F_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 8.6e-68" + gene 3015..3746 + /gene="wzh" + /locus_tag="SPC47F_0005" + CDS 3015..3746 + /gene="wzh" + /locus_tag="SPC47F_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34652.1" + /db_xref="GOA:Q4JYJ3" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4JYJ3" + /translation="MIDIHSHIVFDVDDGPKSREESKALLVESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNIPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRVQYFLERDLVHVVASDMHNLDSRPPYMQQAYDIIA + KKYGAKKAKEFFVDNPRKIIMDQLI" + misc_feature 3018..3626 + /gene="wzh" + /locus_tag="SPC47F_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 4.7e-36" + gene 3755..4447 + /gene="wzd" + /locus_tag="SPC47F_0006" + CDS 3755..4447 + /gene="wzd" + /locus_tag="SPC47F_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34653.1" + /db_xref="GOA:Q4JZA0" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4JZA0" + /translation="MKEQNTLEIDVLQLFRALWKRKLVILLVAIITSSVAFAYSTFVI + KPEFTSTTRIYVVNRNQEEKSGLTNQDLQAGSYLVKDYREIILSQDVLEEVISDLKLD + LTPKGLANKIKVTVPVDTRIVSVSVNDRVPEEASRIANSLREVAAQKIISITRVSDVT + 
TLEEARPAISPSSPNIKRNTLIGFLAGGIGTSVIVLLLELLDTHVKRPEDIEDTLQMT + LLGVVPNLSKLK" + misc_feature 3773..4189 + /gene="wzd" + /locus_tag="SPC47F_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 1.1e-53" + misc_feature 4295..4372 + /gene="wzd" + /locus_tag="SPC47F_0006" + /note="PS00217 Sugar transport proteins signature 2." + gene 4457..5140 + /gene="wze" + /locus_tag="SPC47F_0007" + CDS 4457..5140 + /gene="wze" + /locus_tag="SPC47F_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34654.1" + /db_xref="GOA:Q4JYJ1" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4JYJ1" + /translation="MPTLEIAQKKLEFIKKAEEYYNALCTNIQLSGDKLKVISVTSVN + PGEGKTTTSVNIARSFARTGYKTLLIDGDTRNSVISGVFKSREKITGLTEFLSGTADL + SHGLCDTNIENLFVIQSGSVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTPPIGIVI + DAAIITQKCDASILVTAIGEVNKRDVQKAKQQLEQTEKLFLGVVLNKLDISVDKYGGY + GSYGNYRKE" + gene 5149..5790 + /gene="wcjH" + /locus_tag="SPC47F_0008" + CDS 5149..5790 + /gene="wcjH" + /locus_tag="SPC47F_0008" + /note="member of homology group 61" + /codon_start=1 + /transl_table=11 + /product="putative initial sugar transferase" + /protein_id="CAI34655.1" + /db_xref="GOA:Q4JYJ0" + /db_xref="InterPro:IPR003362" + /db_xref="UniProtKB/TrEMBL:Q4JYJ0" + /translation="MIKMYFVFKNILDRFLAFFLFITLIIIPIIPITILVIWIEDPGD + VFFFQDRIGLNGKSFKVIKFRSMYKDADQRIKKSIISGEIDRLNFKEHSQSMTTKVGK + VIRKLSIDELPQLVNIIKGDMAIVGPRPLQQFEITHHILTHKEMETTLKMSKRLSVKP + GLLCYWQVTPNKNDIPFSDRMNLDLLYIDNVSFKTDFLLILKGFYTVLMGNNN" + misc_feature 5185..5781 + /gene="wcjH" + /locus_tag="SPC47F_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 1.1e-23" + gene 5792..6583 + /gene="wciB" + /locus_tag="SPC47F_0009" + CDS 5792..6583 + /gene="wciB" + /locus_tag="SPC47F_0009" + /note="member of homology group 16" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + 
/protein_id="CAI34656.1" + /db_xref="GOA:Q4JYI9" + /db_xref="UniProtKB/TrEMBL:Q4JYI9" + /translation="MKNIKILVATHKKYKMPSDSNMYLPIHVGCEGKKNLGFQGDNSE + ENISNLNPYYCELTGLFWAWKNLDCDYLGLVHYRRYFTKMTKRYNESINIDDVILNRF + EVEKLLENSDIIVPKRRKYYIETLYSHYDHTFDGSHLDLARKMIEMKNPEYLSSFDKV + MEQRSGYMFNMFIMKKELADDYFSWLFPILDSMYESMDLSGLTDFEARLFGRVSELLF + NVWLVKSNLTPKEVPFMYMEKVNLFKKGISFLMAKFFGKKYGQSF" + gene 6600..7820 + /gene="wzy" + /locus_tag="SPC47F_0010" + CDS 6600..7820 + /gene="wzy" + /locus_tag="SPC47F_0010" + /note="member of homology group 45" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI34657.1" + /db_xref="UniProtKB/TrEMBL:Q4JYI8" + /translation="MMKVVIKRKSLPEILALSALTIFLVVSILNVTFYVQYLPKVVYK + ILIAISLILLVIKELYKRKFDYRTIISLFATVLMYLLIGRVSTLNSNIAIGIIFIYAL + RDIPFKSVAKTSLAVSVLILLFVITGAKLGVIINYLEISGTRVRSYLGFRYALFPSIL + MMNIVAIVFYLKQNKIQYWQWLLLSLSAYWLYDETDSRLTFYSSCILLICSLLIRWIP + ELFSKFGYIFKAFKLTFIINAVVSFWVSFTYLNLSHSYINNLFLKLDYILGGRIYLVN + KSLNLYGFGLFGRPVEWNGNGLTIEGVRNYQTYLYVDNLYVQILQKFGLLALGIMLLV + LTLTLFKVIKRREWVLSFILILMSFHSMIDDLNLYLHYNIFWILLGSLIYPDYQFSDE + SDEELGENSFEEII" + misc_feature 6600..6704 + /gene="wzy" + /locus_tag="SPC47F_0010" + /note="Signal peptide predicted for SPC2054 by SignalP 2.0 + HMM (Signal peptide probability 0.991) with cleavage site + probability 0.762 between residues 35 and 36" + gene 7916..8746 + /gene="whaI" + /locus_tag="SPC47F_0011" + CDS 7916..8746 + /gene="whaI" + /locus_tag="SPC47F_0011" + /note="member of homology group 149" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="CAI34658.1" + /db_xref="GOA:Q4JYI7" + /db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4JYI7" + /translation="MSDIKIIQDKILIILKEFINICEENNLTYYALGGTLLGAVRHKG + FIPWDDDIDIGMPREDYEKFKKVAPNFLPNNYKFLSEDTANYKKAFSVIRDDSTKIIM + NYSKEELVESLWIDIFPLDGMPAAPFKRKMHEYRYLYRRMMVQLSQFNSLVNQKKENR + PLSEKMIIGFANAVNIEKIISFNWAQKKYLQTLKKYSFKEAFAGNYTGAYKLREIVPS + 
DYFGEPVSLEFEGTDLSCPRKYKEYLIAIYGENYMQLPPEDKRNQHHYKIISLGDNEE + " + misc_feature 7979..8662 + /gene="whaI" + /locus_tag="SPC47F_0011" + /note="HMMPfam hit to PF04991, LICD Protein Family, score + 3e-53" + gene 8760..9863 + /gene="wcrC" + /locus_tag="SPC47F_0012" + CDS 8760..9863 + /gene="wcrC" + /locus_tag="SPC47F_0012" + /note="member of homology group 24" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34659.1" + /db_xref="GOA:Q4JYI6" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4JYI6" + /translation="MKKIALVKWILNDSGGGERVAISLANELTKKYEVHLIGITTKQS + DLFFKINSQVKYSNFFDHRVRLSKNLLKISKMLKNYFVDNEIDVAFGIGISANVFLSL + AGIGTQTKVVLCDHTNSITDNREFYQKFQRYVGTKLADKIITLTQEDRENYIKKYGVP + EERICYIYNWKEAALSDVSYNKKSTKIVTVGRFDYQKGYDYLIQVAKKVLEKRADWTW + EIYGSGNQDEVEKIRDLINENDLQDRLVIKGLEKNQDLIYGDKGIYVMTSRYEGLPLV + LLEAQQYNLPIASFSCPTGPNEIVEDGVNGYLVECYDVEAMSNRLLELMNDKELRNRF + SSHAKDNIEKFNKDRIIHQWIDLIEEVSGGGNV" + misc_feature 9270..9782 + /gene="wcrC" + /locus_tag="SPC47F_0012" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 3.4e-39" + gene 9856..10872 + /gene="wcrD" + /locus_tag="SPC47F_0013" + CDS 9856..10872 + /gene="wcrD" + /locus_tag="SPC47F_0013" + /note="member of homology group 32" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34660.1" + /db_xref="GOA:Q4JYI5" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4JYI5" + /translation="MSNKILTITVPTYNIENYIGKCIESFKAVNPTYYSDFEVLIIND + GSTDNSVQVVKDLMEGSTLDLRIITKENGGHGSTINRGIKEASGKYFKVIDGDDWINV + PEFESLLDKLREINTDLVISDYTEQHVYNNSTIFKEFSSYLIPNQETRGIPSKWTPMH + ALVYKTSILKDNAITISENTFYVDQEYTMLPLQFVENYIYFKLDIYQYFLGRADQSMN + IDIMRKRADHHERVTKRILDLYKESYTQKPEIEKVVSDSLQYLVNKQNILYVMNEELD + KVYELFSYSEKSGFKFKFETKTKTSNLLYVNYKTKYLFNLVIKNLVKRKANSLEKEFQ + EKGF" + misc_feature 9874..10374 + /gene="wcrD" + /locus_tag="SPC47F_0013" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 1.4e-32" + gene 
10962..12392 + /gene="wzx" + /locus_tag="SPC47F_0014" + CDS 10962..12392 + /gene="wzx" + /locus_tag="SPC47F_0014" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI34661.1" + /db_xref="GOA:Q4JYI4" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4JYI4" + /translation="MECACMKVLKNYAYNLSYQLLIIILPIITTPYVTRIFSSDNLGT + YGYFNSIVTYFLLLATLGIGNYGTKEISGNRKAIHQNFWGIYSIQLGASLFSTFLYVI + VCLILPAMQNTVAYILGLSLFSKGLDISWLFQGLEDFRKITVRNITVKVIGGTSIFLF + VKSASDLYLYVFLLTIFELLGQLSMWVPAREFIGKPHFDWLYAKQHLKPVILLFLPQV + AISLYVTLDSTMLGSLASIRDVGIYDQSLKLVKILLTLVTSLGSVMLPRVSNLLSSGD + HKAVNKMHEISFLIYNLVIFPIMAGMLIVNDDFVTFFLGQDFQEARYAIAIMIFRMFF + IGWTNIMGIQILIPHNKNKEFMLSTIIPAIVSVGLNLLLLPKLGYIGAAIVSVLTEAL + VWAIQLYYTRTYLKDVPIIRTMIKIILASAIMYSVLLVSKTYIHFSPTINVLVFVVLG + GIIYLFSVLSLKVIDVIELKQVIRKN" + misc_feature 10983..11777 + /gene="wzx" + /locus_tag="SPC47F_0014" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 4.7e-63" + gene 12394..13392 + /gene="wciG" + /locus_tag="SPC47F_0015" + CDS 12394..13392 + /gene="wciG" + /locus_tag="SPC47F_0015" + /note="member of homology group 21" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI34662.1" + /db_xref="GOA:Q4JYI3" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q4JYI3" + /translation="MHKFKDINLDLLKVIACVGVVLLHTEMGGFKETGSWNFSTYLYY + LGTYSIPLFFIVNGYLLLGKKEITYSYILQKVKWILITVLSWTLIVWLFKRDFSVNPI + KKLIGSLVQKGYFFQFWFFGALILIYICLPVLKQFLNSKRSYLYFLSVLLVIGLIFEL + TNIVLQMPIQAYVIQTFRLWTWLFYYILGGFISQFDKNTIKNGFKRWMKVIAVLLLLV + SPFILFFIAKTTYYNFFAEYFYDILLVKVVSVGIFLTIFSLVLNENSNKWIIFLSNQT + MGIFIIHTYIMKVWEKVLGFNFVGAYLLFALFTLSVSFIIVGMLMKIPYFNRIVKL" + gene 13406..14515 + /gene="glf" + /locus_tag="SPC47F_0016" + CDS 13406..14515 + /gene="glf" + /locus_tag="SPC47F_0016" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + 
/protein_id="CAI34663.1" + /db_xref="GOA:Q4JYU6" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR006076" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JYU6" + /translation="MYDYLIVGAGLSGAIFAYEATKRGKKVKVIDKRNHIGGNIYCEN + VEGVNVHKYGAHIFHTSNKKVWDYVNQFAEFNNYVNSPVANYKGSLYNLPFNMNTFYA + MWGTKTPQEVKDKITEQTADMKDVEPKNLEEQAIKLIGPDVYEKLIKGYTEKQWGRSA + TELPPFIIKRLPVRLTFDNNYFNDRYQGIPIGGYNVIIENMLKDVEVELGVDFFAHRE + ELEASAEKVVFTGMIDQYFDYKHGELEYRSLRFDHEILDEENYQGNAVVNYTEREIPY + TRIIEHKHFEYGTQAKTVITREYPADWKRGDEPYYPINDEKNNAMFAKYQEEASKNDK + VIFCGRLADYKYYDMHVVIERALEVVEKEFGYDKK" + misc_feature 13841..14443 + /gene="glf" + /locus_tag="SPC47F_0016" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 1.2e-137" + gene 14502..15530 + /gene="wcjE" + /locus_tag="SPC47F_0017" + CDS 14502..15530 + /gene="wcjE" + /locus_tag="SPC47F_0017" + /note="member of homology group 18" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI34664.1" + /db_xref="GOA:Q4JYI1" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q4JYI1" + /translation="MTKSRINWIDFGKGFSIFLVLAGHVLLGLYQSEKFPTANNILSL + LIAQVYIFHIPVFFALSGYFFKPVSDLKEFWQYAKKKTIVFGLPYIFYSIIHFGLQKV + AGASVRVLTTISDLLNIYKHPLGVSWYLYILWSILIIYGLLSILVKNRRMLFLISVFA + YCLTLFVQTDIYIIQRTLVWGICFFLGSVLSEIHFDKINLKKFLFFFVLFDFIYMFAW + FLFYEVGSKKDYVSYINPGLWGIAFIVCVLVAFAIFPKMEKNFPKTFLYFTKYGKDSL + GIYILHAPICSMIRILMLKVGINSVFLHVVVGIVLGWYLSILATYILKKIPFLNIVLL + PQKYIKLK" + gene 15705..>16064 + /gene="aliA" + /locus_tag="SPC47F_0018" + CDS 15705..>16064 + /gene="aliA" + /locus_tag="SPC47F_0018" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34665.1" + /db_xref="GOA:Q4K2T2" + /db_xref="InterPro:IPR000914" + /db_xref="UniProtKB/TrEMBL:Q4K2T2" + /translation="MMKSSKLFALAGVTLLAATTLAACSGSGSSTKGEKTFSYIYETD + PDNLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKD + AKWYTSEGEEYAAVKAQD" + misc_feature 15705..15791 + /gene="aliA" + /locus_tag="SPC47F_0018" + 
/note="Signal peptide predicted for SPC2062 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.277 between residues 29 and 30" + misc_feature 15951..16019 + /gene="aliA" + /locus_tag="SPC47F_0018" + /note="PS01040 Bacterial extracellular solute-binding + proteins, family 5 signature." +ORIGIN + 1 cgaccgtcgc ttcctagttg tggctaactt gtccaatgaa gagcaagact tgacagtaga + 61 aggaaaagtc aaatctgtct tgattgaaaa cactgcggct aaagaagtac ttgaaaaaca + 121 ggtcttggct ccatgggatg ctttctgtgt ggaattacta taaatatttt ttgcagaaaa + 181 atttaaaatt gaaatcatat aaaaacaagg gaggactgta taaaagacag aaatcctttg + 241 ttttttataa ccaaggttta taaactttca ttctcgaaat tcaattaact ttacaaattc + 301 ccactattta aggagaaaga agatgaacat aaagaagcga gtccttagtg caggcctgac + 361 ttttgcatct gctttgcttt tagctgcttg cggccaatca ggttcagata caaaaactta + 421 ctcatcaacc tttggtggaa atccaactac atttaactat ctattagact attacgctga + 481 taacatagtc aattgaaaca agaacaggac aaaagagcct cataaaaggt attgcaactt + 541 ggtaatacct tttacgaggc tttttgatat aagcccatgt tttctcaata ggattgtact + 601 caggtgagta gggaggaaga ggtaaaagtt tatgcccaaa ctcctcgcat aaaagttcta + 661 acttacccat tctatggaat cttgcattat ccataataat aaccgatggt gtggttaatg + 721 ttggtaagag aaacttctga aaccaagctt caaaaaagtc gctcgtcacc atctcttcgt + 781 aagtcattgg agcgattaac tcaccatttg ttagacctgc aaccaaagaa atcctctgat + 841 atcttcttcc agatacttta cctcttatta actgaccttt taatgagcga ccatattctc + 901 gataaaaata agtatcgaat cctgtttcat caatctaaac aggtgctagg tgctttaaac + 961 tattaaaatt tttaagaaat aaggctactt tttctgggtc ttgttcatag taggtgtggt + 1021 tctttttttc gagtgtagcc catagctttg agcgcatagt ggatggtagt tggatgacag + 1081 ccaaattcag aagctatttc agtcaaataa gcgtctggat tgtcagtaag atagttttta + 1141 agtctatctc tatcaacctt tcttggtttt gttcctttta cttggtggtt tagctctcct + 1201 gttttctctt ttagctttaa ccagccataa atggtattac gtgagatttg gaaaacgtgt + 1261 gacgcttctg ttatactacc tgttcgctca caataagaga gaactttttt acgaaaatct + 1321 attgaatatg ccataagaag attataccac attgtgtact atattagatt gaaactagag + 1381 
tagtacacct ctgcttctaa aacattgtta gaaatcgatt tgactgtcct tatttcattt + 1441 tattatattt ttggttcgcg ggaagtctac taagatactt aaagatgcag atagtgaaaa + 1501 taaaggtgta gacattaccg taaaaaagtg atataatcgt atgatgttca aggtataggt + 1561 gttaatcatg agtagacgtt ttaaaaaatc aggttcacag aaagtgaagc gaagtgttaa + 1621 tatcgttttg ctgactattt atttattatt agtttgtttt ttattgttct taatctttaa + 1681 gtacaatatc cttgctttta gatatcttaa tctagtggta actgcgttag tcctactagt + 1741 tgccttggta gggctactct tgattatcta taaaaaagct gaaaaattta ctatttttct + 1801 gttgctgttc tctatccttg tcagctctgt gtcgctcttt gcagtacagc agtttgttgg + 1861 actgaccaat cgtttaaatg cgacttctaa ttactcagaa tattcaatca gtgtcgctgt + 1921 tttagcagat agtgatatcg aaaatgttac gcaactgacg agtgtgacag caccgactgg + 1981 gactgataat gaaaatattc aaaaactact agctgatatc aagtcaagtc agaataccga + 2041 tttgacggtc aaccagagtt cgtcttactt ggcagcttac aagagtttga ttgcagggga + 2101 gactaaggcc attgtcctaa atagtgtctt tgaaaacatc atcgagtcag agtatccaga + 2161 ctacgcatcg aagataaaga agatttatac caagggattc actaaaaaag tagaagctcc + 2221 taagacgtct aagaatcagt ctttcaatat ctatgttagt ggaattgaca cctatggccc + 2281 tattagttcg gtgtcgcgat cagatgtcaa tatcctgatg actgtcaatc gagataccaa + 2341 gaaaatcctc ttgaccacaa cgccacgtga tgcctatgta ccaatcgcag atggtggaaa + 2401 taatcaaaaa gataaattaa cccatgcggg catttatgga gttgattcgt ccattcacac + 2461 cttagaaaat ctctatgaag tggatatcaa ttactatgtg cgattgaact tcacttcgtt + 2521 tttgaaattg attgatttgt tgggtggaat tgatgtttat aatgatcaag aatttactgc + 2581 ccatacgaat ggaaagtatt accctgcagg caatgttcat cttgattcag aacaggctct + 2641 cggttttgtt cgtgagcgct actcactagc agatggcgat cgtgaccgtg ggcgcaatca + 2701 acaaaaggtc attgtggcta tccttcaaaa attaacgtca accgaagcgc tgaaaaatta + 2761 tagtacgatc attaatagct tgcaagattc tatccaaaca aatatgccac ttgagactat + 2821 gatagattta gtgaatactc agttggaaag tggagggaag tataaagtaa attctcaaga + 2881 tttaaaaggt acaggtcgga tggatcttcc ttcttatgca atgccagaca gtaacctcta + 2941 tgtgatggaa atagatgata gtagtttagc tgtagttaaa gcagctatac aggatgtgat + 3001 ggagggtaga tgaaatgata 
gatatccatt cgcacatcgt ctttgatgta gatgatggtc + 3061 ccaagtcaag ggaggaaagc aaggctctct tggtagaatc ctacagacag ggggtgcgaa + 3121 ccattgtctc tacctctcac cgtcgcaagg gcatgtttga aactccggaa gagaagatag + 3181 cagaaaactt tcttcaggtt cgggaaatag ctaaggaagt ggcgagtgac ttggtcattg + 3241 cttacggggc tgaaatttac tacacaccag atgttctgga taagctggaa aaaaagcgga + 3301 ttccgaccct caatgatagt cgttatgcct tgatagagtt tagtatgaac attccttatc + 3361 gcgatattca tagcgctttg agcaagatct tgatgttggg aattactcca gtcattgccc + 3421 acatcgagcg ctatgatgct cttgaaaata atgaaaaacg cgttcgggaa ctgatcgata + 3481 tgggctgtta cacgcaagta aatagttcac atgtcctcaa acccaaactt tttggcgaac + 3541 gttataaatt catgaaaaaa agagttcagt attttttgga acgtgattta gttcatgtag + 3601 ttgcaagtga catgcacaat ttagacagta gacctccata tatgcaacag gcatatgata + 3661 tcattgctaa gaaatatgga gcgaaaaaag cgaaagaatt ttttgtagat aatcccagaa + 3721 aaattataat ggatcaatta atttaggaga aaatatgaag gaacaaaaca ctttggaaat + 3781 cgatgtattg caactattca gggctttatg gaaaagaaag ttggtcattt tattagtggc + 3841 aattataact tcttcagttg cttttgccta cagtactttt gttatcaaac ctgagtttac + 3901 tagtacgact cggatttatg tagttaaccg taatcaggaa gagaagtctg gtttaaccaa + 3961 tcaagacttg caggcaggat catacttggt taaagactat cgtgaaatta tcctatcgca + 4021 ggatgttttg gaggaagtta tttctgattt gaaactagat ttgacgccaa aaggtttggc + 4081 taataaaatt aaagtaacag taccagttga tacccgtatt gtctctgtct cagttaatga + 4141 tcgagttcct gaagaggcaa gccgtatcgc taactctttg agagaagtag ctgctcaaaa + 4201 aattatcagt attactcgtg tttctgatgt gacaacactg gaggaggcaa gaccggcgat + 4261 atcaccatct tcgccaaata ttaaacgcaa tacactaatt ggttttttgg caggggggat + 4321 tggaactagt gttatagttc ttcttcttga acttttggac actcatgtga aacgtccgga + 4381 agatatcgaa gatacactgc agatgacact tttgggagtt gtaccaaact tgagtaagtt + 4441 gaaataggag agaggaatgc cgacattaga aatagcacaa aaaaaactgg agttcattaa + 4501 gaaggcagaa gaatattaca atgccttgtg tacaaatata cagttgagcg gagataaact + 4561 aaaagtaatt tccgttactt ctgttaaccc tggggaagga aaaacaacta cttccgtaaa + 4621 tatagcaagg tcgtttgcgc gtacaggcta taaaactctt 
ttgattgatg gcgatactcg + 4681 aaattcagtt atatcaggag tttttaaatc gcgtgaaaaa attacagggc taacagaatt + 4741 tttatctggg acagctgatt tatctcacgg tttatgtgat acaaatattg aaaatttatt + 4801 tgtaattcaa tcgggatctg tatcaccaaa ccctacagcc ttgttacaaa gtaaaaattt + 4861 taatgatatg attgaaacat tgcgtaaata ttttgattat atcattgttg atacaccacc + 4921 tattggaatt gttattgatg cggcaattat cactcaaaag tgtgatgcgt ccatcttggt + 4981 aacagcaata ggtgaggtga ataaacgtga tgtccaaaaa gcgaaacaac aattagaaca + 5041 aacagagaaa ctgttcctag gagttgtttt aaataaattg gatatctcgg ttgataagta + 5101 tggaggttac ggttcctatg gaaattatag gaaggaataa cggagtaatt gataaaaatg + 5161 tattttgttt ttaaaaatat tttagataga tttttggcgt ttttcctatt tatcacactg + 5221 ataatcatac cgattattcc gataacaatt ctggttattt ggatagaaga tccaggagat + 5281 gtgtttttct ttcaagatag aattggttta aatgggaaga gctttaaagt aataaagttt + 5341 cggagcatgt ataaagatgc tgatcaaagg ataaagaaaa gtattattag tggtgaaatt + 5401 gatcgtctaa attttaaaga acattctcaa agtatgacta caaaagtcgg taaagtgata + 5461 cgaaaacttt caattgatga attacctcaa ttagtgaata ttataaaagg tgatatggct + 5521 atagtgggac ctcgtccatt acaacaattt gaaataactc atcatattct tacccataaa + 5581 gaaatggaga ctactttaaa gatgtctaaa agattgtctg tgaaacctgg tttgctttgt + 5641 tattggcaag ttacgccgaa taaaaatgac attcctttta gtgatagaat gaatctagat + 5701 ttattataca ttgataatgt atctttcaag actgatttct tgcttatttt gaagggattt + 5761 tatacagttt taatgggtaa taacaattaa catgaaaaat ataaaaatat tagtagcaac + 5821 acataaaaaa tataaaatgc ccagtgattc aaatatgtat ctaccaattc atgtaggatg + 5881 tgaaggaaag aaaaatttag gatttcaagg tgacaattca gaagaaaata tttctaattt + 5941 aaatccttat tattgtgaat taactggctt gttttgggct tggaaaaact tagattgtga + 6001 ttatctgggt ttagtacatt atcgtcgtta ttttactaaa atgacaaaaa ggtacaatga + 6061 atcaataaat atcgatgatg taattttaaa taggtttgaa gttgagaaat tgttagagaa + 6121 ctcagatatc attgttccta aaagaagaaa atattatatt gaaactcttt attctcatta + 6181 cgaccatact tttgatggtt ctcatttaga tctagctaga aaaatgattg aaatgaagaa + 6241 tccagaatat ctctctagtt ttgataaggt aatggaacaa agaagcgggt acatgtttaa + 6301 
catgttcatt atgaaaaaag aactggcaga tgattatttt tcttggctgt ttcctatctt + 6361 ggatagtatg tatgaaagta tggatttatc agggttaact gattttgaag ctagattatt + 6421 tggaagagta agtgagttgt tatttaacgt atggttggtg aagagcaatt taactccaaa + 6481 ggaagtgccg tttatgtata tggaaaaagt taacttattt aaaaaaggga tttcattttt + 6541 gatggcgaaa tttttcggaa agaaatatgg acagagtttt tagttaggaa taaaaaatag + 6601 tgatgaaagt agtaataaaa agaaagtctt tgccagagat tttagctctt agtgcactaa + 6661 ctatattttt agttgtgtca attttaaatg tgacttttta tgttcagtat cttccaaaag + 6721 ttgtttataa gatactgata gctatttcgc ttattctgct agttataaaa gagttgtaca + 6781 aaagaaagtt tgattataga actatcataa gtctatttgc tacagttttg atgtatctcc + 6841 ttatagggag ggtgagtact cttaactcta atattgcaat aggaattatt ttcatttatg + 6901 ctttacgcga tattcctttt aaaagcgtgg caaaaacttc tttagcagta agtgtactca + 6961 tattactgtt tgttataact ggcgcaaaat tgggagttat tataaattat ttagagattt + 7021 ctgggactcg agtccgtagt tatttaggat ttaggtacgc actattccca tctatcttga + 7081 tgatgaacat agtcgctatt gtattttatt taaagcaaaa taaaatacaa tattggcaat + 7141 ggttattgtt atctttatct gcttattggc tgtatgatga aacggattct cgattaacat + 7201 tttatagttc ctgtatattg ttgatatgca gtttattaat aagatggatc ccagaactat + 7261 tctctaagtt cggatatata tttaaagctt ttaaactcac ctttattata aatgcagttg + 7321 ttagtttttg ggtctccttt acctatctca atttgagtca ttcttatatc aataatcttt + 7381 ttttaaaatt agactatata ttaggtggtc gtatatactt ggtgaataaa tcgttgaatt + 7441 tgtatggttt tggattattc ggacgaccag ttgaatggaa tggaaatggt ctgaccattg + 7501 aaggagttag aaactatcag acctatctgt atgttgataa tttgtatgtt caaattttac + 7561 aaaaatttgg tttactcgct ctaggaataa tgctcctagt cctaacttta accttgttta + 7621 aagtgattaa gagacgcgaa tgggttctgt cttttatttt gatattgatg agttttcatt + 7681 ccatgattga tgatttgaat ttgtaccttc attacaatat tttttggata ttattaggta + 7741 gtttaatcta ccccgattat caattttctg atgaaagtga tgaagagtta ggggaaaatt + 7801 cttttgaaga aattatatag tgaaatgcta agaaatattt gagaagaact cacaagagta + 7861 tagctgagaa gacagttgta tatcgagttt tgctgttttt atataggagg gaagtatgtc + 7921 ggatataaaa atcattcaag 
ataagatttt aattatctta aaagaattta ttaatatttg + 7981 tgaagaaaat aatttgactt actatgctct agggggaaca ttgcttggag cagtacgtca + 8041 caaaggattt atcccttggg atgatgatat tgatattggc atgccaagag aagattacga + 8101 aaagtttaag aaagtagctc ccaattttct accaaataat tataaatttt taagtgaaga + 8161 taccgctaat tataaaaaag ctttctctgt aattcgggat gattcaacga aaatcataat + 8221 gaattatagt aaagaggaat tggtagagag tttgtggata gatatttttc cacttgatgg + 8281 aatgcctgct gcccccttta agagaaaaat gcatgagtat agatacttat atagacggat + 8341 gatggttcaa ctttctcagt ttaatagttt agtaaatcag aagaaagaga atcgtccact + 8401 atctgaaaaa atgattattg gatttgcgaa cgctgttaat attgaaaaga ttatttcttt + 8461 taactgggca cagaaaaaat atttacaaac gctaaaaaaa tattcgttta aggaagcttt + 8521 tgcaggaaac tatacaggag catataaact aagagaaatc gtaccttcag attattttgg + 8581 agagccagta tcattagagt ttgaagggac tgatttgagt tgtcctcgta agtataaaga + 8641 atatttgata gcaatttatg gagagaatta tatgcagtta cctccagaag ataagcgaaa + 8701 ccaacatcac tataagataa tatctcttgg tgataatgaa gaatgagagt agttgaaaca + 8761 tgaaaaaaat cgctttagtg aaatggattt tgaatgattc tggcggtggt gagcgagttg + 8821 ctatatcctt ggcaaacgaa cttacaaaaa agtatgaagt ccatttgatt ggaattacaa + 8881 caaagcaatc ggatttattc tttaaaatca attctcaagt aaaatactcc aatttttttg + 8941 accatcgagt acgcttgtct aagaatcttc taaaaatttc aaaaatgtta aaaaattatt + 9001 ttgtagataa tgagatagat gttgcctttg gaatagggat atctgctaat gtatttttat + 9061 ctttggcagg aataggaact caaactaaag tagttttgtg tgatcatacc aattcgatta + 9121 cggataatag agaattttat cagaaattcc aaagatatgt tgggacaaag ttggcagaca + 9181 agattatcac tctcactcaa gaagaccgtg aaaattatat aaaaaaatac ggtgttcctg + 9241 aggaaagaat ttgctacatc tataattgga aagaggctgc tctttcagat gtatcttata + 9301 ataaaaaatc aactaaaatt gtgactgttg gccgttttga ttatcaaaaa ggctatgatt + 9361 atctcattca agtcgcgaaa aaagtgttag agaaaagggc tgactggact tgggaaatct + 9421 acggttccgg caatcaagat gaagtagaga aaatcagaga tttaatcaac gaaaatgatt + 9481 tacaggatag gttagtcata aaaggactcg aaaaaaatca agatttgatt tatggagata + 9541 aagggattta tgtcatgact tctcgctatg aaggtctacc 
tttagtcctg ctggaagcac + 9601 aacaatataa tcttcctata gctagcttta gttgtccgac aggaccgaac gaaattgttg + 9661 aagatggagt taatggctat ctggttgagt gttatgatgt agaagcgatg tctaatagat + 9721 tattagaact aatgaatgat aaggagctaa gaaatcgttt ttcatctcat gcaaaagata + 9781 acattgaaaa atttaataaa gaccgaatta tacatcagtg gatagatttg atagaagaag + 9841 tatctggggg gggaaatgtc taataaaata ctgacgatta ctgtgccaac ctataatatt + 9901 gaaaactata ttggtaaatg catagaatca tttaaagctg taaatcctac ctattacagt + 9961 gattttgaag tgttaatcat taatgacgga agtactgata attctgtaca agttgttaag + 10021 gatttaatgg aaggtagcac tttagattta agaattatca caaaagaaaa tgggggccat + 10081 ggctcaacta ttaatcgcgg gattaaagaa gctagtggaa aatattttaa ggtcattgat + 10141 ggggatgatt ggatcaatgt tccagaattt gaaagcttat tggataagtt aagagagatt + 10201 aacactgatt tagtgatttc tgactataca gagcagcatg tatataataa tagcactatt + 10261 tttaaagaat tctcttctta tctaattcca aatcaagaga caagaggtat tcctagcaag + 10321 tggacaccta tgcatgccct ggtctataaa acaagtatct tgaaggataa tgctattacg + 10381 attagtgaaa atacatttta tgtcgaccaa gagtatacaa tgctccctct tcaatttgta + 10441 gaaaattata tttattttaa gttggatatt tatcagtact tcttgggaag agctgatcag + 10501 agtatgaata ttgatataat gagaaagaga gcagatcatc atgagagagt aacgaaacga + 10561 atcttagact tatataaaga gagttataca caaaagccag aaatagaaaa ggttgtcagt + 10621 gactctttgc agtatctggt taataagcaa aatattttgt atgttatgaa tgaggaactt + 10681 gataaggtat atgaactgtt ttcatattct gagaaaagtg gattcaaatt taaatttgaa + 10741 acaaaaacaa agacttcaaa tttactttat gtcaattata aaacgaagta tctttttaac + 10801 cttgttatta aaaatctagt taaaagaaaa gcaaacagtc tagaaaaaga atttcaagag + 10861 aagggatttt gatgaaatat gtcaggaagt aaaacaaatc atcaattttt tctgaaggaa + 10921 ttcataacaa aattaactac actgtataag actgtattca agtggagtgt gcttgtatga + 10981 aagtacttaa aaactacgct tacaatcttt catatcagtt actaatcata atcttaccga + 11041 ttattaccac tccctacgtt actaggattt ttagttcgga taatctaggg acttatggtt + 11101 attttaactc aattgtaacc tattttcttt tgctggctac tttaggaata ggaaattatg + 11161 gaacaaaaga gatttcaggt aataggaaag ctatccatca 
gaatttttgg ggtatttata + 11221 gtatacaact gggagcatct ctattctcca ctttccttta tgttattgtc tgtctaattt + 11281 taccagctat gcaaaatact gtagcctata ttttaggctt aagtttgttt tctaaaggtt + 11341 tagatatttc ttggttattt caaggtttag aggattttcg gaaaattaca gtaagaaata + 11401 taactgtgaa agtcattggg ggaacctcga ttttcttatt tgtaaaatca gctagcgacc + 11461 tctaccttta tgtttttctt ttaacgatat ttgagttatt agggcaactt agtatgtggg + 11521 taccagctcg ggaatttatt gggaaaccgc actttgactg gttgtatgct aaacaacatt + 11581 tgaagccagt tatcttatta tttttaccac aggtcgctat atcgctttat gtgactttag + 11641 atagtactat gcttggttct ctagcctcaa taagagatgt tggaatttat gatcaatctc + 11701 tgaaacttgt caaaatatta ttaacattag taacttcatt aggaagtgtc atgttgccta + 11761 gagtttcaaa tcttttatcc tcaggggatc ataaagcagt caacaaaatg catgagatat + 11821 catttttaat ttataatttg gttattttcc ccattatggc aggaatgcta attgtaaatg + 11881 atgactttgt aacctttttc ctcgggcaag attttcaaga ggcacgttat gcgatagcaa + 11941 ttatgatttt tagaatgttc tttattggtt ggaccaatat tatggggatt caaattttga + 12001 tacctcataa taaaaataaa gaatttatgc tgtcaacaat aattcctgct attgttagtg + 12061 taggcttaaa tcttctcttg cttccaaagc tgggctatat aggagcagca attgtttctg + 12121 tcttaacaga ggcgctagta tgggctattc aattgtacta tactcgtaca tacttaaaag + 12181 atgttccgat tattagaact atgataaaaa ttattctagc ctcagctatc atgtatagcg + 12241 ttttgctagt ttctaagaca tacatacatt tttccccaac tataaatgtt ttggtatttg + 12301 tggtgttagg tggaatcatt tatctttttt cagttttatc tctaaaagtg atagatgtga + 12361 tagaattaaa acaagtaatt aggaaaaatt agaatgcata aatttaaaga tattaacttg + 12421 gatttactaa aagtaattgc atgtgttgga gttgttttac tccatacaga gatgggggga + 12481 tttaaagaga caggttcatg gaatttttcg acatatttat actacttagg aacctattct + 12541 atccctctat tttttatagt taatggttat ttattgttag ggaagaaaga gattacctat + 12601 tcctacatat tacagaaagt aaaatggatt ctaataacag tgctgtcatg gacccttata + 12661 gtttggctat ttaaacggga tttttcagtt aatccaataa aaaaacttat aggatcattg + 12721 gtgcaaaaag gttatttctt tcagttttgg ttttttggtg cgcttatact tatttatata + 12781 tgtctccccg ttttgaaaca atttcttaat tcaaaaagaa 
gttatttata ctttttatct + 12841 gtattgctag ttattggttt gatttttgag ttaacaaata ttgtgcttca aatgccaata + 12901 caagcatatg taatacaaac ttttagatta tggacttggc ttttctatta tattttaggg + 12961 ggctttatat ctcagtttga taaaaatacc atcaaaaatg ggtttaagag atggatgaaa + 13021 gtaattgcag tacttttatt attagtttcg ccatttatat tatttttcat agcaaagacc + 13081 acttactata atttttttgc tgaatatttt tatgatattt tattagtaaa agttgtaagc + 13141 gtagggattt ttctaactat tttctcactt gtattgaatg aaaatagcaa caaatggatt + 13201 atttttcttt ctaatcaaac tatgggtatc tttataatac acacttatat tatgaaggta + 13261 tgggaaaaag tgcttggttt taattttgta ggagcatatt tactttttgc tctatttact + 13321 ttaagtgtta gttttattat tgttgggatg ttaatgaaga ttccttactt caatcgaatc + 13381 gtcaaattat aaaaaggaga acaagatgta cgattatctt attgtcggtg ctggtttgtc + 13441 aggagcaatt tttgcttatg aggcgaccaa gcgtggaaaa aaagtaaaag tgattgataa + 13501 acgtaaccac attggtggga atatctactg tgagaatgta gaaggagtta atgttcataa + 13561 atatggtgcc catatctttc atacttctaa taagaaagtt tgggattatg ttaatcaatt + 13621 tgctgaattt aacaactacg tcaactcgcc tgtagctaat tacaagggta gcctctataa + 13681 tctacctttc aatatgaata ccttctatgc tatgtggggg acaaaaactc ctcaagaagt + 13741 caaagataag attactgagc agacagctga tatgaaggat gttgagccga aaaatctgga + 13801 agaacaggct atcaagttga ttggtccaga tgtctatgaa aagttaatca agggttatac + 13861 tgaaaagcag tggggacgct cagcaacgga acttcctcca tttatcatta aacgtcttcc + 13921 agttcgttta acatttgata ataactattt taacgaccgt taccaaggaa ttcctattgg + 13981 tggttacaat gtcatcatcg aaaatatgct taaagacgtt gaagttgagc ttggtgttga + 14041 tttctttgct catcgtgaag agttagaagc atcagctgaa aaagttgtct ttacagggat + 14101 gatcgaccag tattttgact acaagcacgg agagttagaa taccgtagcc ttcgctttga + 14161 tcatgaaatt ttggacgagg aaaattatca aggaaatgct gtagtgaact atacggagcg + 14221 tgagattcct tatactcgta ttatcgaaca caagcatttt gaatatggaa cacaggcaaa + 14281 gacagttatc acgcgtgaat atccagctga ctggaagcgt ggggacgagc cttactatcc + 14341 gatcaacgat gagaaaaata atgctatgtt tgctaagtac caagaggaag cttcaaagaa + 14401 tgataaggtt attttctgtg gacgtttagc agattataaa 
tattacgata tgcatgtggt + 14461 gattgaacgg gcgcttgagg ttgtggagaa agagtttgga tatgacaaaa agtagaatca + 14521 attggataga ttttggaaaa ggcttttcca tatttttagt cttagcagga catgtgttgc + 14581 ttggactgta tcaatcggaa aaatttccca cagcaaataa catactatcg ttgttgatag + 14641 cacaagtcta catatttcat ataccagtat tttttgcctt atcaggatac tttttcaaac + 14701 ctgtgtcgga tttgaaggag ttctggcaat atgctaaaaa gaagacaatt gtttttggtc + 14761 tgccatatat tttctattcg atcattcact ttggtcttca aaaagttgca ggggcatctg + 14821 ttcgtgttct tacaaccata tctgatttgc taaatatcta taaacatcct cttggagttt + 14881 cgtggtattt atatatactc tggtcgattt tgataatcta tggattattg tctattttag + 14941 tcaaaaatcg tagaatgtta tttttgataa gtgttttcgc ttattgttta accctatttg + 15001 ttcaaacaga tatttatatt attcaaagaa cgctagtttg ggggatttgt ttctttcttg + 15061 gcagtgtatt gagtgaaatt cactttgata aaattaattt gaaaaaattt ctttttttct + 15121 ttgtgttatt tgattttatt tatatgttcg cttggttctt gttttatgaa gtagggtcta + 15181 agaaggatta tgtaagctat attaacccag gtttgtgggg gattgctttt attgtctgtg + 15241 tattagttgc ttttgcgatt tttcctaaaa tggagaaaaa ttttcctaaa actttcctat + 15301 atttcactaa atacgggaaa gatagtttag ggatctatat tcttcatgca ccaatttgta + 15361 gcatgattcg gattctaatg ttgaaagtgg gaataaactc agtttttctt cacgttgttg + 15421 ttgggattgt gctaggctgg tatttatcca tactagcaac ttatatattg aaaaaaattc + 15481 catttttgaa tattgtttta ttaccacaaa agtatattaa attaaaataa attattttag + 15541 atttataatg tggctctttg tcaactaaca tctggagagg acaatcactg ttttctcttt + 15601 ttttgtcttt tcagaatata ccaaattaac acaaaaattc tgaaaattct gttgacatct + 15661 ttctgaaaag agtttataat ggagagaaag ttttaaagga gaaaatgatg aaaagttcaa + 15721 aactatttgc ccttgcgggc gtgacattat tggcggcgac tactttagct gcatgctctg + 15781 gatcaggttc aagcactaaa ggtgagaaga cattctcata catttatgag acagaccctg + 15841 ataacctcaa ctatttgaca actgctaagg ctgcgacagc aaatattacc agtaacgtgg + 15901 ttgatggttt gctagaaaat gatcgctacg ggaactttgt gccgtctatg gctgaggatt + 15961 ggtctgtatc caaggatgga ttgacttaca cttatactat ccgtaaggat gcaaaatggt + 16021 atacttctga aggtgaagaa tacgcggcag tcaaagctca 
agac +// + diff --git a/public/res/serotype_genbank/serotype_48.gb b/public/res/serotype_genbank/serotype_48.gb new file mode 100644 index 0000000..35df910 --- /dev/null +++ b/public/res/serotype_genbank/serotype_48.gb @@ -0,0 +1,1060 @@ +LOCUS CR931722 22062 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 656/63 (serotype 48). +ACCESSION CR931722 +VERSION CR931722.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 22062) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 22062) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..22062 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="656/63" + /db_xref="taxon:1313" + gene <1..163 + /gene="dexB" + /locus_tag="SPC48_0001" + CDS <1..163 + /gene="dexB" + /locus_tag="SPC48_0001" + /codon_start=2 + /transl_table=11 + /protein_id="CAI34666.1" + /db_xref="GOA:Q4K2R1" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K2R1" + /translation="DRRFLVVANLSNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVP + WDAFCVELL" + gene 322..378 + /gene="aliB" + /locus_tag="SPC48_0002" + /pseudo + CDS 322..378 + /gene="aliB" + /locus_tag="SPC48_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(order(349..840,842..1168)) + /gene="tnp" + /locus_tag="SPC48_0003" + /pseudo + CDS complement(join(349..840,842..1168)) + /gene="tnp" + /locus_tag="SPC48_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(join(778..840,842..1150)) + /gene="tnp" + /locus_tag="SPC48_0003" + /note="HMMPfam hit to PF01710, Transposase, score 3.8e-23" + /pseudo + gene 1402..2847 + /gene="wzg" + /locus_tag="SPC48_0004" + CDS 1402..2847 + /gene="wzg" + /locus_tag="SPC48_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI34669.1" + /db_xref="GOA:Q4JYH8" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4JYH8" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLGFSILVSSASLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSEIGNVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KMSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGVDVHNDQ + 
EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1402..1518 + /gene="wzg" + /locus_tag="SPC48_0004" + /note="Signal peptide predicted for SPC2066 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 39 and 40" + misc_feature 1606..1953 + /gene="wzg" + /locus_tag="SPC48_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 2.9e-61" + misc_feature 2131..2574 + /gene="wzg" + /locus_tag="SPC48_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 8.4e-70" + gene 2849..3580 + /gene="wzh" + /locus_tag="SPC48_0005" + CDS 2849..3580 + /gene="wzh" + /locus_tag="SPC48_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI34670.1" + /db_xref="GOA:Q4JYH7" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4JYH7" + /translation="MIDIHSHIVFDVDDGPKSIEESKALLREAYNQGIRMIVSTSHRR + KGLFETPEEKIATNFIKVREIAKEVADDLVIAYGAEIYYTLDALEKLEKKEIPTLNDS + RYALIEFSMHTSYREIHAGLSNILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QINSYHVLKPKFFGEKYKFMKKRARYFLERDLVHVVASDMHNLDSRPPYMQQAYDTIA + KKYGAKKAKEFFVDNPRKIIMDQLI" + misc_feature 2852..3460 + /gene="wzh" + /locus_tag="SPC48_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 2.6e-37" + gene 3589..4281 + /gene="wzd" + /locus_tag="SPC48_0006" + CDS 3589..4281 + /gene="wzd" + /locus_tag="SPC48_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI34671.1" + /db_xref="GOA:Q4JYH6" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4JYH6" + /translation="MKEQNTLEIDVLQLFRALWKRKLVILLVAIITSSVAFAYSTFVI + 
KPEFTSTTRIYVVNRNQEEKSGLTNQDLQAGSYLVKDYREIILSQDVLEEVISDLKLD + LTPKGLANKIKVTVPVDTRIVSISVNDRVSEEASRIANSLREVAGQKIISITRVSDVT + TLEEARPTISPSSPNIKRNTLIGFLAGGIGTSVIVLLLELLDTRVKRPEDIEDTLQMT + LLGVVPNLSKLK" + misc_feature 3607..4023 + /gene="wzd" + /locus_tag="SPC48_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 9.3e-52" + misc_feature 4129..4206 + /gene="wzd" + /locus_tag="SPC48_0006" + /note="PS00217 Sugar transport proteins signature 2." + gene 4291..4974 + /gene="wze" + /locus_tag="SPC48_0007" + CDS 4291..4974 + /gene="wze" + /locus_tag="SPC48_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI34672.1" + /db_xref="GOA:Q4JYH5" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4JYH5" + /translation="MPTLEIAQKKLEFIKKAEEYYNALCTNIQLSGDKLKVISVTSVN + PGEGKTTTSVSIARSFARAGYKTLLIDGDIRNSVMSGFFKSREKITGLTEFLSGTADL + SHGLCDTNIENLFVVQSGTVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTPPIGIVI + DAAIITQKCDAFILVTATGDVNKRDVQKAKQQLEQAGKLFLGVVLNKLDISVDKYGVY + GSYGNYGKK" + gene 4990..6357 + /gene="wchA" + /locus_tag="SPC48_0008" + CDS 4990..6357 + /gene="wchA" + /locus_tag="SPC48_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI34673.1" + /db_xref="GOA:Q4JYH4" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4JYH4" + /translation="MDEKGLKIFLAVLQSIIVILLVYFLSFVRETEVERSSMVILYLL + HFFVFYFSSYGNNFFKRGYLVEFNSTIRYIFFFAIAISVLNFFIAERFSISKRGMVYF + LTLEGISLYLLNFLVKKYWKHVFFNLKNSKKILLLTVTKNMEKVLDKLLESDELSWKL + VAVSILDKSDFQHDKIPVIEKEKIIEFATHEVVDEVFVNLPGESYDVGEIISRFETMG + IDVTVNLKAFDKNLGRNKQIHEMVGLNVVTFSTNFYKTSHVISKRILDICGATIGLIL + FAVASLVLVPLIRKDGGPAIFAQTRIGKNGRHFTFYKFRSMRIDAEAIKEQLMDQNTM + QGGMFKIDNDPRVTKIGRFIRKTSLDELPQFWNVFIGDMSLVGTRPPTVDEYDQYTPE + 
QKRRLSFKPGITGLWQVSGRSKITDFDDVVKLDVAYIDNWTIWKDIEILLKTVKVVFM + RDGAK" + misc_feature 5773..6354 + /gene="wchA" + /locus_tag="SPC48_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 3.3e-146" + gene 6388..7560 + /gene="wchF" + /locus_tag="SPC48_0009" + CDS 6388..7560 + /gene="wchF" + /locus_tag="SPC48_0009" + /note="member of homology group 15" + /codon_start=1 + /transl_table=11 + /product="putative rhamnosyl transferase WchF" + /protein_id="CAI34674.1" + /db_xref="GOA:Q4JYH3" + /db_xref="InterPro:IPR001296" + /db_xref="InterPro:IPR015393" + /db_xref="UniProtKB/TrEMBL:Q4JYH3" + /translation="MKKSVYIIGSKGIPAKYGGFETFVEKLTAFQQDKAIQYYVACIR + ENSAKSGITEDVFEHNGAICYNVDVPNIGPARAIAYDIAAINRAIEIAKENKDEDPIF + YILACRIGPFIHGIKKKIQAIGGTLLVNPDGHEWLRAKWSAPVRRYWKISEGLMVKYA + DFLVCDSKNIEKYIQEDYKQYQPKTTYIAYGTDTTRSTLKSSDKKVRSWFKEKNISEN + EYYLVVGRFVPENNYESMIRGFLASNSKKDFVLITNVEQNKFYNQLLAKTGFDKDPRV + KFVGTVYEQELLKYIRENAFAYFHGHEVGGTNPSLLEALASTKLNLLLDVGFNREVGE + QSAIYWKKDELSQVIEKVEQFDAKMIDELDRQSNQRIADSFTWEKIVTDYEKVFKG" + gene 7566..8462 + /gene="wcxG" + /locus_tag="SPC48_0010" + CDS 7566..8462 + /gene="wcxG" + /locus_tag="SPC48_0010" + /note="member of homology group 79" + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase" + /protein_id="CAI34675.1" + /db_xref="GOA:Q4JYH2" + /db_xref="InterPro:IPR007074" + /db_xref="UniProtKB/TrEMBL:Q4JYH2" + /translation="MAVKLKYDKSDITFLDDDELKKYQSELLKMISDVFTFFDENGIA + YSLSGGSILGAIRHKGFIPWDDDVDINIPRESYDKLFSLFESDNSLSRKYYLQSAKSH + PELGLHVSQIRKKGTVARRKYDHSAEECGISIDLYIVENVYNNPVKRFFQGYTSMFLT + FALASVRETKNHALMKEMFRLEGRKLNYSVGKLMVGWFFGIIPIEKWLNWLDKCNSSC + KDSHTKYVSIPTGRKHFRRETYLRENMNIYKKVPFETLMVNVPVWSEEYLEMFYGKDY + MVVPPVDKREQHLFLELSYGEE" + misc_feature 7683..8384 + /gene="wcxG" + /locus_tag="SPC48_0010" + /note="HMMPfam hit to PF04991, LICD Protein Family, score + 1.2e-21" + gene 8463..9182 + /gene="abp1" + /locus_tag="SPC48_0011" + CDS 8463..9182 + /gene="abp1" + /locus_tag="SPC48_0011" + /note="member 
of homology group 57" + /codon_start=1 + /transl_table=11 + /product="putative IspD-family transferase (arabinitol) + Abp1" + /protein_id="CAI34676.1" + /db_xref="GOA:Q4JYH1" + /db_xref="InterPro:IPR001228" + /db_xref="UniProtKB/TrEMBL:Q4JYH1" + /translation="MKVAILTASGIGSRIGQDIPKQFIHVENKPVIIYTLEKFQNHPE + IDEICIVILKGWEQMVKAYAEQFGITKLKMITLGGKSGQESIYNGLRAVKKAHPNEDV + TVLIHDGNRPLVSNNIISNALATYQRFGNAVAAIPTTEVVFVLENPQSTSSTEALNRD + LLRRTQTPHVYHLDNILSLHEKALENGITDVAASCQLMQLFGGKSYFSLGSEKNLKIT + TVEDLDIFKALLSSTRDKWIK" + misc_feature 8469..9158 + /gene="abp1" + /locus_tag="SPC48_0011" + /note="HMMPfam hit to PF01128, Uncharacterized protein + family UPF0007, score 5.5e-17" + gene 9185..10237 + /gene="abp2" + /locus_tag="SPC48_0012" + CDS 9185..10237 + /gene="abp2" + /locus_tag="SPC48_0012" + /note="member of homology group 58" + /codon_start=1 + /transl_table=11 + /product="putative dehydratase/epimerase (arabinitol) + Abp2" + /protein_id="CAI34677.1" + /db_xref="GOA:Q4JYH0" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JYH0" + /translation="MTLLLNKIYRQDVESSLETIVNINDLNGKSILITGASGLIGSSV + IDQLLLLNEIRNFNIKIICCGRKFESLEKRFGRQTEYLHFVFYDATKVPHFAFAVDYI + IHAASPASPELYVNQPVETMASNFLGMYNLLEYAKNAKVSNLVYISSSEVYGISTSNN + PLDENYIGTVDHLSVRSSYASSKRATETLCASFASEYGIKIMIVRPGHIYGPSAKDSD + NRVSSFFMTEAIAGRDIVMKSTGSQLRSYCYSLDCASAILSVLLSGGSGQAYNVSNPN + SIITIKQMAETISRVGNVKLTMAIPSNQDIKQTNPMQNASLRSDKLEGLGWKGLFSAE + KGIENTFQILKALRSN" + misc_feature 9272..10222 + /gene="abp2" + /locus_tag="SPC48_0012" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.00063" + misc_feature 9275..10108 + /gene="abp2" + /locus_tag="SPC48_0012" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.00052" + misc_feature 9275..10003 + /gene="abp2" + /locus_tag="SPC48_0012" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 1.4e-44" + misc_feature 9278..10090 + /gene="abp2" + /locus_tag="SPC48_0012" + 
/note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 9.1e-05" + gene 10249..11265 + /gene="wcyS" + /locus_tag="SPC48_0013" + CDS 10249..11265 + /gene="wcyS" + /locus_tag="SPC48_0013" + /note="member of homology group 118" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI34678.1" + /db_xref="GOA:Q4JYG9" + /db_xref="InterPro:IPR008441" + /db_xref="UniProtKB/TrEMBL:Q4JYG9" + /translation="MIFFLSFYLVTEFKMDGKLGSFLKLLKKVDGLRILKQYFKSGVL + FFAIFQILSQGFSKKSLEIVRNSVDNKILAKLRKKYLSYIVENKDRILRESAERQSSS + KVWILWLQGMNNAPEIVKLCYNSVVQNLPDKEAVLLTEDTYRNYVIFPNHVQQKIDKG + IISKTHLSDLLRLELLTLYGGIWIDATVFISSDKIPDYMLFSELFLFQKLKPGLDGNP + KRISSWYICAKSNHPILVLTKELLYQYWSEHNYMMDYFLMHDFMELSIETYPQEWNKV + IPFSSSPSHILLLRLFETFDKRMLEYVYQQISIHKLTYKYDTDICYTETYLNKILSEG + EIDA" + misc_feature 10393..11238 + /gene="wcyS" + /locus_tag="SPC48_0013" + /note="HMMPfam hit to PF05704, Capsular polysaccharide + synthesis protein, score 1.1e-56" + gene 11255..12229 + /gene="wcwY" + /locus_tag="SPC48_0014" + CDS 11255..12229 + /gene="wcwY" + /locus_tag="SPC48_0014" + /note="member of homology group 183" + /codon_start=1 + /transl_table=11 + /product="conserved hypothetical protein" + /protein_id="CAI34679.1" + /db_xref="UniProtKB/TrEMBL:Q4JYG8" + /translation="MMHKKLALIIAYFGELPEYSKVFFNSLNYNPEIDLFLVTDQCVN + INIDNLIVIKKTFSEFKNDVQNLFDFKIVLDTPYKLCDYKPIYGMLFKDILYEYPFWG + YCDLDMVLGDVFSFLPENILDNYSKIYEYGHLTIYKNDPENNRRFMYEVGMNYQDVFT + TKVIKVFDETEGIQRKYELMGIPTYTPRDCADINPWKYQLNRVETGISKEKLNSFNHK + KQLFFWENGKIFRGFINPYTHKIEYDSFNYLHFQKREMKITFPFNSSTKAFFITNQGI + VEKKQGFNIKKEDFKKYNNYNLIREISKGLQRYYFIWKRRLLKYIFRR" + gene 12238..13419 + /gene="wzy" + /locus_tag="SPC48_0015" + CDS 12238..13419 + /gene="wzy" + /locus_tag="SPC48_0015" + /note="member of homology group 260" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI34680.1" + /db_xref="UniProtKB/TrEMBL:Q4JYG7" + 
/translation="MKISITNLYIWMLTVMFILMWIPSVPIFNYVDELLTLMILPYVI + MNFRALLLKSRLVIIGAIGFLLIGLISTYLSDLSRPLIAIVSDFFTFIKFPITYLYFR + YLFTKQNSTYFLNILYILSKFVVVIAFICCLLNYSFELGMTYDIRFGIGSFQFIYNNP + GFFLALMVVCYSLINYSNNSGNFKYKILAILNMVATLRSVAFGVIALLLVLSVFIGRN + LRLYHLFILIPSIIFVGNGAISTYFGDLETPRKLLFQGGIKVFQKFFPLGAGFASYGS + NAAYVYYSPLYFQFGFHHIWGLNLEYGNIANDNFWPMIFAQFGFIGSIFYILMFMAIM + KDLFIKSMYKNQVVSLSLIIGHLLISSVGANIITGVLGVSMICAYASMAHVLDDVEVN + Y" + gene 13416..14834 + /gene="wzx" + /locus_tag="SPC48_0016" + CDS 13416..14834 + /gene="wzx" + /locus_tag="SPC48_0016" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI34681.1" + /db_xref="GOA:Q4JYG6" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4JYG6" + /translation="MKLLKNYIYNLVYQIVAIILPLVTIPYASRVLGAEIIGINSYTN + TIISYFVLIANVGLTTYGNRTISYTRDSVLKRSQKFWEIFVIKIIMALFSLSLFFTFT + FIYREYTTFLYIQSIQILATAIDISWFFTGMEYFKRTVTRNILTKILSAICIIGFVKS + REDLWLYILILVLSTFLGNLTLWTYVFDAIEVINFKSLQLKEHIKPVFVLFIPQLATT + LFLTLNKLLLGNLSTLSQSGYFDSADKVIRILLTFITAIGTVIFPRLANSFNRGEKRN + VEELLKLSFGAINIIAFPMIVGIMVIGRPFSILFFGSEFEGIEIVLGILSIELVFMGW + SSVLGNQFLVAVNKTKGLTVSVFIASLILLISSFILIPMLGASGASISSVIGEATIAL + VQLYYVSKHTRLCLLFSDISKILVSSLIMGTTCLVIGSCFYDGIMKLCVQGTVGLMVY + CIMIWYSRTEIVNTILKKIKIQ" + misc_feature 13422..14222 + /gene="wzx" + /locus_tag="SPC48_0016" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 5.1e-55" + gene 14896..15303 + /gene="glf" + /locus_tag="SPC48_0017" + CDS 14896..15303 + /gene="glf" + /locus_tag="SPC48_0017" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI34682.1" + /db_xref="GOA:Q4JYG5" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JYG5" + /translation="MIDQYFDYKHGELEYRSLRFEHEVLDEENYQGNAVVNYTEREIP + YTRIIEHKHCEYGTQPKTVITREYPADWKRGDEPYYPINDEKNNTMFAKYQEEAAKND + 
KVIFCGRLADYKYYDMHVVIERALSVVTNEFGY" + misc_feature 14896..15240 + /gene="glf" + /locus_tag="SPC48_0017" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 6.4e-37" + gene 15360..16229 + /gene="rmlA" + /locus_tag="SPC48_0018" + CDS 15360..16229 + /gene="rmlA" + /locus_tag="SPC48_0018" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI34683.1" + /db_xref="GOA:Q4JYG4" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q4JYG4" + /translation="MKGIILAGGSGTRLYPLTRVASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLHRFQELLQDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFISDDSV + ALILGDNIYHGSGLSKMLQKAASKESGATVFGYHVKDPERFGVVEFDQDMKAISIEEK + PEQPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGGLSVEVMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLTLAQPLKKN + EYGQYLLRLIGEA" + misc_feature 15363..16079 + /gene="rmlA" + /locus_tag="SPC48_0018" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 5.2e-119" + gene 16230..16823 + /gene="rmlC" + /locus_tag="SPC48_0019" + CDS 16230..16823 + /gene="rmlC" + /locus_tag="SPC48_0019" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI34684.1" + /db_xref="GOA:Q4JYG3" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:Q4JYG3" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTASYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENLEEADVSEADKHHPLLKDVKPLKKEDL" + misc_feature 16266..16796 + /gene="rmlC" + /locus_tag="SPC48_0019" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 6.5e-16" + gene 16836..17885 + /gene="rmlB" + /locus_tag="SPC48_0020" + CDS 
16836..17885 + /gene="rmlB" + /locus_tag="SPC48_0020" + /EC_number="4.2.1.46" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI34685.1" + /db_xref="GOA:Q4JYG2" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JYG2" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPDVHVTVLDKLTYAGN + RANIEEILGNRVELVIGDIADAELVDKLATQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAAD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 16851..17807 + /gene="rmlB" + /locus_tag="SPC48_0020" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.0001" + misc_feature 16854..17651 + /gene="rmlB" + /locus_tag="SPC48_0020" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.0038" + misc_feature 16854..17594 + /gene="rmlB" + /locus_tag="SPC48_0020" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 3.5e-77" + misc_feature 16857..17669 + /gene="rmlB" + /locus_tag="SPC48_0020" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 1.2e-05" + gene 17951..18802 + /gene="rmlD" + /locus_tag="SPC48_0021" + CDS 17951..18802 + /gene="rmlD" + /locus_tag="SPC48_0021" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI34686.1" + /db_xref="GOA:Q4JYG1" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JYG1" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITNEEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELNFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + 
FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLVKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 17951..18799 + /gene="rmlD" + /locus_tag="SPC48_0021" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 1.4e-144" + misc_feature 17954..18595 + /gene="rmlD" + /locus_tag="SPC48_0021" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.00012" + misc_feature 17954..18583 + /gene="rmlD" + /locus_tag="SPC48_0021" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 9.2e-19" + misc_feature 17957..18685 + /gene="rmlD" + /locus_tag="SPC48_0021" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 2.4e-08" + gene 18843..20047 + /gene="glf" + /locus_tag="SPC48_0022" + CDS join(18843..18860,18859..19371,19371..19484,19460..20047) + /gene="glf" + /locus_tag="SPC48_0022" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI34687.1" + /db_xref="GOA:Q4JYG0" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4JYG0" + /translation="MNSKGALKIYNYLVVGAGLFGAVFAHEAALKGKKVKVIEKRNHI + AGNIYTREEEGIQIYQYGAHIFHTSDKEIWDYVNQFAEFNRYINSPVANYKGEIYNLP + FNMNTFNKLWGVVTPAEAQAKIDEQRAILNGKTPENLEEQAISLVATDIYEKLIKDYT + EKQWGKPTTELPSFIIVLPVRLTYDNNYFNDTYQGIPIGGYTQIVEKCWIMKILMMLD + HENIDVETNVDFFVNKEQYLKDFPKIVFTGMIDEFFDYKLGELEYRSLRFENEALDME + NYQGNAVVNYTDAETPYTRIIEHKHFEFGSQAKTIITKEHSKTWEKGDEPYYPVNNDR + NNHLYKSYKKLADEQGNVIFGGRLGHYRYYDMHQVIGAALQCVRNELDSYSMKIKEQT + RKLAAGCSKHCFEVADGN" + misc_feature 18843..18923 + /gene="glf" + /locus_tag="SPC48_0022" + /note="Signal peptide predicted for SPC2084 by SignalP 2.0 + HMM (Signal peptide probability 0.719) with cleavage site + probability 0.362 between residues 27 and 28" + misc_feature join(19300..19371,19371..19460,19484..19903) + 
/gene="glf" + /locus_tag="SPC48_0022" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 2.1e-102" + gene complement(20115..21371) + /gene="tnp" + /locus_tag="SPC48_0023" + CDS complement(20115..21371) + /gene="tnp" + /locus_tag="SPC48_0023" + /note="member of homology group 13" + /codon_start=1 + /transl_table=11 + /product="putative IS1167 transposase" + /protein_id="CAI34688.1" + /db_xref="GOA:Q4JYF9" + /db_xref="InterPro:IPR002560" + /db_xref="InterPro:IPR012287" + /db_xref="UniProtKB/TrEMBL:Q4JYF9" + /translation="MEQLHFITKLLDIKDPNIQILDIINKDTHKEIIAKLDYDAPSCP + ECGNQLKKYDFQKPSKIPYLETTGMPTRILLRKRRFKCYHCSKMMVAETSIVKKNHQI + PRIINQKIAQKLIEKISMTDIAHQLSISTSTVIRKLNDFHFKHDFSCLPEIMSWDEYA + FTKGKMSFIAQDFNNLNIITVLEGRTQAIIRNHFLKYDRAVRCRVKIITMDMFSPYYD + LARQLFPCAKIVLDRFHIVQHLSRAMSRVRVQIMNQFHRKSHEYKAIKRYWKLIQQDS + RKLSDKQFYRPTFRMHLTNKEILNKLLSYSEDLKHHYQLYQLLLFHFQNKEPEKFFGL + IEDNLKQVHSLFQTVFKTFLKDKEKIVNALQLHYSNAKLEATNNLIKLIKRNAFGFRN + FENFKKRIFIALNIKKERTKFVLSRA" + misc_feature complement(20619..20915) + /gene="tnp" + /locus_tag="SPC48_0023" + /note="HMMPfam hit to PF01610, Transposase, score 1.3e-46" + misc_feature complement(20955..21020) + /gene="tnp" + /locus_tag="SPC48_0023" + /note="Predicted helix-turn-helix motif with score + 1860.000, SD 5.52 at aa 118-139, sequence + ISMTDIAHQLSISTSTVIRKLN" + gene 21703..>22062 + /gene="aliA" + /locus_tag="SPC48_0024" + CDS 21703..>22062 + /gene="aliA" + /locus_tag="SPC48_0024" + /codon_start=1 + /transl_table=11 + /protein_id="CAI34689.1" + /db_xref="GOA:Q4K2T2" + /db_xref="InterPro:IPR000914" + /db_xref="UniProtKB/TrEMBL:Q4K2T2" + /translation="MMKSSKLFALAGVTLLAATTLAACSGSGSSTKGEKTFSYIYETD + PDNLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKD + AKWYTSEGEEYAAVKAQD" + misc_feature 21703..21789 + /gene="aliA" + /locus_tag="SPC48_0024" + /note="Signal peptide predicted for SPC2086 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.277 between residues 29 and 30" + 
misc_feature 21949..22017 + /gene="aliA" + /locus_tag="SPC48_0024" + /note="PS01040 Bacterial extracellular solute-binding + proteins, family 5 signature." +ORIGIN + 1 cgaccgtcgc ttcctagttg tggctaactt gtccaatgaa gagcaagact taacagtaga + 61 aggaaaagtc aaatctgtct tgattgaaaa caccctagct caagaagtct ttgaaaaaca + 121 aatcttagtt ccatgggatg ctttctgtgt ggaattacta taaatatttt ttgcagaaaa + 181 atttaaaatt gaaatcatat aaaaacaagg gaggactgta taaaagacag aaatcctttg + 241 ttttttataa ccaaggttta taaactttca ttctcgaaat tcaattaact ttacaaattc + 301 ccactattaa ggagaaagaa gatgaacata aagaagcgtg tccttagtgc aggtctgact + 361 tttgcatctg ctttgctttt tgatatgagc ccatgttttc tcaataggat tgtactcagg + 421 tgagtaggga ggaagaggta aaagtttatg cccaaactcc tcgcataaaa gttctaactt + 481 acccattcta tggaatctta cattatccat aataataacc gatggtgtgg ttaatgttgg + 541 taagaaaaac ttctgaaacc aagattcaaa aaagtcgctc gtcatcgtct cttcgtaagt + 601 cattggagcg attaactcac catttgttag acctgcaacc aaagaaatcc tctgatatct + 661 tcttccagat actttgcctc ttattaactg accttttaat gagcgaccat attctcgata + 721 aaaataagta tcgaatcctg tttcatcaat ctaaacaggt gctaggtgct ttaaactatt + 781 aaaattctta agaaataagg ctattttttc tgggtcttgt tcatagtagg tgtggttctt + 841 tttttcgagt gtagcccata gctttgagcg catagtggat ggtagttgga tgacagccaa + 901 attcagaagc tatttcagtc aaataagcgt ctggattatc agtaagatag tttttaagtc + 961 tatctctatc aacttttctt ggttttgttc cttttacttg gtggtttagc tctcctgttt + 1021 tctcttttag ctttaaccag ccataaatgg tattacgtga gatttggaaa acgtgtgatg + 1081 cttctgttat actacctgtt cgctcacaat aagagagaac ttttttacga aaatctattg + 1141 aatatgccat aaaaagatta taccacattg tgtactatag tagattgaaa ctagagtagt + 1201 acacctctgc ttctaaaaca ttgttagaaa tcgatttaac tgtcctggtc gagttgtcct + 1261 gttcttgttt caatctacta tatttttgtt tcgcgggaag tctacttaag atacttaaag + 1321 atgcagatag taaaaaaaga tgtagacatt accgtaaaaa agtgatataa ttgtatgata + 1381 ttgaatgtat aggtgttaat cttgagtaga cgttttaaaa aatcacgttc acagaaagtg + 1441 aagcgaagtg ttaatatagt tttactgact atttatttat tgttagtttg ttttttattg + 1501 ttcttaatct ttaagtacaa 
tatccttgct tttagatatc ttaatctagt ggtaactgcg + 1561 ttagttctac tagttgcctt ggtagggctg ctcttgatta tctataaaaa agcagaaaag + 1621 ttcacgattt ttctgttggg attctctatc cttgtcagct ctgcgtcgct ctttgcagta + 1681 cagcagtttg ttggactgac caatcgttta aatgcgactt ctaattactc agaatattca + 1741 atcagtgtcg ctgttttagc agatagtgag atcggaaatg ttacgcaact gacgagtgtg + 1801 acagcaccga ctgggactga taatgaaaat attcaaaaac tactagctga tatcaagtca + 1861 agtcagaata ccgatttgac ggtcaaccag agttcgtctt acttggcagc ttacaagagt + 1921 ttgattgcag gggagactaa ggccattgtc ctaaatagtg tctttgaaaa tatcatcgag + 1981 tcagagtatc cagactacgc atcgaagata aagaagattt ataccaaggg attcactaaa + 2041 aaagtagaag ctcctaagat gtctaagaat cagtctttca atatctatgt tagtgggatt + 2101 gacacctatg gtcctattag ttcggtgtcg cgatcagatg tcaatatcct gatgactgtc + 2161 aatcgagata ccaagaaaat cctcttgacc acaacgccac gtgatgccta tgtaccaatc + 2221 gcagatggtg gaaataatca aaaagataaa ttaacccatg cgggcattta tggagttgat + 2281 tcgtccattc ataccctaga gaacctttat ggtgtagata ttaattatta tgttcgtttg + 2341 aattttacct catttttgaa attgattgac ttattgggag gggtagatgt tcataatgat + 2401 caagagtttt cagctctaca tgggaagttc catttcccag tagggaatgt ccatctagac + 2461 tctgagcagg ctctaggttt tgtacgtgaa cgctactcac tagccgatgg agaccgtgac + 2521 cgtggtcgca accaacaaaa ggtgattgtg gctatccttc aaaaattaac gtcaaccgaa + 2581 gcactgaaaa attatagtac gatcattaat agcttgcaag attctatcca aacaaatatg + 2641 ccacttgaga ctatgataaa tttggtcaat gctcagttag aaagtggagg gaattataaa + 2701 gtaaattctc aagatttaaa aggtacaggt cggacggatc ttccttctta tgcaatgcca + 2761 gacagtaacc tctatgtgat ggaaatagat gatagtagtt tagctgtagt taaagcagct + 2821 atacaggatg tgatggaggg tagatgaaat gatagacatc cattcgcata tcgtttttga + 2881 tgtagatgac ggtcccaagt caatagagga aagcaaggca cttttaagag aagcttataa + 2941 tcaaggaatt cgaatgattg tgtctacttc gcatcgtcga aaagggctgt ttgaaactcc + 3001 agaagaaaaa attgcaacaa attttattaa ggttcgtgaa attgcaaaag aagtagcaga + 3061 tgatttagtc atagcttatg gcgcagagat atactatact ctggatgctc tagaaaagct + 3121 agaaaaaaaa gaaattccta cccttaatga tagtcgttat 
gctttgattg agtttagcat + 3181 gcatacttcc tatcgtgaga ttcatgcggg attgagcaat attttgatgt tgggaatcac + 3241 gccagtaatt gctcatattg aacgttatga tgccttagag aataacgaaa aacgtgttcg + 3301 tgaactgatt gatatggggt gctatactca gataaatagt tatcatgttt taaaacctaa + 3361 gttctttggt gaaaaatata aattcatgaa aaagagagct cgatattttt tggaacgtga + 3421 tttagttcat gtagttgcaa gtgacatgca caatttagac agtagacctc catatatgca + 3481 acaggcatat gataccattg ctaagaaata tggagcgaaa aaagcgaaag aattttttgt + 3541 agataatccc agaaaaatta taatggatca attaatttag gagaaaatat gaaggaacaa + 3601 aacactttgg aaatcgatgt attgcaacta ttcagagctt tatggaaaag aaagttggtc + 3661 attttattag tggcaattat aacttcttca gttgcttttg cctacagtac ttttgttatc + 3721 aaacctgagt ttactagtac aactcggatt tatgtagtta accgtaatca ggaagagaag + 3781 tctggtttaa ccaatcaaga cttgcaggca ggatcatact tggttaaaga ctatcgtgaa + 3841 attatcctat cgcaggatgt tttggaggaa gttatttctg atttgaaact agatttgacg + 3901 ccaaaaggtt tggctaataa aattaaagta acagtaccag ttgatacccg tattgtctct + 3961 atttcagtta atgatcgagt ttctgaagag gcaagccgta tcgctaactc tttgagagaa + 4021 gtagctggtc aaaaaattat cagtattact cgtgtttccg atgtgacaac actagaggag + 4081 gcaagaccga cgatatcacc gtcttcgcca aatattaaac gcaatacact aattggtttt + 4141 ttggcagggg ggattggaac tagtgttata gttcttcttc ttgaactttt ggacactcgt + 4201 gtgaaacgtc cggaagatat cgaagataca ctgcagatga cacttttggg agttgtacca + 4261 aacttgagta agttgaaata ggagagagga atgccgacat tagaaatagc acaaaaaaaa + 4321 ctggagttca ttaagaaggc agaagaatat tacaatgcct tatgtacaaa tatacagttg + 4381 agcggagata aactaaaagt aatttccgtt acttctgtta accctgggga aggaaaaaca + 4441 actacttctg taagtatagc aaggtcgttt gcgcgtgcag gctataaaac tcttttgatc + 4501 gatggcgata ttcgaaattc agttatgtca ggatttttta aatctcgtga aaaaattaca + 4561 gggctaacag aatttttatc tgggacagct gatttatctc acggtttatg tgatacaaat + 4621 attgaaaatt tatttgtagt tcaatcggga actgtatcac caaaccctac agccttgtta + 4681 caaagtaaaa attttaatga tatgattgaa acattgcgta aatattttga ctatatcatt + 4741 gttgatacac cacctattgg aattgttatt gatgcggcaa ttatcactca aaagtgtgat + 4801 
gcgttcatct tggtaacagc aacaggtgat gtgaataaac gtgatgtcca aaaagcgaaa + 4861 caacaattag aacaagcagg gaaactgttc ctgggagttg ttttaaataa attagatatc + 4921 tcggttgata agtatggcgt ttacggttcc tacggaaatt atggtaaaaa ataatttagg + 4981 aaagatttta tggatgaaaa aggattgaaa atttttctgg cagtattaca gagtattatt + 5041 gtcattttat tggtttattt tcttagcttt gttagagaga cagaagttga acgttcttcg + 5101 atggttatac tataccttct ccactttttt gtattctatt ttagttccta tggtaacaat + 5161 ttttttaaaa gagggtacct agttgagttt aatagtacta taagatatat ttttttcttt + 5221 gcaatagcta taagtgtatt aaactttttt atagcggaac ggtttagtat atctaaaaga + 5281 ggaatggtat acttcttaac tttagaagga atatccttat acttgttaaa tttcttagta + 5341 aaaaaatatt ggaagcatgt gttttttaat ctaaaaaata gcaagaaaat tttactgtta + 5401 acagtaacga aaaatatgga aaaagttctt gataaattgc tagaatctga tgaactttca + 5461 tggaaattgg tagcagtaag tattttggat aaatctgatt ttcaacatga taaaatacct + 5521 gtaattgaga aggaaaaaat tattgaattt gcaacgcatg aagttgtgga tgaggtgttt + 5581 gtcaatcttc caggagagag ctacgatgtt ggagaaatta tctctaggtt tgagacaatg + 5641 gggatagatg taactgtaaa tcttaaagca tttgataaga atttgggtcg caataaacaa + 5701 attcatgaga tggtaggatt gaatgtagtc actttctcta caaattttta taaaactagt + 5761 catgtgattt caaagagaat tctcgatatt tgtggtgcca ctattggcct tattcttttt + 5821 gctgtagcta gtctagtttt agttccattg attcgtaaag atggcggacc agctattttt + 5881 gctcaaactc gtatagggaa aaatggtcga catttcacct tttataaatt ccgttcaatg + 5941 cggatcgatg ctgaagctat caaagaacag ttgatggatc aaaatacgat gcaaggtggt + 6001 atgtttaaga tagacaatga tcctcgtgtt acaaaaattg gtcgctttat tcgtaaaacc + 6061 agtttggatg aattgccgca gttttggaat gtctttatag gagatatgag tttggtggga + 6121 acacgtccac ctacagtaga cgagtatgat cagtatactc cagaacagaa acgtcgactc + 6181 agctttaaac ctggtattac aggtttatgg caggttagcg gccgtagtaa aataaccgat + 6241 tttgacgatg ttgtaaaatt agatgtggct tatattgata attggacaat ctggaaagat + 6301 attgaaattt tgcttaaaac tgttaaagtt gtatttatga gagatggagc gaagtaattt + 6361 ctgtatatcc atcatattag gagagaaatg aaaaagtcag tttatatcat tggttcaaaa + 6421 ggaattcctg ctaagtatgg 
aggatttgaa acttttgttg aaaaattaac agccttccaa + 6481 caagataagg ctatccaata ttatgtggct tgtatacgtg aaaactctgc aaaatcaggg + 6541 attactgagg atgtttttga acataatggt gctatctgtt ataacgtcga tgttcctaat + 6601 attggtccag cgcgagctat agcgtatgat atcgctgcaa ttaacagagc tattgaaatt + 6661 gccaaagaaa ataaggatga agatccaatc ttctatattt tagcttgtcg aattggtccg + 6721 ttcatccatg gaattaagaa aaaaatccag gcgataggtg ggactcttct agttaatcca + 6781 gatggccacg agtggttgcg agctaagtgg agtgctcctg ttcgtcgcta ctggaaaatt + 6841 tctgaaggtc ttatggtcaa atatgcagat tttttagtgt gtgatagtaa gaatattgaa + 6901 aaatatatcc aagaagatta taaacagtat caacctaaaa caacctatat cgcttatgga + 6961 acagatacaa cacgctctac attaaagagt agtgataaaa aagtacgttc ttggttcaaa + 7021 gagaagaata tttctgagaa cgagtattat ctagttgtag gacgttttgt accagaaaac + 7081 aactatgaat ctatgattcg tggctttctg gcgtctaact ctaagaagga ctttgtctta + 7141 atcacaaatg tagaacagaa taaattttat aatcagttgt tggcaaaaac tggttttgat + 7201 aaggacccac gagtaaaatt tgtaggtaca gtctatgagc aagagcttct taaatatatt + 7261 cgtgaaaacg cctttgctta cttccacggg catgaagttg gtggaaccaa tccttcgctt + 7321 ttagaagctc tggcatcaac taaactgaat ttattgctag atgttggctt taaccgagaa + 7381 gttggggagc aaagtgcgat ctattggaaa aaagatgagc tttcccaagt aatcgagaaa + 7441 gttgaacaat ttgatgcaaa aatgattgat gagttagata gacaatcaaa tcagagaatt + 7501 gcggattctt tcacttggga aaagattgtc acagactacg agaaagtatt taaaggttag + 7561 agttaatggc agtaaaatta aaatatgata aatcagatat tacattttta gatgatgacg + 7621 aattgaaaaa ataccaatca gaattgttga aaatgatatc agatgtgttt actttttttg + 7681 atgaaaatgg gatagcgtat tctttaagtg gaggtagcat tttaggggca atccgtcata + 7741 aagggtttat cccttgggat gatgatgttg atatcaatat tccgagggaa agttacgata + 7801 aactattttc tctatttgag tcagacaata gtcttagtcg taaatattat cttcaatcag + 7861 caaaaagtca tccagaatta ggacttcatg tttctcaaat tagaaaaaaa ggaacagttg + 7921 ctcgtaggaa atacgatcat tcggctgagg agtgcggtat ttctatagat ctttacattg + 7981 tagaaaatgt atacaataat ccagtgaaac gattctttca aggttataca agtatgtttt + 8041 tgacttttgc cttggcttct gtacgagaaa caaagaacca 
tgccctgatg aaggaaatgt + 8101 ttagactgga aggtagaaaa ctaaattatt cagttggaaa gttaatggtt ggttggtttt + 8161 ttggaattat tccaattgaa aagtggttga attggcttga taaatgtaat tcaagctgta + 8221 aggattcaca tacaaaatat gtatccatac ctacaggaag gaaacacttt agacgcgaga + 8281 cttacttgcg agagaatatg aatatttata aaaaggttcc ttttgaaact ttgatggtga + 8341 atgttcctgt ttggtcagaa gagtatttag aaatgtttta cggtaaagat tatatggtcg + 8401 ttcctcctgt tgataagaga gagcaacatt tgtttttaga gttgagttac ggagaagaat + 8461 aaatgaaagt agcaatatta actgcttcag gtatcgggag caggattggt caagatatcc + 8521 ctaaacaatt tattcatgtt gaaaataagc cagtcattat ctataccctt gaaaaatttc + 8581 aaaatcatcc agaaattgat gaaatctgta ttgtcatttt aaaagggtgg gagcagatgg + 8641 ttaaggctta tgcggaacaa tttggaatta caaagttaaa gatgataact ttgggaggga + 8701 agtctggtca agaatcaatt tataacggtc ttagagcagt taagaaagct catcccaatg + 8761 aggatgtgac tgtattaatt catgacggga atcgtccttt agtgagcaat aatattatta + 8821 gtaacgcttt agcaacatac caacggtttg gaaatgctgt tgcagctata ccaacgactg + 8881 aggtagtatt tgttttagaa aacccacaat caacttcgtc cacagaagca ttgaatcgtg + 8941 acttgttgag acgaacacaa actcctcatg tttaccatct tgataatatt ctatcgcttc + 9001 atgaaaaagc attagaaaat gggataactg atgttgcagc atcatgccaa ctcatgcaac + 9061 tattcggtgg aaagagttat ttctctcttg gatcagagaa aaacttgaaa attacgactg + 9121 tagaagatct cgatattttt aaagccttat tgagttcaac tcgagataag tggattaaat + 9181 agtaatgaca ttattattaa ataaaatata tagacaagat gtagaatctt ctctagaaac + 9241 aatcgtcaat attaatgatt tgaatggcaa gtcaatttta attactggag cttctggttt + 9301 gattggttca agtgtcattg accagttatt attgctaaat gaaataagga attttaacat + 9361 taaaattatt tgttgcggaa gaaagtttga atcattagaa aaacgatttg gtagacaaac + 9421 agagtattta cactttgtgt tctatgatgc gactaaagta cctcactttg cttttgcagt + 9481 ggactacatt attcatgctg ctagtcctgc tagtcctgaa ttatatgtta atcagcctgt + 9541 agaaacaatg gctagtaact ttctgggcat gtataatcta ctggaatacg ccaaaaatgc + 9601 taaagtttca aatctagttt atatctcatc tagtgaagtt tatggaatta gcactagtaa + 9661 taatcctttg gacgaaaatt atattggaac tgttgatcat cttagcgtac ggtcttctta + 9721 
tgccagttca aaaagagcta ctgaaacact ttgtgctagt tttgcttccg agtatggaat + 9781 caaaataatg atagtaaggc caggacatat ctatggtcct agtgccaagg actctgataa + 9841 tcgtgtatca tcatttttta tgacagaagc gattgctggg cgtgatattg tcatgaaaag + 9901 tacaggtagt cagttaagat cctattgtta tagtttggat tgtgccagtg caattctaag + 9961 tgttctcctt tcgggtgggt caggacaagc ttataatgtt tccaatccaa attcaattat + 10021 tactataaaa cagatggctg aaactatttc acgagttggc aatgtgaaac ttaccatggc + 10081 tattcctagt aatcaagata ttaaacagac caatcctatg cagaatgcca gtcttaggag + 10141 tgataagtta gaaggattgg gatggaaagg attgttttct gctgaaaaag gtatagaaaa + 10201 tacattccaa attttgaaag cattaagaag caattagata gattaaattt gatatttttc + 10261 ttatcatttt acttagtaac ggagtttaaa atggatggta aattaggttc ttttttgaaa + 10321 ttattaaaaa aagtagatgg cttaaggatt ttaaaacagt attttaagtc tggggtacta + 10381 ttttttgcta tttttcaaat actatctcaa ggtttttcaa aaaagtcttt agaaattgtt + 10441 cgtaattcag tagataataa aatattagct aaattgagga aaaaatacct ttcctatata + 10501 gttgaaaata aagatagaat tttacgggaa tcggctgaac gtcaatcttc tagtaaggtg + 10561 tggatattgt ggttacaggg gatgaacaat gctcctgaga tcgtaaagtt atgttataat + 10621 tctgtggttc aaaatctccc tgataaagag gcagttcttt taacggaaga tacttataga + 10681 aattatgtaa tctttccaaa tcatgttcaa cagaagattg ataaaggaat catttctaaa + 10741 acacacctgt ctgatttgtt gagattagaa ctgctaactc tgtatggagg tatttggatt + 10801 gatgcgactg tttttatatc ttccgataaa atccctgatt atatgttgtt ttctgaatta + 10861 tttttattcc aaaaattgaa accagggtta gatggaaatc ctaagagaat ttcaagttgg + 10921 tatatttgtg cgaagtctaa tcatccaata cttgttctta ccaaggagtt gttgtatcaa + 10981 tattggtcgg aacacaatta tatgatggac tactttttaa tgcatgattt tatggaatta + 11041 tcaattgaga catatccaca agaatggaat aaagtgattc cattctctag ttctccttcc + 11101 catatactgc tattaagatt atttgaaaca tttgataaga ggatgctaga atatgtttat + 11161 caacaaattt ctatacataa actaacttat aaatatgata ctgatatctg ttatactgaa + 11221 acctacttga ataaaatact aagtgaagga gagattgatg cataaaaagt tagctctaat + 11281 aatagcatat tttggtgaat tacctgaata ctctaaagtt ttttttaatt ctttaaatta + 11341 
taatcctgag attgatttat ttctagtgac ggatcaatgt gtaaatataa acatagataa + 11401 tttaattgtt ataaaaaaaa cgttctctga atttaaaaat gatgttcaaa atttatttga + 11461 tttcaaaata gttttagata ctccttataa attatgtgat tacaagccta tatatgggat + 11521 gctttttaaa gatattttat atgaatatcc attttgggga tattgtgatt tggatatggt + 11581 gctgggagat gtgttttcgt ttttacctga aaatatattg gataattaca gcaaaatata + 11641 tgaatatggt catttaacta tttataaaaa tgaccctgaa aataatcgac gtttcatgta + 11701 tgaagttgga atgaattacc aagacgtttt tacaactaaa gttattaaag tatttgatga + 11761 gacagaagga attcagagaa aatatgaatt aatgggaatt cctacatata caccaagaga + 11821 ttgtgctgat ataaaccctt ggaagtatca gttaaataga gtagaaacag gtatttccaa + 11881 agaaaaatta aattcattta atcataaaaa gcagttgttt ttctgggaaa atggtaagat + 11941 ttttagagga tttatcaacc catatacaca taaaatagag tacgattctt tcaattatct + 12001 tcattttcaa aaaagagaaa tgaagataac ctttcctttt aattctagta caaaagcatt + 12061 ttttattact aatcaaggga ttgtagagaa gaagcagggg tttaatataa aaaaagaaga + 12121 ttttaaaaaa tataataact ataacttaat aagagaaata tcgaaaggtt tacaacgata + 12181 ttatttcatc tggaaaagga gattattaaa atatatattt aggagataac ttcaataatg + 12241 aaaatttcaa ttacaaattt atatatatgg atgttgacag taatgtttat attaatgtgg + 12301 attccaagtg ttcctatatt taattatgta gatgaactat taacgttgat gatacttccg + 12361 tatgtgatta tgaattttag agctcttcta ctaaaaagta gattagtaat tataggtgca + 12421 attggttttt tattaatagg attaatatca acataccttt cagatcttag ccgccctttg + 12481 atagctatag tatcggattt tttcacattt attaagtttc ctattaccta tttatatttt + 12541 agatatttat ttacaaaaca aaattcaact tattttttga atattttata tattcttagt + 12601 aagtttgttg tggttattgc ttttatttgc tgtttattaa attatagttt tgaactaggc + 12661 atgacctatg atatccgctt tggaataggt agttttcagt ttatatataa taacccagga + 12721 ttttttctag ccttgatggt tgtttgttat tcacttataa attactctaa taattcaggt + 12781 aattttaaat ataaaatttt agctatttta aatatggttg caactctacg atcagtggca + 12841 tttggagtta ttgccctact gctagttttg agtgtgttta taggaagaaa tttaagatta + 12901 tatcacttat ttatattgat tccgtcgatt atttttgtag gtaatggtgc tataagtaca + 12961 
tatttcggtg atttggaaac acctagaaaa cttctattcc agggaggtat aaaggttttt + 13021 cagaaatttt tcccattagg ggcaggtttt gcttcatatg ggagcaacgc tgcttatgtg + 13081 tattactctc ccctgtattt tcaatttggt tttcatcata tttggggtct taatttagaa + 13141 tatgggaata tagctaatga taacttttgg ccgatgattt ttgcacagtt tggttttatt + 13201 ggttctatat tttatatact gatgttcatg gctattatga aggatttatt cattaaatct + 13261 atgtataaaa atcaagtggt atctttatct ttaattatag gtcatttgtt aatttcctca + 13321 gttggtgcaa atataattac tggtgtgtta ggtgtaagta tgatatgtgc atatgcctca + 13381 atggctcatg ttttagatga tgtagaggta aattattgaa attattaaaa aactacatat + 13441 ataatttggt ttatcaaata gtagctatta ttttaccatt ggtgaccatt ccatatgctt + 13501 ctagggtctt aggtgcagaa ataattggta ttaattcata tacaaataca attatttctt + 13561 actttgttct gattgcaaat gttggattaa ctacttatgg gaatagaacg atttcgtata + 13621 ctagagattc tgttttaaaa agaagtcaaa aattctggga aatctttgtc ataaaaatta + 13681 ttatggcttt gttttcattg tcactgtttt ttacctttac atttatttat agagagtata + 13741 caactttctt atatatacag tctattcaaa tccttgcaac agcaatagat atttcttggt + 13801 tttttacagg aatggaatat tttaaaagaa cagtcactag aaatatattg acaaagatat + 13861 tatctgcaat ttgtattatt ggatttgtta aaagtaggga agatttatgg ttatatatat + 13921 taattttagt tctctcaact tttttaggga atttaacttt atggacatat gtttttgatg + 13981 cgattgaagt aattaatttt aaaagcttgc aacttaaaga gcatattaaa cctgtatttg + 14041 tgttatttat acctcaattg gcaacaactc tttttctcac attaaacaaa ttgttgttag + 14101 gaaacttatc aacattatct caatctggct attttgatag tgcagacaaa gtgatacgaa + 14161 ttttactgac atttatcaca gctattggga cagtaatttt tccaagactg gcgaatagct + 14221 ttaatagagg agaaaaaaga aatgtcgaag aattattaaa actatctttt ggtgctatta + 14281 atattattgc tttcccaatg attgttggta ttatggtaat cggaaggcca ttttcaatcc + 14341 ttttttttgg aagtgaattt gaaggaattg aaattgtttt ggggatatta tcaatagaat + 14401 tggtttttat gggctggtca tcagtcttag gtaaccaatt tttagtagct gttaataaga + 14461 cgaagggctt aactgtttca gtgtttattg cttcattaat cttgctcata tcctctttca + 14521 tattgattcc tatgttagga gcttctggag cttcaatttc atcagttata ggagaggcga + 14581 
caatagcttt ggtgcagtta tattatgttt caaaacatac tagattatgt ttattattta + 14641 gtgatatttc taaaatttta gtttctagtc tcataatggg aacgacttgt ttggtaattg + 14701 ggagttgttt ttatgatggt attatgaaac tctgtgttca aggaacagtt ggtttaatgg + 14761 tatattgtat aatgatttgg tatagcagga ctgaaattgt aaatactata cttaaaaaaa + 14821 taaagataca gtagtgaaaa atatttatag agatttttac tgcaaataat tgcaaataaa + 14881 gttgtcttca ctggaatgat tgaccagtac tttgattaca aacacgggga gttagaatac + 14941 cgtagccttc gttttgaaca cgaagtcttg gatgaagaaa attatcaagg gaatgcagta + 15001 gtaaactata cagaacgtga gattccttac actcgtatca ttgagcacaa gcactgtgag + 15061 tatggtacac aaccgaagac ggttatcact cgtgagtacc cagctgattg gaaacgtgga + 15121 gatgaaccat attatccgat caacgatgaa aagaacaaca ctatgtttgc taagtatcaa + 15181 gaagaagcag caaaaaatga caaggttatc ttctgtgggc gcctagctga ctataaatac + 15241 tacgacatgc atgttgttat tgaacgtgca cttagtgtag taacgaatga gtttggttac + 15301 taagacatac atttttaaca atataatgat tgttcaacaa caaagaaagg taccctacta + 15361 tgaaaggtat tattctagca ggtggttcgg ggacacgttt atatcctttg actcgcgttg + 15421 catcaaaaca acttatgccg gtttatgata aaccgatgat ttactaccca ctttcaacat + 15481 tgatgttggc tgggattagg gatattttga ttatttccac tccacaggat ttacatcgat + 15541 ttcaagagct tcttcaagac ggatctgagt ttgggatcaa actttcttat gcagagcaac + 15601 caagtccaga tggtttggca caagccttta tcattgggga agagtttatt tctgatgata + 15661 gcgttgcgct aatcttaggt gataatatct accatggttc tggactttcc aagatgctac + 15721 aaaaggcagc gagtaaggag tcgggagcaa ctgtttttgg ctaccatgtc aaggatccag + 15781 agcgctttgg tgtggttgag tttgatcagg atatgaaggc tatttctatt gaagaaaagc + 15841 cagagcaacc tcgttcaaac tatgcagtta caggtctcta tttctatgat aatgatgtag + 15901 tagagattgc caagagtatt aaaccaagtc ctcgtggtga actggaaatt acagatgtaa + 15961 acaaggctta tctagatcgt ggaggcttat ccgttgaggt tatgggacgt ggctttgctt + 16021 ggttggatac tggcactcat gaaagtttac tagaggcttc gcagtacatc gaaacagtcc + 16081 aacggatgca aaatgttcag gtagcaaact tggaagaaat tgcctatcgc atgggttata + 16141 tcagtcgtga agatgtattg accttagccc aaccacttaa gaaaaatgaa tacggacagt + 16201 
atctgctccg tttgattgga gaagcataga tgacagataa ttttttcggt aagacgcttg + 16261 cggcacgcaa ggttgaagct attccaggca tgttggagtt tgatatcccc gttcatggag + 16321 ataatcgtgg ctggtttaaa gaaaatttcc aaaaggaaaa aatgcttcca cttggatttc + 16381 cagagtcttt ctttgcagaa ggaaaattgc aaaacaatgt atccttctca cgtaaaaatg + 16441 tccttcgtgg cctccacgca gagccttggg ataagtacat ctctgtggca gatggaggga + 16501 aagttctggg ttcttgggtt gatctacgcg agggtgaaac ctttgggaat acctatcaga + 16561 cagtaattga tgcaagcaag ggaatctttg ttcctcgagg cgtagctaat ggcttccaag + 16621 ttttatcaga tacagcttca tatagctatc tggtcaatga ttactgggcg cttgaactca + 16681 aacccaagta tgcctttgtg aactacgctg atccaagcct tggtattgaa tgggaaaatc + 16741 tggaagaagc agacgtatct gaagcagaca aacatcatcc cctacttaag gacgtgaagc + 16801 ctttgaaaaa agaagatttg taaaaaggaa agaatatgac tgaatacaaa aatattatcg + 16861 tgacaggtgg agctggcttt atcggttcta actttgtcca ttatgtttac gagaactttc + 16921 cagatgttca tgtgacagtc ctagataagt tgacttatgc tggaaaccgc gcgaatattg + 16981 aggaaatttt aggtaatcgt gttgagttag ttattggtga cattgctgat gcggagttgg + 17041 tagacaagtt ggctactcaa gcagatgcta tcgttcatta tgcagcggaa agccacaatg + 17101 ataattcgct caatgatcca tcgccattta ttcatactaa cttcatcgga acctatactc + 17161 ttttagaagc tgctcgtaag tatgatattc gcttccacca tgtatcgaca gatgaagttt + 17221 atggggatct ccctttacgc gaagatttgc caggtcatgg tgaaggacca ggtgagaaat + 17281 ttactgctga aacaaaatac aacccaagct ctccgtactc atcaaccaag gcagcctcag + 17341 atttgattgt caaagcctgg gtgcgttctt ttggagtcaa ggcaacgatt tccaactgtt + 17401 caaataacta cggtccttat caacatattg agaagtttat tccacgacaa atcaccaata + 17461 tcttgagcgg tatcaagcca aaactttacg gtgaaggtaa gaacgttcgt gactggattc + 17521 ataccaatga ccattcttca ggagtttgga caatcttgac aaaagggcaa atcggtgaaa + 17581 cctacttgat tggggctgat ggtgagaaga acaataagga agttttggaa cttatcctta + 17641 aggaaatggg acaagctgcg gatgcctatg atcatgtgac tgaccgtgca ggacatgacc + 17701 ttcgctatgc gattgatgct agcaagctcc gtgatgagtt gggatggaaa cctgaattta + 17761 ccaactttga agctgggctc aaggcaacaa tcaagtggta tacagataac caagaatggt + 17821 
ggaaagcaga gaaagaagct gttgaagcca attatgctaa gactcaggag attattacag + 17881 tataaaaagc aggaaatagc tgctttttat tgctatattg ggaagagtta catattagaa + 17941 agatctagag atgattttaa ttacaggggc aaatggccaa ttaggaacgg aacttcgcta + 18001 tttattggat gaacgtaatg aagaatacgt ggcagtagat gtggctgaga tggatattac + 18061 caatgaagaa atggttgaga aagtttttga agaggtgaaa ccgactttag tctaccattg + 18121 tgcagcctac accgctgttg atgcagcaga ggatgaagga aaagagttga acttcgccat + 18181 caatgtgacg gggacaaaaa atgtcgcaaa agcatctgaa aagcatggtg caactctagt + 18241 ttatatttct actgactatg tctttgacgg taagaaacca gttggacaag agtgggaagt + 18301 tgatgaccga ccagatccac agacagaata tggacgcact aagcgtatgg gggaagagtt + 18361 agttgagaag catgtgtcta atttctatat tatccgtact gcctgggtat ttggaaatta + 18421 tggcaaaaac ttcgttttta ccatgcaaaa tcttgcgaaa actcataaga ctttaacagt + 18481 tgtaaatgac cagtacggtc gtccgacttg gactcgtacc ttggctgagt tcatgaccta + 18541 cctagctgaa aaccgcaagg aatttggtta ttatcatttg tcaaatgatg cgacagaaga + 18601 cacaacatgg tatgattttg cagttgaaat tttgaaagat acagatgtcg aagtcaagcc + 18661 agtagattcc agtcaatttc cagccaaagc taaacgtccg ctaaactcaa cgatgagtct + 18721 ggtcaaagcc aaagctactg gatttgttat tccaacttgg caagatgcat tgcaagaatt + 18781 ttacaaacaa gaagtgagat aagtagtaga atgattttct agtctaataa aagaggcaga + 18841 taatgaactc caaaggagct taagatatac aattatcttg ttgttggtgc tggtctcttt + 18901 ggtgcagtct ttgcccatga agcggcctta aaaggaaaaa aagtaaaagt tattgaaaaa + 18961 cgaaatcata tcgcgggtaa tatctatact cgtgaagagg aaggaattca aatttatcaa + 19021 tatggtgctc atatcttcca tacttctgat aaggagatct gggattatgt aaatcagttt + 19081 gcagagttta accgttacat aaattctcct gttgcaaact ataagggtga gatttataac + 19141 cttcctttta atatgaatac tttcaataaa ctctggggag ttgtaacgcc agcagaagca + 19201 caagctaaga ttgatgaaca acgtgctatt ttaaatggta aaactcctga aaatttggaa + 19261 gaacaggcga tttctcttgt agctacagac atctacgaaa aattaatcaa agactataca + 19321 gagaaacagt ggggcaaacc aactactgaa cttccatcct ttattattgt ttgccagtac + 19381 gcctgaccta tgataacaac tattttaacg atacctatca agggattcca attggtggat + 19441 
acactcaaat agttgaaaaa tgttggatca tgaaaatatt gatgtagaaa caaacgttga + 19501 tttctttgtg aataaagagc aatatctgaa agattttcct aagattgtct ttactggtat + 19561 gattgatgaa ttctttgact ataagttggg cgaactagag taccgtagtc ttcgttttga + 19621 aaatgaggcc ttggatatgg aaaattacca aggaaatgca gttgtgaact atacggatgc + 19681 agaaacccca tatactcgca ttattgaaca caaacatttt gagtttggga gtcaagcaaa + 19741 gactatcatt actaaagaac attctaaaac atgggaaaaa ggtgatgagc cttattatcc + 19801 agttaataat gatcgtaata atcatttgta taaatcatat aaaaaacttg ctgatgagca + 19861 agggaatgtt atctttggtg gccgcttagg acactatcgt tattacgata tgcaccaagt + 19921 aattggagca gctttgcagt gcgtgagaaa tgagttagat tcatactcaa tgaaaatcaa + 19981 agagcaaact aggaagctag ccgcaggttg ctcaaaacac tgttttgagg ttgcagatgg + 20041 aaactgacgc ggtttgaaga gattttcgaa gagtataaac aggctctttg tcaactgtag + 20101 tgggttgaag tcagctaagc tcgagaaagg acaaattttg tcctttcttt tttgatattc + 20161 agagcgataa aaatccgttt tttgaagttt tcaaagttcc gaaaaccaaa ggcattgcgc + 20221 ttgataagtt tgatgagatt attggtcgct tccaatttgg cgttagaata gtgtagttga + 20281 agggcgttga cgattttctc tttgtccttt agaaaggttt taaagacagt ctgaaaaaga + 20341 gaatgaacct gctttagatt gtcctcaata agtccgaaaa atttctctgg ttccttattc + 20401 tggaagtgaa aaagcaagag ctgatagagc tgatagtgat gtttcaagtc ttccgaatag + 20461 ctcaaaagct tgtttaaaat ctctttattg gttaaatgca tacgaaaagt aggacgataa + 20521 aattgcttat cactcagttt acggctatcc tgttgaatga gtttccagta gcgcttgata + 20581 gccttgtatt catgggattt tcgatgaaac tgattcatga tttggacacg cacacgactc + 20641 atagcacggc taagatgttg tacaatgtga aagcgatcca acacgatttt agcacatggg + 20701 aaaagttgtc tagctaagtc atagtaagga ctaaacatat ccatagtaat aattttgacg + 20761 cgacatcgga cggctctatc atatttaaga aagtgatttc gaatgatagc ttgtgttctt + 20821 ccctcaagaa cagtgatgat attgagattg ttaaaatctt gcgcaatgaa gctcatcttt + 20881 ccctttgtaa aagcatactc atcccaagac ataatctcag gaagacaaga aaaatcatgt + 20941 ttaaagtgaa agtcattgag cttacgaata acagttgaag ttgagatgga aagctgatgg + 21001 gcaatatcag tcatagaaat cttttcaatt aacttttgag caatcttttg gttgatgata + 21061 
cgagggattt ggtgattctt cttgacgata gaagtttcag cgaccatcat ttttgaacag + 21121 tgatagcact tgaatcgacg ctttctaagg agaattctag taggcatacc agtcgtttca + 21181 agataaggaa ttttagaagg tttttgaaag tcatatttct tcaattggtt tccgcactca + 21241 gggcaagatg gggcgtcgta gtccagtttg gcgatgattt ccttgtgtgt atccttattg + 21301 atgatgtcta aaatctggat attagggtct ttaatgtcta gtaattttgt gataaaatgt + 21361 aattgttcca tatgattctt tctaatgagt tgttttgtcg cttttcatta taggtcatat + 21421 gggacttttt ttctacaata aaataggctc cataatatct atagtggatt tacccactac + 21481 aaatattata gaacctataa acaagtaaaa ctgactacca gttattattt agaaatagta + 21541 ttaaaaattc cttgactatg tgatatagtt gaggaatttt taaatgatat tcatattttt + 21601 tgcaaagatg ttgtttgaaa aataattttc aaaaattctg aaaattctgt tgacatcttt + 21661 ctgaaaagag tctataatgg agagaaagtt ttaaaggaga aaatgatgaa aagttcaaaa + 21721 ctatttgccc ttgcgggcgt gacattattg gcggcgacta ctttagctgc atgctctgga + 21781 tcaggttcaa gcactaaagg tgagaagaca ttctcataca tttatgagac agaccctgat + 21841 aacctcaact atttgacaac tgctaaggct gcgacagcaa atattaccag taacgtggtt + 21901 gatggtttgc tagaaaatga tcgctacggg aactttgtgc cgtctatggc tgaggattgg + 21961 tctgtatcca aggatggatt gacttacact tatactatcc gtaaggatgc aaaatggtat + 22021 acttctgaag gtgaagaata cgcggcagtc aaagctcaag ac +// + diff --git a/public/res/serotype_genbank/serotype_5.gb b/public/res/serotype_genbank/serotype_5.gb new file mode 100644 index 0000000..fe5c936 --- /dev/null +++ b/public/res/serotype_genbank/serotype_5.gb @@ -0,0 +1,896 @@ +LOCUS CR931637 19969 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain Ambrose (serotype 5). +ACCESSION CR931637 +VERSION CR931637.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. 
+REFERENCE 1 (bases 1 to 19969) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 19969) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from wzg to aliA and is likely to be responsible for the + expressed capsule serotype. For this particular strain a cps gene + cluster appears to have deleted from the dexB-aliA locus. For a + detailed description of how CDS products were predicted see the + associated publication. 
+FEATURES Location/Qualifiers + source 1..19969 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="Ambrose" + /db_xref="taxon:1313" + gene <1..1422 + /gene="wzg" + /locus_tag="SPC05_0001" + CDS <1..1422 + /gene="wzg" + /locus_tag="SPC05_0001" + /note="member of homology group 0; + DNA sequence does not include 5' end of this CDS" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI32791.1" + /db_xref="GOA:Q4K320" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K320" + /translation="RSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAFRYLNLVVT + ALVLLVTLVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNRLNVTSNYS + EYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLTVNQSSSYL + AAYKNLIAGETKAIVLNSVFENIIESEYPGYASKIKKIYTKGFTKKVEAPKTSKNQSF + NIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADGGNNQKDKL + THAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGIDVYNDQEFTAHTNG + KYYPAGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTSTEALKNYST + IINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRMDLPSYAIPDSNLY + VMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1..93 + /gene="wzg" + /locus_tag="SPC05_0001" + /note="Signal peptide predicted for SPC0099 by SignalP 2.0 + HMM (Signal peptide probability 0.884) with cleavage site + probability 0.473 between residues 31 and 32" + misc_feature 181..528 + /gene="wzg" + /locus_tag="SPC05_0001" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 6.2e-63" + misc_feature 706..1149 + /gene="wzg" + /locus_tag="SPC05_0001" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 1.8e-69" + gene 1424..2155 + /gene="wzh" + /locus_tag="SPC05_0002" + CDS 1424..2155 + /gene="wzh" + /locus_tag="SPC05_0002" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI32792.1" + /db_xref="GOA:Q7WVX2" + /db_xref="InterPro:IPR004013" + 
/db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q7WVX2" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAEAYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTLDALEKLEKKEIPTLNDS + RYALIEFSMHTSYRQIHTGLSNILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QINSYHVLKPKFFGEKYKFMKKRARYFLERDLVHVVASDMHNLDSRPPYMQQAYDIIA + KKYGAKKAKELFVDNPRKIIMDQLI" + misc_feature 1427..2035 + /gene="wzh" + /locus_tag="SPC05_0002" + /note="HMMPfam hit to PF02811, PHP domain, score 2.3e-38" + gene 2164..2856 + /gene="wzd" + /locus_tag="SPC05_0003" + CDS 2164..2856 + /gene="wzd" + /locus_tag="SPC05_0003" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI32793.1" + /db_xref="GOA:Q7WVX1" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q7WVX1" + /translation="MEKQNTLEIDVLQLFRSLWKRKLVILLVAIITSSVAFAYSTFVI + KPEFTSTTRIYVVSRDQGEKSGLTNQDLQAGSYLTKDYREIILSQDVLEEVVSDLKLD + LTPKGLANKIKVAVPVDTRIVSISVNDQVPEGASRIANSLREVAAQKIISITRVSDVT + TLEEARPAISPSSPNIKLNTLIGFLVGLIVINVTVLLLELLDTRVKRPEDIEDALQMT + LLGVVPNLDKLK" + misc_feature 2182..2598 + /gene="wzd" + /locus_tag="SPC05_0003" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 2.9e-50" + misc_feature 2704..2781 + /gene="wzd" + /locus_tag="SPC05_0003" + /note="PS00217 Sugar transport proteins signature 2." 
+ gene 2866..3540 + /gene="wze" + /locus_tag="SPC05_0004" + CDS 2866..3540 + /gene="wze" + /locus_tag="SPC05_0004" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI32794.1" + /db_xref="GOA:Q7WVX0" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q7WVX0" + /translation="MPTLEIVQKKLEFIKKTEEYYNALCTNIQLSGDKLKVISVTSVN + PGEGKTTTSINIAWSFARAGYKTLLIDGDIRNSVMSGVFKSREKITGLTEFLSGTTDL + SHGLCDTNIENLFVVQSGAVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTAPIGVVI + DSAIITQKCDASILVTATGEVNKRDVPKAKQQLEQTGKLFLGVVLNKFNVQHEKYGSY + GNYGKR" + gene 3944..4537 + /gene="wciI" + /locus_tag="SPC05_0005" + CDS 3944..4537 + /gene="wciI" + /locus_tag="SPC05_0005" + /note="member of homology group 29" + /codon_start=1 + /transl_table=11 + /product="putative initial sugar transferase" + /protein_id="CAI32795.1" + /db_xref="GOA:Q7WVW9" + /db_xref="InterPro:IPR003362" + /db_xref="UniProtKB/TrEMBL:Q7WVW9" + /translation="MYSILKRLGDISISLIVITLFCPFFILIAIAIKFDSKGPVIFKQ + KRFGIHKKTFYVFKFRTMKVETPKNVATRDLQNPEQWITRVGTFLRKTSLDELPQLCN + ILVGDMSIVGPRPALWNQFDLIEERDKYGANDILPGLTGWAQINGRDNLSIDMKAELD + GYYVTHKSLLMDIRCIVRTIPYVLKRKGIVEGSQKES" + misc_feature 3944..4051 + /gene="wciI" + /locus_tag="SPC05_0005" + /note="Signal peptide predicted for SPC0103 by SignalP 2.0 + HMM (Signal peptide probability 0.812) with cleavage site + probability 0.384 between residues 36 and 37" + misc_feature 3959..4513 + /gene="wciI" + /locus_tag="SPC05_0005" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 8.1e-32" + gene 4546..5772 + /gene="wciJ" + /locus_tag="SPC05_0006" + CDS 4546..5772 + /gene="wciJ" + /locus_tag="SPC05_0006" + /note="member of homology group 35" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI32796.1" + /db_xref="GOA:Q7WVW8" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q7WVW8" + 
/translation="MKILFVSQHYRPEPFRLSDICEDLVERGHEVTVLTGIPNYPEGK + TYADYRNNKNRRETIEGVTVFRSYTIPRGKSTLHRILNYFSFAISSSIGVLLGQYKAK + DGSEFDCIFVNQSSPVMMAWAAMAYKNKYKKPMFLYCMDVWPDSLTVGGVKQDGLIFK + LFKFISKKVYRASDYIFVTSPSFKNYFVNQFDITEQKITYLPQYAEDLFIPDESRVNK + ESVDLTFAGNIGKAQNLETILKAASLIEKNTDLPKKIQFHFVGDGTELLSMKALAHEL + ELKNVSFYGRRSLEEMPTFYKKSDAMLVSLIGDSIVSRTIPGKVQSYMAAGKPIIGAI + SGDTKTIVEEAKCGFVSPEQDVEQLAQNICKFSMLSTEEQRELGKQARCYYGKHFSKE + QFMTQLENYLREGFSS" + misc_feature 5164..5697 + /gene="wciJ" + /locus_tag="SPC05_0006" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 1e-12" + gene 6003..7208 + /gene="wzy" + /locus_tag="SPC05_0007" + CDS 6003..7208 + /gene="wzy" + /locus_tag="SPC05_0007" + /note="member of homology group 217" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI32797.1" + /db_xref="UniProtKB/TrEMBL:Q7WVW7" + /translation="MESRKKFVCFPNSSLRFYILQAAIALSILSQTPYIWKFSGIPTQ + LLIMPLWILLGVVSIFSRIDMERSFLFFLLTIGCLISTIALLDIVTGVSYVFNGLSQQ + LYLAVGILVLGYWNADVIVHYWKIITMTFLGACLLISVDIYFHYFQGHTFSNIDYVYR + AKNSAASIFLSAVILNLSLYNRKWALWRKVLLLASSGLLIYMCILMRSRAVLLAAAVL + PLVYIWFQETSLGHKIGRTLGVSTVVGAFLLNSAIYDFFINNLFLRVTSEYRPSSLTL + DYVSSNRFVYFEIFAKEISGHELTGIGYYYMDNFFLESFLNYGYIVGTAFVLIALSPM + IYALLQRSSSHRFRMLFLALAFSYTVNALFEGYAPFGPGAKSFILWLVFGCLLNTRIG + KVGEHSETS" + gene 7183..8655 + /gene="wzx" + /locus_tag="SPC05_0008" + CDS 7183..8655 + /gene="wzx" + /locus_tag="SPC05_0008" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI32798.1" + /db_xref="GOA:Q4K313" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K313" + /translation="MVNILKQVSLKWNYVFNLANKLFSLTIPLIVTPYVTRVFSSDHF + GIYTYTNTVASYFVTFTLMGISMYGSKKISLKRHDEIAVNDEYASLLTVQLLNVGLAT + LTYFLYVTFFVNNNQVIYWIQMLYVISAGFDMTWFLSGLERFREIAVRNIIVNVLSAL + MIFFFVHTEADLAIYTLIKVGTIFISQIVIFLPVVRMQRFYLAGAEHIRRTYRGLLLL + FIPVLADTLFQTMDKIMLGIYASYTAVGLYYSSRMVTDIPQTVITSLNIILFPRITHL + 
LSQNKKVESNKLFYQSFILIIALSLATAFGVSAIARDFVGIFFGSSYGAVADYVPSLS + LYICLAAWSGTIRYQYLIPHSLERVYVVAIILGSGINLVLNSLLIPFLGVYGSILATI + ISELVICVYQTYPIRKEIPLKGLLGYVIIFAGLSFLMYLSLGWLRLLLLGRLSTVLLL + ASEIIFGILVFTIATITYIYLGNPILWQAIKKYIESRKNV" + misc_feature 7210..8013 + /gene="wzx" + /locus_tag="SPC05_0008" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 2.5e-31" + gene 8652..9533 + /gene="whaC" + /locus_tag="SPC05_0009" + CDS 8652..9533 + /gene="whaC" + /locus_tag="SPC05_0009" + /note="member of homology group 184" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI32799.1" + /db_xref="GOA:Q4K312" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K312" + /translation="MISIIMPAYNEEKNIGAAIASIQQQTYTDFQLIIVNDGSTDDTA + AIVQEKIMGDERIVFLNPGKIGKVPAYNLASQYVKGDWIYFMGADDQLPLDAFEKWNK + EAQKWNPAEKVALRARMRMVSDSHKYDGLVLPKKNTVRNFSGPLTLLSKEMHRFILPI + PEAYPNEDIWWGLCIEYFGDRVSLIEDVVVYYRVHEGNSISRTSTFEPFNEKYHIRQI + IRRDFLERFSNHLTADQKTKLQRELKLEEARYKGNRLPILLMPGISAVHRLRLLFLSG + RRSYVLKVKLDRFFLGH" + misc_feature 8658..9125 + /gene="whaC" + /locus_tag="SPC05_0009" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 4.3e-28" + gene 9547..10632 + /gene="whaD" + /locus_tag="SPC05_0010" + CDS 9547..10632 + /gene="whaD" + /locus_tag="SPC05_0010" + /note="member of homology group 185" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI32800.1" + /db_xref="GOA:Q7WVW4" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q7WVW4" + /translation="MSKKKISYVTNNIAPFRVMLLDELAKHAEVTLFYVHEIEAGVKA + EYVKLRPVRTKLQSITELGLFQTFQMLKEMDMVFFDGYTGWEKMFLMSSMWLTRRQYA + ISVDGIINHSNISLKQRLLDFIKSVALSKAEFVLSTNTPTDAYIQQLAPKAKIKRHIF + STLSQDDFKNMIEVASDTVFTRYSIRKSEKNLLFVGQFINRKGVDELLAFMKEHEADT + SLQLIMVGGTREELSVFETEIPSNIHIIPFLEKTDILELMRVADVFVLPTREDIWGLV + IIEALSMGIPIVSTDRCNAALEFVRDGENGYLMQEVTAVELANKLKATFKLDAEHVAR + YDQKLMQDYNLEGSAKNIMDILEGIHV" + misc_feature 10072..10572 + 
/gene="whaD" + /locus_tag="SPC05_0010" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 3e-22" + gene 10625..11431 + /gene="whaE" + /locus_tag="SPC05_0011" + CDS 10625..11431 + /gene="whaE" + /locus_tag="SPC05_0011" + /note="previously sequenced as SWALL:Q7WVW3; + member of homology group 186" + /codon_start=1 + /transl_table=11 + /product="hypothetical protein" + /protein_id="CAI32801.1" + /db_xref="UniProtKB/TrEMBL:Q7WVW3" + /translation="MFNSSCALFIVSCETNQQVVNLLIQSMRQQISHMVSIYVSSDGP + LLITDPSVRVLIGQEEVFGDRVATALEQVTEERVIVFCDDFIVEKPAKIEELEELLSL + MEEDTSIASIALSQISGGNTPERIAEHYIRRTKYAPYKTTLQCAIWKKSSLIQFMKGS + PSPWEFEIYHNFKTYLTKEKFYALEDDMFQPIPYNRGKLIIRGKVVKPEKERLEELLG + YSLDLSDFPETESFIQGENLTVGYRLKRKIKLLEKEIIYRLKSKIKNKKK" + gene 11665..12702 + /gene="fnlA" + /locus_tag="SPC05_0012" + CDS 11665..12702 + /gene="fnlA" + /locus_tag="SPC05_0012" + /note="member of homology group 36" + /codon_start=1 + /transl_table=11 + /product="FnlA" + /protein_id="CAI32802.1" + /db_xref="GOA:Q7WVW2" + /db_xref="InterPro:IPR003869" + /db_xref="InterPro:IPR013692" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q7WVW2" + /translation="MFTKKTLLITGGTGSFGNAVLKRFLGTDISEVRIFSRDEKKQDD + MRHEFQAKMPEVADKIRFYLGDVRDLASVKNAMIGVDYVFHAAALKQVPSCEFFPVEA + VKTNVLGTENILTAAIEAGVKQVICLSTDKAAYPVNAMGTSKAMMEKIAVAKSRTVEE + DQTKVCVTRYGNVLCSRGSVIPLWIDQIKQGNPITITEPSMTRFIMSLEEAVDLVLFA + FEKGKTGDILVQKAPACTIEVLAQAVTELFAPNQDIKVIGIRHGEKMYETLLTTEECT + NAIDLGGFYRVPSDNRDLNYDKYFNEGDAKRNPLIEFNSSNTELWNVEQVKEKLLLLP + YIREELASLNQ" + misc_feature 11680..12516 + /gene="fnlA" + /locus_tag="SPC05_0012" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.00038" + misc_feature 11683..12531 + /gene="fnlA" + /locus_tag="SPC05_0012" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 5.2e-165" + misc_feature 11683..12357 + /gene="fnlA" + /locus_tag="SPC05_0012" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 1.5e-13" + 
misc_feature 11686..12327 + /gene="fnlA" + /locus_tag="SPC05_0012" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 4.4e-08" + misc_feature 12532..12675 + /gene="fnlA" + /locus_tag="SPC05_0012" + /note="HMMPfam hit to PF08485, Polysaccharide biosynthesis + protein C, score 1.3e-26" + gene 12711..13922 + /gene="ugd" + /locus_tag="SPC05_0013" + CDS 12711..13922 + /gene="ugd" + /locus_tag="SPC05_0013" + /note="member of homology group 20" + /codon_start=1 + /transl_table=11 + /product="UDP-glucose 6-dehydrogenase Ugd" + /protein_id="CAI32803.1" + /db_xref="GOA:Q7WVW1" + /db_xref="HSSP:1DLI" + /db_xref="InterPro:IPR001732" + /db_xref="InterPro:IPR008927" + /db_xref="InterPro:IPR013328" + /db_xref="InterPro:IPR014026" + /db_xref="InterPro:IPR014027" + /db_xref="InterPro:IPR014028" + /db_xref="InterPro:IPR016040" + /db_xref="InterPro:IPR017476" + /db_xref="UniProtKB/TrEMBL:Q7WVW1" + /translation="MKIAVAGTGYVGLSIAILLAQYHKVIAVDVIPEKVELINRRQSP + IKDDDIETYLVEKELDLVATLDGNEAYRDADFVIIAVPTNYDSKKNYFDTSVVEAVIE + QIIAVNLKATIVIKSTIPVGYTESLRTRFGQFKILFSPEFLRESKALYDNLYPSRIIV + GADLRDTEQVVQAERFATLLQEGSLKPDVETLIMGVTEAEAVKLFANTYLALRVSYFN + ELDTYAEIKGLDTKSIIDGVGLDPRIGSHYNNPSFGYGGYCLPKDSKQLLANYHDVPQ + NMMTAIVESNRTRKYFIADRILKNALELSDGNQTIIVGVYRLTMKSGSDNFRQSSIQG + VIKCLKAKGVEVIIYEPTLEDHSFFFGNQVVNDLEVFKSSSQVIVANRMEKSLYDVLE + KVYTRDIFQRD" + misc_feature 12711..13253 + /gene="ugd" + /locus_tag="SPC05_0013" + /note="HMMPfam hit to PF03721, UDP-glucose/GDP-mannose + dehydrogenase, score 2.1e-52" + misc_feature 12711..13226 + /gene="ugd" + /locus_tag="SPC05_0013" + /note="HMMPfam hit to PF01210, NAD-dependent + glycerol-3-phosphate deh, score 0.0013" + misc_feature 13296..13577 + /gene="ugd" + /locus_tag="SPC05_0013" + /note="HMMPfam hit to PF00984, UDP-glucose/GDP-mannose + dehydrogenase, score 2.6e-36" + misc_feature 13650..13880 + /gene="ugd" + /locus_tag="SPC05_0013" + /note="HMMPfam hit to PF03720, UDP-glucose/GDP-mannose + dehydrogenase, score 0.00029" + gene 
13941..15170 + /gene="fnlB" + /locus_tag="SPC05_0014" + CDS 13941..15170 + /gene="fnlB" + /locus_tag="SPC05_0014" + /note="member of homology group 37" + /codon_start=1 + /transl_table=11 + /product="FnlB" + /protein_id="CAI32804.1" + /db_xref="GOA:Q7WVW0" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR008894" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q7WVW0" + /translation="MPLKILVTGSKGFVGKNLICTLEALKDGRDRTRPNLEIGEIFQY + DRDTDPILLDEYCKKADFVFHLAGVNRPQNPDEFMEGNYGFSSRLLEILEKYENTCPV + LLSSSTQASLEGRFSNSIYGQSKLVGEELFFEYGKKTGAPVLVYRFPNLYGKWCRPNY + NSAVATFCHNLAHDLPIQVNDPSVELELLYIDDLIQECLTALEGNPHRCNLDGLQILP + SPSGNYCYVPTTHRATLGEIVSLLETFKKQPNSLIMPEIPQGSFKKKLYSTYLSYLPV + DKFKFPLKMNIDERGSFTELLKTENKGQFSVNISKPGITKGQHWHHSKWEFFMVVSGR + ALIQERRIGLDENGQEYPILNFEVSGDKIEAIHMIPGYAHNIINLSDTENLVTVMWAN + ESFDPRHPDTFFEQVEK" + misc_feature 13953..14576 + /gene="fnlB" + /locus_tag="SPC05_0014" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 1.6e-08" + gene 15171..16355 + /gene="fnlC" + /locus_tag="SPC05_0015" + CDS 15171..16355 + /gene="fnlC" + /locus_tag="SPC05_0015" + /note="member of homology group 38" + /codon_start=1 + /transl_table=11 + /product="UDP-L-fucosamine FnlC" + /protein_id="CAI32805.1" + /db_xref="GOA:Q7WVV9" + /db_xref="InterPro:IPR003331" + /db_xref="UniProtKB/TrEMBL:Q7WVV9" + /translation="MKIKTDYSDIHFKDNGKLKLLIIVGTRPEIIRLSSVITKCRKYF + DVILAHTGQNYDYNLNGIFFDNLGLDTPDVYMDAVGDDLGATVGNIINTSYKLMNQIK + PDALLILGDTNSCLSAITAKRLHIPIFHMEAGNRCKDECLPEETNRRIVDIISDVNLA + YSEHARKYLHECGLPKERTYVTGSPMAEVLHKNLSAIESSDIHERLGLKKGGYILLSA + HREENIDTDKNFISLFTAINQLAEKYNMPILYSCHPRSKKRLQESGFKLDKRVIQHEP + LGFHDYNCLQMNAFVVVSDSGTLPEESSFFTSQGYPFPAVCIRTSTERPESLDKAGFI + LAGIDENSLLQAVETAVSLAEDEDFGLPVPDYVEENVSTKVVKIIQSYTGIVDKIVWR + KS" + misc_feature 15282..16310 + /gene="fnlC" + /locus_tag="SPC05_0015" + /note="HMMPfam hit to PF02350, UDP-N-acetylglucosamine + 2-epimerase, score 
2.6e-103" + gene 16556..17264 + /gene="tnp" + /locus_tag="SPC05_0016" + /pseudo + CDS join(16556..16933,16917..17264) + /gene="tnp" + /locus_tag="SPC05_0016" + /note="member of homology group 31" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1671 transposase" + misc_feature 16935..17261 + /gene="tnp" + /locus_tag="SPC05_0016" + /note="HMMPfam hit to PF05717, IS66 Orf2 like protein, + score 3.9e-55" + /pseudo + gene 17332..17505 + /gene="tnp" + /locus_tag="SPC05_0017" + /pseudo + CDS 17332..17505 + /gene="tnp" + /locus_tag="SPC05_0017" + /note="Lone member of homology group 0218" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative ISPSy5-like transposase (fragment)" + gene order(17768..18205,18281..18907) + /gene="tnp" + /locus_tag="SPC05_0018" + /pseudo + CDS join(17768..18205,18281..18907) + /gene="tnp" + /locus_tag="SPC05_0018" + /note="member of homology group 12" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1670 transposase" + misc_feature join(17768..18205,18281..18301) + /gene="tnp" + /locus_tag="SPC05_0018" + /note="HMMPfam hit to PF03050, Transposase IS66 family, + score 2.4e-06" + /pseudo + gene complement(19192..19541) + /gene="tnp" + /locus_tag="SPC05_0019" + /pseudo + CDS complement(join(19192..19410,19398..19541)) + /gene="tnp" + /locus_tag="SPC05_0019" + /note="member of homology group 219" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1380-Spn1 transposase (fragment)" + gene 19817..>19969 + /gene="aliA" + /locus_tag="SPC05_0020" + CDS 19817..>19969 + /gene="aliA" + /locus_tag="SPC05_0020" + /codon_start=1 + /transl_table=11 + /protein_id="CAI32810.1" + /db_xref="UniProtKB/TrEMBL:Q4K305" + /translation="MMKSSRLLALAGVTLLTATTLAACSGSGSSTKGEKTFSYIYETD + PDNLNYL" + misc_feature 19817..19903 + /gene="aliA" + /locus_tag="SPC05_0020" + /note="Signal peptide predicted for SPC0121 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.270 
between residues 29 and 30" +ORIGIN + 1 cgttcacaga aagtgaagcg aagtgttaat atcgttttgc tgactattta tttattgtta + 61 gtttgttttt tattgttctt aatctttaag tacaatatcc ttgcttttag atatcttaat + 121 ctagtggtaa ctgcattagt cctactagtt accttggtag ggctactctt gattatctac + 181 aaaaaagctg aaaaatttac tatttttctg ttggtgttct ctattcttgt cagctctgtg + 241 tcgctctttg cagtacagca gtttgttgga ctgaccaatc gtttaaatgt gacttctaat + 301 tactcagaat attcaatcag tgtcgctgtt ttagcagata gtgagatcga aaatgttacg + 361 caactgacga gtgtgacagc accgactggg actgataatg aaaatattca aaaattacta + 421 gctgatatca agtcaagtca gaataccgat ttgacggtca accagagttc gtcttacttg + 481 gcagcttaca agaatttgat tgcaggggag actaaggcca ttgtcctaaa tagtgtcttt + 541 gaaaacatca tcgagtcaga gtatccaggc tacgcatcga agataaaaaa gatttatacc + 601 aagggattca ctaaaaaagt agaagctcct aagacgtcta agaatcagtc tttcaatatc + 661 tatgttagtg gaattgacac ctatggtcct attagttcgg tgtcgcgatc agatgtcaat + 721 atcctgatga ctgtcaatcg agataccaag aaaatcctct tgaccacaac gccgcgtgat + 781 gcctatgtac caatcgcaga tggtggaaat aatcaaaaag ataaattgac tcatgcgggc + 841 atttatggag ttgattcgtc cattcacacc ttagaaaatc tctatggagt agatatcaat + 901 tactatgtgc gattgaactt cacttcgttt ttgaaaatga ttgatttgtt gggtggaatt + 961 gatgtttata atgatcaaga atttactgcc catacaaatg gaaagtatta ccctgcaggc + 1021 aatgttcatc ttgattcaga acaggctctc ggttttgttc gtgagcgcta ctcactagca + 1081 gatggcgatc gtgaccgtgg gcgcaatcaa caaaaggtga ttgtggctat ccttcaaaaa + 1141 ttaacgtcaa ccgaagcact gaaaaattat agtacgatca ttaatagctt gcaagattct + 1201 atccaaacaa atatgccact tgagaccatg ataaatttgg tcaatgctca gttagaaagt + 1261 ggagggaatt ataaagtaaa ttctcaagat ttaaaaggga caggtcggat ggatcttcct + 1321 tcttatgcaa taccagacag taacctctat gtgatggaaa tagatgatag tagtttagct + 1381 gtagttaaag cagctataca ggatgtgatg gagggtagat gaaatgatag acatccattc + 1441 gcatatcgtt tttgatgtag atgacggtcc caagtcaaga gaggaaagca aggctctctt + 1501 ggcagaagcc tacagacagg gggtgcgaac cattgtctct acctctcacc gtcgcaaggg + 1561 catgtttgaa actccggaag agaagatagc agaaaacttt cttcaagttc gggaaatagc + 1621 
taaggaagtg gcgagtgact tagtcattgc ttatggcgca gagatatact atactctgga + 1681 tgctctagaa aagctagaaa aaaaagaaat tcctaccctt aatgatagtc gttatgcttt + 1741 gattgagttt agcatgcata cttcctatcg tcagattcat acgggattga gcaatatttt + 1801 gatgttggga atcacgccag taattgctca tattgaacgg tatgatgctt tagagaataa + 1861 cgaaaaacgt gttcgtgaac tgattgatat gggatgctat actcagataa atagttatca + 1921 tgttttaaaa cctaagttct ttggtgaaaa atataaattc atgaaaaaga gagctcggta + 1981 ttttttggaa cgtgatttag ttcatgtagt tgcaagtgac atgcacaatt tagacagtag + 2041 acctccatat atgcaacagg catatgatat cattgctaag aaatatggag cgaaaaaagc + 2101 gaaagaactt tttgtagata atcccagaaa aattataatg gatcaattaa tttaggagaa + 2161 aatatggaga aacaaaacac tttggaaatc gatgtattgc aactattcag atctttatgg + 2221 aaaagaaagt tggtcatttt attagtggca attataactt cttcagttgc ttttgcctac + 2281 agtacttttg ttatcaaacc tgagtttact agtacgactc ggatttatgt agttagccgt + 2341 gatcagggag agaagtctgg tttaaccaat caagacttgc aggcaggatc gtacttgact + 2401 aaagactatc gtgaaattat cctatcgcag gatgttttgg aggaagttgt ttctgatttg + 2461 aaactagatt tgacgccaaa aggtttggct aataaaatta aagtggcagt accagttgat + 2521 acccgtatcg tgtctatttc ggttaatgat caagttcctg aaggggcaag ccgtatcgct + 2581 aactctttga gagaagtggc ggctcaaaaa attatcagta ttactcgtgt ttctgatgtg + 2641 acaacactgg aggaggcaag accagcgata tcaccgtctt cgccaaatat taaactcaat + 2701 acactaattg gttttttggt aggattgatt gtcataaatg ttacagttct tcttcttgaa + 2761 cttttggaca cacgagtgaa acgtccggaa gatatcgaag atgcactaca gatgacactt + 2821 ttgggggttg taccaaactt ggataagttg aaataggaga gagagatgcc gacattagaa + 2881 atagtacaaa aaaaactgga gttcattaag aagacagagg aatattacaa tgccttgtgt + 2941 acaaacatac agttgagcgg agataaacta aaagtgattt ccgttacttc tgttaaccct + 3001 ggagaaggga aaacaactac ttctataaat atagcatggt cttttgcgcg tgcaggatat + 3061 aaaactcttt tgatagatgg cgatatccga aattcggtga tgtcaggagt ttttaaatct + 3121 cgtgaaaaaa ttacaggctt aacagaattt ttatctggta caactgattt atctcacggt + 3181 ttatgtgata caaatattga aaatttattt gtagttcaat cgggagctgt atcaccaaac + 3241 cctacagcct tgttacaaag 
taaaaatttt aatgatatga ttgaaacctt gcgtaaatat + 3301 tttgattata tcattgttga tacagcacct attggagttg ttattgattc ggcaattatc + 3361 actcaaaagt gtgatgcgtc tatcttggta acggcaacgg gtgaggtgaa taaacgtgat + 3421 gtcccaaaag cgaaacaaca attagaacaa acagggaaac tatttttagg tgtcgttctc + 3481 aataaattta atgttcaaca tgaaaaatat ggttcttacg gtaattatgg taaaagataa + 3541 aatgaatata gtatggaagg ggctacaata taactctggc attctgaact gcaccccaaa + 3601 agttagacag aaaaaatcta acttttgggg gtcagtacat tcttacaggg tacacttgtt + 3661 agtttattag cttagatact gattgcaatt tcagaaaccg atattttttc aaataaatat + 3721 tcggtctgtt tggaagtgca atcgaactga actttccaat gctttattgg gcatcatata + 3781 ttaccgaaac aaataaattt tgttatattg gatgatgttg ttatgttatt gtaaaaatat + 3841 tgtgtgacca aatatattga gtctttgtgg tctaataggc tgatatattt aatttgataa + 3901 ataaaaataa gatgaagttt gaatttagag tgagagatag tttatgtata gtatattaaa + 3961 acggttagga gatatatcta tatctttaat agttataacg ttattttgtc cattttttat + 4021 cctaattgca attgcgatta agtttgattc aaaaggacct gtaatattta aacaaaaacg + 4081 ttttggaatt cacaaaaaaa ctttttatgt ttttaaattt cggactatga aagtggagac + 4141 accaaaaaat gtggcaactc gagatttaca aaatccagag cagtggatca ctagagtggg + 4201 aactttctta aggaaaacat ctctagatga attgcctcaa ttatgtaata ttcttgttgg + 4261 tgatatgagt attgtaggac caagacctgc cctttggaat caatttgatt tgattgaaga + 4321 aagagacaaa tatggagcaa atgatatttt acctggttta acaggttggg cacaaatcaa + 4381 tggtcgtgat aatctatcaa tagatatgaa agctgaattg gatggatact atgtgacaca + 4441 taaatcgttg ctaatggaca ttagatgtat agtaagaaca ataccttatg tgctgaaacg + 4501 caaaggaatt gtagagggaa gtcaaaaaga gagttaagtt gtacgatgaa aattttattt + 4561 gttagtcaac attatagacc agaacctttt agattatcag atatttgtga ggatcttgtt + 4621 gagagaggtc atgaagttac tgttttgaca ggaattccta attatcctga aggtaaaaca + 4681 tatgcggatt atcggaataa caaaaataga cgagagacta tagaaggagt tactgttttt + 4741 cgttcctata caattccaag gggaaaaagt actttacata ggatattaaa ttattttagt + 4801 tttgctatca gttcctcgat aggggttcta ctgggacagt ataaagcaaa agatggatca + 4861 gaatttgatt gtatttttgt aaatcaatcg tctccagtta 
tgatggcatg ggctgctatg + 4921 gcttataaaa ataaatataa gaaacctatg tttctgtatt gtatggatgt ttggccagat + 4981 agtttaactg taggtggagt gaaacaagat ggcttgattt tcaagttgtt taaatttata + 5041 tcgaaaaaag tttatcgagc tagtgattat atatttgtta ctagtccatc atttaagaat + 5101 tattttgtga accaatttga cataacagaa caaaagatta cttatttgcc acaatatgca + 5161 gaagatcttt ttatccctga tgaatctaga gttaataaag aaagtgttga cctaactttt + 5221 gctggtaata ttggcaaagc acaaaatttg gaaactattt tgaaagctgc cagtttgata + 5281 gagaagaata ccgatctacc caagaaaatt caatttcatt ttgttggaga tggtacggaa + 5341 ttgctaagta tgaaagcatt agctcatgaa ttggagttaa agaatgtttc cttctatgga + 5401 agacgttctt tggaagaaat gcctaccttc tataaaaaat cagatgctat gttagtttct + 5461 ttaataggag actcgatagt ttctcgtact atacctggga aggtacaatc ttacatggcg + 5521 gcagggaaac caattatagg tgcaatttca ggagatacta aaacaattgt agaagaagca + 5581 aagtgtggtt ttgtcagtcc tgaacaagat gtggaacaat tggcacaaaa tatttgtaaa + 5641 tttagtatgt tgtctacgga agaacaaaga gagttaggaa agcaagctcg ttgttactat + 5701 gggaagcact tttctaaaga gcagtttatg acacagttag aaaattattt gagagagggc + 5761 ttttcctcat gagaatttta atgattaata ctgtttgtgg tattaggagt atagatactt + 5821 tgttaaagaa atttgctgag atttggcgtt tcaatttata ggatttgaaa gtttagtaag + 5881 taaatttaag tattttctgt aagataataa gttcttaatg acttattaac tattgtataa + 5941 tagctgtaat tccaaataaa agtacatagg tactgacatg ttgacgatag taaggaggag + 6001 gaatggaatc ccgaaagaaa tttgtttgtt ttcccaatag tagtttgcgt ttttatattt + 6061 tgcaggcagc gattgcctta tctattttat cgcagactcc ctatatctgg aagtttagtg + 6121 ggatacctac acaacttctg attatgcctt tgtggatcct gttgggagta gtgtctattt + 6181 tttctagaat tgacatggaa cgatcattcc tatttttttt attaacaata ggttgtttaa + 6241 ttagcactat tgctttgtta gatatagtta cgggagtatc ttatgtcttt aatggtttgt + 6301 ctcagcaact ctatttggct gtgggaattc tagttttagg ctactggaat gctgatgtga + 6361 ttgttcatta ttggaaaatc atcaccatga cttttttggg agcatgtttg ctgatttcag + 6421 tggatattta ttttcactac tttcaaggac atactttttc aaatattgat tatgtttatc + 6481 gagctaagaa ttcagcggca tctatctttt tatcggcagt tattctcaac ttgtctctat + 6541 
ataatcgcaa gtgggcactg tggagaaaag tattgttatt agctagtagc ggattgctga + 6601 tttacatgtg catccttatg cggtcacgag cagttctgtt agcagctgca gtacttccgc + 6661 tagtttatat atggtttcag gagacgtctt tggggcataa gattggacgg acattaggag + 6721 tttcaacagt agtaggtgcg tttttgctca attcagctat ttatgatttt tttatcaata + 6781 atctattttt aagggtcaca tctgaatatc gaccatctag tctgactttg gactacgttt + 6841 cctccaaccg ttttgtgtat tttgagatct ttgctaaaga aatttcagga catgaattaa + 6901 cagggattgg ttattattat atggataatt tttttctaga gagttttctc aattatggtt + 6961 atatagtagg gactgctttt gttttaatag ccttgtctcc catgatttat gccctcttgc + 7021 aacgttcttc ttctcatcgt ttccgcatgc tttttttagc ccttgctttt tcttatactg + 7081 tcaatgcctt atttgaaggt tacgcgccat ttggtcctgg tgccaagagt tttattcttt + 7141 ggttagtttt tggttgcctt ctgaatacac gaattggaaa ggttggtgaa cattctgaaa + 7201 caagttagtc taaagtggaa ctatgtgttt aatcttgcca ataaactatt ttctctaact + 7261 attccactta ttgttactcc ctatgtcact cgagtctttt cttcagatca ttttgggatt + 7321 tatacttata ccaatacagt tgcttcttac tttgttacct ttacattgat ggggataagt + 7381 atgtatggaa gtaagaaaat ttctcttaaa agacatgatg agatagcagt caatgatgaa + 7441 tatgcttcct tactgactgt ccagctgctt aatgtaggtc tagccacgtt aacttacttt + 7501 ctctatgtga ccttttttgt caataataat caagttattt attggatcca gatgttgtat + 7561 gtgatttctg ctggttttga tatgacttgg tttttatcag gattggaacg ttttcgtgaa + 7621 attgctgttc gaaatatcat tgtaaatgtc ttatcagccc tcatgatttt tttctttgtg + 7681 catacggagg ctgatttggc tatctatacc ttaataaagg tagggacgat ttttatcagt + 7741 cagattgtta tttttttacc agttgttcgg atgcaacggt tttatcttgc aggagctgaa + 7801 catattcgac gtacctatcg aggcttgctt ttgttgttta tccctgtttt ggcagacacc + 7861 ctttttcaaa ctatggataa gatcatgcta ggtatctatg catcctatac tgctgtgggt + 7921 ttgtattact caagtaggat ggttactgac atcccgcaaa ctgtcattac ttctctcaat + 7981 ataatcttat ttccacgaat aacacatctt ttaagtcaga ataaaaaagt tgaatctaat + 8041 aaactttttt atcagtcttt tatcttaatt attgctttat ctctagctac agcttttgga + 8101 gttagtgcta ttgctaggga ttttgtaggt attttttttg gatcttcata tggtgcggta + 8161 gcagattatg tgcctagttt 
atcgctctat atctgccttg ctgcctggag tggaacgata + 8221 cgttaccaat atctgattcc tcattcactt gagagagtct atgtagtagc gattattttg + 8281 ggaagtggga tcaatctagt tttaaactct ctcttaattc cttttttggg agtatacggt + 8341 tccattttag ctactattat atcagaatta gtgatttgtg tttaccagac atatcctatt + 8401 cgaaaggaaa ttcctcttaa aggattgtta ggatatgtga tcatttttgc aggcttgtct + 8461 tttcttatgt atctatctct tggttggcta cgattgttat tgctaggccg cctatccaca + 8521 gtattgctat tggcaagtga aataatattt ggtatccttg tttttactat cgcaactata + 8581 acctatattt atctaggtaa cccaatttta tggcaagcta ttaaaaaata tatagaaagt + 8641 aggaaaaacg tatgatctct atcattatgc cagcttataa tgaagaaaaa aatatcggag + 8701 cagctattgc cagtattcaa cagcaaacct atacggactt tcagttgatt atcgtcaatg + 8761 atggatctac agatgatacg gcagctattg tacaggaaaa aatcatggga gatgagcgaa + 8821 ttgtcttttt gaatcctgga aagattggca aggtaccagc ttataacttg gcttcacagt + 8881 atgtaaaagg agactggata tattttatgg gagcggatga ccagttgcca ttggatgcct + 8941 ttgaaaagtg gaacaaggag gctcaaaagt ggaatcctgc tgaaaaggtg gctttaagag + 9001 ctcgcatgcg gatggtttct gactctcaca agtatgatgg attggtatta ccaaagaaaa + 9061 atacagttcg caattttagt ggacctctta ccttgctttc aaaagagatg caccgtttta + 9121 tccttcctat acctgaggcc tatccgaacg aagatatttg gtgggggcta tgtattgagt + 9181 atttcggaga tcgtgtttcg ttgattgagg atgttgtggt ttattatcgt gttcatgagg + 9241 ggaattctat atcccgaacc tcaacttttg aaccttttaa cgagaaatat catatccgtc + 9301 agattatccg tcgtgatttt ttagagagat ttagcaatca cttaacagca gaccagaaga + 9361 ctaaacttca gcgtgaattg aaactagaag aagcacgcta taaaggaaat agattgccaa + 9421 ttcttctgat gccaggtatt tctgcagtac acagacttcg attacttttt ttatcgggta + 9481 ggcgttcata tgtacttaaa gtcaaattgg atcgcttttt cttaggacat tagaaagaag + 9541 gaagagatgt caaagaaaaa aatttcttat gttacaaata atattgctcc ttttagggtt + 9601 atgttattag atgagttagc caagcatgca gaagtgactc ttttttatgt gcacgaaatt + 9661 gaggcggggg taaaggctga gtatgtcaag ctacgacctg ttcgtaccaa gctccaatca + 9721 atcacagaac taggtttatt tcagacgttt caaatgttga aagagatgga tatggtcttc + 9781 tttgatggct atactgggtg ggaaaagatg ttcttgatga 
gcagtatgtg gctaacaaga + 9841 cggcagtacg ctatttctgt tgatggtata ataaatcata gtaatatctc acttaagcag + 9901 agactgttgg attttattaa gtctgttgct ctaagcaaag cggagtttgt gcttagcacc + 9961 aataccccaa cagatgctta tatacagcaa ttagctccca aggcaaagat taaacgacac + 10021 atattttcaa ctctttcaca agatgatttc aaaaacatga tagaggttgc ctcggatacg + 10081 gttttcacaa gatatagtat tcgaaaatct gagaaaaatc tgctttttgt gggacagttt + 10141 atcaatagaa aaggagtcga tgagcttttg gcttttatga aagagcacga agctgatact + 10201 tcgttgcagt taattatggt cggaggtaca agagaagaat tgtcagtttt tgaaacagag + 10261 attccttcta atatacatat aattcctttt ctagaaaaaa ctgatatcct agagttgatg + 10321 cgggtggcag atgtctttgt tttgcccact cgagaagata tttggggact ggttattata + 10381 gaggcgctat caatgggcat tcctattgtt tctacggatc gttgtaacgc agccttggag + 10441 tttgttaggg atggcgaaaa tggttatctg atgcaggaag tgactgcggt agaattggct + 10501 aacaagctta aggctacctt taaactagat gctgagcatg ttgctcgcta tgatcaaaaa + 10561 ctgatgcaag actataatct ggaaggttca gcaaaaaata ttatggacat cttggaggga + 10621 attcatgttt aattcatctt gtgctttatt tattgttagt tgcgagacta atcagcaggt + 10681 agtcaatctc ctcatccagt ccatgcgtca gcagatttct catatggtat ccatttatgt + 10741 atcatcagat ggcccattgt taatcacgga tcctagcgta agggttttga ttggtcagga + 10801 agaagttttt ggagatcgtg ttgcaactgc tttggaacaa gttactgaag agcgagtcat + 10861 tgttttttgt gatgacttta tcgtagaaaa accagctaaa attgaagaat tagaagaact + 10921 actgtctcta atggaagagg atacaagtat tgctagtatt gccctgtcac aaatatctgg + 10981 agggaataca cctgagcgta ttgctgagca ttatataaga cgcacgaaat atgcccccta + 11041 taagacaact cttcaatgcg ctatttggaa gaagtctagt ttgattcaat tcatgaaggg + 11101 gagtccctct ccttgggaat ttgagattta tcataacttt aaaacttacc tgacgaaaga + 11161 gaaattttat gctttagagg atgatatgtt ccaacctatc ccttataata gaggaaagtt + 11221 gattattcga ggtaaagttg ttaaacctga aaaagaacgt ttggaggaac ttttgggtta + 11281 ttcattagat ttatcggatt tcccagaaac ggagtctttt atccaggggg aaaatcttac + 11341 tgtaggctat cggttgaaga gaaagattaa attgttagaa aaagaaatta tttatcgttt + 11401 gaaatctaaa ataaagaata agaaaaaata gtgaaaaaga 
aagtttataa tatttggtgg + 11461 atgcaaaaga tttaaagatt gagttatctt tatttctaca cctttaaaaa atatagcttt + 11521 tcttttggat aaggtgtatg ttgaaattct caccaatatt atcagtcaga aaaatattgt + 11581 agtgcgttat ttttcatgtt gttaagcttt aaatttattt aaaaagcatt atgttgaaca + 11641 tcattataga taggagtaat aactatgttt acaaagaaaa ctctccttat tacagggggg + 11701 acaggttcat tcgggaatgc agttctcaaa cgatttttgg gaacagatat ttcggaggta + 11761 cgtatctttt caagagatga gaagaaacag gatgatatgc gtcatgaatt tcaagcaaaa + 11821 atgccagaag tagctgataa gatacgtttt tacttaggag atgtgcgtga tttagcttct + 11881 gttaaaaatg ctatgatcgg tgtggattac gtatttcatg ctgctgcatt aaaacaagtc + 11941 ccttcttgtg aatttttccc tgtggaagca gtcaaaacta acgttctagg aactgaaaat + 12001 attctcactg cagctataga agctggagta aaacaagtca tctgcctttc tacagataag + 12061 gcagcctatc ctgttaatgc gatgggaacc tctaaggcta tgatggaaaa gattgctgtt + 12121 gctaagtcaa ggacggtaga agaagatcag acaaaagtct gtgtaactcg ctacggcaat + 12181 gttctatgta gtcgtggttc tgtgattccc ctatggattg atcaaataaa gcaagggaat + 12241 cctataacga ttacggaacc tagtatgact cgttttatta tgtccttaga agaagcggta + 12301 gacctagttc tgtttgcttt tgaaaaagga aaaacaggag atatcctagt acagaaagca + 12361 ccagcatgta ccattgaagt gttggcgcaa gctgttacgg aactttttgc acctaatcaa + 12421 gatattaaag taatcgggat tcgccacggt gaaaagatgt atgaaacgtt gttgactact + 12481 gaagaatgta cgaatgccat tgatttaggc ggcttttatc gtgtgcctag cgataatcga + 12541 gatcttaact atgataagta tttcaacgaa ggggatgcca aacgcaatcc cttaatagag + 12601 tttaacagta gtaatacaga actctggaat gtcgagcagg ttaaggaaaa actcttactt + 12661 ttgccctata ttagggaaga attagcatct ttaaatcagt gaggtatcct atgaaaatag + 12721 cagtagcagg gacaggttat gtgggtttat ctattgcaat tctattagcg caatatcata + 12781 aggttatagc ggtagatgtt attcctgaaa aagtagagct tatcaatcgt cgccaatctc + 12841 ccattaagga tgatgatatt gaaacttatt tagtggaaaa ggaattagac ttagttgcaa + 12901 cattagatgg taatgaagct tatcgagatg ctgactttgt cataattgct gtcccaacta + 12961 actatgacag taaaaaaaat tattttgata catctgttgt ggaagcagtt attgagcaga + 13021 ttattgcggt taatttgaag gcaacaattg tcataaaatc 
cacaattcct gtgggatata + 13081 cagaaagtct ccgaacacgt tttgggcaat ttaagattct ctttagtcct gaatttttac + 13141 gggagtctaa agcactttat gataatctct atcctagtcg aatcatcgtt ggagcagatt + 13201 tgagagatac ggagcaggta gttcaggctg agcggtttgc aactcttttg caggaaggtt + 13261 cacttaaacc tgatgttgag accttaatta tgggtgtaac agaggcagaa gcagtcaaac + 13321 tatttgccaa cacctatttg gctttgcggg tttcttactt taacgaattg gatacctatg + 13381 cggagataaa gggattggac actaaatcca tcattgacgg agtagggtta gatccacgaa + 13441 ttggtagcca ttataacaat ccgtcatttg gttatggagg ttattgtctt cccaaagata + 13501 gtaagcagtt gctggcgaat tatcatgatg taccacaaaa tatgatgaca gctattgtag + 13561 aaagtaaccg tactcgcaag tattttattg ccgatcgtat tttgaaaaat gcgttggagc + 13621 tttcagacgg taatcaaaca atcatagtag gtgtttaccg cttaactatg aagagtggtt + 13681 cggataattt ccgtcaatca tcaatccaag gtgttataaa atgtttaaag gccaaaggtg + 13741 tagaagtaat tatctatgaa ccaactttgg aggatcatag ctttttcttt ggtaatcagg + 13801 tggttaatga tttggaagtt tttaagtcta gcagtcaagt gattgttgcc aatcggatgg + 13861 aaaaatcttt atatgatgtg ctagaaaaag tttatacaag agatattttt cagcgagatt + 13921 aagtatatgg agggaaaaat atgccattaa aaattttagt gactggttct aaaggatttg + 13981 taggaaaaaa tcttatctgt actctggaag ctttgaaaga tggacgagat aggactcgtc + 14041 ctaatttaga gattggagag atttttcagt atgatcgtga tacagatccg attttattag + 14101 atgaatattg taagaaggcc gatttcgtat tccatttagc tggtgtcaat cgtccacaga + 14161 atcctgatga attcatggag ggaaattacg gtttttcaag tagattattg gagattttag + 14221 aaaagtatga aaacacttgt cctgttctac tctcaagttc tactcaagct agtttagaag + 14281 gccgattttc aaactctata tatggacaat ctaagctagt aggggaagaa ctcttctttg + 14341 aatatggaaa gaaaacggga gcacctgtct tagtttaccg tttcccgaat ctttatggga + 14401 agtggtgccg tcctaactac aattctgctg tagcaacttt ctgtcataat ctagctcacg + 14461 atttacctat tcaagtaaat gatccaagtg tagaattgga gttgctgtat attgatgatt + 14521 tgatacaaga gtgtctaact gcattggaag gaaatcctca tcgttgtaat ctagatggat + 14581 tacaaatctt acctagccca tcaggaaact actgctacgt accaacgact catcgtgcaa + 14641 ccttaggaga gattgtctct ctattagaaa catttaaaaa 
acagcctaat agtttaatta + 14701 tgcctgaaat tcctcaagga tcgtttaaaa agaaattgta ttctacctac ctatcttatt + 14761 taccagtaga taagtttaag tttcctctaa aaatgaatat agatgaacga ggtagtttta + 14821 cggaattatt aaaaacagaa aataagggtc aattttctgt taatatttct aaacctggca + 14881 ttaccaaagg gcaacattgg catcattcta agtgggaatt tttcatggtt gtttctggtc + 14941 gtgctttaat acaagagcgt aggatagggc tggatgaaaa cggtcaagag tatcctattc + 15001 tgaactttga agtgtcgggc gataagattg aagcaataca tatgataccg ggctatgcac + 15061 ataatattat taatctttct gatacagaaa atctagttac tgtcatgtgg gctaatgagt + 15121 catttgatcc tagacatcca gatacttttt ttgaacaagt ggagaaataa atgaaaatta + 15181 agacagatta tagtgatatt cactttaaag ataatggcaa acttaagtta ttgattattg + 15241 tgggaacacg tccagagatt atacgtctaa gtagtgttat cactaaatgt cgaaagtatt + 15301 ttgatgttat tttggcacat actggacaaa actatgatta caatttaaat ggtattttct + 15361 ttgataattt agggttagac actccggatg tatacatgga tgctgttgga gatgatcttg + 15421 gtgctactgt agggaatatt attaatactt catacaaatt gatgaatcaa attaaaccag + 15481 atgctttatt gattttaggg gatacaaatt cttgtttatc agctattact gccaagcgtt + 15541 tacatattcc aatttttcat atggaggctg gcaatcgctg taaggatgag tgcctgccgg + 15601 aagagactaa tcgtcggatt gttgatatta tttcagatgt taacttagca tactctgaac + 15661 atgcacgtaa gtatttacat gagtgtggtt tacctaaaga gcgcacatat gtaacaggtt + 15721 ctcctatggc agaagtgtta cataaaaatt tatctgccat tgagtcttca gatatccatg + 15781 aacgtttggg attgaaaaaa ggaggttata tcttactttc agctcaccgt gaggaaaata + 15841 ttgatacaga taaaaatttt atttctctct ttacagcaat taatcaatta gctgaaaagt + 15901 ataatatgcc aatcttatat tcttgccatc ctagatcaaa gaaaaggcta caagagagcg + 15961 gttttaaact agataaacgt gtgattcagc atgagccact aggattccat gactataatt + 16021 gtttacagat gaatgcattt gttgtagtat ctgattcggg aactttaccg gaagaaagta + 16081 gtttctttac tagtcaaggt tatccttttc ctgctgtatg tattcgtaca agtacagaac + 16141 gtcctgagtc cttagataag gcaggattta ttttggcagg cattgatgaa aattctcttc + 16201 ttcaagcagt tgaaactgct gttagcttgg cagaagatga ggattttgga ttaccggttc + 16261 cagattatgt tgaggaaaat gtctctacta aagttgttaa 
gataatacag agctatacag + 16321 ggatagtgga taaaatagtt tggaggaaaa gctgaattgt atatttttaa taaatcaaaa + 16381 cgagatgatt aattcttagt agaacaagag taaaattgaa cgtatttgat ggaaatgtct + 16441 tacttgatag tcgagggata gccattctat cggatttttg gcttgttttt gcgcttcatg + 16501 tttgatagaa taaagggctc tttgttaact gtagtgggtt gaagaaaagc taagcttgag + 16561 aaaggacaaa tttcgtcctt tcttttttga tgttcagagc gatgaaaatc cgttttttga + 16621 agttttcaaa gttccgaaaa ccaaaggcat tgcgcttgat aagtgtaagc gcgtcataac + 16681 aaggtatcta tcattcatgg agctcctcct gtatactatt agtaaagtaa aactattgga + 16741 ggatatttta atgccacaac ctattgttcc tgtagagatt ccacaatctc gtcgttttga + 16801 ttctaaaaag agaaatgata ttctacttaa aattcgtatt ggcaagcttg aagtaagttt + 16861 ttttcaatct ctcaatctcg aaatgataga acagcttttg gataaggtgt tgctctatga + 16921 caattcatct atctagccta gggcaggtct atctcgtatg tgggaaaacg gatatgaggc + 16981 aaggcattga ttcactggct tatctggtta aaacccactt tgaattagat cctttctcag + 17041 gtcaagtttt tctcttttgt ggtggacgta aagaccgctt taaagccctt tactgggatg + 17101 gtcaaggatt ttggctacta tataaacgct ttgagaacgg cagactgact tggcccagta + 17161 cagaaaagga tgtcaaagct ctcacacctg aacaagtaga ctggcttatg aagagctttt + 17221 ctatcactcc caaaataaac tcatcagaaa gtcgtgattt ctattgaaat gaggactttc + 17281 tttttagtat aataaagtta gaaaacagag agggaagctc atggaagaag attgaaaatc + 17341 attcaacaac agagtgctac aattgatagt ctcaccaatg aacttgccct tcttcgtgaa + 17401 caagtggctt atctgactca aaagctctat ggaaaatcct ctgagaaaag tgtttgcccc + 17461 tctggacaac tcaacctttt tgaggaagat ggagatgttc ccagttgaaa cagaggaaat + 17521 tacccacaaa cgtaagaaat ctaaagggaa acgccaagct cttcttgccc aatttgattc + 17581 agaagaagtt catcatcaag tagaagagag catttgccct gattgtcagg gagatctaaa + 17641 agagattgga gcaacccttc aacgacaaga attagtcttt attcctgcgc aattaaaacg + 17701 aatagatcat atccaacacg cttataagtg ccaagcatgc agtgataaaa atccgagtga + 17761 taaaatcgtg aaagctccta ttcctaaagc ccctttggcg catagctttg gctcagcttc + 17821 tattatcgct cacaccatcc atcagaagtt taatctgaag gtacccaatt atcgccaaga + 17881 agaagattgg gctaggatgg gtttaccaat cacacgtaag 
gaaatctcta attggcatat + 17941 caaggcaagt caatactatt tagagtccct ttataacctt ttacgagaaa agttgttaga + 18001 acaacctctt cttcatgcgg atgaaacctc ctatcgggtt ctagagagtg atagtcagct + 18061 gacttactat tggacttttt tgtcaggtaa agctgagaat caagcaatca cgctgtacca + 18121 ccatgatcag cgtcggagtg gttcggtagt gcaagaattc ctaggaaatt attctggcta + 18181 tgtgcattgt gatatgttgc ggcagtaact taggacttta gtcctctagt tctgcctatg + 18241 cgatagcagt ccaaggttta ggagcaaggc gacgctaagc ttggtaaact gcgaaccgct + 18301 agaagcttat cgtcaactgg aagaagctga acttgttgga tgttgggcgc atgtgagaag + 18361 gaaatttttt gaagcgcccc ccaagcaagc ggataaatca tcgttaggag ctaaaggttt + 18421 agcttattgt gatcagttat tttccttgga aagagactgg gaggctttgc cagctgatga + 18481 acgactacag aaacgtcaag aacatctcca acccctactg gaagacttct ttgcttggtg + 18541 ccgtcgtcag tcagttttat cgggttcaaa actaggaagg gcaattgaat acagcctcaa + 18601 gtatgaagaa acctttaaga ccattttaaa agacggacat ctggtccttt ccaataatct + 18661 agctgaacgc gccattaaat cattggttat gggacgtaaa aattggttgt tttctcaaag + 18721 ttttgaagga gctaaagcaa gagctattat tatgagctta ttggaaacag ctaaacgtca + 18781 tcaactaaat agtgagaaat atctatccta tcttccagaa tgtcttccaa acgaggaaac + 18841 tctcgtaaac aaagaggttt tagaggccta tttaccgtgg actaaagttg tacaagaaaa + 18901 gtgcaaataa gaaatctcca gattaggaac tatatatgag ttctctagtc tggagatttt + 18961 tcaatatact tcgttattgg gcggttacga tattcaaccc aaatcattca tacccctctc + 19021 aactagatgt aacttacaaa acccctgacc tcatgagcca ctttcttcct cctcatgagg + 19081 tcagttttac tttctgctgt tccagtatcg tttttcctcg ctagatttcc tcaaaagggc + 19141 agacttctcc cttggtgcat cacacgattt tttcatctcg actgttcttt aatgcatcat + 19201 taacgacgct tttcttccag gtggttcata aggaacagga agattcaggt tgacttttct + 19261 aatcctagaa taaagtgctg aaaacaattc ggaataggca tagagactag acaatttgag + 19321 gagctgcttg cgtcctgttc gaacacattt tcctaccacg tgaagaaaaa gatggcggaa + 19381 gcgtttgatt gttaaagttt ggaagtcacc tcttttagtt tcaactggga aaaaagttcc + 19441 tgaaaaaaga taagaccacc atactgggtt aaatgacctc catcgaaaga tagttggtaa + 19501 aaagacttgt tttggaagtg atgatttggt aaactgttca 
tgtgagtttc ctttcttttt + 19561 gtgttttttt ctacacttat accataaagg ggaaactctt ttttgtctag taaaaaacac + 19621 ccattgggtg aaaaaagaaa ccatccagga tctaagctaa ggcaaggatt ctggatggtt + 19681 tttagattag gggtgaataa ttggggatat tttttgaaaa gatgttgttt gaaaaataat + 19741 tttcaaaaat tctgaaaatt ctgttgacat ctttctgaaa agagtttata atggagagaa + 19801 agttttaaag gagaaaatga tgaaaagttc aagactactt gcccttgcgg gcgtgacatt + 19861 attgacggcg actactttag ctgcatgctc tggatcaggt tcaagcacta aaggtgagaa + 19921 gacattctca tacatttatg agacagaccc tgataacctc aactatttg +// + diff --git a/public/res/serotype_genbank/serotype_6A.gb b/public/res/serotype_genbank/serotype_6A.gb new file mode 100644 index 0000000..dbbf0a4 --- /dev/null +++ b/public/res/serotype_genbank/serotype_6A.gb @@ -0,0 +1,829 @@ +LOCUS CR931638 17611 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 34351= Rodriques (serotype 6a). +ACCESSION CR931638 +VERSION CR931638.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 17611) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 17611) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. 
For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..17611 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="34351=Rodriques" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC06A_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC06A_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI32811.1" + /db_xref="UniProtKB/TrEMBL:Q4JZI8" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVELL" + gene 293..458 + /gene="aliB" + /locus_tag="SPC06A_0002" + /pseudo + CDS 293..458 + /gene="aliB" + /locus_tag="SPC06A_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(459..981) + /gene="tnp" + /locus_tag="SPC06A_0003" + /pseudo + CDS complement(join(459..521,520..981)) + /gene="tnp" + /locus_tag="SPC06A_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase (fragment)" + gene 1309..2754 + /gene="wzg" + /locus_tag="SPC06A_0004" + CDS 1309..2754 + /gene="wzg" + /locus_tag="SPC06A_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI32814.1" + /db_xref="GOA:Q4K303" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K303" + /translation="MSRRFKKSSSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VDQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSTLHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAIIKKLTST + EVLKNYSSILQGLQDSLQTNMPIETMIDLVNTQLESGGNYKVNSQDLKGTGRMDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + 
misc_feature 1309..1425 + /gene="wzg" + /locus_tag="SPC06A_0004" + /note="Signal peptide predicted for SPC0126 by SignalP 2.0 + HMM (Signal peptide probability 0.997) with cleavage site + probability 0.540 between residues 39 and 40" + misc_feature 1513..1860 + /gene="wzg" + /locus_tag="SPC06A_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 9.8e-65" + misc_feature 2038..2481 + /gene="wzg" + /locus_tag="SPC06A_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 6.5e-70" + gene 2756..3487 + /gene="wzh" + /locus_tag="SPC06A_0005" + CDS 2756..3487 + /gene="wzh" + /locus_tag="SPC06A_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI32815.1" + /db_xref="GOA:Q4K302" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K302" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAEAYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLGKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEQNLVYVIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 2759..3367 + /gene="wzh" + /locus_tag="SPC06A_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 2.1e-38" + gene 3493..4188 + /gene="wzd" + /locus_tag="SPC06A_0006" + CDS 3493..4188 + /gene="wzd" + /locus_tag="SPC06A_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI32816.1" + /db_xref="GOA:Q9AHB8" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q9AHB8" + /translation="MMKEQNTIEIDVFQLFKTLWQRKLMILLVALVTSAGAFAYSTFI + VKPEYTSTTRIYVVNRNQGDKPGLTNQDLQAGTYLVKDYREIILSQDALEKVATNLKL + DMPAKTLASKVQVAVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDV + 
TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIELLDTRVKRPEDIEDVLKI + PLLGLVPDFDKMK" + misc_feature 3514..3930 + /gene="wzd" + /locus_tag="SPC06A_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 1.1e-53" + misc_feature 4036..4113 + /gene="wzd" + /locus_tag="SPC06A_0006" + /note="PS00217 Sugar transport proteins signature 2." + gene 4198..4887 + /gene="wze" + /locus_tag="SPC06A_0007" + CDS 4198..4887 + /gene="wze" + /locus_tag="SPC06A_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI32817.1" + /db_xref="GOA:Q9AHB7" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q9AHB7" + /translation="MPTLEISQAKLDSVKKAEEYYNALCTNLQLSGDGLKVFSITSVK + IGEGKSTTSTNIAWAFARAGYKTLLIDGDIRNSVMLGVFKARDKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRKCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGVVLNKFDTSVDKYGSY + GNYGDYGKNKK" + gene 4902..6269 + /gene="wchA" + /locus_tag="SPC06A_0008" + CDS 4902..6269 + /gene="wchA" + /locus_tag="SPC06A_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI32818.1" + /db_xref="GOA:Q4K2Y3" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K2Y3" + /translation="MNGKIVKSSLAIIQSFLVILLTYLLSAVRETEIVSTTAIALYIL + HYFVFYISDYGQDFFKRGYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYF + LTLHALLVYVLNLFIKWYWKRAYPNFKGSKKILLLTATSRVEKVLDRLIESNEVVGEL + VAVSVLDKPDFQHDCLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + IDVTVNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHVIAKRIIDIVGALVGLIL + CGLVSIVLVPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYINGWTIWKDIEILLKTVKVVFM + RDGAK" + misc_feature 4902..4988 + /gene="wchA" + 
/locus_tag="SPC06A_0008" + /note="Signal peptide predicted for SPC0130 by SignalP 2.0 + HMM (Signal peptide probability 0.759) with cleavage site + probability 0.388 between residues 29 and 30" + misc_feature 5685..6266 + /gene="wchA" + /locus_tag="SPC06A_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 1.7e-160" + gene 6365..7309 + /gene="wciN" + /locus_tag="SPC06A_0009" + CDS 6365..7309 + /gene="wciN" + /locus_tag="SPC06A_0009" + /note="member of homology group 62" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI32819.1" + /db_xref="GOA:Q9AHB5" + /db_xref="InterPro:IPR002495" + /db_xref="UniProtKB/TrEMBL:Q9AHB5" + /translation="MNIVYATDNNFVDVLSASIKSLYTTNSDLDLNLWIIADKVSDRN + KEKINRLSKQFAQREINWIENVEIPFKLHLDRGSISSFSRLFLGSVLPSSMSKVLYLD + SDIIVMDSLRSIFDIDFKGKILYGVNDTFNKEYKQVLGIPIDKPMFNAGVMLINLELW + RNNNVEERFLQVIQKFNGTILQGDLGVLNAVLYNSFGVLPPEYNYMTIFEDLTYEEMI + VFKKPINYYSKEEIKNARERIVLRHFTTSFLSKRPWQEGSNVAHIDQFKKYYEGSYKN + VKESILLKIVQKLPKKCSVFLLGIIQSKFRPKLYRILK" + misc_feature 6368..7138 + /gene="wciN" + /locus_tag="SPC06A_0009" + /note="HMMPfam hit to PF01501, Glycosyl transferase + family, score 3.9e-72" + gene order(7347..7490,7492..7593) + /gene="HG262" + /locus_tag="SPC06A_0010" + /pseudo + CDS join(7347..7490,7492..7593) + /gene="HG262" + /locus_tag="SPC06A_0010" + /note="member of homology group 262" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase + (pseudogene)" + /db_xref="PSEUDO:CAI32820.1" + gene 7580..8299 + /gene="wciO" + /locus_tag="SPC06A_0011" + CDS 7580..8299 + /gene="wciO" + /locus_tag="SPC06A_0011" + /note="member of homology group 81" + /codon_start=1 + /transl_table=11 + /product="putative ribitol phophotransferase" + /protein_id="CAI32821.1" + /db_xref="GOA:Q4K2Y1" + /db_xref="InterPro:IPR000462" + /db_xref="UniProtKB/TrEMBL:Q4K2Y1" + /translation="MSIYRICKDIERKTMSPAKKAMAKNDYFAFYVGRPLSYLLTVPF + 
VKTNITPNQISYLSIIPLIVGFIIMIFTTDFVVLLLAWFLFFLWNLLDGVDGNLARYR + EQYSKDGSVVDAMAGYVAMVLTYFGAGIVAAHLNDSDIYIILGALSGISLIFPRLVMH + KYINTVAQDESVSSIKDKSDFNTIKILALNMTSITGIPQVLLLLTILTNQWVLFTLVY + FTINFLLMIFSLYSLFKKENV" + misc_feature 7823..8287 + /gene="wciO" + /locus_tag="SPC06A_0011" + /note="HMMPfam hit to PF01066, CDP-alcohol + phosphatidyltransferase, score 0.01" + gene 8302..9288 + /gene="wciP" + /locus_tag="SPC06A_0012" + CDS 8302..9288 + /gene="wciP" + /locus_tag="SPC06A_0012" + /note="member of homology group 97" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI32822.1" + /db_xref="GOA:Q8RIW1" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q8RIW1" + /translation="MGKSVAILMTTYNGERYLSQQIDSIRSQTFTNWTLFIRDDGSKD + KTIEVIQRYSKIDDRIRFVENPSKFHGAYYNFFNLIEYVKNNYQFDYYFFCDQDDIWK + EHKLEIQLLRFSKDDMPEMVYSDMSMIDASNNLIDISINKIMGIELPNINNLYFIHAY + IWGCTAGFNHALLEMVPSVDIDKDYLYIEKLAHDSYFAKFALEYGKVLFCPEQLVLYR + RHGHNVTTSHHFKLSPLNVFRKAILGFNELALTHARVYNQTLYMLKKASGKNPLSDRL + LEIQEVIKIGGLKGVRYFYQNRISRKQLVRTIGLYTIMLFGTYKKYIMKELL" + misc_feature 8317..8820 + /gene="wciP" + /locus_tag="SPC06A_0012" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 7.7e-25" + gene 9288..10631 + /gene="wzy" + /locus_tag="SPC06A_0013" + CDS 9288..10631 + /gene="wzy" + /locus_tag="SPC06A_0013" + /note="member of homology group 139" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI32823.1" + /db_xref="UniProtKB/TrEMBL:Q8RSF1" + /translation="MLLNFLFISIFLLIIITFILFEGDFFQPAVILTIAYFISIASAL + VNRNVWGTELHFKTFYLILLGVATFVIVSLLTKLSYRPKVEGISHEELKEINPSKIIY + VILLTLNLVMLFLYIREIQKVVLFSGRSFSNITDLISNYRYLSYYSNEVENRVSGMIN + QLSKIIPATTLISLYIFMNNYFITKQIKKNFIYLIPIAIFFVYAIISGGRLPLIRLVV + GSLLILYIYSVYGSPKSQLTKSFKMITRSLFTFLILIVLFFLLKFVLGRSSQEDFISY + ITRYMGGSIQLFDLFVIDPIRRNKELGAETFSGIYEMLAKLGFDNNIIKGLEWRVSPN + YYSLGNVYTAIRRYYSDFGVIGIVICQSFTAWLYTLGYEKVRHYSLVTNVQRFRLILL + 
AASFYPIFLNGIEDVFYISMVTIGYGIQIVIFYLVFWVLLKVQVDFNKGKLTINR" + misc_feature 9288..9416 + /gene="wzy" + /locus_tag="SPC06A_0013" + /note="Signal peptide predicted for SPC0135 by SignalP 2.0 + HMM (Signal peptide probability 0.938) with cleavage site + probability 0.688 between residues 43 and 44" + gene 10756..12168 + /gene="wzx" + /locus_tag="SPC06A_0014" + CDS 10756..12168 + /gene="wzx" + /locus_tag="SPC06A_0014" + /note="member of homology group 82" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI32824.1" + /db_xref="UniProtKB/TrEMBL:Q9AHB1" + /translation="MKLKFLITNLFHVFLSNLITIVTSVIVVLILPKIMGVTEYSYWQ + LYIFYLTYIGFFHLGWIDGIYLKYGGLEYQNLDKKQFYSQILQFFSFLILISFLLFGF + NLLIVTDPNAKYIYNMTIISMIVTNLRMLFVYILQMTNRLKDSSIILISDRVIYIFLL + FLFIIFKWHEYKVMIWADVLGRTFSLLLSFWICKDIVFQSLSEFILDLRESFDNIRVG + INLMLSNIASSMIIGIVRMGIQWNWNIETFGKVSLTLSISNLLMTFINAIGLVVFPLL + KRTKTENLSKIYSNLRNVLMLIMFAILLFYYPLKIILDLWLPAYRDALIFMALIFPMS + IYEGKMALVINTYLKALRMERDILKINTLIMLFSMLVTLITTLLLNNLELTVISIVVL + LALRSIIAELILSKKLDISVEQDIVLELLMTIIFISSSWYLPIWLAVIVYLLAYTLYL + YLKRKDTKMYIEYFRKKIFE" + misc_feature 10756..10863 + /gene="wzx" + /locus_tag="SPC06A_0014" + /note="Signal peptide predicted for SPC0136 by SignalP 2.0 + HMM (Signal peptide probability 0.692) with cleavage site + probability 0.398 between residues 36 and 37" + gene 12662..13531 + /gene="rmlA" + /locus_tag="SPC06A_0015" + CDS 12662..13531 + /gene="rmlA" + /locus_tag="SPC06A_0015" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI32825.1" + /db_xref="GOA:Q4K2Z3" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q4K2Z3" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLPRFKELLQDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFIGDDSV + ALILGDNIYHGPGLSTMLQKAAKKEKGATVFGYHVKDPERFGVVEFDENMNAISIEEK + 
PEYPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLALAQSLKKN + EYGQYLLRLVGEA" + misc_feature 12665..13381 + /gene="rmlA" + /locus_tag="SPC06A_0015" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 3.7e-121" + gene 13532..14125 + /gene="rmlC" + /locus_tag="SPC06A_0016" + CDS 13532..14125 + /gene="rmlC" + /locus_tag="SPC06A_0016" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI32826.1" + /db_xref="GOA:Q9AHA9" + /db_xref="HSSP:1NXM" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:Q9AHA9" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKNHPLLKDVKPLKKEDL" + misc_feature 13568..14098 + /gene="rmlC" + /locus_tag="SPC06A_0016" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 4.5e-16" + gene 14138..15187 + /gene="rmlB" + /locus_tag="SPC06A_0017" + CDS 14138..15187 + /gene="rmlB" + /locus_tag="SPC06A_0017" + /EC_number="4.2.1.46" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI32827.1" + /db_xref="GOA:Q4K0A7" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K0A7" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPDVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAVD + AYDHVTDRAGHDLRYAIDASKLREELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + 
misc_feature 14153..15109 + /gene="rmlB" + /locus_tag="SPC06A_0017" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 6.3e-05" + misc_feature 14156..15100 + /gene="rmlB" + /locus_tag="SPC06A_0017" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.0033" + misc_feature 14156..14896 + /gene="rmlB" + /locus_tag="SPC06A_0017" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 5.4e-77" + misc_feature 14159..14971 + /gene="rmlB" + /locus_tag="SPC06A_0017" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 1.6e-05" + gene 15253..16104 + /gene="rmlD" + /locus_tag="SPC06A_0018" + CDS 15253..16104 + /gene="rmlD" + /locus_tag="SPC06A_0018" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI32828.1" + /db_xref="GOA:Q4K2Z0" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K2Z0" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITNEEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPVKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 15253..16101 + /gene="rmlD" + /locus_tag="SPC06A_0018" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 4.7e-147" + misc_feature 15256..15897 + /gene="rmlD" + /locus_tag="SPC06A_0018" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.00013" + misc_feature 15256..15885 + /gene="rmlD" + /locus_tag="SPC06A_0018" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 9.9e-19" + misc_feature 15259..15987 + /gene="rmlD" + /locus_tag="SPC06A_0018" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 1.7e-08" + gene 
order(16180..17133,17150..17365) + /gene="tnp" + /locus_tag="SPC06A_0019" + /pseudo + CDS join(16180..17133,17150..17365) + /gene="tnp" + /locus_tag="SPC06A_0019" + /note="member of homology group 12" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1670 transposase" + misc_feature 16186..16629 + /gene="tnp" + /locus_tag="SPC06A_0019" + /note="HMMPfam hit to PF03050, Transposase IS66 family, + score 8.9e-05" + /pseudo + gene 17564..>17611 + /gene="aliA" + /locus_tag="SPC06A_0020" + CDS 17564..>17611 + /gene="aliA" + /locus_tag="SPC06A_0020" + /codon_start=1 + /transl_table=11 + /protein_id="CAI32830.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ89" + /translation="MMKSSKLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcgta taaaaacaag + 181 ggaggactgt ataaaagaca gaaatccttt gttttttata accaaggttt ataaactttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga agatgaacat + 301 aaagaagcgt gtccttagtg caggtctgac ttttgcatct gctttgcttt tagctgcttg + 361 cgaccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaattac ctattagact attaaactga taatatagtc aatcgaaaca agaacaagac + 481 aaaagagcct tgtaaaaggt attgcaactt ggtaatacct tttatgaggt gctttttgat + 541 atgagtccat gttttctcaa taggattgta ctcaggtgag tagggaggaa gaggtaaaag + 601 tttattccca aactcttcac acaagagttc tagcttcccc attctatgga atcttacatt + 661 atccataata ataaccgatg gtgtggttaa tgttggtaag aaaaacttct gaaaccatac + 721 ttcaaaaaag tcgctcgtca tcgtctcttc gtaagtcatt ggagcgatta actcaccatt + 781 tgttagacct gcaaccaaag aaatcctctg atatcttctt ccagatactt tacctcttat + 841 taactgacct tttaatgagc gaccatattc tcgataaaaa taagtatcga atcctgtttc + 901 gtcaatctaa acaggtgcta ggtgctttaa tctattaaaa ttcttaagaa ataaggctac + 961 tttttctggg tcttgttcat aattagattg aaaaaagaac atgaaagatg aagcaatcaa + 1021 tgtactggat aaagttatga aaaagatttt ttaaaaagtt ttgccccttt 
tttgtcctct + 1081 aaatacaaaa atagccctct agaatagtac acctctgctt ctaaaacatt gctagaaatc + 1141 gatttgactg tcctgatcga tttatcatgt tcttatttca ttttactata tttttgtttc + 1201 gcgggaagtc tactaagata cttaaagatg cagatagtga aaaaaggtgt agacattacc + 1261 gtaaaaaagt gatataatcg tatgatgttc aatgtatagg tgttaatcat gagtagacgt + 1321 tttaaaaaat caagttcaca gaaagtgaag cgaagtgtta atatagtttt gttgactatt + 1381 tatttattgt tagtttgttt tttattgttc ttaatcttta agtacaatat ccttgctttt + 1441 agatatctta atttagtggt aactgcgtta gtcctactag ttgccttggt agggctactc + 1501 ctgattatct ataaaaaagc tgaaaaattt actatttttc tgttggtgtt ctctatcctt + 1561 gtcagctctg tgtcgctctt tgcagtacag cagtttgttg gactgaccaa tcgtttaaat + 1621 gcgacttcta attactcaga atattcaatc agtgtcgctg ttttagcaga tagtgagatc + 1681 gaaaatgtta cgcaactgac gagtgtgaca gcaccgactg ggactgataa tgaaaatatt + 1741 caaaaactac tagctgatat caagtcaagt cagaataccg atttgacggt cgatcagagt + 1801 tcgtcttact tggcagctta caagagtttg attgcagggg agactaaggc cattgtctta + 1861 aatagtgtct ttgaaaatat catcgagtca gagtatccag actatgcatc gaagataaaa + 1921 aagatttata ccaagggatt cactaaaaaa gtagaagctc ctaagacgtc taagaatcag + 1981 tctttcaata tctatgttag tggaattgac acctatggtc ctattagttc ggtgtcgcga + 2041 tcagatgtca atatcctgat gactgtcaat cgagatacca agaaaatcct cttgaccaca + 2101 acaccacgtg atgcctatgt accaatcgca gatggtggaa ataatcaaaa agataaatta + 2161 acccatgcgg gcatttatgg agttgattcg tccattcaca ccttagaaaa tctctatgga + 2221 gtggatatca attactatgt gcgattgaac ttcacttctt tcttgaaaat gattgactta + 2281 ttgggagggg tagatgttca taatgatcaa gaattttcaa ctctacatgg gaagttccat + 2341 ttcccagtag ggaatgtcca tctagactct gagcaggctc taggttttgt acgtgaacgc + 2401 tactcactag ccgatggaga ccgtgaccgt ggtcgcaacc aacaaaaggt cattgtagca + 2461 attattaaga agttaacttc tacagaggtt ttgaaaaact atagtagtat tcttcaagga + 2521 ttgcaggatt ctcttcaaac aaatatgccg attgagacta tgatagattt agtgaatact + 2581 cagttggaga gtggagggaa ttataaagta aattcgcaag acttgaaagg tacaggtcgg + 2641 atggatcttc cttcttatgc aatgccagac agtaacctct atgtgatgga aatagatgat + 2701 agtagtttag 
ctgtagttaa agcagctata caggatgtga tggagggtag atgaaatgat + 2761 agacatccat tcgcatatcg tttttgatgt agatgacggt cccaagtcaa gagaggaaag + 2821 caaggctctc ttggcagaag cctacagaca gggggtgcga accattgtct ctacctctca + 2881 ccgtcgcaag ggcatgtttg aaactccgga agagaagata gcagaaaact ttcttcaggt + 2941 tcgggaaata gctaaggaag tggcgagtga cttagtcatt gcttacgggg ctgaaattta + 3001 ctacacacca gatgttctgg ataagctggg aaaaaagcgg attccgaccc tcaatgatag + 3061 tcgttatgcc ttgatagagt ttagtatgaa tactccttat cgcgatattc atagcgcctt + 3121 gagcaagatt ttgatgttgg gaattactcc agtcattgcc cacattgagc gctatgatgc + 3181 tcttgaaaat aatgaaaaac gcgttcgaga actaatcgat atgggctgtt acacgcaagt + 3241 aaatagttca catgtcctca aacccaaact ttttggcgaa cgttataaat tcatgaaaaa + 3301 aagagctcag tattttttag agcagaattt ggtttatgtc attgcaagtg atatgcacaa + 3361 tctagacggt agacctcctc atatggcaga agcatatgac cttgttaccc aaaaatacgg + 3421 agaagcgaag gctcaggaac tttttataga caatcctcga aaaattgtaa tggatcaact + 3481 aatttaggag aaatgatgaa agaacaaaac acgatagaaa tcgatgtatt tcaattattt + 3541 aaaaccttgt ggcaacgcaa gctaatgatt ttattagtgg cacttgtgac aagtgcgggg + 3601 gcttttgcat atagcacttt tattgttaag ccagaatata cgagtaccac gcgaatttac + 3661 gtagtgaatc gcaatcaagg agacaagccg gggctgacaa atcaggattt gcaggcagga + 3721 acttatctgg taaaagacta ccgtgagatt atcctttcgc aggatgcatt ggaaaaagta + 3781 gcgacaaatt tgaagttgga tatgccagca aaaacgttag ccagcaaagt tcaagtggct + 3841 gtaccagctg acactcgtat cgtctcaatc tctgtcaagg ataaacagcc agaggaagcc + 3901 agtcgtatcg ctaattctct acgagaagtt gctgcagaaa agatcgtcgc tgtaacgcga + 3961 gtatctgatg taacgacact tgaagaagcg cgaccagcta cgactccctc ttctccaaat + 4021 gttcgacgca attccttgtt tggttttctt ggaggagcag tcgtaacagt aattgctgtt + 4081 cttttgattg agttgctcga cacccgtgtg aaacgtcctg aagatattga agatgtactg + 4141 aaaattccac ttttagggct cgttccagat tttgacaaaa tgaaatagga ggaagttatg + 4201 ccaacattag aaatctcaca ggcaaaattg gattctgtaa aaaaggcaga ggaatattat + 4261 aacgctttgt gcacgaacct acagttaagt ggagatggtt tgaaagtatt ttctatcact + 4321 tctgtgaaaa taggagaagg aaaatcaacg 
acttccacca atatcgcttg ggcttttgcg + 4381 cgtgcaggtt acaaaacgct gctgattgat ggagatattc gcaattctgt tatgttaggt + 4441 gtctttaaag caagggataa gattacaggc ctgacagaat ttttatcagg aactacagac + 4501 ctatcacaag ggctttgtga taccaatatc gaaaatctct ttgtaattca ggctggctct + 4561 gtgtcaccga atccgacagc tcttcttcaa agtaagaatt tcagtacaat gcttgaaacc + 4621 ttgcgtaaat attttgacta catcattgta gatactgctc ctgtcggtgt cgtgattgat + 4681 gcggctatta ttacgcgaaa atgcgatgct tctattttag tgacggaggc aggtgaaata + 4741 aatcgacggg atattcaaaa agcaaaagaa cagttggaac acacagggaa gccgtttttg + 4801 ggagttgtgt tgaataaatt cgatacttca gtagacaaat acggttctta tggaaattat + 4861 ggagattacg ggaaaaataa aaaataggtc gggggataga gatgaatgga aaaatagtaa + 4921 agtcttcatt ggccataatc cagagctttc ttgttatttt attgacttat ctacttagtg + 4981 ctgtgagaga aacggagatt gtttcaacaa cagctattgc actttatatc ctccattatt + 5041 ttgtctttta tatcagtgat tatggacagg atttctttaa aaggggatat ttgattgaac + 5101 ttgtccagac attgaaatat atcctattct ttgcactagc gattagtatt tctaattttt + 5161 tcttagagga tcgatttagt atttccagac gaggcatgat ttacttcctc acattacatg + 5221 ctctcttagt ctatgtgcta aacctattta tcaagtggta ttggaagcgg gcttatccca + 5281 actttaaagg aagtaagaag attctcctac ttacagcaac ttctcgtgtc gaaaaggtac + 5341 tggatagatt aatagaatca aatgaggttg ttggggagtt ggtagccgtc agtgtcttag + 5401 ataaaccaga ttttcagcat gattgtttaa aggtagtagc agagggggag atagtaaact + 5461 ttgcgactca tgaggtggtc gatgaagtct ttatcaatct tccaagtgaa aaatacaata + 5521 ttggagagct tgtctctcag tttgaaacga tgggaattga tgtaacagtc aatctaaatg + 5581 cttttgatcg tagtttggca cgtaacaagc aaattcgtga gatggcagga ttaaacgttg + 5641 tgactttttc tacaacattt tataagacta gtcatgtaat tgctaagcgg attattgata + 5701 tcgtgggtgc attggtaggg ctgatactat gtggtttagt cagtattgta ctggttcctt + 5761 tgattcgaaa ggatgggggc tctgctattt ttgctcagac gcgtatagga aaaaatggtc + 5821 gtcagttcac tttttataag tttcgctcta tgtgtgtaga tgccgaggcg aaaaaaagag + 5881 aactcatgga acaaaatacc atgcagggtg gaatgtttaa ggtggacgat gatcctcgta + 5941 tcacgaaaat tggtcgtttt atacggaaga ctagcttgga cgagctacca 
cagttttaca + 6001 atgttctaaa gggagatatg agcttggtag gtacacgacc accaacagtg gacgagtatg + 6061 agcactatac cccagaacaa aaacgccgac taagttttaa acctggcata acaggtttat + 6121 ggcaggtcag cggacgaagt gaaatcaaga atttcgatga agttgtcaaa ttagatgtgg + 6181 cctatattaa tggttggaca atctggaaag atattgaaat tttattgaaa acggttaaag + 6241 ttgtatttat gagagatgga gcgaaatagt ttggttgtgt aggatatttg tagaggtaaa + 6301 agtttcgaat atatctcact caatcttttt tataagtgaa aataaattta gaagtaggaa + 6361 ttttatgaat atagtttatg ccacagataa taattttgta gatgtattga gtgcttccat + 6421 caaatcactt tacactacta attcagattt ggatttaaat ttatggatta ttgctgataa + 6481 agtttcggat agaaataaag aaaagataaa tagattatca aaacaatttg cgcagagaga + 6541 aattaattgg atagagaacg ttgagatccc atttaaatta catttagata ggggatcaat + 6601 tagttcattt agcagattat ttctgggaag tgttcttcca tcttcaatga gtaaagttct + 6661 ttatcttgac agtgatatta ttgttatgga ttctttacga agtatttttg atattgattt + 6721 taagggtaaa attctctatg gggtgaatga tacttttaat aaagaataca agcaggtgtt + 6781 gggtatacca attgacaagc caatgtttaa tgctggagtt atgcttatta atttagagtt + 6841 atggagaaat aataacgtcg aagaaagatt tttgcaagta attcaaaagt ttaatggtac + 6901 tatattacaa ggagatttag gggttttaaa tgcagtttta tataactcat ttggtgtact + 6961 tcctccagaa tataattata tgaccatatt tgaagatttg acttatgaag aaatgatagt + 7021 ttttaaaaaa ccaattaatt attattcaaa agaggaaatt aaaaatgcca gagaacgtat + 7081 agtcttacga catttcacaa ctagtttttt atcaaaaaga ccttggcaag aaggcagtaa + 7141 tgttgcacat atagaccaat ttaaaaaata ctatgaaggt agttataaaa atgttaaaga + 7201 atctatttta ctaaaaatag ttcaaaaatt acccaaaaaa tgttcagttt ttttattagg + 7261 aattattcaa tcaaaattta gacctaaatt gtatagaatt ttgaaataag gtggatagta + 7321 ttaatgacaa aaaagaaaga attttattga aaattcaaga agaattgaaa ttattaaaag + 7381 agtttataaa aatatgttct aaaaataaaa ttaagtattt tgctcttgga ggcagtctat + 7441 taggagctgt aagacacaaa ggtttcattc cttgggatga tatggatcta agctttccaa + 7501 agagttaaat ctatgtttga aataaaggaa aaagtgttag aattagagaa tgtattaatg + 7561 agtttaggag aaagtataga tgtcaatata tagaatctgt aaagatattg aaagaaaaac + 7621 tatgtcgcct 
gctaaaaaag caatggctaa aaacgactat tttgcatttt atgttggaag + 7681 acctttatcc tatcttttaa cagttccttt cgtgaaaaca aatattactc ccaatcaaat + 7741 atcttattta tctataattc ctttgattgt tggatttata ataatgatat ttacaactga + 7801 tttcgttgta ttattactgg catggtttct atttttttta tggaacttac tagatggagt + 7861 agatgggaac ttagccagat atcgggagca atactcgaag gatggaagtg tagtagatgc + 7921 aatggctggc tatgtagcca tggtgttgac gtatttcggt gcaggaatag tagctgctca + 7981 tttaaacgac tcagatatct atataatttt gggtgcatta tctgggattt cattgatttt + 8041 tccaaggtta gtgatgcata agtatatcaa tacagtagct caagatgagt ctgtgagtag + 8101 cattaaagat aaatctgatt ttaatactat aaaaatactg gctctaaaca tgacatcaat + 8161 tacaggaatt ccgcaggttt tactgctatt aactatttta acaaatcagt gggtactttt + 8221 tactttagta tattttacga ttaatttttt attaatgata ttttctttgt attcattatt + 8281 caaaaaggag aatgtttaga aatgggaaag tcagttgcaa ttttaatgac cacctataat + 8341 ggtgagcgat atttgtcaca acagattgat agtattaggt ctcaaacatt cactaattgg + 8401 acacttttta ttagggatga tggatcaaaa gataaaacaa tagaagtaat acagaggtat + 8461 tctaagatag atgatagaat tagattcgtt gaaaatccct caaagtttca tggagcttat + 8521 tacaattttt ttaatctaat tgaatacgtt aaaaacaatt atcaatttga ttattacttt + 8581 ttttgtgatc aagatgatat ttggaaagag cacaagttag aaatacagct gttaagattt + 8641 tctaaagatg acatgccaga gatggtttac tctgatatgt caatgattga tgccagtaat + 8701 aatttgatag atattagtat aaataaaata atggggattg aattaccgaa cataaataat + 8761 ttgtatttta ttcatgccta tatctggggg tgtactgcag gttttaatca tgcattgcta + 8821 gagatggttc cttcagttga tattgataaa gattatttat atatagaaaa actggctcat + 8881 gatagttatt ttgcaaagtt tgcactagag tatgggaagg tgttgttctg ccctgagcaa + 8941 ctggtcttgt atcgaagaca tggacataat gtaacaacta gtcatcattt taaattatct + 9001 ccgctaaatg ttttcagaaa ggctatattg ggtttcaatg aattggcact tacacatgct + 9061 agggtatata atcaaactct ttatatgcta aaaaaagctt ctggaaaaaa tcctttaagt + 9121 gatagactac ttgaaattca ggaagtaatc aaaattggag gattaaaagg tgtgagatat + 9181 ttctatcaga atcgaatttc tcgaaagcaa ctcgtaagaa caatcggctt atataccatc + 9241 atgctttttg ggacctataa aaaatatatt 
atgaaagaac tcttataatg cttttaaatt + 9301 tcttattcat atctattttt ctattaatta tcattacatt tatattattt gagggggatt + 9361 tttttcaacc tgcagtaatt ttaacaatcg cttattttat ttcgattgca agtgctctag + 9421 ttaatagaaa tgtttgggga acagaactcc atttcaaaac cttttatttg atattgttag + 9481 gggttgctac atttgttata gtttccttgt tgacaaaatt gtcgtacagg cctaaagtgg + 9541 agggaatttc gcatgaagaa ttgaaagaaa taaatccttc aaagataatc tatgtcattc + 9601 ttctgactct aaatcttgtt atgttatttc tttatatccg tgaaattcag aaagtagtat + 9661 tgttttcagg tagaagtttt tctaatatta cagatttgat aagtaactat aggtacctat + 9721 cttattattc aaatgaagta gaaaatcgtg taagtggaat gattaatcaa ctatctaaaa + 9781 ttattccagc gactacactt atttctttat atatatttat gaataattat tttataacta + 9841 aacaaataaa gaaaaatttc atttatttga ttccaatagc tatattcttt gtctatgcaa + 9901 tcattagtgg tggtagattg ccccttataa ggttagttgt tggatctctg ttgatattgt + 9961 atatatactc tgtgtacggg agtcctaaat ctcaacttac caaaagtttt aaaatgatca + 10021 ctcgctctct gtttacattt cttattttga tagttttatt ctttctttta aaatttgtat + 10081 tagggcgctc ctctcaggaa gattttatca gttacatcac tcgttatatg ggaggttcaa + 10141 ttcaactatt tgatttattt gttatagatc cgatacgacg taacaaagaa ctaggtgcag + 10201 aaactttttc gggaatttat gagatgcttg caaaattagg atttgacaat aatattataa + 10261 aaggcttaga atggagagtg tctcctaatt attattcttt agggaatgtg tatactgcaa + 10321 ttagacgtta ttattcagac tttggtgtaa ttggtattgt aatttgtcag agttttacag + 10381 cgtggttata tactttaggt tatgaaaaag ttagacatta ttctttagtt acaaatgttc + 10441 aaagatttag gttgatccta ttagcagctt cattttatcc aatattttta aatggtatcg + 10501 aggatgtgtt ttatatttca atggttacca ttggatatgg aatacaaatt gttatctttt + 10561 atctggtctt ttgggttctt ctgaaagttc aggttgactt taacaaaggt aaattaacga + 10621 taaatagatg aatttagcgc taatgtattg agtcatataa agggatatat ttggtaggta + 10681 ttttaattgg aggaagagag tcttgaatgg gaagtacaaa tcttctgaaa taatttttag + 10741 gtggggagta tagctatgaa attgaagttt cttataacaa atttgtttca tgtctttttg + 10801 tctaatctga ttacaattgt cacatcggtt atagttgtac taatcttacc aaaaattatg + 10861 ggagtaactg agtatagtta ttggcaacta tatatttttt 
acctaacata tattggtttt + 10921 tttcatctgg gttggattga tggaatttat cttaaatatg gtggattaga gtaccagaat + 10981 ttagataaga aacagtttta ttctcaaata cttcaatttt tcagtttttt aattttaatt + 11041 tcttttctat tatttggttt taacttattg attgtgacag atccaaatgc aaaatatatt + 11101 tataacatga ctattattag tatgatagtt acaaatttaa gaatgttatt cgtttatatt + 11161 ttgcagatga caaatcgatt aaaggatagc tctataattc tgataagtga tcgcgttata + 11221 tatatttttc ttttatttct gtttattata tttaaatggc atgaatacaa ggtaatgatt + 11281 tgggcggatg ttttaggaag gacattttct ctcctacttt ctttttggat ttgtaaagat + 11341 attgtttttc aatccttatc cgagttcata ttggatctga gagagtcttt tgacaatatc + 11401 cgtgttggaa tcaatttaat gttatccaat attgcaagta gtatgattat tggtattgtt + 11461 cgaatgggaa ttcaatggaa ttggaatatc gaaacattcg ggaaagtatc actgacgcta + 11521 agcatctcta atttattaat gacttttatt aatgcgattg gtttagttgt ctttcctttg + 11581 ttaaaacgga caaaaacgga aaatttatct aaaatttatt ccaacttaag aaatgttttg + 11641 atgctgatca tgtttgcaat attgctcttt tattatcctt taaaaattat tctagatctt + 11701 tggttgccag cttatcggga tgcgttgatt tttatggctc ttatttttcc tatgtcaatt + 11761 tatgaaggga agatggcctt ggtgattaat acatatttaa aggcgctaag gatggaaaga + 11821 gatattctca aaataaatac tttgattatg ttgttcagta tgttagttac cctaataact + 11881 actctattat taaataattt agagctaacg gttatatcta tagttgtttt gctagcttta + 11941 cgtagtataa tagcagaact aattctatct aaaaaacttg atatatcagt tgagcaagac + 12001 attgtgttag aattacttat gacaattata tttatttctt caagttggta cttaccgatt + 12061 tggctcgcag taatagttta tttgttagcg tatactttat acttgtatct aaagcgtaaa + 12121 gatacaaaaa tgtatataga atattttaga aagaaaatat ttgaataaaa agaactatat + 12181 atcagttaga tggcaaattc tatttttacc tttttgtcgt ttaatagaaa atgataaaaa + 12241 atatgatatt attcttacac atatttataa gcaatttaaa tgtatcaggt gataaattaa + 12301 tttaaaataa gaatagtttc tggaacattg ctattagtgg gaacaggtta cgaaataatt + 12361 tatcaatttt aaagacgttt tttaaaatat aaaataatgg attctgtcaa caattctaaa + 12421 ttctaatagg aatgataatg ctagaaaatc agattgttca tttttcaagg aagtttattt + 12481 ttaaaataat atatctttaa gtaagaatta ttttattaga 
cttaacctag cctatcagtt + 12541 aaattagaat atcaactttg attaattaaa aattagcaaa atttattgac attttgtttt + 12601 tataaattgc aataaaggtc taattctgaa tttcagtgaa tataagaaag ggatcctact + 12661 aatgaaaggt attattctag caggtggttc gggaactcgc ttgtatcctt tgactcgcgc + 12721 tgcatcaaaa caacttatgc cggtttatga taaaccgatg atttactacc cactttcaac + 12781 attaatgttg gctgggatta gggatatttt gattatctca actcctcaag atttgcctcg + 12841 ttttaaagag cttcttcaag atggttctga gtttggtatt aaactttctt atgctgagca + 12901 accaagtcca gatggtttgg cacaagcctt tatcattggg gaagagttta tcggtgacga + 12961 tagcgttgcc ttgattttag gtgacaatat ctaccatggt cctggtttga gcacaatgct + 13021 tcaaaaagca gccaagaaag agaaaggtgc gactgttttt ggctaccatg tcaaggatcc + 13081 agaacgcttt ggtgttgtag aatttgatga aaatatgaat gctatctcca tcgaagaaaa + 13141 gccagaatac cctcgttcaa actatgcagt gacaggactc tatttctatg ataatgatgt + 13201 agtagagatt gccaaaagta ttaaaccaag tcctcgtggt gaattggaaa ttacagatgt + 13261 caacaaggct tacttggatc gtggtgattt gtctgttgag ctcatgggac gtggttttgc + 13321 ttggttggat actggcactc atgaaagttt actagaggct tcgcagtaca tcgaaacagt + 13381 ccaacggatg caaaatgttc aggtagcaaa cttagaagaa attgcttacc gtatgggcta + 13441 tatcagtcga gaagatgtat tggccttagc ccaatcactt aagaaaaatg aatacggaca + 13501 gtatctgctc cgtttggttg gagaagcata gatgacagat aattttttcg gtaagacgct + 13561 tgcggcacgc aaggttgaag ctattccagg catgttggag tttgatatcc ccgttcatgg + 13621 agataatcgt ggctggttta aagaaaattt ccaaaaggaa aaaatgcttc cacttggatt + 13681 tccagagtct ttctttgcag aaggaaaatt gcaaaacaat gtatccttct cacgtaaaaa + 13741 tgtccttcga ggcctccacg cagagccttg ggataagtac atctctgtag cagatggagg + 13801 gaaagttctg ggttcttggg ttgatctacg cgagggtgaa acctttggga atacctatca + 13861 gacagtgatt gatgcgagta agggaatctt tgttcctcga ggcgtagcta atggcttcca + 13921 agttttatca gatacagtgt catatagcta tctggtcaat gattactggg ctcttgaact + 13981 caaacccaag tatgcctttg tgaactacgc tgatccaagc cttggtattg aatgggaaaa + 14041 tattgcagaa gcagaggttt cagaagcaga taaaaatcat ccactactta aggatgtaaa + 14101 acctttgaaa aaagaagatt tgtaaaaagg aaagaatatg 
actgaataca aaaatattat + 14161 cgtgacaggt ggagctggct ttatcggttc taactttgtc cattatgttt acgagaactt + 14221 tccagatgtt catgtgacag tcctagataa gttgacttat gctggaaacc gcgcgaatat + 14281 tgaggaaatt ttaggtaatc gtgttgagtt agttgttggt gacattgctg atgcggagtt + 14341 ggtagacaag ttggctgctc aagcagatgc tatcgttcat tatgcagcgg aaagccacaa + 14401 tgataattcg ctcaatgatc catcgccatt tattcatact aacttcatcg gaacctatac + 14461 tcttttagaa gctgctcgta agtatgatat tcgcttccac catgtatcga cagatgaagt + 14521 ttatggggat ctccctttac gcgaagattt gccaggtcat ggtgaaggac caggtgagaa + 14581 atttactgct gaaacaaaat acaacccaag ctctccgtac tcatcaacca aggcagcctc + 14641 agatttgatt gtcaaagcct gggtgcgttc ttttggagtc aaggcaacga tttccaactg + 14701 ttcaaataac tacggtcctt atcaacatat cgaaaaattc atcccacgtc agattactaa + 14761 catcctaagt ggaattaagc caaaacttta cggtgaaggt aagaatgttc gtgactggat + 14821 tcataccaat gaccattctt caggagtttg gacaatcttg acaaaagggc aaatcggtga + 14881 aacctacttg attggggctg atggtgagaa gaacaataag gaagttttgg aacttatcct + 14941 taaggaaatg ggacaagctg tggatgccta tgatcatgtg actgaccgtg caggacatga + 15001 ccttcgctat gcgattgatg ccagcaagct ccgtgaggag ttggggtgga aacctgaatt + 15061 taccaacttt gaagctgggc tcaaggcaac aatcaagtgg tatacagata accaagaatg + 15121 gtggaaagca gaaaaagaag ctgttgaagc caattatgct aagactcagg agattattac + 15181 agtataaaaa gcaggaaaca gctgcttttt attgctatat tgggaagagt tacatattag + 15241 aaaggtctag agatgatttt aattacaggg gcaaatggcc aattaggaac ggaacttcgc + 15301 tatttattgg atgaacgtaa tgaagaatac gtggcagtag atgtggctga gatggacatt + 15361 accaatgaag aaatggttga aaaagttttt gaagaggtga aaccgacttt agtctaccac + 15421 tgtgcagcct acaccgctgt tgatgcagca gaggatgaag gaaaagagtt ggacttcgcc + 15481 atcaatgtga cggggacaaa aaatgtcgca aaagcatctg aaaagcatgg tgcaactcta + 15541 gtttatattt ctacggacta tgtctttgac ggtaagaaac cagttggaca agagtgggaa + 15601 gttgatgacc gaccagatcc acagacagaa tatggacgca ctaagcgtat gggggaagag + 15661 ttagttgaga agcatgtgtc taatttctat attatccgta ctgcctgggt atttggaaat + 15721 tatggcaaaa acttcgtttt taccatgcaa aatcttgcga 
aaactcataa gactttaaca + 15781 gttgtaaatg accagtacgg tcgtccgact tggactcgta ccttggctga gttcatgacc + 15841 tacctagctg aaaatcgtaa ggaatttggt tattatcatt tgtcaaatga tgcgacagaa + 15901 gacacaacat ggtatgattt tgcagttgaa attttgaaag atacagatgt cgaagtcaag + 15961 ccagtagatt ccagtcaatt tccagtcaaa gctaaacgtc cgctaaactc aacgatgagc + 16021 ctggccaaag ccaaagctac tggatttgtt attccaactt ggcaagatgc attgcaagaa + 16081 ttttacaaac aagaagtgag ataagtagta gaatgatttt ctagtctaat aaaagaggca + 16141 gataatgaac tccaaaggag cttaagatgt acgattatct tgttgttggt gctggtctct + 16201 ttggcgcata gctttggctc agtttctatt atcgctcaca tcatccatca gaagattaat + 16261 ctgaaggtac ccaattatcg ccaagaagaa gattgggcta ggatgggttt accaatcaca + 16321 cgtaaggaaa tctctaattg gcatatcaag gcaagtcaat actatttaga gtccctttat + 16381 aaccttttac gagaaaagtt gttagaacaa cctcttcttc atgcggatga aacctcttat + 16441 cgggttctag agagtgatag ccatctgacc tactattgga cctttttgtc tgggaaagct + 16501 gagaatcaag caatcacgct gtaccatcat gatcagcgtc ggagtggttt agtagtacaa + 16561 gaattcctag gagattattc tggctatgtg cattgtgata tgttgcggca gtaacttagg + 16621 actttagtcc tctagttctg cctatgcgat agcagtccaa ggtttaggag caaggcgacg + 16681 ctaagcttgg taaactgcga accgctagaa gcttatcgtc aactggaaga agctgaactt + 16741 gttggatgtt gggcacatgt gagaaggaag ttttttgaag cgacccccaa gcaagcagat + 16801 aaatcatcct tagaagctaa aggtttagct tattgtgatc agttattttc cctggaaaga + 16861 gactgggagg ctttgccagc tgatgaacga ctacagaaac gtcaagaaga gctccaaccc + 16921 ctaatggaag acttctttgc ttagtgccgg cgtcagtcag ttttagcagg ttcaaaacta + 16981 ggaagggcaa ttgaatacag cctcaagtat gaagaaacct ttaagactat tttgaaagac + 17041 ggacatctgg tcctttccaa taatctagct gaacgcgcca ttaaatcatt ggttatggga + 17101 cggagtaaaa gagttcagtg gactctttta gcctaagcta aattttaaaa agcgagggtg + 17161 gttattttct caaagttttg aaggagctaa agcaacagct attattatga gtttgttgga + 17221 aacagctaaa cgtcatcaat taaatagcga gaaatatcta ttctatcttc tagaatgtct + 17281 tccaaacgag gaaactctcg taaacaaaga ggttttagag gcttatttac catggactaa + 17341 agttgtacaa gaaaagtgca aataagaaat ctccagatta 
ggaactatcc gtgagttctc + 17401 tagtctggag atttttcaat atacttcgtt attgggcgct tacaatgata ttcatatttt + 17461 ttgcaaagat gttgtttgaa aaataatttt caaaaattct gaaaattctg ttgacaactt + 17521 tctgaaaaga gtctataatg gagagaaagt tttaaaggag aaaatgatga aaagttcaaa + 17581 actacttgcc cttgcgggcg tgacattatt g +// + diff --git a/public/res/serotype_genbank/serotype_6B.gb b/public/res/serotype_genbank/serotype_6B.gb new file mode 100644 index 0000000..4b4fe76 --- /dev/null +++ b/public/res/serotype_genbank/serotype_6B.gb @@ -0,0 +1,835 @@ +LOCUS CR931639 17506 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 2616/39 (serotype 6b). +ACCESSION CR931639 +VERSION CR931639.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 17506) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 17506) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..17506 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="2616/39" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC06B_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC06B_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI32831.1" + /db_xref="UniProtKB/TrEMBL:Q4JZI8" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVELL" + gene 293..458 + /gene="aliB" + /locus_tag="SPC06B_0002" + /pseudo + CDS 293..458 + /gene="aliB" + /locus_tag="SPC06B_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(459..984) + /gene="tnp" + /locus_tag="SPC06B_0003" + /pseudo + CDS complement(join(459..779,781..984)) + /gene="tnp" + /locus_tag="SPC06B_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase (fragment)" + gene 1207..2652 + /gene="wzg" + /locus_tag="SPC06B_0004" + CDS 1207..2652 + /gene="wzg" + /locus_tag="SPC06B_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI32834.1" + /db_xref="GOA:Q4K2Y7" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K2Y7" + /translation="MSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNEHIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSTLHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAIIKKLTST + EVLKNYSSILQGLQDSLQTNMPIETMIDLVNTQLESGGNYKVNSQDLKGTGRMDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1207..1323 + /gene="wzg" + /locus_tag="SPC06B_0004" + /note="Signal peptide predicted for 
SPC0146 by SignalP 2.0 + HMM (Signal peptide probability 0.993) with cleavage site + probability 0.538 between residues 39 and 40" + misc_feature 1411..1758 + /gene="wzg" + /locus_tag="SPC06B_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 1.2e-62" + misc_feature 1936..2379 + /gene="wzg" + /locus_tag="SPC06B_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 6.5e-70" + gene 2654..3385 + /gene="wzh" + /locus_tag="SPC06B_0005" + CDS 2654..3385 + /gene="wzh" + /locus_tag="SPC06B_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI32835.1" + /db_xref="GOA:Q4K2Y6" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K2Y6" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAEAYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLGKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEQDLVYVIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + misc_feature 2657..3265 + /gene="wzh" + /locus_tag="SPC06B_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 3.6e-38" + gene 3391..4086 + /gene="wzd" + /locus_tag="SPC06B_0006" + CDS 3391..4086 + /gene="wzd" + /locus_tag="SPC06B_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI32836.1" + /db_xref="GOA:Q9AHB8" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q9AHB8" + /translation="MMKEQNTIEIDVFQLFKTLWQRKLMILLVALVTSAGAFAYSTFI + VKPEYTSTTRIYVVNRNQGDKPGLTNQDLQAGTYLVKDYREIILSQDALEKVATNLKL + DMPAKTLASKVQVAVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIELLDTRVKRPEDIEDVLKI + PLLGLVPDFDKMK" + misc_feature 3412..3828 + /gene="wzd" + /locus_tag="SPC06B_0006" + 
/note="HMMPfam hit to PF02706, Chain length determinant + protein, score 1.1e-53" + misc_feature 3934..4011 + /gene="wzd" + /locus_tag="SPC06B_0006" + /note="PS00217 Sugar transport proteins signature 2." + gene 4096..4785 + /gene="wze" + /locus_tag="SPC06B_0007" + CDS 4096..4785 + /gene="wze" + /locus_tag="SPC06B_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI32837.1" + /db_xref="GOA:Q9AHB7" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q9AHB7" + /translation="MPTLEISQAKLDSVKKAEEYYNALCTNLQLSGDGLKVFSITSVK + IGEGKSTTSTNIAWAFARAGYKTLLIDGDIRNSVMLGVFKARDKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRKCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGVVLNKFDTSVDKYGSY + GNYGDYGKNKK" + gene 4800..6167 + /gene="wchA" + /locus_tag="SPC06B_0008" + CDS 4800..6167 + /gene="wchA" + /locus_tag="SPC06B_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI32838.1" + /db_xref="GOA:Q4K2Y3" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K2Y3" + /translation="MNGKIVKSSLAIIQSFLVILLTYLLSAVRETEIVSTTAIALYIL + HYFVFYISDYGQDFFKRGYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYF + LTLHALLVYVLNLFIKWYWKRAYPNFKGSKKILLLTATSRVEKVLDRLIESNEVVGEL + VAVSVLDKPDFQHDCLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + IDVTVNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHVIAKRIIDIVGALVGLIL + CGLVSIVLVPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYINGWTIWKDIEILLKTVKVVFM + RDGAK" + misc_feature 4800..4886 + /gene="wchA" + /locus_tag="SPC06B_0008" + /note="Signal peptide predicted for SPC0150 by SignalP 2.0 + HMM (Signal peptide probability 0.759) with cleavage site + 
probability 0.388 between residues 29 and 30" + misc_feature 5583..6164 + /gene="wchA" + /locus_tag="SPC06B_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 1.7e-160" + gene 6263..7207 + /gene="wciN" + /locus_tag="SPC06B_0009" + CDS 6263..7207 + /gene="wciN" + /locus_tag="SPC06B_0009" + /note="member of homology group 62" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI32839.1" + /db_xref="GOA:Q9AHB5" + /db_xref="InterPro:IPR002495" + /db_xref="UniProtKB/TrEMBL:Q9AHB5" + /translation="MNIVYATDNNFVDVLSASIKSLYTTNSDLDLNLWIIADKVSDRN + KEKINRLSKQFAQREINWIENVEIPFKLHLDRGSISSFSRLFLGSVLPSSMSKVLYLD + SDIIVMDSLRSIFDIDFKGKILYGVNDTFNKEYKQVLGIPIDKPMFNAGVMLINLELW + RNNNVEERFLQVIQKFNGTILQGDLGVLNAVLYNSFGVLPPEYNYMTIFEDLTYEEMI + VFKKPINYYSKEEIKNARERIVLRHFTTSFLSKRPWQEGSNVAHIDQFKKYYEGSYKN + VKESILLKIVQKLPKKCSVFLLGIIQSKFRPKLYRILK" + misc_feature 6266..7036 + /gene="wciN" + /locus_tag="SPC06B_0009" + /note="HMMPfam hit to PF01501, Glycosyl transferase + family, score 3.9e-72" + gene order(7209..7388,7390..7491) + /gene="HG263" + /locus_tag="SPC06B_0010" + /pseudo + CDS join(7209..7388,7390..7491) + /gene="HG263" + /locus_tag="SPC06B_0010" + /note="member of homology group 263" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative LicD-family phosphotransferase + (pseudogene)" + /db_xref="PSEUDO:CAI32840.1" + gene 7478..8197 + /gene="wciO" + /locus_tag="SPC06B_0011" + CDS 7478..8197 + /gene="wciO" + /locus_tag="SPC06B_0011" + /note="member of homology group 81" + /codon_start=1 + /transl_table=11 + /product="putative ribitol phophotransferase" + /protein_id="CAI32841.1" + /db_xref="GOA:Q4K2Y1" + /db_xref="InterPro:IPR000462" + /db_xref="UniProtKB/TrEMBL:Q4K2Y1" + /translation="MSIYRICKDIERKTMSPAKKAMAKNDYFAFYVGRPLSYLLTVPF + VKTNITPNQISYLSIIPLIVGFIIMIFTTDFVVLLLAWFLFFLWNLLDGVDGNLARYR + EQYSKDGSVVDAMAGYVAMVLTYFGAGIVAAHLNDSDIYIILGALSGISLIFPRLVMH + KYINTVAQDESVSSIKDKSDFNTIKILALNMTSITGIPQVLLLLTILTNQWVLFTLVY 
+ FTINFLLMIFSLYSLFKKENV" + misc_feature 7721..8185 + /gene="wciO" + /locus_tag="SPC06B_0011" + /note="HMMPfam hit to PF01066, CDP-alcohol + phosphatidyltransferase, score 0.01" + gene 8200..9186 + /gene="wciP" + /locus_tag="SPC06B_0012" + CDS 8200..9186 + /gene="wciP" + /locus_tag="SPC06B_0012" + /note="member of homology group 97" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI32842.1" + /db_xref="GOA:Q9AHB3" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q9AHB3" + /translation="MGKSVAILMTTYNGERYLSQQIDSIRSQTFTNWTLFIRDDGSKD + KTIEVIQRYSKIDDRIRFVENPSKFHGAYYNFFNLIEYVKNNYQFDYYFFCDQDDIWK + EHKLEIQLLRFSKDDMPEMVYSDMSTIDASNNLIDISINKIMGIELPNINNLYFIHAY + IWGCTAGFNHALLEMVPSVDIDKDYLYIEKLSHDNYFAKFALEYGKVLFCPEQLVLYR + RHGHNVTTSHHFKLSPLNVFRKAILGFNELALTHAGVYNQTLYMLKKASGKNPLSDRL + LEIQEVIKIGGLKGVRYFYQNRISRKQLVRTIGLYTIMLFGTYKKYIMKELL" + misc_feature 8215..8718 + /gene="wciP" + /locus_tag="SPC06B_0012" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 4.9e-25" + gene 9186..10529 + /gene="wzy" + /locus_tag="SPC06B_0013" + CDS 9186..10529 + /gene="wzy" + /locus_tag="SPC06B_0013" + /note="member of homology group 139" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI32843.1" + /db_xref="UniProtKB/TrEMBL:Q4K2X9" + /translation="MLLNFLFISIFLLIIITFILFEGDFFQPAVILTIAYFISIASAL + VNRNVWGTELHFKTFYLILLGVATFVIVSLLTKLSYRPKVEGISHEELKEINPSKIIY + VILLTLNLVMLFLYIREIQKVVLFSGRSFSNITDLISNYRYLSYYSNEVENRVSGMIN + QLSKIIPATTLISLYIFMNNYFITKQIKKNFIYLIPIAIFFVYAIISGGRLPLIRLVV + GALLILYIYSVYGSPKSQLTKSFKMITRSLFTFLILIVLFFLLKFVLGRSSQEDFISY + ITRYMGGSIQLFDLFVIDPIRRNKELGAETFSGIYEMLAKLGFDNNIIKGLEWRVSPN + YYSLGNVYTAIRRYYSDFGVIGIVICQSFTAWLYTLGYEKVRHYSLVTNVQRFRLILL + AASFYPIFLNGIEDVFYISMVTIGYGIQIVIFYLVFWVLLKVQVDFNKGKLTINR" + misc_feature 9186..9314 + /gene="wzy" + /locus_tag="SPC06B_0013" + /note="Signal peptide predicted for SPC0155 by SignalP 2.0 + HMM (Signal peptide 
probability 0.938) with cleavage site + probability 0.688 between residues 43 and 44" + gene 10654..12066 + /gene="wzx" + /locus_tag="SPC06B_0014" + CDS 10654..12066 + /gene="wzx" + /locus_tag="SPC06B_0014" + /note="member of homology group 82" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI32844.1" + /db_xref="UniProtKB/TrEMBL:Q9AHB1" + /translation="MKLKFLITNLFHVFLSNLITIVTSVIVVLILPKIMGVTEYSYWQ + LYIFYLTYIGFFHLGWIDGIYLKYGGLEYQNLDKKQFYSQILQFFSFLILISFLLFGF + NLLIVTDPNAKYIYNMTIISMIVTNLRMLFVYILQMTNRLKDSSIILISDRVIYIFLL + FLFIIFKWHEYKVMIWADVLGRTFSLLLSFWICKDIVFQSLSEFILDLRESFDNIRVG + INLMLSNIASSMIIGIVRMGIQWNWNIETFGKVSLTLSISNLLMTFINAIGLVVFPLL + KRTKTENLSKIYSNLRNVLMLIMFAILLFYYPLKIILDLWLPAYRDALIFMALIFPMS + IYEGKMALVINTYLKALRMERDILKINTLIMLFSMLVTLITTLLLNNLELTVISIVVL + LALRSIIAELILSKKLDISVEQDIVLELLMTIIFISSSWYLPIWLAVIVYLLAYTLYL + YLKRKDTKMYIEYFRKKIFE" + misc_feature 10654..10761 + /gene="wzx" + /locus_tag="SPC06B_0014" + /note="Signal peptide predicted for SPC0156 by SignalP 2.0 + HMM (Signal peptide probability 0.692) with cleavage site + probability 0.398 between residues 36 and 37" + gene 12534..13403 + /gene="rmlA" + /locus_tag="SPC06B_0015" + CDS 12534..13403 + /gene="rmlA" + /locus_tag="SPC06B_0015" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI32845.1" + /db_xref="GOA:Q8RSF0" + /db_xref="HSSP:1FXO" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q8RSF0" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLPRFKELLQDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFIGDDSV + ALILGDNIYHGPGLSKMLQKAAKKEKGATVFGYQVKDPERFGVVEFDTDMNAISIEEK + PEYPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLALAQPLKKN + EYGQYLLRLIGEA" + misc_feature 12537..13253 + /gene="rmlA" + /locus_tag="SPC06B_0015" + /note="HMMPfam hit to 
PF00483, Nucleotidyl transferase, + score 3.3e-120" + gene 13404..14000 + /gene="rmlC" + /locus_tag="SPC06B_0016" + CDS 13404..14000 + /gene="rmlC" + /locus_tag="SPC06B_0016" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI32846.1" + /db_xref="GOA:Q4K2X6" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:Q4K2X6" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKNHSLLKDVKPLKKEDLE" + misc_feature 13440..13970 + /gene="rmlC" + /locus_tag="SPC06B_0016" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 1.1e-15" + gene 14010..15059 + /gene="rmlB" + /locus_tag="SPC06B_0017" + CDS 14010..15059 + /gene="rmlB" + /locus_tag="SPC06B_0017" + /EC_number="4.2.1.46" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI32847.1" + /db_xref="GOA:O54546" + /db_xref="HSSP:1KEP" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:O54546" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPDVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAAD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 14025..14981 + /gene="rmlB" + /locus_tag="SPC06B_0017" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.00012" + misc_feature 14028..14768 + /gene="rmlB" + /locus_tag="SPC06B_0017" + 
/note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 5.4e-77" + misc_feature 14031..14843 + /gene="rmlB" + /locus_tag="SPC06B_0017" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/iso, score 1.4e-05" + gene 15125..15976 + /gene="rmlD" + /locus_tag="SPC06B_0018" + CDS 15125..15976 + /gene="rmlD" + /locus_tag="SPC06B_0018" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI32848.1" + /db_xref="GOA:Q9AH81" + /db_xref="HSSP:1N2S" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q9AH81" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAKMDITNEEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 15125..15973 + /gene="rmlD" + /locus_tag="SPC06B_0018" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 4.3e-146" + misc_feature 15128..15769 + /gene="rmlD" + /locus_tag="SPC06B_0018" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.00011" + misc_feature 15128..15757 + /gene="rmlD" + /locus_tag="SPC06B_0018" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 2e-18" + misc_feature 15131..15859 + /gene="rmlD" + /locus_tag="SPC06B_0018" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 3.6e-08" + gene 16039..17141 + /gene="glf" + /locus_tag="SPC06B_0019" + CDS join(16039..16638,16638..17141) + /gene="glf" + /locus_tag="SPC06B_0019" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI32849.1" + /db_xref="GOA:Q4K083" + 
/db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K083" + /translation="MYDYLIVGAGLFGAVFAHESALKGKKVKVIEKRNHIAGNIYTRE + EEGIQVHQYGAHIFHTSDKEIWDYVNQFAEFNRYTNSPVANYKGEIYNLPFNMNTFNK + LWGVVTPAEAQAKIEEQRAILNGKTPENLKEQAISLVGTDIYEKLIKDYTEKQWGKPT + TELPSFIIRRLPVHLTYDNNYFNDTYQGIPIGGYTQIVEKMLDYENIDVETNVDFFVN + KEQYLKDFPKIVFTGMIDEFFDYKLGELEYRSLRFENETLDMENYQGNAVVNYTDAET + PYTRIIEHKHFEFGSQAKTIITKEHSKTWEKGDEPYYPVNNDRNNHLYKSYKKFADEQ + GNVIFGGRLGHYRYYDMHQVIGAALQCVRNELD" + misc_feature join(16474..16638,16638..17081) + /gene="glf" + /locus_tag="SPC06B_0019" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 1.9e-107" + gene 17459..>17506 + /gene="aliA" + /locus_tag="SPC06B_0020" + CDS 17459..>17506 + /gene="aliA" + /locus_tag="SPC06B_0020" + /codon_start=1 + /transl_table=11 + /protein_id="CAI32850.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ89" + /translation="MMKSSKLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcgta taaaaacaag + 181 ggaggactgt ataaaagaca gaaatccttt gttttttata accaaagttt ataaactttc + 241 attcttgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga agatgaacat + 301 aaagaagcgt gtccttagtg caggcctgac ttttgcatct gctttgcttt tagctgcttg + 361 cggccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaactat ctattagact attacactga taatatagtc aattgaaaca agaacaagac + 481 aaaagagcct cataaaaggt attgcaactt ggtaatacct ttttgaggtg ctttttgata + 541 tgagcccatg ttttctcaat aggattgtac tcaggtgagt agggaggaag aggtaaaagt + 601 ttatgcctaa actcttcgca taaaagttct aacttaccca ttctatggaa tcttgcatta + 661 tccataataa taaccgatgg tgtggttaat gttggtaaga gaaacttctg aaaccatact + 721 tcaaaaaagt cgctcgtcat catctcttcg taagtcattg gagcgattaa ctcaccattc + 781 atttgttaga cctgcaacca aagaaatcct ccgatatctt cttccagata ttttgcctct + 841 tcttaactga 
ccttttaaag agcgaccata ttctcgataa aaataagtat cgaatcctgt + 901 ttcatcaatc taaacaggtg ctaggtgctt taaactatta aaattcttaa gaaataaggc + 961 tactttttct gggtcttgtt cataattaga ttgaaactag aatagtacac ctctgcttct + 1021 aaaacattgt tagaaatcga tttgactgtc ctgatcgttt tgtcatgttc ttatttcatt + 1081 ttactatatt tttggttcgt gggaagtcta ctaagatact taaagatgca gatagtgaaa + 1141 aaaggtgtag acattaccgt aaaaaagtga tataatcgta tgatgttcaa tgtataggtg + 1201 ttaatcatga gtagacgttt taaaaaatca ggttcacaga aagtgaagcg aagtgttaat + 1261 atagttttgt tgactattta tttattgtta gtttgttttt tattgttctt aatctttaag + 1321 tacaatatcc ttgcttttag atatcttaat ctagtggtaa ctgcgttagt cctactagtt + 1381 gccttggtag ggctactctt gattatctat aaaaaagctg aaaaatttac tatttttcta + 1441 ttggtgtttt ctatccttgt cagctcagtg tcgctctttg cagtacagca gtttgttgga + 1501 ctgaccaatc gtttaaatgc gacttctaat tactcagaat attcaatcag tgtcgctgtt + 1561 ttagcagata gtgatatcga aaatgttacg caactgacga gtgtgacagc accgactggg + 1621 actgataatg aacatattca aaaactacta gctgatatca agtcaagtca gaataccgat + 1681 ttgacggtca accagagttc gtcttacttg gcagcttaca agagtttgat tgcaggggag + 1741 actaaggcca ttgtcctaaa tagtgtcttt gaaaatatca tcgagtcaga gtatccagac + 1801 tacgcatcga agataaaaaa gatttatacc aagggattca ctaaaaaagt agaagctcct + 1861 aagacgtcta agaatcagtc tttcaatatc tatgttagtg gaattgacac ctatggccct + 1921 attagttcgg tgtcgcgatc agatgtcaat atcctgatga ctgtcaatcg agataccaag + 1981 aaaatcctct tgaccacaac gccacgtgat gcctatgtac caatcgcaga tggtggaaat + 2041 aatcaaaaag ataaattaac ccatgcgggc atttatggag ttgattcgtc cattcacacc + 2101 ttagaaaatc tctatggagt ggatatcaat tactatgtgc gattgaactt cacttctttc + 2161 ttgaaaatga ttgacttatt gggaggggta gatgttcata atgatcaaga attttcaact + 2221 ctacatggga agttccattt cccagtaggg aatgtccatc tagactctga gcaggctcta + 2281 ggttttgtac gtgaacgcta ctcactagcc gatggagacc gtgaccgtgg tcgcaaccaa + 2341 caaaaggtca ttgtagcaat tattaagaag ttaacttcta cagaggtttt gaaaaactat + 2401 agtagtattc ttcaaggatt gcaggattct cttcaaacaa atatgccgat tgagactatg + 2461 atagatttag tgaatactca gttggagagt 
ggagggaatt ataaagtaaa ttcgcaagac + 2521 ttgaaaggta caggtcggat ggatcttcct tcttatgcaa tgccagacag taacctctat + 2581 gtgatggaaa tagatgatag tagtttagct gtagttaaag cagctataca ggatgtgatg + 2641 gagggtagat gaaatgatag acatccattc gcatatcgtt tttgatgtag atgacggtcc + 2701 caagtcaaga gaggaaagca aggctctctt ggcagaagcc tacagacagg gggtgcgaac + 2761 cattgtctct acctctcacc gtcgcaaggg catgtttgaa actccggaag agaagatagc + 2821 agaaaacttt cttcaggttc gggaaatagc taaggaagtg gcgagtgact tagtcattgc + 2881 ttacggggct gaaatttact acacaccaga tgttctggat aagctgggaa aaaagcggat + 2941 tccgaccctc aatgatagtc gttatgcctt gatagagttt agtatgaata ctccttatcg + 3001 cgatattcat agcgccttga gcaagatttt gatgttggga attactccag tcattgccca + 3061 cattgagcgc tatgatgctc ttgaaaataa tgaaaaacgc gttcgagaac taatcgatat + 3121 gggctgttac acgcaagtaa atagttcaca tgtcctcaaa cccaaacttt ttggcgaacg + 3181 ttataaattc atgaaaaaaa gagctcagta ttttttagag caggatttgg tttatgtcat + 3241 tgcaagtgat atgcacaatc tagacggtag acctcctcat atggcagaag catatgacct + 3301 tgttacccaa aaatacggag aagcgaaggc tcaggaactt tttatagaca atcctcgaaa + 3361 aattgtaatg gatcaactaa tttaggagaa atgatgaaag aacaaaacac gatagaaatc + 3421 gatgtatttc aattatttaa aaccttgtgg caacgcaagc taatgatttt attagtggca + 3481 cttgtgacaa gtgcgggggc ttttgcatat agcactttta ttgttaagcc agaatatacg + 3541 agtaccacgc gaatttacgt agtgaatcgc aatcaaggag acaagccggg gctgacaaat + 3601 caggatttgc aggcaggaac ttatctggta aaagactacc gtgagattat cctttcgcag + 3661 gatgcattgg aaaaagtagc gacaaatttg aagttggata tgccagcaaa aacgttagcc + 3721 agcaaagttc aagtggctgt accagctgac actcgtatcg tctcaatctc tgtcaaggat + 3781 aaacagccag aggaagccag tcgtatcgct aattctctac gagaagttgc tgcagaaaag + 3841 atcgtcgctg taacgcgagt atctgatgta acgacacttg aagaagcgcg accagctacg + 3901 actccctctt ctccaaatgt tcgacgcaat tccttgtttg gttttcttgg aggagcagtc + 3961 gtaacagtaa ttgctgttct tttgattgag ttgctcgaca cccgtgtgaa acgtcctgaa + 4021 gatattgaag atgtactgaa aattccactt ttagggctcg ttccagattt tgacaaaatg + 4081 aaataggagg aagttatgcc aacattagaa atctcacagg caaaattgga 
ttctgtaaaa + 4141 aaggcagagg aatattataa cgctttgtgc acgaacctac agttaagtgg agatggtttg + 4201 aaagtatttt ctatcacttc tgtgaaaata ggagaaggaa aatcaacgac ttccaccaat + 4261 atcgcttggg cttttgcgcg tgcaggttac aaaacgctgc tgattgatgg agatattcgc + 4321 aattctgtta tgttaggtgt ctttaaagca agggataaga ttacaggcct gacagaattt + 4381 ttatcaggaa ctacagacct atcacaaggg ctttgtgata ccaatatcga aaatctcttt + 4441 gtaattcagg ctggctctgt gtcaccgaat ccgacagctc ttcttcaaag taagaatttc + 4501 agtacaatgc ttgaaacctt gcgtaaatat tttgactaca tcattgtaga tactgctcct + 4561 gtcggtgtcg tgattgatgc ggctattatt acgcgaaaat gcgatgcttc tattttagtg + 4621 acggaggcag gtgaaataaa tcgacgggat attcaaaaag caaaagaaca gttggaacac + 4681 acagggaagc cgtttttggg agttgtgttg aataaattcg atacttcagt agacaaatac + 4741 ggttcttatg gaaattatgg agattacggg aaaaataaaa aataggtcgg gggatagaga + 4801 tgaatggaaa aatagtaaag tcttcattgg ccataatcca gagctttctt gttattttat + 4861 tgacttatct acttagtgct gtgagagaaa cggagattgt ttcaacaaca gctattgcac + 4921 tttatatcct ccattatttt gtcttttata tcagtgatta tggacaggat ttctttaaaa + 4981 ggggatattt gattgaactt gtccagacat tgaaatatat cctattcttt gcactagcga + 5041 ttagtatttc taattttttc ttagaggatc gatttagtat ttccagacga ggcatgattt + 5101 acttcctcac attacatgct ctcttagtct atgtgctaaa cctatttatc aagtggtatt + 5161 ggaagcgggc ttatcccaac tttaaaggaa gtaagaagat tctcctactt acagcaactt + 5221 ctcgtgtcga aaaggtactg gatagattaa tagaatcaaa tgaggttgtt ggggagttgg + 5281 tagccgtcag tgtcttagat aaaccagatt ttcagcatga ttgtttaaag gtagtagcag + 5341 agggggagat agtaaacttt gcgactcatg aggtggtcga tgaagtcttt atcaatcttc + 5401 caagtgaaaa atacaatatt ggagagcttg tctctcagtt tgaaacgatg ggaattgatg + 5461 taacagtcaa tctaaatgct tttgatcgta gtttggcacg taacaagcaa attcgtgaga + 5521 tggcaggatt aaacgttgtg actttttcta caacatttta taagactagt catgtaattg + 5581 ctaagcggat tattgatatc gtgggtgcat tggtagggct gatactatgt ggtttagtca + 5641 gtattgtact ggttcctttg attcgaaagg atgggggctc tgctattttt gctcagacgc + 5701 gtataggaaa aaatggtcgt cagttcactt tttataagtt tcgctctatg tgtgtagatg + 5761 ccgaggcgaa 
aaaaagagaa ctcatggaac aaaataccat gcagggtgga atgtttaagg + 5821 tggacgatga tcctcgtatc acgaaaattg gtcgttttat acggaagact agcttggacg + 5881 agctaccaca gttttacaat gttctaaagg gagatatgag cttggtaggt acacgaccac + 5941 caacagtgga cgagtatgag cactataccc cagaacaaaa acgccgacta agttttaaac + 6001 ctggcataac aggtttatgg caggtcagcg gacgaagtga aatcaagaat ttcgatgaag + 6061 ttgtcaaatt agatgtggcc tatattaatg gttggacaat ctggaaagat attgaaattt + 6121 tattgaaaac ggttaaagtt gtatttatga gagatggagc gaaatagttt ggttgtgtag + 6181 gatatttgta gaggtaaaag tttcgaatat atctcactca atctttttta taagtgaaaa + 6241 taaatttaga agtaggaatt ttatgaatat agtttatgcc acagataata attttgtaga + 6301 tgtattgagt gcttccatca aatcacttta cactactaat tcagatttgg atttaaattt + 6361 atggattatt gctgataaag tttcggatag aaataaagaa aagataaata gattatcaaa + 6421 acaatttgcg cagagagaaa ttaattggat agagaacgtt gagatcccat ttaaattaca + 6481 tttagatagg ggatcaatta gttcatttag cagattattt ctgggaagtg ttcttccatc + 6541 ttcaatgagt aaagttcttt atcttgacag tgatattatt gttatggatt ctttacgaag + 6601 tatttttgat attgatttta agggtaaaat tctctatggg gtgaatgata cttttaataa + 6661 agaatacaag caggtgttgg gtataccaat tgacaagcca atgtttaatg ctggagttat + 6721 gcttattaat ttagagttat ggagaaataa taacgtcgaa gaaagatttt tgcaagtaat + 6781 tcaaaagttt aatggtacta tattacaagg agatttaggg gttttaaatg cagttttata + 6841 taactcattt ggtgtacttc ctccagaata taattatatg accatatttg aagatttgac + 6901 ttatgaagaa atgatagttt ttaaaaaacc aattaattat tattcaaaag aggaaattaa + 6961 aaatgccaga gaacgtatag tcttacgaca tttcacaact agttttttat caaaaagacc + 7021 ttggcaagaa ggcagtaatg ttgcacatat agaccaattt aaaaaatact atgaaggtag + 7081 ttataaaaat gttaaagaat ctattttact aaaaatagtt caaaaattac ccaaaaaatg + 7141 ttcagttttt ttattaggaa ttattcaatc aaaatttaga cctaaattgt atagaatttt + 7201 gaaataaggt ggatagtatt aatgacaaaa aagaaagaat tttattgaaa attcaagaag + 7261 aattgaaatt attaaaagag tttataaaaa tatgttctaa aaataaaatt aagtattttg + 7321 ctcttggagg tagtctatta ggagctgtaa gacacaaagg tttcattcct tgggatgata + 7381 tggatctaag ctttccaaag agttcaatct 
atgtttgaaa taaaggaaaa agtgttagaa + 7441 ttagagaatg tattaatgag tttaggagaa agtatagatg tcaatatata gaatctgtaa + 7501 agatattgaa agaaaaacta tgtcgcctgc taaaaaagca atggctaaaa acgactattt + 7561 tgcattttat gttggaagac ctttatccta tcttttaaca gttcctttcg tgaaaacaaa + 7621 tattactccc aatcaaatat cttatttatc tataattcct ttgattgttg gatttataat + 7681 aatgatattt acaactgatt tcgttgtatt attactggca tggtttctat tttttttatg + 7741 gaacttacta gatggagtag atgggaactt agccagatat cgggagcaat actcgaagga + 7801 tggaagtgta gtagatgcaa tggctggcta tgtagccatg gtgttgacgt atttcggtgc + 7861 aggaatagta gctgctcatt taaacgactc agatatctat ataattttgg gtgcattatc + 7921 tgggatttca ttgatttttc caaggttagt gatgcataag tatatcaata cagtagctca + 7981 agatgagtct gtgagtagca ttaaagataa atctgatttt aatactataa aaatactggc + 8041 tctaaacatg acatcaatta caggaattcc gcaggtttta ctgctattaa ctattttaac + 8101 aaatcagtgg gtacttttta ctttagtata ttttacgatt aattttttat taatgatatt + 8161 ttctttgtat tcattattca aaaaggagaa tgtttagaaa tgggaaagtc agttgcaatt + 8221 ttaatgacca cctataatgg tgagcgatat ttgtcacaac agattgatag tattaggtct + 8281 caaacattca ctaattggac actttttatt agggatgatg gatcaaaaga taaaacaata + 8341 gaagtaatac agaggtattc taagatagat gatagaatta gattcgttga aaatccctca + 8401 aagtttcatg gagcttatta caattttttt aatctaattg aatacgttaa aaacaattat + 8461 caatttgatt attacttttt ttgtgatcaa gatgatattt ggaaagagca caagttagaa + 8521 atacagctgt taagattttc taaagatgac atgccagaga tggtttactc tgatatgtca + 8581 acgattgatg ccagtaataa tttgatagat attagtataa ataaaataat ggggattgaa + 8641 ttaccgaaca taaataattt gtattttatt catgcctata tctgggggtg tactgcaggt + 8701 tttaatcatg cattgctaga gatggttcct tcagttgata ttgataaaga ttatttatat + 8761 atagaaaaac tgtctcatga taattatttt gcaaagtttg cactagagta tgggaaggtg + 8821 ttgttctgcc ctgagcaact ggtcttgtat cgaagacatg gacataatgt aacaactagt + 8881 catcatttta aattatctcc gctaaatgtt ttcagaaagg ctatattggg tttcaatgaa + 8941 ttggcactta cacatgctgg ggtatataat caaactcttt atatgctaaa aaaagcttct + 9001 ggaaaaaatc ctttaagtga tagactactt gaaattcagg aagtaatcaa 
aattggagga + 9061 ttaaaaggtg tgagatattt ctatcagaat cgaatttctc gaaagcaact cgtaagaaca + 9121 atcggcttat ataccatcat gctttttggg acctataaaa aatatattat gaaagaactc + 9181 ttataatgct tttaaatttc ttattcatat ctatttttct attaattatc attacattta + 9241 tattatttga gggggatttt tttcaacctg cagtaatttt aacaatcgct tattttattt + 9301 cgattgcaag tgctctagtt aatagaaatg tttggggaac agaactccat ttcaaaacct + 9361 tttatttgat attgttaggg gttgctacat ttgttatagt ttccttgttg acaaaattgt + 9421 cgtacaggcc taaagtggag ggaatttcgc atgaagaatt gaaagaaata aatccttcaa + 9481 agataatcta tgtcattctt ctgactctaa atcttgttat gctatttctt tatatccgtg + 9541 aaattcagaa agtagtattg ttttcaggta gaagtttttc taatattaca gatttgataa + 9601 gtaactatag gtacctatct tattattcaa atgaagtaga aaatcgtgta agtggaatga + 9661 ttaatcaact atctaaaatt attccagcga ctacacttat ttctttatat atatttatga + 9721 ataattattt tataactaaa caaataaaga aaaatttcat ttatttgatt ccaatagcta + 9781 tattctttgt ctatgcaatc attagtggtg gtagattgcc ccttataagg ttagttgttg + 9841 gagctctgtt gatattgtat atatactctg tgtacgggag tcctaaatct caacttacca + 9901 aaagttttaa aatgatcact cgctctctgt ttacatttct tattttgata gttttattct + 9961 ttcttttaaa atttgtatta gggcgctcct ctcaggaaga ttttatcagt tacatcactc + 10021 gttatatggg aggttcaatt caactatttg atttatttgt tatagatccg atacgacgta + 10081 acaaagaact aggtgcagaa actttttcgg gaatttatga gatgcttgca aaattaggat + 10141 ttgacaataa tattataaaa ggcttagaat ggagagtgtc tcctaattat tattctttag + 10201 ggaatgtgta tactgcaatt agacgttatt attcagactt tggtgtaatt ggtattgtaa + 10261 tttgtcagag ttttacagcg tggttatata ctttaggtta tgaaaaagtt agacattatt + 10321 ctttagttac aaatgttcaa agatttaggt tgatcctatt agcagcttca ttttatccaa + 10381 tatttttaaa tggtatcgag gatgtgtttt atatttcaat ggttaccatt ggatatggaa + 10441 tacaaattgt tatcttttat ctggtctttt gggttcttct gaaagttcag gttgacttta + 10501 acaaaggtaa attaacgata aatagatgaa tttagcgcta atgtattgag tcatataaag + 10561 ggatatattt ggtaggtatt ttaattggag gaagagagcc ttgaaaggga agtacaaatc + 10621 ttctgaaata atttttaggt ggggagtata gctatgaaat tgaagtttct tataacaaat + 
10681 ttgtttcatg tctttttgtc taatctgatt acaattgtca catcggttat agttgtacta + 10741 attttaccaa aaattatggg agtaactgag tatagttatt ggcaactata tattttttac + 10801 ctaacatata ttggtttttt tcatctgggt tggattgatg gaatttatct taaatatggt + 10861 ggattagagt accagaattt agataagaaa cagttttatt ctcaaatact tcaatttttc + 10921 agttttttaa ttttaatttc ttttctatta tttggtttta acttattgat tgtgacagat + 10981 ccaaatgcaa aatatattta taacatgact attattagta tgatagttac aaatttaaga + 11041 atgttattcg tttatatttt gcagatgaca aatcgattaa aggatagctc tataattctg + 11101 ataagtgatc gcgttatata tatttttctt ttatttctgt ttattatatt taaatggcat + 11161 gaatacaagg taatgatttg ggcggatgtt ttaggaagga cattttctct cctactttct + 11221 ttttggattt gtaaagatat tgtttttcaa tccttatccg agttcatatt ggatctgaga + 11281 gagtcttttg acaatatccg tgttggaatc aatttaatgt tatccaatat tgcaagtagt + 11341 atgattattg gtattgttcg aatgggaatt caatggaatt ggaatatcga aacattcggg + 11401 aaagtatcac tgacgctaag catctctaat ttattaatga cttttattaa tgcgattggt + 11461 ttagttgtct ttcctttgtt aaaacggaca aaaacggaaa atttatctaa aatttattcc + 11521 aacttaagaa atgttttgat gctgatcatg tttgcaatat tgctctttta ttatccttta + 11581 aaaattattc tagatctttg gttgccagct tatcgggatg cgttgatttt tatggctctt + 11641 atttttccta tgtcaattta tgaagggaag atggccttgg tgattaatac atatttaaag + 11701 gcgctaagga tggaaagaga tattctcaaa ataaatactt tgattatgtt gttcagtatg + 11761 ttagttaccc taataactac tctattatta aataatttag agctaacggt tatatctata + 11821 gttgttttgc tagctttacg tagtataata gcagaactaa ttctatctaa aaaacttgat + 11881 atatcagttg agcaagacat tgtgttagaa ttacttatga caattatatt tatttcttca + 11941 agttggtact taccgatttg gctcgcagta atagtttatt tgttagcgta tactttatac + 12001 ttgtatctaa agcgtaaaga tacaaaaatg tatatagaat attttagaaa gaaaatattt + 12061 gaataaaaag aactatatat cagttagatg gcaaattcta tttttacctt tttgtcgttt + 12121 aatagaaaat gataaaaaat atgatattat tcttacacat atttataagt aatttaaaat + 12181 aagaatagtt tctggaacat tgctattagt gggaacaggt tacgaaataa tttatcaatt + 12241 ttaaagatgt ttttttaaat ataaaataat ggattctgtc aacaattcta aattctaata + 
12301 ggaatgataa tgctagaaaa tcagattgtt catttttcaa ggaagtttat ttttaaaata + 12361 atatatcttt aagtaagaat tattttatta gacttaacct agcctatcag ttaaattaga + 12421 atatcaactt tgattaatta aaaattagca aaatttattg acattttgtt tttataaatt + 12481 gcaataaagg tctaattctg aatttcagtg aatataagaa agggatccta ctaatgaaag + 12541 gtattattct tgcaggtggt tcggggacac gattatatcc tttgactcgg gctgcatcaa + 12601 aacaacttat gccggtttat gataaaccga tgatttacta tccactttca acattgatgt + 12661 tggctgggat tagggatatt ttgataatct caactcctca agatttgcct cgttttaaag + 12721 agcttcttca agacggatct gagtttggga ttaaactttc ttatgcagag caaccaagtc + 12781 cagatggttt ggcacaagcc tttatcattg gggaagagtt tattggtgat gatagtgttg + 12841 ctttgatttt gggggacaat atctatcacg gccctggttt gagcaaaatg cttcaaaaag + 12901 cagccaagaa agagaaaggt gcgactgttt ttggctacca agtgaaggat ccagagcgtt + 12961 ttggtgtggt tgagtttgat acagacatga atgctatctc catcgaagaa aagccagaat + 13021 accctcgttc aaactatgca gtgacaggac tctatttcta tgataatgat gtagtagaga + 13081 ttgccaagag tatcaaacca agtcctcgcg gagaattaga aatcacagat gtcaacaagg + 13141 cttacttgga tcgtggagac ttatccgttg agcttatggg acgtggcttt gcttggctgg + 13201 atactggaac tcatgaaagt ttactagagg cttcacagta catcgaaaca gtgcaacgga + 13261 tgcaaaatgt tcaggtagca aacttagaag aaattgctta ccgtatgggc tatatcagtc + 13321 gagaagatgt attggcctta gcccaaccac ttaagaaaaa tgaatacgga cagtatctgc + 13381 tccgtttgat tggagaagca tagatgacag ataatttttt cggtaagacg cttgcggcac + 13441 gcaaggttga agctattcca ggcatgttgg agtttgatat ccccgttcat ggagataatc + 13501 gtggctggtt taaagaaaat ttccaaaagg aaaaaatgct tccacttgga tttccagagt + 13561 ctttctttgc agaaggaaaa ttgcaaaaca atgtatcctt ctcacgtaaa aatgtccttc + 13621 gaggcctcca cgcagagcct tgggataagt acatctctgt agcagatgga gggaaagttc + 13681 tgggttcttg ggttgatcta cgcgagggtg aaacctttgg gaatacctat cagacagtga + 13741 ttgatgcgag taagggaatc tttgttcctc gaggcgtagc taatggcttc caagttttat + 13801 cagatacagt gtcatatagc tatctggtca atgattactg ggctcttgaa ctcaaaccca + 13861 agtatgcctt tgtgaactac gctgatccaa gccttggtat tgaatgggaa aatattgcag + 
13921 aagcagaggt ttcagaagca gataaaaatc attcactact taaggatgta aaacctttga + 13981 aaaaagaaga tttggaataa ggaaagaata tgactgaata caaaaatatt atcgtgacag + 14041 gtggagctgg ctttatcggt tctaactttg tccattatgt ttacgagaac tttccagatg + 14101 ttcacgtgac agtcctagat aagttgactt atgctggaaa ccgcgcgaat attgaggaaa + 14161 ttttaggtaa tcgtgttgag ttagttgttg gtgacattgc tgatgcggag ttggtagaca + 14221 agttggctgc tcaagcagat gctatcgttc attatgcagc ggaaagccac aatgataatt + 14281 cgctcaatga tccatcgcca tttattcata ctaacttcat tggaacctat actcttttag + 14341 aagctgctcg taagtatgat attcgcttcc accatgtatc gacagatgaa gtttatggag + 14401 atctcccttt acgcgaagat ttgccaggtc atggagaagg gccgggtgag aaatttacgg + 14461 ctgaaaccaa gtacaatcca agctcgcctt actcatcaac caaggcagcc tcagatttga + 14521 ttgtcaaagc ctgggtgcgt tcttttggag tcaaggcaac gatttccaac tgttcaaata + 14581 actacggtcc ttatcaacat atcgaaaaat tcatcccacg tcagattact aacatcctaa + 14641 gtggtatcaa gccaaaactt tacggtgaag gtaaaaacgt tcgtgactgg attcatacca + 14701 atgaccattc ttcaggagtt tggacaatct tgacaaaagg gcaaatcggt gaaacctact + 14761 tgattggggc tgatggtgag aagaacaata aggaagtttt ggaacttatc cttaaggaaa + 14821 tgggacaagc tgcggatgcc tatgatcatg tgactgaccg tgcaggacat gaccttcgct + 14881 atgcgattga tgctagcaag ctccgtgatg agttggggtg gaaacctgaa tttaccaact + 14941 ttgaagctgg gctcaaggca acaatcaagt ggtatacaga taaccaagaa tggtggaaag + 15001 cagaaaaaga agctgttgaa gccaattatg ctaagactca ggagattatt acagtataaa + 15061 aagcaggaaa tagctgcttt ttattgctat attgggaaga gttacatatt agaaaggtct + 15121 agagatgatt ttaattacag gggcaaatgg ccaattagga acggaacttc gctatttatt + 15181 ggatgaacgt aatgaagaat acgtggcagt agatgtggct aagatggaca ttaccaatga + 15241 agaaatggtt gagaaagttt ttgaagaggt gaaaccgact ttagtctacc attgtgcagc + 15301 ctacaccgct gttgatgcag cagaggatga aggaaaagag ttggacttcg ccatcaatgt + 15361 gacggggaca aaaaatgtcg caaaagcatc tgaaaagcat ggtgcaactc tagtttatat + 15421 ttctacggac tatgtctttg acggtaagaa accagttgga caagagtggg aagttgatga + 15481 ccgaccagat ccacagacag aatatggacg cactaagcgt atgggggaag agttagttga + 
15541 gaagcatgtg tctaatttct atattatccg tactgcctgg gtatttggaa attatggcaa + 15601 aaacttcgtt tttaccatgc aaaatcttgc gaaaactcat aagactttaa cagttgtaaa + 15661 tgatcagtac ggtcgtccga cttggactcg taccttggct gagttcatga cctacctagc + 15721 tgaaaatcgt aaggaatttg gttattatca tttgtcaaat gatgcgacag aagacacaac + 15781 atggtatgat tttgcagttg aaattttgaa agatacagat gtcgaagtca agccagtaga + 15841 ttccagtcaa tttccagcca aagctaaacg tccgctaaac tcaacgatga gcctggccaa + 15901 agccaaagct actggatttg ttattccaac ttggcaagat gcattgcaag aattttacaa + 15961 acaagaagtg agataagtag tagaatgatt ttctagtcta ataaaagagg cagagaatga + 16021 actccaaagg agcataagat gtacgattat cttatcgttg gtgccggtct ttttggtgca + 16081 gtatttgccc atgaatcagc cttaaaagga aaaaaagtaa aagttattga aaaacgaaat + 16141 catattgcgg gtaatatcta tactcgtgaa gaggaaggaa ttcaagttca tcagtatggt + 16201 gctcatatct ttcatacttc tgataaggag atctgggatt atgtgaacca gtttgcagag + 16261 tttaaccgtt atacaaattc tcctgttgca aactataagg gagagattta taacttacct + 16321 tttaatatga ataccttcaa taaactctgg ggagttgtga cgccagcaga agcacaagct + 16381 aagattgagg aacaacgtgc tattttaaat ggtaaaactc ctgaaaattt gaaagaacag + 16441 gcgatttctc ttgtaggtac agacatctac gaaaaattaa tcaaagacta tacagagaaa + 16501 cagtggggca aaccaactac tgaacttcca tcctttatta ttcgccgttt accagtacac + 16561 ctgacctatg ataacaacta ttttaacgat acctatcaag ggattccaat tggtggatac + 16621 actcaaatag ttgaaaaatg ttggattatg aaaatattga tgtagaaaca aatgttgatt + 16681 tctttgtgaa caaagagcaa tatctgaaag attttcctaa gattgtcttt actggtatga + 16741 ttgatgaatt ctttgactat aagttgggcg aactagagta ccgtagtctt cgttttgaaa + 16801 atgagacctt ggatatggaa aattaccaag gaaatgcagt tgtgaactat acggatgcag + 16861 aaaccccata tactcgcatt attgaacaca aacattttga gtttgggagt caagcaaaga + 16921 ctatcattac taaagaacat tctaaaacat gggaaaaagg tgatgagcct tattatccag + 16981 ttaataatga tcgtaataat catttgtata aatcgtataa aaaatttgct gatgagcaag + 17041 ggaatgttat ctttggtggc cgcttaggac actatcgtta ttacgatatg caccaagtaa + 17101 ttggagcagc tttgcagtgc gtgagaaatg agttagatta atactcaatg aaaatcaaag + 
17161 agcaaactag gaagctagcc acaggttgct caaaatactg ttttgaggtt gcagatggaa + 17221 gctgacgcgg tttgaagaga ttttcgaaga gtataaacaa gtaaaactga ctaccagtta + 17281 ttatttagaa atagtattaa aaattccttg actatgtgat atagttgagg gatttttaaa + 17341 tgatattcat atttttttca aagatgttgt ttgaaaaata attttcaaaa attctgaaaa + 17401 ttctgttgac atctttctga aaagagtcta taatggagag aaagttttaa aggagaaaat + 17461 gatgaaaagt tcaaaactac ttgcccttgc gggcgtgaca ttattg +// + diff --git a/public/res/serotype_genbank/serotype_6C.gb b/public/res/serotype_genbank/serotype_6C.gb new file mode 100644 index 0000000..a671744 --- /dev/null +++ b/public/res/serotype_genbank/serotype_6C.gb @@ -0,0 +1,503 @@ +LOCUS EF538714 17682 bp DNA linear BCT 22-AUG-2007 +DEFINITION Streptococcus pneumoniae strain CHPA388 Wzg, Wzh, Wzd, Wze, WchA, + WciNbeta, WciO, WciP, Wzy, Wzx, RmlA, RmlC, RmlB, and RmlD genes, + complete cds. +ACCESSION EF538714 +VERSION EF538714.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 17682) + AUTHORS Park,I.H., Park,S., Hollingshead,S.K. and Nahm,M.H. + TITLE Genetic basis for the new pneumococcal serotype, 6C + JOURNAL Infect. Immun. 75 (9), 4482-4489 (2007) + PUBMED 17576753 +REFERENCE 2 (bases 1 to 17682) + AUTHORS Park,I.H., Park,S., Hollingshead,S.K. and Nahm,M.H. 
+ TITLE Direct Submission + JOURNAL Submitted (05-APR-2007) Pathology, University of Alabama at + Birmingham, 845 19th Street South BBRB 612, Birmingham, AL 35294, + USA +FEATURES Location/Qualifiers + source 1..17682 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="CHPA388" + /serotype="6C" + /db_xref="taxon:1313" + CDS 1555..3000 + /note="integral membrane regulatory protein" + /codon_start=1 + /transl_table=11 + /product="Wzg" + /protein_id="ABR37221.1" + /translation="MSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSEIENVTHLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VDQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGIDVYNDQ + EFTAHTNGKYYPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAIIKKLTST + EVLKNYSSILQGLQDSLQTNMPIETMIDLVNTQLESGGDYKVNSQDLKGTGRMDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + CDS 3002..3733 + /note="protein-tyrosine phosphatase" + /codon_start=1 + /transl_table=11 + /product="Wzh" + /protein_id="ABR37222.1" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAEAYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLGKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEQDLVHVIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + CDS 3739..4434 + /note="capsular polysaccharide biosynthesis protein" + /codon_start=1 + /transl_table=11 + /product="Wzd" + /protein_id="ABR37223.1" + /translation="MMKEQNTIEIDVFQLFKTLWQRKLMILLVALVTSAGAFAYSTFI + VKPEYTSTTRIYVVNRNQGDKPGLTNQDLQAGTYLVKDYREIILSQDALEKVATNLKL + DMPAKTLASKVQVAVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIELLDTRVKRPEDVEDVLKI + PLLGLVPDFDKMK" + CDS 4444..5133 + /note="tyrosine-protein kinase" + /codon_start=1 + /transl_table=11 + /product="Wze" + /protein_id="ABR37224.1" + 
/translation="MPTLEISQAKLDSVKKAEEYYNALCTNLQLSGDGLKVFSITSVK + LGEGKSTTSTNIAWAFARAGYKTLLIDGDIRNSVMLGVFKARDKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRKCDAFYFMDEAGEINRRDIQKAKEQLEHTGKPFLGVVLNKFDTSIDKYGSY + GNYGNYGKNKK" + CDS 5148..6515 + /note="undecaprenylphosphate glucosephosphotransferase; + initial sugar transferase" + /codon_start=1 + /transl_table=11 + /product="WchA" + /protein_id="ABR37225.1" + /translation="MNGKIVKSSLVIIQSSLVILLTYLLSTVREAKIVSTTAIALYIL + HYFVFYISDYGQDFFKRGYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYF + LTLHALLVYVLNLFIKWYWKRAYPNFKGSKKILLLTATSRVEKVLDGLIESNEVVGEL + VAVSVLDKPDFQHDYLKIVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + IDVTVNLNAFDRSLARNKQIRKMAGLNVVTFSTTFYKTSHVIAKRIIDIVGALVGLIL + CGLVSIVLVPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKIGCFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVLM + KDGAK" + CDS 6522..7646 + /note="putative glucosyl transferase" + /codon_start=1 + /transl_table=11 + /product="WciNbeta" + /protein_id="ABR37226.1" + /translation="MFMKLLHFSEVGGGVDRYIKLFLKYSDKEHFKNIVVGSDQLNRQ + TYEQEYNIKFYHIDIYRSLSPIKLLRAIKQFRKILYLERPDIVYLHSTFAGVVGRLAS + MGLSCKVVYNPHGWSFKMDVSKIKQFVYKNIEKFLSYLTDKYILISKSEYEAAQSLKI + PLKKLTLVYNGVEIDEDFNEHQINVLLPINKYVIGMIGRISEQKNPFFFVEFAKKLSE + IYSNLYFGIVGDGELRGRTEELIEEYGLRSSFFITGWVDNPEDYLAQFNQAVLFSKWE + GFGLAVAEYMKHKKPILITNVDGMSELVIDGESGFKVPLYNLEVTVDRSRSIIENREL + ANELGSAAFQRVRSTFEIKEKVSELENIFMSLREDDNVNI" + CDS 7633..8352 + /note="putative ribitol phophotransferase" + /codon_start=1 + /transl_table=11 + /product="WciO" + /protein_id="ABR37227.1" + /translation="MSIYKLCKDIERKTMSPAKKAMPKNDYFAFYVGRPLSYLLTVPF + VKTNITPNQISYLSIIPLIVGFIIMIFTTDFVVLLLAWFLFFLWNLLDGVDGNLARYR + EQYSKDGSVVDAMAGYVAMVLTYFGAGIVAAHLTDSDIYIILGALSGISLIFPRLVMH + KYINTVAQDESVSSIKDKSDFNTIKILALNMTSITGIPQVLLLLTILTNQWVLFTLVY + FTINFLLMIFSLYSLFKKENV" + CDS 8355..9341 + /note="putative rhamnosyl transferase" + /codon_start=1 + /transl_table=11 + 
/product="WciP" + /protein_id="ABR37228.1" + /translation="MGKSVAILMTTYNGERYLSQQIDSIRSQTFTNWTLFIRDDGSKD + KTIEVIQRYSKIDDRIRLVENPSKFHGAYYNFFNLIEYVKNNYQFDYYFFCDQDDIWK + EHKLEIQLLRFSKDDMPEMVYSDLSTIDASNNLIDISINKIMGIELPNINNLYFIQAY + IWGCTAGFNHALLEMVPSVDIDKDYLYIEKLAHDSYFAKFALEYGKVLFCPEQLVLYR + RHGHNVTTSHHFKLSPLNVFRKAILGFNELALTHARVYNQTLYMLKKASGKNPLSDRL + LEIQEVIKIGGLKGVRYFYQNRISRKQLVRTIGLYTIMLFGAYKKYIMKELL" + CDS 9341..10678 + /note="oligosaccharide repeat unit polymerase" + /codon_start=1 + /transl_table=11 + /product="Wzy" + /protein_id="ABR37229.1" + /translation="MLLNFLFISIFLLIIITFILFEGDFFQPAVILTLTYFISIASAL + VNRNVWGTELHFKTFGLILLGVATFIIVSLLTKLSYRPKVEGISYEELKEINPSKIIY + VILLILNLVMLFLYTREIQKVVLFSGRSFSNITDLISNYRYLSYYSNEVEISGMINQL + SKIIPATTLISLYIFINNYFITKQIKKNFIYLIPIAIFFVYAIISGGRLPLIRLVVGA + LLILYIYSVYGSPKSQLTKSFKMITRSLFAFLILIVLFFLLKFVLGRSSQEDFISYIT + RYMGGSIQLFDLFVIDPIRRNKELGAETFSGIYEMLAKLGFDNNIIKGLEWRVSPNYY + SLGNVYTAIRRYYSDFGVIGIVICQSFTAWLYTLGYEKVRHYSLVTNVQRFRLILLAA + SFYPIFLNSIEDVFYISMVTIGYGIQIVIFYLVFWVLLKVQVDFNKGKLTINR" + CDS 10803..12215 + /note="flippase" + /codon_start=1 + /transl_table=11 + /product="Wzx" + /protein_id="ABR37230.1" + /translation="MKLKFLITNLFHVFLSNLITIVTSVIVVLILPKIMGVTEYSYWQ + LYIFYLTYIGFFHLGWIDGIYLKYGGLEYQNLDKKQFYSQILQFFSFLILISFLLFGF + NLLIVTDPNAKYIYNMTIISMIVTNLRMLFVYILQMTNRLKDSSIILISDRVIYIFLL + FLFIIFKWHEYKVMIWADVLGRTFSLLLSFWICKDIVFQSLSEFILDLRESFDNIRVG + INLMLSNIASSMIIGIVRMGIQWNWNIETFGKVSLMLSISNLLMTFINAIGLVVFPLL + KRTKTENLSKIYSNLRNVLMLIMFAILLFYYPLKIILDLWLPAYRDALIFMALIFPMS + IYEGKMALVINTYLKALRMERDILKINTLIMLFSMLVTLITTLLLNNLELTVISIVVL + LALRSIIAELILSKKLDISVEQDIVLELLMTIIFISSSWYLPIWLAVIVYLLAYTLYL + YLKRKDTKMYIEYFRKKIFE" + CDS 12710..13579 + /note="glucose-1-phosphate thymidylyltransferase" + /codon_start=1 + /transl_table=11 + /product="RmlA" + /protein_id="ABR37231.1" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLPRFKELLQDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFIGDDSV + ALILGDNIYHGPGLSKMLQKAAKKEKGATVFGYQVKDPERFGVVEFDTDMNAISIEEK 
+ PEYPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLALAQPLKKN + EYGQYLLRLIGEA" + CDS 13580..14176 + /note="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase" + /codon_start=1 + /transl_table=11 + /product="RmlC" + /protein_id="ABR37232.1" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKNHPLLKDVKPLKKEDLE" + CDS 14186..15235 + /note="dTDP-D-glucose 4,6-dehydratase" + /codon_start=1 + /transl_table=11 + /product="RmlB" + /protein_id="ABR37233.1" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPDVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAAD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + CDS 15301..16152 + /note="dTDP-4-keto-L-rhamnose reductase" + /codon_start=1 + /transl_table=11 + /product="RmlD" + /protein_id="ABR37234.1" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAKMDITNEEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcata taaaaacaag + 181 ggaggactgt ataaaagaca gaaatccttt gttttttata accaaggttt ataaactttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga agatgaacat + 301 aaagaagcgt gtccttagtg caggtctgac ttttgcatct gctttgcttt tagctgcttg + 361 cggccaatca ggttcagata caaaaactta ctcatcaacc 
tttagtggaa atccaactac + 421 atttaactat ctattagact attacgctga taatacagtc aattgaaaca agaacaagac + 481 aaaagagcct cgtaaaaagt attgcaactt ggtaatacct ttttgaggtg ctttttgata + 541 tgagcccatg ttttctcaat aggattgtac tcaggcgagt agggaggaag aggtaaaagt + 601 ttatgcccaa actcttcaca caagagttct agcttcccca ttctatggaa tcttgcatta + 661 tccataataa taaccgatgg tgtggttaat gttggtaaga gaaacttctg aaaccaagct + 721 tcaaaaaagt cgctcgtcat cgtctcttcg taagtcattg gagcgattaa ctcaccattt + 781 gttagacctg caaccaaaga aatcctctga tatcttcttc cagatacttt acctcttctt + 841 aactgacctt ttaatgagcg accatattct cgataaaaat aagtatcgaa tcctgtttca + 901 tcaatctaaa caggtgctag gtgctttaaa ctattaaaat tcttaagaaa taaggctact + 961 ttttctgggt tttgttcata gtaggtgtgg ttcttttttt cgagtgtagc ccatagcttt + 1021 gagcgcatag tggatggtag ttggatgaca gccaaattca gaagctattt cagtcaaata + 1081 agcgtctgga ttgtcagtaa gatagttttt aagtctatct ctatcaacct ttcttggttt + 1141 tgttcctttt acttggtggt ttagctctcc tgttttctct tttagcttta accagccata + 1201 aatggtatta cgtgagattt ggaaaacgtg tgatgcttct gttatactac ctgttcgctc + 1261 acaataagag agaacttttt tacgaaatct attgaatatg ccataaaaag attataccac + 1321 attgtgtact atattagatt gaaactagaa tagtacacct ctgcttctaa aacattgtta + 1381 gaaatcgatt tgactgtcct gatcgttttg tcatgttctt atttcatttt actatatttt + 1441 tggttcgtgg gaagtctact aagatactta aagatgcaga tagtgaaaaa aggtgtagac + 1501 attaccgtaa aaaagtgata taatcgtatg atgttcaatg tataggtgtt aatcatgagt + 1561 agacgtttta aaaaatcagg ttcacagaaa gtgaagcgaa gtgttaatat agttttgttg + 1621 actatttatt tattgttagt ttgtttttta ttgttcttaa tctttaagta caatatcctt + 1681 gcttttagat atcttaatct agtggtaact gcgttagtcc tactagttgc cttggtaggg + 1741 ctactcttga ttatctataa aaaagctgaa aaatttacta tttttctgtt ggtgttttct + 1801 atccttgtca gctcagtgtc gctctttgca gtacagcagt ttgttggact gaccaatcgt + 1861 ttaaatgcga cttctaatta ctcagaatat tcaatcagtg tcgctgtttt agcagatagt + 1921 gagatcgaaa atgttacgca cctgacgagt gtgacagccc cgactgggac tgataatgaa + 1981 aatattcaaa aactactagc tgatatcaag tcaagtcaga ataccgattt gacggtcgac + 2041 
cagagttcgt cttacttggc agcttacaag agtttgattg caggggagac taaggccatt + 2101 gtcttaaata gtgtctttga aaatatcatc gagtcagagt atccagacta tgcatcgaag + 2161 ataaaaaaga tttataccaa gggattcact aaaaaagtag aagctcctaa gacgtctaag + 2221 aatcagtctt tcaatatcta tgttagtgga attgacacct atggtcctat tagttcggtg + 2281 tcgcgatcag atgtcaatat cctgatgact gtcaatcgag ataccaagaa aatcctcttg + 2341 accacaacac cacgtgatgc ctatgtacca atcgcagatg gtggaaataa tcaaaaagat + 2401 aaattaaccc atgcgggcat ttatggagtt gattcgtcca ttcacacctt agaaaatctc + 2461 tatggagtgg atatcaatta ctatgtgcga ttgaacttca cttcgttttt gaaattgatt + 2521 gatttgttgg gtggaattga tgtttataat gatcaagaat ttactgccca tacgaatgga + 2581 aagtattacc ctgtaggcaa tgttcatctt gattcagaac aggctctcgg ttttgttcgt + 2641 gagcgctact cactagcaga tggcgatcgt gaccgtggtc gcaaccaaca aaaggtcatt + 2701 gtagcaatta ttaagaagtt aacttctaca gaggttttga aaaactatag tagtattctt + 2761 caaggattgc aggattctct tcaaacaaat atgccgattg agactatgat agatttagtg + 2821 aatactcagt tggaaagtgg gggggattat aaagtaaatt ctcaagattt aaaagggaca + 2881 ggtcggatgg atcttccttc ttatgcaatg ccagacagta acctctatgt gatggaaata + 2941 gatgatagta gtttagctgt agttaaagca gctatacagg atgtgatgga gggtagatga + 3001 aatgatagac atccattcgc atatcgtttt tgatgtagat gacggtccca agtcaagaga + 3061 ggaaagcaag gctctcttgg cagaagccta cagacagggg gtgcgaacca ttgtctctac + 3121 ctctcaccgt cgcaagggca tgtttgaaac tccggaagag aagatagcag aaaactttct + 3181 tcaggttcgg gaaatagcta aggaagtggc gagtgactta gtcattgctt acggggctga + 3241 aatttactac acaccagatg ttctggataa gctgggaaaa aagcggattc cgaccctcaa + 3301 tgatagtcgt tatgccttga tagagtttag tatgaacact ccttatcgcg atattcatag + 3361 cgccttgagc aagatcttga tgttgggaat tactccagtc attgcccaca ttgagcgcta + 3421 tgatgctctt gaaaataatg aaaaacgcgt tcgagaacta atcgatatgg gctgttacac + 3481 gcaagtaaat agttcacatg tcctcaaacc caaacttttt ggcgaacgtt ataaattcat + 3541 gaaaaaaaga gctcagtatt ttttagagca ggatttggtc catgtcattg caagtgatat + 3601 gcacaatcta gacggtagac ctcctcatat ggcagaagca tatgaccttg ttacccaaaa + 3661 atacggagaa gcgaaggctc 
aggaactttt tatagacaat cctcgaaaaa ttgtaatgga + 3721 tcaactaatt taggagaaat gatgaaagaa caaaacacga tagaaatcga tgtatttcaa + 3781 ttatttaaaa ccttgtggca acgcaagcta atgattttat tagtggcact tgtgacaagt + 3841 gcgggggctt ttgcatatag cacttttatt gttaagccag aatatacgag taccacgcga + 3901 atttacgtag tgaatcgcaa tcaaggagac aagccggggc tgacaaatca ggatttgcag + 3961 gcaggaactt atctggtgaa agactaccgt gagattatcc tttcgcagga tgcattggaa + 4021 aaagtagcga caaatttgaa gttggatatg ccagcaaaaa cgttagccag caaagttcaa + 4081 gtggctgtac cagctgacac tcgtatcgtc tcaatctctg tcaaggataa acagccagag + 4141 gaagccagtc gtatcgctaa ttctctacga gaagttgctg cagaaaagat cgtcgctgta + 4201 acgcgagtat ctgatgtaac gacacttgaa gaagcgcgac cagctacgac tccctcttct + 4261 ccaaatgttc gacgcaattc cttgtttggt tttcttggag gagcagtcgt aacagtaatt + 4321 gctgttcttt tgattgagtt gctcgacacc cgtgtgaaac gtcctgaaga tgttgaagat + 4381 gtactgaaaa ttccactttt agggctcgtt ccagattttg acaaaatgaa ataggaggaa + 4441 gttatgccaa cattagaaat ctcacaggca aaattggatt ctgtaaaaaa ggcagaggaa + 4501 tattataacg ctttgtgcac gaacctacag ttaagtggag atggtttgaa agtattttct + 4561 atcacttctg tgaaactagg agaaggaaaa tcaacgactt ccaccaatat cgcttgggct + 4621 tttgcgcgtg caggatacaa aacgctgctg attgatggag atattcgcaa ttctgttatg + 4681 ttaggtgtct ttaaagcaag ggataagatt acaggcctga cagaattttt atcaggaact + 4741 acagacctat cacaagggct ttgtgatacc aatatcgaaa atctctttgt aattcaggct + 4801 ggctctgtgt caccgaatcc gacagctctt cttcaaagta agaatttcag tacaatgctt + 4861 gaaaccttgc gtaaatattt tgactacatc attgtagata ctgctcctgt cggtgtcgtg + 4921 attgatgcgg ctattattac gcgaaaatgc gatgctttct attttatgga cgaggcaggt + 4981 gaaataaatc gacgggatat tcaaaaagca aaagaacagt tggaacacac agggaagccg + 5041 tttttgggag ttgtgttgaa taaattcgat acttcaatag acaaatacgg ttcttatgga + 5101 aattatggaa attacgggaa aaataaaaaa taggtcgggg gatagagatg aatggaaaaa + 5161 tagtaaagtc ttcattggtc ataatccaga gttctcttgt tattttattg acttatctac + 5221 ttagtactgt gagagaagcg aagattgttt caacaacagc tattgcactt tatatcctcc + 5281 attattttgt cttttatatc agtgattatg gacaggattt 
ctttaaaagg ggatatttga + 5341 ttgaacttgt ccagacattg aaatatatcc tattctttgc actagcgatt agtatttcta + 5401 attttttctt agaggatcga tttagtattt ccagacgagg catgatttac ttcctcacat + 5461 tacatgctct cttagtctat gtgctaaacc tatttatcaa gtggtattgg aagcgggctt + 5521 atcccaactt taaaggaagt aagaagattc tcctacttac agcaacttct cgtgtcgaaa + 5581 aggtactgga tggattaata gaatcaaatg aggttgttgg ggagttggta gccgtcagtg + 5641 tcttagataa accagatttt cagcatgatt atttaaagat agtagcagag ggggagatag + 5701 taaactttgc gactcatgag gtggtcgatg aagtctttat caatcttcca agtgaaaaat + 5761 acaatattgg agagcttgtc tctcagtttg aaacgatggg aattgatgta acagtcaatc + 5821 taaatgcttt tgatcgtagt ttggcacgta acaagcaaat tcgtaagatg gcaggattaa + 5881 acgttgtgac tttttctaca acattttata agactagtca tgtaattgct aagcggatta + 5941 ttgatatcgt gggtgcattg gtcgggttga tattatgtgg tttagtcagt attgtactgg + 6001 ttcctttgat tcgaaaggat gggggctctg ctatttttgc tcagacgcgt ataggaaaaa + 6061 atggtcgtca gttcactttt tataagtttc gctctatgtg tgtagatgcc gaggcgaaaa + 6121 aaagagaact catggaacaa aataccatgc agggtggaat gtttaaggtg gacgatgatc + 6181 ctcgtatcac gaaaattggt tgttttatac ggaagactag cttggacgag ctaccacagt + 6241 tttataatgt tctaaaggga gatatgagtt tggttggcac acgtccacca acagtggatg + 6301 agtatgaaca ctatacccca gaacaaaaac gtcggctaag ttttaaacct ggtataacag + 6361 gcttatggca ggtcagtgga cgaagtgaaa tcaaaaattt cgatgaagtt gtcaaattag + 6421 atgtggctta tatagatgat tggacaatct ggaaagatat tgaaatttta ttgaagacag + 6481 ttaaggtagt attgatgaag gatggagcca aataggggga tatgttcatg aaattgcttc + 6541 attttagtga agttggcggt ggagttgata ggtatattaa gttattttta aaatattcag + 6601 ataaagaaca ttttaaaaat attgtggtag gatcagatca gcttaataga caaacatatg + 6661 aacaagaata taatataaag ttttatcaca ttgatatcta tagaagcttg tctccaataa + 6721 agcttttacg cgcgattaaa caatttagaa aaatattgta tctagaaaga cctgatatag + 6781 tatatctgca cagtactttt gcaggtgtag taggcaggtt agcttctatg ggtttgtcgt + 6841 gtaaagtagt atacaatcct cacggatggt cttttaagat ggatgtttct aagattaagc + 6901 aattcgttta taaaaatatt gaaaagtttt tgtcttatct tacagataag tatatattaa + 6961 
tctctaaatc tgaatatgaa gcggctcaat ctttaaaaat accccttaag aaattgactt + 7021 tagtgtataa tggagtagag attgatgaag attttaacga acatcaaata aacgttttat + 7081 tacccataaa taaatatgtt attgggatga ttggtcgtat tagtgaacag aaaaatcctt + 7141 tcttttttgt tgaatttgca aaaaaattat cagagattta tagcaattta tattttggta + 7201 ttgtcggcga tggcgaattg cgtgggcgaa ctgaagaact aattgaagag tatgggcttc + 7261 gaagctcatt ttttataaca gggtgggtgg ataatccaga ggattattta gctcagttca + 7321 atcaggcagt tcttttctcg aaatgggagg gctttggatt ggcggttgcg gaatatatga + 7381 aacataagaa gccaattctt ataactaatg ttgatgggat gtcagaattg gttattgatg + 7441 gtgagtcagg ttttaaagtc ccactatata atttagaagt aactgtagat agaagtagaa + 7501 gtattattga gaatagagaa ctagccaatg agttaggtag tgctgctttc caaagagttc + 7561 gatctacatt tgaaataaaa gaaaaagtgt cagagttaga gaatatattc atgagtttaa + 7621 gagaggatga taatgtcaat atataaactt tgtaaagata ttgaaagaaa aactatgtcg + 7681 cctgctaaaa aagcaatgcc taaaaacgac tattttgcat tttatgttgg aagaccttta + 7741 tcctatcttt taacagttcc tttcgtgaaa acaaatatta ctcccaatca aatatcttat + 7801 ttatctataa ttcctttgat tgttggattt ataataatga tatttacaac tgatttcgtt + 7861 gtattattac tggcatggtt tctatttttt ttatggaact tactagatgg agtagatggg + 7921 aacttagcca gatatcggga gcaatactcg aaggatggaa gtgtagtaga tgcaatggct + 7981 ggctatgtag ccatggtgtt gacgtatttc ggtgcaggaa tagtagctgc tcatttaacc + 8041 gactcagata tctatataat cctgggtgca ttatctggga tttcattgat ttttccaagg + 8101 ttagtgatgc ataagtatat caatacagta gctcaagatg agtctgtgag tagcattaaa + 8161 gataaatccg attttaatac tataaaaata ctggctctaa acatgacatc aattacagga + 8221 attccgcagg ttttactgct attaactatt ttaacaaatc agtgggtact ttttacttta + 8281 gtatatttca cgattaattt tttattaatg atattttctt tgtattcatt attcaaaaag + 8341 gagaatgttt agaaatggga aagtcagttg caattttaat gaccacctat aatggtgagc + 8401 gatatttgtc acaacagatt gatagtatta ggtctcaaac attcactaat tggacgcttt + 8461 ttattaggga tgatggatca aaagataaaa caatagaagt aatacagagg tattctaaga + 8521 tagatgatag aattagatta gttgaaaatc cctcaaagtt tcatggagct tattacaatt + 8581 tttttaatct aattgaatac 
gttaaaaaca attatcaatt tgattattac tttttttgtg + 8641 atcaagatga tatttggaaa gagcacaagt tagaaataca gctgttaaga ttttctaaag + 8701 atgacatgcc agagatggtt tactctgatc tgtcaacgat tgatgccagt aataatttga + 8761 tagatattag tataaataaa ataatgggga ttgaattacc gaacataaat aatttgtatt + 8821 ttattcaagc ctatatctgg gggtgtactg caggttttaa tcatgcattg ctagagatgg + 8881 ttccttcagt tgatattgat aaagattatt tatatataga aaaactggct catgatagtt + 8941 attttgcaaa gtttgcgcta gagtatggga aggtgttgtt ctgccctgaa caactggtct + 9001 tgtatcgaag acatggacat aatgtaacaa ctagtcatca ttttaaatta tctccgctaa + 9061 atgttttcag aaaggctata ttgggtttca atgaattggc acttacacat gctagggtat + 9121 ataatcaaac tctttatatg ctaaaaaaag cttctggaaa aaatccttta agtgatagac + 9181 tacttgaaat tcaggaagta atcaaaattg gaggattaaa aggtgtgaga tatttctatc + 9241 agaatcgaat ttctcgaaaa caactcgtaa gaacaatcgg cttatatacc atcatgcttt + 9301 ttggggccta taaaaaatat attatgaaag agctcttata atgcttttaa atttcttatt + 9361 catatctatt tttctattaa ttatcattac atttatatta tttgaggggg atttttttca + 9421 acctgcagta attttaacac tcacttattt tatttcgatt gcaagtgctc tagttaatag + 9481 aaatgtttgg ggaacagaac tccatttcaa aacctttggt ttgatattgt taggggttgc + 9541 tacatttatt atagtttcct tgttgacaaa attgtcgtac aggcctaaag tggagggaat + 9601 ttcgtatgaa gaattgaaag aaataaatcc ttcaaagata atctatgtca ttcttctgat + 9661 tctaaatctt gttatgctat ttctttatac ccgtgaaatt cagaaagtgg tattgttttc + 9721 aggtagaagt ttttctaata ttacagattt gataagtaac tataggtacc tatcttatta + 9781 ttcaaatgaa gtagaaataa gtggaatgat taatcaacta tctaaaatta ttccagcgac + 9841 tacacttatt tctttatata tatttataaa taattatttt ataactaaac aaataaagaa + 9901 aaatttcatt tatttgattc caatagctat attctttgtc tatgcaatca ttagtggtgg + 9961 tagattgccc cttataaggt tagttgttgg agctctgttg atattgtata tatactctgt + 10021 gtacgggagt cctaaatctc aacttaccaa aagttttaaa atgattactc gctctctgtt + 10081 tgcatttctt attttgatag ttttattctt tcttttaaaa tttgtattag ggcgctcctc + 10141 tcaggaagat tttatcagtt acatcactcg ttatatggga ggttcaattc aactatttga + 10201 tttatttgtt atagatccga tacgacgtaa caaagaacta 
ggtgcagaaa ctttttcggg + 10261 aatttatgag atgcttgcaa aattaggatt tgacaataat attataaaag gcttagaatg + 10321 gagagtgtct cctaattatt attctttagg aaatgtgtat actgcaatta gacgttatta + 10381 ttcagacttt ggtgtaattg gtattgtaat ttgtcagagt tttacagcgt ggttatatac + 10441 tttaggttat gaaaaagtta gacattattc tttagttaca aatgttcaaa gatttaggtt + 10501 gatcctatta gcagcttcat tttatccaat atttttaaat agtatcgagg atgtgtttta + 10561 tatttcaatg gttaccattg gatatggaat acaaattgtt atcttttatc tggtcttttg + 10621 ggttcttctg aaagttcagg ttgactttaa caaaggtaaa ttaacgataa atagatgaat + 10681 ttagcgctaa tgtattgaat catataaagg gatatatttg gtaggtattt taattggagg + 10741 aagagagcct tgaatgggaa gtacaaatct tctgaaacaa tttttaggtg gggagtatag + 10801 ctatgaaatt gaagtttctt ataacaaatt tatttcatgt ctttttgtct aatctgatta + 10861 caattgtcac atcggttata gttgtactaa ttttaccaaa aattatggga gtaactgagt + 10921 atagttattg gcaactatat attttttacc taacatatat tggttttttt catctgggtt + 10981 ggattgatgg aatttatctt aaatatggtg gattagagta ccagaattta gataagaaac + 11041 agttttattc tcaaatactt caatttttca gttttttaat tttaatttct tttctattat + 11101 ttggttttaa cttattgatt gtgacagatc caaatgcaaa atatatttat aacatgacta + 11161 ttattagtat gatagttaca aatttaagaa tgttatttgt ttatattttg cagatgacaa + 11221 atcgattaaa ggatagctct ataattctga taagtgatcg cgttatatat atttttcttt + 11281 tatttctgtt tattatattt aaatggcatg aatacaaggt aatgatttgg gcggatgttt + 11341 taggaaggac attttctctc ctactttctt tttggatttg taaagatatt gtttttcaat + 11401 ccttatccga gttcatattg gatctgagag agtcttttga caatatccgt gttggaatca + 11461 acttaatgtt atccaatatt gcaagtagta tgattattgg tattgttcga atgggaattc + 11521 aatggaattg gaatatcgaa acattcggga aagtatcact gatgctaagc atctctaatt + 11581 tattaatgac ttttattaat gcgattggtt tagttgtctt tcctttgtta aaacggacaa + 11641 aaacggaaaa tttatctaaa atttattcca acttaagaaa tgttttgatg ctgatcatgt + 11701 ttgcaatatt gctcttttat tatcctttaa aaattattct agatctttgg ttgccagctt + 11761 atcgggatgc gttgattttt atggctctta tttttcctat gtcaatttat gaagggaaga + 11821 tggccttggt gattaataca tatttaaagg cgctaaggat 
ggaaagagat attctcaaaa + 11881 taaatacttt gattatgttg ttcagtatgt tagttaccct aataactact ctattattaa + 11941 ataatttaga gctaacggtt atatctatag ttgttttgct agctttacgt agtataatag + 12001 cagaactaat tctatctaaa aaacttgata tatcagttga gcaagacatt gtgttagaat + 12061 tacttatgac aattatattt atttcttcaa gttggtactt accgatttgg ctcgcagtaa + 12121 tagtttattt gttagcgtat actttatact tgtatctaaa gcgtaaagat acaaaaatgt + 12181 atatagaata ttttagaaag aaaatatttg aataaaaaga actatatatc agttagatgg + 12241 caaattctat ttttaccttt ttgtcgttta atagaaaatg ataaaaaata tgatactatt + 12301 ttttacacat atttataagc gatttgaatg tatcaggtga taaattaatt taaaataaga + 12361 atagtttctg gaacattgct attagtggga acaggttacg aaataattta tcaattttaa + 12421 agacgttttt ttaaatataa aataatggat tttgtcaaca attctaaatt ctaataggaa + 12481 tgataatgct agaaaatcag attgttcatt tttcaaggaa gtttattttt aaaataatat + 12541 atctttaagt aagaattatt ttattagact taacctagcc tatcagttaa attagaatat + 12601 caactttgat taattaaaaa ttagcaaaat ttattgacat tttgttttta taaattgcaa + 12661 taaaggtcta attctgaatt tcagtgaata taagaaaggg atcctactaa tgaaaggtat + 12721 tattcttgca ggtggttcgg ggacacgatt atatcctttg actcgggctg catcaaaaca + 12781 acttatgccg gtttatgata aaccgatgat ttactatcca ctttcaacat tgatgttggc + 12841 tgggattagg gatattttga taatctcaac tcctcaagat ttgcctcgtt ttaaagagct + 12901 tcttcaagac ggatctgagt ttgggattaa actttcttat gcagagcaac caagtccaga + 12961 tggtttggca caagccttta tcattgggga agagtttatt ggtgatgata gtgttgcttt + 13021 gattttgggg gacaatatct atcacggccc tggtttgagc aaaatgcttc aaaaagcagc + 13081 caagaaagag aaaggtgcga ctgtttttgg ctaccaagtg aaggatccag agcgttttgg + 13141 tgtggttgag tttgatacag acatgaatgc tatctccatc gaagaaaagc cagaataccc + 13201 tcgttcaaac tatgcagtga caggactcta tttctatgat aatgatgtag tagagattgc + 13261 caagagtatc aaaccaagtc ctcgcggaga attagaaatc acagatgtca acaaggctta + 13321 cttggatcgt ggagacttat ccgttgagct tatgggacgt ggctttgctt ggctggatac + 13381 tggaactcat gaaagtttac tagaggcttc acagtacatc gaaacagtgc aacggatgca + 13441 aaatgttcag gtagcaaact tagaagaaat tgcttaccgt 
atgggctata tcagtcgaga + 13501 agatgtattg gccttagccc aaccacttaa gaaaaatgaa tacggacagt atctgctccg + 13561 tttgattgga gaagcataga tgacagataa ttttttcggt aagacgcttg cggcacgcaa + 13621 ggttgaagct attccaggca tgttggagtt tgatatcccc gttcatggag ataatcgtgg + 13681 ctggtttaaa gaaaatttcc aaaaggaaaa aatgcttcca cttggatttc cagagtcttt + 13741 ctttgcagaa ggaaaattgc aaaacaatgt atccttctca cgtaaaaatg tccttcgagg + 13801 cctccacgca gagccttggg ataagtacat ctctgtagca gatggaggga aagttctggg + 13861 ttcttgggtt gatctacgcg agggtgaaac ctttgggaat acctatcaga cagtgattga + 13921 tgcgagtaag ggaatctttg ttcctcgagg cgtagctaat ggcttccaag ttttatcaga + 13981 tacagtgtca tatagctatc tggtcaatga ttactgggct cttgaactca aacccaagta + 14041 tgcctttgtg aactacgctg atccaagcct tggtattgaa tgggaaaata ttgcagaagc + 14101 agaggtttca gaagcagata aaaatcatcc actacttaag gatgtaaaac ctttgaaaaa + 14161 agaagatttg gaataaggaa agaatatgac tgaatacaaa aatattatcg tgacaggtgg + 14221 agctggcttt atcggttcta actttgtcca ttatgtttac gagaactttc cagatgttca + 14281 cgtgacagtc ctagataagt tgacttatgc tggaaaccgc gcgaatattg aggaaatttt + 14341 aggtaatcgt gttgagttag ttgttggtga cattgctgat gcggagttgg tagacaagtt + 14401 ggctgctcaa gcagatgcta tcgttcatta tgcagcggaa agccacaatg ataattcgct + 14461 caatgatcca tcgccattta ttcatactaa cttcattgga acctatactc ttttagaagc + 14521 tgctcgtaag tatgatattc gcttccacca tgtatcgaca gatgaagttt atggggatct + 14581 ccctttacgc gaagatttgc caggtcatgg agaagggccg ggtgagaaat ttacggctga + 14641 aaccaagtac aatccaagct cgccttactc atcaaccaag gcagcctcag atttgattgt + 14701 caaagcctgg gtgcgttctt ttggagtcaa ggcaacgatt tccaactgtt caaataacta + 14761 cggtccttat caacatatcg aaaaattcat cccacgtcag attactaaca tcctaagtgg + 14821 tatcaagcca aaactttacg gtgaaggtaa aaacgttcgt gactggattc ataccaatga + 14881 ccattcttca ggagtttgga caatcttgac aaaagggcaa atcggtgaaa cctacttgat + 14941 tggggctgat ggtgagaaga acaataagga agttttggaa cttatcctta aggaaatggg + 15001 acaagctgcg gatgcctatg atcatgtgac tgaccgtgca ggacatgacc ttcgctatgc + 15061 gattgatgct agcaagctcc gtgatgagtt ggggtggaaa 
cctgaattta ccaactttga + 15121 agctgggctc aaggcaacaa tcaagtggta tacagataac caagaatggt ggaaagcaga + 15181 aaaagaagct gttgaagcca attatgctaa gactcaggag attattacag tataaaaagc + 15241 aggaaatagc tgctttttat tgctatattg ggaagagtta catattagaa aggtctagag + 15301 atgattttaa ttacaggggc aaatggccaa ttaggaacgg aacttcgcta tttattggat + 15361 gaacgtaatg aagaatacgt ggcagtagat gtggctaaga tggacattac caatgaagaa + 15421 atggttgaga aagtttttga agaggtgaaa ccgactttag tctaccattg tgcagcctac + 15481 accgctgttg atgcagcaga ggatgaagga aaagagttgg acttcgccat caatgtgacg + 15541 gggacaaaaa atgtcgcaaa agcatctgaa aagcatggtg caactctagt ttatatttct + 15601 acggactatg tctttgacgg taagaaacca gttggacaag agtgggaagt tgatgaccga + 15661 ccagatccac agacagaata tggacgcact aagcgtatgg gggaagagtt agttgagaag + 15721 catgtgtcta atttctatat tatccgtact gcctgggtat ttggaaatta tggcaaaaac + 15781 ttcgttttta ccatgcaaaa tcttgcgaaa actcataaga ctttaacagt tgtaaatgat + 15841 cagtacggtc gtccgacttg gactcgtacc ttggctgagt tcatgaccta cctagctgaa + 15901 aatcgtaagg aatttggtta ttatcatttg tcaaatgatg cgacagaaga cacaacatgg + 15961 tatgattttg cagttgaaat tttgaaagat acagatgtcg aagtcaagcc agtagattcc + 16021 agtcaatttc cagccaaagc taaacgtccg ctaaactcaa cgatgagcct ggccaaagcc + 16081 aaagctactg gatttgttat tccaacttgg caagatgcat tgcaagaatt ttacaaacaa + 16141 gaagtgagat aagtagtaga atgattttct agtctaataa aagaggcaga gaatgaactc + 16201 caaaggagca taagatgtac gattatctta tcgttggtgc cggtcttttt ggtgcagtat + 16261 ttgcccatga atcagcctta aaaggaaaaa aagtaaaagt tattgaaaaa cgaaatcata + 16321 ttgcgggtaa tatctatact cgtgaagagg aaggaattca agttcatcag tatggtgctc + 16381 atatctttca tacttctgat aaggagatct gggattatgt gaaccagttt gcagagttta + 16441 accgttatac aaattctcct gttgcaaact ataagggaga gatttataac ttacctttta + 16501 atatgaatac cttcaataaa ctctggggag ttgtgacgcc agcagaagca caagctaaga + 16561 ttgaggaaca acgtgctatt ttaaatggta aaactcctga aaatttgaaa gaacaggcga + 16621 tttctcttgt aggtacagac atctacgaaa aattaatcaa agactataca gagaaacagt + 16681 ggggcaaacc aactactgaa cttccatcct ttattattcg 
ccgtttacca gtacacctga + 16741 cctatgataa caactatttt aacgatacct atcaagggat tccaattggt ggatacactc + 16801 aaatagttga aaaatgttgg attatgaaaa tattgatgta gaaacaaatg ttgatttctt + 16861 tgtgaacaaa gagcaatatc tgaaagattt tcctaagatt gtctttactg gtatgattga + 16921 tgaattcttt gactataagt tgggcgaact agagtaccgt agtcttcgtt ttgaaaatga + 16981 gaccttggat atggaaaatt accaaggaaa tgcagttgtg aactatacgg atgcagaaac + 17041 cccatatact cgcattattg aacacaaaca ttttgagttt gggagtcaag caaagactat + 17101 cattactaaa gaacattcta aaacatggga aaaaggtgat gagccttatt atccagttaa + 17161 taatgatcgt aataatcatt tgtataaatc gtataaaaaa tttgctgatg agcaagggaa + 17221 tgttatcttt ggtggccgct taggacacta tcgttattac gatatgcacc aagtaattgg + 17281 agcagctttg cagtgcgtga gaaatgagtt agattaatac tcaatgaaaa tcaaagagca + 17341 aactaggaag ctagccacag gttgctcaaa atactgtttt gaggttgcag atggaagctg + 17401 acgcggtttg aagagatttt cgaagagtat aaacaagtaa aactgactac cagttattat + 17461 ttagaaatag tattaaaaat tccttgacta tgtgatatag ttgagggatt tttaaatgat + 17521 attcatattt tttgcaaaga tgttgtttga aaaataattt tcaaaaattc tgaaaattct + 17581 gttgacaact ttctgaaaag agtctataat ggagagaaag ttttaaagga gaaaatgatg + 17641 aaaagttcaa aactacttgc ccttgcgggc gtgacattat tg +// + diff --git a/public/res/serotype_genbank/serotype_6D.gb b/public/res/serotype_genbank/serotype_6D.gb new file mode 100644 index 0000000..c302ccd --- /dev/null +++ b/public/res/serotype_genbank/serotype_6D.gb @@ -0,0 +1,525 @@ +LOCUS HM448897 15933 bp DNA linear BCT 26-JAN-2011 +DEFINITION Streptococcus pneumoniae strain MNZ920 cps gene locus, complete + sequence. +ACCESSION HM448897 +VERSION HM448897.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 15933) + AUTHORS Nahm,M.H., Oliver,M.B., Siira,L., Kaijalainen,T., Lambertsen,L.M. + and Virolainen,A. + TITLE A report of Streptococcus pneumoniae serotype 6D in Europe + JOURNAL J. Med. Microbiol. 
60 (PT 1), 46-48 (2011) + PUBMED 20829399 +REFERENCE 2 (bases 1 to 15933) + AUTHORS Nahm,M.H., Oliver,M.B., Siira,L., Kaijalainen,T., Lambertsen,L. and + Virolainen,A. + TITLE Direct Submission + JOURNAL Submitted (03-JUN-2010) Microbiology, University of Alabama at + Birmingham, Bevill Building, Room 614, 845 19th Street South, + Birmingham, AL 35294, USA +FEATURES Location/Qualifiers + source 1..15933 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="MNZ920" + /db_xref="taxon:1313" + misc_feature 1..15933 + /note="cps gene locus" + gene 1142..2587 + /gene="cpsA" + /gene_synonym="wzg" + CDS 1142..2587 + /gene="cpsA" + /gene_synonym="wzg" + /note="integral membrane regulatory protein" + /codon_start=1 + /transl_table=11 + /product="CpsA" + /protein_id="ADQ39178.1" + /translation="MSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VDQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGIDVYNDQ + EFTAHTNGKYYPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAIIKKLTST + EVLKNYSSILQGLQDSLQTNMPIETMIDLVNTQLESGGDYKVNSQDLKGTGRMDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + gene 2589..3320 + /gene="cpsB" + /gene_synonym="wzh" + CDS 2589..3320 + /gene="cpsB" + /gene_synonym="wzh" + /note="protein-tyrosine phosphatase" + /codon_start=1 + /transl_table=11 + /product="CpsB" + /protein_id="ADQ39179.1" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAEAYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLGKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEQDLVHVIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + gene 3326..4021 + /gene="cpsC" + /gene_synonym="wzd" + CDS 3326..4021 + /gene="cpsC" + /gene_synonym="wzd" + /note="capsular polysaccharide biosynthesis protein" + 
/codon_start=1 + /transl_table=11 + /product="CpsC" + /protein_id="ADQ39180.1" + /translation="MMKEQNTIEIDVFQLFKTLWQRKLMILLVALVTSAGAFAYSTFI + VKPEYTSTTRIYVVNRNQGDKSGLTNQDLQAGTYLVKDYREIILSQDALEKVATNLKL + DMPAKTLASKVQVAVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIELLDTRVKRPEDVEDVLKI + PLLGLVPDFDKIK" + gene 4022..4720 + /gene="cpsD" + /gene_synonym="wze" + CDS 4031..4720 + /gene="cpsD" + /gene_synonym="wze" + /note="tyrosine-protein kinase" + /codon_start=1 + /transl_table=11 + /product="CpsD" + /protein_id="ADQ39181.1" + /translation="MPTLEISQAKLDSVKKAEEYYNALCTNLQLSGDGLKVFSITSVK + LGEGKSTTSTNIAWAFARAGYKTLLIDGDIRNSVMLGVFKARNKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFTTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRNCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGIVLNKFDTSVDKYGSY + GNYGNYGKNKK" + gene 4735..6102 + /gene="wchA" + CDS 4735..6102 + /gene="wchA" + /note="undecaprenylphosphate glucosephosphotransferase" + /codon_start=1 + /transl_table=11 + /product="WchA" + /protein_id="ADQ39182.1" + /translation="MNGKILRSSLAIIQSFLVILLTYLLSAVRETEIVSTTAIALYIL + HYFVFYISDYGQDFFKRKYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYF + LTLHALLIYVLNLFIKWYWKRAYPNFKGSKKILLLTATSRVEKVLDGLIESNEVVGEL + VAVSVLDKPDFQHDYLKIVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + IDVTVNLNAFDRSLARNKQIRKMAGLNVVTFSTTFYKTSHVIAKRIIDIVGALVGLIL + CGLVSIVLVPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKIGCFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVLM + KDGAK" + gene 6109..7233 + /gene="wciNbeta" + CDS 6109..7233 + /gene="wciNbeta" + /note="putative glucosyl transferase" + /codon_start=1 + /transl_table=11 + /product="WciNbeta" + /protein_id="ADQ39183.1" + /translation="MFMKLLHFSEVGGGVDRYIKLYLKYSDKEHFKNIVVGSDQLNRQ + TYEQEYNIKFYHIDIYRSLSPIKLLRAIKQFRKILYLERPDIVYLHSTFAGVVGRLAS + MGLSCKVVYNPHGWSFKMDVSKIKQFVYKNIEKFLSYLTDKYILISKSEYEAAQSLKI + PLKKLTLVYNGVEIDEDFNENQINVLLPINKYVIGMIGRISEQKNPFFFVEFAKKLSE + 
IYSNLYFVIVGDGELRGRTEELIEEYGLRSSFFITGWVDNPEDYLAQFNQAVLFSKWE + GFGLAVAEYMKHKKPILITNVDGMSELVIDGESGFKVPLYNLEVTVDRSRSIIENREL + ANELGSAAFQRVRSTFEIKEKVSELENIFMSLRGDDNVNI" + gene 7220..7939 + /gene="wciO" + CDS 7220..7939 + /gene="wciO" + /note="putative ribitol phosphotransferase" + /codon_start=1 + /transl_table=11 + /product="WciO" + /protein_id="ADQ39184.1" + /translation="MSIYKLCKDIERKTMSPAKKAMAKNDYFAFYVGRPLSYLLTVPF + VKTNITPNQISYLSIIPLIVGFIIMIFTTDFVVLLLAWFLFFLWNLLDGVDGNLARYR + EQYSKDGSVVDAMAGYVAMVLTYFGAGIVAAHLNDSDIYIILGALSGISLIFPRLVMH + KYINTVAQDESVSSIKDKSDFNTIKILALNMTSITGIPQVLLLLTILTNQWVLFTLVY + FTINFLLMIFSLYSLFKKENV" + gene 7942..8928 + /gene="wciP" + CDS 7942..8928 + /gene="wciP" + /note="putative rhamnosyl transferase" + /codon_start=1 + /transl_table=11 + /product="WciP" + /protein_id="ADQ39185.1" + /translation="MGKSVAILMTTYNGERYLSQQIDSIRSQTFTNWTLFIRDDGSKD + KTIEVIQRYSKIDDRIRLVENPSKFHGAYYNFFNLIEYVKNNYQFDYYFFCDQDDIWK + EHKLEIQLLRFSKDDMPEMVYSDLSTIDASNNLIDISINKIMGIELPNINNLYFIHAY + IWGCTAGFNHALLEMVPSVDIDKDYLYIEKLSHDNYFAKFALEYGKVLFCPEQLVLYR + RHGHNVTTSHHFKLSPLNVFRKAILGFNELALTHAGVYNQTLYMLKKASGKNPLSDRL + LEIQEVIKIGGLKGVRYFYQNRISRKQLVRTIGLYTIMLFGTYKKYIMKELL" + gene 8928..10271 + /gene="wzy" + CDS 8928..10271 + /gene="wzy" + /note="oligosaccharide repeat unit polymerase" + /codon_start=1 + /transl_table=11 + /product="Wzy" + /protein_id="ADQ39186.1" + /translation="MLLNFLFISIFLLIIITFILFEGDFFQPAVILTIAYFISIASAL + VNRNVWGTELHFKTFYLILLGVATFVIVSLLTKLSYRPKVEGISHEELKEINPSKIIY + VILLTLNLVMLFLYIREIQKVVLFSGRSFSNITDLISNYRYLSYYSNEVENRVSGMIN + QLSKIIPATTLISLYIFMNNYFITKQIKKNFIYLIPIAIFFVYAIISGGRLPLIRLVV + GSLLILYIYSVYGSPKSQLTKSFKMITRSLFTFLILIVLFFLLKFVLGRSSQEDFISY + ITRYMGGSIQLFDLFVIDPIRRNKELGAETFSGIYEMLAKLGFDNNIIKGLEWRVSPN + YYSLGNVYTAIRRYYSDFGVIGIVICQSFTAWLYTLGYEKVRHYSLVTNVQRFRLILL + AASFYPIFLNGIEDVFYISMVTIGYGIQIVIFYLVFWVLLKVQVDFNKGKLTINR" + gene 10396..11808 + /gene="wzx" + CDS 10396..11808 + /gene="wzx" + /note="flippase" + /codon_start=1 + /transl_table=11 + /product="Wzx" + 
/protein_id="ADQ39187.1" + /translation="MKLKFLITNLFHVFLSNLITIVTSVIVVLILPKIMGVTEYSYWQ + LYIFYLTYIGFFHLGWIDGIYLKYGGLEYQNLDKKQFYSQILQFSSFLILISFLLFGF + NLLIVTDPNAKYIYNMTIISMIVTNLRMLFVYILQMTNRLKDSSIILISDRVIYIFLL + FLFIIFKWHEYKVMIWADVLGRTFSLLLSFWICKDIVFQSLSEFILDLRESFDNIRVG + INLMLSNIASSMIIGIVRMGIQWNWNIETFGKVSLTLSISNLLMTFINAIGLVVFPLL + KRTKTENLSKIYSNLRNVLMLIMFAILLFYYPLKIILDLWLPAYRDALIFMALIFPMS + IYEGKMALVINTYLKALRMERDILKINTLIMLFSMFVTLITTLLLNNLELTVISIVVL + LALRSIIAELILSKKLDISVEQDIVLELLMTIIFISSSWYLPIWLAVIVYLLAYTLYL + YLKRKDTKMYIEYFRKKIFE" + gene 12303..13172 + /gene="rmlA" + CDS 12303..13172 + /gene="rmlA" + /note="glucose-1-phosphate thymidylyltransferase" + /codon_start=1 + /transl_table=11 + /product="RmlA" + /protein_id="ADQ39188.1" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLPRFKELLQDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFIGDDSV + ALILGDNIYHGPGLSKMLQKAAKKEKGATVFGYHVKDPERFGVVEFDTDMNAISIEEK + PEYPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLTLAQPLKKN + EYGQYLLRLIGEA" + gene 13173..13769 + /gene="rmlC" + CDS 13173..13769 + /gene="rmlC" + /note="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase" + /codon_start=1 + /transl_table=11 + /product="RmlC" + /protein_id="ADQ39189.1" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKNHPLLKDVKPLKKEDLE" + gene 13779..14828 + /gene="rmlB" + CDS 13779..14828 + /gene="rmlB" + /note="dTDP-D-glucose 4,6-dehydratase" + /codon_start=1 + /transl_table=11 + /product="RmlB" + /protein_id="ADQ39190.1" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPDVHVTVLDKLTYAGN + RANIEEILGNHVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAAD + 
AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVESNYAKTQEIITV" + gene 14894..15745 + /gene="rmlD" + CDS 14894..15745 + /gene="rmlD" + /note="dTDP-4-keto-L-rhamnose reductase" + /codon_start=1 + /transl_table=11 + /product="RmlD" + /protein_id="ADQ39191.1" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAKMDITNEEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" +ORIGIN + 1 cactgcggct aaagaagtac ttgaaaaacg ggtcttggct ccatgggatg ctttctgtgt + 61 ggaattacta taaatatttt ttgcagaaaa atttaaaatt gaaatcgtat aaaaacaagg + 121 gaggactgta taaaaggcag aaatcctttg ttttttataa ccaaggttta taaaccttca + 181 ttctcgaaat tcaattaact ttacaaattc ccactattaa ggagaaagaa gacgaacata + 241 aagaagcgta tccttagtgc aggcctgact tttacatctg ctttgctttt agctgcttgc + 301 ggccaatcag gttcagatac aaaaacttac tcatcaacct ttagtggaaa tccaactaca + 361 tttaactatc tattagacta ttacgctgat aatatagtca attgaaacaa gaacaagaca + 421 aaagagcctc ataaaaggta ttgcaacttg gtaatacctt ttacgaggct ttttgatgtg + 481 agcccatgtt ttctcaatag gattgtactc aggtgagtag ggaggaagaa ggtaaaagtt + 541 tatgcccaaa ctcttcgcat aaaagttcta gcttccccag tctatggaat cttacattat + 601 ccataataat aaccgatgat gtgtttaatg ttggtaagag aaatttttga aaccaagctt + 661 caaaaaagtc gctcgtcatc gtctcttcgt aagtcattgg agcgattaac tcaccatttg + 721 ttagacctgc aaccaaagaa atcctctgat atcttcttcc agatactttg cctcttctta + 781 actgaacttt taatgagcga ccatattctc gataaaaata aatatcgaat cctgtttcgt + 841 caatctaaac aggtgctagg tgctttaaac tattaaaatt cttaagaaat aaggctactt + 901 tttctgggtc ttgttcataa ttagattgaa actagaatag tacacctctg cttctaaaac + 961 attgttagaa atcgatttga ctgtcctgat tgatttgtca tgttcttatt tcattttact + 1021 atatttttgt ttcgcgggaa gtctactaag atacttaaag atgcagatag tgaaaaaagg + 1081 tgtagacatt accgtaaaaa agtgatacaa ttgtatgatg ttcaatgtat aggtgttaat + 1141 catgagtaga cgttttaaaa 
aatcaggttc acagaaagtg aagcgaagtg ttaatatagt + 1201 tttgttgact atttatttat tgttagtttg ttttttattg ttcttaatct ttaagtacaa + 1261 tatccttgct tttagatatc ttaatctagt ggtaactgcg ttagtcctac tagttgcctt + 1321 ggtagggcta ctcctgatta tctataaaaa agctgaaaaa tttactattt ttctgttggt + 1381 gttctctatc cttgtcagct ctgtgtcgct ctttgcagta cagcagtttg ttggactgac + 1441 caatcgttta aatgcgactt ctaattactc agaatattca atcagtgtcg ctgttttagc + 1501 agatagtgag atcgaaaatg ttacgcaact gacgagtgtg acagcaccga ctgggactga + 1561 taatgaaaat attcaaaaac tactagctga tatcaagtca agtcagaata ccgatttgac + 1621 ggtcgaccag agttcgtctt acttggcagc ttacaagagt ttgattgcag gggagactaa + 1681 ggccattgtc ttaaatagtg tctttgaaaa tatcatcgag tcagagtatc cagactatgc + 1741 atcgaagata aaaaagattt ataccaaggg attcactaaa aaagtagaag ctcctaagac + 1801 gtctaagaat cagtctttca atatctatgt tagtggaatt gacacctatg gtcctattag + 1861 ttcggtgtcg cgatcagatg tcaatatcct gatgactgtc aatcgagata ccaagaaaat + 1921 cctcttgacc acaacaccac gtgatgccta tgtaccaatc gcagatggtg gaaataatca + 1981 aaaagataaa ttaacccatg cgggcattta tggagttgat tcgtccattc acaccttaga + 2041 aaatctctat ggagtggata tcaattacta tgtgcgattg aacttcactt cgtttttgaa + 2101 attgattgat ttgttgggtg gaattgatgt ttataatgat caagaattta ctgcccatac + 2161 gaatggaaag tattaccctg taggcaatgt tcatcttgat tcagaacagg ctctcggttt + 2221 tgttcgtgag cgctactcac tagcagatgg cgatcgtgac cgtggtcgca accaacaaaa + 2281 ggtcattgta gcaattatta agaagttaac ttctacagag gttttgaaaa actatagtag + 2341 tattcttcaa ggattgcagg attctcttca aacaaatatg ccgattgaga ctatgataga + 2401 tttagtgaat actcagttgg aaagtggggg ggattataaa gtaaattctc aagatttaaa + 2461 agggacaggt cggatggatc ttccttctta tgcaatgcca gacagtaacc tctatgtgat + 2521 ggaaatagat gatagtagtt tagctgtagt taaagcagct atacaggatg tgatggaggg + 2581 tagatgaaat gatagacatc cattcgcata tcgtttttga tgtagatgac ggtcccaagt + 2641 caagagagga aagcaaggct ctcttggcag aagcctacag acagggggtg cgaaccattg + 2701 tctctacctc tcaccgtcgc aagggcatgt ttgaaactcc ggaagagaag atagcagaaa + 2761 actttcttca ggttcgggaa atagctaagg aagtggcgag 
tgacttagtc attgcttacg + 2821 gggctgaaat ttactacaca ccagatgttc tggataagct gggaaaaaag cggattccga + 2881 ccctcaatga tagtcgttat gccttgatag agtttagtat gaacactcct tatcgcgata + 2941 ttcatagcgc cttgagcaag atcttgatgt tgggaattac tccagtcatt gcccacattg + 3001 agcgctatga tgctcttgaa aataatgaaa aacgcgttcg agaactaatc gatatgggct + 3061 gttacacgca agtaaatagt tcacatgtcc tcaaacccaa actttttggc gaacgttata + 3121 aattcatgaa aaaaagagct cagtattttt tagagcagga tttggtccat gtcattgcaa + 3181 gtgatatgca caatctagac ggtagacctc ctcatatggc agaagcatat gaccttgtta + 3241 cccaaaaata cggagaagcg aaggctcagg aactttttat agacaatcct cgaaaaattg + 3301 taatggatca actaatttag gagaaatgat gaaagaacaa aacacgatag aaatcgatgt + 3361 atttcaatta tttaaaacct tgtggcaacg caagctaatg attttattag tggcacttgt + 3421 gacaagtgcg ggggcttttg catatagcac ttttattgtt aagccagaat atacgagtac + 3481 cacgcgaatt tacgtagtga atcgcaatca aggagacaag tcggggctga caaatcagga + 3541 tttgcaggca ggaacttatc tggtaaaaga ctaccgtgag attatccttt cgcaggatgc + 3601 attggaaaaa gtagcgacaa atttgaagtt ggatatgcca gcaaaaacgt tagccagcaa + 3661 agttcaagtg gctgtgccag ctgacactcg tatcgtctca atctctgtca aggataaaca + 3721 gccagaggaa gccagtcgta tcgctaattc tctacgagaa gttgctgcag aaaagatcgt + 3781 cgctgtaacg cgagtatctg atgtaacaac acttgaagaa gcgcgaccag ctacgactcc + 3841 ctcttctcca aatgttcgac gcaattcctt gtttggtttt cttggaggag cagtcgtaac + 3901 agtaattgct gttcttttga ttgagttgct cgacacccgt gtgaaacgtc ctgaagatgt + 3961 tgaagatgta ctgaaaattc cacttttagg gctcgttcca gattttgaca aaataaaata + 4021 ggaggaagtt atgccaacat tagaaatctc acaggcaaaa ttggattctg taaaaaaggc + 4081 agaggaatat tataacgctt tgtgcacgaa cctacagtta agtggagatg gtttgaaagt + 4141 attttctatc acttctgtga aactaggaga aggaaaatca acgacttcca ccaatatcgc + 4201 ttgggctttt gcgcgtgcag gttacaaaac gctgctgatt gatggagata ttcgcaattc + 4261 tgttatgtta ggtgtcttta aagcaaggaa taagattaca ggcctgacag aatttttatc + 4321 aggaactaca gacctatcac aagggctttg tgataccaat atcgaaaatc tctttgtaat + 4381 tcaggctggc tctgtgtcac cgaatccgac agctcttctt caaagtaaga atttcactac + 4441 
aatgcttgaa accttgcgta aatattttga ctacatcatt gtagatactg ctcctgttgg + 4501 tgtcgtgatt gatgcggcta ttattacgcg aaactgcgat gcttctattt tagtgacgga + 4561 ggcaggtgaa ataaatcgac gggatattca aaaagcaaaa gaacagttgg aacacacagg + 4621 aaagccgttt ttgggaattg tgttgaataa attcgatact tcagtagaca aatacggttc + 4681 ttatggaaat tatggaaatt acgggaaaaa taaaaaatag gtcaggggat agagatgaat + 4741 ggaaaaatat taaggtcttc attggccata atccagagtt ttcttgttat tttattgact + 4801 tatctactta gtgctgtgag agaaacggag attgtttcaa caacagctat tgcactttat + 4861 atcctccatt attttgtctt ttatatcagt gattatggac aggatttctt taaaaggaaa + 4921 tatttgattg aacttgtcca gacattgaaa tatatcctat tctttgcact agcgattagt + 4981 atttctaatt ttttcttaga ggatcgattt agtatttcca gacgaggcat gatttacttc + 5041 ctcacattac atgctctctt aatctatgtg ctaaacctat ttatcaagtg gtattggaag + 5101 cgggcttatc ccaactttaa aggaagtaag aagattctcc tacttacagc aacttctcgt + 5161 gtcgaaaagg tactggatgg attaatagaa tcaaatgagg ttgttgggga gttggtagcc + 5221 gtcagtgtct tagataaacc agattttcag catgattatt taaagatagt agcagagggg + 5281 gagatagtaa actttgcgac tcatgaggtg gtcgatgaag tctttatcaa tcttccaagt + 5341 gaaaaataca atattggaga gcttgtctct cagtttgaaa cgatgggaat tgatgtaaca + 5401 gtcaatctaa atgcttttga tcgtagtttg gcacgtaaca agcaaattcg taagatggca + 5461 ggattaaacg ttgtgacttt ttctacaaca ttttataaga ctagtcatgt aattgctaag + 5521 cggattattg atatcgtggg tgcattggtc gggttgatat tatgtggttt agtcagtatt + 5581 gtactggttc ctttgattcg aaaggatggg ggctctgcta tttttgctca gacgcgtata + 5641 ggaaaaaatg gtcgtcagtt cactttttat aagtttcgct ctatgtgtgt agatgccgag + 5701 gcgaaaaaaa gagaactcat ggaacaaaat accatgcagg gtggaatgtt taaggtggac + 5761 gatgatcctc gtatcacgaa aattggttgt tttatacgga agactagctt ggacgagcta + 5821 ccacagtttt ataatgttct aaagggagat atgagtttgg ttggcacacg gccaccaaca + 5881 gtggatgagt atgaacacta taccccagaa caaaaacgtc ggctaagttt taaacctggt + 5941 ataacaggct tatggcaggt cagtggacga agtgaaatca aaaatttcga tgaagttgtc + 6001 aaattagatg tggcttatat agatgattgg acaatctgga aagatattga aattttattg + 6061 aagacagtta aggtagtatt 
gatgaaggat ggagccaaat agggggatat gttcatgaaa + 6121 ttgcttcatt ttagtgaagt tggcggtgga gttgataggt atattaagtt atatttaaaa + 6181 tattcagata aagaacattt taaaaatatt gtggtaggat cagatcagct taatagacaa + 6241 acatatgaac aagaatataa tataaagttt tatcacattg atatctatag aagcttgtct + 6301 ccaataaagc ttttacgcgc gattaaacaa tttagaaaaa tattgtatct agaaagacct + 6361 gatatagtat atctgcacag tacttttgca ggtgtagtag gcaggttagc ttctatgggt + 6421 ttgtcgtgta aagtagtata caatcctcac ggatggtctt ttaagatgga tgtttctaag + 6481 attaagcaat tcgtttataa aaatattgaa aagtttttgt cttatcttac agataagtat + 6541 atattaatct ctaaatctga atatgaagcg gctcaatctt taaaaatacc ccttaagaaa + 6601 ttgactttag tgtataatgg agtagagatt gatgaagatt ttaacgaaaa tcaaataaac + 6661 gttttattac ccataaataa atatgttatt gggatgattg gtcgtattag tgaacagaaa + 6721 aatcctttct tttttgttga atttgcaaaa aaattatcag agatttatag caatttatat + 6781 tttgttattg tcggcgatgg cgaattgcgt gggcgaactg aagaactaat tgaagagtat + 6841 gggcttcgaa gctcattttt tataacaggg tgggtggata atccagagga ttatttagct + 6901 cagttcaatc aggcagttct tttctcgaaa tgggagggct ttggattggc ggttgcggaa + 6961 tatatgaaac ataagaagcc aattcttata actaatgttg atgggatgtc agaattggtt + 7021 attgatggtg agtcaggttt taaagtccca ctatataatt tagaagtaac tgtagataga + 7081 agtagaagta ttattgagaa tagagaacta gccaatgagt taggtagtgc tgctttccaa + 7141 agagttcgat ctacatttga aataaaagaa aaagtgtcag agttagagaa tatattcatg + 7201 agtttaagag gggatgataa tgtcaatata taaactttgt aaagatattg aaagaaaaac + 7261 tatgtcgcct gctaaaaaag caatggctaa aaacgactat tttgcatttt atgttggaag + 7321 acctttatcc tatcttttaa cagttccttt cgtgaaaaca aatattactc ccaatcaaat + 7381 atcttattta tctataattc ctttgattgt tggatttata ataatgatat ttacaactga + 7441 tttcgttgta ttattactgg catggtttct atttttttta tggaacttac tagatggagt + 7501 agatgggaac ttagccagat atcgggagca atactcgaag gatggaagtg tagtagatgc + 7561 aatggctggc tatgtagcca tggtgttgac gtatttcggt gcaggaatag tagctgctca + 7621 tttaaacgac tcagatatct atataatttt gggtgcatta tctgggattt cattgatttt + 7681 tccaaggtta gtgatgcata agtatatcaa tacagtagct 
caagatgagt ctgtgagtag + 7741 cattaaagat aaatctgatt ttaatactat aaaaatactg gctctaaaca tgacatcaat + 7801 tacaggaatt ccgcaggttt tactgctatt aactatttta acaaatcagt gggtactttt + 7861 tactttagta tatttcacga ttaatttttt attaatgata ttttctttgt attcattatt + 7921 caaaaaggag aatgtttaga aatgggaaag tcagttgcaa ttttaatgac cacctataat + 7981 ggtgagcgat atttgtcaca acagattgat agtattaggt ctcaaacatt cactaattgg + 8041 acgcttttta ttagggatga tggatcaaaa gataaaacaa tagaagtaat acagaggtat + 8101 tctaagatag atgatagaat tagattagtt gaaaatccct caaagtttca tggagcttat + 8161 tacaattttt ttaatctaat tgaatacgtt aaaaacaatt atcaatttga ttattacttt + 8221 ttttgtgatc aagatgatat ttggaaagag cacaagttag aaatacagct gttaagattt + 8281 tctaaagatg acatgccaga gatggtttac tctgatctgt caacgattga tgccagtaat + 8341 aatttgatag atattagtat aaataaaata atggggattg aattaccgaa cataaataat + 8401 ttgtatttta ttcatgccta tatctggggg tgtactgcag gttttaatca tgcattgcta + 8461 gagatggttc cttcagttga tattgataaa gattatttat atatagaaaa actgtctcat + 8521 gataattatt ttgcaaagtt tgcactagag tatgggaagg tgttgttctg ccctgagcaa + 8581 ctggtcttgt atcgaagaca tggacataat gtaacaacta gtcatcattt taaattatct + 8641 ccgctaaatg ttttcagaaa ggctatattg ggtttcaatg aattggcact tacacatgct + 8701 ggggtatata atcaaactct ttatatgcta aaaaaagctt ctggaaaaaa tcctttaagt + 8761 gatagactac ttgaaattca ggaagtaatc aaaattggag gattaaaagg tgtgagatat + 8821 ttctatcaga atcgaatttc tcgaaagcaa ctcgtaagaa caatcggctt atataccatc + 8881 atgctttttg ggacctataa aaaatatatt atgaaagaac tcttataatg cttttaaatt + 8941 tcttattcat atctattttt ctattaatta ttattacatt tatattattt gagggggatt + 9001 tttttcaacc tgcagtaatt ttaacaatcg cttattttat ttcgattgca agtgctctag + 9061 ttaatagaaa tgtttgggga acagaactcc atttcaaaac cttttatttg atattgttag + 9121 gggttgctac atttgttata gtttccttgt tgacaaaatt gtcgtacagg cctaaagtgg + 9181 agggaatttc gcatgaagaa ttgaaagaaa taaatccttc aaagataatc tatgtcattc + 9241 ttctgactct aaatcttgtt atgttatttc tttatatccg tgaaattcag aaagtagtat + 9301 tgttttcagg tagaagtttt tctaatatta cagatttgat aagtaactat aggtacctat + 9361 
cttattattc aaatgaagta gaaaatcgtg taagtggaat gattaatcaa ctatctaaaa + 9421 ttattccagc gactacactt atttctttat atatatttat gaataattat tttataacta + 9481 aacaaataaa gaaaaatttc atttatttga ttccaatagc tatattcttt gtctatgcaa + 9541 tcattagtgg tggtagattg ccccttataa ggttagttgt tggatctctg ttgatattgt + 9601 atatatactc tgtgtacggg agtcctaaat ctcaacttac caaaagtttt aaaatgatca + 9661 ctcgctctct gtttacattt cttattttga tagttttatt ctttctttta aaatttgtat + 9721 tagggcgctc ctctcaggaa gattttatca gttacatcac tcgttatatg ggaggttcaa + 9781 ttcaactatt tgatttattt gttatagatc cgatacgacg taacaaagaa ctaggtgcag + 9841 aaactttttc gggaatttat gagatgcttg caaaattagg atttgacaat aatattataa + 9901 aaggcttaga atggagagtg tctcctaatt attattcttt agggaatgtg tatactgcaa + 9961 ttagacgtta ttattcagac tttggtgtaa ttggtattgt aatttgtcag agttttacag + 10021 cgtggttata tactttaggt tatgaaaaag ttagacatta ttctttagtt acaaatgttc + 10081 aaagatttag gttgatccta ttagcagctt cattttatcc aatattttta aatggtatcg + 10141 aggatgtgtt ttatatttca atggttacca ttggatatgg aatacaaatt gttatctttt + 10201 atctggtctt ttgggttctt ctgaaagttc aggttgactt taacaaaggt aaattaacga + 10261 taaatagatg aatttagcgc taatgtattg agtcatataa agggatatat ttgggaggta + 10321 ttttaattgg aggaagagag tcttgaatgg gaagtacata tcttctgaaa tattttttag + 10381 gtggggagta tagctatgaa attgaagttt cttataacaa atttgtttca tgtctttttg + 10441 tctaatctga ttacaattgt cacatcggtt atagttgtac taatcttacc aaaaattatg + 10501 ggagtaactg agtatagtta ttggcaacta tatatttttt acctaacata tattggtttt + 10561 tttcatctgg gttggattga tggaatttat cttaaatatg gtggattaga gtaccagaat + 10621 ttagataaga aacagtttta ttctcaaata cttcaatttt ccagtttttt aattttaatt + 10681 tcttttctat tatttggttt taacttattg attgtgacag atccaaatgc aaaatatatt + 10741 tataacatga ctattattag tatgatagtt acaaatttaa gaatgttatt cgtttatatt + 10801 ttgcagatga caaatcgatt aaaggatagc tctataattc tgataagtga tcgcgttata + 10861 tatatttttc ttttatttct gtttattata tttaaatggc atgaatacaa ggtaatgatt + 10921 tgggcggatg ttttaggaag gacattttct ctcctacttt ctttttggat ttgtaaagat + 10981 attgtttttc 
aatccttatc cgagttcata ttggatctga gagagtcttt tgacaatatc + 11041 cgtgttggaa tcaatttaat gttatccaat attgcaagta gtatgattat tggtattgtt + 11101 cgaatgggaa ttcaatggaa ttggaatatc gaaacattcg ggaaagtatc actgacgcta + 11161 agcatctcta atttattaat gacttttatt aatgcgattg gtttagttgt ctttcctttg + 11221 ttaaaacgga caaaaacgga aaatttatct aaaatttatt ccaacttaag aaatgttttg + 11281 atgctgatca tgtttgcaat attgctcttt tattatcctt taaaaattat tctagatctt + 11341 tggttgccag cttatcggga tgcgttgatt tttatggctc ttatttttcc tatgtcaatt + 11401 tatgaaggga agatggcctt ggtgattaat acatatttaa aggcgctaag gatggaaaga + 11461 gatattctca aaataaatac tttgattatg ttgttcagta tgtttgttac cctaataact + 11521 actctattat taaataattt agagctaacg gttatatcta tagttgtttt gctagcttta + 11581 cgtagtataa tagcagaact aattctatct aaaaaacttg atatatcagt tgagcaagac + 11641 attgtgttag aattacttat gacaattata tttatttctt caagttggta cttaccgatt + 11701 tggctcgcag taatagttta tttgttagcg tatactttat acttgtatct aaagcgtaaa + 11761 gatacaaaaa tgtatataga atattttaga aagaaaatat ttgaataaaa agaactatat + 11821 atcagttaga tggcaaattc tatttttacc tttttgtcgt ttaatagaaa atgataaaaa + 11881 atatgatact attttttaca catatttata agcgatttga atgtatcagg tgataaatta + 11941 atttaaaata agaatagttt ctggaacatt gctattagtg ggaacaggtt acgaaataat + 12001 ttatcaattt taaagacgtt tttttaaata taaaataatg gattttgtca acaattctaa + 12061 attctaatag gaatgataat gctagaaaat cagattgttc atttttcaag gaagtttatt + 12121 tttaaaataa tatatcttta agtaagaatt attttattag acttaaccta gcctatcagt + 12181 taaattagaa tatcaacttt gattaattaa aaattagcaa aatttattga cattttgttt + 12241 ttataaattg cgataaaggt ctaattctga atttcagtga atataagaaa gggatcctac + 12301 taatgaaagg tattattctt gcaggtggtt cggggacacg attatatcct ttgactcggg + 12361 ctgcatcaaa acaacttatg ccggtttatg ataaacccat gatttactat ccactttcaa + 12421 cattgatgtt ggctgggatt agggatattt tgataatctc aactcctcaa gatttgcctc + 12481 gttttaaaga gcttcttcaa gacggatctg agtttgggat taaactttct tatgcagagc + 12541 aaccaagtcc agatggtttg gcacaagcct ttatcattgg ggaagagttt attggtgatg + 12601 atagcgttgc 
tttgatcttg ggggacaata tctatcacgg ccctggtttg agcaaaatgc + 12661 ttcaaaaagc agccaagaaa gagaaaggtg cgactgtctt tggctaccat gtcaaggatc + 12721 cagagcgctt tggtgtggtt gagtttgata cagacatgaa tgctatttcc atagaagaaa + 12781 aaccggagta tcctcgctcc aactatgcag ttacaggtct ctatttctat gataatgatg + 12841 tagtagagat tgccaaaagt ataaaaccaa gccctcgtgg tgaactggaa attacagatg + 12901 taaacaaagc ttacctagat cgtggtgatt tgtctgttga gcttatggga cgtggctttg + 12961 cttggctgga tactggaact catgaaagtt tactagaggc ttcacagtac atcgaaacag + 13021 tgcaacggat gcaaaatgtt caggtagcaa acttagaaga aattgcctat cgcatgggtt + 13081 atatcagtcg tgaagatgta ttgaccttag cccaaccact taagaaaaat gaatacggac + 13141 agtatctgct ccgtttgatt ggagaagcat agatgacaga taattttttc ggtaagacgc + 13201 ttgcggcacg caaggttgaa gctattccag gcatgttgga gtttgatatc cccgttcatg + 13261 gagataatcg tggctggttt aaagaaaatt tccaaaagga aaaaatgctt ccacttggat + 13321 ttccagagtc tttctttgca gaaggaaaat tgcaaaacaa tgtatccttc tcacgtaaaa + 13381 atgtccttcg agggctccac gcagagcctt gggataagta catctctgta gcagatggag + 13441 ggaaagttct gggttcttgg gttgatctac gcgagggtga aacctttggg aatacctatc + 13501 agacagtaat tgatgcaagc aagggaatct ttgttcctcg aggcgtagct aatggcttcc + 13561 aagttctatc agatacagtg tcatatagct atctggtcaa tgattactgg gcgcttgaac + 13621 tcaaacccaa gtatgccttt gtgaactacg ctgatccaag ccttggtatt gaatgggaaa + 13681 atattgcaga agcagaggtt tcagaagcag ataaaaatca tccactactt aaggatgtaa + 13741 aacctttgaa aaaagaagat ttggaataag gaaagaatat gactgaatac aaaaatatta + 13801 tcgtgacagg tggagctggc tttatcggtt ctaactttgt ccattatgtt tacgagaact + 13861 ttccagatgt tcatgtgaca gtcctagata agttgactta tgctggaaac cgcgcgaata + 13921 ttgaggaaat tttaggtaat catgttgagt tagttgttgg tgacattgct gatgcggagt + 13981 tggtagacaa gttggctgct caagcagatg ctatcgttca ttatgcagcg gaaagccaca + 14041 atgataattc gctcaatgat ccatcgccat ttattcatac taacttcatt ggaacctata + 14101 ctcttttaga agctgctcgt aagtatgata ttcgcttcca ccatgtatcg acagatgaag + 14161 tttatgggga tctcccttta cgcgaagatt tgccaggtca tggagaaggg ccgggtgaga + 14221 aatttacggc 
tgaaaccaag tacaatccaa gctcgcctta ctcatcaacc aaggcagcct + 14281 cagatttgat tgtcaaagcc tgggtgcgtt cttttggagt caaggcaacg atttccaact + 14341 gttcaaataa ctacggtcct taccagcata ttgagaagtt tattccacga caaatcacca + 14401 atatcttgag cggtatcaag ccaaaacttt acggtgaagg taagaacgtt cgtgattgga + 14461 ttcataccaa tgaccattct tcaggagttt ggacaatctt gacaaaaggg caaatcggtg + 14521 aaacctactt gattggggct gatggtgaga agaacaataa ggaagttttg gaacttatcc + 14581 ttaaggaaat gggacaagct gcggatgcct atgatcatgt gactgaccgt gcaggacatg + 14641 accttcgcta tgcgattgat gctagcaagc tccgtgatga gttggggtgg aaacctgaat + 14701 ttaccaactt tgaagctggg ctcaaggcaa caatcaagtg gtatacagat aaccaagaat + 14761 ggtggaaagc agaaaaagaa gctgttgaat ccaattatgc taagactcag gagattatta + 14821 cagtataaaa agcaggaaat agctgctttt tattgctata ttgggaagag ttacatatta + 14881 gaaaggtcta gagatgattt taattacagg ggcaaatggc caattaggaa cggaacttcg + 14941 ctatttattg gatgaacgta atgaagaata cgtggcagta gatgtggcta agatggacat + 15001 taccaatgaa gaaatggttg agaaagtttt tgaagaggtg aaaccgactt tagtctacca + 15061 ttgtgcagcc tacaccgctg ttgatgcagc agaggatgaa ggaaaagagt tggacttcgc + 15121 catcaatgtg acggggacaa aaaatgtcgc aaaagcatct gaaaagcatg gtgcaactct + 15181 agtttatatt tctacggact atgtctttga cggtaagaaa ccagttggac aagagtggga + 15241 agttgatgac cgaccagatc cacagacaga atatggacgc actaagcgta tgggggaaga + 15301 gttagttgag aagcatgtgt ctaatttcta tattatccgt actgcctggg tatttggaaa + 15361 ttatggcaaa aacttcgttt ttaccatgca aaatcttgcg aaaactcata agactttaac + 15421 agttgtaaat gatcagtacg gtcgtccgac ttggactcgt accttggctg agttcatgac + 15481 ctacctagct gaaaatcgta aggaatttgg ttattatcat ttgtcaaatg atgcgacaga + 15541 agacacaaca tggtatgatt ttgcagttga aattttgaaa gatacagatg tcgaagtcaa + 15601 gccagtagat tccagtcaat ttccagccaa agctaaacgt ccgctaaact caacgatgag + 15661 cctggccaaa gccaaagcta ctggatttgt tattccaact tggcaagatg cattgcaaga + 15721 attttacaaa caagaagtga gataagtagt agaatgattt tctagtctaa taaaagaggc + 15781 agagaatgaa ctccaaagga gcataagatg tacgattatc ttatcgttgg tgccggtctt + 15841 tttggtgcag 
gatttgccat gaatcagcct aaaaggaaaa aagaaaagtt atggaaaacg + 15901 aatcatattg cggtaatatc tatcctcgtg aag +// + diff --git a/public/res/serotype_genbank/serotype_6E_6B.gb b/public/res/serotype_genbank/serotype_6E_6B.gb new file mode 100644 index 0000000..43e6ba3 --- /dev/null +++ b/public/res/serotype_genbank/serotype_6E_6B.gb @@ -0,0 +1,569 @@ +LOCUS LT594599 15725 bp DNA linear BCT 06-JUL-2016 +DEFINITION Streptococcus pneumoniae capsular locus (cps) operon, strain 6E. +ACCESSION LT594599 +VERSION LT594599.1 +DBLINK BioProject: PRJEB14267 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 + AUTHORS Kapatai,G., Sheppard,C.L., Al-Shahib,A., Litt,D.J., Underwood,A.P., + Harrison,T.G. and Fry,N.K. + TITLE Whole Genome Sequencing of Streptococcus pneumoniae: Development, + Evaluation and Verification of Targets for Serogroup and Serotype + Prediction using an Automated Pipeline + JOURNAL Unpublished +REFERENCE 2 (bases 1 to 15725) + AUTHORS Underwood,A. + TITLE Direct Submission + JOURNAL Submitted (20-JUN-2016) PHE, 61 Colindale Avenue, London NW9 5EQ, + UNITED KINGDOM +COMMENT This sequence is a consensus sequence extracted from a multiple + alignment of cps loci from 12 6E isolates. The cps loci were + extracted from genome assemblies of the 12 isolates using the cps + locus from 6B (CR931639). For detail description see the + associated publication. 
+FEATURES Location/Qualifiers + source 1..15725 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="6E" + /serotype="6E" + /db_xref="taxon:1313" + operon 1..15725 + /operon="capsular locus, cps" + /note="nucleotide blast analysis using this sequence + returns a number of 6B capsular gene locus and complete + genome sequences that following molecular analysis would + probably be identified as 6E" + gene 1..1446 + /gene="wzg" + /operon="capsular locus, cps" + CDS 1..1446 + /gene="wzg" + /operon="capsular locus, cps" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="SBT85374.1" + /translation="MSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVATAFVLLVALIGLLSIIYKKAEKFTIFLLVLSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSLSVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNIDLT + VNQSSSYLSAYRSLIAGETKAIVLNSVFENIIESEYPDHASKIKKIYTKGFIKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGVDVYNDQ + EFTALANKKHYSIGNVHLDSEEALAFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EVLKNYSTIIDSLQDSIQTNMPLETMINLVNAQLESGGTYKVNSQDLKGRGRTDLPSY + AMPDSNLYVMEINDSSLASVKTAIQDVLEGR" + gene 1448..2179 + /gene="wzh" + /operon="capsular locus, cps" + CDS 1448..2179 + /gene="wzh" + /operon="capsular locus, cps" + /codon_start=1 + /transl_table=11 + /product="tyrosine protein phosphatase Wzh" + /protein_id="SBT85375.1" + /translation="MIDIHSHIVFDVDDGPKSREESKALLTEAYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLENNRIPTLNNS + RYALIEFSMNTPYRDIHSALNKILMLGITPVIAHIERYDVLENNEKRVRELIDMGCYT + QINSSHVLKSKLFGEPYKFMKKRAQYFLERDLVHIIASDMHNVDGRPPHMAEAYDLVS + QKYGEAKAQELFIDNPRKIVMDQLI" + gene 2185..2880 + /gene="wzd" + /operon="capsular locus, cps" + CDS 2185..2880 + /gene="wzd" + /operon="capsular locus, cps" + /note="putative regulatory protein" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="SBT85376.1" + 
/translation="MMKEQNTIEIDVFQVLKTLWKHKLIILLVALVTGAGAFAYSTFI + VKPEYTSTTRIYVVNRNQEGKSGLTNQDLQAGTYLVKDYREIILSQDVLEKVATNLKL + DMPAKALTSKVQVTVPTDTRIVSISVKDKEPEEASRIANSLREVAAGKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNTLVGFLGGAVVTVITVLLIELLDTRVKRPEEVEEVLQV + PLLGVVPDLDKMK" + gene 2890..3570 + /gene="wze" + /operon="capsular locus, cps" + CDS 2890..3570 + /gene="wze" + /operon="capsular locus, cps" + /codon_start=1 + /transl_table=11 + /product="tyrosine protein kinase Wze" + /protein_id="SBT85377.1" + /translation="MPTLEISQVKLELAKKAEEYYNALCTNLQLSGDDLKVFSITSVK + PGEGKTTTSTNIARAFARAGYKTLLIDADMRNSVMSGVFKSRERITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSRNFSTMLETVRKYFDYIVVDTAPVGVVI + DAAIITQKCDASILVTKAGETKRRDIQKAKEQIEQTGKPCLGVVLNKFDTSVDEYGSY + GSYGKKKK" + gene 3585..4952 + /gene="wchA" + /operon="capsular locus, cps" + CDS 3585..4952 + /gene="wchA" + /operon="capsular locus, cps" + /codon_start=1 + /transl_table=11 + /product="galactosyl transferase WchA" + /protein_id="SBT85378.1" + /translation="MNGKLVKPSLAIVQSFLVILLAYLLSTVRETEIVSTTAIVLYIL + HYFAFYISDYGQDFFKRGYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYF + LLLHVFLVYVLNRFIKWYWKRAYPNFKGSKKILLLTATSRVEKVLDRLIESDDVVGEL + VAVSVLDKPDFQHDYLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + VDVTVNLNAFDCILAHNKQICEMAGLNVVTFSTTFYKTSHVIAKRVIDIIGSLVGLIL + CGLVSIVLVPLIRKDGGSAIFAQTRIGKNGRHFTFYKFRSMCVDAEEKKRELMEQNTM + QGGMFKVDEDPRITKIGHFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYIDGWTIWKDIEILLKTVKVVLM + KDGAK" + gene 5081..6025 + /gene="wciN" + /operon="capsular locus, cps" + CDS 5081..6025 + /gene="wciN" + /operon="capsular locus, cps" + /codon_start=1 + /transl_table=11 + /product="glycosyl_transferase wciN" + /protein_id="SBT85379.1" + /translation="MDIVYATDNNFVDVLSASIKSLYTTNSDLDLNLWIIADKVSDRN + KEKINRLSKQFAQREINWIENVEIPFKLHLDRGSISSFSRLFLGSVLPSSMSKVLYLD + SDIIVMDSLRSILDIDFKDKILYGVNDTFNKEYKQVLGIPIDKPMFNAGVMLINLELW + RNNNVEEKFLQVIQKFNGTILQGDLGVLNAVLYNSFGVLPPEYNYMTIFEDLTYEEMI + 
VFKKPINYYSKEEIKNARERIVLRHFTTCFLSLRPWQENSEVAHVEIFKKYYRGTYKQ + VSPSKLSRIYKILPKKMSLYLLGFIQSKVRPKLYRILK" + gene 6062..6619 + /gene="unknown" + /operon="capsular locus, cps" + CDS 6062..6619 + /gene="unknown" + /operon="capsular locus, cps" + /note="high similarity with cps6bQ and other + lipopolysaccharide cholinephosphotrasferases" + /codon_start=1 + /transl_table=11 + /product="putative lipopolysaccharide + cholinephosphotrasferase" + /protein_id="SBT85380.1" + /translation="MKVQEKLKLLKEFIKICSKNKMKYFASGGSLLEAARYKGFIPWN + DDMALGLPRKHFEKFINEIDFEKYNKNYILESSEMNLGIFQYKLKSAILILGKSYDVC + LNLFLLDRMSELVIDGESGFKVPLYNLEVAVDRSRSIIENRELANELGSVAFQRVQSI + FEIKEKVSELENIFMSLGEDDNVNI" + gene 6600..7325 + /gene="wciO" + /operon="capsular locus, cps" + CDS 6600..7325 + /gene="wciO" + /operon="capsular locus, cps" + /codon_start=1 + /transl_table=11 + /product="CPD-ribitol phophotransferase WciO" + /protein_id="SBT85381.1" + /translation="MIMSIYKLYKDIERKTMSPAKKAMAKNDYFAFYVGRPLSYLLTV + PFLKTNITPNQVSYLSIAPLILGFLTMTFTTNFILLLLAWFLFFLWNLLDGVDGNLAR + YREQYSKDGSVVDAMAGYVAMVLTYFGAGIVATHLNGSDMYVILGALSGISLIFPRLV + MHKYINTVARNESVNNIKDKSNFSTIKLLALNMTSITGIPQVLLLVTILTNQWEFFTL + VYFTINFLLMIFSLYSLFKKENV" + gene 7328..8314 + /gene="wciP" + /operon="capsular locus, cps" + CDS 7328..8314 + /gene="wciP" + /operon="capsular locus, cps" + /codon_start=1 + /transl_table=11 + /product="glucosyl transferase WciP" + /protein_id="SBT85382.1" + /translation="MGKSVAILMTTYNGERYLSQQIDSIRSQTFTNWTLFIRDDGSKD + KTVEVIQRYSKIDDRIRLVENPSKFHGAYYNFFNLIEYVKNNYQFDYYFFCDQDDIWK + EHKLEIQLLRFSKDEMPEMVYSDMSTIDANNKLIDISINNIMGIELPNINNLYFIHAY + IWGCTAGFNHALLEMVPSVDIDKDYLYIEKLSHDNYFAKFALEYGKVLFCPEQLVLYR + RHGHNVTTSHHFKLSPLNILRKAILGFNELALTHAGVYNQTLYMLKKASEKSPLSDRL + LEIQEVIKIGGLKGVRYFCQNRISRKQLVRTIGLYTIMLFGTYKKYIMKELS" + gene 8314..9657 + /gene="wzy" + /operon="capsular locus, cps" + CDS 8314..9657 + /gene="wzy" + /operon="capsular locus, cps" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + 
/protein_id="SBT85383.1" + /translation="MLLNFLFIFIFLLIIITFILFEGDLFQPAVILTLAYFISIASAL + VNRNVWGTELHFKTFGLILLGVATFIIVSLLTKLSYKPKVEGISYKELKEINPSKIIY + GILLILNLVMLFLYIHEIQKVVLFSGRGFSNITDLISNYRYLSYYSNEVEDRVSGMIN + QLAKIIPATTFVSLYIFINNYFITKQIKKNFIYLIPIAIFFVYAIISGGRLPLIRLVI + GTLLILYIYSVYGSHKSQLTRSFKMITRSLFAFLMLIVLFFLLKFVLGRSSQEDFISY + ITRYMGGSIQLFDLFVIDPIRRNKELGAETFSGIYEMLAKLGFDNNIIKGLEWRISPN + YYSLGNVYTAIRRYYSDFGVIGIVICQSFTAWLYTLGYEKIRHHSLVTNGQRFRLILL + AASFYPLFLNSIEDVFYISMVTIGYGIQIVIFYLVFWVLLKVQVDFNKGKLRINR" + gene 9791..11203 + /gene="wzx" + /operon="capsular locus, cps" + CDS 9791..11203 + /gene="wzx" + /operon="capsular locus, cps" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="SBT85384.1" + /translation="MKLKFLITNLFHVLLSNLITILTSVIVVLILPKIMGVTEYSYWQ + LYIFYLTYIGFFHLGWIDGIYLKYGGLEYQNLDKKQFYSQILQFSSFLILISFLLFGF + NLLTVTDQNAKYIYNMTIISMIVTNLRMLFVYILQMTNRLKDSSIILISDRVIYVILL + FLFIIFKWHEYKVMIWADVLGRTFSLLLSFWICKDIVFQSLSEFILDLRESFDNIRVG + INLMLSNIASSMIIGIVRMGIQWNWNIETFGKVSLTLSISNLLMTFINAIGLVVFPLL + KRTKTENLSKIYSNLRNVLMLIMFAILLIYYPLKIVLDLWLPAYQDALIFMTLIFPMS + VYEGKMALVINTYLKALRMERDILKINTLIMLFSMLVTLITTLLLNSLELTVVSIVVL + LALRSVIAELILSKKLDVSVKKDIVLEFLLTIVFISSSWYLPIWPAVIVYLLAYTLYL + YLKRKDIKMYIEYFRKKIFE" + gene 11692..12561 + /gene="rmlA" + /operon="capsular locus, cps" + CDS 11692..12561 + /gene="rmlA" + /operon="capsular locus, cps" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="SBT85385.1" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIKDILIISTPQDLPRFKDLLLDGSEFGIKLSYAEQPSPDGLAQAFLIGEEFIGDDSV + ALILGDNIYHGPGLSKMLQKAAQKEKGATVFGYQVKDPERFGVVEFDTDMNAISIEEK + PENPRSNYAVTGLYFYDNDVVEIAKGIKPSARGELEITDINKAYLNRGDLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISCEDVLELAQPLKKN + EYGQYLLRLIGEA" + gene 12562..13158 + /gene="rmlC" + /operon="capsular locus, cps" + CDS 12562..13158 + /gene="rmlC" + /operon="capsular locus, cps" + /codon_start=1 + /transl_table=11 + 
/product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="SBT85386.1" + /translation="MSDNFFGKTLAVRKIDAIPGLLEFDIPVHGDNRGWFKENFQKEK + MEPLGFPESFFAAGKLQNNVSFSRKNVLRGLHAEPWDKYISVADDGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKNHPLLKDVKPLKKEDLE" + gene 13168..14217 + /gene="rmlB" + /operon="capsular locus, cps" + CDS 13168..14217 + /gene="rmlB" + /operon="capsular locus, cps" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="SBT85387.1" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPDVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAAD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + gene 14283..15134 + /gene="rmlD" + /operon="capsular locus, cps" + CDS 14283..15134 + /gene="rmlD" + /operon="capsular locus, cps" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="SBT85388.1" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAKMDITNEEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + gene 15216..15644 + /gene="tnp" + /operon="capsular locus, cps" + CDS 15216..15644 + /gene="tnp" + /operon="capsular locus, cps" + /codon_start=1 + /transl_table=11 + /product="transposase" + /protein_id="SBT85389.1" + /translation="MVLISLAHSFGSVSIIAHTIHQKFNLKVPNYRQEEDWARMGLPI + TRKEISNWHIKASQYYLESLYNLLREKLLEQPLLHADETSYRVLESDSHLTYYWTFLS + GKAENQAITLYHHDQRRSGLVVQEFLGDYSGYVHCDMLRQ" +ORIGIN + 1 atgagtagac gttttaagaa atcaggttca cagaaagtga agcgaagtgt taatatagtt + 61 ttgttgacta tttatttatt 
gttagtttgt tttttattgt tcttaatctt taagtacaat + 121 atccttgctt ttagatatct taatctagtg gcaactgcct ttgttctact agttgcctta + 181 atagggctac tctcgattat ctataaaaaa gctgaaaagt ttaccatttt tctgttggtg + 241 ctctctattc ttgtcagctc agtgtcgctc tttgcagtac agcagtttgt tggactgacc + 301 aatcgtttaa atgcgacttc taattactca gaatattcgc tcagtgtcgc tgttttagca + 361 gatagtgaga ttgagaatgt tacgcaactg acgagtgtga cagcaccgac tgggactgat + 421 aatgaaaaca ttcaaaaact actagctgat atcaaatcaa gtcagaatat cgatttgacg + 481 gttaatcaaa gttcgtctta cttgtcagct tacaggagtt tgattgcagg agagactaag + 541 gccattgtct taaatagtgt ctttgaaaat atcattgaat cggagtatcc agatcacgca + 601 tcgaagataa aaaagattta taccaaggga ttcattaaaa aagtagaagc tcctaagacg + 661 tctaagaatc agtctttcaa tatctatgtt agtggaattg atacttatgg tccaattagt + 721 tcggtgtcgc gttcagatgt caatatcttg atgactgtca atcgagatac caagaaaatt + 781 ctcttgacca caacgccacg tgatgcttat gtaccaatcg cagatggtgg aaataatcaa + 841 aaagataaat tgactcatgc gggcatttat ggagttgatt cgtccattca caccttagaa + 901 aatctctatg gagtggatat caattactat gtgcgattga acttcacttc gtttttgaaa + 961 ttgattgatt tgttgggtgg ggtagatgtt tataatgatc aggaattcac agctcttgct + 1021 aataaaaaac actattctat tggtaatgtc catttagatt cagaagaggc actcgctttt + 1081 gttcgtgagc gctattccct agcggatggt gatcgtgacc gtgggcgcaa tcaacaaaag + 1141 gtgattgtgg ctatccttca aaaattaact tcgaccgaag tactgaaaaa ttatagtacg + 1201 atcattgata gcttgcaaga ttctatccaa acaaacatgc cacttgagac catgataaac + 1261 ttggtcaatg ctcagttaga aagtggtgga acgtacaaag taaattcgca agacttgaag + 1321 ggtaggggac ggacggatct tccttcctat gcgatgccag atagtaacct ctatgtgatg + 1381 gaaattaacg acagtagcct tgcatctgtc aaaacggcta ttcaggacgt gttggagggc + 1441 agatgaaatg attgatattc attcgcacat tgtctttgat gtagatgatg gtcccaagtc + 1501 aagagaggaa agtaaggctc tcttgacaga agcctacagg cagggggtgc gaaccattgt + 1561 ctctacctct caccgtcgca agggcatgtt tgaaactcca gaagagaaga tagcagaaaa + 1621 ctttcttcag gttcgggaaa tagctaagga agtcgcgagt gacttggtca ttgcttatgg + 1681 ggctgaaatt tactacacgc cagatgtttt ggataagctg gaaaacaatc ggattccgac 
+ 1741 cctcaataat agtcgttatg ccttgataga gtttagtatg aacactcctt atcgcgatat + 1801 tcatagtgcc ttgaataaaa tattgatgtt gggaattact cccgtcattg cccacataga + 1861 gcgctatgat gttcttgaaa ataatgaaaa acgcgttcga gagctgatcg atatgggctg + 1921 ttacacgcaa ataaatagtt cacatgtcct caaatccaaa ctttttggag aaccttataa + 1981 attcatgaaa aaaagagcgc agtatttctt ggagcgtgat ttggttcata tcattgcaag + 2041 tgatatgcat aatgtggacg gcagaccccc ccatatggca gaagcatatg accttgtttc + 2101 ccaaaaatac ggagaagcga aggctcagga actttttata gacaatcctc gaaaaattgt + 2161 aatggatcaa ctaatttagg agaaatgatg aaagaacaaa acacgataga aatcgatgta + 2221 tttcaagtac ttaaaacctt gtggaaacac aagttaataa ttttattagt ggcgcttgtg + 2281 acaggggcgg gagcttttgc atatagcact tttattgtta aaccagaata tacgagcacc + 2341 acgcgtattt acgtcgtcaa ccgtaatcaa gaaggtaagt cgggactgac gaatcaggac + 2401 ttgcaggcag gaacttatct ggtaaaagac taccgcgaaa ttatcctttc gcaagatgta + 2461 ttggaaaagg tagcgacaaa tttgaaattg gatatgccag caaaagcgtt aactagcaaa + 2521 gttcaagtga ctgtaccaac cgacactcgt atcgtctcaa tctctgtcaa ggataaagaa + 2581 ccagaggaag ccagtcgcat tgctaattct ctacgagaag ttgctgcagg aaagatcgtc + 2641 gctgtaacgc gagtatctga tgtaacgacg cttgaagaag cgcggccagc tacgactccc + 2701 tcttctccca atgttcgacg taacacctta gttggttttc ttggaggagc cgtcgtaaca + 2761 gtaattactg ttcttttgat tgagttgctc gatacccgtg tgaaacgtcc tgaagaagtt + 2821 gaagaggtgc tgcaagtgcc acttctagga gtcgttccag atttggataa aatgaaatag + 2881 gaggaagtta tgccaacgtt agaaatctca caggtgaaat tagaacttgc gaaaaaggca + 2941 gaggaatatt ataatgcttt gtgcacgaac ctacagttaa gtggagatga tttgaaagta + 3001 ttttctatca cttctgtgaa accaggagaa ggaaaaacaa cgacttccac caatatcgct + 3061 cgggcttttg cgcgtgcagg ttacaaaacg ttgctgattg atgcagacat gcgtaactcc + 3121 gtgatgtcag gtgtctttaa atcaagggaa aggattaccg ggctaacaga atttctatca + 3181 gggactacag acctgtcaca gggactttgt gataccaata ttgagaatct ctttgtgatt + 3241 caggctggct ctgtgtcacc aaatccgaca gcccttcttc aaagtaggaa tttcagtaca + 3301 atgcttgaaa ccgtgcgtaa atattttgac tatatcgtcg tagacactgc tcctgtcggt + 3361 gtcgtgattg atgcggctat 
cattacgcag aaatgtgatg cttctatttt agtgacgaag + 3421 gcaggcgaaa caaagcgacg ggatattcaa aaagcgaaag aacagataga acaaactggg + 3481 aagccgtgtt taggagttgt gttgaataaa ttcgatactt cagtagacga atacggttct + 3541 tatggaagtt atgggaaaaa gaaaaaatag gttgggggat agagatgaat ggaaaactag + 3601 taaagccttc attggccata gtccagagtt ttcttgttat tttattggct tatctactta + 3661 gcactgtgag agaaacagag attgtttcaa caacagctat tgtactttat atcctccact + 3721 attttgcctt ttatatcagt gattatggac aggatttctt taaaagggga tatttgattg + 3781 aacttgtcca gacattgaaa tatatcctat tctttgcgct agcgattagt atttctaatt + 3841 ttttcttaga agatcgattt agtatttcca gaagaggcat gatttacttc ctcctattac + 3901 atgttttctt agtctatgtg ctaaaccgat ttatcaagtg gtattggaag cgggcttatc + 3961 ccaactttaa aggaagtaag aagattctcc tacttacagc aacttctcgt gtcgaaaagg + 4021 tattggatag actaatagaa tcagatgatg ttgttgggga gttggtagcc gtcagtgttt + 4081 tagataaacc agattttcag catgattatt taaaggttgt agcagagggg gagatcgtaa + 4141 actttgcgac tcatgaggtg gtcgatgaag tctttatcaa tcttccaagt gaaaaataca + 4201 atattggaga gcttgtctct cagtttgaaa cgatgggagt tgatgtaaca gtcaatctaa + 4261 atgctttcga ttgtatcttg gcacataaca agcaaatttg tgagatggca ggactaaacg + 4321 ttgtgacttt ttctacaaca ttttataaga ctagccatgt gattgctaag cgggttattg + 4381 atattatcgg ttccctggta ggtttgatac tatgtggtct agtcagtatt gtactggttc + 4441 ctttgattcg aaaggatggg ggctctgcta tttttgctca gacgcgtatt gggaaaaatg + 4501 gtcgccattt cactttttac aagtttcgct ctatgtgtgt ggatgctgag gagaaaaaaa + 4561 gagaactcat ggaacaaaat accatgcagg gtggaatgtt taaggtggat gaggatccac + 4621 gtatcacgaa aattggtcat tttatacgga agacgagctt ggacgagcta ccacagtttt + 4681 acaatgttct aaagggagat atgagtttgg tagggacacg accaccaaca gtggacgagt + 4741 atgagcacta taccccagaa caaaaacgtc gcctaagttt taaacctggc ataacaggtc + 4801 tatggcaggt cagcggacga agcgagatca agaatttcga tgaggttgtc aaattagatg + 4861 tggcctatat agacggttgg acaatttgga aagatattga aattttattg aagacagtta + 4921 aagttgtatt gatgaaggat ggagcgaagt agagagtttc tctctgacca caatcgtgca + 4981 atcctaataa tagcgagata ataaaattgt cttgctttta 
actcggactc taaatttagg + 5041 agttctagtg ataatattaa caataaaggt gaggtgaaaa atggatatag tatatgcgac + 5101 agataataat tttgtagatg tattgagtgc atctatcaag tcgctttaca ctactaattc + 5161 agatttggat ttaaatttat ggattattgc tgataaagtt tcggatagaa ataaagaaaa + 5221 gataaataga ttatcaaaac aatttgcgca gagagaaatt aattggatag agaacgttga + 5281 gattccattt aaattacatt tagatagggg atcaattagt tcatttagca gattatttct + 5341 gggaagtgtt cttccatctt caatgagtaa agttctctat cttgatagtg atattattgt + 5401 aatggattct ttacgaagta ttcttgatat tgattttaaa gataaaattc tctatggggt + 5461 aaatgatact tttaataaag aatacaagca ggtgttgggg ataccaatcg acaaaccaat + 5521 gtttaatgct ggagttatgc tgattaattt agagttatgg agaaataata acgtcgaaga + 5581 aaaatttttg caagtaattc aaaagtttaa tggtactata ttacaaggtg atttaggagt + 5641 tttaaatgca gttttatata actcatttgg tgtacttcct ccagaatata attatatgac + 5701 catatttgaa gatttgactt atgaagaaat gatagttttt aaaaaaccaa ttaactatta + 5761 ttcaaaagaa gaaattaaaa atgctagaga acgtatagtc ttgcgccatt tcacaacgtg + 5821 ttttctatca ctcagacctt ggcaagaaaa tagtgaggtg gcgcatgtgg aaatatttaa + 5881 aaaatactat agaggaacat acaaacaagt atctccatct aagttatcaa gaatttataa + 5941 aattttaccg aaaaaaatgt cgctctattt actaggtttt attcaatcaa aagtgcgtcc + 6001 aaaactgtat agaattttga aataagatgg ctagtagtaa tggcaaaaaa gaaagaattt + 6061 attgaaagtt caagaaaaat tgaaattatt aaaagagttt ataaaaatat gttctaaaaa + 6121 taaaatgaag tattttgctt ctggaggtag tctattggaa gctgcaagat acaaaggttt + 6181 tattccttgg aatgatgata tggctctagg tttaccaaga aagcattttg aaaagtttat + 6241 aaatgaaata gattttgaaa aatataataa aaattatatt ttagaaagtt cggaaatgaa + 6301 tttaggtatt tttcaatata aattaaaatc tgctatttta attttaggga aatcgtatga + 6361 cgtatgtttg aatttatttc tgttagacag gatgtcagaa ttggttattg atggtgagtc + 6421 aggttttaaa gtcccactat ataatttaga agtggctgta gatagaagta gaagtattat + 6481 tgagaataga gaactagcca atgagttagg tagtgttgct ttccaaagag ttcaatctat + 6541 atttgaaata aaagaaaaag tgtcagagct agagaatata ttcatgagtt taggagaaga + 6601 tgataatgtc aatatataaa ctttataaag atattgaaag aaaaacgatg tcgcctgcta + 6661 
aaaaagcaat ggctaaaaat gattattttg cgttttatgt tggaagaccg ttatcctatc + 6721 ttttaacagt tcctttttta aaaacgaata ttactcccaa tcaagtatct tatttatcta + 6781 tagccccttt gattcttgga tttctgacaa tgacatttac aactaatttc attctattat + 6841 tgctggcatg gtttctattt tttttatgga acttactaga tggagtagat gggaacttag + 6901 ctagatatcg ggagcaatac tcgaaggatg gaagtgtagt agatgcaatg gcaggctatg + 6961 tggctatggt gctgacgtat tttggtgcag gaatagtagc aactcatcta aatggctcag + 7021 atatgtatgt gattttgggt gctttatctg gaatttcttt gatttttcca agattggtga + 7081 tgcataagta tatcaacaca gtagcacgaa atgagtctgt caataacatt aaagataaat + 7141 caaattttag tactataaaa ctactggctt taaatatgac atcaattaca ggtattcctc + 7201 aggttttact actagtaacg attttaacaa atcagtggga attttttact ttagtatatt + 7261 tcacgattaa ttttttatta atgatatttt cgttatattc attatttaaa aaggagaatg + 7321 tttagagatg ggaaaatcag ttgcaatttt aatgaccact tataatggtg agagatattt + 7381 gtcacaacag attgatagta ttaggtctca aacatttacc aattggacgc tttttattag + 7441 agatgatgga tcaaaagata agacagtaga agtaatacag aggtattcta agatagatga + 7501 tagaattaga ttagttgaaa atccctcaaa gtttcatgga gcttattata atttttttaa + 7561 tctaattgaa tacgttaaaa acaattatca atttgattat tacttttttt gtgatcaaga + 7621 tgatatttgg aaagagcaca agctagaaat acagctgtta agattttcta aggatgaaat + 7681 gccagagatg gtttactctg atatgtcaac gattgatgcc aataataagt tgatagatat + 7741 tagtataaat aacataatgg ggattgaatt accgaacata aataatttgt attttattca + 7801 tgcctatatc tgggggtgta cggcaggctt taatcatgca ttgttagaga tggttccttc + 7861 agttgatatt gataaagatt atttatatat agaaaaactg tctcatgata attattttgc + 7921 aaagtttgca ctagagtatg ggaaggtgtt gttctgccct gagcaactgg tcttgtatcg + 7981 aagacacgga cataatgtaa caactagtca tcattttaaa ttatctccgc taaatattct + 8041 cagaaaggct attttgggtt tcaatgaatt ggcacttaca catgctgggg tatataatca + 8101 aactctttat atgctaaaaa aagcttctga aaaaagtcct ttaagtgata gactgcttga + 8161 aattcaggaa gtaatcaaaa ttggaggatt aaaaggtgtg agatatttct gtcagaatcg + 8221 aatttctcga aagcaactcg taagaaccat cggcttatat accatcatgc tttttggcac + 8281 ctataaaaaa tatattatga 
aagaactctc ataatgcttt taaatttctt attcatattt + 8341 atttttctat taattatcat tacatttata ttatttgagg gagatttgtt tcaacccgca + 8401 gtaattttaa cacttgctta ttttatttcg attgcaagtg ctctagttaa tagaaatgtt + 8461 tggggaacag aactccattt caaaaccttt ggtttgatat tgctaggggt tgctacattt + 8521 attatagttt ccttgttgac aaaattgtcg tacaaaccta aagtggaggg aatttcgtat + 8581 aaagaattaa aagaaataaa tccttcaaag ataatatatg gcattcttct gattctaaat + 8641 cttgttatgc tatttcttta tatccatgaa attcagaaag tggtactgtt ttcaggtaga + 8701 ggtttttcta atattacaga tttgataagt aactataggt acctatctta ttattcaaat + 8761 gaagtagaag atcgtgtaag tggaatgatt aatcaactag ctaaaattat tccagcgact + 8821 acatttgttt ctttatatat atttataaat aattatttta taacgaagca aataaagaaa + 8881 aatttcattt atttgattcc aatagctata ttctttgtct atgcaatcat tagtggtggt + 8941 agactgcccc ttataaggtt agttattgga actctgttga tattgtatat atactctgtg + 9001 tacgggagtc ataaatctca acttaccaga agttttaaaa tgattactcg ctctcttttt + 9061 gcatttctta tgttgatagt tttattcttt cttttaaaat ttgtattagg gcgttcttct + 9121 caggaagatt ttatcagtta catcactcgt tatatgggag gctcaattca actatttgat + 9181 ttatttgtta tagatccgat acgacgtaac aaagaactag gtgcagaaac tttttcggga + 9241 atttatgaga tgcttgcaaa attaggattt gataataata ttataaaagg cttagaatgg + 9301 agaatatcgc ctaattatta ttctttaggg aatgtgtata ctgcaattag acgctattat + 9361 tcagactttg gtgtaattgg tattgtaatt tgtcagagtt ttacagcatg gttgtatact + 9421 ttaggttatg aaaaaattag acatcattct ttagttacaa atggtcaaag atttaggttg + 9481 attctattag cagcttcatt ttatccatta tttttaaata gtatcgagga tgtgttttat + 9541 atttcaatgg ttaccattgg atatggaatc caaattgtta tcttttatct ggttttttgg + 9601 gttcttctga aagttcaggt tgactttaac aaaggtaaat taaggataaa tagatgaatt + 9661 tagcgctaat gtattgagtt atataaaggg atagatttgg tagtatttgt aggaatttta + 9721 attggaggaa gagagccttg aatgagaatt acaaatcttc tgaaacaatt tttaggtggg + 9781 gagtatagtt atgaaattga agtttcttat aacaaatttg tttcatgttc ttttgtctaa + 9841 tctgattaca attcttacat cagttatagt tgtactaatt ttaccaaaaa ttatgggagt + 9901 aactgagtat agttattggc aactatatat tttttaccta 
acatatattg gtttttttca + 9961 tctgggatgg attgatggaa tttatcttaa atatggcgga ttagagtacc agaacttaga + 10021 taagaaacag ttttattctc aaatacttca attttccagt tttttaattt taatttcttt + 10081 tctattattt ggttttaact tattgactgt gacagatcaa aatgcaaaat atatttataa + 10141 catgactatt attagtatga tagttacaaa tttaagaatg ttattcgttt atattttgca + 10201 gatgacaaat cgattaaagg atagttccat cattctaatc agtgatcgcg ttatatatgt + 10261 tattctttta ttcctgttta ttatatttaa atggcatgaa tacaaggtaa tgatttgggc + 10321 agatgttttg ggaaggacat tttctctcct actttctttt tggatttgta aagatattgt + 10381 ttttcaatcc ttatccgagt tcatattgga tctgagagag tcttttgaca atatccgtgt + 10441 tggaatcaat ttaatgttat ccaatattgc aagtagtatg attattggta ttgttcgaat + 10501 gggaattcaa tggaattgga atatcgaaac attcgggaaa gtatcactga cgctaagcat + 10561 ctctaattta ttaatgactt ttattaatgc gattggttta gttgtttttc ctttgttaaa + 10621 acggacaaaa acggaaaatt tatctaaaat ttattccaac ttaagaaatg ttttgatgct + 10681 tatcatgttc gcgattttgc tcatttacta tcctttaaaa attgtattag acctctggtt + 10741 gccagcctat caagatgcct tgattttcat gacccttatt ttccctatgt cagtctatga + 10801 aggaaaaatg gcattggtca ttaatactta cttaaaggca ttaagaatgg agagagatat + 10861 tctcaaaata aatactttga ttatgttgtt cagtatgtta gttaccctaa taactactct + 10921 attattaaat agtttagagc tgactgttgt atcgatagtt gttttgctag ctttacgtag + 10981 cgtaatagca gaactaattc tatctaaaaa actggatgtt tcggttaaga aagatattgt + 11041 attagaattt cttttgacga ttgtctttat ttcttcaagt tggtacttac cgatttggcc + 11101 cgcagtaata gtttatttgt tagcgtatac tttatacttg tatctaaagc gtaaagatat + 11161 aaaaatgtat atagaatatt ttagaaagaa aatatttgaa taaaaagaat tatatatcag + 11221 ttagatggca aattctattt ttaccttttt gtcgtttagt agaaaatgat aaaaaatatg + 11281 atactatttt ttgcacatat ctagaagcaa tttaaatgtg tcaggtgata aattaattta + 11341 aactaagaat agttgctgga acattgctat tagtgggaac aagttacgaa ataatttatc + 11401 aattttaaag acgtttttta ggaaatataa aataatggat tctatcaaca attctaatag + 11461 taatgataat gctagaaaat caaactgttc attttcaaag gaagattatt tttaaaataa + 11521 tatatcttta agtaagaatc attttattag acttaatcta 
gcctatcagt taaattaaaa + 11581 tatcaacttt gattaattaa aaattagcaa aatttattga cattttgctt tgataaattg + 11641 caataaaggt ctaattctga atttcaggga atataagaaa ggtacactat tatgaaaggt + 11701 attattcttg caggcggctc aggtacccgc ctgtacccac ttactcgggc tgcgtcaaaa + 11761 cagctgatgc cggtttatga taaacctatg atttattatc cgttgtcgac attaatgttg + 11821 gctggaatta aagatatttt gattatctca actcctcaag atttgccccg gtttaaggac + 11881 ttgctcttgg atggttccga atttgggatc aagctttcct atgcggaaca acctagtccc + 11941 gatggacttg ctcaggcttt tcttatcggt gaagaattta tcggtgacga tagtgttgcc + 12001 ttgattttgg gcgacaatat ctatcatgga cctggtttga gcaaaatgct tcaaaaggca + 12061 gcccagaaag agaaaggtgc gactgttttt ggctaccaag tgaaggatcc agagcgtttt + 12121 ggtgtggtcg agtttgatac agacatgaat gccatttcca tagaagaaaa accagagaat + 12181 cctcgctcca actatgccgt gaccggtctg tatttctatg ataatgatgt tgtagaaatt + 12241 gctaaaggta ttaaaccaag tgcacgtggc gagttagaaa ttacagatat caacaaggct + 12301 tacctaaatc gtggtgacct ttctgttgag ctgatggggc gtggttttgc ctggttggat + 12361 acgggaaccc atgaaagcct gctagaagct tctcagtata tcgaaacagt tcaacggatg + 12421 cagaatgttc aagttgcaaa cttggaagaa attgcctatc gcatgggcta tatcagttgt + 12481 gaagatgtgc tcgagttggc gcaacctctg aagaagaatg aatacggaca atatttgctc + 12541 cgtttgattg gagaagcata gatgtcagat aatttttttg gaaaaacact tgcagtgcgt + 12601 aagattgatg ctataccagg actgctagag tttgacattc ccgttcatgg agacaatcgt + 12661 ggttggttta aggaaaactt ccagaaggaa aagatggagc cacttggctt tcctgaaagc + 12721 ttctttgctg cagggaaatt gcaaaacaac gtcagctttt ctcgcaaaaa tgttcttcga + 12781 ggattgcatg cagaaccttg ggacaagtat atctctgttg cagacgatgg gaaggtttta + 12841 ggatcttggg ttgatctacg cgagggtgaa acctttggga atacctatca gacagtgatt + 12901 gatgcgagta agggaatctt tgttcctcga ggcgtagcta atggcttcca agttttatca + 12961 gatacagtgt catatagcta tctggtcaat gattactggg ctcttgaact caaacccaag + 13021 tatgcctttg tgaactacgc tgatccaagc cttggtattg aatgggaaaa tattgcagaa + 13081 gcagaggttt cagaagcaga taaaaatcat ccactactta aggatgtaaa acctttgaaa + 13141 aaagaagatt tggaataagg aaagaatatg actgaataca 
aaaatattat cgtgacaggt + 13201 ggagctggct ttatcggttc taactttgtc cattatgttt acgagaactt tccagatgtt + 13261 cacgtgacag tcctagataa gttgacttat gctggaaacc gcgcgaatat tgaggaaatt + 13321 ttaggtaatc gtgttgagtt agttgttggt gacattgctg atgcggagtt ggtagacaag + 13381 ttggctgctc aagcagatgc tatcgttcat tatgcagcgg aaagccacaa tgataattcg + 13441 ctcaatgatc catcgccatt tattcatact aacttcattg gaacctatac tcttttagaa + 13501 gctgctcgta agtatgatat tcgcttccac catgtatcga cagatgaagt ttatggggat + 13561 ctccctttac gcgaagattt gccaggtcat ggagaagggc cgggtgagaa atttacggct + 13621 gaaaccaagt acaatccaag ctcgccttac tcatcaacca aggcagcctc agatttgatt + 13681 gtcaaagcct gggtgcgttc ttttggagtc aaggcaacga tttccaactg ttcaaataac + 13741 tacggtcctt atcaacatat cgaaaaattc atcccacgtc agattactaa catcctaagt + 13801 ggtatcaagc caaaacttta cggtgaaggt aaaaacgttc gtgactggat tcataccaat + 13861 gaccattctt caggagtttg gacaatcttg acaaaagggc aaatcggtga aacctacttg + 13921 attggggctg atggtgagaa gaacaataag gaagttttgg aacttatcct taaggaaatg + 13981 ggacaagctg cggatgccta tgatcatgtg actgaccgtg caggacatga ccttcgctat + 14041 gcgattgatg ctagcaagct ccgtgatgag ttggggtgga aacctgaatt taccaacttt + 14101 gaagctgggc tcaaggcaac aatcaagtgg tatacagata accaagaatg gtggaaagca + 14161 gaaaaagaag ctgttgaagc caattatgct aagactcagg agattattac agtataaaaa + 14221 gcaggaaata gctgcttttt attgctatat tgggaagagt tacatattag aaaggtctag + 14281 agatgatttt aattacaggg gcaaatggcc aattaggaac ggaacttcgc tatttattgg + 14341 atgaacgtaa tgaagaatac gtggcagtag atgtggctaa gatggacatt accaatgaag + 14401 aaatggttga gaaagttttt gaagaggtga aaccgacttt agtctaccat tgtgcagcct + 14461 acaccgctgt tgatgcagca gaggatgaag gaaaagagtt ggacttcgcc atcaatgtga + 14521 cggggacaaa aaatgtcgca aaagcatctg aaaagcatgg tgcaactcta gtttatattt + 14581 ctacggacta tgtctttgac ggtaagaaac cagttggaca agagtgggaa gttgatgacc + 14641 gaccagatcc acagacagaa tatggacgca ctaagcgtat gggggaagag ttagttgaga + 14701 agcatgtgtc taatttctat attatccgta ctgcctgggt atttggaaat tatggcaaaa + 14761 acttcgtttt taccatgcaa aatcttgcga aaactcataa 
gactttaaca gttgtaaatg + 14821 atcagtacgg tcgtccgact tggactcgta ccttggctga gttcatgacc tacctagctg + 14881 aaaatcgtaa ggaatttggt tattatcatt tgtcaaatga tgcgacagaa gacacaacat + 14941 ggtatgattt tgcagttgaa attttgaaag atacagatgt cgaagtcaag ccagtagatt + 15001 ccagtcaatt tccagccaaa gctaaacgtc cgctaaactc aacgatgagc ctggccaaag + 15061 ccaaagctac tggatttgtt attccaactt ggcaagatgc attgcaagaa ttttacaaac + 15121 aagaagtgag ataagtagta gaatgatttt ctagtctaat aaaagaggca gagaatgaac + 15181 tccaaaggag cataagatgt acgattatct tatcgttggt gctgatctct ttggcgcata + 15241 gctttggctc agtttctatt atcgctcaca ccatccatca gaagtttaat ttgaaggtac + 15301 ccaattatcg ccaagaagaa gattgggcta ggatgggttt accaatcaca cgtaaggaaa + 15361 tctctaattg gcatatcaag gcaagtcaat actatttaga gtccctttat aaccttttac + 15421 gagaaaagtt gttagaacaa cctcttcttc atgcggatga aacctcttat cgggtgctag + 15481 agagtgatag ccatctgacc tactattgga cctttttgtc tgggaaagct gagaatcaag + 15541 caatcacgct gtaccatcat gatcagcgtc ggagtggttt agtagtacaa gaattcctag + 15601 gagattattc tggctatgtg cattgtgata tgttgcggca gtaacttagg actttagtcc + 15661 tctagttctg cctatgcgat agcagtccaa ggtttaggag caaggcgacg ctaagcttgg + 15721 taaac +// + diff --git a/public/res/serotype_genbank/serotype_6F.gb b/public/res/serotype_genbank/serotype_6F.gb new file mode 100644 index 0000000..617439f --- /dev/null +++ b/public/res/serotype_genbank/serotype_6F.gb @@ -0,0 +1,581 @@ +LOCUS KC832410 18783 bp DNA linear BCT 09-FEB-2015 +DEFINITION Streptococcus pneumoniae strain MNZ1136 dexB gene, partial cds; and + capsular polysaccharide synthesis gene locus, complete sequence. +ACCESSION KC832410 +VERSION KC832410.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 18783) + AUTHORS Oliver,M.B., van der Linden,M.P.G., Kuntzel,S.A., Saad,J.S. and + Nahm,M.H. 
+ TITLE Discovery of Streptococcus pneumoniae Serotype 6 Variants with + glycosyltransferases Synthesizing Two Differing Repeating Units + JOURNAL J. Biol. Chem. 288 (36), 25976-25985 (2013) + PUBMED 23897812 +REFERENCE 2 (bases 1 to 18783) + AUTHORS Oliver,M.B., van der Linden,M.P.G., Kuntzel,S.A., Saad,J.S. and + Nahm,M.H. + TITLE Direct Submission + JOURNAL Submitted (25-MAR-2013) Microbiology, University of Alabama at + Birmingham, Bevill Building, Room 614, 845 19th Street South, + Birmingham, AL 35294, USA +COMMENT ##Assembly-Data-START## + Sequencing Technology :: Sanger dideoxy sequencing + ##Assembly-Data-END## +FEATURES Location/Qualifiers + source 1..18783 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="MNZ1136" + /serotype="6F" + /db_xref="taxon:1313" + /geo_loc_name="Germany" + /note="6X12; + serogroup: 6" + CDS <1..87 + /note="glucan 1,6-alpha-glucosidase" + /codon_start=1 + /transl_table=11 + /product="dexB" + /protein_id="AHF51326.1" + /translation="VLIENTLAQEVFEKQILVPWDAFCVELL" + misc_feature 246..411 + /note="similar to aliB" + misc_feature 412..938 + /note="similar to transposase; tnp" + misc_feature 1160..16644 + /note="capsular polysaccharide synthesis gene locus" + CDS 1160..2605 + /note="COG1316 transcriptional regulator; integral + membrane regulatory protein Wzg" + /codon_start=1 + /transl_table=11 + /product="wzg" + /protein_id="AHF51327.1" + /translation="MSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VDQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSTLHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAIIKKLTST + EVLKNYSSILQGLQDSLQTNMPIETMIDLVNTQLESGGNYKVNSQDLKGTGRMDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + CDS 2607..3338 + /note="capsular polysaccharide 
biosynthesis protein; + member of homology group 1; protein-tyrosine phosphatase + Wzh" + /codon_start=1 + /transl_table=11 + /product="wzh" + /protein_id="AHF51328.1" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAEAYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLGKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEQNLVYVIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQELFIDNPRKIVMDQLI" + CDS 3344..4039 + /note="member of homology group 2; capsular polysaccharide + biosynthesis protein Wzd" + /codon_start=1 + /transl_table=11 + /product="wzd" + /protein_id="AHF51329.1" + /translation="MMKEQNTIEIDVFQLFKTLRQRKLMILLVALVTSAGAFAYSTFI + VKPEYTSTTRIYVVNRNQGDKPGLTNQDLQAGTYLVKDYREIILSQDALEKVATNLKL + DMPAKTLASKVQVAVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIELLDTRVKRPEDVEDVLKI + PLLGLVPDFDKMK" + CDS 4049..4738 + /note="COG0489 ATPases involved in chromosome + partitioning; member of homology group 3; capsular + polysaccharide biosynthesis protein Wze; tyrosine-protein + kinase Wze" + /codon_start=1 + /transl_table=11 + /product="wze" + /protein_id="AHF51330.1" + /translation="MPTLEISQAKLDSVKKVEEYYNALCTNLQLSGDGLKVFSITSVK + TGEGKSTTSTNIAWAFARAGYKTLLIDGDIRNSVMLGVFKARDKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRNCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGVVLNKFNTSVDKYGFY + GNYGDYGKNKK" + CDS 4753..6120 + /note="COG2148 sugar transferases involved in + lipopolysaccharide synthesis; undecaprenylphosphate + glucosephosphotransferase WchA (initial sugar + transferase)" + /codon_start=1 + /transl_table=11 + /product="wchA" + /protein_id="AHF51331.1" + /translation="MNGKIVKSSLAIIQSFLVILLTYLLSAVREAEIVSTTAIALYIL + HYFVFYISDYGQDFFKRGYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYF + LTLHALLVYVLNLFIKWYWKRAYPNFKGSKKILLLTATSRIEKVLDRLIESNEVVGEL + VAVSVLDKPDFQHDYLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + IDVTVNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHVIAKRIIDIVGALVGLIL + 
CGLVSIVLVPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYINGWTIWKDIEILLKTVKVVFM + RDGAK" + CDS 6216..7160 + /note="member of homology group 62; HMMPfam hit to + PF01501, glycosyl transferase family; + alpha-1,3-glycosyltransferase" + /codon_start=1 + /transl_table=11 + /product="WciN" + /protein_id="AHF51332.1" + /translation="MNIVYATDNNFVDVLSASIKSLYTTNSDLDLNLWIIADKVSDRN + KEKINRLSKQFAQREINWIENVEIPFKLHLDRGSISSFSRLFLGSVLPSSMSKVLYLD + SDIIVMDSLRSIFDIDFKGKILYGVNDTFNKEYKQVLGIPIDKPMFNTGVMLINLELW + RNNNVEERFLQVIQKFNGTILQGDLGVLNAVLYNSFGVLPPEYNYMTIFEDLTYEEMI + VFKKPINYYSKEEIKNARERIVLRHFTTSFLSKRPWQEGSNVAHIDQFKKYYEGSYKN + VKESILLKIVQKLPKKCSVFLLGIIQSKFRPKLYRILK" + CDS 7198..7371 + /note="member of homology group 262; HG262" + /codon_start=1 + /transl_table=11 + /product="hypothetical protein" + /protein_id="AHF51333.1" + /translation="MKIQEELKLLKEFIKICSKNKIKYFALGGSLLGAVRHKGFIPWD + DMDLSFPKSSIYV" + CDS 7431..8150 + /note="member of homology group 81; putative ribitol + phophotransferase" + /codon_start=1 + /transl_table=11 + /product="wciO" + /protein_id="AHF51334.1" + /translation="MSIYRICKDIERKTMSPAKKAMAKNDYFAFYVGRPLSYLLTVPF + VKTNITPNQISYLSIIPLIVGFIIMIFTTDFVVLLLAWFLFFLWNLLDGVDGNLARYR + EQYSKDGSVVDAMAGYVAMVLTYFGAGIVAAHLNDSDIYIILGALSGISLIFPRLVMH + KYINTVAQDESVSSIKDKSDFNTIKILALNMTSITGIPQVLLLLTILTNQWVLFTLVY + FTINFLLMIFFLYSLFKKENV" + CDS 8153..9139 + /note="member of homology group 97; putative glycosyl + transferase" + /codon_start=1 + /transl_table=11 + /product="wciP" + /protein_id="AHF51335.1" + /translation="MGKSVAILMTTYNGERYLSQQIDSIRSQTFTNWTLFIRDDGSKD + KTIEVIQRYSKIDDRIRFVENPSKFHGAYYNFFNLIEYVKNNYQFDYYFFCDQDDIWK + EHKLEIQLLRFSKDDMPEMVYSDMSTIDASNNLIDISINKIMGIELPNINNLYFIHAY + IWGCTAGFNHALLEMVPSVDIDKDYLYIEKLAHDSYFAKFALEYGKVLFCPEQLVLYR + RHGHNVTTSHHFKLSPLNVFRKAILGFNELALTHARVYNQTLYMLKKASGKNPLSDRL + LEIQEVIKIGGLKGVRYFYQNRISRKQLVRTIGLYTIMLFGTYKKYIMKELL" + CDS 9139..10482 + 
/note="member of homology group 139; oligosaccharide + repeat unit polymerase Wzy" + /codon_start=1 + /transl_table=11 + /product="wzy" + /protein_id="AHF51336.1" + /translation="MLLNFLFISIFLLIIITFILFEGDFFQPAVILTIAYFISIASAL + VNRNVWGTELHFKTFYLILLGVATFVIVSLLTKLSYRPKVEGISHEELKEINPSKIIY + VILLTLNLVMLFLYIREIQKVVLFSGRSFSNITDLISNYRYLSYYSNEVENRVSGMIN + QLSKIIPATTLISLYIFMNNYFITKQIKKNFIYLIPIAIFFVYAIISGGRLPLIRLVV + GSLLILDIYSVYGSPKSQLTKSFKMITRSLITFLIWIVLFFLLKFVLGRSSQEDFIRY + ITRYMGGSIQLFDLFVIDPIRRNKELGAETFSGIYEMLAKLGFDNNIIKGLEWRVSPN + YYSLGNVYTAIRRYYSDFGVIGIVICQSFTAGLYTLGYEKVRHYSLVTNVQRFRLILL + AASFYPIFLNGIEDVFYISMVTIGYGIQIVIFYLVFWVLLKVQVDFNKGKLTINR" + CDS 10607..12019 + /note="member of homology group 82; flippase Wzx" + /codon_start=1 + /transl_table=11 + /product="wzx3" + /protein_id="AHF51337.1" + /translation="MKLKFLITNLFHVFLSNPITIVTSVIVVLILPKIMGVTEYSYWQ + LYIFYLTYIGFFHLGWIDGIYLKYGGLEYQNLDKKQFYSQILQFSSFLILISFLLFGF + NLLIVTDPNAKYIYNMTIISMIVTNLRMLFVYILQMTNRLKDSSIILISDRVIYIFLL + FLFIIFKWHEYKVMIWADVLGRTFSLLLSFWICKDIVFQSLSEFILDLRESFDNIRVG + INLMLSNIASSMIIGIVRMGIQWNWNIETFGKVSLTLSISNLLMTFINAIGLVVFPLL + KRTKTENLSKIYSNLRNVLMLIMFAILLFYYPLKIILDLWLPAYRDALIFMALIFPMS + IYEGKMALVINTYLKALRMERDILKINTLIMLFSMLVTLITTLLLNNLELTVISIVVL + LALRSIIAELILSKKLDISVEPDIVLELLMTIIFISSSWYLPIWLAVIVYLLAYTLYL + YLKRKDTKMYIEYFRKKIFE" + CDS 12513..13382 + /note="member of homology group 10; glucose-1-phosphate + thymidylyltransferase RmlA" + /codon_start=1 + /transl_table=11 + /product="rmlA" + /protein_id="AHF51338.1" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLPRFKELLQDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFIGDDSV + ALILGDNIYHGPGLSKMLQKAAKKEKGATVFGYQVKDPERFGVVEFDTDMNAISIEEK + PEYPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLALAQPLKKN + EYGQYLLRLIGEA" + CDS 13383..13976 + /note="member of homology group 11; + dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase RmlC" + /codon_start=1 + /transl_table=11 + /product="rmlC" + 
/protein_id="AHF51339.1" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYSFVNYA + DPSLGIEWENIAEAEVSEADKNHPLLKDVKPLKKEDL" + CDS 13989..15038 + /note="member of homology group 8; dTDP-D-glucose + 4,6-dehydratase RmlB" + /codon_start=1 + /transl_table=11 + /product="rmlB" + /protein_id="AHF51340.1" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPDVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAAD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + CDS 15104..15955 + /note="member of homology group 9; dTDP-4-keto-L-rhamnose + reductase RmlD" + /codon_start=1 + /transl_table=11 + /product="rmlD" + /protein_id="AHF51341.1" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAKMDITNEEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLTKAKATGFVIPTWQDALQE + FYKQEVR" + CDS 16018..16644 + /note="UDP-galactopyranose mutase Glf" + /codon_start=1 + /transl_table=11 + /product="glf" + /protein_id="AHF51342.1" + /translation="MYDYLIVGAGLFGAVFAHESALKGKKVKVIEKRNHIAGNIYTRE + EEGIQVHQYGAHIFHTSDKEIWDYVNQFAEFNRYTNSPVANYKGEIYNLPFNMNTFNK + LWGVVTPAEAQAKIEEQRAILNGKTPENLKEQAISLVGTDIYEKLIKDYTEKQWGKPT + TELPSFIIRRLPVRLTYDNNYFNDTYQGIPIGGYTQIVEKCWIMKILM" + misc_feature 17441..>18783 + /note="similar to aliA; ABC-type oligopeptide transport + system, periplasmic component" +ORIGIN + 1 gtcttgattg aaaacaccct agctcaagaa gtctttgaaa aacaaatctt agttccatgg + 61 gatgctttct gtgtggaatt actataaata ttttttgcag taaaatttaa aattgaaatc + 121 gtataaaaac aagggaggac tgtataaaag acagaaatcc 
tttgtttttt ataaccaaag + 181 tttataaact ttcattcttg aaattcaatt aactttacaa attcccacta ttaaggagaa + 241 agaagatgaa cataaagaag cgtgtcctta gtgcaggcct gacttttgca tctgctttgc + 301 ttttagctgc ttgcggccaa tcaggttcag atacaaaaac ttactcatca acctttagtg + 361 gaaatccaac tacatttaac tatctattag actattacac tgataatata gtcaattgaa + 421 acaagaacaa gacaaaagag cctcataaaa ggtattgcaa cttggtaata cctttttgag + 481 gtgctttttg atatgagccc atgttttctc aataggattg tactcaggtg agtagggagg + 541 aagaggtaaa agtttatgcc taaactcttc gcataaaagt tctaacttac ccattctatg + 601 gaatcttgca ttatccataa taataaccga tggtgtggtt aatgttggta agagaaactt + 661 ctgaaaccat acttcaaaaa agtcgctcgt catcatctct tcgtaagtca ttggagcgat + 721 taactcacca ttcatttgtt agacctgcaa ccaaagaaat cctccgatat cttcttccag + 781 atattttgcc tcttcttaat tgacctttta aagagcgacc atattctcga taaaaataag + 841 tatcgaatcc tgtttcatca atctaaacag gtgctaggtg ctttaaacta ttaaaattct + 901 taagaaataa ggctactttt tctgggtctt gttcataatt agattgaaac tagaatagta + 961 cacctctgct tctaaaacat tgttagaaat cgatttgact gtcctgatcg ttttgtcatg + 1021 ttcttatttc attttactat atttttggtt cgtgggaagt ctactaagat acttaaagat + 1081 gcagatagtg aaaaaaggtg tagacattac cgtaaaaaag tgatataatc gtatgatgtt + 1141 caatgtatag gtgttaatca tgagtagacg ttttaaaaaa tcaggttcac agaaagtgaa + 1201 gcgaagtgtt aatatagttt tgttgactat ttatttattg ttagtttgtt ttttattgtt + 1261 cttaatcttt aagtacaata tccttgcttt tagatatctt aatctagtgg taactgcgtt + 1321 agtcctacta gttgccttgg tagggctact cttgattatc tataaaaaag ctgaaaaatt + 1381 tactattttt ctattggtgt tttctatcct tgtcagctca gtgtcgctct ttgcagtaca + 1441 gcagtttgtt ggactgacca atcgtttaaa tgcgacttct aattactcag aatattcaat + 1501 cagtgtcgct gttttagcag atagtgatat cgaaaatgtt acgcaactga cgagtgtgac + 1561 agcaccgact gggactgata atgaaaacat tcaaaaacta ctagctgata ttaagtcaag + 1621 tcagaatacc gatttgacgg tcgaccagag ttcgtcttac ttggcagctt acaagagttt + 1681 gattgcaggg gagactaagg ccattgtcct aaatagtgtc tttgaaaata tcatcgagtc + 1741 agagtatcca gactacgcat cgaagataaa aaagatttat accaagggat tcactaaaaa + 1801 agtagaagct 
cctaagacgt ctaagaatca gtctttcaat atctatgtta gtggaattga + 1861 cacctatggt cctattagtt cggtgtcgcg atcagatgtc aatatcctga tgactgtcaa + 1921 tcgagatacc aagaaaatcc tcttgaccac aacgccacgt gatgcctatg taccaatagc + 1981 agatggtgga aataatcaaa aagataaatt aacccatgcg ggtatttatg gagttgattc + 2041 gtccattcac accttagaaa atctctatgg agtggatatc aattactatg tgcgattgaa + 2101 cttcacttct ttcttgaaaa tgattgactt attgggaggg gtagatgttc ataatgatca + 2161 agagttttca actctacatg ggaagttcca tttcccagta gggaatgtcc atctagactc + 2221 tgagcaggct ctaggttttg tacgtgaacg ctactcacta gccgatggag accgtgaccg + 2281 tggtcgcaac caacaaaagg tcattgtagc aattattaag aagttaactt ctacagaggt + 2341 tttgaaaaac tatagtagta ttcttcaagg attgcaggat tctcttcaaa caaatatgcc + 2401 gattgagact atgatagatt tagtgaatac tcagttggag agtggaggga attataaagt + 2461 aaattcgcaa gacttgaaag gtacaggtcg gatggatctt ccttcttatg caatgccaga + 2521 cagtaacctc tatgtgatgg aaatagatga tagtagttta gctgtagtta aagcagctat + 2581 acaggatgtg atggagggta gatgaaatga tagacatcca ttcgcatatc gtttttgatg + 2641 tagatgacgg tcccaagtca agagaggaaa gcaaggctct cttggcagaa gcctacagac + 2701 agggggtgcg aaccattgtc tctacctctc accgtcgcaa gggcatgttt gaaactccgg + 2761 aagagaagat agcagaaaac tttcttcagg ttcgggaaat agctaaggaa gtggcgagtg + 2821 acttagtcat tgcttacggg gctgaaattt actacacacc agatgttctg gataagctgg + 2881 gaaaaaagcg gattccgacc ctcaatgata gtcgttatgc cttgatagag tttagtatga + 2941 atactcctta tcgcgatatt catagcgcct tgagcaagat tttgatgttg ggaattactc + 3001 cagtcattgc ccacattgag cgctatgatg ctcttgaaaa taatgaaaaa cgcgttcgag + 3061 aactaatcga tatgggctgt tacacgcaag taaatagttc acatgtcctc aaacccaaac + 3121 tttttggcga acgttataaa ttcatgaaaa aaagagctca gtatttttta gagcagaatt + 3181 tggtttatgt cattgcaagt gatatgcaca atctagacgg tagacctcct catatggcag + 3241 aagcatatga ccttgttacc caaaaatacg gagaagcgaa ggctcaggaa ctttttatag + 3301 acaatcctcg aaaaattgta atggatcaac taatttagga gaaatgatga aagaacaaaa + 3361 cacgatagaa atcgatgtat ttcaattatt taaaaccttg cggcaacgca agctaatgat + 3421 tttattagtg gcacttgtga caagtgcggg 
ggcttttgca tatagcactt ttattgttaa + 3481 gccagaatat acgagtacca cgcgaattta cgtagtgaat cgcaatcaag gagacaagcc + 3541 ggggctgaca aatcaggatt tgcaggcagg aacttatctg gtaaaagact accgtgagat + 3601 tatcctttcg caggatgcat tggaaaaagt agcgacaaat ttgaagttgg atatgccagc + 3661 aaaaacgtta gccagcaaag ttcaagtggc tgtaccagct gacactcgta tcgtctcaat + 3721 ctctgtcaag gataaacagc cagaggaagc cagtcgtatc gctaattctc tacgagaagt + 3781 tgctgcagaa aagatcgtcg ctgtaacgcg agtatctgat gtaacgacac ttgaagaagc + 3841 gcgaccagct acgactccct cttctccaaa tgttcgacgc aattccttgt ttggttttct + 3901 tggaggagca gtcgtaacag taattgctgt tcttttgatt gagttgctcg acacccgtgt + 3961 gaaacgtcct gaagatgttg aagatgtact gaaaattcca cttttagggc tcgttccaga + 4021 ttttgacaaa atgaaatagg aggaagttat gccaacatta gaaatctcac aggcaaaatt + 4081 ggattctgta aaaaaggtag aggaatatta taacgctttg tgcacgaacc tacagttaag + 4141 tggagatggt ttgaaagtat tttctatcac ttctgtgaaa acaggagaag gaaaatcaac + 4201 gacttccacc aatatcgctt gggcttttgc gcgtgcaggt tacaaaacgc tgctgattga + 4261 tggagatatt cgcaattctg ttatgttagg tgtctttaaa gcaagggata agattacagg + 4321 cctgacagaa tttttatcag gaactacaga cctatcacaa gggctttgtg ataccaatat + 4381 cgaaaatctc tttgtaattc aggctggctc tgtgtcaccg aatccgacag ctcttcttca + 4441 aagtaagaat ttcagtacaa tgcttgaaac cttgcgtaaa tattttgact acatcattgt + 4501 agatactgct cctgtcggtg tcgtgattga tgcggctatt attacgcgaa actgcgatgc + 4561 ttctatttta gtgacggagg caggtgaaat aaatcgacgg gatattcaaa aagcaaaaga + 4621 acagttggaa cacacaggga agccgttttt gggagttgtg ttgaataaat tcaatacttc + 4681 agtagacaaa tacggttttt atggaaatta tggagattac gggaaaaata aaaaataggt + 4741 cgggggatag agatgaatgg aaaaatagta aagtcttcat tggccataat ccagagtttt + 4801 cttgttattt tattgactta tctacttagt gctgtgagag aagcggagat tgtttcaaca + 4861 acagctattg cactttatat cctccattat tttgtctttt atatcagtga ttatggacag + 4921 gatttcttta aaaggggata tttgattgaa cttgtccaga cattgaaata tatcctattc + 4981 tttgcactag cgattagtat ttctaatttt ttcttagagg atcgatttag tatttccaga + 5041 cgaggcatga tttacttcct cacattacat gctctcttag tctatgtgct 
aaacctattt + 5101 atcaagtggt attggaagcg ggcttatccc aactttaaag gaagtaagaa gattctccta + 5161 cttacagcaa cttctcgtat cgaaaaggta ctggatagat taatagaatc aaatgaggtt + 5221 gttggggagt tggtagccgt cagtgtctta gataaaccag attttcagca tgattattta + 5281 aaggtagtag cagaggggga gatagtaaac tttgcgactc atgaggtggt cgatgaagtc + 5341 tttatcaatc ttccaagtga aaaatacaat attggagagc ttgtctctca gtttgaaacg + 5401 atgggaattg atgtaacagt taatctaaat gcttttgatc gtagtttggc acgtaacaag + 5461 caaattcgtg agatggcagg attaaacgtt gtgacttttt ctacaacatt ttataagact + 5521 agtcatgtaa ttgctaagcg gattattgat atcgtgggtg cattggtagg gctgatatta + 5581 tgtggtttag tcagtattgt actggttcct ttgattcgaa aggatggggg ctctgctatt + 5641 tttgctcaga cgcgtatagg aaaaaatggt cgtcagttca ctttttataa gtttcgctct + 5701 atgtgtgtag atgccgaggc gaaaaaaaga gaactcatgg aacaaaatac catgcagggt + 5761 ggaatgttta aggtggacga tgatcctcgt atcacgaaaa ttggtcgttt tatacggaag + 5821 actagcttgg acgagctacc acagttttac aatgttctaa agggagatat gagcttggta + 5881 ggtacacgac caccaacagt ggacgagtat gagcactata ccccagaaca aaaacgccga + 5941 ctaagtttta aacctggcat aacaggttta tggcaggtca gcggacgaag tgaaatcaag + 6001 aatttcgatg aagttgtcaa attagatgtg gcctatatta atggttggac aatctggaaa + 6061 gatattgaaa ttttattgaa aacggttaaa gttgtattta tgagagatgg agcgaaatag + 6121 tttggttgtg taggatattt gtagaggtaa aagtttcgaa tatatctcac tcaatctttt + 6181 ttataagtga aaataaattt agaagtagga attttatgaa tatagtttat gccacagata + 6241 ataattttgt agatgtattg agtgcttcca tcaaatcact ttacactact aattcagatt + 6301 tggatttaaa tttatggatt attgctgata aagtttcgga tagaaataaa gaaaagataa + 6361 atagattatc aaaacaattt gcgcagagag aaattaattg gatagagaac gttgagatcc + 6421 catttaaatt acatttagat aggggatcaa ttagttcatt tagcagatta tttctgggaa + 6481 gtgttcttcc atcttcaatg agtaaagttc tttatcttga cagtgatatt attgttatgg + 6541 attctttacg aagtattttt gatattgatt ttaagggtaa aattctctat ggggtgaatg + 6601 atacttttaa taaagaatac aagcaggtgt tgggtatacc aattgacaag ccaatgttta + 6661 atactggagt tatgcttatt aatttagagt tatggagaaa taataacgtc gaagaaagat + 6721 ttttgcaagt 
aattcaaaag tttaatggta ctatattaca aggagattta ggggttttaa + 6781 atgcagtttt atataactca tttggtgtac ttcctccaga atataattat atgaccatat + 6841 ttgaagattt gacttatgaa gaaatgatag tttttaaaaa accaattaat tattattcaa + 6901 aagaggaaat taaaaatgcc agagaacgta tagtcttgcg acatttcaca actagttttt + 6961 tatcaaaaag accttggcaa gaaggcagta atgttgcaca tatagaccaa tttaaaaaat + 7021 actatgaagg tagttataaa aatgttaaag aatctatttt actaaaaata gttcaaaaat + 7081 tacccaaaaa atgttcagtt tttttattag gaattattca atcaaaattt agacctaaat + 7141 tgtatagaat tttgaaataa ggtggatagt attaatgaca aaaaagaaag aattttattg + 7201 aaaattcaag aagaattgaa attattaaaa gagtttataa aaatatgttc taaaaataaa + 7261 attaagtatt ttgctcttgg aggtagtcta ttaggagctg taagacacaa aggtttcatt + 7321 ccttgggatg atatggatct aagctttcca aagagttcaa tctatgtttg aaataaagga + 7381 aaaagtgtta gaattagaga atgtattaat gagtttagga gaaagtatag atgtcaatat + 7441 atagaatctg taaagatatt gaaagaaaaa ctatgtcgcc tgctaaaaaa gcaatggcta + 7501 aaaacgacta ttttgcattt tatgttggaa gacctttatc ctatctttta acagttcctt + 7561 tcgtgaaaac aaatattact cccaatcaaa tatcttattt atctataatt cctttgattg + 7621 ttggatttat aataatgata tttacaactg atttcgttgt attattactg gcatggtttc + 7681 tatttttttt atggaactta ctagatggag tagatgggaa cttagccaga tatcgggagc + 7741 aatactcgaa ggatggaagt gtagtagatg caatggctgg ctatgtagcc atggtgttga + 7801 cgtatttcgg tgcaggaata gtagctgctc atttaaacga ctcagatatc tatataattt + 7861 tgggtgcatt atctgggatt tcattgattt ttccaaggtt agtgatgcat aagtatatca + 7921 atacagtagc tcaagatgag tctgtgagta gcattaaaga taaatctgat tttaatacta + 7981 taaaaatact ggctctaaac atgacatcaa ttacaggaat tccgcaggtt ttactgctat + 8041 taactatttt aacaaatcag tgggtacttt ttactttagt atattttacg attaattttt + 8101 tattaatgat atttttcttg tattcattat tcaaaaagga gaatgtttag aaatgggaaa + 8161 gtcagttgca attttaatga ccacctataa tggtgagcga tatttgtcac aacagattga + 8221 tagtattagg tctcaaacat tcactaattg gacacttttt attagggatg atggatcaaa + 8281 agataaaaca atagaagtaa tacagaggta ttctaagata gatgatagaa ttagattcgt + 8341 tgaaaatccc tcaaagtttc atggagctta 
ttacaatttt tttaatctaa ttgaatacgt + 8401 taaaaacaat tatcaatttg attattactt tttttgtgat caagatgata tttggaaaga + 8461 gcacaagtta gaaatacagc tgttaagatt ttctaaagat gacatgccag agatggttta + 8521 ctctgatatg tcaacgattg atgccagtaa taatttgata gatattagta taaataaaat + 8581 aatggggatt gaattaccga acataaataa tttgtatttt attcatgcct atatctgggg + 8641 gtgtactgca ggttttaatc atgcattgct agagatggtt ccttcagttg atattgataa + 8701 agattattta tatatagaaa aactggctca tgatagttat tttgcaaagt ttgcactaga + 8761 gtatgggaag gtgttgttct gccctgagca actggtcttg tatcgaagac atggacataa + 8821 tgtaacaact agtcatcatt ttaaattatc tccgctaaat gttttcagaa aggctatatt + 8881 gggtttcaat gaattggcac ttacacatgc tagggtatat aatcaaactc tttatatgct + 8941 aaaaaaagct tctggaaaaa atcctttaag tgatagacta cttgaaattc aggaagtaat + 9001 caaaattgga ggattaaaag gtgtgagata tttctatcag aatcgaattt ctcgaaagca + 9061 actcgtaaga acaatcggct tatataccat catgcttttt gggacctata aaaaatatat + 9121 tatgaaagaa ctcttataat gcttttaaat ttcttattca tatctatttt tctattaatt + 9181 atcattacat ttatattatt tgagggggat ttttttcaac ctgcagtaat tttaacaatc + 9241 gcttatttta tttcgattgc aagtgctcta gttaatagaa atgtttgggg aacagaactc + 9301 catttcaaaa ccttttattt gatattgtta ggggttgcta catttgttat agtttccttg + 9361 ttgacaaaat tgtcgtacag gcctaaagtg gagggaattt cgcatgaaga attgaaagaa + 9421 ataaatcctt caaagataat ctatgtcatt cttctgactc taaatcttgt tatgttattt + 9481 ctttatatcc gtgaaattca gaaagtagta ttgttttcag gtagaagttt ttctaatatt + 9541 acagatttga taagtaacta taggtaccta tcttattatt caaatgaagt agaaaatcgt + 9601 gtaagtggaa tgattaatca actatctaaa attattccag cgactacact tatttcttta + 9661 tatatattta tgaataatta ttttataact aaacaaataa agaaaaattt catttatttg + 9721 attccaatag ctatattctt tgtctatgca atcattagtg gtggtagatt gccccttata + 9781 aggttagttg ttggatctct gttgatattg gatatatact ctgtgtacgg gagtcctaaa + 9841 tctcaactta ccaaaagttt taaaatgatc actcgctctc tgattacatt tcttatttgg + 9901 atagttttat tctttctttt aaaatttgta ttagggcgct cctctcagga agattttatc + 9961 aggtacatca ctcgttatat gggaggttca attcaactat ttgatttatt 
tgttatagat + 10021 ccgatacgac gtaacaaaga actaggtgca gaaacttttt cgggaattta tgagatgctt + 10081 gcaaaattag gatttgacaa taatattata aaaggcttag aatggagagt gtctcctaat + 10141 tattattctt tagggaatgt gtatactgca attagacgtt attattcaga ctttggcgta + 10201 attggtattg taatttgtca gagttttaca gcggggttat atactttagg ttatgaaaaa + 10261 gttagacatt attctttagt tacaaatgtt caaagattta ggttgatcct attagcagct + 10321 tcattttatc caatattttt aaatggtatc gaggatgtgt tttatatttc aatggttacc + 10381 attggatatg gaatacaaat tgttatcttt tatctggtct tttgggttct tctgaaagtt + 10441 caggttgact ttaacaaagg taaattaacg ataaatagat gaatttagcg ctaatgtatt + 10501 gagtcatata aagggatata tttggtaggt attttaattg gaggaagaga gtcttgaatg + 10561 ggaagtacaa atcttctgaa ataattttta ggtggggagt atagctatga aattgaagtt + 10621 tcttataaca aatttgtttc atgtcttttt gtctaatccg attacaattg tcacatcggt + 10681 tatagttgta ctaatcttac caaaaattat gggagtaact gagtatagtt attggcaact + 10741 atatattttt tacctaacat atattggttt ttttcatctg ggttggattg atggaattta + 10801 tcttaaatat ggtggattag agtaccagaa tttagataag aaacagtttt attctcaaat + 10861 acttcaattt tccagttttt taattttaat ttcttttcta ttatttggtt ttaacttatt + 10921 gattgtgaca gatccaaatg caaaatatat ttataacatg actattatta gtatgatagt + 10981 tacaaattta agaatgttat tcgtttatat tttgcagatg acaaatcgac taaaggatag + 11041 ctctataatt ctgataagtg atcgagttat atatattttt cttttatttc tgtttattat + 11101 atttaaatgg catgaataca aggtaatgat ttgggcggat gttttaggaa ggacattttc + 11161 tctcctactt tctttttgga tttgtaaaga tattgttttt caatccttat ccgagttcat + 11221 attggatctg agagagtctt ttgacaatat ccgggttgga atcaatttaa tgttatccaa + 11281 tattgcaagt agtatgatta ttggtattgt tcgaatggga attcaatgga attggaatat + 11341 cgaaacattc gggaaagtat cactgacgct aagcatctct aatttattaa tgacttttat + 11401 taatgcgatt ggtttagttg tctttccttt gttaaaacgg acaaaaacgg aaaatttatc + 11461 taaaatttat tccaacttaa gaaatgtttt gatgctgatc atgtttgcaa tattgctctt + 11521 ttattatcct ttaaaaatta ttctagatct ttggttgcca gcttatcggg atgcgttgat + 11581 ttttatggct cttatttttc ctatgtcaat ttatgaaggg aagatggcct 
tggtgattaa + 11641 tacatattta aaggcgctaa ggatggaaag agatattctc aaaataaata ctttgattat + 11701 gttgttcagt atgttagtta ccctaataac tactctatta ttaaataatt tagagctaac + 11761 ggttatatct atagttgttt tgctagcttt acgtagtata atagcagaac taattctatc + 11821 taaaaaactt gatatatcag ttgagccaga cattgtgtta gaattactta tgacaattat + 11881 atttatttct tcaagttggt acttaccgat ttggctcgca gtaatagttt atttgttagc + 11941 gtatacttta tacttgtatc taaagcgtaa agatacaaaa atgtatatag aatattttag + 12001 aaagaaaata tttgaataaa aagaactata tatcagttag atggcaaatt ctatttttac + 12061 ctttttgtcg tttaatagaa aatgataaaa aatatgatat tattcttaca catatttata + 12121 agcaatttaa atgtatcagg tgataaatta atttaaaata agaatagttt ctggaacatt + 12181 gctattagtg ggaacaggtt acgaaataat ttatcaattt taaagatgtt tttttaaata + 12241 taaaataatg gattctgtca acaattctaa attctaatag gaaagaaaat gctagaaaat + 12301 cagattgttc atttttcaag gaagtttatt tttaaaataa tatatcttta agtaagaatt + 12361 attttattag acttaaccta gcctatcagt taaattagaa tatcaacttt gattaattaa + 12421 aaattagcaa aatttattga cattttgttt ttataaattg caataaaggt ctaattctga + 12481 atttcagtga atataagaaa gggatcctac taatgaaagg tattattctt gcaggtggtt + 12541 cggggacacg attatatcct ttgactcggg ctgcatcaaa acaacttatg ccggtttatg + 12601 ataaaccgat gatttactat ccactttcaa cattgatgtt ggctgggatt agggatattt + 12661 tgataatctc aactcctcaa gatttgcctc gttttaaaga gcttcttcaa gacggatctg + 12721 agtttgggat taaactttct tatgcagagc aaccaagtcc agatggtttg gcacaagcct + 12781 ttatcattgg ggaagagttt attggtgatg atagtgttgc tttgattttg ggggacaata + 12841 tctatcacgg ccctggtttg agcaaaatgc ttcaaaaagc agccaagaaa gagaaaggtg + 12901 cgactgtttt tggctaccaa gtgaaggatc cagagcgttt tggtgtggtt gagtttgata + 12961 cagacatgaa tgctatctcc atcgaagaaa agccagaata ccctcgttca aactatgcag + 13021 tgacaggact ctatttctat gataatgatg tagtagagat tgccaagagt atcaaaccaa + 13081 gtcctcgcgg agaattagaa atcacagatg tcaacaaggc ttacttggat cgtggagact + 13141 tatccgttga gcttatggga cgtggctttg cttggctgga tactggaact catgaaagtt + 13201 tactagaggc ttcacagtac atcgaaacag tgcaacggat gcaaaatgtt 
caggtagcaa + 13261 acttagaaga aattgcttac cgtatgggct atatcagtcg agaagatgta ttggccttag + 13321 cccaaccact taagaaaaat gaatacggac agtatctgct ccgtttgatt ggagaagcat + 13381 agatgacaga taattttttc ggtaagacgc ttgcggcacg caaggttgaa gctattccag + 13441 gcatgttgga gtttgatatc cccgttcatg gagataatcg tggctggttt aaagaaaatt + 13501 tccaaaagga aaaaatgctt ccacttggat ttccagagtc tttctttgca gaaggaaaat + 13561 tgcaaaacaa tgtatccttc tcacgtaaaa atgtccttcg aggcctccac gcagagcctt + 13621 gggataagta catctctgta gcagatggag ggaaagttct gggttcttgg gttgatctac + 13681 gcgagggtga aacctttggg aatacctatc agacagtgat tgatgcgagt aagggaatct + 13741 ttgttcctcg aggcgtagct aatggcttcc aagttttatc agatacagtg tcatatagct + 13801 atctggtcaa tgattactgg gctcttgaac tcaaacccaa gtattccttt gtgaactacg + 13861 ctgatccaag ccttggtatt gaatgggaaa atattgcaga agcagaggtt tcagaagcag + 13921 ataaaaatca tccactactt aaggatgtaa aacctttgaa aaaagaagat ttgtaataag + 13981 gaaagaatat gactgaatac aaaaatatta tcgtgacagg tggagctggc tttatcggtt + 14041 ctaactttgt ccattatgtt tacgagaact ttccagatgt tcacgtgaca gtcctagata + 14101 agttgactta tgctggaaac cgcgcgaata ttgaggaaat tttaggtaat cgtgttgagt + 14161 tagttgttgg tgacattgct gatgcggagt tggtagacaa gttggctgct caagcagatg + 14221 ctatcgttca ttatgcagcg gaaagccaca atgataattc gctcaatgat ccatcgccat + 14281 ttattcatac taacttcatt ggaacctata ctcttttaga agctgctcgt aagtatgata + 14341 ttcgcttcca ccatgtatcg acagatgaag tttatggaga tctcccttta cgcgaagatt + 14401 tgccaggtca tggagaaggg ccgggtgaga aatttacggc tgaaaccaag tacaatccaa + 14461 gctcgcctta ctcatcaacc aaggcagcct cagatttgat tgtcaaagcc tgggtgcgtt + 14521 cttttggagt caaggcaacg atttccaact gttcaaataa ctacggtcct tatcaacata + 14581 tcgaaaaatt catcccacgt cagattacta acatcctaag tggtatcaag ccaaaacttt + 14641 acggtgaagg taaaaacgtt cgtgactgga ttcataccaa tgaccattct tcaggagttt + 14701 ggacaatctt gacaaaaggg caaatcggtg aaacctactt gattggggct gatggtgaga + 14761 agaacaataa ggaagttttg gaacttatcc ttaaggaaat gggacaagct gcggatgcct + 14821 atgatcatgt gactgaccgt gcaggacatg accttcgcta tgcgattgat 
gctagcaagc + 14881 tccgtgatga gttggggtgg aaacctgaat ttaccaactt tgaagctggg ctcaaggcaa + 14941 caatcaagtg gtatacagat aaccaagaat ggtggaaagc agaaaaagaa gctgttgaag + 15001 ccaattatgc taagactcag gagattatta cagtataaaa agcaggaaat agctgctttt + 15061 tattgctata ttgggaagag ttacatatta gaaaggtcta gagatgattt taattacagg + 15121 ggcaaatggc caattaggaa cggaacttcg ctatttattg gatgaacgta atgaagaata + 15181 cgtggcagta gatgtggcta agatggacat taccaatgaa gaaatggttg agaaagtttt + 15241 tgaagaggtg aaaccgactt tagtctacca ttgtgcagcc tacaccgctg ttgatgcagc + 15301 agaggatgaa ggaaaagagt tggacttcgc catcaatgtg acggggacaa aaaatgtcgc + 15361 aaaagcatct gaaaagcatg gtgcaactct agtttatatt tctacggact atgtctttga + 15421 cggtaagaaa ccagttggac aagagtggga agttgatgac cgaccagatc cacagacaga + 15481 atatggacgc actaagcgta tgggggaaga gttagttgag aagcatgtgt ctaatttcta + 15541 tattatccgt actgcctggg tatttggaaa ttatggcaaa aacttcgttt ttaccatgca + 15601 aaatcttgcg aaaactcata agactttaac agttgtaaat gatcagtacg gtcgtccgac + 15661 ttggactcgt accttggctg agttcatgac ctacctagct gaaaatcgta aggaatttgg + 15721 ttattatcat ttgtcaaatg atgcgacaga agacacaaca tggtatgatt ttgcagttga + 15781 aattttgaaa gatacagatg tcgaagtcaa gccagtagat tccagtcaat ttccagccaa + 15841 agctaaacgt ccgctaaact caacgatgag cctgaccaaa gccaaagcta ctggatttgt + 15901 tattccaact tggcaagatg cattgcaaga attttacaaa caagaagtga gataagtagt + 15961 agaatgattt tctagtctaa taaaagaggc agagaatgaa ctccaaagga gcataagatg + 16021 tacgattatc ttatcgttgg tgccggtctt tttggtgcag tatttgccca tgaatcagcc + 16081 ttaaaaggaa aaaaagtaaa agttattgaa aaacgaaatc atattgcggg taatatctat + 16141 actcgtgaag aggaaggaat tcaagttcat cagtatggtg ctcatatctt tcatacttct + 16201 gataaggaga tctgggatta tgtgaaccag tttgcagagt ttaaccgtta tacaaattct + 16261 cctgttgcaa actataaggg agagatttat aacttacctt ttaatatgaa taccttcaat + 16321 aaactctggg gagttgtgac gccagcagaa gcacaagcta agattgagga acaacgtgct + 16381 attttaaatg gtaaaactcc tgaaaatttg aaagaacagg cgatttctct tgtaggtaca + 16441 gacatctacg aaaaattaat caaagactat acagagaaac agtggggcaa 
accaactact + 16501 gaacttccat cctttattat tcgccgttta ccagtacgtc tgacctatga taacaactat + 16561 tttaacgata cctatcaagg gattccaatt ggtggataca ctcaaatagt tgaaaaatgt + 16621 tggattatga aaatattgat gtagaaacaa atgttgattt ctttgtgaac aaagagcaat + 16681 atctgaaaga ttttcctaag attgtcttta ctggtatgat tgatgaattc tttgactata + 16741 agttgggcga actagagtac cgtagtcttc gttttgaaaa tgagaccttg gatatggaaa + 16801 attaccaagg aaatgcagtt gtgaactata cggatgcaga aaccccatat actcgcatta + 16861 ttgaacacaa acattttgag tttgggagtc aagcaaagac tatcattact aaagaacatt + 16921 ctaaaacatg ggaaaaaggt gatgagcctt attatccagt taataatgat cgtaataatc + 16981 atttgtataa atcgtataaa aaatttgctg atgagcaagg gaatgttatc tttggtggcc + 17041 gcttaggaca ctatcgttat tacgatatgc accaagtaat tggagcagct ttgcagtgcg + 17101 tgagaaatga gttagattaa tactcaatga aaatcaaaga gcaaactagg aagctagcca + 17161 caggttgctc aaaatactgt tttgaggttg cagatggaag ctgacgcggt ttgaagagat + 17221 tttcgaagag tataaacaag taaaactgac taccagttat tatttagaaa tagtattaaa + 17281 aattccttga ctatgtgata tagttgaggg atttttaaat gatattcata ttttttgcaa + 17341 agatgttgtt tgaaaaataa ttttcaaaaa ttctgaaaat tctgttgaca tctttctgaa + 17401 aagagtctat aatggagaga aagttttaaa ggagaaaatg atgaaaagtt caaaactatt + 17461 tgcccttgcg ggcgtgacat tattggcggc gactacttta gctgcatgct ctggatcagg + 17521 ttcaagcact aaaggtgaga agacattctc atacatttat gagacagacc ctgataacct + 17581 caactatttg acaactgcta aagctgcgac agcaaatatt accagtaacg tggttgatgg + 17641 tttgctagaa aatgatcgct acgggaactt tgtgccgtct atggctgagg attggtctgt + 17701 atccaaggat ggattgactt acacttatac tatccgtaag gatgcaaaat ggtatacttc + 17761 tgaaggtgaa gaatacgcgg cagtcaaagc tcaagacttt gtaacaggac taaaatatgc + 17821 tgctgataaa aaatcagatg ctctttacct tgttcaagaa tcaatcaaag ggttggatgc + 17881 ctatgtaaaa ggggaaatca aagatttctc acaagtagga attaaggctc tggatgaaca + 17941 gacagttcag tacactttga acaaaccaga aagcttctgg aattctaaga caacaatggg + 18001 agtaatggct ccagttaatg aagagttttt gaattcaaaa ggggatgatt ttgccaaagc + 18061 tacggatcca agtagtctct tgtataatgg accttatttg ttgaaatcca 
ttgtgaccaa + 18121 atcttctgtt gaatttacga aaaatccgaa ctactgggat aaggacaatg tgcatgttga + 18181 caaagttaaa ttgtcattct gggatggtca agataccagc aaacctgcag aaaactttaa + 18241 agatggtagc cttacagcag ctcgtctcta tccaacaagt gcaagtttcg cagagcttga + 18301 gaagagtatg aaggacaata ttgtctatac tcaacaagac tctattacgt atctagtcgg + 18361 tacaaatatt gaccgtcagt cctataaata cacatctaag accagcgatg aacaaaaggc + 18421 atcgactaaa aaggctctct taaacaagga tttccgtcag gctattgcct ttggttttga + 18481 tcgtacagcc tatgcctctc agttgaatgg acaaactgga gcaagcaaaa tcttacgtaa + 18541 tatctttgtt ccaccaacat ttgttcaagc agatggtaaa aactttggcg atatggtcaa + 18601 agagaaattg gtcacttatg gggatgaatg gaaggatgtt aatcttgcag attctcagga + 18661 tggtctttac aatccagaaa aagccaaggc tgaatttgct aaagctaaat cagccttaca + 18721 agcagaaggt gtgacattcc caattcattt ggatatgcca gtgaccaaac agcaactaca + 18781 aaa +// + diff --git a/public/res/serotype_genbank/serotype_6G.gb b/public/res/serotype_genbank/serotype_6G.gb new file mode 100644 index 0000000..b82bda2 --- /dev/null +++ b/public/res/serotype_genbank/serotype_6G.gb @@ -0,0 +1,561 @@ +LOCUS KC832411 18756 bp DNA linear BCT 09-FEB-2015 +DEFINITION Streptococcus pneumoniae strain MNZ1135 capsular polysaccharide + synthesis gene locus, complete sequence. +ACCESSION KC832411 +VERSION KC832411.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 18756) + AUTHORS Oliver,M.B., van der Linden,M.P.G., Kuntzel,S.A., Saad,J.S. and + Nahm,M.H. + TITLE Discovery of Streptococcus pneumoniae Serotype 6 Variants with + glycosyltransferases Synthesizing Two Differing Repeating Units + JOURNAL J. Biol. Chem. 288 (36), 25976-25985 (2013) + PUBMED 23897812 +REFERENCE 2 (bases 1 to 18756) + AUTHORS Oliver,M.B., van der Linden,M.P.G., Kuntzel,S.A., Saad,J.S. and + Nahm,M.H. 
+ TITLE Direct Submission + JOURNAL Submitted (25-MAR-2013) Microbiology, University of Alabama at + Birmingham, Bevill Building, Room 614, 845 19th Street South, + Birmingham, AL 35294, USA +COMMENT ##Assembly-Data-START## + Sequencing Technology :: Sanger dideoxy sequencing + ##Assembly-Data-END## +FEATURES Location/Qualifiers + source 1..18756 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="MNZ1135" + /serotype="6G" + /db_xref="taxon:1313" + /geo_loc_name="Germany" + /note="6X11; + serogroup: 6" + misc_feature <1..86 + /note="similar to glucan 1,6-alpha-glucosidase; dexB" + misc_feature 245..410 + /note="similar to aliB" + misc_feature 411..933 + /note="similar to transposase; tnp" + misc_feature 1156..15955 + /note="capsular polysaccharide synthesis gene locus" + CDS 1156..2601 + /note="integral membrane regulatory protein Wzg; COG1316 + transcriptional regulator" + /codon_start=1 + /transl_table=11 + /product="wzg" + /protein_id="AHF51343.1" + /translation="MSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VDQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGIDVYNDQ + EFTAHTNGKYYPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAIIKKLTST + EVLKNYSSILQGLQDSLQTNMPIETMIDLVNTQLESGGDYKVNSQDLKGTGRMDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + CDS 2603..3334 + /note="protein-tyrosine phosphatase Wzh; capsular + polysaccharide biosynthesis protein; member of homology + group 1" + /codon_start=1 + /transl_table=11 + /product="wzh" + /protein_id="AHF51344.1" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAEAYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEQDLVYVIASDMHNLDGRPPHMAEAYDLVT + 
QKYGEAKAQELFIDNPRKIVMDQLI" + CDS 3340..4035 + /note="member of homology group 2; capsular polysaccharide + biosynthesis protein Wzd" + /codon_start=1 + /transl_table=11 + /product="wzd" + /protein_id="AHF51345.1" + /translation="MMKEQNTIEIDVFQLFKTLWQRKLMILLVALVTSAGAFAYSTFI + VKPEYTSTTRIYVVNRNQGDKPGLTNQDLQAGTYLVKDYREIILSQDALEKVATNLKL + DMPAKTLASKVQVAVPADTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIELLDTRVKRPEDIEDVLKI + PLLGLVPDFDKMK" + CDS 4045..4734 + /note="COG0489 ATPases involved in chromosome + partitioning; member of homology group 3; capsular + polysaccharide biosynthesis protein Wze; tyrosine-protein + kinase Wze" + /codon_start=1 + /transl_table=11 + /product="wze" + /protein_id="AHF51346.1" + /translation="MPTLEISQAKLDSVKKAEEYYNALCTNLQLSGDGLKVFSITSVK + IGEGKSTTSTNIAWTFARAGYKTLLIDGDIRNSVMLGVFKARDKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRKCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGVVLNKFDTSVDKYGSY + GNYGDYGKNKK" + CDS 4749..6116 + /note="COG2148 sugar transferases involved in + lipopolysaccharide synthesis; undecaprenylphosphate + glucosephosphotransferase WchA (initial sugar + transferase)" + /codon_start=1 + /transl_table=11 + /product="wchA" + /protein_id="AHF51347.1" + /translation="MNGKIVKSSLAIIQSFLVILLTYLLSAVRETEIVSTTAIALYIL + HYFVFYISDYGQDFFKRGYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYF + LTLHALLVYVPNLFIKWYWKRAYPNFKGSKKILLLTATSRVEKVLDRLIESNEVVGEL + VAVSVLDKPDFQHDCLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + IDVTVNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHVIAKRIIDIVGALVGLIL + CGLVSIVLVPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYINGWTIWKDIEILLKTVKVVFM + RDGAK" + CDS 6212..7156 + /note="member of homology group 62; HMMPfam hit to + PF01501, glycosyl transferase family; + alpha-1,3-glycosyltransferase" + /codon_start=1 + /transl_table=11 + /product="WciN" + /protein_id="AHF51348.1" + 
/translation="MNIVYATDNNFVDVLSASIKSLYTTNSDLDLNLWIIANKVSDRN + KEKINRLSKQFAQREINWIENVEIPFKLHLDRGSISSFSRLFLGSVLPSSMSKVLYLD + SDIIVMDSLRSIFDIDFKGKILYGVNDTFNKEYKQVLGIPIDKPMFNTGVMLINLELW + RNNNVEERFLQVIQKFNGTILQGDLGVLNAVLYNSFGVLPPEYNYMTIFEDLTYEEMI + VFKKPINYYSKEEIKNARERIVLRHFTTSFLSKRPWQEGSNVAHIDQFKKYYEGSYKN + VKESILLKIVQKLPKKCSVFLLGIIQSKFRPKLYRILK" + misc_feature 7192..7370 + /note="similar to HG262; member of homology group 262" + CDS 7430..8149 + /note="member of homology group 81; putative ribitol + phophotransferase" + /codon_start=1 + /transl_table=11 + /product="wciO" + /protein_id="AHF51349.1" + /translation="MSIYRICKDIERKTMSPAKKAMAKNDYFAFYVGRPLSYLLTVPF + VKTNITPNQISYLSIIPLIVGFIIMIFTTDFVVLLLAWFLFFLWNLLDGVDGNLARYR + EQYSKDGSVVDAMAGYVAMVLTYFGAGIVAAHLNDSDIYIILGALSGISLIFPRLVMH + KYINTVAQDESVSSIKDKSDFNTIKILALNMTSITGIPQVLLLLTILTNQWVLFTLVY + FTINFLLMIFFLYSLFKKENV" + CDS 8152..9138 + /note="member of homology group 97; putative glycosyl + transferase" + /codon_start=1 + /transl_table=11 + /product="wciP" + /protein_id="AHF51350.1" + /translation="MGKSVAILMTTYNGERYLSQQIDSIRSQTFTNWTLFIRDDGSKD + KTIEVIQRYSKIDDRIRFVENPSKFHGAYYNFFNLIEYVKNNYQFDYYFFCDQDDIWK + EHKLEIQLLRFSKDDMPEMVYSDMSTIDASNNLIDISINKIMGIELPNINNLYFIHAY + IWGCTAGFNHALLEMVPSVDIDKDYLYIEKLSHDNYFAKFALEYGKVLFCPEQLVLYR + RHGHNVTTSHHFKLSPLNVFRKAILGFNELALTHAGVYNQTLYMLKKASGKNPLSDRL + LEIQEVIKIGGLKGVRYFYQNRISRKQLVRTIGLYTIMLFGTYKKYIMKELL" + CDS 9138..10481 + /note="member of homology group 139; oligosaccharide + repeat unit polymerase Wzy" + /codon_start=1 + /transl_table=11 + /product="wzy" + /protein_id="AHF51351.1" + /translation="MLLNFLFISIFLLIIITFILFEGDFFQPAVILTIAYFISIASAL + VNRNVWGTELHFKTFYLILLGVVTFVIVSLLTKLSYRPKVEGISHEELKEINPSKIIY + VILLTLNLVMLFLYIREIQKVVLFSGRSFSNITDLISNYRYLSYYSNEVENRVSGMIN + QLSKIIPATTLISLYIFMNNYFITKQIKKNFIYLIPIAIFFVYAIISGGRLPLIRLVV + GSLLILYIYSVYGSPKSQLTKSFKMITRSLFTFLILIVLFFLLKFVLGRSSQEDFISY + ITRYMGGSIQLFDLFVIDPIRRNKELGAETFSGIYEMLAKLGFDNNIIKGLEWRVSPN + 
YYSLGNVYTAIRRYYSDFGVIGIVICQSFTAWLYTLGYEKVRHYSLVTNVQRFRLILL + AASFYPIFLNGIEDVFYISMVTIGYGIQIVIFYLVFWVLLKVQVDFNKGKLTINR" + CDS 10606..12018 + /note="member of homology group 82; flippase Wzx" + /codon_start=1 + /transl_table=11 + /product="wzx3" + /protein_id="AHF51352.1" + /translation="MKLKFLITNLFHVFLSNLITIVTSVIVVLILPKIMGVTEYSYWQ + LYIFYLTYIGFFHLGWIDGIYLKYGGLEYQNLDKKQFYSQILQFSSFLILISFLLFGF + NLLIVTDPNAKYIYNMTIISMIVTNLRMLFVYILQMTNRLKDSSIILISDRVVYIFLL + FLFIIFKWHEYKVMIWADVLGRTFSLLLSFWICKDIVFQSLSEFILDLRESFDNIRVG + INLMLSNIASSMIIGIVRMGIQWNWNIETFGKVSLTLSISNLLMTFINAIGLVVFPLL + KRTKTENLSKIYSNLRNVLMLIMFAILLFYYPLKIILDLWLPAYRDALIFMALIFPMS + IYEGKMALVINTYLKALRMERDILKINTLIMLFSMLVTLITTLLLNNLELTVISIVVL + LALRSIIAELILSKKLDISVEQDIVLELLMTIIFISSSWYLPIWLAVIVYLLAYTLYL + YLKRKDTKMYIEYFRKKIFE" + CDS 12513..13382 + /note="member of homology group 10; glucose-1-phosphate + thymidylyltransferase RmlA" + /codon_start=1 + /transl_table=11 + /product="rmlA" + /protein_id="AHF51353.1" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIRDILIISTPQDLPRFKELLQDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFIGDDSV + ALILGDNIYHGPGLSKMLQKAAKKEKGATVFGYQVKDPERFGVVEFDTDMNAISIEEK + PEYPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLALAQSLKKN + EYGQYLLRLIGEA" + CDS 13383..13976 + /note="member of homology group 11; + dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase RmlC" + /codon_start=1 + /transl_table=11 + /product="rmlC" + /protein_id="AHF51354.1" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKNHPLLKDVKPLKKEDL" + CDS 13989..15038 + /note="member of homology group 8; dTDP-D-glucose + 4,6-dehydratase RmlB" + /codon_start=1 + /transl_table=11 + /product="rmlB" + /protein_id="AHF51355.1" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPDVHVTVLDKLTYAGN + 
RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAVD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + CDS 15104..15955 + /note="member of homology group 9; dTDP-4-keto-L-rhamnose + reductase RmlD" + /codon_start=1 + /transl_table=11 + /product="rmlD" + /protein_id="AHF51356.1" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITDAEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGRELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 16031..17216 + /note="similar to IS1670 transposase" + misc_feature 17412..>18756 + /note="similar to aliA; ABC-type oligopeptide transport + system, periplasmic component" +ORIGIN + 1 tgtcttgatt gcaaactgcg gctaaagaag tacttgaaaa acgggtcttg gctccatggg + 61 atgctttctg tgtggaatta ctataaatat tttttgcaga aaaatttaaa attgaaatcg + 121 tataaaaaca agggaggact gtataaaagg cagaaatcct ttgtttttta taaccaaggt + 181 ttataaacct tcattctcga aattcaatta actttacaaa ttcccactat taaggagaaa + 241 ggagatgaac ataaagaagc gtatccttag tgcaggcctg acttttacat ctgctttgct + 301 tttagctgct tgcggccaat caggttcaga tacaaaaact tactcatcaa cctttagtgg + 361 aaatccaact acatttaact atctattaga ctattacgct gataatatag tcaattgaaa + 421 caagaacaag acaaaagagc ctcataaaag gtattgcaac ttggtaatac cttttacgag + 481 gctttttgat gtgagcccat gttttctcaa taggattgta ctcaggtgag tagggaggaa + 541 gaaggtaaaa gtttatgccc aaactcttcg cataaaagtt ctagcttccc cagtctatgg + 601 aatcttacat tatccataat aataaccgat ggtgtggtta atgttggtaa gaaaaacttc + 661 tgaaaccaag cttcaaaaaa gtcgctcgtc atcgtctctt cgtaagtcat tggagcgatt + 721 aactcaccat ttgttagacc tgcaaccaaa gaaatcctct gatatcttct tccagatact + 781 ttgcctcttc ttaactgccc tttttaatga gcgaccatat 
tctcgataaa aataagtatc + 841 gaatcctgtt tcgtcaatct aaacaggtgc taggtgcttt aaactattaa aattcttaag + 901 aaataaggct actttttctg ggtcttgttc ataattagat tgaaactaga atagtacacc + 961 tctgcttcta aaacattgtt agaaatcgat ttgactgtcc tgattgattt gtcatgttct + 1021 tatttcattt tactatattt ttgtttcgcg ggaagtctac taagatactt aaagatgcag + 1081 atagtgaaaa aaggtgtaga cattaccgta aaaaagtgat ataattgtat ggtgttcaat + 1141 gtataggtgt taatcatgag tagacgtttt aaaaaatcag gttcacagaa agtgaagcga + 1201 agtgttaata tagttttgtt gactatttat ttattgttag tttgtttttt attgttctta + 1261 atctttaagt acaatatcct tgcttttaga tatcttaatc tagtggtaac tgcgttagtc + 1321 ctactagttg ccttggtagg gctactcctg attatctata aaaaagctga aaaatttact + 1381 atttttctgt tggtgttctc tatccttgtc agctctgtgt cgctctttgc agtacagcag + 1441 tttgttggac tgaccaatcg tttaaatgcg acttctaatt actcagaata ttcaatcagt + 1501 gtcgctgttt tagcagatag tgagatcgaa aatgttacgc aactgacgag tgtgacagca + 1561 ccgactggga ctgataatga aaatattcaa aaactactag ctgatatcaa gtcaagtcag + 1621 aataccgatt tgacggtcga ccagagttcg tcttacttgg cagcttacaa gagtttgatt + 1681 gcaggggaga ctaaggccat tgtcttaaat agtgtctttg aaaatatcat cgagtcagag + 1741 tatccagact atgcatcgaa gataaaaaag atttatacca agggattcac taaaaaagta + 1801 gaagctccta agacgtctaa gaatcagtct ttcaatatct atgttagtgg aattgacacc + 1861 tatggtccta ttagttcggt gtcgcgatca gatgtcaata tcctgatgac tgtcaatcga + 1921 gataccaaga aaatcctctt gaccacaaca ccacgtgatg cctatgtacc aatcgcagat + 1981 ggtggaaata atcaaaaaga taaattaacc catgcgggca tttatggagt tgattcgtcc + 2041 attcacacct tagaaaatct ctatggagtg gatatcaatt actatgtgcg attgaacttc + 2101 acttcgtttt tgaaattgat tgatttgttg ggtggaattg atgtttataa tgatcaagaa + 2161 tttactgccc atacgaatgg aaagtattac cctgtaggca atgttcatct tgattcagaa + 2221 caggctctcg gttttgttcg tgagcgctac tcactagcag atggcgatcg tgaccgtggt + 2281 cgcaaccaac aaaaggtcat tgtagcaatt attaagaagt taacttctac agaggttttg + 2341 aaaaactata gtagtattct tcaaggattg caggattctc ttcaaacaaa tatgccgatt + 2401 gagactatga tagatttagt gaatactcag ttggaaagtg ggggggatta taaagtaaat + 2461 
tctcaagatt taaaagggac aggtcggatg gatcttcctt cttatgcaat gccagacagt + 2521 aacctctatg tgatggaaat agatgatagt agtttagctg tagttaaagc agctatacag + 2581 gatgtgatgg agggtagatg aaatgataga catccattcg catatcgttt ttgatgtaga + 2641 tgacggtccc aagtcaagag aggaaagcaa ggctctcttg gcagaagcct acagacaggg + 2701 ggtgcgaacc attgtctcta cctctcaccg tcgcaagggc atgtttgaaa ctccggaaga + 2761 gaagatagca gaaaactttc ttcaggttcg ggaaatagct aaggaagtgg cgagtgactt + 2821 agtcattgct tacggggctg aaatttacta cacaccagat gttctggata agctggaaaa + 2881 aaagcggatt ccgaccctca atgatagtcg ttatgccttg atagagttta gtatgaacac + 2941 tccttatcgc gatattcata gcgccttgag caagatcttg atgttgggaa ttactccagt + 3001 cattgcccac attgagcgct atgatgctct tgaaaataat gaaaaacgcg ttcgagaact + 3061 aatcgatatg ggctgttaca cgcaagtaaa tagttcacat gtcctcaaac ccaaactttt + 3121 tggcgaacgt tataaattca tgaaaaaaag agctcagtat tttttagagc aggatttggt + 3181 ttatgtcatt gcaagtgata tgcacaatct agacggtaga cctcctcata tggcagaagc + 3241 atatgacctt gttacccaaa aatacggaga agcgaaggct caggaacttt ttatagacaa + 3301 tcctcgaaaa attgtaatgg atcaactaat ttaggagaaa tgatgaaaga acaaaacacg + 3361 atagaaatcg atgtatttca attatttaaa accttgtggc aacgcaagct aatgatttta + 3421 ttagtggcac ttgtgacaag tgcgggggct tttgcatata gcacttttat tgttaagcca + 3481 gaatatacga gtaccacgcg aatttacgta gtgaatcgca atcaaggaga caagccgggg + 3541 ctgacaaatc aggatttgca ggcaggaact tatctggtaa aagactaccg tgagattatc + 3601 ctttcgcagg atgcattgga aaaagtagcg acaaatttga agttggatat gccagcaaaa + 3661 acgttagcca gcaaagttca agtggctgta ccagctgaca ctcgtatcgt ctcaatctct + 3721 gtcaaggata aacagccaga ggaagccagt cgtatcgcta attctctacg agaagttgct + 3781 gcagaaaaga tcgtcgctgt aacgcgagta tctgatgtaa cgacacttga agaagcgcga + 3841 ccagctacga ctccctcttc tccaaatgtt cgacgcaatt ccttgtttgg ttttcttgga + 3901 ggagcagtcg taacagtaat tgctgttctt ttgattgagt tgctcgacac ccgtgtgaaa + 3961 cgtcctgaag atattgaaga tgtactgaaa attccacttt tagggctcgt tccagatttt + 4021 gacaaaatga aataggagga agttatgcca acattagaaa tctcacaggc aaaattggat + 4081 tctgtaaaaa aggcagagga 
atattataac gctttgtgca cgaacctaca gttaagtgga + 4141 gatggtttga aagtattttc tatcacttct gtgaaaatag gagaaggaaa atcaacgact + 4201 tccaccaata tcgcttggac ttttgcgcgt gcaggttaca aaacgttgct gattgatgga + 4261 gatattcgca attctgttat gttaggtgtc tttaaagcaa gggataagat tacaggcctg + 4321 acagaatttt tatcaggaac tacagaccta tcacaagggc tttgtgatac caatatcgaa + 4381 aatctctttg taattcaggc tggctctgtg tcaccgaatc cgacagctct tcttcaaagt + 4441 aagaatttca gtacaatgct tgaaaccttg cgtaaatatt ttgactacat cattgtagat + 4501 actgctcctg tcggtgtcgt gattgatgcg gctattatta cgcgaaaatg cgatgcttct + 4561 attttagtga cggaggcagg tgaaataaat cgacgggata ttcaaaaagc aaaagaacag + 4621 ttggaacaca cagggaagcc gtttttggga gttgtgttga ataaattcga tacttcagta + 4681 gacaaatacg gttcttatgg aaattatgga gattacggga aaaataaaaa ataggtcggg + 4741 ggatagagat gaatggaaaa atagtaaagt cttcattggc cataatccag agctttcttg + 4801 ttattttatt gacttatcta cttagtgctg tgagagaaac ggagattgtt tcaacaacag + 4861 ctattgcact ttatatcctc cattattttg tcttttatat cagtgattat ggacaggatt + 4921 tctttaaaag gggatatttg attgaacttg tccagacatt gaaatatatc ctattctttg + 4981 cactagcgat tagtatttct aattttttct tagaggatcg atttagtatt tccagacgag + 5041 gcatgattta cttcctcaca ttacatgctc tcttagtcta tgtgccaaac ctatttatca + 5101 agtggtattg gaagcgggct tatcccaact ttaaaggaag taagaagatt ctcctactta + 5161 cagcaacttc tcgtgtcgaa aaggtactgg atagattaat agaatcaaat gaggttgttg + 5221 gggagttggt agccgtcagt gtcttagata aaccagattt tcagcatgat tgtttaaagg + 5281 tagtagcaga gggggagata gtaaactttg cgactcatga ggtggtcgat gaagtcttta + 5341 tcaatcttcc aagtgaaaaa tacaatattg gagagcttgt ctctcagttt gaaacgatgg + 5401 gaattgatgt aacagtcaat ctaaatgctt ttgatcgtag tttggcacgt aacaagcaaa + 5461 ttcgtgagat ggcaggatta aacgttgtga ctttttctac aacattttat aagactagtc + 5521 atgtaattgc taagcggatt attgatatcg tgggtgcatt ggtagggctg atactatgtg + 5581 gtttagtcag tattgtactg gttcctttga ttcgaaagga tgggggctct gctatttttg + 5641 ctcagacgcg tataggaaaa aatggtcgtc agttcacttt ttataagttt cgctctatgt + 5701 gtgtagatgc cgaggcgaaa aaaagagaac tcatggaaca 
aaataccatg cagggtggaa + 5761 tgtttaaggt ggacgatgat cctcgtatca cgaaaattgg tcgttttata cggaagacta + 5821 gcttggacga gctaccacag ttttacaatg ttctaaaggg agatatgagc ttggtaggta + 5881 cacgaccacc aacagtggac gagtatgagc actatacccc agaacaaaaa cgccgactaa + 5941 gttttaaacc tggcataaca ggtttatggc aggtcagcgg acgaagtgaa atcaagaatt + 6001 tcgatgaagt tgtcaaatta gatgtggcct atattaatgg ttggacaatc tggaaagata + 6061 ttgaaatttt attgaaaacg gttaaagttg tatttatgag agatggagcg aaatagtttg + 6121 gttgtgtagg atatttgtag aggtaaaagt ttcgaatata tctcactcaa tcttttttat + 6181 aagtgaaaat aaatttagaa gtaggaattt tatgaatata gtttatgcca cagataataa + 6241 ttttgtagat gtattgagtg cttccatcaa atcactttac actactaatt cagatttgga + 6301 tttaaattta tggattattg ctaataaagt ttcggataga aataaagaaa agataaatag + 6361 attatcaaaa caatttgcgc agagagaaat taattggata gagaacgttg agatcccatt + 6421 taaattacat ttagataggg gatcaattag ttcatttagc agattatttc tgggaagtgt + 6481 tcttccatct tcaatgagta aagttcttta tcttgacagt gatattattg ttatggattc + 6541 tttacgaagt atttttgata ttgattttaa gggtaaaatt ctctatgggg tgaatgatac + 6601 ttttaataaa gaatacaagc aggtgttggg tataccaatt gacaagccaa tgtttaatac + 6661 tggagttatg cttattaatt tagagttatg gagaaataat aacgtcgaag aaagattttt + 6721 gcaagtaatt caaaagttta atggtactat attacaagga gatttagggg ttttaaatgc + 6781 agttttatat aactcatttg gtgtacttcc tccagaatat aattatatga ccatatttga + 6841 agatttgact tatgaagaaa tgatagtttt taaaaaacca attaattatt attcaaaaga + 6901 ggaaattaaa aatgccagag aacgtatagt cttacgacat ttcacaacta gttttttatc + 6961 aaaaagacct tggcaagaag gcagtaatgt tgcacatata gaccaattta aaaaatacta + 7021 tgaaggtagt tataaaaatg ttaaagaatc tattttacta aaaatagttc aaaaattacc + 7081 caaaaaatgt tcagtttttt tattaggaat tattcaatca aaatttagac ctaaattgta + 7141 tagaattttg aaataaggtg gatagtatta atgacaaaaa agaaagaatt ttattgaaaa + 7201 ttcaagaaga attgaaatta ttaaaagagt ttataaaaat atgttctaaa aataaaatta + 7261 agtattttgc tcttggaggt agtctattag gagctgtaag acacaaaggt ttcattcctt + 7321 gggatgatga tatggatcta agctttccaa agagttcaat ctatgtttga aataaaggaa + 7381 
aaagtgttag aattagagaa tgtattaatg agtttaggag aaagtataga tgtcaatata + 7441 tagaatctgt aaagatattg aaagaaaaac tatgtcgcct gctaaaaaag caatggctaa + 7501 aaacgactat tttgcatttt atgttggaag acctttatcc tatcttttaa cagttccttt + 7561 cgtgaaaaca aatattactc ccaatcaaat atcttattta tctataattc ctttgattgt + 7621 tggatttata ataatgatat ttacaactga tttcgttgta ttattactgg catggtttct + 7681 atttttttta tggaacttac tagatggagt agatgggaac ttagccagat atcgggagca + 7741 atactcgaag gatggaagtg tagtagatgc aatggctggc tatgtagcca tggtgttgac + 7801 gtatttcggt gcaggaatag tagctgctca tttaaacgac tcagatatct atataatttt + 7861 gggtgcatta tctgggattt cattgatttt tccaaggtta gtgatgcata agtatatcaa + 7921 tacagtagct caagatgagt ctgtgagtag cattaaagat aaatctgatt ttaatactat + 7981 aaaaatactg gctctaaaca tgacatcaat tacaggaatt ccgcaggttt tactgctatt + 8041 aactatttta acaaatcagt gggtactttt tactttagta tattttacga ttaatttttt + 8101 attaatgata tttttcttgt attcattatt caaaaaggag aatgtttaga aatgggaaag + 8161 tcagttgcaa ttttaatgac cacctataat ggtgagcgat atttgtcaca acagattgat + 8221 agtattaggt ctcaaacatt cactaattgg acgcttttta ttagggatga tggatcaaaa + 8281 gataaaacaa tagaagtaat acagaggtat tctaagatag atgatagaat tagattcgtt + 8341 gaaaatccct caaagtttca tggagcttat tacaattttt ttaatctaat tgaatacgtt + 8401 aaaaacaatt atcaatttga ttattacttt ttttgtgatc aagatgatat ttggaaagag + 8461 cacaagttag aaatacagct gttaagattt tctaaagatg acatgccaga gatggtttac + 8521 tctgatatgt caacgattga tgccagtaat aatttgatag atattagtat aaataaaata + 8581 atggggattg aattaccgaa cataaataat ttgtatttta ttcatgccta tatctggggg + 8641 tgtactgcag gttttaatca tgcattgcta gagatggttc cttcagttga tattgataaa + 8701 gattatttat atatagaaaa actgtctcat gataattatt ttgcaaagtt tgcactagag + 8761 tatgggaagg tgttgttctg ccctgagcaa ctggtcttgt atcgaagaca tggacataat + 8821 gtaacaacta gtcatcattt taaattatct ccgctaaatg ttttcagaaa ggctatattg + 8881 ggtttcaatg aattggcact tacacatgct ggggtatata atcaaactct ttatatgcta + 8941 aaaaaagctt ctggaaaaaa tcctttaagt gatagactac ttgaaattca ggaagtaatc + 9001 aaaattggag gattaaaagg 
tgtgagatat ttctatcaga atcgaatttc tcgaaagcaa + 9061 ctcgtaagaa caatcggctt atataccatc atgctttttg ggacctataa aaaatatatt + 9121 atgaaagaac tcttataatg cttttaaatt tcttattcat atctattttt ctattaatta + 9181 ttattacatt tatattattt gagggggatt tttttcaacc tgcagtaatt ttaacaatcg + 9241 cttattttat ttcgattgca agtgctctag ttaatagaaa tgtttgggga acagaactcc + 9301 atttcaaaac cttttatttg atattgttag gggttgttac atttgttata gtttccttgt + 9361 tgacaaaatt gtcgtacagg cctaaagtgg agggaatttc gcatgaagaa ttgaaagaaa + 9421 taaatccttc aaagataatc tatgtcattc ttctgactct aaatcttgtt atgttatttc + 9481 tttatatccg tgaaattcag aaagtagtat tgttttcagg tagaagtttt tctaatatta + 9541 cagatttgat aagtaactat aggtacctat cttattattc aaatgaagta gaaaatcgtg + 9601 taagtggaat gattaatcaa ctatctaaaa ttattccagc gactacactt atttctttat + 9661 atatatttat gaataattat tttataacta aacaaataaa gaaaaatttc atttatttga + 9721 ttccaatagc tatattcttt gtctatgcaa tcattagtgg tggtagattg ccccttataa + 9781 ggttagttgt tggatctctg ttgatattgt atatatactc tgtgtacggg agtcctaaat + 9841 ctcaacttac caaaagtttt aaaatgatca ctcgctctct gtttacattt cttattttga + 9901 tagttttatt ctttctttta aaatttgtat tagggcgctc ctctcaggaa gattttatca + 9961 gttacatcac tcgttatatg ggaggttcaa ttcaactatt tgatttattt gttatagatc + 10021 cgatacgacg taacaaagaa ctaggtgcag aaactttttc gggaatttat gagatgcttg + 10081 caaaattagg atttgacaat aatattataa aaggcttaga atggagagtg tctcctaatt + 10141 attattcttt agggaatgtg tatactgcaa ttagacgtta ttattcagac tttggtgtaa + 10201 ttggtattgt aatttgtcag agttttacag cgtggttata tactttaggt tatgaaaaag + 10261 ttagacatta ttctttagtt acaaatgttc aaagatttag gttgatccta ttagcagctt + 10321 cattttatcc aatattttta aatggtatcg aggatgtgtt ttatatttca atggttacca + 10381 ttggatatgg aatacaaatt gttatctttt atctggtctt ttgggttctt ctgaaagttc + 10441 aggttgactt taacaaaggt aaattaacga taaatagatg aatttagcgc taatgtattg + 10501 agtcatataa agggatatat ttggtaggta ttttaattgg aggaagagag tcttgaatgg + 10561 gaagtacaaa tcttctgaaa taatttttag gtggggagta tagctatgaa attgaagttt + 10621 cttataacaa atttgtttca tgtctttttg 
tctaatctga ttacaattgt cacatcggtt + 10681 atagttgtac taatcttacc aaaaattatg ggagtaactg agtatagtta ttggcaacta + 10741 tatatttttt acctaacata tattggtttt tttcatctgg gttggattga tggaatttat + 10801 cttaaatatg gtggattaga gtaccagaat ttagataaga aacagtttta ttctcaaata + 10861 cttcaatttt ccagtttttt aattttaatt tcttttctat tatttggttt taacttattg + 10921 attgtgacag atccaaatgc aaaatatatt tataacatga ctattattag tatgatagtt + 10981 acaaatttaa gaatgttatt cgtttatatt ttgcagatga caaatcgatt aaaggatagc + 11041 tctataattc tgataagtga tcgcgttgta tatatttttc ttttatttct gtttattata + 11101 tttaaatggc atgaatacaa ggtaatgatt tgggcggatg ttttaggaag gacattttct + 11161 ctcctacttt ctttttggat ttgtaaagat attgtttttc aatccttatc cgagttcata + 11221 ttggatctga gagaatcttt tgacaatatc cgtgttggaa tcaatttaat gttatccaat + 11281 attgcaagta gtatgattat tggtattgtt cgaatgggaa ttcaatggaa ttggaatatc + 11341 gaaacattcg ggaaagtatc actgacgcta agcatctcta atttattaat gacttttatt + 11401 aatgcgattg gtttagttgt ctttcctttg ttaaaacgga caaaaacgga aaatttatct + 11461 aaaatttatt ccaacttaag aaatgttttg atgctgatca tgtttgcaat attactcttt + 11521 tattatcctt taaaaattat tctagatctt tggttgccag cttatcggga tgcgttgatt + 11581 tttatggctc ttatttttcc tatgtcaatt tatgaaggga agatggcctt ggtgattaat + 11641 acatatttaa aggcgctaag gatggaaaga gatattctca aaataaatac tttgattatg + 11701 ttgttcagta tgttagttac cctaataact actctattat taaataattt agagctaacg + 11761 gttatatcta tagttgtttt gctagcttta cgtagtataa tagcagaact aattctatct + 11821 aaaaaacttg atatatcagt tgagcaagac attgtgttag aattacttat gacaattata + 11881 tttatttctt caagttggta cttaccgatt tggctcgcag taatagttta tttgttagcg + 11941 tatactttat acttgtatct aaagcgtaaa gatacaaaaa tgtatataga atattttaga + 12001 aagaaaatat ttgaataaaa agaactatat atcagttaga tggcaaattc tatttttacc + 12061 tttttgtcgt ttaatagaaa atgataaaaa atatgatact attttttaca catatttata + 12121 agcgatttga atgtatcagg tgataaatta atttaaaata agaatagttt ctggaacatt + 12181 gctattagtg ggaacaggtt acgaaataat ttatcaattt taaagacgtt tttttaaata + 12241 taaaataatg gattttgtca acaattctaa 
attctaatag gaatgataat gctagaaaat + 12301 cagattgttc atttttcaag gaagtttatt tttaaaataa tatatcttta agtaagaatt + 12361 attttattag acttaaccta gcctatcagt taaattagaa tatcaacttt gattaattaa + 12421 aaattagcaa aatttattga cattttgttt ttataaattg caataaaggt ctaattctga + 12481 atttcagtga atataagaaa gggatcctac taatgaaagg tattattctt gcaggtggtt + 12541 cggggacacg attatatcct ttgactcggg ctgcatcaaa acaacttatg ccggtttatg + 12601 ataaaccgat gatttactat ccactttcaa cattgatgtt ggctgggatt agggatattt + 12661 tgataatctc aactcctcaa gatttgcctc gttttaaaga gcttcttcaa gacggatctg + 12721 agtttgggat taaactttct tatgcagagc aaccaagtcc agatggtttg gcacaagcct + 12781 ttatcattgg ggaagagttt attggtgatg atagtgttgc tttgattttg ggggacaata + 12841 tctatcacgg ccctggtttg agcaaaatgc ttcaaaaagc agccaagaaa gagaaaggtg + 12901 cgactgtttt tggctaccaa gtgaaggatc cagagcgttt tggtgtggtt gagtttgata + 12961 cagacatgaa tgctatctcc atcgaagaaa agccagaata ccctcgttca aactatgcag + 13021 tgacaggact ctatttctat gataatgatg tagtagagat tgccaagagt atcaaaccaa + 13081 gtcctcgcgg agaattagaa atcacagatg tcaacaaggc ttacttggat cgtggagact + 13141 tatccgttga gcttatggga cgtggctttg cttggctgga tactggaact catgaaagtt + 13201 tactagaggc ttcgcagtac atcgaaacag tccaacggat gcaaaatgtt caggtagcaa + 13261 acttagaaga aattgcttac cgtatgggct atatcagtcg agaagatgta ttggccttag + 13321 cccaatcact taagaaaaat gaatacggac agtatctgct ccgtttgatt ggagaagcat + 13381 agatgacaga taattttttc ggtaagacgc ttgcggcacg caaggttgaa gctattccag + 13441 gcatgttgga gtttgatatc cccgttcatg gagataatcg tggctggttt aaagaaaatt + 13501 tccaaaagga aaaaatgctt ccacttggat ttccagagtc tttctttgca gaaggaaaat + 13561 tgcaaaacaa tgtatccttc tcacgtaaaa atgtccttcg aggcctccac gcagagcctt + 13621 gggataagta catctctgta gcagatggag ggaaagttct gggttcttgg gttgatctac + 13681 gcgagggtga aacctttggg aatacctatc agacagtgat tgatgcgagt aagggaatct + 13741 ttgttcctcg aggcgtagct aatggcttcc aagttttatc agatacagtg tcatatagct + 13801 atctggtcaa tgattactgg gctcttgaac tcaaacccaa gtatgccttt gtgaactacg + 13861 ctgatccaag ccttggtatt gaatgggaaa 
atattgcaga agcagaggtt tcagaagcag + 13921 ataaaaatca tccactactt aaggatgtaa aacctttgaa aaaagaagat ttgtaaaaag + 13981 gaaagaatat gactgaatac aaaaatatta tcgtgacagg tggagctggc tttatcggtt + 14041 ctaactttgt ccattatgtt tacgagaact ttccagatgt tcatgtgaca gtcctagata + 14101 agttgactta tgctggaaac cgcgcgaata ttgaggaaat tttaggtaat cgtgttgagt + 14161 tagttgttgg tgacattgct gatgcggagt tggtagacaa gttggctgct caagcagatg + 14221 ctatcgttca ttatgcagcg gaaagccaca atgataattc gctcaatgat ccatcgccat + 14281 ttattcatac taacttcatc ggaacctata ctcttttaga agctgctcgt aagtatgata + 14341 ttcgcttcca ccatgtatcg acagatgaag tttatgggga tctcccttta cgcgaagatt + 14401 tgccaggtca tggtgaagga ccaggtgaga aatttactgc tgaaacaaaa tacaacccaa + 14461 gctctccgta ctcatcaacc aaggcagcct cagatttgat tgtcaaagcc tgggtgcgtt + 14521 cttttggagt caaggcaacg atttccaact gttcaaataa ctacggtcct tatcaacata + 14581 tcgaaaaatt catcccacgt cagattacta acatcctaag tggaattaag ccaaaacttt + 14641 acggtgaagg taagaatgtt cgtgactgga ttcataccaa tgaccattct tcaggagttt + 14701 ggacaatctt gacaaaaggg caaatcggtg aaacctactt gattggggct gatggtgaga + 14761 agaacaataa ggaagttttg gaacttatcc ttaaggaaat gggacaagct gtggatgcct + 14821 atgatcatgt gactgaccgt gcaggacatg accttcgcta tgcgattgat gctagcaagc + 14881 tccgtgatga gttggggtgg aaacctgaat ttaccaactt tgaagctggg ctcaaggcaa + 14941 caatcaagtg gtatacagat aaccaagaat ggtggaaagc agaaaaagaa gctgttgaag + 15001 ccaattatgc taagactcag gagattatta cagtataaaa agcaggaaat agctgctttt + 15061 tattgctata ttgggaagag ttacatatta gaaaggtcta gagatgattt taattacagg + 15121 ggcaaatggc caattaggaa cggaacttcg ctatttattg gatgaacgta atgaagaata + 15181 cgtggcagta gatgtggctg agatggacat taccgatgca gaaatggttg agaaagtttt + 15241 tgaagaggtg aaaccgactt tagtctacca ctgtgcagcc tacaccgctg ttgatgcagc + 15301 agaggatgaa ggaagagagt tggacttcgc catcaatgtg acggggacaa aaaatgtcgc + 15361 aaaagcatct gaaaagcatg gtgcaactct agtttatatt tctacggact atgtctttga + 15421 tggtaagaaa ccagttggac aagagtggga agttgatgac cgaccagatc cacagacaga + 15481 atatggccgt actaagcgta tgggggaaga 
gttagttgag aagcatgtgt ctaatttcta + 15541 tattatccgt actgcctggg tatttggaaa ttatggcaaa aacttcgttt ttaccatgca + 15601 aaatcttgcg aaaactcata agactttaac agttgtaaat gaccagtacg gtcgtccgac + 15661 ttggactcgt accttggctg agttcatgac ctacctagct gaaaatcgta aggaatttgg + 15721 ttattatcat ttgtcaaatg atgcgacaga agacacaaca tggtatgatt ttgcagttga + 15781 aattttgaaa gatacagatg tcgaagtcaa gccagtagat tccagtcaat ttccagccaa + 15841 agctaaacgt ccgctaaact caacgatgag cctggccaaa gccaaagcta ctggatttgt + 15901 tattccaact tggcaagatg cattgcaaga attttacaaa caagaagtga gataagtggt + 15961 agaatgattt tctagtctaa taaaagaggc agagaatgaa ctccaaagga gcttaagatg + 16021 tacgattatc ttgttgttgg tgctggtctc tttggcgcat agctttggct cagtttctat + 16081 tatcgctcac accatccatc agaagtttaa tctgaaggta cccaattatc gccaagaaga + 16141 agattgggct aggatgggtt taccaatcac acgtaaggaa atctctaatt ggcatatcaa + 16201 ggcaagtcaa tactatttag agtcccttta taacctttta cgagaaaagt tgttagaaca + 16261 acctcttctt catgcggatg agacctctta tcgggtgcta gagagtgata gccatctgac + 16321 ctactattgg acctttttgt ctgggaaagc tgagaatcaa gcaatcacgc tgtaccatca + 16381 tgatcagcgt cggagtggtt tagtagtaca agaattccta ggagattatt ctggctatgt + 16441 gcattgtgat atgttgcggc agtaacttag gactttagtc ctctagttct gcctatgcga + 16501 tagcagtcca aggtttagaa gcaaggcgac gctaagcttg gtaaactgcg aaccgctaga + 16561 agcttatcgt caactggaag aagctgaact tgttggatgt tgggcacatg tgagaaggaa + 16621 gttttttgaa gcgaccccca agcaagcaga taaatcatcc ttaggagcta aaggtttagc + 16681 ttattgtgat cagttatttt ccctggaaag agactgggag gctttgccag ctgatgaacg + 16741 actacagaaa cgtcaagaac atctccagcc cttaatggaa gacttctttg cttagtgccg + 16801 gcgtcagtca gttttagcag gttcaaaact aggaagggca attgaataca gcctcaagta + 16861 tgaagaaacc tttaagacta ttttgaaaga cggacatctg gtcctttcca ataatctagc + 16921 tgaacgcgcc attaaatcat tggttatggg acggagtaaa agagttcagt ggactctttt + 16981 agcctaagct aaattttaaa aagcgagggt ggttattttc tcaaagtttt gaaggagcta + 17041 aagcaacagc tattattatg agtttgttgg aaacagctaa acgtcatcaa ttaaatagcg + 17101 agaaatatct attctatctt ctagaatgtc 
ttccaaacga ggaaactctc gtaaacaaag + 17161 aggttttaga ggcttattta ccatggacta aagttgtaca agaaaagtgc aaataagaaa + 17221 tctccagatt aggaactatc cgtgagttct ctagtctgga gatttttcaa tatacttcgt + 17281 tattggacgg ttacgatatt catatttttt gcaaagatgt tgtttgaaaa ataattttca + 17341 aaaattctga aaattctgtt gacatctttc tgaaaagagt ctataatgga gagaaagttt + 17401 taaaggagaa aatgatgaaa agttcaaaac tatttgccct tgcgggcgtg acattattgg + 17461 cggcgactac tttagctgca tgctctggat caggttcaag cactaaaggt gagaagacat + 17521 tctcatacat ttatgagaca gaccctgata acctcaacta tttgacaact gctaaggctg + 17581 cgacagcaaa tattaccagt aacgtggttg atggtttgct agaaaatgat cgctacggga + 17641 actttgtgcc gtctatggct gaggattggt ctgtatccaa ggatggattg acttacactt + 17701 atactatccg taaggatgca aaatggtata cttctgaagg tgaagaatac gcggcagtca + 17761 aagctcaaga ctttgtaaca ggactaaaat atgctgctga taaaaaatca gatgctcttt + 17821 accttgttca agaatcaatc aaagggttgg atgcctatgt aaaaggggaa atcaaagatt + 17881 tctcacaagt aggaattaag gctctggatg atcagacagt tcagtacact ttgaacaaac + 17941 cagaaagctt ctggaattct aagacaacca tgggtgtgct tgcgccagtt aatgaagagt + 18001 ttttgaattc aaaaggggat gattttgcca aagctacgga tccaagtagt ctcttgtata + 18061 acggtcctta tttgttgaaa tccattgtga ccaaatcctc tgttgaattt gcgaaaaatc + 18121 cgaactactg ggataaggac aatgtgcata ttgacaaagt taaattgtca ttctgggatg + 18181 gtcaagatac cagcaaacct gcagaaaact ttaaagatgg tagccttaca gcagctcgtc + 18241 tctatccaac aagtgcaagt ttcgcagagc ttgagaagag tattaaggac aatattgtct + 18301 atactcaaca agactctatt acgtatctag ttggtacaaa tattgaccgt cagtcctata + 18361 aatacacatc taagaccagc gacgaacaaa aggcatcgac taaaaaggct ctcttaaaca + 18421 aggatttccg tcaggctatt gcctttggtt ttgatcgtac agcctatgcc tctcagttga + 18481 atggacaaac tggagcaagc aaaatcttac gtaatatctt tgttccacca acatttgttc + 18541 aagcagacgg taaaaacttt ggcgatatgg tcaaagagaa attggttact tatggggatg + 18601 aatggaagga tgttaatctt gcagattctc aggatggtct ttacaatcca gaaaaagcca + 18661 aggctgaatt tgctaaagct aaatcagcct tacaagcaga aggtgtgaca ttcccaattc + 18721 atttggatat gccagtgacc aaacagcaac 
acaaat +// + diff --git a/public/res/serotype_genbank/serotype_6H.gb b/public/res/serotype_genbank/serotype_6H.gb new file mode 100644 index 0000000..7ee7a37 --- /dev/null +++ b/public/res/serotype_genbank/serotype_6H.gb @@ -0,0 +1,156 @@ +LOCUS KF597302 3441 bp DNA linear BCT 10-SEP-2015 +DEFINITION Streptococcus pneumoniae strain MBO190 cps gene locus, partial + sequence. +ACCESSION KF597302 +VERSION KF597302.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 3441) + AUTHORS Park,I.H., Geno,K.A., Yu,J., Oliver,M.B., Kim,K.H. and Nahm,M.H. + TITLE Genetic, biochemical, and serological characterization of a new + pneumococcal serotype, 6H, and generation of a pneumococcal strain + producing three different capsular repeat units + JOURNAL Clin. Vaccine Immunol. 22 (3), 313-318 (2015) + PUBMED 25589550 +REFERENCE 2 (bases 1 to 3441) + AUTHORS Oliver,M.B. 
+ TITLE Direct Submission + JOURNAL Submitted (29-AUG-2013) Microbiology, University of Alabama at + Birmingham, Bevill Building, Room 614, 845 19th Street South, + Birmingham, AL 35294, USA +COMMENT ##Assembly-Data-START## + Sequencing Technology :: Sanger dideoxy sequencing + ##Assembly-Data-END## +FEATURES Location/Qualifiers + source 1..3441 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="MBO190" + /serotype="6Z" + /db_xref="taxon:1313" + /geo_loc_name="USA" + /note="serogroup: 6" + misc_feature <1..>3441 + /note="cps gene locus" + CDS <1..264 + /note="undecaprenylphosphate glucosephosphotransferase + WchA; COG2148 sugar transferases involved in + lipopolysaccharide synthesis" + /codon_start=1 + /transl_table=11 + /product="WchA" + /protein_id="AHB32907.1" + /translation="VLGRMSLVGTRPPTVDEYEHYTPEQKRRLSFKPGITGLWQVSGR + SEIKNFDEVVKLDVAYINGWTIWKDIEILLKTVKVVFMRDGAK" + CDS 360..1304 + /note="alpha-1,3-glycosyltransferase; member of homology + group 62; HMMPfam hit to PF01501, glycosyl transferase + family" + /codon_start=1 + /transl_table=11 + /product="WciN" + /protein_id="AHB32908.1" + /translation="MNIVYATDNNFVDVLSASIKSLYTTNSDLDLNLWIIANKVSDRN + KEKINRLSKQFAQREINWIENVEIPFKLHLDRGSISSFSRLFLGSVLPSSMSKVLYLD + SDIIVMDSLRSIFDIDFKGKILYGVNDTFNKEYKQVLGIPIDKPMFNTGVMLINLELW + RNNNVEERFLQVIQKFNGTILQGDLGVLNAVLYNSFGVLPPEYNYMTIFEDLTYEEMI + VFKKPINYYSKEEIKNARERIVLRHFTTSFLSKRPWQEGSNVAHIDQFKKYYEGSYKN + VKESILLKIVQKLPKKCSVFLLGIIQSKFRPKLYRILK" + CDS 1575..2294 + /note="putative ribitol phophotransferase; member of + homology group 81" + /codon_start=1 + /transl_table=11 + /product="WciO" + /protein_id="AHB32909.1" + /translation="MSIYRICKDIERKTMSPAKKAMAKNDYFAFYVGRPLSYLLTVPF + VKTNITPNQISYLSIIPLIVGFIIMIFTTDFVVLLLAWFLFFLWNLLDGVDGNLARYR + EQYSKDGSVVDAMAGYVAMVLTYFGAGIVAAHLNDSDIYIILGALSGISLIFPRLVMH + KYINTVAQDESVSSIKDKSDFNTIKILALNMTSITGIPQVLLLLTILTNQWVLFTLVY + FTINFLLMIFSLYSLFKKENV" + CDS 2297..3283 + /note="putative glycosyl transferase; member of homology + 
group 97" + /codon_start=1 + /transl_table=11 + /product="WciP" + /protein_id="AHB32910.1" + /translation="MGKSVAILMTTYNGERYLSQQIDSIRSQTFTNWTLFIRDDGSKD + KTIEVIQRYSKIDDRIRFVENPSKFHGAYYNFFNLIEYVKNNYQFDYYFFCDQDDIWK + EHKLEIQLLRFSKDDMPEMVYSDMSTIDASNNLIDISINKIMGIELPNINNLYFIHAY + IWGCTAGFNHALLEMVPSVDIDKDYLYIEKLAHDCYFAKFALEYGKVLFCPEQLVLYR + RHGHNVTTSHHFKLSPLNVFRKAILGFNELALTHARVYNQTLYMLKKASGKNPLSDRL + LEIQEVIKIGGLKGVRYFYQNRISRKQLVRTIGLYTIMLFGTYKKYIMKELL" + CDS 3283..>3441 + /note="oligosaccharide repeat unit polymerase Wzy; member + of homology group 139" + /codon_start=1 + /transl_table=11 + /product="Wzy" + /protein_id="AHB32911.1" + /translation="MLLNFLFISIFLLIIITFILFEGDFFQPAVILTIAYFISIASAL + VNRNVGNRL" +ORIGIN + 1 gttctaggga gaatgagctt ggtaggtaca cgaccaccaa cagtggacga gtatgagcac + 61 tataccccag aacaaaaacg ccgactaagt tttaaacctg gcataacagg tttatggcag + 121 gtcagcggac gaagtgaaat caagaatttc gatgaagttg tcaaattaga tgtggcctat + 181 attaatggtt ggacaatctg gaaagatatt gaaattttat tgaaaacggt taaagttgta + 241 tttatgagag atggagcgaa atagtttggt tgtgtaggat atttgtagag gtaaaagttt + 301 cgaatatatc tcactcaatc ttttttataa gtgaaaataa atttagaagt aggaatttta + 361 tgaatatagt ttatgccaca gataataatt ttgtagatgt attgagtgct tccatcaaat + 421 cactttacac tactaattca gatttggatt taaatttatg gattattgct aataaagttt + 481 cggatagaaa taaagaaaag ataaatagat tatcaaaaca atttgcgcag agagaaatta + 541 attggataga gaacgttgag atcccattta aattacattt agatagggga tcaattagtt + 601 catttagcag attatttctg ggaagtgttc ttccatcttc aatgagtaaa gttctttatc + 661 ttgacagtga tattattgtt atggattctt tacgaagtat ttttgatatt gattttaagg + 721 gtaaaattct ctatggggtg aatgatactt ttaataaaga atacaagcag gtgttgggta + 781 taccaattga caagccaatg tttaatactg gagttatgct tattaattta gagttatgga + 841 gaaataataa cgtcgaagaa agatttttgc aagtaattca aaagtttaat ggtactatat + 901 tacaaggaga tttaggggtt ttaaatgcag ttttatataa ctcatttggt gtacttcctc + 961 cagaatataa ttatatgacc atatttgaag atttgactta tgaagaaatg atagttttta + 1021 aaaaaccaat taattattat tcaaaagagg aaattaaaaa tgccagagaa 
cgtatagtct + 1081 tgcgacattt cacaactagt tttttatcaa aaagaccttg gcaagaaggc agtaatgttg + 1141 cacatataga ccaatttaaa aaatactatg aaggtagtta taaaaatgtt aaagaatcta + 1201 ttttactaaa aatagttcaa aaattaccca aaaaatgttc agttttttta ttaggaatta + 1261 ttcaatcaaa atttagacct aaattgtata gaattttgaa ataaggtgga tagtattaat + 1321 gacaaaaaag aaagaatttt attgaaaatt caagaagaat tgaaattatt aaaagagttt + 1381 ataaaaatat gttctaaaaa taaaattaag tattttgctc ttggaggtag tctattagga + 1441 gctgtaagac acaaaggttt cattccttgg gatgatatgg atctaagctt tccaaagagt + 1501 tcaatctatg tttgaaataa aggaaaaagt gttagaatta gagaatgtat taatgagttt + 1561 aggagaaagt atagatgtca atatatagaa tctgtaaaga tattgaaaga aaaactatgt + 1621 cgcctgctaa aaaagcaatg gctaaaaacg actattttgc attttatgtt ggaagacctt + 1681 tatcctatct tttaacagtt cctttcgtga aaacaaatat tactcccaat caaatatctt + 1741 atttatctat aattcctttg attgttggat ttataataat gatatttaca actgatttcg + 1801 ttgtattatt actggcatgg tttctatttt ttttatggaa cttactagat ggagtagatg + 1861 ggaacttagc cagatatcgg gagcaatact cgaaggatgg aagtgtagta gatgcaatgg + 1921 ctggctatgt agccatggtg ttgacgtatt tcggtgcagg aatagtagct gctcatttaa + 1981 acgactcaga tatctatata attttgggtg cattatctgg gatttcattg atttttccaa + 2041 ggttagtgat gcataagtat atcaatacag tagctcaaga tgagtctgtg agtagcatta + 2101 aagataaatc tgattttaat actataaaaa tactggctct aaacatgaca tcaattacag + 2161 gaattccgca ggttttactg ctattaacta ttttaacaaa tcagtgggta ctttttactt + 2221 tagtatattt tacgattaat tttttattaa tgatattttc tttgtattca ttattcaaaa + 2281 aggagaatgt ttagaaatgg gaaagtcagt tgcaatttta atgaccacct ataatggtga + 2341 gcgatatttg tcacaacaga ttgatagtat taggtctcaa acattcacta attggacact + 2401 ttttattagg gatgatggat caaaagataa aacaatagaa gtaatacaga ggtattctaa + 2461 gatagatgat agaattagat tcgttgaaaa tccctcaaag tttcatggag cttattacaa + 2521 tttttttaat ctaattgaat acgttaaaaa caattatcaa tttgattatt actttttttg + 2581 tgatcaagat gatatttgga aggagcacaa gttagaaata cagctgttaa gattttctaa + 2641 agatgacatg ccagagatgg tttactctga tatgtcaacg attgatgcca gtaataattt + 2701 gatagatatt 
agtataaata aaataatggg gattgaatta ccgaacataa ataatttgta + 2761 ttttattcat gcctatatct gggggtgtac tgcaggtttt aatcatgcat tgctagagat + 2821 ggttccttca gttgatattg ataaagatta tttatatata gaaaaactgg ctcatgattg + 2881 ttattttgca aagtttgcac tagagtatgg gaaggtgttg ttctgccctg agcaactggt + 2941 cttgtatcga agacatggac ataatgtaac aactagtcat cattttaaat tatctccgct + 3001 aaatgttttc agaaaggcta tattgggttt caatgaattg gcacttacac atgctagggt + 3061 atataatcaa actctttata tgctaaaaaa agcttctgga aaaaatcctt taagtgatag + 3121 actacttgaa attcaggaag taatcaaaat tggaggatta aaaggtgtga gatatttcta + 3181 tcagaatcga atttctcgaa agcaactcgt aagaacaatc ggcttatata ccatcatgct + 3241 ttttgggacc tataaaaaat atattatgaa agaactctta taatgctttt aaatttctta + 3301 ttcatatcta tttttctatt aattatcatt acatttatat tatttgaggg ggattttttt + 3361 caacctgcag taattttaac aatcgcttat tttatttcga ttgcaagtgc tctagttaat + 3421 agaaatgttg ggaacagact g +// + diff --git a/public/res/serotype_genbank/serotype_7A.gb b/public/res/serotype_genbank/serotype_7A.gb new file mode 100644 index 0000000..88fae74 --- /dev/null +++ b/public/res/serotype_genbank/serotype_7A.gb @@ -0,0 +1,1040 @@ +LOCUS CR931640 24019 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 2040/37 (serotype 7a). +ACCESSION CR931640 +VERSION CR931640.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 24019) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 24019) + AUTHORS Bentley,S.D. 
+ TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..24019 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="2040/37" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC07A_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC07A_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI32851.1" + /db_xref="UniProtKB/TrEMBL:Q4JZI8" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVELL" + gene 293..458 + /gene="aliB" + /locus_tag="SPC07A_0002" + /pseudo + CDS 293..458 + /gene="aliB" + /locus_tag="SPC07A_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(459..1322) + /gene="tnp" + /locus_tag="SPC07A_0003" + /pseudo + CDS complement(459..1322) + /gene="tnp" + /locus_tag="SPC07A_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(948..1304) + /gene="tnp" + /locus_tag="SPC07A_0003" + /note="HMMPfam hit to PF01710, Transposase, score 4e-17" + /pseudo + gene 1552..2997 + /gene="wzg" + /locus_tag="SPC07A_0004" + CDS 1552..2997 + /gene="wzg" + /locus_tag="SPC07A_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI32854.1" + /db_xref="GOA:Q4K2X0" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K2X0" + 
/translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTVLVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLATYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKRILLTTTPRDSYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSAPHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRMDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1552..1668 + /gene="wzg" + /locus_tag="SPC07A_0004" + /note="Signal peptide predicted for SPC0166 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.550 between residues 39 and 40" + misc_feature 1756..2103 + /gene="wzg" + /locus_tag="SPC07A_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 8.5e-63" + misc_feature 2281..2724 + /gene="wzg" + /locus_tag="SPC07A_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 3e-70" + gene 2999..3730 + /gene="wzh" + /locus_tag="SPC07A_0005" + CDS 2999..3730 + /gene="wzh" + /locus_tag="SPC07A_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI32855.1" + /db_xref="GOA:Q4K2Q9" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K2Q9" + /translation="MIDIHSHIVFDVDDGPKSREESKALLEESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTLDALEKLEKKEIPTLNDS + RYALIEFSMHTSYRQIHTGLSNILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QINSHHISKPKFFGEKYKFMKKRARYFLERDLVHVVASDMHNLDSRPPYMQQAYDIIA + KKYGVKKAKELFVDNPRKIIMDQLI" + misc_feature 3002..3610 + /gene="wzh" + /locus_tag="SPC07A_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 2.7e-39" + gene 3739..4431 + /gene="wzd" + /locus_tag="SPC07A_0006" + CDS 3739..4431 + /gene="wzd" + /locus_tag="SPC07A_0006" + 
/note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI32856.1" + /db_xref="GOA:Q4K2W8" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K2W8" + /translation="MKEQNTLEIDVLQLFRALWKRKLVILLVAIITSSVAFVYSTFVI + KPEFTSTTRIYVVNRGQGEKSGLTNQDLQAGSYLVKDYREIILSQDVLEEVVSDLKLD + LTPKGLANKIKVTVPVDTRIVSVSVNDRVPEEASRIANSLREVAAQKIISITRVSDVT + TLEEARPAISPSSPNIKRNTLIGFLAGVIGTSVIVLLLELLDTRVKRPEDIEDTLQMT + LLVVVPNLSKLK" + misc_feature 3757..4173 + /gene="wzd" + /locus_tag="SPC07A_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 1.3e-52" + misc_feature 4279..4356 + /gene="wzd" + /locus_tag="SPC07A_0006" + /note="PS00217 Sugar transport proteins signature 2." + gene 4441..5124 + /gene="wze" + /locus_tag="SPC07A_0007" + CDS 4441..5124 + /gene="wze" + /locus_tag="SPC07A_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI32857.1" + /db_xref="GOA:Q4K2Q7" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K2Q7" + /translation="MPTLEIAQKKLEFIKKAEEYYNALCTNIQLSGDKLKVISVTSVN + PGEGKTTTSVNIARSFARAGYKTLLLDGDTRNSVISGFFKSREKITGLTEFLSGTADL + SHGLCDTNTENLFVVQSGSVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTAPIGIVI + DAAIITQKCDASILVTATGEVNKRDVQKAKQQLEQTGKLFLGVVLNKLDISVDKYGVY + GSYGSYGKK" + gene 5140..6507 + /gene="wchA" + /locus_tag="SPC07A_0008" + CDS 5140..6507 + /gene="wchA" + /locus_tag="SPC07A_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI32858.1" + /db_xref="GOA:Q4K2Q6" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K2Q6" + /translation="MDEKGLKIFLAVLQSIIVILLVYFLSFVREAELERSSMVILYLL + 
HFFVFYFSSYGNNFFKRGYLVEFNSTIRYIFFFAIAISVLNFFIAERFSISRRGMVYF + LTLEGISLYLLNFLVKKYWKHVFFNLKNSKKILLLTVTKNMEKVLDKLLESDELSWKL + VAVSVLDKSDFQHDKIPVIEKEKIIEFATHEVVDEVFVNLPGESYDIGEIISRFETMG + IDVTVNLKAFDKNLGRNKQIYEMVGLNVVTFSTNFYKTSHVISKRILDICGATIGLIL + FAIASLVLVPLIRKDGGPAIFAQTRIGKNGRHFTFYKFRSMRSDAEAIKEQLMDQNTM + QGGMFKIDNDPRVTKIGRFIRKTSLDELPQFWNVFIGDMSLVGTRPPTVDEYVQYTPE + QKRRLSFKPGITGLWQVSGRSKITDFDDVVKLDVAYIDNWTIWKDIEILLKTVKVVFM + REGAK" + misc_feature 5923..6504 + /gene="wchA" + /locus_tag="SPC07A_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 8.8e-145" + gene 6536..7708 + /gene="wchF" + /locus_tag="SPC07A_0009" + CDS 6536..7708 + /gene="wchF" + /locus_tag="SPC07A_0009" + /note="member of homology group 15" + /codon_start=1 + /transl_table=11 + /product="putative rhamnosyl transferase WchF" + /protein_id="CAI32859.1" + /db_xref="GOA:Q4K2Q5" + /db_xref="InterPro:IPR001296" + /db_xref="InterPro:IPR015393" + /db_xref="UniProtKB/TrEMBL:Q4K2Q5" + /translation="MKQSVYIIGSKGIPAKYGGFETFVEKLTEYQKDSNIQYYVACMR + ENSAKSGIMDDQFEHNGAICFNIDVPNIGPARAIAYDIAAVNKAIELAKKNKDEAPIF + YILACRIGPFISGLKKKIRAIGGRLLVNPDGHEWLRAKWSLPVRKYWKFSEQLMVKHA + DLLVCDSKNIEKYIQEDYKQYQPKTTYIAYGTDTTPSILKAEDAKVRDWYQEKGVSEN + GYYLVVGRFVPENNYEAMIREFIKSKSKKDFVLITNVEQNKFYDQLLQDTGFDKDPRV + KFVGTVYDQELLKYIREYAFAYFHGHEVGGTNPSLLEALASTKLNLLLDVGFNREVGE + DGAIYWKKDELARVIEEVEGFDQAAITDLDFKSSQRILSAFTWEKIVSDYEEVFKG" + gene 7712..8860 + /gene="wcwA" + /locus_tag="SPC07A_0010" + CDS 7712..8860 + /gene="wcwA" + /locus_tag="SPC07A_0010" + /note="member of homology group 63" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI32860.1" + /db_xref="GOA:Q4K2Q4" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K2Q4" + /translation="MKRILYLHAGAEMYGADKVLLELIKGLDSKEFEAHVILPNDGVL + VKALRQVGAQVSVLDYPILRRKYFNPKGILEYLKSYRRYSQKISQYVRENGIDLVHNN + TTAVLEGIYLKRKVKLPLIWHVHEIIVKPKAISDFINFLMGRYADKIVTVSQAVSSHV + 
KQSPFIKEGQVQVVYNGVDNAVYHPMQASTVREQFAIPEESLVIGMVGRVNAWKGQGD + FLEAVAPILEQNPNSIAFLAGSAFAGEEWRVEELESTIAKSSVASQIKRIDYYEHTTE + LYNMFDIFVLPSTNPDPLPTVVLEAMACGKPVVGYRHGGVCEMIKEGKNGLLATPNKP + AELSKAIQELADNIEKREQLGSASFQRQKEFFSLESYIRNFSELYKKY" + misc_feature 8273..8794 + /gene="wcwA" + /locus_tag="SPC07A_0010" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 4.1e-30" + gene 8862..9563 + /gene="wcwC" + /locus_tag="SPC07A_0011" + CDS 8862..9563 + /gene="wcwC" + /locus_tag="SPC07A_0011" + /note="member of homology group 48" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI32861.1" + /db_xref="GOA:Q4K2W3" + /db_xref="InterPro:IPR015037" + /db_xref="UniProtKB/TrEMBL:Q4K2W3" + /translation="MNTKMNTKMNTKMNTKMNTKMNTETIKNKLKPIVYPIINFIPRR + RLKNKNFTIICDNCWAGKVYQELGLPYQTPFVGMFVFSPDYIKMLKNLKHYLSGNIPL + TFVKESKYVKDFDNAYPLALLDDIELHFLHYADEEEATQKWNRRLERIHWDNLYFKFN + DNDACTYELMKEFEELPYKSKVIFSSRNYSGLPSLVHFKSAEKQGHVGIDLKTYHRYF + NCVTWLNKGGEDLTK" + gene 9560..10523 + /gene="wcwD" + /locus_tag="SPC07A_0012" + CDS join(9560..10153,10113..10523) + /gene="wcwD" + /locus_tag="SPC07A_0012" + /note="member of homology group 98" + /codon_start=1 + /transl_table=11 + /product="conserved hypothetical protein" + /protein_id="CAI32862.1" + /db_xref="UniProtKB/TrEMBL:Q4K2W2" + /translation="MKKIRIIIPYFGKLPTFFPYFLLTAKRNQKIDFLVYTDQKVDEF + AMLNAKNIEFVTLSFDELREKVQSKFDFKISLKTPYKFCDYRPAYGLIFEEELKGYDY + WGFCDTDVLLGDIYQFLEEHSFFENDYARYGLFGHLQIFKNLREVNHIFMSGQGSDYR + LDYHNVYTSEQSFIFDESEGIQKLFEKCHFKQLQDKFFLKNVISNNCKISFFDDIDIS + HFSFREYGENKSKRYYFWSEENGLESINLINDDIVVKRPLYAHFQKRMIKCPDFKLVD + SFYVIPNQLVIGEKISKQELVEVTRNKFYWEYVKSTMLKKLKKEKWTFEFIRHKLRMK + " + gene 10567..11003 + /gene="HG140" + /locus_tag="SPC07A_0013" + /pseudo + CDS join(10567..10665,10686..10790,10794..11003) + /gene="HG140" + /locus_tag="SPC07A_0013" + /note="member of homology group 140" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase (pseudogene)" + 
gene 11373..12386 + /gene="wcwF" + /locus_tag="SPC07A_0014" + CDS 11373..12386 + /gene="wcwF" + /locus_tag="SPC07A_0014" + /note="member of homology group 141" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI32864.1" + /db_xref="GOA:Q4K2W1" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K2W1" + /translation="MKDDMIIQNILLTIVIPVYNVEKYLKRCIDSVISQEWDKYEVIL + VNDGSTDASPNICEEYAQKYHFISVIHKENGGLSETRNTGLSHANGKYVFFLDSDDWI + TKDMFRNLSKMIMEQNYDILQFGMQMFHSEREELKNVQCKEKNFNSSDAFKNMLSVEG + ITSFATDKIYKRELFEKNGIEFPIGYFYEDLGTVYKLILSAKKIYLTTQVYYCYFIGN + DAAITKQWSEKKFSDVYKFHKKIFNVSSLMVSDDIFLSKSYYNNGLVYLLMKLYEENQ + EDTQLFRLILAELDANIVPIKYLRNYPNFLKYVFYRIRLLKLIVILKLTLTKIKKWNQ + KKH" + misc_feature 11409..11909 + /gene="wcwF" + /locus_tag="SPC07A_0014" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 1.2e-44" + gene 12365..13303 + /gene="wcwG" + /locus_tag="SPC07A_0015" + CDS 12365..13303 + /gene="wcwG" + /locus_tag="SPC07A_0015" + /note="member of homology group 142" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI32865.1" + /db_xref="GOA:Q4K2Q0" + /db_xref="UniProtKB/TrEMBL:Q4K2Q0" + /translation="MESKKTLIIFEQIDTFEQFLERNIIFNNVDIFTPYKKVSNVFMH + NFRAIAKRLPGFLFHNWWLEEWSRKLPDYTNIVVFDNAISLKLLEYIDAHKTRSSKLK + LWLWNVPNKQVNYLNSNYDVYCFDKTYSENYNLKFVEQFYVLGSTKKRDILDIEYDFY + FIGADKGRLPKLKSLAKQIVLNNYSYRFDVFSVKKQYFDSEFEGIQVIDTLLPYDEVL + DNILASNVIVELNKKGQDGLTLRAMESIFYKKKLITNNKKIINYDFYHPNNILVWEEG + KDIKLDEFIQKPYVQLEKDIIDRYSFSNWLSKITEI" + gene 13313..14380 + /gene="wcwH" + /locus_tag="SPC07A_0016" + CDS 13313..14380 + /gene="wcwH" + /locus_tag="SPC07A_0016" + /note="member of homology group 143" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI32866.1" + /db_xref="GOA:Q4K2P9" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K2P9" + /translation="MRITFCLPEISTVPTGGYKIIFEYANRLSERGHEITLVFLTNNV + 
WNRVTKNCKIKSIVGNIRGKKNPSWFKLKPTIRKIMTPYLDGRDFPEADFIFATAVTT + ANIVKEMPEKYGKKCYLIQGFETWLLPESKVIETYNYGFLNITVSKWLCDIVQSYTET + PVFCVSNPIDTEIFYLLNPIEKRNPFHLGMLYHEGEHKGISYAIDAIKKVKKIYPEIE + VNIFGVPSRPVFLPEYFNYTQQATQQELQKIYNDTSIFLCATIDEGFGLTGAESMACG + CALVSTAYSGVFEYAIDGENALLSPIKDSVSLATNIIKLIRNHDLRLSIATQATKDMK + KRGWEKTTLKLENILSEFTNF" + misc_feature 13817..14308 + /gene="wcwH" + /locus_tag="SPC07A_0016" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 1e-15" + gene 14361..15812 + /gene="wzy" + /locus_tag="SPC07A_0017" + CDS 14361..15812 + /gene="wzy" + /locus_tag="SPC07A_0017" + /note="member of homology group 144" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI32867.1" + /db_xref="UniProtKB/TrEMBL:Q4K2P8" + /translation="MNLLIFKDVLISMIIKLDKQKCYFIMLLLLMCVVQLTASVSMGV + ISIALTVLPILWNLNNPSKLLFSQILYLFQFQFYVSYLSFPLGISFICDIINLFLLFN + IFKDSKLLQWELRNINLKTIIFVWVLFFLIGIFSNFLYDLNIALIVWSLRNYIRFIIF + FISCCLYIDKYSINLGEYLIKLFYWFNIFFTSFQYFVLLKSGDFLGGIFGNELGISNT + YLHILLILILILSVVNYVSDNSSLVILTSYIVSTLYVAALSELKIIFVELPIIIILTL + LFKRLGIKILLKIISITCIVVVALAISIPILYELFPIFDNFFKLEKLFGYSTGNYSTS + SDFGRLSSIVQIISTIFYGDVWQTLFGIGLGEAEISKIPIFSGSFYYNYEYTHYYLFT + LSYVFIENGFIGLFLFMFMPIYLALKMIFERGTSKYDLLLIVLSISLFMLLLYNNTMR + SEIYYLYLFVLSWGVAINRGNGGCYENNKKLCL" + misc_feature 14361..14480 + /gene="wzy" + /locus_tag="SPC07A_0017" + /note="Signal peptide predicted for SPC0179 by SignalP 2.0 + HMM (Signal peptide probability 0.623) with cleavage site + probability 0.185 between residues 40 and 41" + gene 15784..17205 + /gene="wzx" + /locus_tag="SPC07A_0018" + CDS 15784..17205 + /gene="wzx" + /locus_tag="SPC07A_0018" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI32868.1" + /db_xref="GOA:Q4K2V7" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K2V7" + /translation="MKTIKNYAYKSFYQLFLIIVPFITIPYVSRILGAELIGINSYTN + 
TIISYFVLIANLGILIYGNRTIAYHRESIEERSKKFWEIVSIKLLVAIVAYVIFIIFL + FFYSKYSWVFVIQSVQIIATAFDISWLFDGVEDFKRTVVRNFLVKIISIILIFTFVKS + TEDFDKYIWITVGSTLMGNLTLWSYLHHYIIKIPIKSLKLSEHLVPILTLFIPQIASI + VFMSINKILLGNISTISQAGYFENADKVIRILLALVSSIGVVVFPKVAHAYRSGDMKR + VLGLTYMTFDAVNIITIPIVVGIVSISPTFSSIFFGTEFQGIDKVLSVLVLELIFMGY + TSVLGSQYLIVTGQTYFLSISVFLGIFSTVISSFFFIPIYGALGSAISSVIGEASIMI + GEIYLLRNQVDFYYLYRDVPKYMIASAVMYISISSLNYFISSPFVSLLSSIAMGAVTY + VTVVLLLCPRIVIKLLNKNTRFF" + misc_feature 15790..16590 + /gene="wzx" + /locus_tag="SPC07A_0018" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 1.4e-47" + gene 17331..18200 + /gene="rmlA" + /locus_tag="SPC07A_0019" + CDS 17331..18200 + /gene="rmlA" + /locus_tag="SPC07A_0019" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI32869.1" + /db_xref="GOA:Q4K2P6" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q4K2P6" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIKDILIISTPQDLPRFKDLLLDGSEFGIKLSYAEQPSPDGLAQAFLIGEEFIGDDSV + ALILGDNIYHGSGLSKMLQKAAKKEKGATVFGYHVKDPERFGVVEFDENMNAISIEEK + PEQPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLTLAQPLKKN + EYGQYLLRLIGEA" + misc_feature 17334..18050 + /gene="rmlA" + /locus_tag="SPC07A_0019" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 2.2e-119" + gene 18201..18794 + /gene="rmlC" + /locus_tag="SPC07A_0020" + CDS 18201..18794 + /gene="rmlC" + /locus_tag="SPC07A_0020" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI32870.1" + /db_xref="GOA:Q7BTQ6" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:Q7BTQ6" + 
/translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKHHPLLKDVKPLKKEDL" + misc_feature 18237..18767 + /gene="rmlC" + /locus_tag="SPC07A_0020" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, score 8.8e-16" + gene 18807..19856 + /gene="rmlB" + /locus_tag="SPC07A_0021" + CDS 18807..19856 + /gene="rmlB" + /locus_tag="SPC07A_0021" + /EC_number="4.2.1.46" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI32871.1" + /db_xref="GOA:Q4K2P4" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K2P4" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPGVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAAD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 18822..19778 + /gene="rmlB" + /locus_tag="SPC07A_0021" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.0001" + misc_feature 18825..19565 + /gene="rmlB" + /locus_tag="SPC07A_0021" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 2.7e-76" + misc_feature 18828..19640 + /gene="rmlB" + /locus_tag="SPC07A_0021" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/iso, score 1.7e-05" + gene 19922..20773 + /gene="rmlD" + /locus_tag="SPC07A_0022" + CDS 19922..20773 + /gene="rmlD" + /locus_tag="SPC07A_0022" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI32872.1" + 
/db_xref="GOA:Q4K2P3" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K2P3" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITDAEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + TWYDFAVEILKDTDVEVNPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 19922..20770 + /gene="rmlD" + /locus_tag="SPC07A_0022" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 5.7e-148" + misc_feature 19925..20566 + /gene="rmlD" + /locus_tag="SPC07A_0022" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.0001" + misc_feature 19925..20554 + /gene="rmlD" + /locus_tag="SPC07A_0022" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 5.6e-19" + misc_feature 19928..20656 + /gene="rmlD" + /locus_tag="SPC07A_0022" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 1.9e-08" + gene 20943..22020 + /gene="glf" + /locus_tag="SPC07A_0023" + CDS join(20943..21443,21427..22020) + /gene="glf" + /locus_tag="SPC07A_0023" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + /protein_id="CAI32873.1" + /db_xref="GOA:Q4K2V2" + /db_xref="InterPro:IPR004379" + /db_xref="InterPro:IPR015899" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K2V2" + /translation="MGNIYTREEEGIQVHQYGAHIFHTSDKEIWDYVNQFAGFNRYTN + SPVANYKGEIYNLPFNMNTFNKLWGVVTPAEAQAKIEEQRAILNGKTPENLEEQAISL + VGTDIYEKLIKDYTEKQWGKPTTELPSFIIRRLPVHLTYDNNYFNDTYQGIPIGGYTQ + IVEKCGSLKNVDHENIDVETNVDFFVNKEQYLKDFPKIVFTGMIDEFFDYKLGELEYR + SLRFENETLDMENYQGNAVVNYTDAETPYTRIIEHKHFEFGSQAKTIITKEHSKTWEK + GDEPYYPVNNDRNNHLYKSYKKLADEQGNVIFGGRLGHYRYYDMHQVIGAALQCVRNE + LDSYSMKIKEQTRKLATGCSKHCFEVADES" + misc_feature join(21270..21427,21443..21876) + /gene="glf" + 
/locus_tag="SPC07A_0023" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 7.5e-106" + gene complement(order(22137..22421,22735..23688)) + /gene="tnp" + /locus_tag="SPC07A_0024" + /pseudo + CDS complement(join(22137..22421,22735..23688)) + /gene="tnp" + /locus_tag="SPC07A_0024" + /note="member of homology group 13" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1167 transposase" + misc_feature complement(22936..23232) + /gene="tnp" + /locus_tag="SPC07A_0024" + /note="HMMPfam hit to PF01610, Transposase, score 1.3e-45" + /pseudo + gene 23972..>24019 + /gene="aliA" + /locus_tag="SPC07A_0025" + CDS 23972..>24019 + /gene="aliA" + /locus_tag="SPC07A_0025" + /codon_start=1 + /transl_table=11 + /protein_id="CAI32875.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ89" + /translation="MMKSSKLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcata taaaaacaag + 181 ggaggactgt ataaaaggcg gaaatccttt gttttttata accaaggttt ataaactttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga agatgaacat + 301 aaagaagcgt gtccttagtg caggcctgac ttttgcatct gctttgcttt tagctgcttg + 361 cggccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaactat ctattagact attacgctga taatatagtt aattgaaaca agaacaagac + 481 aaaagagcct cgtaaaaggt attgcaactt ggtaatacct ttttggggtg ctttttgata + 541 tgagcccatg ttttctcaat aggattgtac tcaggtaagt agggaggaag aggtaaaagt + 601 ttatgcccaa actcttcgca taaaagttct agcttcccca ttctatggaa tcttgcatta + 661 tccataataa taaccgatgg tgtggttaat gttggtaaga gaaaattctg aaaccaagct + 721 tcaaaaaagt cgctcgtcat cgtctcttcg taagtcattg gaacgattaa ctcaccattt + 781 gttagccctg caaccaaaga aatcctctga tatcttcttc cagatacttt gcctcttatt + 841 aactgacctt ttaaagagcg accatattct cgataaaaat aagtatcgaa tcctgtttcg + 901 tcaatataaa caggtgctag gtgctttaaa ctattaaatt cttaagaaat aaggctactt + 961 
tttctgggtc ttgttcatag taggtgtggt tctttttttc gagtgtagcc cacagctttg + 1021 agcgcatagt ggatggtagt tggatgacag ccaaattcag aagctatttc agtcaaataa + 1081 gcgtctggat tgtcagtaag atagttttta agtctatctc tatcaacttt tcttggtttt + 1141 gttcctttta cttggtggtt tagctctcct gttttctctt ttagctttaa ccagccataa + 1201 atggtattac gtgagatttg gaaaacgtgt gatgcttctg ttatactacc tgttcgctca + 1261 caataagaga gaactttttt acgaaaatct attgaatatg ctataaaaag attataccac + 1321 attgtgtacc atattgaaac tagaatagta catccctgct tctaaaacat tgttagaaat + 1381 cgatgtaact gtcctgatcg ttttgtcatg ttcttatttc attttactat atttttggtt + 1441 cgcgggaagt ctactaagat acttaaagat gcagatagtg aaaataaagg tgtagacatt + 1501 accgtaaaaa agtgatataa tcgtacaatg ttcaaggtat aggtgttaat catgagtaga + 1561 cgttttaaaa aatcacgttc acagaaagtg aagcgaagtg ttaatatcgt tttgctgact + 1621 atttatttat tattagtttg ttttttattg ttcttaatct ttaagtacaa tatccttgct + 1681 tttagatatc ttaatctagt ggtaactgtg ttagtcctac tagttgcctt ggtagggcta + 1741 ctcttgatta tctataaaaa agctgaaaag tttactattt ttctgttggt gttctctatc + 1801 cttgtcagct ctgtgtcgct ctttgcagta cagcagtttg ttggactgac caatcgttta + 1861 aatgcgactt ctaattactc agaatattca atcagtgtcg ctgttttagc agatagtgag + 1921 atcgaaaatg ttacgcaact gacgagtgtg acagcaccga ctgggactga taatgaaaat + 1981 attcaaaaac tactagctga tatcaagtca agtcagaata ccgatttgac ggtcaaccag + 2041 agttcgtctt acttggcaac ttacaagagt ttgattgcag gggagactaa ggccattgtc + 2101 ctaaatagtg tctttgaaaa tatcattgag tcagagtatc cagactacgc atcgaagata + 2161 aaaaagattt ataccaaggg attcactaaa aaagtagaag ctcctaagac gtctaagaat + 2221 cagtctttca atatctatgt tagtggaatt gacacctatg gtcctattag ttcggtgtcg + 2281 cgatcagatg tcaatatcct gatgactgtc aatagggata cgaagagaat ccttcttaca + 2341 acaactcctc gagattcata tgttcctatt gctgatggtg gaaataatca aaaagataaa + 2401 ttaacccatg cgggcattta tggagttgat tcgtccattc acaccttaga aaatctctat + 2461 ggagtggata tcaattacta tgtgcgattg aacttcactt ctttcttgaa aatgattgac + 2521 ttattgggag gggtagatgt tcataatgat caagagtttt cagctccaca tgggaagttc + 2581 catttcccag tagggaatgt 
ccatctagac tctgagcagg ctctaggttt tgtacgtgaa + 2641 cgctactcac tagccgatgg agaccgtgac cgtggtcgca accaacaaaa ggtgattgtg + 2701 gctatccttc aaaaattaac gtcaaccgaa gcactgaaaa attatagtac gatcattaat + 2761 agcttgcaag attctatcca aacaaatatg ccacttgaga ctatgataaa tttggtcaat + 2821 gctcagttgg aaagtggagg gaattataaa gtaaattctc aagatttaaa agggacaggt + 2881 cggatggatc ttccttctta tgcaatgcca gacagtaacc tctatgtgat ggaaatagat + 2941 gatagcagtt tagctgtagt taaagcagct atacaggatg tgatggaggg tagatgaaat + 3001 gatagatatc cattcgcata tcgtttttga tgtagatgac ggtcccaagt caagagagga + 3061 aagcaaggct ctcttggaag aatcctacag gcagggggtg cgaaccattg tctctacctc + 3121 tcaccgtcgc aagggcatgt ttgaaactcc agaagagaag atagcagaaa actttcttca + 3181 ggttcgggaa attgcaaaag aagtagcaga tgatttagtc atcgcttatg gagcagagat + 3241 atactatact ctggatgctc tagaaaagct agaaaaaaaa gaaattccta cccttaatga + 3301 tagtcgttat gctttgattg agtttagcat gcatacttcc tatcgtcaga ttcatacggg + 3361 attgagcaat attttgatgt tgggaatcac gccagtaatt gctcatattg aacgttatga + 3421 tgctttagag aataacgaaa aacgtgttcg tgaactgatt gatatggggt gctatactca + 3481 gataaatagt catcatattt caaaacctaa gttctttggt gaaaaatata aattcatgaa + 3541 aaagagagct cggtattttt tggaacgtga tttagttcat gtagttgcaa gtgacatgca + 3601 caatttagac agcagacctc catatatgca acaggcatat gatatcattg ctaagaaata + 3661 tggagtgaaa aaagcgaaag aactttttgt agataatccc agaaaaatta taatggatca + 3721 attaatttag gagaaaatat gaaggaacaa aacactttgg aaatcgatgt attgcaacta + 3781 ttcagagctt tatggaaaag aaagttggtt attttattag tggcaattat aacttcttca + 3841 gttgcttttg tctacagtac ttttgttatc aaacctgagt ttactagtac gactcggatt + 3901 tatgtagtta accgtggtca gggagagaag tctggtttaa ccaatcaaga cttgcaggca + 3961 ggatcatact tggttaaaga ctatcgtgaa attatcctat cgcaggatgt tttggaggaa + 4021 gttgtttctg atttgaaact agatttgacg ccaaaaggtt tggctaataa aattaaagta + 4081 acagtaccag ttgatacccg tattgtctct gtttcagtta atgatcgagt tcctgaagag + 4141 gcaagccgta tcgctaactc tttgagagaa gtagctgctc aaaaaattat tagtattact + 4201 cgtgtttctg atgtgacaac actggaggag gcaaggccgg 
cgatatcacc gtcttcgcca + 4261 aatattaaac gcaatacact aattggtttt ttggcagggg tgattggaac tagtgttata + 4321 gttcttcttc ttgaactttt ggacactcgt gtgaaacgtc cggaagatat cgaagataca + 4381 ctgcagatga cacttttggt agttgtacca aacttgagta agttgaaata ggagagagga + 4441 atgccgacat tagaaatagc acaaaaaaaa ctggagttca ttaagaaggc agaagaatat + 4501 tacaatgcct tgtgtacaaa tatacagttg agcggagata aactaaaagt aatttccgtt + 4561 acttctgtta accctgggga aggaaaaaca actacttccg taaatatagc aaggtcgttt + 4621 gcgcgtgcag gctataaaac tcttttgctc gatggcgata ctcgaaattc agttatatca + 4681 ggatttttta aatctcgtga aaaaattaca gggctaacag aatttttatc tgggacagct + 4741 gatttatctc acggtttatg tgatacaaat actgaaaatt tatttgtagt tcaatcggga + 4801 tctgtatcac caaaccctac agccttgtta caaagtaaaa attttaatga tatgattgaa + 4861 acgttgcgta aatattttga ctatatcatt gttgatacag cacctattgg aattgttatt + 4921 gatgcggcaa ttatcactca aaagtgtgat gcgtccatct tggtaacagc aacaggtgag + 4981 gtgaataaac gtgatgtcca aaaagcgaaa caacaattag aacaaacagg gaaactgttc + 5041 ctaggagttg ttttaaataa attggatatc tcggttgata agtatggagt ttacggttcc + 5101 tatggaagtt atggtaaaaa ataatttagg aaaaatttta tggatgaaaa aggattgaaa + 5161 atttttctgg cagtattaca gagtattatt gtcattttat tggtttattt tcttagcttt + 5221 gttagagagg cagaacttga acgttcttcg atggttatac tataccttct ccactttttt + 5281 gtattctatt ttagttccta tggtaacaat ttttttaaaa gagggtacct agttgagttt + 5341 aatagtacta taagatatat ttttttcttt gcaatagcta taagtgtatt aaactttttt + 5401 atagcggaac ggtttagtat ctctagaaga ggaatggtat acttcttaac tttagaagga + 5461 atatccttat acttgttaaa tttcttagta aagaaatatt ggaaacatgt gttttttaat + 5521 ctaaaaaata gcaagaaaat tttactgtta acagtaacga aaaatatgga aaaagttctt + 5581 gataaactgc tagaatccga tgaactttca tggaagttgg tagcagtaag tgttttggat + 5641 aaatctgatt ttcaacatga taaaatacct gtaattgaaa aggaaaaaat tattgaattt + 5701 gcaacgcatg aagttgtgga tgaggtgttt gtcaatcttc caggagagag ctacgatatt + 5761 ggagaaatta tctctaggtt tgagacaatg gggatagatg taactgtaaa tcttaaagca + 5821 tttgataaga atttgggtcg caataaacaa atttatgaga tggtaggatt gaatgtagtc + 5881 
actttctcta caaattttta taaaactagt catgtgattt caaagagaat tctcgatatt + 5941 tgtggtgcca ctattggcct tattcttttt gctatagcta gtctagtttt agttccattg + 6001 attcgtaaag atggcggacc agctattttt gctcaaactc gtatagggaa aaatggtcga + 6061 cattttacct tttataaatt ccgttcgatg cggagcgatg ctgaagctat caaagaacag + 6121 ttgatggatc aaaatacgat gcaaggtggt atgtttaaga tagacaacga tcctcgtgtt + 6181 acaaaaattg gtcgctttat tcgtaaaacc agtttagatg agttacccca gttttggaat + 6241 gtctttatag gagatatgag tttggtggga acacgtccac ctacagtaga cgagtatgtt + 6301 cagtatactc cagaacagaa acgtcgactc agctttaaac ctggtattac aggtttatgg + 6361 caggttagcg gccgtagtaa aataaccgat tttgacgatg ttgtaaaatt agatgtggct + 6421 tatattgata attggacaat ctggaaagat attgaaatat tgttaaagac cgtcaaagtg + 6481 gtatttatga gagaaggggc gaagtgattt ctgccctcaa cctgttagga gagaaatgaa + 6541 acagtcagtt tatattattg gttcaaaggg gattcctgct aagtatggag gatttgaaac + 6601 ctttgttgaa aaattaaccg aatatcaaaa agacagcaac atacaatact atgttgcttg + 6661 tatgcgtgaa aattcagcta aatctggcat catggatgat cagtttgagc acaatggagc + 6721 catttgtttc aacatcgatg tacccaatat tggaccagct cgtgccatcg cttacgatat + 6781 tgcagcggtc aacaaagcta ttgaattggc taagaaaaat aaggacgaag ctcccatttt + 6841 ttacattcta gcttgtcgca ttggtccttt tatttctggg cttaagaaaa aaattcgtgc + 6901 catcggaggc cggttgttgg taaatcctga tggtcatgaa tggttgcgag caaagtggag + 6961 tttaccagtt cgtaagtatt ggaaattttc agagcagctc atggtcaaac atgcagattt + 7021 actggtctgt gacagtaaaa acattgaaaa atatatccaa gaggattata agcagtacca + 7081 accaaagacc acctatattg cctatggaac ggatactact ccttcaatcc tgaaagcaga + 7141 agatgccaaa gttcgggatt ggtatcagga aaaaggagtt agcgaaaatg gctattatct + 7201 agtggtgggg agattcgttc ctgaaaataa ctacgaagca atgattcgtg aatttatcaa + 7261 gtccaagtcc aagaaggact ttgtcctcat cacaaatgtg gagcagaata aattttacga + 7321 ccagttgtta caggatactg gttttgataa agatcctagg gttaaatttg ttgggactgt + 7381 ctatgaccaa gagttgctca agtacatccg tgagtatgcc tttgcctatt tccatgggca + 7441 tgaggttgga gggaccaacc cttctctatt ggaagcccta gcatccacaa aactgaattt + 7501 gttgctagat gttggcttta 
accgtgaggt tggtgaagac ggggccattt attggaaaaa + 7561 agatgagttg gctcgtgtca ttgaggaagt agaaggattt gatcaggcag caataactga + 7621 cttggatttc aagtcaagcc aaagaatcct ctcagctttc acatgggaaa agattgtgtc + 7681 agattatgaa gaagtgttta aaggataggg aatgaaacgg attttatact tgcatgctgg + 7741 tgcagaaatg tatggagcag ataaggtttt attggaattg atcaaaggat tggattccaa + 7801 agaatttgaa gctcatgtca tcctgccaaa tgatggtgtt ttagtcaagg ccttgcgtca + 7861 agttggggct caggtcagtg tgttggatta tccgatttta cgtagaaaat actttaatcc + 7921 taaggggatt ttagaatatc tgaaatccta tcggcgctac tctcaaaaaa tttcccaata + 7981 tgtgcgtgag aatgggatag atcttgttca taacaatacg acagccgttc tggaaggaat + 8041 ctatctcaag agaaaagtaa aactcccctt aatctggcat gttcatgaga ttattgtcaa + 8101 gcccaaggct atttcagatt ttatcaactt tttgatgggg cgatatgcag ataagatcgt + 8161 aacagtatct caagctgttt ccagccatgt caaacaatct ccttttatca aagaaggtca + 8221 ggtacaggtt gtatataacg gagtggacaa tgctgtctat catcccatgc aagcaagcac + 8281 agtgcgtgaa caatttgcta ttccagaaga atctcttgtc attggtatgg taggccgcgt + 8341 caacgcttgg aagggacagg gagattttct agaagcagtg gcgccgattt tggagcagaa + 8401 tcccaattct atcgcttttc tggcaggaag tgcctttgcg ggagaagagt ggcgagttga + 8461 agaactcgaa tctacgattg ccaaatcaag tgtagcctca caaatcaaac gaattgacta + 8521 ttatgagcat acgactgagc tttataatat gtttgatatc tttgtcttgc caagcaccaa + 8581 tcccgatccc ctaccgacag tggtactaga ggcgatggca tgtggcaaac cagtagttgg + 8641 ctatcggcat ggtggtgtct gtgaaatgat taaggagggc aaaaacggtc tcctagccac + 8701 tccaaataag cctgcagaat tgtctaaggc tattcaagaa ttggctgaca atatcgagaa + 8761 aagagaacag ttaggaagtg catctttcca acgtcaaaaa gaattctttt cgttggaaag + 8821 ttatattcgg aatttctcag agctatataa aaaatactaa gatgaatact aagatgaata + 8881 ctaagatgaa tactaagatg aatactaaga tgaatactaa gatgaatact gaaacaatta + 8941 agaataaatt aaaaccaatc gtttatccaa ttatcaattt tatccctaga cgaagactca + 9001 agaataaaaa ttttacaatc atttgcgaca attgttgggc aggaaaagtc tatcaggaat + 9061 tgggcttgcc ttatcaaact ccatttgtag gtatgtttgt cttttctcct gactacatca + 9121 aaatgctcaa gaatttaaaa cactatttga gtggaaatat 
ccctttgaca tttgttaagg + 9181 aatcaaaata tgtcaaagac tttgataatg cctatcccct ggctctttta gacgatatcg + 9241 aattgcattt cttacattat gcagatgagg aagaagcaac tcaaaaatgg aaccgtcgtt + 9301 tagaaagaat tcattgggat aatttgtatt tcaagttcaa tgataatgat gcctgtactt + 9361 atgaattgat gaaagagttt gaagaacttc cgtacaagag taaggttatc ttctcttcga + 9421 gaaattacag tggtttacct tccttagttc atttcaaatc agctgaaaag caaggacacg + 9481 ttgggattga tttgaaaact tatcaccgct attttaattg tgttacttgg ttgaataagg + 9541 gtggggagga tttaactaaa tgaaaaaaat aagaattatt attccttatt ttgggaaact + 9601 accaaccttt tttccttatt ttttattaac tgctaaacgt aatcaaaaaa ttgatttctt + 9661 agtttatacg gatcaaaagg tggatgaatt cgctatgtta aatgctaaaa atatagaatt + 9721 tgtaactctt tcttttgatg agttaagaga aaaagttcag tctaagtttg attttaaaat + 9781 ctctctcaaa acaccttata aattttgtga ctatagacct gcttatgggc ttatctttga + 9841 agaagaatta aagggttatg attactgggg tttttgtgac acagatgtct tactaggtga + 9901 tatttatcaa tttcttgaag agcatagctt ttttgagaac gactatgctc gatatggtct + 9961 ttttggtcat cttcaaattt ttaagaattt aagagaagtt aatcatattt ttatgtctgg + 10021 gcaaggttca gactatcgat tagattatca caatgtctat actagtgaac aaagttttat + 10081 ttttgatgaa tcagaaggta tccaaaagct ttttgaaaaa tgtcatttca aacaactgca + 10141 agataagttt ttttgatgat attgatatta gtcatttctc atttcgggaa tatggcgaaa + 10201 ataaatcgaa acgctattat ttttggtctg aagaaaatgg tttggaatca ataaatttaa + 10261 tcaatgatga tatagtggtt aagcgtcctc tatacgcaca tttccaaaag agaatgatta + 10321 aatgccctga ctttaaacta gtcgattcat tttatgttat accaaatcaa ttagttattg + 10381 gagagaaaat ttctaagcaa gagctagtag aggtgacaag aaataaattc tattgggaat + 10441 atgttaaatc aacaatgtta aagaaattaa aaaaagaaaa atggacattt gaatttattc + 10501 gtcataaatt aaggatgaaa tgagcttagt attatggctt ttcctattga ttttgttgta + 10561 tgctgaattg acgaacacga tcctgattgg agggctaaaa atagcaagta tgactctgct + 10621 tttacaacat ctgaaaataa tacgaatttc gatgaagcat actgttagtg gagaacgttt + 10681 aagttttggt tagagagata gaaaaatttg ctccttgggt gaataaagtt tatcttgtta + 10741 cagaaaatca aaaaccggtc tggttgacta ttaatagtga taagttatat 
taattgaaca + 10801 tttgggatga tttgtatttc aagttcaata ataatgatat ttgtacttat gaattgatga + 10861 aagaatttga agagcttcca tacaagagta aggttatctt ctcttcaaaa aattacagtg + 10921 acctaccttc cttgattcat tttaaatcag ccgagaagta agcgcatgtt ggaattgatt + 10981 tgaaaactta tcaccgctat tttgatgttg ttagttggat aaaccaagat agtgtatagt + 11041 tcactaaata attaaataca gattatttca atgtttctat aagttcaaaa tttaattaga + 11101 aactatagag gaatccatct ttaagattat tatttataag tgagcaatat taactggagt + 11161 caatgattta acagaaaatt caggtgctag tcagtcattg attatgttta tgaatataat + 11221 aatgaaagga atttctaatt ttacaagaat tgaatcttgt atcgaaatac attagttcta + 11281 taaaaatgaa ttaattaaaa aattagagat ttacacaata tcagttctac taagattatg + 11341 caataaaaag tttctaaaaa attatttact aagtgaagga tgatatgatt atacaaaata + 11401 tattgctaac aattgtaata ccagtatata atgttgaaaa atatttgaaa cgttgtattg + 11461 atagcgtcat ttctcaggaa tgggataaat atgaagttat tctagtaaat gatggcagta + 11521 cagatgcttc acccaatatt tgtgaagagt atgcccagaa gtatcatttt atttctgtta + 11581 ttcataagga aaatggtgga ctatcagaga ctcgtaatac aggtctttct catgcgaatg + 11641 gaaaatacgt attttttctt gattctgatg attggattac aaaagatatg tttcgaaatt + 11701 taagtaaaat gattatggaa caaaattatg atattttgca attcggaatg caaatgtttc + 11761 attctgaaag agaagagttg aaaaatgtac aatgcaaaga aaaaaacttt aattcttcag + 11821 atgcatttaa aaacatgtta agtgttgaag ggattacaag ttttgctaca gacaaaatat + 11881 ataaaagaga attgtttgag aagaacggaa tagagtttcc tataggatat ttttacgaag + 11941 atttaggaac ggtttataaa ttaattttat ctgctaaaaa aatttattta acaacacaag + 12001 tgtattattg ttattttatt gggaatgatg cggctattac caaacagtgg tctgaaaaaa + 12061 aatttagtga tgtgtataaa tttcataaaa aaatttttaa tgtttcatct cttatggttt + 12121 cagatgacat cttcctgtct aaatcctatt ataataatgg tctggtttat cttttaatga + 12181 aattgtatga agaaaatcag gaagacactc aactttttag gttgatactt gcagaactgg + 12241 atgcaaacat agttcctata aaatatttgc gaaattatcc taattttttg aaatatgtat + 12301 tttatcgcat tcgattattg aaattaattg taatattgaa attaacttta acaaaaataa + 12361 aaaaatggaa tcaaaaaaaa cattaataat atttgaacaa atagatacat 
ttgaacaatt + 12421 tttagaacgt aatataattt ttaataatgt agacatattt acaccgtaca aaaaagtttc + 12481 gaatgttttt atgcacaatt ttagagcaat tgcaaaacga ttacccggat ttttattcca + 12541 taattggtgg ttagaagaat ggtctagaaa attaccggat tatactaata tagtagtatt + 12601 tgacaatgct atttccctta aattattaga gtatatagat gcacataaga ctcgtagttc + 12661 aaagttgaaa ttatggttat ggaatgttcc gaataagcaa gtgaattatt tgaattcgaa + 12721 ttatgatgtt tattgctttg ataagacata ttctgaaaac tataatttaa aatttgtaga + 12781 acaattctat gtattaggtt cgactaagaa aagagatata ttggatattg agtatgattt + 12841 ttattttatt ggtgcagata aaggaagatt gccaaaatta aaaagcttag ctaagcagat + 12901 agttttaaat aattatagtt atcgatttga cgtttttagt gtaaaaaaac agtatttcga + 12961 ttctgagttt gagggaattc aagttataga tacattactc ccttatgatg aagtcttgga + 13021 taacatacta gcttcgaatg ttattgttga gttaaataaa aagggacagg atggtctaac + 13081 ccttagagca atggaatcca ttttttataa aaaaaaatta ataacaaata ataaaaaaat + 13141 tattaactat gatttttatc acccaaataa tattttagtt tgggaggaag gaaaagatat + 13201 caaattagat gagtttattc aaaagccata tgttcaatta gaaaaagata ttattgaccg + 13261 ttattctttt agtaattggt taagtaaaat tacagaaatt taggagttaa atatgagaat + 13321 aactttttgt ctacctgaga taagcactgt tcctacggga ggatataaaa ttatttttga + 13381 gtacgcaaat aggttgtctg aacgaggtca tgagataacc cttgtttttt taaccaataa + 13441 tgtatggaac agagttacta agaattgtaa aatcaaatca attgtaggca atatacgtgg + 13501 caaaaaaaat ccaagttggt ttaaactgaa accaactatt cgtaaaataa tgactcctta + 13561 tttagatggg agagattttc ctgaagcaga ttttatattt gctactgcgg ttacaactgc + 13621 taatattgta aaagaaatgc cagaaaaata tgggaaaaaa tgttacctaa tccaaggttt + 13681 tgaaacatgg cttcttccag aaagtaaagt tattgaaact tataattatg gattccttaa + 13741 tattacagta tctaagtggt tatgtgacat agtccaatct tatacagaga ctccagtttt + 13801 ttgtgtatct aatccgattg atacagaaat tttttatttg ctaaatccta tagagaaacg + 13861 aaacccattt catctaggta tgttatatca tgaaggagag cataaaggaa tctcttatgc + 13921 gatagatgca attaagaaag ttaagaaaat ttatccggaa atagaggtta atatttttgg + 13981 agttcctagt agaccagtat ttttaccaga atattttaat tatactcaac 
aagctacaca + 14041 acaggaatta caaaagatat acaacgatac gtctattttt ttgtgtgcaa caattgatga + 14101 aggctttggt ttgacaggag cagagagtat ggcttgtggc tgtgcgttag tctcaacagc + 14161 ctatagtggt gtatttgaat atgcaattga tggcgagaat gcacttttat ctccgataaa + 14221 agatagtgtt agtttggcaa caaacataat aaaattgatt agaaatcatg atttgcgctt + 14281 atccatagca acgcaagcaa ctaaagatat gaaaaagaga ggatgggaga aaactacttt + 14341 aaaattagaa aatattttaa gtgaatttac taatttttaa agatgtttta atatcaatga + 14401 ttataaaact agataaacaa aaatgttatt ttattatgtt acttttattg atgtgcgtag + 14461 tacagttgac tgcaagtgtt tcaatgggag taataagtat agctctaaca gtattaccaa + 14521 tattgtggaa tttaaataat ccatccaaat tattattttc acagattctt tatttgtttc + 14581 agttccaatt ctatgtaagt tatttatcat ttccgttagg aatttccttt atctgtgata + 14641 ttattaattt atttttgtta ttcaatattt ttaaagattc caaactatta cagtgggaat + 14701 tacggaatat taatttaaaa acaattattt ttgtttgggt cttgtttttt ttgataggta + 14761 ttttttcaaa ttttttgtat gatttaaata ttgcgcttat tgtatggtcc ctccgtaatt + 14821 atataagatt tatcattttt ttcatttctt gttgtttgta tattgataaa tacagtataa + 14881 atctaggtga atacttaata aagctattct attggtttaa tatatttttt acctcgttcc + 14941 aatattttgt gcttttaaaa tcaggagatt ttcttggagg aatttttgga aacgaattgg + 15001 gaatttctaa tacctacttg catattcttt taattctcat cttgatatta tctgttgtta + 15061 attatgtatc agataattcg agtttagtta ttttaacaag ttatatcgtt tcaactctat + 15121 acgtagctgc tttgtcagag ttaaagatta tttttgtgga attacctatt attattattt + 15181 tgactttact atttaaaaga ttaggaataa aaatactgct taaaataata tctatcactt + 15241 gcatagtggt ggtcgctttg gcaatctcaa ttcctatttt atatgaatta ttccctatat + 15301 ttgacaattt ttttaaatta gaaaaattat ttggctattc aacaggaaac tattcaacta + 15361 gttctgattt tggtcggtta agttcaattg ttcaaataat ctcaactatt ttttatggag + 15421 atgtttggca gactttattt ggtattggtt taggagaggc ggaaatttca aaaattccga + 15481 tatttagtgg ttccttttat tataattacg aatacaccca ttactatctg ttcactttat + 15541 catatgtttt tattgagaat ggatttatag gattgttcct attcatgttt atgccaattt + 15601 accttgcttt aaagatgatt tttgagcgag ggacatctaa atatgatctt 
cttctgatag + 15661 tattatctat ttctttattt atgctcttgt tgtataataa tacaatgagg tcagagatat + 15721 attatcttta tttatttgtt ctttcatggg gagttgcaat caatagagga aatgggggat + 15781 gttatgaaaa caataaaaaa ttatgcttat aaatcttttt atcaactatt tttgataata + 15841 gtacctttta taacaatccc atatgtttct agaattttag gagcagagtt aatagggata + 15901 aattcttata caaacactat aataagttat tttgtgttaa tagcaaatct tgggattttg + 15961 atatatggta atagaaccat agcatatcat agagaaagta ttgaggagcg tagtaaaaaa + 16021 ttttgggaaa ttgtctcaat taagttgctg gtagcaattg ttgcctatgt catatttatt + 16081 atatttttat tcttttattc aaaatatagt tgggtttttg tgattcaatc tgtacaaatt + 16141 atagctacgg catttgatat atcttggctt tttgatggtg tagaagattt taaacgtaca + 16201 gtagtgagaa attttctggt taaaataatt tccattattc taatttttac ttttgtcaag + 16261 tctacagagg actttgacaa atacatatgg ataacagtag gctctacttt aatgggtaat + 16321 ttgacattat ggagttattt acaccattat attattaaaa ttccgataaa aagccttaag + 16381 ttgagtgaac acttagttcc cattttgact ttattcatac cacaaattgc ttctattgta + 16441 tttatgtcaa tcaataaaat tttactaggt aatatttcga cgatatcgca agcaggctac + 16501 tttgagaatg cggataaggt gattagaatt cttctggctt tagtatcatc tattggagta + 16561 gttgtttttc ctaaagttgc tcatgcgtat aggagtggtg atatgaagag agtattaggg + 16621 ttgacttata tgacttttga tgcagttaat attataacta ttccaattgt agttggaata + 16681 gtttctatta gccctacatt ctcttctatt ttttttggga cggaattcca aggaatagat + 16741 aaggttctgt ctgttctagt attggagtta attttcatgg gatatacttc ggttttaggt + 16801 agtcaatatc tcattgtaac agggcaaact tactttttaa gtatctcggt gttcctagga + 16861 atattttcta cagtgatatc ttctttcttt ttcattccga tatacggagc gcttggaagt + 16921 gcgatttcat ctgtaattgg agaagcatct attatgattg gtgaaattta cttgttaagg + 16981 aatcaagttg atttctatta tctatatagg gatgtaccga aatacatgat tgctagcgct + 17041 gttatgtata ttagtatctc gtcattgaat tattttattt cttcgccatt tgtatctttg + 17101 ctatcaagta ttgctatggg tgcagtgact tatgttactg ttgtcttatt actatgccca + 17161 agaatagtaa taaaattatt aaataaaaac acaagatttt tttgaaatga tatataaaat + 17221 cgtaacaaaa atccaattac aattcatgac tttttactaa ttataaattt 
gcgattcatc + 17281 taattaaaat tgaattatag ataatgaaaa tttagaaagg tggccccatt atgaaaggta + 17341 ttattcttgc aggtggttcg ggaacgcgcc tgtacccact tactcgagct gcgtcaaaac + 17401 agctgatgcc ggtttatgac aaacccatga tttattatcc tttgtcaacc ctaatgttgg + 17461 ctggaatcaa ggatattttg attatctcaa caccacagga tttgccccgt tttaaggacc + 17521 tgctcttgga tggttccgaa tttgggatta agctttccta tgcggaacaa cctagtcccg + 17581 atggacttgc tcaggctttt cttatcggtg aagaatttat cggtgacgat agcgttgcgc + 17641 tgatcttagg tgacaatatc tatcacggtt ctggtttgag caaaatgctt caaaaagcag + 17701 ccaagaaaga gaaaggtgcg actgtctttg gctaccatgt caaggatcca gaacgctttg + 17761 gtgttgtaga atttgatgaa aatatgaatg ctatctccat cgaagaaaaa ccagaacagc + 17821 cgcgctctaa ctatgcagtg acaggactgt atttctatga taacgatgtt gtcgaaattg + 17881 ccaagagtat caaaccaagt cctcgcggag aattagaaat cacagatgtc aacaaggctt + 17941 acttggatcg tggagattta tcagttgagc ttatgggacg tggctttgct tggctggata + 18001 ctggaactca tgaaagttta ctagaggctt cacagtacat cgaaacagtg caacggatgc + 18061 aaaatgttca ggtagcaaac ttagaagaaa ttgcctatcg catgggttat atcagtcgtg + 18121 aagatgtatt gaccttagcc caaccactta agaaaaatga atacggacag tatctgctcc + 18181 gtttgattgg agaagcatag atgacagata attttttcgg taagacgctt gcggcacgca + 18241 aggttgaagc tattccaggc atgttggagt ttgatatccc cgttcatgga gataatcgtg + 18301 gctggtttaa agaaaatttc caaaaggaaa aaatgcttcc acttggattt ccagagtctt + 18361 tctttgcaga aggaaaattg caaaacaatg tatccttctc acgtaaaaat gtccttcgag + 18421 gcctccacgc agagccttgg gataagtaca tctctgtagc agatggaggg aaagttctgg + 18481 gttcttgggt tgatctacgc gagggtgaaa cctttgggaa tacctatcag acagtaattg + 18541 atgcaagcaa gggaatcttt gttcctcgag gcgtagctaa tggcttccaa gttctatcag + 18601 atacagtgtc atatagctat ctggtcaatg attactgggc tctcgagctc aaacccaagt + 18661 atgcctttgt gaactacgct gatccaagcc ttggtattga atgggaaaat attgcagaag + 18721 cagaggtttc agaagcagat aaacatcatc ccctacttaa ggatgtaaaa cctttgaaaa + 18781 aagaagattt gtaaaaagga aagaatatga ctgaatacaa aaatattatc gtgacaggtg + 18841 gagctggctt tatcggttct aactttgtcc attatgttta cgagaacttt 
ccaggtgttc + 18901 acgtgacagt cctagataag ttgacttatg ctggaaatcg cgcgaatatt gaggaaattt + 18961 taggtaatcg tgttgagtta gttgttggtg acattgctga tgcggagttg gtagacaagt + 19021 tggctgctca agcagatgct atcgttcatt atgcagcgga aagccacaat gataattcgc + 19081 tcaatgatcc atcgccattt attcatacta acttcatcgg aacctatact cttttagaag + 19141 ctgctcgtaa gtatgatatt cgcttccacc atgtatcgac agatgaagtt tatggggatc + 19201 tccctttacg cgaagatttg ccaggtcatg gtgaaggacc aggtgagaaa tttactgctg + 19261 aaaccaagta caatccaagc tcgccttact catcaaccaa ggcagcctca gatttgattg + 19321 tcaaagcctg ggtccgttct tttggagtca aggcaacgat ttccaactgt tcaaataact + 19381 acggtcctta tcaacatatc gaaaaattca tcccacgtca gattactaac atcctaagtg + 19441 gaattaagcc aaaactttac ggtgaaggta agaacgttcg tgactggatt cataccaatg + 19501 accattcttc aggagtttgg acaatcttga caaaagggca aattggtgaa acctacttga + 19561 ttggggctga tggtgagaag aacaataagg aagttttgga acttatcctt aaggaaatgg + 19621 gacaagctgc ggatgcctat gatcatgtga ctgaccgtgc aggacatgac cttcgctatg + 19681 cgattgatgc tagcaagctc cgtgatgagt tggggtggaa acctgaattt accaactttg + 19741 aagctgggct caaggcaaca atcaagtggt atacagataa ccaagaatgg tggaaagcag + 19801 aaaaagaagc tgttgaagcc aattatgcta agactcagga gattattaca gtataaaaag + 19861 caggaaatag ctgcttttta ttgctatatt gggaagagtt acatattaga aaggtctaga + 19921 gatgatttta attacagggg caaatggcca attaggaacg gaacttcgct atttattgga + 19981 tgaacgtaat gaagaatacg tggcagtaga tgtggctgag atggacatta ccgatgcaga + 20041 aatggttgag aaagtttttg aagaggtgaa accgacttta gtctaccact gtgcagccta + 20101 caccgctgtt gatgcagcag aggatgaagg aaaagagttg gacttcgcca tcaatgtgac + 20161 ggggacaaaa aatgtcgcaa aagcatctga aaagcatggt gcaactctag tttatatttc + 20221 tacggactat gtctttgacg gtaagaaacc agttggacaa gagtgggaag ttgatgaccg + 20281 accagatcca cagacagaat atggccgtac taagcgtatg ggggaagagt tagttgagaa + 20341 gcatgtgtct aatttctata ttatccgtac tgcctgggta tttggaaatt atggcaaaaa + 20401 cttcgttttt accatgcaaa atcttgcgaa aactcataag actttaacag ttgtaaatga + 20461 ccagtacggt cgtccgactt ggactcgtac cttggctgag ttcatgacct 
acctagctga + 20521 aaatcgtaag gaatttggtt attatcattt gtcaaatgat gcgacagaag acacaacatg + 20581 gtatgatttt gcagttgaaa ttttgaaaga tacagatgtc gaagtcaatc cagtagattc + 20641 cagtcaattt ccagccaaag ctaaacgtcc gctaaactca acgatgagcc tggccaaagc + 20701 caaagctact ggatttgtta ttccaacttg gcaagatgca ttgcaagaat tttacaaaca + 20761 agaagtgaga taagtagtag aatgattttc tagtctaata aaagaggcag ataatgaact + 20821 ccaaaggagc ttaagatgta cgattatctt gttgttggtg ctggtctctt tggcgcagtc + 20881 tttgcccatg aagtagcctt aaaaggaaaa aagtaaaagt cattgaaaaa cggaatcata + 20941 tcgtgggtaa tatctatact cgtgaagagg aaggaattca agttcatcaa tatggtgctc + 21001 atatcttcca tacttctgat aaggagatct gggattatgt aaatcagttt gcagggttta + 21061 accgttacac caattctcct gttgcaaact ataagggtga gatttataac cttcctttta + 21121 atatgaatac tttcaataaa ctctggggag ttgtaacgcc agcagaagca caagctaaga + 21181 ttgaggaaca acgtgctatt ttaaatggta aaactcctga aaatttggaa gaacaggcga + 21241 tttctcttgt aggtacagac atctacgaaa aattaatcaa agactataca gagaaacagt + 21301 ggggcaaacc aactactgaa cttccatcct ttattattcg ccgtttacca gtacacctga + 21361 cctatgataa caactatttt aacgatacct atcaagggat tccaattggt ggatacactc + 21421 aaatagttga aaaatgtgga tcatgaaaat attgatgtag aaacaaatgt tgatttcttt + 21481 gtgaacaaag agcaatatct gaaagatttt cctaagattg tctttactgg tatgattgat + 21541 gaattctttg actataagtt gggcgaacta gagtaccgta gtcttcgttt tgaaaatgag + 21601 accttggata tggaaaatta ccaaggaaat gcagttgtga actatacgga tgcagaaacc + 21661 ccatatactc gcattattga acacaaacat tttgagtttg ggagtcaagc aaagactatc + 21721 attaccaaag aacattctaa aacatgggaa aaaggtgatg agccttatta tccagttaat + 21781 aatgatcgta ataatcattt gtataaatca tataaaaaac ttgctgatga gcaagggaat + 21841 gttatctttg gtggccgctt aggacactat cgttattacg atatgcacca agtaattgga + 21901 gcagctttgc agtgcgtgag aaatgagtta gattcatact caatgaaaat caaagagcaa + 21961 actaggaagc tagccacagg ttgctcaaaa cactgttttg aggttgcaga tgaaagctga + 22021 cgcggtttga agagattttc gaagagtata aacaagtaaa actgactacc agttattatt + 22081 tagaaatagt attaaaaatt ccggctcttt gtcaactgta gtgggttgaa 
aaaaagctaa + 22141 gctcgagaaa ggacaaattt cgtcctttct tttttgatat tcagggcgat aaaaatccgt + 22201 tttttgaagt tttcaaagtt ccgaaaacca aaggcattgc gctttataag tttgatgaga + 22261 ttattggtcg cttccaattt ggcgtttgaa tagggtagtt gaagggcgtt gacgattttc + 22321 tctttgtcct ttagaaaggt tttaaagaca gtctgaaaaa taggatgaac ctgcttaaga + 22381 ttgtcctcaa taagtccgaa aaatttctct ggttccttat tctgaaagtg aaacagcaag + 22441 agttgataga gctgatagtg atgtttcaac ccaaatcatt catacctctc tcaactagat + 22501 gtaacttaca aaacccctga cctcatgagc cactttcttc ctcctcatga ggtcagtttt + 22561 actttctgct gttccagtat cgtttttcct cgctagattt cctcaaaagg gcagactcct + 22621 cccttggttc gtcacacgat tttttcatct cgactgttct ttaatcccca attattcacc + 22681 ccaaatctaa aaaccatcca gaatccttgc cttagcttag atcctggatg gtttttagat + 22741 ttggggtgaa taattggggt tcaagtcttg tgaatagctc aaaagcttgt ctaaaatctc + 22801 tttattggtt aaatgcatac gaaaagtagg acgataaaat cgcttatcac tcagtttacg + 22861 gctatcctgt tgtatgagct tccagtagcg cttgatagcc ttgtattcat gggattttcg + 22921 atgaaactga ttcatgattt gaacacgcac acgactcata gcacggctaa gatgttgtac + 22981 aatgtgaaag cgatccaaca cgattttagc atacgggaaa agttgtctag ctaagtcata + 23041 gtaagggcta aacatatcca tagtaataat tttgacgcga catcggacag ctctatcgta + 23101 gcgaagaaag tgatttcgaa tgatagcttg tgttcttccc tcaagaacag tgatgatatt + 23161 gagattgtta aaatcttgcg caatgaagct catctttccc tttgtaaaag catactcatc + 23221 ccaagacata atctcaggaa gacaagaaaa atcatgttta aagtgaaaat cattgagctt + 23281 acgaataaca gttgaagttg agatggaaag ctgatgggca atatcagtca tagaaatctt + 23341 ttcaattaac ttttgagcaa tcttttggtt gatgatacga gggatttggt gatttttctt + 23401 gacgagggaa gtctcagcga ccgctatttt tgagcactga tagcacttga agcgacgctt + 23461 tctaaggaga attctagtag gcataccagt cgtttcaaga taaggaattt tagaaggttt + 23521 ttgaaagtca tatttcttca attggtttcc gcactcaggg caagatgggg cgtcgtagtc + 23581 cagtttggcg atgatttcct tgtgtgtatc cttattgatg atgtctaaaa tctggatatt + 23641 agggtcttta atgtctagta attttgtgat aaaatgtaat tgttccatat gattctttct + 23701 aatgagttgt tttgtcgctt ttcattatag gtcatatggg actttttttc 
tacacaaaaa + 23761 taggctccat aatatccata gggaatttac ccactacaaa tattatagag ccaaaattcc + 23821 ttgactatgt gatatagttg agggattttt aaatgatatt catatttttt gcaaagatgt + 23881 tgtttgaaaa ataattttca aaaattctga aaattctgtt gacatctttc tgaaaagagt + 23941 ctataatgga gagaaagttt taaaggagaa aatgatgaaa agttcaaaac tacttgccct + 24001 tgcgggcgtg acattattg +// + diff --git a/public/res/serotype_genbank/serotype_7B.gb b/public/res/serotype_genbank/serotype_7B.gb new file mode 100644 index 0000000..d392462 --- /dev/null +++ b/public/res/serotype_genbank/serotype_7B.gb @@ -0,0 +1,960 @@ +LOCUS contig_1 21441 bp DNA linear UNK 11-JUN-2024 +DEFINITION contig_1, whole genome shotgun sequence. +ACCESSION contig_1 +VERSION contig_1 +KEYWORDS . +SOURCE None + ORGANISM . + . +COMMENT Annotated with Bakta + Software: v1.9.3 + Database: v5.1, full + DOI: 10.1099/mgen.0.000685 + URL: github.com/oschwengers/bakta + + ##Genome Annotation Summary:## + Annotation Date :: 06/11/2024, 07:41:56 + CDSs :: 21 + tRNAs :: 0 + tmRNAs :: 0 + rRNAs :: 0 + ncRNAs :: 0 + regulatory ncRNAs :: 0 + CRISPR Arrays :: 0 + oriCs/oriVs :: 0 + oriTs :: 0 + gaps :: 0 + pseudogenes :: 0 +FEATURES Location/Qualifiers + source 1..21441 + /mol_type="genomic DNA" + gene complement(459..797) + /locus_tag="POEHKI_00005" + CDS complement(459..797) + /db_xref="SO:0001217" + /db_xref="UniRef:UniRef50_D2ZX36" + /db_xref="UniRef:UniRef90_A0A4J1YQ37" + /product="IS630-Spn1, transposase Orf2" + /locus_tag="POEHKI_00005" + /protein_id="gnl|Bakta|POEHKI_00005" + /translation="MVAGLTNGELIAPMTYEEMMTSDFFEVWFQKFFLPTLTTPSVIIM + DNARFHRMGKLELLCEEFGHKLLPLPPYSPEYNPIEKTWAHIKKHLKKVLPSCNTFYEA + LLSCSCFN" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA + sequence:UniRef:UniRef90_A0A4J1YQ37" + gene 1219..2664 + /locus_tag="POEHKI_00010" + /gene="wzg" + CDS 1219..2664 + /db_xref="BlastRules:WP_000091082" + /db_xref="COG:COG1316" + /db_xref="COG:M" + /db_xref="RefSeq:WP_050079295.1" + 
/db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FE30" + /db_xref="UniRef:UniRef100_Q4JZ21" + /db_xref="UniRef:UniRef50_G3G7D5" + /db_xref="UniRef:UniRef90_O54604" + /db_xref="UniprotKB:Q4K2U9" + /db_xref="UserProtein:wzg" + /product="""integral membrane regulatory protein Wzg""" + /locus_tag="POEHKI_00010" + /protein_id="gnl|Bakta|POEHKI_00010" + /translation="MSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAFR + YLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNRLN + ATSNYSEYSLSVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKLSQNTDLTVDQ + SSSYLVAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAPKTSK + NQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADGGNNQK + DKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQEFSALH + GKFHFPVGNVHLDSEQALSFVRERYSLADGDRDRGRNQQKVIVAILQKLTSTEALKNYS + TIIDSLQDSIQTNMPLETMIDLVNAQLESGGTYKVNSQDLKGTGRMDLPSYAMPDSNLY + VMEIDDSSLAVVKAAIQDVMEGR" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050079295.1" + /gene="wzg" + gene 2666..3397 + /locus_tag="POEHKI_00015" + /gene="wzh" + CDS 2666..3397 + /db_xref="EC:3.1.3.48" + /db_xref="GO:0004725" + /db_xref="GO:0030145" + /db_xref="GO:0045227" + /db_xref="RefSeq:WP_050079293.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FE31" + /db_xref="UniRef:UniRef100_Q4JZ20" + /db_xref="UniRef:UniRef50_Q54518" + /db_xref="UniRef:UniRef90_Q54518" + /db_xref="UniprotKB:Q4JZ20" + /db_xref="UserProtein:wzh" + /product="""protein-tyrosine phosphatase Wzh""" + /locus_tag="POEHKI_00015" + /protein_id="gnl|Bakta|POEHKI_00015" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRRK + GMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTLDALEKLEKKEIPTLNDSRY + ALIEFSMHTSYRQIHTGLSNILMLGITPVIAHIERYDALENNEKRVRELIDMGCYTQIN + SCHVSKPKFFGEKYKFMKKRARYFLERDLVHVVASDMHNLDSRPPYMQQAYDIIAKKYG + AKKAKELFVDNPRKIIMDQLI" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA 
sequence:RefSeq:WP_050079293.1" + /gene="wzh" + gene 3406..4098 + /locus_tag="POEHKI_00020" + /gene="wzd" + CDS 3406..4098 + /db_xref="BlastRules:WP_000664160" + /db_xref="GO:0005351" + /db_xref="GO:0005886" + /db_xref="GO:0009103" + /db_xref="GO:0015774" + /db_xref="GO:0045227" + /db_xref="RefSeq:WP_050079291.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FE32" + /db_xref="UniRef:UniRef100_Q4JZ19" + /db_xref="UniRef:UniRef50_Q54519" + /db_xref="UniRef:UniRef90_Q54519" + /db_xref="UniprotKB:Q4JZ19" + /db_xref="UserProtein:wzd" + /product="""capsular polysaccharide biosynthesis protein + Wzd""" + /locus_tag="POEHKI_00020" + /protein_id="gnl|Bakta|POEHKI_00020" + /translation="MQDQNTLEIDVLQLFRALWKRKLVILLVAIITSSVAFAYSTFVIK + PEFTSTTRIYVVNRNQEEKSGLTNQDLQAGTYLVKDYREIILSQDVLEEVISDLKLDLT + PKGLANKIKVIVPIDTRIVSVSVNDRVPEEASRIANSLREVAAKKIISITRVSDVTTLE + EARPAISPSSPNIKRNTLIGFLAGGLGTSVIVLLLELLDTRVKRPEDIEDTLQMTLLGV + VPNLSKLK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050079291.1" + /gene="wzd" + gene 4108..4791 + /locus_tag="POEHKI_00025" + /gene="wze" + CDS 4108..4791 + /db_xref="BlastRules:WP_001142521" + /db_xref="COG:COG0489" + /db_xref="COG:D" + /db_xref="EC:2.7.10.2" + /db_xref="GO:0004715" + /db_xref="GO:0005524" + /db_xref="GO:0016310" + /db_xref="GO:0045227" + /db_xref="RefSeq:WP_050079289.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FE33" + /db_xref="UniRef:UniRef100_Q4JZ18" + /db_xref="UniRef:UniRef50_Q54520" + /db_xref="UniRef:UniRef90_Q54520" + /db_xref="UniprotKB:Q4JZ18" + /db_xref="UserProtein:wze" + /product="""tyrosine-protein kinase Wze""" + /locus_tag="POEHKI_00025" + /protein_id="gnl|Bakta|POEHKI_00025" + /translation="MPTLEIAQKKLEFIKKAEEHYNALCTNIQLSGDKLKVISVTSVNP + GEGKTTTSVNIARSFARAGYKTLLIDGDTRNSVMSGFFKSREKITGLTEFLSGTADLSH + GLCDTNIENLFVVQSGSVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTAPIGIVIDAA + IITQKCDASILVTATGEVNKRDAQKAKQQLEQTGKLFLGVVLNKLDISVDKYGVYGSYG + 
NYGKK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050079289.1" + /gene="wze" + gene 4807..6174 + /locus_tag="POEHKI_00030" + /gene="wchA" + CDS 4807..6174 + /db_xref="RefSeq:WP_050079287.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FE34" + /db_xref="UniRef:UniRef100_Q4JZ17" + /db_xref="UniRef:UniRef50_Q8VU30" + /db_xref="UniRef:UniRef90_P72513" + /db_xref="UniprotKB:Q4JZ17" + /db_xref="UserProtein:wchA" + /product="""undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)""" + /locus_tag="POEHKI_00030" + /protein_id="gnl|Bakta|POEHKI_00030" + /translation="MDEKGLKIFLAVLQSIIVILLVYFLSFVRETEVERSSMVILYLLH + FFVFYFSSYGNNFFKRGYLVEFNSTIRYIFFFAIAIGVLNFFIVERFSISRRGMVYFLT + LEGISLYLLNFLVKKYWKHVFFNLKNSKKILLLTVTKNMEKVLDKLLESDELSWKLVAV + SVLDKSDFQHDKIPVIEKEKIIEFATHEVVDEVFINLPGESYDIGEIISRFETMGIDVT + VNLNAFDKNLGRNKQIHEMVGLNVVTFSTNFYKTSHLISKRILDICGATIGLILFAIAS + LVLVPLIRKDGGPAIFAQTRIGKNGRHFTFYKFRSMRIDAEAIKEQLMDQNTMQGGMFK + INNDPRVTKIGRFIRKTSLDELPQFWNVFIGDMSLVGTRPPTVDEYDQYTPKQKRRLSF + KPGITGLWQVSGRSKITDFDAVVKLDVAYIDNWTIWKDIEILLKTVKVVFMRDGAK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050079287.1" + /gene="wchA" + gene 6205..7386 + /locus_tag="POEHKI_00035" + /gene="wchF" + CDS 6205..7386 + /db_xref="RefSeq:WP_050079285.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FE35" + /db_xref="UniRef:UniRef100_Q4JZ16" + /db_xref="UniRef:UniRef50_A0A4L8A7M3" + /db_xref="UniRef:UniRef90_Q4K2S4" + /db_xref="UniprotKB:Q4JZ16" + /db_xref="UserProtein:wchF" + /product="""putative rhamnosyl transferase WchF""" + /locus_tag="POEHKI_00035" + /protein_id="gnl|Bakta|POEHKI_00035" + /translation="MKKSVYIIGSKGIPAKYGGFETFVEKLTAFQQDKAIQYYVACMRE + NSAKSGTTEDVFEHNGAICYNVDVPNIGPARAIAYDIAAINRAIEIAKENKDENPIFYI + LACRIGPFIHGIKKRIQAIGGTLLVNPDGHEWLREKWSLPVRKYWKYSERLMVKYADLL + 
VCDSKNIEQYIQEDYKQFQPKTTYIAYGTDTTPSILKFEDTKVRNWYQEKGISENGYYL + VVGRFVPENNYEAMIREFIKSQSKKDFVLITNVEQNKFYDKLLRETGFDQDPRIKFVGT + VYDQELLKYIRENAFAYLHGHEVGGTNPSLLEALGSTKLNLLLDVGFNREVGEDGAIYW + QKDELSRVIEYVETINQATIANLNFKSTQRILSDFTWEKIVADYEGVFCFAKS" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050079285.1" + /gene="wchF" + gene 7373..8233 + /locus_tag="POEHKI_00040" + /gene="wcwI" + CDS 7373..8233 + /db_xref="RefSeq:WP_050079283.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0005DFE1CF" + /db_xref="UniRef:UniRef100_UPI0005DFE1CF" + /db_xref="UniRef:UniRef50_A0A853PIH8" + /db_xref="UniRef:UniRef90_A0A853PIH8" + /db_xref="UniprotKB:Q4K2U3" + /db_xref="UserProtein:wcwI" + /product="""putative glycosyl transferase""" + /locus_tag="POEHKI_00040" + /protein_id="gnl|Bakta|POEHKI_00040" + /translation="MRRVSVPNLYAVVVLYNSLLSEAKILKTLNTLNCKELNLIVVDNS + DRKEIQLKNKNFSTENNITLVNMNGNQGLSKAYNKVLELLKGRIGYVVWLDDDTEISVE + YLTKLLYASRGNYDIILPIIQDTHGKIVSPNSRGLLSNKPIKSYKDGKKLEKFNAINSC + TAVNLDIYEEYRYDERLFLDEIDHSFFYDHRNKNLKIELINTIVIQNFSQRADNLNFDT + AWSRLKIRIRDLIVAYKIRGGIFMGLVAVLKSILLGLQLYLKIKDLRIVIYSFTSALCI + FFRKT" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050079283.1" + /gene="wcwI" + gene 8254..9426 + /locus_tag="POEHKI_00045" + /gene="wcwL" + CDS 8254..9426 + /db_xref="RefSeq:WP_160313365.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0005E850D9" + /db_xref="UniRef:UniRef100_Q4K2U2" + /db_xref="UniRef:UniRef50_Q4K2U2" + /db_xref="UniRef:UniRef90_Q4K2U2" + /db_xref="UniprotKB:Q4K2U2" + /db_xref="UserProtein:wcwL" + /product="""putative glycosyl transferase""" + /locus_tag="POEHKI_00045" + /protein_id="gnl|Bakta|POEHKI_00045" + /translation="MNNTDHGGAALALLDLVTQINENYPEYELIVVTGKKNNLNVKLTE + IGIENYFFPFRNFISSYKKPAILWTILYKIRHYIGNRMALKKIEKKIDLKKIDIIHSNL + NRIDIGAILAKKHSIPHLWHIREHLDVWYFYNKLDHRKFEYGLKVLTTEKNYIFYMCSF + 
STKYIAISNSVAMDWCKKGLSQSSIVKVYDGIKLPQVFGDKKWFRNKKINIVFVGGYDI + KKGQELFLSYFLKLPKEIQMQYTLTFYGSGKSKYIKKLQKMSQHLCSDQVKFHSYIDNL + TELLPNYDIGINFSTTEGFGRVIVEYLANGLCVVASKNGASPELITEEVGFLIDKDNQD + EFIQLFTKLSIEKNKIRQMGNKAIEHAQKFSIDQHTREIINVYQEMRNKQ" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_160313365.1" + /gene="wcwL" + gene 9423..10430 + /locus_tag="POEHKI_00050" + /gene="wcwK" + CDS 9423..10430 + /db_xref="EC:2.7.-.-" + /db_xref="GO:0000271" + /db_xref="GO:0016772" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FE38" + /db_xref="UniRef:UniRef100_Q4K2U1" + /db_xref="UniRef:UniRef50_Q4K2S1" + /db_xref="UniRef:UniRef90_Q4K2S1" + /db_xref="UniprotKB:Q4K2U1" + /db_xref="UserProtein:wcwK" + /product="""putative glycosyl transferase""" + /locus_tag="POEHKI_00050" + /protein_id="gnl|Bakta|POEHKI_00050" + /translation="MKNMEQIDFVVTWVNDKDVDWCKRKSEFEKEYNIFQDLNSEERYR + EWGLMKYWFRAVEKYAPWVNKIYFITEGHVPNWLDVNHPKLVHVKHEDYIEKQFLPTFN + SNVIEMNLIHLKDLSEKFVLFNDDFFINDFVKQSDFFENNLPKDTGIFSPLIPRENSLT + PIILNNMEIINKYFSKKKILEQNFSKFFNIKYGKHLLKNICLLPWSDLLGFYDNHIPVS + YCKSNFLEVYEKEHAIFNLTFKNKFRNKNEINHWLIRYWQLSSGNFIPRNINFGKNYAI + SNDPTDIINELKLSKYKIICINDGESIDNFDAVKGLMINAFEKKFPEKSSFEKK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef100_Q4K2U1" + /gene="wcwK" + gene 10442..11353 + /locus_tag="POEHKI_00055" + /gene="wcxU" + CDS 10442..11353 + /db_xref="RefSeq:WP_057604654.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0005DCCEAF" + /db_xref="UniRef:UniRef100_Q4K2U0" + /db_xref="UniRef:UniRef50_Q4K2S0" + /db_xref="UniRef:UniRef90_Q4K2S0" + /db_xref="UniprotKB:Q4K2U0" + /db_xref="UserProtein:wcxU" + /product="""putative glycosyl transferase""" + /locus_tag="POEHKI_00055" + /protein_id="gnl|Bakta|POEHKI_00055" + /translation="MNLEDLVLIILNYNSAKDTLRCLEILRSFNMNFKIIVVDNNSTDN + 
SIELLKNIEDPQTTFLISDENRGYGAGNNIGIHFAENHFSSNIIGIINPDIVIPNQEVI + ISMYNVLKNSDFAMVGGSVIDNEGNYRLLNSSWDLPSFKSVVLERFLIYNRHKVPYCLN + MYNDETAIVDCVAGCFFMIKADVMKEIGYFDENVFLYNEENILGMKLREKGFQSIILTK + QFYYHLHDFEKDKVELSLSKKCKRDWVKFQSRKYFTEKYYSKFLGFLLFFVEIFNLFQI + MIGHLKNNIIKKNLKGNSSEKK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_057604654.1" + /gene="wcxU" + gene 11340..12587 + /locus_tag="POEHKI_00060" + /gene="wzy" + CDS 11340..12587 + /db_xref="RefSeq:WP_050079275.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FE3A" + /db_xref="UniRef:UniRef100_Q4K2T9" + /db_xref="UniRef:UniRef50_Q4K2R9" + /db_xref="UniRef:UniRef90_Q4K2R9" + /db_xref="UniprotKB:Q4K2T9" + /db_xref="UserProtein:wzy" + /product="""oligosaccharide repeat unit polymerase Wzy""" + /locus_tag="POEHKI_00060" + /protein_id="gnl|Bakta|POEHKI_00060" + /translation="MKKSSTLHSSTLHIGLILFLIVLSKNFFNLVPNIALFSDFNLMII + IIIMTVVNIKYYNRSTKYQYRWYIIFTLIFVLYSAINEKLLYGQPFLLGLLPQRQFFLC + LMTYFPLRKYFQEQNISLKKLYVGIMNLGSISSLIYILQKIVILYGGTQFVNVMYSFAG + YFSGYRLYVGSSLIILATLISTAYFLETLKLKYLCHLILGWFTEIWITQGRIEMIVLLI + STIVCIIVQGRLTRKKIIYWLLTILGLWMITLTPIFENIVGAILKVDGAGRGSDSLTIR + AIGRQLYWDQLNETTSKLLFGTGYPNYNYALAFQRTGFSSNIFLTDNGFMTYIYIFGIV + GSSIMGLLFLKYLKNSIKYARQSADMIPLMYIISLLIVAYNIILWYWNADGTFILVIMI + CALEHGEQLLHQRNGV" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050079275.1" + /gene="wzy" + gene 12592..14544 + /locus_tag="POEHKI_00065" + /gene="rbsF" + CDS 12592..14544 + /db_xref="RefSeq:WP_050079274.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FE3B" + /db_xref="UniRef:UniRef100_Q4K2T8" + /db_xref="UniRef:UniRef50_Q4K2T8" + /db_xref="UniRef:UniRef90_Q4K2T8" + /db_xref="UniprotKB:Q4K2T8" + /db_xref="UserProtein:rbsF" + /product="""putative phosphotransferase""" + /locus_tag="POEHKI_00065" + /protein_id="gnl|Bakta|POEHKI_00065" + 
/translation="MNLNKEVRWKDKQYIAFDFFDTTIHRNCHPEVILFEWSKKISIYF + SFKISATEIYSIRKKSEIHEKQEKQLEEIKYERLLQLVFYTILSRLKSDVTDYTLEDFL + IYARTCEEEIELRHISIDTDTINFIEFLKQNGKKIILISDFYSDKKLIEKLMVSLGIRD + YFSKIFISSEIGLRKSSGNLYEYVINELSCKPINLLMIGDNIYSDVKVPKKLGIDSYHK + SYSDSHVTVSPNDIVKAMNNVISQACTESLFNLYIPEILYFISKLYKELSVNKASDILF + CAREGFFIKKLFDLYQKKMNLKLINSHYFYVSRKSTLYPSFKNIEDEDFEVIFRQFPEI + TLENFLINLNFSNNDINNISKQTEIKQTDKVSDKSIINKLKQNKLFKDVYDLNCKEEKY + SFREYLKSVGVENDNSTINMVDIGWKGTIQDNIQKAFPSLNIKGYYMGLNFQRYSTRNS + MNKTGILFTDDPQKTKFFNLFNYKYLFYERIFVADHGPTVRYEFMNGVGVPTLDTDENH + IEIYRFSEEFQITFFNTFEKILDLFNESLVTPDELFNEIANLSLKKHCIYLPRLSVSIK + KLDRAAKENFGIIKSTNRNSDNKVRNFWKNRDFLFLDYIYKAYGKNRLLNPILDIYGYF + VYLIKTLQIKIVGDI" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050079274.1" + /gene="rbsF" + gene 14544..16001 + /locus_tag="POEHKI_00070" + /gene="wzx" + CDS 14544..16001 + /db_xref="RefSeq:WP_224781814.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI0005E9F0F1" + /db_xref="UniRef:UniRef100_Q4JZ09" + /db_xref="UniRef:UniRef50_I1ZPG7" + /db_xref="UniRef:UniRef90_Q4K0A9" + /db_xref="UniprotKB:Q4K2T7" + /db_xref="UserProtein:wzx" + /product="""flippase Wzx""" + /locus_tag="POEHKI_00070" + /protein_id="gnl|Bakta|POEHKI_00070" + /translation="MSMKEKSINKNAILNIILTLTNIVFPLITFPYISRILNPSGIGAI + SFFSSIGSYGVLVASLGISTYGIRVIAKDRYHKDKITKIFQELIVINSVMSIIVTFFLV + LMSFRLEQLSSEKGLLIITCITILSSPFNLNWFYSGIEEYSYITKRSIFFKLVSLILTF + LFVKSKDDYILYAVITLFSTLASNFINILESRKYINFNLRRDLEFRYHLKPMWYLFASL + LAVNIYINLDSVMLGIINGNDAVGIYSIASKVKWILLSVVTSVSSVLLPRLSFYSNKYD + ETKFNNILRKSSTIIFMISIPLTIFFMIKAKESILLLGGEQYIQAVLAMQILMPILVIS + GFSNITGNQILIPTGNEKYFMRAVSIGAIVNLCLNLLLMPILGIIGGAIATLCAESVQM + IIQFYFSRNKLMGNISLNSIKKIAYSSIFAGILLIVIQNIIENFNSFLNLAASSFLYFG + VYFFLLVLFKESTIKKFLNQIFYKDIS" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_224781814.1" + /gene="wzx" + gene 
16176..17045 + /locus_tag="POEHKI_00075" + /gene="rmlA" + CDS 16176..17045 + /db_xref="EC:2.7.7.24" + /db_xref="GO:0008879" + /db_xref="GO:0009243" + /db_xref="GO:0019305" + /db_xref="RefSeq:WP_050079273.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FE3D" + /db_xref="UniRef:UniRef100_Q4K2T6" + /db_xref="UniRef:UniRef50_A0A366WAT5" + /db_xref="UniRef:UniRef90_Q4K105" + /db_xref="UniprotKB:Q4K2T6" + /db_xref="UserProtein:rmlA" + /product="""glucose-1-phosphate thymidylyltransferase + RmlA""" + /locus_tag="POEHKI_00075" + /protein_id="gnl|Bakta|POEHKI_00075" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLAG + IRDILIISTPQDLHRFQELLQDGSEFGLKLSYAEQPSPDGLAQAFIIGEEFISDDSVAL + ILGDNIYHGSGLSKMLQKAASKESGATVFGYHVKDPERFGVVEFDQDMKAISIEEKPEH + PRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVELMGRGFAWL + DTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLALAQPLKKNEYGQY + LLRLIGEA" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050079273.1" + /gene="rmlA" + gene 17046..17642 + /locus_tag="POEHKI_00080" + /gene="rmlC" + CDS 17046..17642 + /db_xref="RefSeq:WP_050079271.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FE3E" + /db_xref="UniRef:UniRef100_Q4JZ07" + /db_xref="UniRef:UniRef50_Q5XCG7" + /db_xref="UniRef:UniRef90_A0A1S0ZBJ9" + /db_xref="UniprotKB:Q4JZ07" + /db_xref="UserProtein:rmlC" + /product="""dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC""" + /locus_tag="POEHKI_00080" + /protein_id="gnl|Bakta|POEHKI_00080" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEKM + LPLGFPASFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREGET + FGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYADPS + LGIEWENIAEAEVSEADKHHPLLKDVKPLKKEDLE" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050079271.1" + /gene="rmlC" + gene 17652..18701 + /locus_tag="POEHKI_00085" + /gene="rmlB" + CDS 
17652..18701 + /db_xref="COG:COG1088" + /db_xref="COG:M" + /db_xref="EC:4.2.1.46" + /db_xref="GO:0008460" + /db_xref="GO:0009243" + /db_xref="GO:0019305" + /db_xref="RefSeq:WP_050079266.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FE3F" + /db_xref="UniRef:UniRef100_Q4K2T4" + /db_xref="UniRef:UniRef50_P95780" + /db_xref="UniRef:UniRef90_F3UAC1" + /db_xref="UniprotKB:Q4K2T4" + /db_xref="UserProtein:rmlB" + /product="""dTDP-D-glucose 4,6-dehydratase RmlB""" + /locus_tag="POEHKI_00085" + /protein_id="gnl|Bakta|POEHKI_00085" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPDVHVTVLDKLTYAGNR + ANIEEILGSRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTNFI + GTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSPYSS + TKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLYGEGK + NVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAADAYDHV + TDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKEAVEANY + AKTQEIITV" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_050079266.1" + /gene="rmlB" + gene 18767..19618 + /locus_tag="POEHKI_00090" + /gene="rmlD" + CDS 18767..19618 + /db_xref="COG:COG1091" + /db_xref="COG:M" + /db_xref="EC:1.1.1.133" + /db_xref="GO:0008831" + /db_xref="GO:0009243" + /db_xref="GO:0019305" + /db_xref="KEGG:K00067" + /db_xref="RefSeq:WP_000600913.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000003EFAD" + /db_xref="UniRef:UniRef100_Q9AH81" + /db_xref="UniRef:UniRef50_Q9AH81" + /db_xref="UniRef:UniRef90_Q9AH81" + /db_xref="UniprotKB:Q9AH81" + /db_xref="UserProtein:rmlD" + /product="""dTDP-4-keto-L-rhamnose reductase RmlD""" + /locus_tag="POEHKI_00090" + /protein_id="gnl|Bakta|POEHKI_00090" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAKMDITNEEMVEKV + FEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTDYV + FDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKNFVF + TMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDTTWYD + 
FAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQEFYKQE + VR" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000600913.1" + /gene="rmlD" + gene 19954..20187 + /locus_tag="POEHKI_00095" + CDS 19954..20187 + /db_xref="SO:0001217" + /db_xref="UniParc:UPI00020451F3" + /db_xref="UniRef:UniRef100_A0A916L630" + /db_xref="UniRef:UniRef50_A0A916L630" + /db_xref="UniRef:UniRef90_A0A916L630" + /product="UDP-galactopyranose mutase Glf" + /locus_tag="POEHKI_00095" + /protein_id="gnl|Bakta|POEHKI_00095" + /translation="MNTFNKLWGVVTPAEAQAKIDEQRAILNGKTPENLEEQAISLVGT + DIYEKLIKDYTEKQWGKPTTELPAFIIVCQYA" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA + sequence:UniRef:UniRef100_A0A916L630" + gene 20261..20764 + /locus_tag="POEHKI_00100" + CDS 20261..20764 + /db_xref="EC:5.4.99.9" + /db_xref="KEGG:K01854" + /db_xref="SO:0001217" + /db_xref="UniRef:UniRef50_A0A822VKG6" + /db_xref="UniRef:UniRef90_A0A4J2E3K5" + /product="UDP-galactopyranose mutase Glf" + /locus_tag="POEHKI_00100" + /protein_id="gnl|Bakta|POEHKI_00100" + /translation="MLDHENIDVETNVDFFVNKEQYLKDFPKIVFTGMIDEFFDYKLGE + LEYRSLRFENETLDMENYQGNAVVNYTDAEIPYTRIIEHKHFEFGSQAKTIITKEHSKT + WEKGDEPYYPVNNDRNNHLYKSYKKLADEQGNVIFGGRLGHYRYYDMHQVIGAALQCVR + NELD" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA + sequence:UniRef:UniRef90_A0A4J2E3K5" + gene 20771..20848 + /locus_tag="POEHKI_00105" + CDS 20771..20848 + /db_xref="SO:0001217" + /db_xref="UniRef:UniRef50_A0A9Q5N676" + /db_xref="UniRef:UniRef90_A0A9Q5N676" + /product="Chlorohydrolase" + /locus_tag="POEHKI_00105" + /protein_id="gnl|Bakta|POEHKI_00105" + /translation="MKIKEQTRKLATGCSKYCFEVADGS" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Bakta:1.9" + /inference="similar to AA + sequence:UniRef:UniRef50_A0A9Q5N676" +ORIGIN + 1 tgtccaatga 
agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcgta taaaaacaag + 181 ggaggactgt ataaaaggca gaaatccttt gttttttata accaaggttt ataaaccttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga agacgaacat + 301 aaagaagcgt atccttagtg caggcctgac ttttacatct gctttgcttt tagctgcttg + 361 cgaccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaactat ctattagact attacgctga taatatagtc aattgaaaca agaacaagac + 481 aaaagagcct cataaaaggt attgcaactt ggtaatacct ttttgaggtg ctttttgata + 541 tgagcccatg ttttctcaat aggattgtac tcaggtgagt agggaggaag aggtaaaagt + 601 ttatgcccaa actcttcgca taaaagttct agcttcccca ttctatggaa tcttgcatta + 661 tccataataa taaccgatgg tgtggttaat gttggtaaga aaaacttctg aaaccatact + 721 tcaaaaaagt cgctcgtcat catctcttcg taagtcattg gagcgattaa ttcaccattt + 781 gttagacctg caaccaaaga aatcctctga tatcttcttc cagatacttt gcctcttctt + 841 aactgacctt ttaatgagcg accatattct cgataaaaat aagtatcgaa tcctgtttca + 901 tcaatctaaa caggtgctag gtgctttaaa ctattaaaat tcttaagaaa taaggctact + 961 tttctgggtc ttgttcataa ttagattgaa actagagtag tagacctctg cttctaaaac + 1021 attgttagaa atcgatttga ctgtcctgat cgatttgtca tgttcttatt tcattttact + 1081 atatttttgt ttcgcgggaa gtctactaag atacttaaag atgcagatag taaaaaaaga + 1141 tgcagatagt aaaaaaatgt agacattacc gtaaaaaagt gatataatca taagatgttc + 1201 aatgtatagg tgttaatcat gagtagacgt tttaaaaaat caggttcaca gaaagtgaag + 1261 cgaagtgtta atatagtttt gctgactatt tatttattgt tagtttgttt tttattgttc + 1321 ttaatcttta agtacaatat ccttgctttt agatatctta atctagtggt aactgcgtta + 1381 gtcttactag tagccttggt agggctactc ttgattatct ataaaaaagc tgaaaaattt + 1441 actatttttc tgttggtgtt ctctatcctt gtcagctcag tgtcgctctt tgcagtacag + 1501 cagtttgttg gactgaccaa tcgtttaaat gcgacttcta attactcaga atattcgctc + 1561 agtgtcgctg ttttagcaga tagtgagatc gaaaatgtta cgcaactgac gagtgtgaca + 1621 gcaccgactg ggactgataa tgaaaatatt caaaaactac tagctgatat 
caagttaagt + 1681 cagaataccg atttgacagt cgaccagagt tcgtcttact tggttgctta caagagtttg + 1741 attgcagggg agactaaggc cattgtccta aatagtgtct ttgaaaatat catcgagtca + 1801 gagtatccag actacgcatc gaagataaag aagatttata ccaagggatt tactaaaaaa + 1861 gtagaagctc ctaagacgtc taagaatcag tctttcaata tctatgttag tggaattgac + 1921 acctatggtc ctattagttc ggtgtcgcga tcagatgtca atatcctgat gactgtcaat + 1981 cgtgatacca agaaaatcct cttgaccaca acgccacgtg atgcctatgt accaatcgca + 2041 gatggtggaa ataatcaaaa agataaatta acccatgcgg gcatttatgg agttgattcg + 2101 tccattcaca ccttagaaaa tctctatgga gtggatatca attactatgt gcgattgaac + 2161 ttcacttctt tcttgaaaat gattgactta ttgggagggg tagatgttca taatgatcaa + 2221 gagttttcag ctctacatgg gaagttccat ttcccagtag ggaatgtcca cctagactct + 2281 gagcaggctc taagttttgt acgtgaacgc tactcactag ccgatggaga ccgtgaccgt + 2341 ggtcgcaacc aacaaaaggt gattgtggct atccttcaaa aattaacgtc aaccgaagca + 2401 ctgaaaaatt atagtacgat cattgatagc ttgcaagatt ctatccaaac aaatatgcca + 2461 cttgagacca tgatagattt ggtcaatgct cagttagaaa gtggtggaac ttacaaagtg + 2521 aattcgcaag acttgaaagg tacaggtcgg atggatcttc cttcttatgc aatgccagac + 2581 agtaacctct atgtgatgga aatagatgat agtagtttag ctgtagttaa agcagctata + 2641 caggatgtga tggagggtag atgaaatgat agacatccat tcgcatatcg tttttgatgt + 2701 agatgacggt cccaagtcaa gagaggaaag caaggctctc ttggcagaat cctacaggca + 2761 gggggtgcga accattgtct ctacctctca ccgtcgcaag ggcatgtttg aaactccgga + 2821 agagaagata gcagaaaact ttcttcaggt tcgggaaatt gcaaaagaag tagcagatga + 2881 tttagtcatt gcttatggtg cagagatata ctatactctg gatgctctag aaaagctaga + 2941 aaaaaaagaa attcctaccc ttaatgatag tcgttatgcc ttgattgagt ttagcatgca + 3001 tacttcctat cgtcagattc atacgggatt gagcaatatt ttgatgttgg gaatcacacc + 3061 agtaattgct catattgaac gttatgatgc tttagagaat aacgaaaaac gtgttcgtga + 3121 actgattgat atggggtgct atactcagat aaatagttgt catgtttcaa aacctaagtt + 3181 ctttggtgaa aaatataaat tcatgaaaaa gagagctcgg tattttttgg aacgtgattt + 3241 agttcatgta gttgcaagtg acatgcacaa tttagacagt agacctccat atatgcaaca + 3301 ggcatatgat 
atcattgcta agaaatatgg agcgaaaaaa gcgaaagaac tttttgtaga + 3361 taatcccaga aaaattataa tggatcaatt aatttaggag aaaatatgca agatcaaaac + 3421 actttggaaa tcgatgtatt gcagctattc agagctttat ggaaaagaaa gttggtcatt + 3481 ttattagtgg caattataac ttcttcagtt gcttttgcct acagtacttt tgttatcaaa + 3541 cctgagttta ctagtacgac tcggatttat gtagttaacc gtaatcagga agagaagtct + 3601 ggtttaacca atcaagactt gcaggcagga acttatctgg taaaagacta ccgtgaaatt + 3661 atcctatcgc aggatgtttt ggaggaagtt atttctgatt tgaaactaga tttgacgcca + 3721 aaaggtttgg ctaataaaat taaagtaata gtaccaattg atacccgtat tgtctctgtt + 3781 tcagttaatg atcgagttcc tgaagaagca agccgtatcg ctaactcttt gagagaagta + 3841 gctgctaaaa aaattatcag tattactcgt gtttctgatg tgacaacact ggaggaggca + 3901 agaccggcga tatcaccgtc ttcgccaaat attaaacgca atacactaat tggttttttg + 3961 gcaggggggc ttggaactag tgttatagtt cttcttcttg aacttttgga cactcgtgtg + 4021 aaacgtccag aagatatcga agatacactg cagatgacac ttttgggagt tgtaccaaac + 4081 ttgagtaagt tgaaatagga gagaggaatg ccgacattag aaatagcaca aaaaaaactg + 4141 gagttcatta agaaggcaga agaacattac aatgccttgt gtacaaatat acagttgagc + 4201 ggagataaac taaaagtaat ttccgttact tctgttaacc ctggggaagg aaaaacaact + 4261 acttccgtaa atatagcaag gtcgtttgcg cgtgcaggct ataaaactct tttgatcgat + 4321 ggcgatactc gaaattcagt tatgtcagga ttttttaaat ctcgtgaaaa aattacaggg + 4381 ctaacagaat ttttatctgg gacagctgat ttatctcacg gtttatgtga tacaaatatt + 4441 gaaaatttat ttgtagttca atcgggatct gtatcaccaa accctacagc cttgttacag + 4501 agtaaaaatt ttaatgatat gattgaaaca ttgcgtaaat attttgatta tatcattgtt + 4561 gatacagcac ctattggaat tgttattgat gcggcaatta tcactcaaaa gtgtgatgcg + 4621 tccatcttgg taacagcaac cggtgaggtg aataaacgtg atgcccaaaa agctaaacaa + 4681 caattagaac aaacagggaa actgttccta ggagttgttt taaataaatt ggatatctcg + 4741 gttgataagt atggggtata cggttcctat ggaaattatg gtaaaaaata acttaggaaa + 4801 gattttatgg atgaaaaagg attgaaaatt tttctggcag tattacagag tattattgtc + 4861 attttattgg tttattttct tagctttgtt agagagacag aagttgaacg ttcttcgatg + 4921 gttatactat accttctcca cttttttgta 
ttctatttta gttcctatgg taacaatttt + 4981 tttaaaagag ggtacctagt tgagtttaat agtaccataa gatatatttt tttctttgca + 5041 atagctatag gtgtattaaa cttttttata gtggaacggt ttagtatctc tagaagagga + 5101 atggtatact tcttaacttt agaaggaata tccttatact tgttaaattt cttagtaaag + 5161 aaatattgga agcatgtgtt ttttaatcta aaaaatagca agaaaatttt actgttaaca + 5221 gtaacgaaaa atatggaaaa agttcttgat aaattgctag aatctgatga actttcatgg + 5281 aaattggtag cagtaagtgt tttggataaa tctgattttc aacatgataa aatacctgta + 5341 attgaaaagg aaaaaattat tgaatttgca acgcatgaag ttgtggatga ggtgtttatc + 5401 aatcttccag gagagagcta cgatattgga gaaattatct ctaggtttga gacaatgggg + 5461 atagatgtaa ctgtaaatct taatgcattt gataagaatt tgggtcgcaa taaacaaatt + 5521 catgagatgg taggattgaa tgtagtcact ttctctacaa atttttataa aactagtcat + 5581 ttgatttcaa agagaattct cgatatttgt ggtgccacta ttggccttat tctttttgct + 5641 atagctagtc tagttttagt tccattgatt cgtaaagatg gcggaccagc tatttttgct + 5701 caaactcgta tagggaaaaa tggtcgacat tttacctttt ataaattccg ttcaatgcgg + 5761 atcgatgctg aagctatcaa agaacagttg atggatcaaa atacgatgca aggtggtatg + 5821 tttaagataa acaatgatcc tcgtgttaca aaaattggtc gctttattcg taaaaccagt + 5881 ttggatgaat tgccacaatt ttggaatgtc tttattggag atatgagttt ggttgggacg + 5941 cgtccaccga cagtagacga atatgatcag tatactccaa aacagaaacg tcgactcagc + 6001 tttaagcctg gtattacagg cttatggcag gttagtgggc gtagtaaaat aaccgatttt + 6061 gatgctgttg taaaattaga tgtggcttat attgataatt ggacaatctg gaaagatatt + 6121 gaaattttgc ttaaaactgt taaagttgta tttatgagag atggagcgaa gtaatttctg + 6181 tatatccatc atattaggag agaaatgaaa aagtcagttt atatcattgg ttcaaaagga + 6241 attcctgcta agtatggagg atttgaaact tttgttgaaa aattaacagc cttccaacaa + 6301 gataaggcta tccaatatta tgtggcttgt atgcgtgaaa actctgcaaa atcagggact + 6361 actgaggatg tttttgaaca taatggtgct atctgttata acgtcgatgt tcctaatatt + 6421 ggtccagcgc gagctatagc gtatgatatc gctgcaatta acagagctat tgaaattgcc + 6481 aaagaaaata aggatgaaaa tccaatcttc tatattttag cttgtcgaat tggtccgttc + 6541 atccatggaa ttaagaaaag aattcaagca ataggtggga ctcttctggt 
taatccggat + 6601 ggtcatgagt ggctacgaga aaaatggagt ttacctgttc gcaaatattg gaaatactct + 6661 gaaagactta tggtcaaata tgcagattta ttggtttgtg acagtaaaaa tatcgaacag + 6721 tatatccaag aagattataa acagttccaa cctaagacca cctatatcgc ttatgggacc + 6781 gatacaactc cctcaatctt gaaatttgaa gatactaaag tccgaaattg gtatcaagag + 6841 aagggaatta gtgaaaacgg ttattattta gtggtgggac gatttgtccc tgagaataac + 6901 tatgaagcta tgattcgtga atttatcaaa tcccagtcta aaaaggattt tgtcctcatt + 6961 acaaatgtgg aacaaaataa attttacgac aagttgcttc gggaaacagg ttttgaccaa + 7021 gacccaagaa tcaaatttgt tggtactgtt tatgatcagg aattgttaaa atatattcga + 7081 gaaaatgcct ttgcatattt acatggtcat gaggtggggg ggacaaatcc atcactttta + 7141 gaggctttag gatcaacaaa gttaaatttg ttgcttgatg ttggttttaa ccgtgaagtt + 7201 ggtgaggatg gagctattta ttggcaaaaa gatgaacttt cacgagtcat cgaatatgtg + 7261 gaaacgataa atcaagcaac tatcgcaaac ttaaatttta aatcaaccca aagaatcctc + 7321 tcagatttta catgggaaaa aattgtggca gattatgaag gagtattttg ttttgcgaag + 7381 agttagtgtg cccaatttat atgcagtagt agttttatac aatagtttat tatcagaagc + 7441 aaaaatttta aaaaccttaa atacattaaa ttgtaaagaa ttaaacttaa ttgtagtaga + 7501 caatagtgat aggaaagaaa tacagttaaa aaataagaac ttttccactg aaaataatat + 7561 aacattggtg aatatgaatg gaaatcaggg attatctaaa gcttataata aagtcctaga + 7621 attattaaag ggtagaatag gttatgtggt ttggttagat gatgatactg agattagtgt + 7681 agaatattta acaaaattat tgtatgcatc aagaggtaat tacgacatta ttttgcctat + 7741 tattcaagat acccatggta aaattgtttc tccaaattct cgtggtttac tttcaaataa + 7801 accgattaaa agttacaaag atggaaaaaa acttgaaaaa tttaacgcaa taaatagttg + 7861 tacagctgtc aatttagaca tttatgaaga atatagatat gatgaacgac ttttcttgga + 7921 tgaaattgat cattcgtttt tctatgacca cagaaataaa aatttaaaga tcgaattaat + 7981 taatacaata gttattcaaa atttttctca aagggctgat aatttaaatt ttgatactgc + 8041 atggagtaga ttgaaaatta gaattcggga tttgatagtg gcttataaaa ttagaggtgg + 8101 gatttttatg ggtcttgtag ctgttttaaa aagtatccta cttggactcc agttatactt + 8161 gaaaattaag gatttgcgta tagttatcta tagtttcaca tctgctttat gtattttttt + 8221 tagaaagact 
tgaaaatgaa gattttatat tttatgaata atacagatca tggtggggct + 8281 gctttagcat tattagattt agttactcag ataaatgaga attatcctga gtatgaactt + 8341 attgttgtaa cagggaaaaa aaataattta aatgttaagt taacagaaat tggtattgaa + 8401 aattactttt ttccatttag aaattttatt agttcatata aaaaacctgc aatactatgg + 8461 acgattttat ataaaattcg tcattatatc ggaaatcgaa tggctctaaa aaaaatagaa + 8521 aaaaaaattg atttgaaaaa aatcgatatt attcattcta atttaaatag aatcgatata + 8581 ggagcaatat tagccaaaaa gcacagtata ccccatttat ggcatataag agagcatttg + 8641 gatgtatggt atttttataa taaattagat catagaaagt ttgagtatgg cttgaaggtc + 8701 ttgactacgg aaaaaaatta tattttttat atgtgttctt tttcaacgaa atatattgca + 8761 atctctaact ctgtagctat ggattggtgt aaaaaaggac tatctcagtc atctattgtt + 8821 aaagtttacg acggtatcaa gttacctcaa gtatttggtg ataaaaaatg gtttagaaat + 8881 aaaaaaataa atattgtatt tgttggtggt tacgatatta aaaaaggtca ggagttgttt + 8941 ttaagctatt ttttaaaatt accaaaagaa atacaaatgc aatatacttt gactttctat + 9001 ggaagtggga aatctaagta tataaagaaa ttacaaaaga tgtctcagca tctatgttct + 9061 gatcaagtta aatttcatag ttatatagat aatcttacag aattactacc aaattatgat + 9121 attgggatta atttttcaac aacggaaggt tttggaagag tgattgttga atatttagcg + 9181 aacggtcttt gtgttgttgc aagtaaaaat ggagctagtc cagaattaat aacagaagaa + 9241 gttggatttt taatcgacaa ggataatcag gatgaattta ttcagttgtt tactaaatta + 9301 tctattgaaa agaataagat aagacaaatg gggaataaag caattgaaca tgcacaaaag + 9361 ttttcaatag accaacatac aagagagatt ataaatgtat atcaagaaat gagaaataaa + 9421 cagtgaaaaa tatggaacaa attgattttg tggtgacatg ggttaatgat aaagatgtag + 9481 attggtgtaa aagaaagtct gaatttgaga aagaatataa tatatttcaa gatttaaata + 9541 gtgaagagcg ataccgtgaa tggggtctta tgaaatattg gtttagagct gtggaaaaat + 9601 atgccccttg ggtaaataaa atttatttta taaccgaagg gcatgtacca aattggttag + 9661 atgtaaatca tcctaaattg gttcatgtta aacatgagga ttatatcgaa aaacagtttt + 9721 tgccaacttt taattcaaac gttatagaga tgaatttgat tcatttgaaa gatttatcag + 9781 agaaatttgt tctttttaat gatgattttt tcataaatga ttttgtaaaa caaagtgatt + 9841 tttttgaaaa taatttaccc aaagatacgg 
ggatttttag tcctttaata ccaagagaaa + 9901 attctttaac tcctattata ttaaacaata tggagattat taacaaatat ttttcaaaga + 9961 aaaaaattct tgagcagaat ttttctaagt tttttaacat caaatatgga aaacatctat + 10021 tgaagaatat ttgtttactg ccatggtcag atttgttagg cttctatgat aatcatattc + 10081 cagtaagtta ttgtaaaagt aatttcttgg aagtttatga gaaagaacat gccattttta + 10141 atttgacgtt taaaaataaa tttaggaata aaaatgagat taatcattgg ttaattagat + 10201 attggcaatt gtctagcggt aatttcatac ctagaaacat taattttggg aaaaattatg + 10261 ccatttcaaa tgatcctacg gatattatta atgaattaaa actttctaaa tataagatta + 10321 tatgtattaa tgatggtgaa agtatagata attttgatgc agtgaaaggt ctaatgatta + 10381 atgcttttga aaaaaagttt cctgagaaat cgagttttga gaaaaagtga ggcagataag + 10441 aatgaatttg gaagatttag tattaataat tttaaattat aatagtgcta aagatacact + 10501 acgttgttta gaaattctac gttcttttaa tatgaatttt aaaattattg tagtggataa + 10561 taattctacg gacaattcaa tagaactact caagaatata gaggatcctc aaactacttt + 10621 tttaatttct gatgagaata gaggatatgg agcaggtaat aatattggga ttcactttgc + 10681 agaaaatcat ttttcttcaa atatcatagg tattattaat ccagatatag tcattcccaa + 10741 tcaggaagtg ataatttcaa tgtataatgt tttgaaaaat agtgactttg ctatggttgg + 10801 tgggtcagta atcgataatg agggaaatta tagactatta aattcatcat gggatttacc + 10861 ttcttttaag agcgttgtac ttgaaagatt tttaatatat aatcgacata aagttccata + 10921 ttgtttaaat atgtataatg atgaaacagc gattgtagat tgtgtagcag gttgcttttt + 10981 tatgataaaa gctgatgtaa tgaaggaaat cggttatttt gatgaaaatg tttttttata + 11041 taatgaagag aacattcttg gaatgaaact gagagaaaag ggcttccaat caattatatt + 11101 aaccaaacag ttttactatc atttgcatga ttttgaaaag gataaggtag aattatcctt + 11161 gagtaaaaaa tgtaaacgag attgggtgaa atttcagtca cgtaagtatt ttaccgaaaa + 11221 atattattca aaatttttag gttttcttct tttttttgtt gaaatattta atttgtttca + 11281 aattatgata ggacacttaa aaaataatat tataaagaag aatctgaaag gaaactctag + 11341 tgaaaaaaag tagtacgtta catagtagta cgttacatat agggcttatt ctttttttga + 11401 ttgtactgag taaaaacttc tttaatttag taccaaatat agcactgttt tctgatttta + 11461 atcttatgat tattataatc atcatgacag 
ttgttaatat taaatactat aatcgctcaa + 11521 ccaaatatca gtatcgttgg tatattattt ttacattgat atttgtgttg tatagtgcaa + 11581 ttaatgagaa actattatat ggccaaccat ttctattagg tttacttcct caaagacaat + 11641 tttttttatg tttaatgact tatttccctt taagaaagta tttccaagaa caaaatatta + 11701 gtttaaaaaa actttatgtt ggtattatga atttgggatc tatttcatcg ttaatttaca + 11761 ttttacaaaa gatagtaata ttatatgggg gaacacaatt tgttaacgta atgtatagtt + 11821 ttgccggata ttttagcggg tatagattgt atgtaggtag ttctttaatt attttagcaa + 11881 cattaatttc tactgcttat tttttagaaa cattaaaact caagtatctg tgccacctta + 11941 tattaggttg gtttactgaa atttggataa cgcaaggtcg aatagagatg attgttttgc + 12001 taatttcaac gatagtttgc ataatagtcc aaggaagatt aactagaaag aaaataattt + 12061 attggttgct gacaattttg ggactgtgga tgattactct aacacctatt tttgaaaata + 12121 ttgttggagc tattttaaaa gtagatggag caggtagagg aagtgattca ttgactattc + 12181 gagcaattgg acgacagtta tattgggatc aattgaatga gacaacttca aaacttcttt + 12241 ttggaacagg atatcctaat tataattatg ctttagcctt tcaacgtaca ggtttttcaa + 12301 gcaatatttt tttaacagac aatggtttta tgacatatat atatatattt ggtattgtgg + 12361 gttcctcaat tatgggatta ttatttttaa aatatcttaa aaattcaata aagtatgcta + 12421 gacaatctgc agatatgatt ccgttgatgt atattatttc tttactaatt gtagcctata + 12481 atattattct ttggtattgg aatgcggacg gtacttttat attagtaatc atgatttgcg + 12541 cattggagca tggagaacaa ttattacatc agaggaatgg agtgtgatta gatgaattta + 12601 aataaagaag ttagatggaa ggataagcaa tatattgctt ttgatttttt tgatacaact + 12661 atccatagaa attgtcatcc tgaagtgatt ttatttgaat ggtctaaaaa aatttctatt + 12721 tatttctctt tcaaaatatc tgctacagaa atttattcaa ttaggaaaaa atctgaaata + 12781 catgagaagc aagaaaaaca attggaagaa attaaatatg aaagattact tcaacttgtt + 12841 ttttatacta ttttaagtcg tttgaagtca gatgttaccg actatactct tgaagatttt + 12901 ttaatttatg caagaacgtg tgaagaggaa atagaattaa gacatattag tattgataca + 12961 gatacaatta attttattga atttttaaaa caaaatggga aaaaaataat tttaatttca + 13021 gatttttatt ctgataaaaa gctaattgaa aaattaatgg tttcattagg gattagagat + 13081 tatttctcta aaatatttat ttcaagtgaa 
attggcttac gtaagtcatc aggaaattta + 13141 tatgaatatg tgatcaatga attgagctgt aagcctataa atttacttat gattggtgat + 13201 aatatttatt ctgatgtaaa agttccaaaa aaactaggaa tagattctta tcataaatct + 13261 tattcagatt cacatgtgac tgtgagtcct aacgatattg taaaagcgat gaataatgtt + 13321 atttctcaag cttgtactga atctttattt aatctctata tacctgaaat actttatttt + 13381 atttcaaagt tatacaaaga attatctgtt aacaaagcta gtgatatatt attttgtgca + 13441 agagaaggtt tttttataaa aaaattattt gatctttatc aaaaaaaaat gaacttaaag + 13501 cttattaact cacattattt ttatgtttct agaaaatcaa cgctatatcc atcatttaaa + 13561 aatattgagg atgaagattt tgaagttatt tttagacaat ttcctgaaat tactttagaa + 13621 aattttttga ttaatttaaa tttttccaat aatgatatta acaatatttc taagcaaaca + 13681 gaaattaaac aaacagacaa agtatcagat aaatctatta ttaacaaatt aaaacaaaat + 13741 aaattattta aagatgttta tgatttgaac tgtaaagaag aaaaatattc ttttagagaa + 13801 tatttaaagt ctgtaggagt tgagaatgac aattctacaa taaatatggt agatattggt + 13861 tggaaaggca cgatacaaga caatattcaa aaagcttttc catctttaaa tataaaaggg + 13921 tattatatgg ggttgaattt tcaacggtat tctactagga atagtatgaa taagacggga + 13981 atactgttta ctgacgatcc tcaaaaaaca aagtttttta acttatttaa ttataaatat + 14041 ttattctatg aaagaatttt tgttgcagat catggaccga cagttagata tgaatttatg + 14101 aatggtgttg gggtaccaac attggataca gatgaaaatc atatagaaat ttatagattt + 14161 tctgaggaat ttcagattac atttttcaac acatttgaga aaattttaga tttgttcaat + 14221 gaatcactag taacaccaga tgaattattt aacgaaatag ctaatttatc gttaaaaaaa + 14281 cattgcatct atttacctag gctttcagta agtataaaaa aattagatag agcagcaaaa + 14341 gaaaattttg gtattataaa atctactaac aggaatagtg ataataaggt aagaaatttt + 14401 tggaaaaata gagatttttt atttttagat tatatatata aagcgtatgg aaagaataga + 14461 ttgttaaacc ctatattgga tatttacgga tattttgtat atctgattaa aacactgcaa + 14521 ataaaaatag taggggatat ttgatgagca tgaaagaaaa atcaataaat aaaaatgcta + 14581 ttttgaatat tattttaaca ctaacaaata ttgtgtttcc attaattact tttccttata + 14641 tttctagaat tctgaatccg tcaggaatag gtgcaatctc ttttttttca tctattggtt + 14701 cttatggtgt tttagttgcc tcgcttggaa 
tttcaactta tgggattcgg gtgattgcaa + 14761 aggatcgtta tcataaagat aagataacta aaatattcca agaattgata gttattaata + 14821 gtgtaatgtc tattatagtg acgttcttcc ttgttttaat gagtttccga ttagagcagt + 14881 taagttcaga aaaaggttta ttaataatca catgtattac tattttgtcc tctcctttta + 14941 atttgaattg gttttatagt ggaatagaag agtattcata tataacaaaa cgttcaatat + 15001 tttttaaatt agtttcattg atattaacct ttttatttgt taaaagtaaa gacgattata + 15061 ttctatatgc tgtgataaca ttgttttcaa cattggcttc caattttata aatattttgg + 15121 agagtagaaa atacatcaat tttaatttga gaagggattt agaatttaga tatcatctaa + 15181 aaccaatgtg gtatttattt gcttcgttac ttgcagttaa tatttatata aatttggatt + 15241 ctgtgatgtt aggaattatt aatggaaatg atgcggtagg tatttactca atcgcatcaa + 15301 aagtaaaatg gattttatta tcagtcgtta cttcagtgag ttcagtttta ttacccagat + 15361 tatcatttta tagcaataaa tatgacgaaa cgaagtttaa taatattttg agaaagtcat + 15421 ctacaataat ttttatgatt tcaattcctc taacaatttt ttttatgata aaagcgaaag + 15481 agagtatatt attgttaggt ggagagcagt atattcaggc agttttagca atgcaaatat + 15541 taatgccgat cttggtaata tcaggttttt ctaatattac aggtaatcag atattgatcc + 15601 ctactggtaa tgagaaatat tttatgagag cagtttctat aggagcaata gtaaatttat + 15661 gtttaaattt gttgcttatg cctattttgg gaattatcgg aggtgcgatc gcaactcttt + 15721 gtgcagaatc agtccaaatg attattcaat tttatttttc tcgtaataaa ttaatgggta + 15781 atatttcatt aaattcaatc aaaaaaatag cctattcatc aatttttgcg ggtatactgt + 15841 taatagtaat acaaaatatt atagagaatt ttaatagctt cttaaattta gctgcatcta + 15901 gttttctata ttttggagta tattttttct tattggtatt gtttaaagaa agtacaatta + 15961 agaaatttct aaatcaaatt ttttataagg atatttcatg aatttattac caattattta + 16021 tggagcgatt cttgatttaa tatcagaata attttttaaa gtgaatgaaa tcaaagcaat + 16081 aaaagattaa aaaataaatt gctatctatt atgtttttct caaactaagt aaaacataac + 16141 tcatgaaaac aaattaaaaa aggagggact atagtatgaa aggtattatt ctagcaggtg + 16201 gttcggggac acgtttatat cctttgactc gcgctgcatc aaaacaactt atgccggttt + 16261 atgataaacc gatgatttac tacccacttt caacattgat gttggctggg attagggata + 16321 ttttgattat ttccactcca caggatttac 
atcgattcca agagcttctt caagacggat + 16381 ctgagtttgg gctcaaactt tcttatgcag agcaaccaag tccagatggt ttggcacaag + 16441 cctttatcat tggggaagag tttatttctg atgatagcgt tgcgctgatc ttaggtgaca + 16501 atatctatca cggttctggg ctttccaaga tgctacaaaa ggcagcgagt aaggagtcgg + 16561 gagcaactgt ttttggctac catgtcaagg atccagagcg ctttggtgtg gttgagtttg + 16621 atcaggatat gaaggctatt tctattgaag aaaagccaga gcaccctcgt tcaaactatg + 16681 cagttacagg tctctatttc tatgataatg atgtagtaga gattgccaag agtattaaac + 16741 caagtcctcg tggtgaactg gaaattacag atgtaaacaa ggcttaccta gatcgtggtg + 16801 atttgtctgt tgagcttatg ggacgtggct ttgcttggtt ggatactggc actcatgaaa + 16861 gtttactaga ggcttcgcag tacatcgaaa cagtccaacg gatgcaaaat gttcaggtag + 16921 caaacttaga agaaattgct taccgtatgg gctatatcag tcgagaagat gtattggcct + 16981 tagcccaacc acttaagaaa aatgaatacg gacagtatct gctccgtttg attggagaag + 17041 catagatgac agataatttt ttcggtaaga cgcttgcggc acgcaaggtt gaagctattc + 17101 caggcatgtt ggagtttgat atccccgttc atggagataa tcgtggctgg tttaaagaaa + 17161 atttccaaaa ggaaaaaatg cttccacttg gatttccagc gtctttcttt gcagaaggaa + 17221 aattgcaaaa caatgtatcc ttctcacgta aaaatgtcct tcgaggcctc cacgcagagc + 17281 cttgggataa gtacatctct gtagcagatg gagggaaagt tctgggttct tgggttgatc + 17341 tacgcgaggg tgaaaccttt gggaatacct atcagacagt aattgatgca agcaagggaa + 17401 tctttgttcc tcgaggcgta gctaatggct tccaagtttt atcagataca gtgtcatata + 17461 gctatctggt caatgattac tgggcgcttg aactcaaacc caagtatgcc tttgtgaact + 17521 acgctgatcc aagccttggt attgaatggg aaaatattgc agaagcagag gtttcagaag + 17581 cagataaaca tcatccccta cttaaggacg tgaagccttt gaaaaaagaa gatttggaat + 17641 aaggaaagaa tatgactgaa tacaaaaata ttatcgtgac aggtggagct ggctttatcg + 17701 gttctaactt tgtccattat gtttacgaga actttccaga tgttcacgtg acagtcctag + 17761 ataagttgac ttatgctgga aaccgcgcga atattgagga aattttaggt agtcgtgttg + 17821 agttagttgt tggtgacatt gctgatgcgg agttggtaga caagttggct gctcaagcag + 17881 atgctatcgt tcattatgca gcggaaagcc acaatgataa ttcgctcaat gatccatcgc + 17941 catttattca tactaacttc attggaacct 
atactctttt agaagctgct cgtaagtatg + 18001 atattcgctt ccaccatgta tcgacagatg aagtttatgg ggatctccct ttacgcgaag + 18061 atttgccagg tcatggagaa gggccgggtg agaaatttac ggctgaaacc aagtacaatc + 18121 caagctcgcc ttactcatca accaaggcag cctcagattt gattgtcaaa gcctgggtgc + 18181 gttcttttgg agtcaaggca acgatttcca actgttcaaa taactacggt ccttaccagc + 18241 atattgagaa gtttattcca cgacaaatca ccaatatctt gagcggtatc aagccaaaac + 18301 tttacggtga aggtaagaac gttcgtgact ggattcatac caatgaccat tcttcaggag + 18361 tttggacaat cttgacaaaa gggcaaatcg gtgaaaccta cttgattggg gctgatggtg + 18421 agaagaacaa taaggaagtt ttggaactta tccttaagga aatgggacaa gctgcggatg + 18481 cctatgatca tgtgactgac cgtgcaggac atgaccttcg ctatgcgatt gatgctagca + 18541 agctccgtga tgagttgggg tggaaacctg aatttaccaa ctttgaagct gggctcaagg + 18601 caacaatcaa gtggtataca gataaccaag aatggtggaa agcagaaaaa gaagctgttg + 18661 aagccaatta tgctaagact caggagatta ttacagtata aaaagcagga aatagctgct + 18721 ttttattgct atattgggaa gagttacata ttagaaaggt ctagagatga ttttaattac + 18781 aggggcaaat ggccaattag gaacggaact tcgctattta ttggatgaac gtaatgaaga + 18841 atacgtggca gtagatgtgg ctaagatgga cattaccaat gaagaaatgg ttgagaaagt + 18901 ttttgaagag gtgaaaccga ctttagtcta ccattgtgca gcctacaccg ctgttgatgc + 18961 agcagaggat gaaggaaaag agttggactt cgccatcaat gtgacgggga caaaaaatgt + 19021 cgcaaaagca tctgaaaagc atggtgcaac tctagtttat atttctacgg actatgtctt + 19081 tgatggtaag aaaccagttg gacaagagtg ggaagttgat gaccgaccag atccacagac + 19141 agaatatgga cgcactaagc gtatggggga agagttagtt gagaagcatg tgtctaattt + 19201 ctatattatc cgtactgcct gggtatttgg aaattatggc aaaaacttcg tttttaccat + 19261 gcaaaatctt gcgaaaactc ataagacttt aacagttgta aatgaccagt acggtcgtcc + 19321 gacttggact cgtaccttgg ctgagttcat gacctaccta gctgaaaatc gtaaggaatt + 19381 tggttattat catttgtcaa atgatgcgac agaagataca acatggtatg attttgcagt + 19441 tgaaattttg aaagatacag atgtcgaagt caagccagta gattccagtc aatttccagc + 19501 caaagctaaa cgtccgctaa actcaacgat gagcctggcc aaagccaaag ctactggatt + 19561 tgttattcca acttggcaag atgcattgca 
agaattttac aaacaagaag tgagataagt + 19621 agtagaatga ttttctagtc taataaaaga ggcagagaat gaactccaaa ggagcttaag + 19681 atgtacgatt atcttgttgt tggtgcagtc tttgcccatg aagcagtctt aaaaggaaaa + 19741 aaagtaaaag ttattgaaaa atgaaatcat atcgcgggta atatctatac tcgtgaagag + 19801 gaaggaattc aagttcatca atatggtgct catatcttcc atacttctga taaggagatc + 19861 tgggattatg taaatcagtt tgcagacttt aaccgttata ccaattctcc tgttgcaaac + 19921 tataagggtg agatttataa ccttcctttt aatatgaata ccttcaataa actctgggga + 19981 gttgtgacgc cagcagaagc acaagctaag attgatgaac aacgtgctat tttaaatggt + 20041 aaaactcctg aaaatttgga agaacaggcg atttctcttg taggtacaga catctacgaa + 20101 aaattaatca aagactatac agagaaacag tggggcaaac caactactga acttccagcc + 20161 tttattattg tttgccagta cgcctgacct atgataacaa ctattttaac gatacctatc + 20221 aagggattcc aattggtgga tacactcaaa tagttgaaaa atgttggatc atgaaaatat + 20281 tgatgtagaa acaaatgttg atttctttgt gaataaagag caatatctga aagattttcc + 20341 taagattgtc tttactggta tgattgatga attctttgac tataagttgg gcgaactaga + 20401 gtaccgtagt cttcgttttg aaaatgagac cttggatatg gaaaattacc aaggaaatgc + 20461 agttgtgaac tatacggatg cagaaatccc atatactcgc attattgaac acaaacattt + 20521 tgagtttggg agtcaagcaa agactatcat tactaaagaa cattctaaaa catgggaaaa + 20581 aggtgatgag ccttattatc cagttaataa tgatcgtaat aatcatttgt ataaatcgta + 20641 taaaaaactt gctgatgagc aagggaatgt tatctttggt ggtcgcttag gacactatcg + 20701 ttattacgat atgcaccaag taattggagc agctttgcag tgcgtgagaa atgagttaga + 20761 ttaatactca atgaaaatca aagagcaaac taggaagcta gccacaggtt gctcaaaata + 20821 ctgttttgag gttgcagatg gaagctgacg cggtttgaag agattttcga agagtataaa + 20881 caagtaaaac tgactaccag ttattattta gaaatagtat taaaaattcc ttgactatgt + 20941 gatatagttg agggattttt aaatgatatt catatttttt gcaaagatgt tgtttgaaaa + 21001 ataattttca aaaattctga aaattctgtt gacaactttc tgaaaagagt ctataatgga + 21061 gagaaagttt taaaggagaa aatgatgaaa agttcaaaac tatttgccct tgcgggcgtg + 21121 acattattgg cggcgactac tttagctgca tgctctggat caggttcaag cactaaaggt + 21181 gagaagacat tctcatacat ttatgagaca 
gaccctgata acctcaacta tttgacaact + 21241 gctaaggctg cgacagcaaa tattaccagt aacgtggttg atggtttgct agaaaatgat + 21301 cgctacggga actttgtgcc gtctatggct gaggattggt ctgtatccaa ggatggattg + 21361 acttacactt atactatccg taaggatgca aaatggtata cttctgaagg tgaagaatac + 21421 gcggcagtca aagctcaaga c +// diff --git a/public/res/serotype_genbank/serotype_7C.gb b/public/res/serotype_genbank/serotype_7C.gb new file mode 100644 index 0000000..fb7a87a --- /dev/null +++ b/public/res/serotype_genbank/serotype_7C.gb @@ -0,0 +1,959 @@ +LOCUS contig_1 21759 bp DNA linear UNK 11-JUN-2024 +DEFINITION contig_1, whole genome shotgun sequence. +ACCESSION contig_1 +VERSION contig_1 +KEYWORDS . +SOURCE None + ORGANISM . + . +COMMENT Annotated with Bakta + Software: v1.9.3 + Database: v5.1, full + DOI: 10.1099/mgen.0.000685 + URL: github.com/oschwengers/bakta + + ##Genome Annotation Summary:## + Annotation Date :: 06/11/2024, 07:54:57 + CDSs :: 20 + tRNAs :: 0 + tmRNAs :: 0 + rRNAs :: 0 + ncRNAs :: 0 + regulatory ncRNAs :: 0 + CRISPR Arrays :: 0 + oriCs/oriVs :: 0 + oriTs :: 0 + gaps :: 0 + pseudogenes :: 0 +FEATURES Location/Qualifiers + source 1..21759 + /mol_type="genomic DNA" + gene complement(281..1678) + /locus_tag="IHBIEM_00005" + /gene="tnp" + CDS complement(281..1678) + /db_xref="GO:0003677" + /db_xref="GO:0004803" + /db_xref="GO:0006310" + /db_xref="GO:0015074" + /db_xref="GO:0032196" + /db_xref="IS:IS1202" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FE41" + /db_xref="UniRef:UniRef100_Q4K2T0" + /db_xref="UniRef:UniRef50_Q54513" + /db_xref="UniRef:UniRef90_Q54513" + /product="ISNCY family IS1202 transposase" + /locus_tag="IHBIEM_00005" + /protein_id="gnl|Bakta|IHBIEM_00005" + /translation="MNETKKYLVIKAIAQGKKTKKRACVELNLSERQINRLLLAYQQKG + KEAFRHGNRNRKPKHAIPDEIKERVLKKYLSYETYKPNVLHFCELLAEEEGIKLSDTTV + RKILYKKNILSPKSHRKTKKRVRKQAKLNLNQPLDNPILPTTKDFLEDPKKVHPSRPRK + KFAGELIQMDASPHAWFGPETTNLHLAIDDASGNILGAYFDKQETLNAYYHVLEQILAN + HGIPLQMKTDKRTVFTYQASNSKKMEDDTYTQFGYACHQLGILLETTSIPQAKGRVERL + 
NQTLQSRLPIELERNKIHTLEEANTFLLSYIQTFNEQFGNKTKLSVFEEAPNPSERNLI + LARLAERVVDSGHHIRFQNRYYIPTEQGKEVYFIRKTKALVIKAFDGDIYLNIADKIYH + TKELLNHELYSKNFEQEPEQKKERRKYIPPQTHPWKLTSFKQYLHKNKKDYEEFTSEEL + NSPQLQV" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef100_Q4K2T0" + /gene="tnp" + gene 1854..3299 + /locus_tag="IHBIEM_00010" + /gene="wzg" + CDS 1854..3299 + /db_xref="BlastRules:WP_000091082" + /db_xref="COG:COG1316" + /db_xref="COG:M" + /db_xref="RefSeq:WP_000091061.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FE42" + /db_xref="UniRef:UniRef100_Q4K2S9" + /db_xref="UniRef:UniRef50_G3G7D5" + /db_xref="UniRef:UniRef90_O54604" + /db_xref="UniprotKB:Q4K2S9" + /db_xref="UserProtein:wzg" + /product="""integral membrane regulatory protein Wzg""" + /locus_tag="IHBIEM_00010" + /protein_id="gnl|Bakta|IHBIEM_00010" + /translation="MSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAFR + YLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNRLN + ATSNYSEYSLSVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLTVNQ + SSSYLAAYRSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAPKTSK + NQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADGGNNQK + DKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQEFSALH + GKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTSTEALKNYS + TIIDSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRMDLPSYAMPDSNLY + VMEIDDSSLAVVKAAIQDVMEGR" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000091061.1" + /gene="wzg" + gene 3301..4032 + /locus_tag="IHBIEM_00015" + /gene="wzh" + CDS 3301..4032 + /db_xref="EC:3.1.3.48" + /db_xref="GO:0004725" + /db_xref="GO:0030145" + /db_xref="GO:0045227" + /db_xref="RefSeq:WP_000565354.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FE43" + /db_xref="UniRef:UniRef100_Q4K2S8" + /db_xref="UniRef:UniRef50_Q54518" + /db_xref="UniRef:UniRef90_Q54518" + /db_xref="UniprotKB:Q4K2S8" + 
/db_xref="UserProtein:wzh" + /product="""protein-tyrosine phosphatase Wzh""" + /locus_tag="IHBIEM_00015" + /protein_id="gnl|Bakta|IHBIEM_00015" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRRK + GMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLGKKRIPTLNDSRY + ALIEFSMNTLYRDIHSALNKILMLGITPVIAHIERYDALENNEKRVRELIDMGCYTQVN + SSHVLKPKLFGERYKFMKKRAQYFLEKDLVHIIASDMHNLDGRPPYMQQAYDIIAKKYG + AKKAKELFVDNPRKIIMDQLI" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000565354.1" + /gene="wzh" + gene 4041..4733 + /locus_tag="IHBIEM_00020" + /gene="wzd" + CDS 4041..4733 + /db_xref="BlastRules:WP_000664160" + /db_xref="GO:0005351" + /db_xref="GO:0005886" + /db_xref="GO:0009103" + /db_xref="GO:0015774" + /db_xref="GO:0045227" + /db_xref="RefSeq:WP_000664164.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FE44" + /db_xref="UniRef:UniRef100_Q4K2S7" + /db_xref="UniRef:UniRef50_Q54519" + /db_xref="UniRef:UniRef90_Q54519" + /db_xref="UniprotKB:Q4K2S7" + /db_xref="UserProtein:wzd" + /product="""capsular polysaccharide biosynthesis protein + Wzd""" + /locus_tag="IHBIEM_00020" + /protein_id="gnl|Bakta|IHBIEM_00020" + /translation="MKEQNTLEIDVLQLFRALWKRKLVILLVAIITSLVAFAYSTFVIK + PEFTSTTRIYVVNRNQEEKSGLTNQDLQAGTYLVKDYREIILSQDVLEEVISDLKLDLT + PKGLANKIKVTVPVDTRIVSVSVNDRVPEEASRIANSLREVAAQKIISITRVSDVTTLE + EARPAISPSSPNIKRNTLIGFLAGGIGTGVIVLLLELLDTRVKRPEDIEDTLQMTLLGV + VPNLSKLK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000664164.1" + /gene="wzd" + gene 4743..5426 + /locus_tag="IHBIEM_00025" + /gene="wze" + CDS 4743..5426 + /db_xref="COG:COG0489" + /db_xref="COG:D" + /db_xref="EC:2.7.10.2" + /db_xref="GO:0004715" + /db_xref="GO:0005524" + /db_xref="GO:0016310" + /db_xref="GO:0045227" + /db_xref="RefSeq:WP_001142506.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FE45" + /db_xref="UniRef:UniRef100_Q4K0X5" 
+ /db_xref="UniRef:UniRef50_Q54520" + /db_xref="UniRef:UniRef90_Q54520" + /db_xref="UniprotKB:Q4K0X5" + /db_xref="UserProtein:wze" + /product="""tyrosine-protein kinase Wze""" + /locus_tag="IHBIEM_00025" + /protein_id="gnl|Bakta|IHBIEM_00025" + /translation="MPTLEIAQKKLEFIKKAEEYYNALCTNIQLSGDKLKVISVTSVNP + GEGKTTTSVNIARSFARAGYKTLLIDGDTRNSVISGVFKSREKITGLTEFLSGTADLSR + GLCDTNIENLFVIQSGSVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTAPIGIVIDAA + IITQKCDASILVTATGEVNKRDVQKAKQQLEQTGKLFLGVVLNKLDISVDKYGVYGSYG + NYGKK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_001142506.1" + /gene="wze" + gene 5442..6809 + /locus_tag="IHBIEM_00030" + /gene="wchA" + CDS 5442..6809 + /db_xref="RefSeq:WP_000343587.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FE46" + /db_xref="UniRef:UniRef100_Q4K2S5" + /db_xref="UniRef:UniRef50_Q8VU30" + /db_xref="UniRef:UniRef90_P72513" + /db_xref="UniprotKB:Q4K2S5" + /db_xref="UserProtein:wchA" + /product="""undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)""" + /locus_tag="IHBIEM_00030" + /protein_id="gnl|Bakta|IHBIEM_00030" + /translation="MDEKGLKIFLAVLQSIIVILSVYFLSFVRETELERSSMVILYLLH + FFVFYFSSYGNNFFKRGYLVEFNNTIRYIFFFAIAISVLNFFIAERFSISRRGMVYFLT + LEGISLYLLNFLVKKYWKHVFFNLKNSKKILLLTVTKNMEKVLDKLLESDELSWKLVAV + SVLDKSDFQHDKIPVIEKEKIIEFTTHEVVDEVFVNLPGENYDIGEIISRFETMGIDVT + VNLKAFDKNLGRNKQIHEMVGLNVVTFSTNFYKTSHVISKRILDICGATIGLILFAIAS + LVLVPLIRKDGGPAIFAQTRIGKNGRHFTFYKFRSMRIDAEAIKEQLMDQNTMQGGMFK + IENDPRVTKIGHFIRKTSLDELPQFWNVLKGDMSLVGTRPPTIDEYMKYTPEQKRRLSF + KPGITGLWQISGRSNIKNFDDVVKLDVTYLDGWTIWKDIEILLKTIKVVVMKDGAK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000343587.1" + /gene="wchA" + gene 6844..8025 + /locus_tag="IHBIEM_00035" + /gene="wchF" + CDS 6844..8025 + /db_xref="RefSeq:WP_001232427.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FE47" + 
/db_xref="UniRef:UniRef100_Q4K2S4" + /db_xref="UniRef:UniRef50_A0A4L8A7M3" + /db_xref="UniRef:UniRef90_Q4K2S4" + /db_xref="UniprotKB:Q4K2S4" + /db_xref="UserProtein:wchF" + /product="""putative rhamnosyl transferase WchF""" + /locus_tag="IHBIEM_00035" + /protein_id="gnl|Bakta|IHBIEM_00035" + /translation="MRKSVYIIGSKGIPAKYGGFETFVEKLTEYQKNSNIQYYVACMRE + NSTKSGITDDQFEHNGAICFNIDVPNIGPARAIAYDIAAINKAIKLAKENKDEAPIFYI + LACRIGPFISEIKKKIRAIGGNLFVNPDGHEWLREKWSLPIRKYWKYSEKLMVKHADLL + VCDSKNIEQYIQEDYKQYHPKTTYIAYGTDTTPSILKLEDAKVRNWYQEKGISENGYYL + VVGRFVPENNYEAMIREFIKSQSKKDFVLITNVEQNKFYDKLLRETGFDQDPRIKFVGT + VYDQELLKYIRENAFAYLHGHEVGGTNPSLLEALGSTKLNLLLDVGFNREVGEDGAIYW + QKDELSRVIEYVETINQATIANLNFKSTQRILSDFTWEKIVADYEGVFCFAKS" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_001232427.1" + /gene="wchF" + gene 8012..8899 + /locus_tag="IHBIEM_00040" + /gene="wcwI" + CDS 8012..8899 + /db_xref="RefSeq:WP_001255333.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI00027339F4" + /db_xref="UniRef:UniRef100_A0A853PIH8" + /db_xref="UniRef:UniRef50_A0A853PIH8" + /db_xref="UniRef:UniRef90_A0A853PIH8" + /db_xref="UniprotKB:Q4K2S3" + /db_xref="UserProtein:wcwI" + /product="""putative glycosyl transferase""" + /locus_tag="IHBIEM_00040" + /protein_id="gnl|Bakta|IHBIEM_00040" + /translation="MRRVSVPNLYAVVVLYNSLLSEAKILKTLNTLNCKELNLIVVDNS + DRKEIQLKNKNFSTENNITLVNMNGNKGLSKAYNKVLELLKGRIGYVVWLDDDTEISIE + YLTKLLYASRGNYDIILPIIQDTHGKIVSPNSRGLLSNKPIKSYKDGKKLEKFNAINSC + TAVNLDIYEEYRYDERLFLDEIDHSFFYDHRNKNLKIELINTIVIQNFSQRADNLNFDT + AWSRLKIRIRDLIVAYKIRGGIFMGLVAVLKSILLGLQLYLKIKDLRIVIYSFTSAVCI + FLERLENEDFIFYE" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_001255333.1" + /gene="wcwI" + gene 8892..10064 + /locus_tag="IHBIEM_00045" + /gene="wcwL" + CDS 8892..10064 + /db_xref="RefSeq:WP_160313365.1" + /db_xref="SO:0001217" + 
/db_xref="UniParc:UPI0005E850D9" + /db_xref="UniRef:UniRef100_Q4K2U2" + /db_xref="UniRef:UniRef50_Q4K2U2" + /db_xref="UniRef:UniRef90_Q4K2U2" + /db_xref="UniprotKB:Q4K2S2" + /db_xref="UserProtein:wcwL" + /product="""putative glycosyl transferase""" + /locus_tag="IHBIEM_00045" + /protein_id="gnl|Bakta|IHBIEM_00045" + /translation="MNNTDHGGAALALLDLVTQINENYPEYELIVVTGKKNNLNVKLTE + IGIENYFFPFRNFISSYKKPAILWTILYKIRHYIGNRMALKKIEKKIDLKKIDIIHSNL + NRIDIGAILAKKHSIPHLWHIREHLDVWYFYNKLDHRKFEYGLKVLTTEKNYIFYMCSF + STKYIAISNSVAMDWCKKGLSQSSIVKVYDGIKLPQVFGDKKWFRNKKINIVFVGGYDI + KKGQELFLSYFLKLPKEIQMQYTLTFYGSGKSKYIKKLQKMSQHLCSDQVKFHSYIDNL + TELLPNYDIGINFSTTEGFGRVIVEYLANGLCVVASKNGASPELITEEVGFLIDKDNQD + EFIQLFTKLSIEKNKIRQMGNKAIEHAQKFSIDQHTREIINVYQEMRNKQ" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_160313365.1" + /gene="wcwL" + gene 10061..11068 + /locus_tag="IHBIEM_00050" + /gene="wcwK" + CDS 10061..11068 + /db_xref="EC:2.7.-.-" + /db_xref="GO:0000271" + /db_xref="GO:0016772" + /db_xref="RefSeq:WP_000794114.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FE4A" + /db_xref="UniRef:UniRef100_Q4K2S1" + /db_xref="UniRef:UniRef50_Q4K2S1" + /db_xref="UniRef:UniRef90_Q4K2S1" + /db_xref="UniprotKB:Q4K2S1" + /db_xref="UserProtein:wcwK" + /product="""putative glycosyl transferase""" + /locus_tag="IHBIEM_00050" + /protein_id="gnl|Bakta|IHBIEM_00050" + /translation="MKNMEQIDFVVTWVNGKDVDWCKRKSEFEKEYNIFQDLNSEERYR + EWGLMKYWFRAVEKYAPWVNKIYFITEGHVPNWLDVNHPKLVHVKHEDYIEKQFLPTFN + SNVIEMSLIHLKDLSEKFVLFNDDCFINDFVKQSDFFENNLPKDTGIFSPLIPRENSLA + PIVLNNMEIINKYFSKKKILEQNFSKFFNIKYGKHLLKNICLLPWSDLLGFYDSHIPVS + YCKSNFLEVYEKEHAIFNLTFKNKFRNKNEINHWLIRYWQLSSGNFIPRNINFGKNYAI + SNEPTDIINELKLSKYKIICINDGESIDNFDEVKGLMINAFEKKFPEKSSFEKK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000794114.1" + /gene="wcwK" + gene 11080..11991 + 
/locus_tag="IHBIEM_00055" + /gene="wcxU" + CDS 11080..11991 + /db_xref="RefSeq:WP_001047162.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI00027339F8" + /db_xref="UniRef:UniRef100_Q4K2S0" + /db_xref="UniRef:UniRef50_Q4K2S0" + /db_xref="UniRef:UniRef90_Q4K2S0" + /db_xref="UniprotKB:Q4K2S0" + /db_xref="UserProtein:wcxU" + /product="""putative glycosyl transferase""" + /locus_tag="IHBIEM_00055" + /protein_id="gnl|Bakta|IHBIEM_00055" + /translation="MNLEDLVLIILNYNSAKDTLRCLEILRSFNMNFKIIVVDNNSTDN + SIELLKNIEDPQTTFLISDENRGYGAGNNIGIHFAENNFSSNIIGIINPDIVIPNQEVI + ISMYNVLKNSDFAMVGGSVIDNEGNYRLLNSSWDLPSFKSVVLERFLIYNRHKVPYCLN + MYNDETAIVDCVAGCFFMIKADVMKEIGYFDENVFLYNEENILGMKLREKDFQSIILTK + QFYYHLHDFEKDKVELSLSKKCKRDWVKFQSRKYFTEKYYSKFLGFLLFFVEIFNLFQI + MIGHLKNNIIKKNLKGNSSEKK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_001047162.1" + /gene="wcxU" + gene 11978..13225 + /locus_tag="IHBIEM_00060" + /gene="wzy" + CDS 11978..13225 + /db_xref="RefSeq:WP_000749811.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FE4C" + /db_xref="UniRef:UniRef100_Q4K2R9" + /db_xref="UniRef:UniRef50_Q4K2R9" + /db_xref="UniRef:UniRef90_Q4K2R9" + /db_xref="UniprotKB:Q4K2R9" + /db_xref="UserProtein:wzy" + /product="""oligosaccharide repeat unit polymerase Wzy""" + /locus_tag="IHBIEM_00060" + /protein_id="gnl|Bakta|IHBIEM_00060" + /translation="MKKSSTLHSSTLHIGLILFLIVLSKNFFNLVPNIALFSDFNLMII + IIIMTVVNIKYYNRSTKYQYRWYIIFTLIFVLYSAINEKLLYGQPFLLGLLPQRQFFLC + LMTYFPLRKYFQEQNISLKKLYVGIMNLGSISSLIYILQKIVILYGGTQFVNVIYSFAG + YFSGYRLYVGSSLIILATLISTAYFLETLKLKYLCHLILGWFTQIWITQGRIEMIVLLI + STIVCIIVQGRLTRKKIIYWLLTILGLWMITLTPIFENIVGAILKVDGAGRGSDSLTIR + AIGRQLYWEQLNETTSKLLFGTGYPNYNYALAFQRTGFSSNIFLTDNGFMTYIYIFGIV + GSSIMGLLFLKYLKNSIKYARQSADMIPLMYIISLLIVAYNIILWYWNADGTFILVIMI + CALEHGEQLLHQRNGV" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA 
sequence:RefSeq:WP_000749811.1" + /gene="wzy" + gene 13230..15182 + /locus_tag="IHBIEM_00065" + /gene="rbsF" + CDS 13230..15182 + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FE4D" + /db_xref="UniRef:UniRef100_Q4K2R8" + /db_xref="UniRef:UniRef50_Q4K2T8" + /db_xref="UniRef:UniRef90_Q4K2T8" + /db_xref="UniprotKB:Q4K2R8" + /db_xref="UserProtein:rbsF" + /product="""putative phosphotransferase""" + /locus_tag="IHBIEM_00065" + /protein_id="gnl|Bakta|IHBIEM_00065" + /translation="MNLNKEVRWKDKQYIAFDFFDTTIHRNCHPEVILFEWSKKISIYF + SFKISATEIYSIRKKSEIHEKQEKQLEEIKYERLLQLVFYTILSRLKSDVTDYNLEDFL + IYARTCEEEIELRHISIDTDTINFIEFLKQNGKKIILISDFYSDKKLIEKLMVSLGIRD + YFSKIFISSEIGLRKSSGNLYQYVINELSCKPINLLMIGDNIYSDVKVPKKLGIDSYHK + SYSDSHVTVSPNDIVKAMNNVISQACTESLFNLYIPEILYFISKLYKELSVNKASDILF + CAREGFFIKKLFDLYQKKMNLKLINSHYFYVSRKSTLYPSFKNIEDEDFEVIFRQFPEI + ILENFLINLNFSNNDINSISEQTEIKQTDKVSDKSIINKLKQNKLFKDVYDLNCKEEKY + SFREYLKSVGVENDNSTINMVDIGWKGTIQDNIQKAFPSLNIKGYYMGLNFQRYSTRNS + MNKTGILFTDDPQKTKFFNLFNYKYLFYERIFVADHGPTVRYEFMNGVGVPTLDTDENH + IEIYRFSEEFQITFFNTFEKILDLFNESLVTPDELFNEIANLSLKKHCIYLPRLSVSIK + KLDRAAKENFGIIKSTNRNSDNKVRNFWKNRDFLFLDYIYKAYGKNRLLNPILDIYGYF + VYLIKTLQIKIVGDI" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef100_Q4K2R8" + /gene="rbsF" + gene 15182..16639 + /locus_tag="IHBIEM_00070" + /gene="wzx" + CDS 15182..16639 + /db_xref="RefSeq:WP_224782372.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FE4E" + /db_xref="UniRef:UniRef100_Q4K2R7" + /db_xref="UniRef:UniRef50_I1ZPG7" + /db_xref="UniRef:UniRef90_Q4K0A9" + /db_xref="UniprotKB:Q4K2R7" + /db_xref="UserProtein:wzx" + /product="""flippase Wzx""" + /locus_tag="IHBIEM_00070" + /protein_id="gnl|Bakta|IHBIEM_00070" + /translation="MSMKEKSINKNAILNIILTLTNIVFPLITFPYISRILNPSGIGAI + SFFSSIGSYGVLVASLGISTYGIRVIAKDRYHKDKITKIFQELIVINSVMSIIVTFFLV + LMSFRLEQLSSEKGLLIITCITILSSPFNLNWFYSGIEEYSYITKRSIFFKLVSLILTF + 
LFVKSKDDYILYAVITLFSTLASNFINILESRKYINFNLRRDLEFRYHLKPMWYLFASL + LAVNIYINLDSVMLGIINGNDAVGIYSIASKVKWILLSVVTSVSSVLLPRLSFYSNKYD + ETKFNNILRKSSTIIFMISIPLTIFFMIKAKESILLLGGEQYIQAVLAMQILMPILIIS + GFSNITGNQILIPTGNEKYFMRAVSIGAIVNLCLNLLLMPIWGIIGGAIATLCAELVQM + IIQFYFSRNKLMGNISLNSIKKVAYSSIFAGILLIVIQNIIENFNSFLNLAASSFLYFG + VYFFLLVLFKESTIKKFLNQIFYKDIS" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_224782372.1" + /gene="wzx" + gene 16813..17682 + /locus_tag="IHBIEM_00075" + /gene="rmlA" + CDS 16813..17682 + /db_xref="EC:2.7.7.24" + /db_xref="GO:0008879" + /db_xref="GO:0009243" + /db_xref="GO:0019305" + /db_xref="RefSeq:WP_000676137.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FFCE" + /db_xref="UniRef:UniRef100_Q4K2R6" + /db_xref="UniRef:UniRef50_A0A366WAT5" + /db_xref="UniRef:UniRef90_Q4K105" + /db_xref="UniprotKB:Q4K2R6" + /db_xref="UserProtein:rmlA" + /product="""glucose-1-phosphate thymidylyltransferase + RmlA""" + /locus_tag="IHBIEM_00075" + /protein_id="gnl|Bakta|IHBIEM_00075" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLAG + IRDILIISTPQDLHRFQELLQDGSEFGIKLSYAEQPSPDGLAQAFIIGEEFISDDSVAL + ILGDNIYHGSGLSKMLQKAASKESGATVFGYHVKDPERFGVVEFDQDMKAISIEEKPEQ + PRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVELMGRGFAWL + DTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLALAQPLKKNEYGQY + LLRLIGEA" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000676137.1" + /gene="rmlA" + gene 17683..18279 + /locus_tag="IHBIEM_00080" + /gene="rmlC" + CDS 17683..18279 + /db_xref="RefSeq:WP_000130018.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000053FE50" + /db_xref="UniRef:UniRef100_Q4K0Y4" + /db_xref="UniRef:UniRef50_Q5XCG7" + /db_xref="UniRef:UniRef90_A0A1S0ZBJ9" + /db_xref="UniprotKB:Q4K0Y4" + /db_xref="UserProtein:rmlC" + /product="""dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC""" + 
/locus_tag="IHBIEM_00080" + /protein_id="gnl|Bakta|IHBIEM_00080" + /translation="MTDKFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEKM + LPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREGET + FGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYADPS + LGIEWENIAEAEVSEADKHHPLLKDVKPLKKEDLE" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000130018.1" + /gene="rmlC" + gene 18289..19338 + /locus_tag="IHBIEM_00085" + /gene="rmlB" + CDS 18289..19338 + /db_xref="COG:COG1088" + /db_xref="COG:M" + /db_xref="EC:4.2.1.46" + /db_xref="GO:0008460" + /db_xref="GO:0009243" + /db_xref="GO:0019305" + /db_xref="SO:0001217" + /db_xref="UniRef:UniRef50_F0ENA6" + /db_xref="UniRef:UniRef90_Q4K0Q5" + /db_xref="UniprotKB:O54546" + /db_xref="UserProtein:rmlB" + /product="""dTDP-D-glucose 4,6-dehydratase RmlB""" + /locus_tag="IHBIEM_00085" + /protein_id="gnl|Bakta|IHBIEM_00085" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPDVHVTVLDKLTYAGNR + ANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTNFI + GTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSPYSS + TKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLYGEGK + NVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAADAYDHV + TDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKEAVEANY + AKTQEIITV" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:UniRef:UniRef90_Q4K0Q5" + /gene="rmlB" + gene 19404..20255 + /locus_tag="IHBIEM_00090" + /gene="rmlD" + CDS 19404..20255 + /db_xref="COG:COG1091" + /db_xref="COG:M" + /db_xref="EC:1.1.1.133" + /db_xref="GO:0008831" + /db_xref="GO:0009243" + /db_xref="GO:0019305" + /db_xref="KEGG:K00067" + /db_xref="RefSeq:WP_000600913.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI000003EFAD" + /db_xref="UniRef:UniRef100_Q9AH81" + /db_xref="UniRef:UniRef50_Q9AH81" + /db_xref="UniRef:UniRef90_Q9AH81" + /db_xref="UniprotKB:Q9AH81" + 
/db_xref="UserProtein:rmlD" + /product="""dTDP-4-keto-L-rhamnose reductase RmlD""" + /locus_tag="IHBIEM_00090" + /protein_id="gnl|Bakta|IHBIEM_00090" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAKMDITNEEMVEKV + FEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTDYV + FDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKNFVF + TMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDTTWYD + FAVEILKDTDVEVKPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQEFYKQE + VR" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_000600913.1" + /gene="rmlD" + gene 20340..20765 + /locus_tag="IHBIEM_00095" + CDS 20340..20765 + /db_xref="SO:0001217" + /db_xref="UniRef:UniRef50_A0A0H2ZN29" + /db_xref="UniRef:UniRef90_A0A1A9BIN6" + /product="Transposase" + /locus_tag="IHBIEM_00095" + /protein_id="gnl|Bakta|IHBIEM_00095" + /translation="MLVSLAHSFGSVSIIAHTIHQKFNLKVPNYRQEEDWARMGLPITR + KEISNWHIKASQYYLESLYNLLREKLLEQPLLHADETSYRVLESDSQLTYYWTFLSGKA + ENQVITLYHHDQCRSGSVVQEFLGDYSGYVHCDMLRQ" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA + sequence:UniRef:UniRef90_A0A1A9BIN6" + gene 21358..21516 + /locus_tag="IHBIEM_00100" + CDS 21358..21516 + /db_xref="GO:0004803" + /db_xref="RefSeq:WP_001811052.1" + /db_xref="SO:0001217" + /db_xref="UniParc:UPI00000517C7" + /db_xref="UniRef:UniRef100_A0A3A4RVM5" + /db_xref="UniRef:UniRef50_A0A844FQK0" + /db_xref="UniRef:UniRef90_A0A4N5NNP0" + /product="IS66 family transposase" + /locus_tag="IHBIEM_00100" + /protein_id="gnl|Bakta|IHBIEM_00100" + /translation="MSLLETAKRHQLNSEKYLSYLLECLPNEETLVNKEVLEAYLPWTK + VVQEKCK" + /codon_start=1 + /transl_table=11 + /inference="ab initio prediction:Prodigal:2.6" + /inference="similar to AA sequence:RefSeq:WP_001811052.1" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaaatgac 
tgactagaat gagcaaacct caagtttttg aagcttgagg ttttttacta + 181 tagtggattg aaactagaat agtgcacctc tgcttctaaa acattgttag aaatcgattt + 241 gactgtcccg atcgatttgt cctattctta tttcattttg ctatacttgt agttgaggag + 301 aattaagctc ctcactagta aactcttcat aatccttttt atttttatga agatattgtt + 361 tgaaagatgt gagtttccac ggatgggttt gtggagggat atacttgcgt ctttcttttt + 421 tttgttctgg ttcttgttca aagtttttcg aatagagttc atgatttagt agctcctttg + 481 tgtgatagat tttgtcagcg atattgaggt agatgtctcc gtcaaatgct tttataacta + 541 atgctttcgt ctttctgatg aaatagactt cttttccttg ttcggtaggg atatagtaac + 601 gattttggaa tcggatatgg tgtccactat cgacgactct ctccgccagt ctagctagaa + 661 tgagattccg ttcagagggg ttaggagcct cctcaaaaac agagagtttt gtcttgtttc + 721 caaactgttc attaaaggtt tggatgtagg aaagaaggaa agtattggct tcttccaatg + 781 tatgaatctt gtttcgttcc agttcgatag gcaggcgtga ttgtagtgtc tgattgagtc + 841 tttcgaccct ccctttagct tgagggatag aggtggtctc aaggagaatc cctagttggt + 901 gacaggcgta tccaaattgt gtataggtgt cgtcctccat tttcttagag ttggatgctt + 961 gataggtaaa gaccgttctc ttatcagttt tcatttgaag gggaatgccg tgattggcta + 1021 agatttgttc gaggacatgg tagtaggcat tcaaggtctc ttgtttgtca aaataagcgc + 1081 ctaggatatt gccagaagca tcatcaatgg ctaagtgtaa gttggtggtt tctggtccaa + 1141 accaggcatg agggctggca tccatttgaa tgagttctcc agcaaatttc tttctgggtc + 1201 tactaggatg taccttttta gggtcttcca ggaagtcttt agtcgtcggt aagattggat + 1261 tgtctagggg ttgattcagg ttcagtttag cttgttttct tactctcttc tttgtctttc + 1321 tgtgagactt aggagaaagg atgtttttct tatagagtat ttttctaaca gttgtatcag + 1381 agagcttaat tccctcttct tcagctagta attcacagaa atgaaggaca tttggtttat + 1441 atgtttcata ggagaggtat ttctttagga cacgttcttt gatttcatca gggattgcat + 1501 gttttggttt tcgatttctg tttccgtgtc tgaaggcttc ttttcctttc tgttgatagg + 1561 ctagtagcag acgattgatt tgtctttcag aaagattgag ttcgacacag gcccgtttct + 1621 ttgttttctt tccttgggct atagctttta ttacaagata ttttttcgtt tcattcatat + 1681 tcagttggat ccttttcata tgactattct accaaatggg acattatcac gttcgattta + 1741 ctaaagacat tatcacattc gaatcacagt caaagtcccg 
tgaaaataaa agtgtagaca + 1801 ttaccgtaaa aaagtgatat aatcgtatga tgttcaatgt ataggtgtta atcatgagta + 1861 gacgttttaa aaaatcaggt tcacagaaag tgaagcgaag tgttaatata gttttgttga + 1921 ctatttattt attgttagtt tgttttttat tgttcttaat ctttaagtac aatatccttg + 1981 cttttagata tcttaatcta gtggtaactg cgttagtcct actagttgcc ttggtagggc + 2041 tactcttgat tatctataaa aaagctgaaa aatttactat ttttctgttg gtgttttcta + 2101 tccttgtcag ctcagtgtcg ctctttgcag tacagcagtt tgttggactg accaatcgtt + 2161 taaatgcgac ttctaattac tcagaatatt cgctcagtgt cgctgtttta gcagatagtg + 2221 agatcgaaaa tgttacgcaa ctgacgagtg tgacagcacc gactgggact gataatgaaa + 2281 atattcaaaa actactagct gatatcaagt caagtcagaa taccgatttg acggtcaacc + 2341 agagttcgtc ttacttggca gcttacagga gtttgattgc aggggagact aaggccattg + 2401 tcctaaatag tgtctttgaa aatatcatcg agtcagagta tccagactac gcatcgaaga + 2461 taaaaaagat ttataccaag ggattcacta aaaaagtaga agctcctaag acgtctaaga + 2521 atcagtcttt caatatctat gttagtggaa ttgacaccta tggtcctatt agttcggtgt + 2581 cgcgatcaga tgtcaatatc ctgatgactg tcaatcgaga taccaagaaa atcctcttga + 2641 ccacaacacc acgtgatgcc tatgtaccaa tcgcagatgg tggaaataat caaaaagata + 2701 aattaaccca tgcgggcatt tatggagttg attcgtccat tcacacctta gaaaatctct + 2761 atggagtgga tatcaattac tatgtgcgat tgaacttcac ttctttcttg aaaatgattg + 2821 acttattggg aggggtagat gttcataatg accaagagtt ttcagctcta catgggaagt + 2881 tccatttccc agtagggaat gtccatctag actctgagca agctctaggt tttgtacgtg + 2941 aacgctactc actagccgat ggagaccgtg accgtggtcg caaccaacaa aaggtgattg + 3001 tggctatcct tcaaaaatta acgtcaaccg aagcactgaa aaattatagt acgatcattg + 3061 atagcttgca agattctatc caaacaaata tgccacttga gaccatgata aatttggtca + 3121 atgctcagtt agaaagtgga gggaattata aagtaaattc tcaagattta aaaggtacag + 3181 gtcggatgga tcttccttct tatgcaatgc cagacagtaa cctctatgtg atggaaatag + 3241 atgatagtag tttagctgta gttaaagcag ctatacagga tgtgatggag ggtagatgaa + 3301 atgatagaca tccattcgca tatcgttttt gatgtagatg acggtcccaa gtcaagagag + 3361 gaaagcaagg ctctcttggc agaatcctac aggcaggggg tgcgaaccat tgtctctacc + 3421 
tctcaccgtc gcaagggcat gtttgaaact ccggaagaga agatagcaga aaactttctt + 3481 caggttcggg aaatagctaa ggaagtggcg agtgacttag tcattgctta cggagctgaa + 3541 atttactaca caccagatgt tctggataag ctgggaaaaa agcggattcc gaccctcaat + 3601 gatagtcgtt atgccttgat agagtttagt atgaacactc tttatcgcga tattcatagc + 3661 gccttgaaca agatcttgat gttgggaatt actccagtca ttgcccacat cgaacgctat + 3721 gatgctcttg aaaataatga aaaacgcgtt cgggaactga tcgatatggg ctgttacacg + 3781 caagtaaata gttcacatgt cctcaaaccc aaactttttg gcgaacgtta taaattcatg + 3841 aaaaaaagag ctcagtattt tttagagaag gatttggttc atatcattgc aagtgatatg + 3901 cacaatctag acggtagacc tccatatatg caacaggcat atgatatcat tgctaagaaa + 3961 tatggagcga aaaaagcgaa agaacttttt gtagataatc ccagaaaaat tataatggat + 4021 caattaattt aggagaaaat atgaaggaac aaaacacttt ggaaatcgat gtattgcaac + 4081 tattcagagc tttatggaaa agaaagttgg tcattttatt agtggcaatt ataacttctt + 4141 tagttgcttt tgcctacagt acttttgtta tcaaacctga gtttactagt acgactcgga + 4201 tttatgtagt taaccgtaat caggaagaga agtctggttt aaccaatcaa gacttgcagg + 4261 caggaacata cttggttaaa gactatcgtg aaattatcct atcgcaggat gttttggagg + 4321 aagttatttc tgatttgaaa ctagatttga cgccaaaagg tttggctaat aaaattaaag + 4381 taacagtacc agttgatacc cgtattgtct ctgtttcagt taatgatcga gttcctgaag + 4441 aggcaagccg tatcgctaac tctttgagag aagtagctgc tcaaaaaatt atcagtatta + 4501 ctcgtgtttc tgatgtgaca acactggagg aggcaagacc ggcgatatca ccgtcttcgc + 4561 caaatattaa acgcaataca ctaattggtt ttttggcagg ggggattgga actggtgtta + 4621 tagttcttct tcttgaactt ttggacactc gtgtgaaacg tccggaagat atcgaagata + 4681 cactgcagat gacacttttg ggagttgtac caaacttgag taagttgaaa taggagagag + 4741 gaatgccgac attagaaata gcacaaaaaa aactggagtt cattaagaag gcagaagaat + 4801 attacaatgc cttgtgtaca aatatacagt tgagcggaga taaactaaaa gtaatttccg + 4861 ttacttctgt taaccctggg gaaggaaaaa caactacttc cgtaaatata gcaaggtcgt + 4921 ttgcgcgtgc aggttataaa actcttttga tcgatggcga tactcgaaat tcagttatat + 4981 caggagtttt taaatcgcgt gaaaaaatta cagggctaac agaattttta tctgggacag + 5041 ctgatttatc tcgcggttta 
tgtgatacaa atattgaaaa tttatttgta attcaatcgg + 5101 gatctgtatc accaaaccct acagccttgt tacaaagtaa aaattttaat gatatgattg + 5161 aaacattgcg taaatatttt gattatatca ttgttgatac agcacctatt ggaattgtta + 5221 ttgatgcggc aattatcact caaaagtgtg atgcgtccat cttggtaaca gcaacaggtg + 5281 aggtgaataa acgtgatgtc caaaaagcga aacaacaatt agaacaaaca gggaaactgt + 5341 tcctaggagt tgttttaaat aaattggata tctcggttga taagtatgga gtttacggtt + 5401 cctatggaaa ttatggtaaa aaataactta ggaaagattt tatggatgaa aaaggattga + 5461 aaatttttct ggcagtatta cagagtatta ttgtcatttt atcggtttat tttcttagct + 5521 ttgttagaga gacagaactt gaacgttctt cgatggttat actatacctt ctccactttt + 5581 ttgtattcta ttttagttcc tatggtaaca atttttttaa aagagggtac ctagttgagt + 5641 ttaataatac tataagatat atttttttct ttgcaatagc tataagtgta ttaaactttt + 5701 ttatagcgga acggtttagt atctctagaa gaggaatggt atacttctta actttagaag + 5761 ggatatcctt atacttgtta aatttcttag taaagaaata ttggaagcat gtgtttttta + 5821 atctaaaaaa tagcaagaaa attttactgt taacagtaac gaaaaatatg gaaaaagttc + 5881 ttgataaatt gctagaatct gatgaacttt catggaaatt ggtagcagta agtgttttgg + 5941 ataaatctga ttttcaacat gataaaatac ctgtaattga aaaggaaaaa attattgaat + 6001 ttacaacgca tgaagttgtg gatgaggtgt ttgtcaatct tccaggagag aactacgata + 6061 ttggagaaat tatctctagg tttgagacaa tggggataga tgtaactgta aatcttaaag + 6121 catttgataa gaatttgggt cgcaataaac aaattcatga gatggtagga ttgaatgtag + 6181 tcactttctc tacaaatttt tataaaacta gtcatgtgat ttcaaagaga attctcgata + 6241 tttgtggtgc cactattggc cttattcttt ttgctatagc tagtctagtt ttagttccat + 6301 tgattcgtaa agatggcgga ccagctattt ttgctcaaac tcgtataggg aaaaatggtc + 6361 gacattttac cttttataaa ttccgttcaa tgcgaatcga tgctgaagct atcaaagaac + 6421 agttgatgga tcaaaatacg atgcaaggtg gaatgtttaa gattgaaaat gatccacgcg + 6481 tgacaaagat tggacacttt attagaaaaa cgagtctaga tgaattgcca caattttgga + 6541 atgttctaaa aggggatatg agtttagttg gtactagacc accgactata gatgagtata + 6601 tgaagtatac gccggaacaa aaacgtcgtc taagttttaa acctggaatt acaggacttt + 6661 ggcagattag tggtagaagt aatattaaaa actttgatga 
tgtagtaaaa ttagacgtta + 6721 cttatttaga tggttggaca atttggaaag atattgaaat tttattgaag actataaaag + 6781 ttgtagtaat gaaagatgga gcgaagtaat ttttgtttta tcgttaaatg aagtaggagt + 6841 gatatgagaa aatcggttta tatcattggt tcaaaaggga tccctgccaa atatggaggg + 6901 tttgaaactt ttgttgaaaa attaacagaa tatcaaaaaa atagtaacat acaatattat + 6961 gttgcttgta tgcgtgaaaa ttcgactaaa tctggtatta cagatgatca gtttgagcat + 7021 aacggagcga tatgttttaa tatagatgtt ccgaatattg gtccagctcg agcgattgct + 7081 tatgatatag ctgctatcaa taaagctata aaactagcta aggaaaataa ggatgaagct + 7141 ccaatttttt acattttggc ttgtcgtatt ggtcctttta tttcagaaat taagaaaaag + 7201 attcgtgcta ttggtggaaa cttatttgta aatccagatg ggcatgaatg gctacgagaa + 7261 aaatggagtt tacctattcg caaatattgg aagtactctg aaaaactaat ggtcaaacat + 7321 gcagatttat tggtttgtga cagcaaaaat atcgaacagt atatccaaga agattataaa + 7381 cagtatcatc ctaagaccac ctatattgct tatgggacgg atacaactcc ctccatcttg + 7441 aaattggaag atgctaaagt ccgaaattgg tatcaggaga aagggattag tgaaaatggt + 7501 tattatttag tggtaggacg atttgtccct gagaataact atgaagctat gattcgtgaa + 7561 tttatcaaat cccagtctaa aaaggatttt gtcctcatta caaatgtgga acaaaataaa + 7621 ttttacgaca agttgcttcg ggaaacaggt tttgaccaag acccaagaat caaatttgtt + 7681 ggtactgttt atgatcagga attgttaaaa tatattcgag aaaatgcctt tgcatattta + 7741 catggtcatg aggtgggggg gacaaatcca tcacttttag aggctttagg atcaacaaag + 7801 ttaaatttgt tgcttgatgt tggttttaac cgtgaagttg gtgaggatgg agctatttat + 7861 tggcaaaaag atgaactttc acgagtcatc gaatatgtgg aaacgataaa tcaagcaact + 7921 atcgcaaact taaattttaa atcaacccaa agaatcctct cagatttcac atgggaaaaa + 7981 attgtggcag attatgaagg agtattttgt tttgcgaaga gttagtgtgc ccaatttata + 8041 tgcagtagta gttttataca atagtttatt atcagaagca aaaattttaa aaaccttaaa + 8101 tacattaaat tgtaaagaat taaacttaat tgtagtagac aatagtgata ggaaagaaat + 8161 acagttaaaa aataagaact tttccactga aaataatata acattggtga atatgaatgg + 8221 aaataaggga ttatctaaag cttataataa agtcctagaa ttattaaagg gtagaatagg + 8281 ttatgtggtt tggttagatg atgatactga gattagtata gaatatttaa caaaattatt + 8341 
gtatgcatca agaggtaatt acgacattat tttgcctatt attcaagata cccatggtaa + 8401 aattgtctct ccaaattctc gtggtttact ttcaaataaa ccgattaaaa gttacaaaga + 8461 tggaaagaaa cttgaaaaat ttaacgcaat aaatagttgt acagctgtca atttagacat + 8521 ttatgaagaa tatagatatg atgaacgact tttcttggat gaaattgatc attcgttttt + 8581 ctatgaccac agaaataaaa atttaaagat cgaattaatt aatacaatag ttattcaaaa + 8641 tttttctcaa agagctgata atttaaattt tgatactgca tggagtagat tgaaaattag + 8701 aattcgggat ttgatagtgg cttataaaat tagaggtggg atttttatgg gtcttgtagc + 8761 tgttttaaaa agtatcctac ttggactcca attatacttg aaaattaagg atttgcgtat + 8821 agttatctat agtttcacat ctgctgtatg tattttttta gaaagacttg aaaatgaaga + 8881 ttttatattt tatgaataat acagatcatg gtggggctgc tttagcatta ttagatttag + 8941 ttactcagat aaacgagaat tatcctgagt atgaacttat tgttgtaaca gggaaaaaaa + 9001 ataatttaaa tgttaagtta acagaaattg gtattgaaaa ttactttttt ccatttagaa + 9061 attttattag ttcatataaa aaacctgcaa tactatggac gattttatat aaaattcgtc + 9121 attatatcgg aaatcgaatg gctctaaaaa aaatagaaaa aaaaattgat ttgaaaaaaa + 9181 tcgatattat tcattctaat ttaaatagaa tcgatatagg agcaatatta gccaaaaagc + 9241 acagtatacc ccatttatgg catataagag agcatttgga tgtatggtat ttttataata + 9301 aattagatca tagaaagttt gagtatggct tgaaggtctt gactacggaa aaaaattata + 9361 ttttttatat gtgttctttt tcaacgaaat atattgcaat ctctaactct gtagctatgg + 9421 attggtgtaa aaaaggacta tctcagtcat ctattgttaa agtttacgac gggatcaagt + 9481 tacctcaagt atttggtgat aaaaaatggt ttagaaataa aaaaataaat attgtatttg + 9541 ttggtggtta cgatattaaa aaaggtcagg agttgttttt aagctatttt ttaaaattac + 9601 caaaagaaat acaaatgcaa tatactttga ctttctatgg aagtggaaaa tctaagtata + 9661 taaagaaatt acaaaagatg tctcaacatc tatgttctga tcaagttaaa tttcatagtt + 9721 atatagataa tcttacagaa ttactaccaa attatgatat tgggattaat ttttcaacaa + 9781 cggaaggttt tggaagagtg attgttgaat atttagcgaa cggtctttgt gttgttgcaa + 9841 gtaaaaatgg agctagtcca gaattaataa cagaagaagt tggattttta atcgacaagg + 9901 ataatcagga tgaatttatt cagttgttta ctaaattatc tattgaaaag aataagataa + 9961 gacaaatggg aaataaagca 
attgaacatg cacaaaagtt ttcaatagac caacatacaa + 10021 gagagattat aaatgtatat caagaaatga gaaataaaca atgaaaaata tggaacaaat + 10081 tgattttgtg gtgacatggg ttaatggtaa agatgtagat tggtgtaaaa gaaagtctga + 10141 atttgagaaa gaatataata tatttcaaga tttaaatagt gaagagcgat accgtgaatg + 10201 gggtcttatg aaatattggt ttagagctgt ggaaaaatat gccccttggg taaataaaat + 10261 ttattttata accgaagggc atgtaccaaa ttggttagat gtaaatcatc ctaaattggt + 10321 tcatgttaaa catgaggatt atatcgaaaa acagtttttg ccaactttta attcaaacgt + 10381 tatagagatg agtttgattc atttgaaaga tttatcagag aaatttgttc tttttaatga + 10441 tgattgtttc ataaatgatt ttgtaaaaca aagtgatttt tttgaaaata atttacccaa + 10501 agatacgggg atttttagtc ctttaatacc aagagaaaat tctttagctc ctattgtatt + 10561 aaacaatatg gagattatta acaaatattt ttcaaagaaa aaaattcttg agcagaattt + 10621 ttctaagttt tttaacatca aatatggaaa acatctattg aagaatattt gtttactgcc + 10681 atggtcagat ttgttaggct tttatgatag tcatattcca gtaagttatt gtaaaagtaa + 10741 tttcttggaa gtttatgaga aagaacatgc catttttaat ttgacgttta aaaataaatt + 10801 taggaataaa aatgagatta atcattggtt aattagatat tggcaattgt ctagcggtaa + 10861 tttcatacca agaaacatta attttgggaa aaattatgcc atttcaaatg aacctacgga + 10921 tattattaat gaattaaaac tttctaaata taagattata tgtattaatg atggtgaaag + 10981 tatagataat tttgatgaag tgaaaggtct aatgattaat gcttttgaaa aaaagtttcc + 11041 tgagaaatcg agttttgaga aaaagtgagg catataagaa tgaatttgga agatttagta + 11101 ttaataattt taaattataa tagtgctaaa gatacactac gttgtttaga aattctacgt + 11161 tcttttaata tgaattttaa aatcattgta gtggataata attctacgga caattcaata + 11221 gaactactca agaatataga ggatcctcaa actacttttt taatttctga tgagaataga + 11281 ggatatggag caggtaataa tattgggatt cactttgcag aaaataattt ttcttcaaat + 11341 atcataggta ttattaatcc agatatagtc attcccaatc aggaagtgat aatttcaatg + 11401 tataatgttt tgaaaaatag tgactttgct atggttggtg ggtcagtaat cgataatgag + 11461 ggaaattata gactattaaa ttcatcatgg gatttacctt cttttaagag cgttgtactt + 11521 gaaagatttt taatatataa tcgacataaa gttccatatt gtttaaatat gtataatgat + 11581 gaaacagcga ttgtagattg 
tgtagcaggt tgctttttta tgataaaagc tgatgtaatg + 11641 aaggaaatcg gttattttga tgaaaatgtt tttttatata atgaagagaa cattcttgga + 11701 atgaaactga gagaaaagga cttccaatca attatattaa ccaaacagtt ttactatcat + 11761 ttgcatgatt ttgaaaagga taaggtagaa ttatccttga gtaaaaaatg taaacgagat + 11821 tgggtgaaat ttcagtcacg taagtatttt accgaaaaat attattcaaa atttttaggt + 11881 tttcttcttt tttttgttga aatatttaat ttgtttcaaa ttatgatagg acacttaaaa + 11941 aataatatta taaagaagaa tctgaaagga aactctagtg aaaaaaagta gtacgttaca + 12001 tagtagtacg ttacatatag gacttattct ttttttgatt gtactgagta aaaacttctt + 12061 taatttagta ccaaatatag cactgttttc tgattttaat cttatgatta ttataatcat + 12121 catgacagtt gttaatatta aatactataa tcgctcaacc aaatatcagt atcgttggta + 12181 tattattttc acattgatat ttgtgttgta tagtgcaatt aatgagaaac tattatatgg + 12241 gcaaccattt ctattaggtt tacttcctca aagacaattt tttttatgtt taatgactta + 12301 tttcccttta agaaagtatt tccaagaaca aaatattagt ttaaaaaaac tttatgttgg + 12361 tattatgaat ttgggatcta tttcatcgtt aatttacatt ttacaaaaga tagtaatatt + 12421 atatggggga acacaatttg ttaacgtaat atatagtttt gccggatatt ttagcgggta + 12481 tagattgtat gtaggtagtt ctttaattat tttagcaaca ttaatttcta ccgcttattt + 12541 tttagaaaca ttaaaactca agtatctgtg ccaccttata ttaggttggt ttactcaaat + 12601 ttggataacg caaggtcgaa tagagatgat tgttttgcta atttcaacga tagtttgcat + 12661 aatagtccaa ggaagattaa ctagaaagaa aataatttat tggttgctga caattttggg + 12721 actgtggatg attactctaa cacctatttt tgaaaatatt gttggagcta ttttaaaagt + 12781 agatggagca ggtagaggaa gtgattcatt gactattcga gcaattggac gacagttata + 12841 ttgggaacaa ttgaatgaga caacttcaaa acttcttttt ggaacaggat accctaatta + 12901 taattatgct ttagcctttc aacgtacagg tttttcaagc aatatttttt taacagacaa + 12961 tggttttatg acatatatat atatatttgg tattgtgggt tcctcaatta tgggattatt + 13021 atttttaaaa tatcttaaaa attcaataaa gtatgctaga caatctgcag atatgattcc + 13081 gttgatgtat attatttctt tactaattgt agcctataat attattcttt ggtattggaa + 13141 tgcggacggt acttttatat tagtaatcat gatttgcgca ttggagcatg gagaacaatt + 13201 attacatcag aggaatggag 
tgtgattaga tgaatttaaa taaagaagtt agatggaagg + 13261 ataagcaata tattgctttt gatttttttg atacaactat ccatagaaat tgtcatcctg + 13321 aagtgatttt atttgaatgg tctaaaaaaa tttctattta tttctctttc aaaatatctg + 13381 ctacagaaat ttattcaatt aggaaaaaat ctgaaataca tgagaagcaa gaaaaacaat + 13441 tggaagaaat taaatatgaa agattacttc aacttgtttt ttatactatt ttaagtcgtt + 13501 tgaagtcaga tgttaccgac tataatcttg aagatttttt aatttatgca agaacgtgtg + 13561 aagaggaaat agaattaaga catattagta ttgatacaga tacaattaat tttattgaat + 13621 ttttaaaaca aaatgggaaa aaaataattt taatttcaga tttttattct gataaaaagc + 13681 taattgaaaa attaatggtt tcattaggga ttagagatta tttctctaaa atatttattt + 13741 caagtgaaat tgggttacgt aagtcatcag gaaatttata tcaatatgtg atcaatgaat + 13801 tgagctgtaa gcctataaat ttacttatga ttggtgataa tatttattct gatgtaaaag + 13861 ttccaaaaaa actaggaata gattcttatc ataaatctta ttcagattca catgtgactg + 13921 tgagtcctaa cgatattgta aaagcgatga ataatgttat ttctcaagct tgtactgaat + 13981 ctttatttaa tctctatata cctgaaatac tttattttat ttcaaagtta tacaaagaat + 14041 tatctgttaa caaagctagt gatatattat tttgtgcaag agaaggtttt tttataaaaa + 14101 aattatttga tctttatcaa aaaaaaatga acttaaagct tattaactca cattattttt + 14161 atgtttctag aaaatcaacg ctatatccat catttaaaaa tattgaggat gaagactttg + 14221 aagttatttt tagacaattt cctgaaatta ttttagaaaa ttttttgatt aatttaaatt + 14281 tttccaataa tgatattaac agtatttctg agcaaacaga aattaaacaa acagacaaag + 14341 tatcagataa atctattatt aacaaattaa aacaaaataa attatttaaa gatgtttatg + 14401 atttgaactg taaagaagaa aaatattctt ttagagaata tttaaagtct gtaggagttg + 14461 agaatgacaa ttctacaata aatatggtag atattggttg gaaaggcacg atacaagaca + 14521 atattcaaaa agcttttcca tctttaaata taaaagggta ttatatgggg ttgaattttc + 14581 aacggtattc tactaggaat agtatgaata agacgggaat actgtttact gatgatcctc + 14641 aaaaaacaaa gttttttaac ttatttaatt ataaatattt attctatgaa agaatctttg + 14701 ttgcagatca tggaccgaca gttagatatg aatttatgaa tggtgttggg gtaccaacat + 14761 tggatacaga tgaaaatcat atagaaattt atagattttc tgaggaattt cagattacat + 14821 ttttcaacac atttgagaaa 
attttagatt tgttcaatga atcactagta acaccagatg + 14881 aattatttaa cgaaatagct aatttatcat taaaaaaaca ttgcatctat ttaccaaggc + 14941 tttcagtaag tataaaaaaa ttagatagag cagcaaaaga aaattttggt attataaaat + 15001 ctactaacag gaatagtgat aataaggtaa gaaatttttg gaaaaataga gattttttat + 15061 ttttagatta tatatataaa gcgtatggaa agaatagatt gttaaaccct atattggata + 15121 tttacggata ttttgtatat ctgattaaaa cactgcaaat aaaaatagta ggggatattt + 15181 gatgagcatg aaagaaaaat caataaataa aaatgctatt ttgaatatta ttttaacact + 15241 aacaaatatt gtgtttccat taattacttt tccttatatt tctagaattc tgaatccgtc + 15301 aggaataggt gcaatctctt ttttttcatc tattggttct tatggtgttt tagttgcttc + 15361 gcttggaatt tcaacttatg ggattcgggt gattgcaaag gatcgttatc ataaagataa + 15421 gataactaaa atattccaag aattgatagt tattaatagt gtaatgtcta ttatagtgac + 15481 gttcttcctt gttttaatga gtttccgatt agagcagtta agttcagaaa aaggtttatt + 15541 aataatcaca tgtattacta ttttgtcctc tccttttaat ttgaattggt tttatagtgg + 15601 aatagaagag tattcatata taacaaaacg ttcaatattt tttaaattag tttcattgat + 15661 attaaccttt ttatttgtta aaagtaaaga cgattatatt ctatatgctg tgataacatt + 15721 gttttcaaca ttggcttcca attttataaa tattttggag agtagaaaat acatcaattt + 15781 taatttgaga agggatttag aatttagata tcatctaaaa ccaatgtggt atttatttgc + 15841 ttcgttactt gcagttaata tttatataaa tttggattct gtgatgttag gaattattaa + 15901 tggaaatgat gcggtaggta tttactcaat cgcatcaaaa gtaaaatgga ttttattatc + 15961 agtcgttact tcagtgagtt cagttttatt acccagatta tcattttata gcaataaata + 16021 tgacgaaacg aagtttaata atattttgag aaagtcatct acaataattt ttatgatttc + 16081 aattcctcta acaatttttt ttatgataaa agcgaaagag agtatattat tgttaggtgg + 16141 agagcagtat attcaggcag ttttagcaat gcaaatatta atgccgatct tgataatatc + 16201 aggtttttcc aatattacag gtaatcagat attgatccct actggtaatg agaaatattt + 16261 tatgagagca gtttctatag gggcaatagt aaatttatgt ttaaatttgt tgcttatgcc + 16321 tatttgggga attatcggag gtgcgatcgc aactctttgt gcagaattag tccaaatgat + 16381 tattcaattt tatttttctc gtaataaatt aatgggtaat atttcattaa attcaatcaa + 16441 aaaagtagcc tattcatcaa 
tttttgcggg tatactgtta atagtaatac aaaatattat + 16501 agagaatttt aatagcttct taaatttagc tgcatctagt tttctatatt ttggagtata + 16561 ttttttctta ttggtattgt ttaaagaaag tacaattaag aaatttctaa atcaaatttt + 16621 ttataaggat atttcatgaa tttattacca attatttatg gagcgattct tgatttaata + 16681 ttagaataat tttttaaagt gaatgaaatc aaagcaataa aagactaaaa ataaattgct + 16741 atctattatg tttttctcaa actaagtaaa acataactca tgaaaacaaa tttaaaaagg + 16801 agggactata gtatgaaagg tattattctt gcaggtggtt cggggacacg tttatatcct + 16861 ttgactcgcg ctgcatcaaa acaacttatg ccggtttatg ataaaccgat gatttactac + 16921 ccactttcaa cattgatgtt ggctgggatt agggatattt tgattatttc cactccacag + 16981 gatttacatc gatttcaaga gcttcttcaa gacggatctg agtttgggat caaactttct + 17041 tatgcagagc aaccaagtcc agatggtttg gcacaagcct ttatcattgg ggaagagttt + 17101 atttctgatg atagcgttgc gctaatctta ggtgataata tctatcacgg ttctgggctt + 17161 tccaagatgc tacaaaaggc agcgagtaag gagtcgggag caactgtttt tggctaccac + 17221 gtcaaggatc cagagcgctt tggtgtggtt gagtttgatc aggatatgaa ggctatttct + 17281 attgaagaaa agccagagca acctcgttca aactatgcag tgacaggact ctatttctat + 17341 gataatgatg tagtagagat tgccaagagt atcaaaccaa gtcctcgtgg tgaattggaa + 17401 attacagatg tcaacaaggc ttacttggat cgtggtgatt tgtctgttga gctcatggga + 17461 cgtggttttg cttggttgga tactggcact catgaaagtt tactagaggc ttcgcagtac + 17521 atcgaaacag tccaacggat gcaaaatgtt caggtagcaa acttagaaga aattgcttac + 17581 cgtatgggct atatcagtcg agaagatgta ttggccttag cccaaccact taagaaaaat + 17641 gaatacggac agtatctgct ccgtttgatt ggagaagcat agatgacaga taagtttttc + 17701 ggtaagacgc ttgcggcacg caaggttgaa gctattccag gcatgttgga gtttgatatc + 17761 cccgttcatg gagataatcg tggctggttt aaagaaaatt tccaaaagga aaaaatgctt + 17821 ccacttggat ttccagagtc tttctttgca gaaggaaaat tgcaaaacaa tgtatccttc + 17881 tcacgtaaaa atgtccttcg aggcctccac gcagagcctt gggataagta catctctgta + 17941 gcagatggag ggaaagttct gggttcttgg gttgatctac gcgagggtga aacctttggg + 18001 aatacctatc agacagtgat tgatgcgagt aagggaatct ttgttcctcg aggcgtagct + 18061 aatggcttcc aagttttatc 
agatacagtg tcatatagct atctggtcaa tgattactgg + 18121 gcgcttgaac tcaaacccaa gtatgccttt gtgaactacg ctgatccaag ccttggtatt + 18181 gaatgggaaa atattgcaga agcagaggtt tcagaagcag ataaacatca tcccctactt + 18241 aaggacgtga agcctttgaa aaaagaagat ttggaataag gaaagaatat gactgaatac + 18301 aaaaatatta tcgtgacagg tggagctggc tttatcggtt ctaactttgt ccattatgtt + 18361 tacgagaact ttccagatgt tcacgtgaca gtcctagata agttgactta tgctggaaac + 18421 cgcgcgaata ttgaggaaat tttaggtaat cgtgttgagt tagttgttgg tgacattgct + 18481 gatgcggagt tggtagacaa gttggctgct caagcagatg ctatcgttca ttatgcagcg + 18541 gaaagccaca atgataattc gctcaatgat ccatcgccat ttattcatac taacttcatt + 18601 ggaacctata ctcttttaga agctgctcgt aagtatgata ttcgcttcca ccatgtatcg + 18661 acagatgaag tttatgggga tctcccttta cgcgaagatt tgccaggtca tggagaaggg + 18721 ccgggtgaga aatttacggc tgaaaccaag tacaatccaa gctcgcctta ctcatcaacc + 18781 aaggcagcct cagatttgat tgtcaaagcc tgggtgcgtt cttttggagt caaggcaacg + 18841 atttccaact gttcaaataa ctacggtcct tatcaacata tcgaaaaatt catcccacgt + 18901 cagattacta acatcctaag tggtatcaag ccaaaacttt acggtgaagg taaaaacgtt + 18961 cgtgactgga ttcataccaa tgaccattct tcaggagttt ggacaatctt gacaaaaggg + 19021 caaatcggtg aaacctactt gattggggct gatggtgaga agaacaataa ggaagttttg + 19081 gaacttatcc ttaaggaaat gggacaagct gcggatgcct atgatcatgt gactgaccgt + 19141 gcaggacatg accttcgcta tgcgattgat gctagcaagc tccgtgatga gttggggtgg + 19201 aaacctgaat ttaccaactt tgaagctggg ctcaaggcaa caatcaagtg gtatacagat + 19261 aaccaagaat ggtggaaagc agaaaaagaa gctgttgaag ccaattatgc taagactcag + 19321 gagattatta cagtataaaa agcaggaaat agctgctttt tattgctata ttgggaagag + 19381 ttacatatta gaaaggtcta gagatgattt taattacagg ggcaaatggc caattaggaa + 19441 cggaacttcg ctatttattg gatgaacgta atgaagaata cgtggcagta gatgtggcta + 19501 agatggacat taccaatgaa gaaatggttg agaaagtttt tgaagaggtg aaaccgactt + 19561 tagtctacca ttgtgcagcc tacaccgctg ttgatgcagc agaggatgaa ggaaaagagt + 19621 tggacttcgc catcaatgtg acggggacaa aaaatgtcgc aaaagcatct gaaaagcatg + 19681 gtgcaactct agtttatatt 
tctacggact atgtctttga cggtaagaaa ccagttggac + 19741 aagagtggga agttgatgac cgaccagatc cacagacaga atatggacgc actaagcgta + 19801 tgggggaaga gttagttgag aagcatgtgt ctaatttcta tattatccgt actgcctggg + 19861 tatttggaaa ttatggcaaa aacttcgttt ttaccatgca aaatcttgcg aaaactcata + 19921 agactttaac agttgtaaat gatcagtacg gtcgtccgac ttggactcgt accttggctg + 19981 agttcatgac ctacctagct gaaaatcgta aggaatttgg ttattatcat ttgtcaaatg + 20041 atgcgacaga agacacaaca tggtatgatt ttgcagttga aattttgaaa gatacagatg + 20101 tcgaagtcaa gccagtagat tccagtcaat ttccagccaa agctaaacgt ccgctaaact + 20161 caacgatgag cctggccaaa gccaaagcta ctggatttgt tattccaact tggcaagatg + 20221 cattgcaaga attttacaaa caagaagtga gataagtagt agaatgattt tctagtctaa + 20281 taaaagaggc agataatgaa ctccaaagga gcttaagatg tacgattatc ttgttgttgg + 20341 tgctggtctc tttggcgcat agctttggct cagtttctat tatcgctcac accatccatc + 20401 agaagtttaa tctgaaggta cccaattatc gccaagaaga agattgggct aggatgggtt + 20461 taccaatcac acgtaaggaa atctctaatt ggcatatcaa ggcaagtcaa tactatttag + 20521 agtcccttta taacctttta cgagaaaagt tgttagaaca acctcttctt catgcggatg + 20581 aaacctctta tcgggtctta gaaagtgata gtcagctgac ctactattgg acctttttgt + 20641 ctgggaaagc tgagaatcaa gtaatcacgc tgtaccacca tgatcagtgt cggagtggtt + 20701 cggtagtgca agaattccta ggagattatt ctggctatgt gcattgtgat atgttgcggc + 20761 agtaacttag gactttagtc ctctagttct gtctatgcga tagcagtcca aggtttagga + 20821 gcaaggcgac gctaagcttg gtaaactgcg aaccgctaga agcttatcgt caactggaag + 20881 aagctgaact tgttggatgt tgggcgcatg tgagaaggaa attttttgaa gtgcccccca + 20941 agcaagcaga taaatcatcc ttaggagcta aaggtttagc ttattgtgat cagttatttt + 21001 ccttggaaag agactgggag gctttgccag ctgatgaacg actacagaaa cgtcaagaac + 21061 atctccaacc cctaatggaa gacttctttg cttagtgccg tcgtcagtca gttttatcgg + 21121 gttcaaaact aggaagggca attgaataca gcctcaagta tgaagaaacc tttaagacca + 21181 ttttaaaaga cggacatctg gtcctttcca ataatctagc tgaacgcgcc attaaatcat + 21241 tggttatggg acggagtaaa agagtccagt ggactctttt agcctaagct aaattttaaa + 21301 aagcgagggt ggttattttc 
tcaaagtttt gaaagagcta aagcaagagc tattattatg + 21361 agcttattgg aaacagctaa acgtcatcaa ctaaatagtg agaaatatct atcctatctt + 21421 ctagaatgtc ttccaaacga ggaaactctc gtaaacaaag aggttttaga ggcctattta + 21481 ccatggacta aagttgtaca agaaaagtgc aaataagaaa tctccagatt aggaactatc + 21541 cgtgagttca ctaatctgga gatttttcaa tagacctcgt tattgggcgg ttacgatatt + 21601 catatttttt gcaaagatgt tgtttgaaaa ataattttca aaaattctga aaattctgtt + 21661 gacatctttc tgaaaagagt ctataatgga gagaaagttt taaaggagaa aatgatgaaa + 21721 agttcaaaac tacttgccct tgcgggcgtg acattattg +// diff --git a/public/res/serotype_genbank/serotype_7F.gb b/public/res/serotype_genbank/serotype_7F.gb new file mode 100644 index 0000000..9c454ee --- /dev/null +++ b/public/res/serotype_genbank/serotype_7F.gb @@ -0,0 +1,1041 @@ +LOCUS CR931643 24127 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 554/62 (serotype 7f). +ACCESSION CR931643 +VERSION CR931643.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 24127) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 24127) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. 
For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..24127 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="554/62" + /db_xref="taxon:1313" + gene <1..163 + /gene="dexB" + /locus_tag="SPC07F_0001" + CDS <1..163 + /gene="dexB" + /locus_tag="SPC07F_0001" + /codon_start=2 + /transl_table=11 + /protein_id="CAI32919.1" + /db_xref="GOA:Q4K2R1" + /db_xref="InterPro:IPR013780" + /db_xref="UniProtKB/TrEMBL:Q4K2R1" + /translation="DRRFLVVANLSNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVP + WDAFCVELL" + gene 322..487 + /gene="aliB" + /locus_tag="SPC07F_0002" + /pseudo + CDS 322..487 + /gene="aliB" + /locus_tag="SPC07F_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(488..1351) + /gene="tnp" + /locus_tag="SPC07F_0003" + /pseudo + CDS complement(488..1351) + /gene="tnp" + /locus_tag="SPC07F_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(977..1333) + /gene="tnp" + /locus_tag="SPC07F_0003" + /note="HMMPfam hit to PF01710, Transposase, score 4e-17" + /pseudo + gene 1572..3026 + /gene="wzg" + /locus_tag="SPC07F_0004" + CDS 1572..3026 + /gene="wzg" + /locus_tag="SPC07F_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI32922.1" + /db_xref="GOA:Q4K2R0" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K2R0" + /translation="MLIMSGRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNI + LAFRYLNLVVTVLVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGL + TNRLNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNT + DLTVNQSSSYLATYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKV + EAPKTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKRILLTTTPRDSYVPI + 
ADGGNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVH + NDQEFSAPHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKL + TSTEALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRMDL + PSYAMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1572..1697 + /gene="wzg" + /locus_tag="SPC07F_0004" + /note="Signal peptide predicted for SPC0236 by SignalP 2.0 + HMM (Signal peptide probability 0.990) with cleavage site + probability 0.547 between residues 42 and 43" + misc_feature 1785..2132 + /gene="wzg" + /locus_tag="SPC07F_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 8.5e-63" + misc_feature 2310..2753 + /gene="wzg" + /locus_tag="SPC07F_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 3e-70" + gene 3028..3759 + /gene="wzh" + /locus_tag="SPC07F_0005" + CDS 3028..3759 + /gene="wzh" + /locus_tag="SPC07F_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI32923.1" + /db_xref="GOA:Q4K2Q9" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K2Q9" + /translation="MIDIHSHIVFDVDDGPKSREESKALLEESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTLDALEKLEKKEIPTLNDS + RYALIEFSMHTSYRQIHTGLSNILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QINSHHISKPKFFGEKYKFMKKRARYFLERDLVHVVASDMHNLDSRPPYMQQAYDIIA + KKYGVKKAKELFVDNPRKIIMDQLI" + misc_feature 3031..3639 + /gene="wzh" + /locus_tag="SPC07F_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 2.7e-39" + gene 3768..4460 + /gene="wzd" + /locus_tag="SPC07F_0006" + CDS 3768..4460 + /gene="wzd" + /locus_tag="SPC07F_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI32924.1" + /db_xref="GOA:Q4K2Q8" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K2Q8" + 
/translation="MKEQNTLEIDVLQLFRALWKRKLVILLVAIITSSVAFVYSTFVI + KPEFTSTTRIYVVNRDQGEKSGLTNQDLQAGSYLVKDYREIILSQDVLEEVVSDLKLD + LTPKGLANKIKVTVPVDTRIVSVSVNDRVPEEASRIANSLREVAAQKIISITRVSDVT + TLEEARPAISPSSPNIKRNTLIGFLAGVIGTSVIVLLLELLDTRVKRPEDIEDTLQMT + LLVVVPNLSKLK" + misc_feature 3786..4202 + /gene="wzd" + /locus_tag="SPC07F_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 1.3e-52" + misc_feature 4308..4385 + /gene="wzd" + /locus_tag="SPC07F_0006" + /note="PS00217 Sugar transport proteins signature 2." + gene 4470..5153 + /gene="wze" + /locus_tag="SPC07F_0007" + CDS 4470..5153 + /gene="wze" + /locus_tag="SPC07F_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI32925.1" + /db_xref="GOA:Q4K2Q7" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K2Q7" + /translation="MPTLEIAQKKLEFIKKAEEYYNALCTNIQLSGDKLKVISVTSVN + PGEGKTTTSVNIARSFARAGYKTLLLDGDTRNSVISGFFKSREKITGLTEFLSGTADL + SHGLCDTNTENLFVVQSGSVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTAPIGIVI + DAAIITQKCDASILVTATGEVNKRDVQKAKQQLEQTGKLFLGVVLNKLDISVDKYGVY + GSYGSYGKK" + gene 5169..6536 + /gene="wchA" + /locus_tag="SPC07F_0008" + CDS 5169..6536 + /gene="wchA" + /locus_tag="SPC07F_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI32926.1" + /db_xref="GOA:Q4K2Q6" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K2Q6" + /translation="MDEKGLKIFLAVLQSIIVILLVYFLSFVREAELERSSMVILYLL + HFFVFYFSSYGNNFFKRGYLVEFNSTIRYIFFFAIAISVLNFFIAERFSISRRGMVYF + LTLEGISLYLLNFLVKKYWKHVFFNLKNSKKILLLTVTKNMEKVLDKLLESDELSWKL + VAVSVLDKSDFQHDKIPVIEKEKIIEFATHEVVDEVFVNLPGESYDIGEIISRFETMG + IDVTVNLKAFDKNLGRNKQIYEMVGLNVVTFSTNFYKTSHVISKRILDICGATIGLIL + 
FAIASLVLVPLIRKDGGPAIFAQTRIGKNGRHFTFYKFRSMRSDAEAIKEQLMDQNTM + QGGMFKIDNDPRVTKIGRFIRKTSLDELPQFWNVFIGDMSLVGTRPPTVDEYVQYTPE + QKRRLSFKPGITGLWQVSGRSKITDFDDVVKLDVAYIDNWTIWKDIEILLKTVKVVFM + REGAK" + misc_feature 5952..6533 + /gene="wchA" + /locus_tag="SPC07F_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 8.8e-145" + gene 6565..7737 + /gene="wchF" + /locus_tag="SPC07F_0009" + CDS 6565..7737 + /gene="wchF" + /locus_tag="SPC07F_0009" + /note="member of homology group 15" + /codon_start=1 + /transl_table=11 + /product="putative rhamnosyl transferase WchF" + /protein_id="CAI32927.1" + /db_xref="GOA:Q4K2Q5" + /db_xref="InterPro:IPR001296" + /db_xref="InterPro:IPR015393" + /db_xref="UniProtKB/TrEMBL:Q4K2Q5" + /translation="MKQSVYIIGSKGIPAKYGGFETFVEKLTEYQKDSNIQYYVACMR + ENSAKSGIMDDQFEHNGAICFNIDVPNIGPARAIAYDIAAVNKAIELAKKNKDEAPIF + YILACRIGPFISGLKKKIRAIGGRLLVNPDGHEWLRAKWSLPVRKYWKFSEQLMVKHA + DLLVCDSKNIEKYIQEDYKQYQPKTTYIAYGTDTTPSILKAEDAKVRDWYQEKGVSEN + GYYLVVGRFVPENNYEAMIREFIKSKSKKDFVLITNVEQNKFYDQLLQDTGFDKDPRV + KFVGTVYDQELLKYIREYAFAYFHGHEVGGTNPSLLEALASTKLNLLLDVGFNREVGE + DGAIYWKKDELARVIEEVEGFDQAAITDLDFKSSQRILSAFTWEKIVSDYEEVFKG" + gene 7741..8889 + /gene="wcwA" + /locus_tag="SPC07F_0010" + CDS 7741..8889 + /gene="wcwA" + /locus_tag="SPC07F_0010" + /note="member of homology group 63" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI32928.1" + /db_xref="GOA:Q4K2Q4" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K2Q4" + /translation="MKRILYLHAGAEMYGADKVLLELIKGLDSKEFEAHVILPNDGVL + VKALRQVGAQVSVLDYPILRRKYFNPKGILEYLKSYRRYSQKISQYVRENGIDLVHNN + TTAVLEGIYLKRKVKLPLIWHVHEIIVKPKAISDFINFLMGRYADKIVTVSQAVSSHV + KQSPFIKEGQVQVVYNGVDNAVYHPMQASTVREQFAIPEESLVIGMVGRVNAWKGQGD + FLEAVAPILEQNPNSIAFLAGSAFAGEEWRVEELESTIAKSSVASQIKRIDYYEHTTE + LYNMFDIFVLPSTNPDPLPTVVLEAMACGKPVVGYRHGGVCEMIKEGKNGLLATPNKP + AELSKAIQELADNIEKREQLGSASFQRQKEFFSLESYIRNFSELYKKY" + misc_feature 8302..8823 + /gene="wcwA" + /locus_tag="SPC07F_0010" 
+ /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 4.1e-30" + gene 8891..9568 + /gene="wcwC" + /locus_tag="SPC07F_0011" + CDS 8891..9568 + /gene="wcwC" + /locus_tag="SPC07F_0011" + /note="member of homology group 48" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI32929.1" + /db_xref="GOA:Q4K2Q3" + /db_xref="InterPro:IPR015037" + /db_xref="UniProtKB/TrEMBL:Q4K2Q3" + /translation="MNTKMNTKMNTKMNTETIKNKLKPIVYPIINFIPRRRLKNKNFT + IICDNCWAGKVYQELGLPYQTPFVGMFVFSPDYIKMLKNLKHYLSGNIPLTFVKESKY + VKDFDNAYPLALLDDIELHFLHYADEEEATQKWNRRLERIHWDNLYFKFNDNDACTYE + LMKEFEELPYKSKVIFSSRNYSGLPSLVHFKSAEKQGHVGIDLKTYHRYFNCVTWLNK + GGEDLTK" + gene 9565..10527 + /gene="wcwD" + /locus_tag="SPC07F_0012" + CDS 9565..10527 + /gene="wcwD" + /locus_tag="SPC07F_0012" + /note="member of homology group 98" + /codon_start=1 + /transl_table=11 + /product="conserved hypothetical protein" + /protein_id="CAI32930.1" + /db_xref="UniProtKB/TrEMBL:Q4K2Q2" + /translation="MKKIRIIIPYFGKLPTFFPYFLLTAKRNQKIDFLVYTDQKVDEF + AMLNAKNIEFVTLSFDELREKVQSKFDFKISLKTPYKFCDYRPAYGLIFEEELKGYDY + WGFCDTDVLLGDIYQFLEEHSFFENDYARYGLFGHLQIFKNLREVNHIFMSGQGSDYR + LDYHNVYTSEQSFIFDESEGIQKLFEKCHFKQLQDKFFDDIDISHFSFREYGENKSKR + YYFWSEENGLESINLINDDIVVKRPLYAHFQKRMIKCPDFKLVDSFYVIPNQLVIGEK + ISKQELVEVTRNKFYWEYVKSTMLKKLKKEKWTFEFIRHKLRMK" + gene 10538..11049 + /gene="HG140" + /locus_tag="SPC07F_0013" + /pseudo + CDS join(10538..10687,10690..10794,10798..11049) + /gene="HG140" + /locus_tag="SPC07F_0013" + /note="member of homology group 140" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase (pseudogene)" + gene 11377..12390 + /gene="wcwF" + /locus_tag="SPC07F_0014" + CDS 11377..12390 + /gene="wcwF" + /locus_tag="SPC07F_0014" + /note="member of homology group 141" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI32932.1" + /db_xref="GOA:Q4K2Q1" + /db_xref="InterPro:IPR001173" + 
/db_xref="UniProtKB/TrEMBL:Q4K2Q1" + /translation="MKDDMIIQNILLTIVIPVYNVEKYLKRCIDSVISQEWDKYEVIL + VNDGSTDASPNICEEYAQKYHFISVIHKENGGLSETRNTGLSHANGKYVFFLDSDDWI + TKDMFRNLSKMIMEQNYDILQFGMQMFHSEREELKNVQCKEKNFNSSDAFKNMLSVEG + ITSFATDKIYKRELFEKNGIEFPIGYFYEDLGTVYKLILSAKKIYLTTQVYYCYFIGN + DAAITKQWSEKKISDVYKFHKKIFNVSSLMVSDDIFLSKSYYNNGLVYLLMKLYEENQ + EDTQLFRLILAELDANIVPIKYLRNYPNFLKYVFYRIRLLKLIVILKLTLTKIKKWNQ + KKH" + misc_feature 11413..11913 + /gene="wcwF" + /locus_tag="SPC07F_0014" + /note="HMMPfam hit to PF00535, Glycosyl transferase + family, score 1.2e-44" + gene 12369..13307 + /gene="wcwG" + /locus_tag="SPC07F_0015" + CDS 12369..13307 + /gene="wcwG" + /locus_tag="SPC07F_0015" + /note="member of homology group 142" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI32933.1" + /db_xref="GOA:Q4K2Q0" + /db_xref="UniProtKB/TrEMBL:Q4K2Q0" + /translation="MESKKTLIIFEQIDTFEQFLERNIIFNNVDIFTPYKKVSNVFMH + NFRAIAKRLPGFLFHNWWLEEWSRKLPDYTNIVVFDNAISLKLLEYIDAHKTRSSKLK + LWLWNVPNKQVNYLNSNYDVYCFDKTYSENYNLKFVEQFYVLGSTKKRDILDIEYDFY + FIGADKGRLPKLKSLAKQIVLNNYSYRFDVFSVKKQYFDSEFEGIQVIDTLLPYDEVL + DNILASNVIVELNKKGQDGLTLRAMESIFYKKKLITNNKKIINYDFYHPNNILVWEEG + KDIKLDEFIQKPYVQLEKDIIDRYSFSNWLSKITEI" + gene 13317..14384 + /gene="wcwH" + /locus_tag="SPC07F_0016" + CDS 13317..14384 + /gene="wcwH" + /locus_tag="SPC07F_0016" + /note="member of homology group 143" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI32934.1" + /db_xref="GOA:Q4K2P9" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K2P9" + /translation="MRITFCLPEISTVPTGGYKIIFEYANRLSERGHEITLVFLTNNV + WNRVTKNCKIKSIVGNIRGKKNPSWFKLKPTIRKIMTPYLDGRDFPEADFIFATAVTT + ANIVKEMPEKYGKKCYLIQGFETWLLPESKVIETYNYGFLNITVSKWLCDIVQSYTET + PVFCVSNPIDTEIFYLLNPIEKRNPFHLGMLYHEGEHKGISYAIDAIKKVKKIYPEIE + VNIFGVPSRPVFLPEYFNYTQQATQQELQKIYNDTSIFLCATIDEGFGLTGAESMACG + CALVSTAYSGVFEYAIDGENALLSPIKDSVSLATNIIKLIRNHDLRLSIATQATKDMK + KRGWEKTTLKLENILSEFTNF" + misc_feature 
13821..14312 + /gene="wcwH" + /locus_tag="SPC07F_0016" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 1e-15" + gene 14365..15816 + /gene="wzy" + /locus_tag="SPC07F_0017" + CDS 14365..15816 + /gene="wzy" + /locus_tag="SPC07F_0017" + /note="member of homology group 144" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI32935.1" + /db_xref="UniProtKB/TrEMBL:Q4K2P8" + /translation="MNLLIFKDVLISMIIKLDKQKCYFIMLLLLMCVVQLTASVSMGV + ISIALTVLPILWNLNNPSKLLFSQILYLFQFQFYVSYLSFPLGISFICDIINLFLLFN + IFKDSKLLQWELRNINLKTIIFVWVLFFLIGIFSNFLYDLNIALIVWSLRNYIRFIIF + FISCCLYIDKYSINLGEYLIKLFYWFNIFFTSFQYFVLLKSGDFLGGIFGNELGISNT + YLHILLILILILSVVNYVSDNSSLVILTSYIVSTLYVAALSELKIIFVELPIIIILTL + LFKRLGIKILLKIISITCIVVVALAISIPILYELFPIFDNFFKLEKLFGYSTGNYSTS + SDFGRLSSIVQIISTIFYGDVWQTLFGIGLGEAEISKIPIFSGSFYYNYEYTHYYLFT + LSYVFIENGFIGLFLFMFMPIYLALKMIFERGTSKYDLLLIVLSISLFMLLLYNNTMR + SEIYYLYLFVLSWGVAINRGNGGCYENNKKLCL" + misc_feature 14365..14484 + /gene="wzy" + /locus_tag="SPC07F_0017" + /note="Signal peptide predicted for SPC0249 by SignalP 2.0 + HMM (Signal peptide probability 0.623) with cleavage site + probability 0.185 between residues 40 and 41" + gene 15740..17209 + /gene="wzx" + /locus_tag="SPC07F_0018" + CDS 15740..17209 + /gene="wzx" + /locus_tag="SPC07F_0018" + /note="member of homology group 7" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI32936.1" + /db_xref="GOA:Q4K2P7" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K2P7" + /translation="MFFHGELQSIEEMGDVMKTIKNYAYKSFYQLFLIIVPFITIPYV + SRILGAELIGINSYTNTIISYFVLIANLGILIYGNRTIAYHRESIEERSKKFWEIVSI + KLLVAIVAYVIFIIFLFFYSKYSWVFVIQSVQIIATAFDISWLFDGVEDFKRTVVRNF + LVKIISIILIFTFVKSTEDFDKYIWITVGSTLMGNLTLWSYLHHYIIKIPIKSLKLSE + HLVPILTLFIPQIASIVFMSINKILLGNISTISQAGYFENADKVIRILLALVSSIGVV + VFPKVAHAYRSGDMKRVLGLTYMTFDAVNIITIPIVVGIVSISPTFSSIFFGTEFQGI + DKVLSVLVLELIFMGYTSVLGSQYLIVTGQTYFLSISVFLGIFSTVISSFFFIPIYGA + 
LGSAISSVIGEASIMIGEIYLLRNQVDFYYLYRDVPKYMIASAVMYISISSLNYFISS + PFVSLLSSIAMGAVTYVTVVLLLCPRIVIKLLNKNTRFF" + misc_feature 15794..16594 + /gene="wzx" + /locus_tag="SPC07F_0018" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 1.4e-47" + gene 17335..18204 + /gene="rmlA" + /locus_tag="SPC07F_0019" + CDS 17335..18204 + /gene="rmlA" + /locus_tag="SPC07F_0019" + /EC_number="2.7.7.24" + /note="member of homology group 10" + /codon_start=1 + /transl_table=11 + /product="glucose-1-phosphate thymidylyltransferase RmlA" + /protein_id="CAI32937.1" + /db_xref="GOA:Q4K2P6" + /db_xref="InterPro:IPR005835" + /db_xref="InterPro:IPR005907" + /db_xref="UniProtKB/TrEMBL:Q4K2P6" + /translation="MKGIILAGGSGTRLYPLTRAASKQLMPVYDKPMIYYPLSTLMLA + GIKDILIISTPQDLPRFKDLLLDGSEFGIKLSYAEQPSPDGLAQAFLIGEEFIGDDSV + ALILGDNIYHGSGLSKMLQKAAKKEKGATVFGYHVKDPERFGVVEFDENMNAISIEEK + PEQPRSNYAVTGLYFYDNDVVEIAKSIKPSPRGELEITDVNKAYLDRGDLSVELMGRG + FAWLDTGTHESLLEASQYIETVQRMQNVQVANLEEIAYRMGYISREDVLTLAQPLKKN + EYGQYLLRLIGEA" + misc_feature 17338..18054 + /gene="rmlA" + /locus_tag="SPC07F_0019" + /note="HMMPfam hit to PF00483, Nucleotidyl transferase, + score 2.2e-119" + gene 18205..18798 + /gene="rmlC" + /locus_tag="SPC07F_0020" + CDS 18205..18798 + /gene="rmlC" + /locus_tag="SPC07F_0020" + /EC_number="5.1.3.13" + /note="member of homology group 11" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-6-deoxy-D-glucose 3,5-epimerase + RmlC" + /protein_id="CAI32938.1" + /db_xref="GOA:Q7BTQ6" + /db_xref="InterPro:IPR000888" + /db_xref="InterPro:IPR011051" + /db_xref="InterPro:IPR014710" + /db_xref="UniProtKB/TrEMBL:Q7BTQ6" + /translation="MTDNFFGKTLAARKVEAIPGMLEFDIPVHGDNRGWFKENFQKEK + MLPLGFPESFFAEGKLQNNVSFSRKNVLRGLHAEPWDKYISVADGGKVLGSWVDLREG + ETFGNTYQTVIDASKGIFVPRGVANGFQVLSDTVSYSYLVNDYWALELKPKYAFVNYA + DPSLGIEWENIAEAEVSEADKHHPLLKDVKPLKKEDL" + misc_feature 18241..18771 + /gene="rmlC" + /locus_tag="SPC07F_0020" + /note="HMMPfam hit to PF00908, dTDP-4-dehydrorhamnose + 3,5-epimerase, 
score 8.8e-16" + gene 18811..19860 + /gene="rmlB" + /locus_tag="SPC07F_0021" + CDS 18811..19860 + /gene="rmlB" + /locus_tag="SPC07F_0021" + /EC_number="4.2.1.46" + /note="member of homology group 8" + /codon_start=1 + /transl_table=11 + /product="dTDP-D-glucose 4,6-dehydratase RmlB" + /protein_id="CAI32939.1" + /db_xref="GOA:Q4K2P4" + /db_xref="InterPro:IPR001509" + /db_xref="InterPro:IPR005888" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K2P4" + /translation="MTEYKNIIVTGGAGFIGSNFVHYVYENFPGVHVTVLDKLTYAGN + RANIEEILGNRVELVVGDIADAELVDKLAAQADAIVHYAAESHNDNSLNDPSPFIHTN + FIGTYTLLEAARKYDIRFHHVSTDEVYGDLPLREDLPGHGEGPGEKFTAETKYNPSSP + YSSTKAASDLIVKAWVRSFGVKATISNCSNNYGPYQHIEKFIPRQITNILSGIKPKLY + GEGKNVRDWIHTNDHSSGVWTILTKGQIGETYLIGADGEKNNKEVLELILKEMGQAAD + AYDHVTDRAGHDLRYAIDASKLRDELGWKPEFTNFEAGLKATIKWYTDNQEWWKAEKE + AVEANYAKTQEIITV" + misc_feature 18826..19782 + /gene="rmlB" + /locus_tag="SPC07F_0021" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 0.0001" + misc_feature 18829..19569 + /gene="rmlB" + /locus_tag="SPC07F_0021" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase fam, score 2.7e-76" + misc_feature 18832..19644 + /gene="rmlB" + /locus_tag="SPC07F_0021" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/iso, score 1.7e-05" + gene 19926..20777 + /gene="rmlD" + /locus_tag="SPC07F_0022" + CDS 19926..20777 + /gene="rmlD" + /locus_tag="SPC07F_0022" + /EC_number="1.1.1.133" + /note="member of homology group 9" + /codon_start=1 + /transl_table=11 + /product="dTDP-4-keto-L-rhamnose reductase RmlD" + /protein_id="CAI32940.1" + /db_xref="GOA:Q4K2P3" + /db_xref="InterPro:IPR005913" + /db_xref="InterPro:IPR016040" + /db_xref="UniProtKB/TrEMBL:Q4K2P3" + /translation="MILITGANGQLGTELRYLLDERNEEYVAVDVAEMDITDAEMVEK + VFEEVKPTLVYHCAAYTAVDAAEDEGKELDFAINVTGTKNVAKASEKHGATLVYISTD + YVFDGKKPVGQEWEVDDRPDPQTEYGRTKRMGEELVEKHVSNFYIIRTAWVFGNYGKN + FVFTMQNLAKTHKTLTVVNDQYGRPTWTRTLAEFMTYLAENRKEFGYYHLSNDATEDT + 
TWYDFAVEILKDTDVEVNPVDSSQFPAKAKRPLNSTMSLAKAKATGFVIPTWQDALQE + FYKQEVR" + misc_feature 19926..20774 + /gene="rmlD" + /locus_tag="SPC07F_0022" + /note="HMMPfam hit to PF04321, RmlD substrate binding + domain, score 5.7e-148" + misc_feature 19929..20570 + /gene="rmlD" + /locus_tag="SPC07F_0022" + /note="HMMPfam hit to PF02719, Polysaccharide biosynthesis + protein, score 0.0001" + misc_feature 19929..20558 + /gene="rmlD" + /locus_tag="SPC07F_0022" + /note="HMMPfam hit to PF01370, NAD dependent + epimerase/dehydratase f, score 5.6e-19" + misc_feature 19932..20660 + /gene="rmlD" + /locus_tag="SPC07F_0022" + /note="HMMPfam hit to PF01073, 3-beta hydroxysteroid + dehydrogenase/i, score 1.9e-08" + gene 20947..22021 + /gene="glf" + /locus_tag="SPC07F_0023" + /pseudo + CDS join(20947..21447,21446..22021) + /gene="glf" + /locus_tag="SPC07F_0023" + /EC_number="5.4.99.9" + /note="member of homology group 6" + /pseudo + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase Glf" + misc_feature order(21274..21446,21447..21880) + /gene="glf" + /locus_tag="SPC07F_0023" + /note="HMMPfam hit to PF03275, UDP-galactopyranose mutase, + score 1.2e-107" + /pseudo + gene complement(order(22144..22425,22754..23692)) + /gene="tnp" + /locus_tag="SPC07F_0024" + /pseudo + CDS complement(join(22144..22425,22754..23692)) + /gene="tnp" + /locus_tag="SPC07F_0024" + /note="member of homology group 13" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1167 transposase" + misc_feature complement(22940..23236) + /gene="tnp" + /locus_tag="SPC07F_0024" + /note="HMMPfam hit to PF01610, Transposase, score 1.3e-45" + /pseudo + gene 23975..>24127 + /gene="aliA" + /locus_tag="SPC07F_0025" + CDS 23975..>24127 + /gene="aliA" + /locus_tag="SPC07F_0025" + /codon_start=1 + /transl_table=11 + /protein_id="CAI32943.1" + /db_xref="UniProtKB/TrEMBL:Q4K0S2" + /translation="MMKSSKLFALAGVTLLAATTLAACSGSGSSTKGEKTFSYIYETD + PDNLNYL" + misc_feature 23975..24061 + /gene="aliA" + 
/locus_tag="SPC07F_0025" + /note="Signal peptide predicted for SPC0259 by SignalP 2.0 + HMM (Signal peptide probability 1.000) with cleavage site + probability 0.277 between residues 29 and 30" +ORIGIN + 1 cgaccgtcgc ttcctagttg tggctaactt gtccaatgaa gagcaagact tgacagtaga + 61 aggaaaagtc aaatctgtct tgattgaaaa caccctagct caagaagtct ttgaaaaaca + 121 aatcttagtt ccatgggatg ctttctgtgt ggaattacta taaatatttt ttgcagaaaa + 181 atttaaaatt gaaatcatat aaaaacaagg gaggactgta taaaaggcgg aaatcctttg + 241 ttttttataa ccaaggttta taaactttca ttctcgaaat tcaattaact ttacaaattc + 301 ccactattaa ggagaaagaa gatgaacata aagaagcgtg tccttagtgc aggcctgact + 361 tttgcatctg ccttgctttt agctgcttgc ggccaatcag gttcagatac aaaaacttac + 421 tcatcaacct ttagtggaaa tccaactaca tttaactatc tattagacta ttacgctgat + 481 aatatagtta attgaaacaa gaacaagaca aaagagcctc gtaaaaggta ttgcaacttg + 541 gtaatacctt tttggggtgc tttttgatat gagcccatgt tttctcaata ggattgtact + 601 caggtaagta gggaggaaga ggtaaaagtt tatgcccaaa ctcttcgcat aaaagttcta + 661 gcttccccat tctatggaat cttgcattat ccataataat aaccgatggt gtggttaatg + 721 ttggtaagag aaaattctga aaccaagctt caaaaaagtc gctcgtcatc gtctcttcgt + 781 aagtcattgg aacgattaac tcaccatttg ttagccctgc aaccaaagaa atcctctgat + 841 atcttcttcc agatactttg cctcttatta actgaccttt taaagagcga ccatattctc + 901 gataaaaata agtatcgaat cctgtttcgt caatataaac aggtgctagg tgctttaaac + 961 tattaaattc ttaagaaata aggctacttt ttctgggtct tgttcatagt aggtgtggtt + 1021 ctttttttcg agtgtagccc acagctttga gcgcatagtg gatggtagtt ggatgacagc + 1081 caaattcaga agctatttca gtcaaataag cgtctggatt gtcagtaaga tagtttttaa + 1141 gtctatctct atcaactttt cttggttttg ttccttttac ttggtggttt agctctcctg + 1201 ttttctcttt tagctttaac cagccataaa tggtattacg tgagatttgg aaaacgtgtg + 1261 atgcttctgt tatactacct gttcgctcac aataagagag aactttttta cgaaaatcta + 1321 ttgaatatgc tataaaaaga ttataccaca ttgtgtacca tattgaaact agaatagtac + 1381 atccctgctt ctaaaacatt gttagaaatc gatgtaactg tcctgatcgt tttgtcatgt + 1441 tcttatttca ttttactata tttttggttc gcgggaagtc tactaagata 
cttaaagatg + 1501 cagatagtga aaataaaggt gtagacatta ccgtaaaaaa gtgatataat cgtacaatgt + 1561 tcaaggtata ggtgttaatc atgagtggac gttttaaaaa atcacgttca cagaaagtga + 1621 agcgaagtgt taatatcgtt ttgctgacta tttatttatt attagtttgt tttttattgt + 1681 tcttaatctt taagtacaat atccttgctt ttagatatct taatctagtg gtaactgtgt + 1741 tagtcctact agttgccttg gtagggctac tcttgattat ctataaaaaa gctgaaaagt + 1801 ttactatttt tctgttggtg ttctctatcc ttgtcagctc tgtgtcgctc tttgcagtac + 1861 agcagtttgt tggactgacc aatcgtttaa atgcgacttc taattactca gaatattcaa + 1921 tcagtgtcgc tgttttagca gatagtgaga tcgaaaatgt tacgcaactg acgagtgtga + 1981 cagcaccgac tgggactgat aatgaaaata ttcaaaaact actagctgat atcaagtcaa + 2041 gtcagaatac cgatttgacg gtcaaccaga gttcgtctta cttggcaact tacaagagtt + 2101 tgattgcagg ggagactaag gccattgtcc taaatagtgt ctttgaaaat atcattgagt + 2161 cagagtatcc agactacgca tcgaagataa aaaagattta taccaaggga ttcactaaaa + 2221 aagtagaagc tcctaagacg tctaagaatc agtctttcaa tatctatgtt agtggaattg + 2281 acacctatgg tcctattagt tcggtgtcgc gatcagatgt caatatcctg atgactgtca + 2341 atagggatac gaagagaatc cttcttacaa caactcctcg agattcatat gttcctattg + 2401 ctgatggtgg aaataatcaa aaagataaat taacccatgc gggcatttat ggagttgatt + 2461 cgtccattca caccttagaa aatctctatg gagtggatat caattactat gtgcgattga + 2521 acttcacttc tttcttgaaa atgattgact tattgggagg ggtagatgtt cataatgatc + 2581 aagagttttc agctccacat gggaagttcc atttcccagt agggaatgtc catctagact + 2641 ctgagcaggc tctaggtttt gtacgtgaac gctactcact agccgatgga gaccgtgacc + 2701 gtggtcgcaa ccaacaaaag gtgattgtgg ctatccttca aaaattaacg tcaaccgaag + 2761 cactgaaaaa ttatagtacg atcattaata gcttgcaaga ttctatccaa acaaatatgc + 2821 cacttgagac tatgataaat ttggtcaatg ctcagttgga aagtggaggg aattataaag + 2881 taaattctca agatttaaaa gggacaggtc ggatggatct tccttcttat gcaatgccag + 2941 acagtaacct ctatgtgatg gaaatagatg atagcagttt agctgtagtt aaagcagcta + 3001 tacaggatgt gatggagggt agatgaaatg atagatatcc attcgcatat cgtttttgat + 3061 gtagatgacg gtcccaagtc aagagaggaa agcaaggctc tcttggaaga atcctacagg + 3121 cagggggtgc 
gaaccattgt ctctacctct caccgtcgca agggcatgtt tgaaactcca + 3181 gaagagaaga tagcagaaaa ctttcttcag gttcgggaaa ttgcaaaaga agtagcagat + 3241 gatttagtca tcgcttatgg agcagagata tactatactc tggatgctct agaaaagcta + 3301 gaaaaaaaag aaattcctac ccttaatgat agtcgttatg ctttgattga gtttagcatg + 3361 catacttcct atcgtcagat tcatacggga ttgagcaata ttttgatgtt gggaatcacg + 3421 ccagtaattg ctcatattga acgttatgat gctttagaga ataacgaaaa acgtgttcgt + 3481 gaactgattg atatggggtg ctatactcag ataaatagtc atcatatttc aaaacctaag + 3541 ttctttggtg aaaaatataa attcatgaaa aagagagctc ggtatttttt ggaacgtgat + 3601 ttagttcatg tagttgcaag tgacatgcac aatttagaca gcagacctcc atatatgcaa + 3661 caggcatatg atatcattgc taagaaatat ggagtgaaaa aagcgaaaga actttttgta + 3721 gataatccca gaaaaattat aatggatcaa ttaatttagg agaaaatatg aaggaacaaa + 3781 acactttgga aatcgatgta ttgcaactat tcagagcttt atggaaaaga aagttggtta + 3841 ttttattagt ggcaattata acttcttcag ttgcttttgt ctacagtact tttgttatca + 3901 aacctgagtt tactagtacg actcggattt atgtagttaa ccgtgatcag ggagagaagt + 3961 ctggtttaac caatcaagac ttgcaggcag gatcatactt ggttaaagac tatcgtgaaa + 4021 ttatcctatc gcaggatgtt ttggaggaag ttgtttctga tttgaaacta gatttgacgc + 4081 caaaaggttt ggctaataaa attaaagtaa cagtaccagt tgatacccgt attgtctctg + 4141 tttcagttaa tgatcgagtt cctgaagagg caagccgtat cgctaactct ttgagagaag + 4201 tagctgctca aaaaattatt agtattactc gtgtttctga tgtgacaaca ctggaggagg + 4261 caaggccggc gatatcaccg tcttcgccaa atattaaacg caatacacta attggttttt + 4321 tggcaggggt gattggaact agtgttatag ttcttcttct tgaacttttg gacactcgtg + 4381 tgaaacgtcc ggaagatatc gaagatacac tgcagatgac acttttggta gttgtaccaa + 4441 acttgagtaa gttgaaatag gagagaggaa tgccgacatt agaaatagca caaaaaaaac + 4501 tggagttcat taagaaggca gaagaatatt acaatgcctt gtgtacaaat atacagttga + 4561 gcggagataa actaaaagta atttccgtta cttctgttaa ccctggggaa ggaaaaacaa + 4621 ctacttccgt aaatatagca aggtcgtttg cgcgtgcagg ctataaaact cttttgctcg + 4681 atggcgatac tcgaaattca gttatatcag gattttttaa atctcgtgaa aaaattacag + 4741 ggctaacaga atttttatct gggacagctg 
atttatctca cggtttatgt gatacaaata + 4801 ctgaaaattt atttgtagtt caatcgggat ctgtatcacc aaaccctaca gccttgttac + 4861 aaagtaaaaa ttttaatgat atgattgaaa cgttgcgtaa atattttgac tatatcattg + 4921 ttgatacagc acctattgga attgttattg atgcggcaat tatcactcaa aagtgtgatg + 4981 cgtccatctt ggtaacagca acaggtgagg tgaataaacg tgatgtccaa aaagcgaaac + 5041 aacaattaga acaaacaggg aaactgttcc taggagttgt tttaaataaa ttggatatct + 5101 cggttgataa gtatggagtt tacggttcct atggaagtta tggtaaaaaa taatttagga + 5161 aaaattttat ggatgaaaaa ggattgaaaa tttttctggc agtattacag agtattattg + 5221 tcattttatt ggtttatttt cttagctttg ttagagaggc agaacttgaa cgttcttcga + 5281 tggttatact ataccttctc cacttttttg tattctattt tagttcctat ggtaacaatt + 5341 tttttaaaag agggtaccta gttgagttta atagtactat aagatatatt tttttctttg + 5401 caatagctat aagtgtatta aactttttta tagcggaacg gtttagtatc tctagaagag + 5461 gaatggtata cttcttaact ttagaaggaa tatccttata cttgttaaat ttcttagtaa + 5521 agaaatattg gaaacatgtg ttttttaatc taaaaaatag caagaaaatt ttactgttaa + 5581 cagtaacgaa aaatatggaa aaagttcttg ataaactgct agaatccgat gaactttcat + 5641 ggaagttggt agcagtaagt gttttggata aatctgattt tcaacatgat aaaatacctg + 5701 taattgaaaa ggaaaaaatt attgaatttg caacgcatga agttgtggat gaggtgtttg + 5761 tcaatcttcc aggagagagc tacgatattg gagaaattat ctctaggttt gagacaatgg + 5821 ggatagatgt aactgtaaat cttaaagcat ttgataagaa tttgggtcgc aataaacaaa + 5881 tttatgagat ggtaggattg aatgtagtca ctttctctac aaatttttat aaaactagtc + 5941 atgtgatttc aaagagaatt ctcgatattt gtggtgccac tattggcctt attctttttg + 6001 ctatagctag tctagtttta gttccattga ttcgtaaaga tggcggacca gctatttttg + 6061 ctcaaactcg tatagggaaa aatggtcgac attttacctt ttataaattc cgttcgatgc + 6121 ggagcgatgc tgaagctatc aaagaacagt tgatggatca aaatacgatg caaggtggta + 6181 tgtttaagat agacaacgat cctcgtgtta caaaaattgg tcgctttatt cgtaaaacca + 6241 gtttagatga gttaccccag ttttggaatg tctttatagg agatatgagt ttggtgggaa + 6301 cacgtccacc tacagtagac gagtatgttc agtatactcc agaacagaaa cgtcgactca + 6361 gctttaaacc tggtattaca ggtttatggc aggttagcgg ccgtagtaaa 
ataaccgatt + 6421 ttgacgatgt tgtaaaatta gatgtggctt atattgataa ttggacaatc tggaaagata + 6481 ttgaaatatt gttaaagacc gtcaaagtgg tatttatgag agaaggggcg aagtgatttc + 6541 tgccctcaac ctgttaggag agaaatgaaa cagtcagttt atattattgg ttcaaagggg + 6601 attcctgcta agtatggagg atttgaaacc tttgttgaaa aattaaccga atatcaaaaa + 6661 gacagcaaca tacaatacta tgttgcttgt atgcgtgaaa attcagctaa atctggcatc + 6721 atggatgatc agtttgagca caatggagcc atttgtttca acatcgatgt acccaatatt + 6781 ggaccagctc gtgccatcgc ttacgatatt gcagcggtca acaaagctat tgaattggct + 6841 aagaaaaata aggacgaagc tcccattttt tacattctag cttgtcgcat tggtcctttt + 6901 atttctgggc ttaagaaaaa aattcgtgcc atcggaggcc ggttgttggt aaatcctgat + 6961 ggtcatgaat ggttgcgagc aaagtggagt ttaccagttc gtaagtattg gaaattttca + 7021 gagcagctca tggtcaaaca tgcagattta ctggtctgtg acagtaaaaa cattgaaaaa + 7081 tatatccaag aggattataa gcagtaccaa ccaaagacca cctatattgc ctatggaacg + 7141 gatactactc cttcaatcct gaaagcagaa gatgccaaag ttcgggattg gtatcaggaa + 7201 aaaggagtta gcgaaaatgg ctattatcta gtggtgggga gattcgttcc tgaaaataac + 7261 tacgaagcaa tgattcgtga atttatcaag tccaagtcca agaaggactt tgtcctcatc + 7321 acaaatgtgg agcagaataa attttacgac cagttgttac aggatactgg ttttgataaa + 7381 gatcctaggg ttaaatttgt tgggactgtc tatgaccaag agttgctcaa gtacatccgt + 7441 gagtatgcct ttgcctattt ccatgggcat gaggttggag ggaccaaccc ttctctattg + 7501 gaagccctag catccacaaa actgaatttg ttgctagatg ttggctttaa ccgtgaggtt + 7561 ggtgaagacg gggccattta ttggaaaaaa gatgagttgg ctcgtgtcat tgaggaagta + 7621 gaaggatttg atcaggcagc aataactgac ttggatttca agtcaagcca aagaatcctc + 7681 tcagctttca catgggaaaa gattgtgtca gattatgaag aagtgtttaa aggataggga + 7741 atgaaacgga ttttatactt gcatgctggt gcagaaatgt atggagcaga taaggtttta + 7801 ttggaattga tcaaaggatt ggattccaaa gaatttgaag ctcatgtcat cctgccaaat + 7861 gatggtgttt tagtcaaggc cttgcgtcaa gttggggctc aggtcagtgt gttggattat + 7921 ccgattttac gtagaaaata ctttaatcct aaggggattt tagaatatct gaaatcctat + 7981 cggcgctact ctcaaaaaat ttcccaatat gtgcgtgaga atgggataga tcttgttcat + 8041 aacaatacga 
cagccgttct ggaaggaatc tatctcaaga gaaaagtaaa actcccctta + 8101 atctggcatg ttcatgagat tattgtcaag cccaaggcta tttcagattt tatcaacttt + 8161 ttgatggggc gatatgcaga taagatcgta acagtatctc aagctgtttc cagccatgtc + 8221 aaacaatctc cttttatcaa agaaggtcag gtacaggttg tatataacgg agtggacaat + 8281 gctgtctatc atcccatgca agcaagcaca gtgcgtgaac aatttgctat tccagaagaa + 8341 tctcttgtca ttggtatggt aggccgcgtc aacgcttgga agggacaggg agattttcta + 8401 gaagcagtgg cgccgatttt ggagcagaat cccaattcta tcgcttttct ggcaggaagt + 8461 gcctttgcgg gagaagagtg gcgagttgaa gaactcgaat ctacgattgc caaatcaagt + 8521 gtagcctcac aaatcaaacg aattgactat tatgagcata cgactgagct ttataatatg + 8581 tttgatatct ttgtcttgcc aagcaccaat cccgatcccc taccgacagt ggtactagag + 8641 gcgatggcat gtggcaaacc agtagttggc tatcggcatg gtggtgtctg tgaaatgatt + 8701 aaggagggca aaaacggtct cctagccact ccaaataagc ctgcagaatt gtctaaggct + 8761 attcaagaat tggctgacaa tatcgagaaa agagaacagt taggaagtgc atctttccaa + 8821 cgtcaaaaag aattcttttc gttggaaagt tatattcgga atttctcaga gctatataaa + 8881 aaatactaag atgaatacta agatgaatac taagatgaat actaagatga atactgaaac + 8941 aattaagaat aaattaaaac caatcgttta tccaattatc aattttatcc ctagacgaag + 9001 actcaagaat aaaaatttta caatcatttg cgacaattgt tgggcaggaa aagtctatca + 9061 ggaattgggc ttgccttatc aaactccatt tgtaggtatg tttgtctttt ctcctgacta + 9121 catcaaaatg ctcaagaatt taaaacacta tttgagtgga aatatccctt tgacatttgt + 9181 taaggaatca aaatatgtca aagactttga taatgcctat cccctggctc ttttagacga + 9241 tatcgaattg catttcttac attatgcaga tgaggaagaa gcaactcaaa aatggaaccg + 9301 tcgtttagaa agaattcatt gggataattt gtatttcaag ttcaatgata atgatgcctg + 9361 tacttatgaa ttgatgaaag agtttgaaga acttccgtac aagagtaagg ttatcttctc + 9421 ttcgagaaat tacagtggtt taccttcctt agttcatttc aaatcagctg aaaagcaagg + 9481 acacgttggg attgatttga aaacttatca ccgctatttt aattgtgtta cttggttgaa + 9541 taagggtggg gaggatttaa ctaaatgaaa aaaataagaa ttattattcc ttattttggg + 9601 aaactaccaa ccttttttcc ttatttttta ttaactgcta aacgtaatca aaaaattgat + 9661 ttcttagttt atacggatca aaaggtggat 
gaattcgcta tgttaaatgc taaaaatata + 9721 gaatttgtaa ctctttcttt tgatgagtta agagaaaaag ttcagtctaa gtttgatttt + 9781 aaaatctctc tcaaaacacc ttataaattt tgtgactata gacctgctta tgggcttatc + 9841 tttgaagaag aattaaaggg ttatgattac tggggttttt gtgacacaga tgtcttacta + 9901 ggtgatattt atcaatttct tgaagagcat agcttttttg agaacgacta tgctcgatat + 9961 ggtctttttg gtcatcttca aatttttaag aatttaagag aagttaatca tatttttatg + 10021 tctgggcaag gttcagacta tcgattagat tatcacaatg tctatactag tgaacaaagt + 10081 tttatttttg atgaatcaga aggtatccaa aagctttttg aaaaatgtca tttcaaacaa + 10141 ctgcaagata agttttttga tgatattgat attagtcatt tctcatttcg ggaatatggc + 10201 gaaaataaat cgaaacgcta ttatttttgg tctgaagaaa atggtttgga atcaataaat + 10261 ttaatcaatg atgatatagt ggttaagcgt cctctatacg cacatttcca aaagagaatg + 10321 attaaatgcc ctgactttaa actagtcgat tcattttatg ttataccaaa tcaattagtt + 10381 attggagaga aaatttctaa gcaagagcta gtagaggtga caagaaataa attctattgg + 10441 gaatatgtta aatcaacaat gttaaagaaa ttaaaaaaag aaaaatggac atttgaattt + 10501 attcgtcata aattaaggat gaaatgagct tagtattatg gcttttccta ttgattttgt + 10561 tgtatgctga attgacgaac acgatcctga ttggagggct aaaaatagca agtatgactc + 10621 tgcttttaca acatctgaaa ataatacgaa tttcgatgaa gcatactgtt agtggagaac + 10681 gtttaagttt tggttagaga gatagaaaaa tttgctcctt gggtgaataa agtttatctt + 10741 gttacagaaa atcaaaaacc ggtctggttg actattaata gtgataagtt atattaattg + 10801 aacatttggg atgatttgta tttcaagttc aataataatg atatttgtac ttatgaattg + 10861 atgaaagaat ttgaagagct tccatacaag agtaaggtta tcttctcttc aaaaaattac + 10921 agtgacctac cttccttgat tcattttaaa tcagccgaga agtaagcgca tgttggaatt + 10981 gatttgaaaa cttatcaccg ctattttgat gttgttagtt ggataaacca agatagtgta + 11041 tagttcacta aataattaaa tacagattat ttcaatgttt ctataagttc aaaatttaat + 11101 tagaaactat agaggaatcc atctttaaga ttattattta taagtgagca atattaactg + 11161 gagtcaatga tttaacagaa aattcaggtg ctagtcagtc attgattatg tttatgaata + 11221 taataatgaa aggaatttct aattttacaa gaattgaatc ttgtatcgaa atacattagt + 11281 tctataaaaa tgaattaatt aaaaaattag 
agatttacac aatatcagtt ctactaagat + 11341 tatgcaataa aaagtttcta aaaaattatt tactaagtga aggatgatat gattatacaa + 11401 aatatattgc taacaattgt aataccagta tataatgttg aaaaatattt gaaacgttgt + 11461 attgatagcg tcatttctca ggaatgggat aaatatgaag ttattctagt aaatgatggc + 11521 agtacagatg cttcacccaa tatttgtgaa gagtatgccc agaagtatca ttttatttct + 11581 gttattcata aggaaaatgg tggactatca gagactcgta atacaggtct ttctcatgcg + 11641 aatggaaaat acgtattttt tcttgattct gatgattgga ttacaaaaga tatgtttcga + 11701 aatttaagta aaatgattat ggaacaaaat tatgatattt tgcaattcgg aatgcaaatg + 11761 tttcattctg aaagagaaga gttgaaaaat gtacaatgca aagaaaaaaa ctttaattct + 11821 tcagatgcat ttaaaaacat gttaagtgtt gaagggatta caagttttgc tacagacaaa + 11881 atatataaaa gagaattgtt tgagaagaac ggaatagagt ttcctatagg atatttttac + 11941 gaagatttag gaacggttta taaattaatt ttatctgcta aaaaaattta tttaacaaca + 12001 caagtgtatt attgttattt tattgggaat gatgcggcta ttaccaaaca gtggtctgaa + 12061 aaaaaaatta gtgatgtgta taaatttcat aaaaaaattt ttaatgtttc atctcttatg + 12121 gtttcagatg acatcttcct gtctaaatcc tattataata atggtctggt ttatctttta + 12181 atgaaattgt atgaagaaaa tcaggaagac actcaacttt ttaggttgat acttgcagaa + 12241 ctggatgcaa acatagttcc tataaaatat ttgcgaaatt atcctaattt tttgaaatat + 12301 gtattttatc gcattcgatt attgaaatta attgtaatat tgaaattaac tttaacaaaa + 12361 ataaaaaaat ggaatcaaaa aaaacattaa taatatttga acaaatagat acatttgaac + 12421 aatttttaga acgtaatata atttttaata atgtagacat atttacaccg tacaaaaaag + 12481 tttcgaatgt ttttatgcac aattttagag caattgcaaa acgattaccc ggatttttat + 12541 tccataattg gtggttagaa gaatggtcta gaaaattacc ggattatact aatatagtag + 12601 tatttgacaa tgctatttcc cttaaattat tagagtatat agatgcacat aagactcgta + 12661 gttcaaagtt gaaattatgg ttatggaatg ttccgaataa gcaagtgaat tatttgaatt + 12721 cgaattatga tgtttattgc tttgataaga catattctga aaactataat ttaaaatttg + 12781 tagaacaatt ctatgtatta ggttcgacta agaaaagaga tatattggat attgagtatg + 12841 atttttattt tattggtgca gataaaggaa gattgccaaa attaaaaagc ttagctaagc + 12901 agatagtttt aaataattat agttatcgat 
ttgacgtttt tagtgtaaaa aaacagtatt + 12961 tcgattctga gtttgaggga attcaagtta tagatacatt actcccttat gatgaagtct + 13021 tggataacat actagcttcg aatgttattg ttgagttaaa taaaaaggga caggatggtc + 13081 taacccttag agcaatggaa tccatttttt ataaaaaaaa attaataaca aataataaaa + 13141 aaattattaa ctatgatttt tatcacccaa ataatatttt agtttgggag gaaggaaaag + 13201 atatcaaatt agatgagttt attcaaaagc catatgttca attagaaaaa gatattattg + 13261 accgttattc ttttagtaat tggttaagta aaattacaga aatttaggag ttaaatatga + 13321 gaataacttt ttgtctacct gagataagca ctgttcctac gggaggatat aaaattattt + 13381 ttgagtacgc aaataggttg tctgaacgag gtcatgagat aacccttgtt tttttaacca + 13441 ataatgtatg gaacagagtt actaagaatt gtaaaatcaa atcaattgta ggcaatatac + 13501 gtggcaaaaa aaatccaagt tggtttaaac tgaaaccaac tattcgtaaa ataatgactc + 13561 cttatttaga tgggagagat tttcctgaag cagattttat atttgctact gcggttacaa + 13621 ctgctaatat tgtaaaagaa atgccagaaa aatatgggaa aaaatgttac ctaatccaag + 13681 gttttgaaac atggcttctt ccagaaagta aagttattga aacttataat tatggattcc + 13741 ttaatattac agtatctaag tggttatgtg acatagtcca atcttataca gagactccag + 13801 ttttttgtgt atctaatccg attgatacag aaatttttta tttgctaaat cctatagaga + 13861 aacgaaaccc atttcatcta ggtatgttat atcatgaagg agagcataaa ggaatctctt + 13921 atgcgataga tgcaattaag aaagttaaga aaatttatcc ggaaatagag gttaatattt + 13981 ttggagttcc tagtagacca gtatttttac cagaatattt taattatact caacaagcta + 14041 cacaacagga attacaaaag atatacaacg atacgtctat ttttttgtgt gcaacaattg + 14101 atgaaggctt tggtttgaca ggagcagaga gtatggcttg tggctgtgcg ttagtctcaa + 14161 cagcctatag tggtgtattt gaatatgcaa ttgatggcga gaatgcactt ttatctccga + 14221 taaaagatag tgttagtttg gcaacaaaca taataaaatt gattagaaat catgatttgc + 14281 gcttatccat agcaacgcaa gcaactaaag atatgaaaaa gagaggatgg gagaaaacta + 14341 ctttaaaatt agaaaatatt ttaagtgaat ttactaattt ttaaagatgt tttaatatca + 14401 atgattataa aactagataa acaaaaatgt tattttatta tgttactttt attgatgtgc + 14461 gtagtacagt tgactgcaag tgtttcaatg ggagtaataa gtatagctct aacagtatta + 14521 ccaatattgt ggaatttaaa taatccatcc 
aaattattat tttcacagat tctttatttg + 14581 tttcagttcc aattctatgt aagttattta tcatttccgt taggaatttc ctttatctgt + 14641 gatattatta atttattttt gttattcaat atttttaaag attccaaact attacagtgg + 14701 gaattacgga atattaattt aaaaacaatt atttttgttt gggtcttgtt ttttttgata + 14761 ggtatttttt caaatttttt gtatgattta aatattgcgc ttattgtatg gtccctccgt + 14821 aattatataa gatttatcat ttttttcatt tcttgttgtt tgtatattga taaatacagt + 14881 ataaatctag gtgaatactt aataaagcta ttctattggt ttaatatatt ttttacctcg + 14941 ttccaatatt ttgtgctttt aaaatcagga gattttcttg gaggaatttt tggaaacgaa + 15001 ttgggaattt ctaataccta cttgcatatt cttttaattc tcatcttgat attatctgtt + 15061 gttaattatg tatcagataa ttcgagttta gttattttaa caagttatat cgtttcaact + 15121 ctatacgtag ctgctttgtc agagttaaag attatttttg tggaattacc tattattatt + 15181 attttgactt tactatttaa aagattagga ataaaaatac tgcttaaaat aatatctatc + 15241 acttgcatag tggtggtcgc tttggcaatc tcaattccta ttttatatga attattccct + 15301 atatttgaca atttttttaa attagaaaaa ttatttggct attcaacagg aaactattca + 15361 actagttctg attttggtcg gttaagttca attgttcaaa taatctcaac tattttttat + 15421 ggagatgttt ggcagacttt atttggtatt ggtttaggag aggcggaaat ttcaaaaatt + 15481 ccgatattta gtggttcctt ttattataat tacgaataca cccattacta tctgttcact + 15541 ttatcatatg tttttattga gaatggattt ataggattgt tcctattcat gtttatgcca + 15601 atttaccttg ctttaaagat gatttttgag cgagggacat ctaaatatga tcttcttctg + 15661 atagtattat ctatttcttt atttatgctc ttgttgtata ataatacaat gaggtcagag + 15721 atatattatc tttatttatt tgttctttca tggggagttg caatcaatag aggaaatggg + 15781 ggatgttatg aaaacaataa aaaattatgc ttataaatct ttttatcaac tatttttgat + 15841 aatagtacct tttataacaa tcccatatgt ttctagaatt ttaggagcag agttaatagg + 15901 gataaattct tatacaaaca ctataataag ttattttgtg ttaatagcaa atcttgggat + 15961 tttgatatat ggtaatagaa ccatagcata tcatagagaa agtattgagg agcgtagtaa + 16021 aaaattttgg gaaattgtct caattaagtt gctggtagca attgttgcct atgtcatatt + 16081 tattatattt ttattctttt attcaaaata tagttgggtt tttgtgattc aatctgtaca + 16141 aattatagct acggcatttg atatatcttg 
gctttttgat ggtgtagaag attttaaacg + 16201 tacagtagtg agaaattttc tggttaaaat aatttccatt attctaattt ttacttttgt + 16261 caagtctaca gaggactttg acaaatacat atggataaca gtaggctcta ctttaatggg + 16321 taatttgaca ttatggagtt atttacacca ttatattatt aaaattccga taaaaagcct + 16381 taagttgagt gaacacttag ttcccatttt gactttattc ataccacaaa ttgcttctat + 16441 tgtatttatg tcaatcaata aaattttact aggtaatatt tcgacgatat cgcaagcagg + 16501 ctactttgag aatgcggata aggtgattag aattcttctg gctttagtat catctattgg + 16561 agtagttgtt tttcctaaag ttgctcatgc gtataggagt ggtgatatga agagagtatt + 16621 agggttgact tatatgactt ttgatgcagt taatattata actattccaa ttgtagttgg + 16681 aatagtttct attagcccta cattctcttc tatttttttt gggacggaat tccaaggaat + 16741 agataaggtt ctgtctgttc tagtattgga gttaattttc atgggatata cttcggtttt + 16801 aggtagtcaa tatctcattg taacagggca aacttacttt ttaagtatct cggtgttcct + 16861 aggaatattt tctacagtga tatcttcttt ctttttcatt ccgatatacg gagcgcttgg + 16921 aagtgcgatt tcatctgtaa ttggagaagc atctattatg attggtgaaa tttacttgtt + 16981 aaggaatcaa gttgatttct attatctata tagggatgta ccgaaataca tgattgctag + 17041 cgctgttatg tatattagta tctcgtcatt gaattatttt atttcttcgc catttgtatc + 17101 tttgctatca agtattgcta tgggtgcagt gacttatgtt actgttgtct tattactatg + 17161 cccaagaata gtaataaaat tattaaataa aaacacaaga tttttttgaa atgatatata + 17221 aaatcgtaac aaaaatccaa ttacaattca tgacttttta ctaattataa atttgcgatt + 17281 catctaatta aaattgaatt atagataatg aaaatttaga aaggtggccc cattatgaaa + 17341 ggtattattc ttgcaggtgg ttcgggaacg cgcctgtacc cacttactcg agctgcgtca + 17401 aaacagctga tgccggttta tgacaaaccc atgatttatt atcctttgtc aaccctaatg + 17461 ttggctggaa tcaaggatat tttgattatc tcaacaccac aggatttgcc ccgttttaag + 17521 gacctgctct tggatggttc cgaatttggg attaagcttt cctatgcgga acaacctagt + 17581 cccgatggac ttgctcaggc ttttcttatc ggtgaagaat ttatcggtga cgatagcgtt + 17641 gcgctgatct taggtgacaa tatctatcac ggttctggtt tgagcaaaat gcttcaaaaa + 17701 gcagccaaga aagagaaagg tgcgactgtc tttggctacc atgtcaagga tccagaacgc + 17761 tttggtgttg tagaatttga tgaaaatatg 
aatgctatct ccatcgaaga aaaaccagaa + 17821 cagccgcgct ctaactatgc agtgacagga ctgtatttct atgataacga tgttgtcgaa + 17881 attgccaaga gtatcaaacc aagtcctcgc ggagaattag aaatcacaga tgtcaacaag + 17941 gcttacttgg atcgtggaga tttatcagtt gagcttatgg gacgtggctt tgcttggctg + 18001 gatactggaa ctcatgaaag tttactagag gcttcacagt acatcgaaac agtgcaacgg + 18061 atgcaaaatg ttcaggtagc aaacttagaa gaaattgcct atcgcatggg ttatatcagt + 18121 cgtgaagatg tattgacctt agcccaacca cttaagaaaa atgaatacgg acagtatctg + 18181 ctccgtttga ttggagaagc atagatgaca gataattttt tcggtaagac gcttgcggca + 18241 cgcaaggttg aagctattcc aggcatgttg gagtttgata tccccgttca tggagataat + 18301 cgtggctggt ttaaagaaaa tttccaaaag gaaaaaatgc ttccacttgg atttccagag + 18361 tctttctttg cagaaggaaa attgcaaaac aatgtatcct tctcacgtaa aaatgtcctt + 18421 cgaggcctcc acgcagagcc ttgggataag tacatctctg tagcagatgg agggaaagtt + 18481 ctgggttctt gggttgatct acgcgagggt gaaacctttg ggaataccta tcagacagta + 18541 attgatgcaa gcaagggaat ctttgttcct cgaggcgtag ctaatggctt ccaagttcta + 18601 tcagatacag tgtcatatag ctatctggtc aatgattact gggctctcga gctcaaaccc + 18661 aagtatgcct ttgtgaacta cgctgatcca agccttggta ttgaatggga aaatattgca + 18721 gaagcagagg tttcagaagc agataaacat catcccctac ttaaggatgt aaaacctttg + 18781 aaaaaagaag atttgtaaaa aggaaagaat atgactgaat acaaaaatat tatcgtgaca + 18841 ggtggagctg gctttatcgg ttctaacttt gtccattatg tttacgagaa ctttccaggt + 18901 gttcacgtga cagtcctaga taagttgact tatgctggaa atcgcgcgaa tattgaggaa + 18961 attttaggta atcgtgttga gttagttgtt ggtgacattg ctgatgcgga gttggtagac + 19021 aagttggctg ctcaagcaga tgctatcgtt cattatgcag cggaaagcca caatgataat + 19081 tcgctcaatg atccatcgcc atttattcat actaacttca tcggaaccta tactctttta + 19141 gaagctgctc gtaagtatga tattcgcttc caccatgtat cgacagatga agtttatggg + 19201 gatctccctt tacgcgaaga tttgccaggt catggtgaag gaccaggtga gaaatttact + 19261 gctgaaacca agtacaatcc aagctcgcct tactcatcaa ccaaggcagc ctcagatttg + 19321 attgtcaaag cctgggtccg ttcttttgga gtcaaggcaa cgatttccaa ctgttcaaat + 19381 aactacggtc cttatcaaca tatcgaaaaa 
ttcatcccac gtcagattac taacatccta + 19441 agtggaatta agccaaaact ttacggtgaa ggtaagaacg ttcgtgactg gattcatacc + 19501 aatgaccatt cttcaggagt ttggacaatc ttgacaaaag ggcaaattgg tgaaacctac + 19561 ttgattgggg ctgatggtga gaagaacaat aaggaagttt tggaacttat ccttaaggaa + 19621 atgggacaag ctgcggatgc ctatgatcat gtgactgacc gtgcaggaca tgaccttcgc + 19681 tatgcgattg atgctagcaa gctccgtgat gagttggggt ggaaacctga atttaccaac + 19741 tttgaagctg ggctcaaggc aacaatcaag tggtatacag ataaccaaga atggtggaaa + 19801 gcagaaaaag aagctgttga agccaattat gctaagactc aggagattat tacagtataa + 19861 aaagcaggaa atagctgctt tttattgcta tattgggaag agttacatat tagaaaggtc + 19921 tagagatgat tttaattaca ggggcaaatg gccaattagg aacggaactt cgctatttat + 19981 tggatgaacg taatgaagaa tacgtggcag tagatgtggc tgagatggac attaccgatg + 20041 cagaaatggt tgagaaagtt tttgaagagg tgaaaccgac tttagtctac cactgtgcag + 20101 cctacaccgc tgttgatgca gcagaggatg aaggaaaaga gttggacttc gccatcaatg + 20161 tgacggggac aaaaaatgtc gcaaaagcat ctgaaaagca tggtgcaact ctagtttata + 20221 tttctacgga ctatgtcttt gacggtaaga aaccagttgg acaagagtgg gaagttgatg + 20281 accgaccaga tccacagaca gaatatggcc gtactaagcg tatgggggaa gagttagttg + 20341 agaagcatgt gtctaatttc tatattatcc gtactgcctg ggtatttgga aattatggca + 20401 aaaacttcgt ttttaccatg caaaatcttg cgaaaactca taagacttta acagttgtaa + 20461 atgaccagta cggtcgtccg acttggactc gtaccttggc tgagttcatg acctacctag + 20521 ctgaaaatcg taaggaattt ggttattatc atttgtcaaa tgatgcgaca gaagacacaa + 20581 catggtatga ttttgcagtt gaaattttga aagatacaga tgtcgaagtc aatccagtag + 20641 attccagtca atttccagcc aaagctaaac gtccgctaaa ctcaacgatg agcctggcca + 20701 aagccaaagc tactggattt gttattccaa cttggcaaga tgcattgcaa gaattttaca + 20761 aacaagaagt gagataagta gtagaatgat tttctagtct aataaaagag gcagataatg + 20821 aactccaaag gagcttaaga tgtacgatta tcttgttgtt ggtgctggtc tctttggcgc + 20881 agtctttgcc catgaagtag ccttaaaagg aaaaaagtaa aagtcattga aaaacggaat + 20941 catatcgtgg gtaatatcta tactcgtgaa gaggaaggaa ttcaagttca tcaatatggt + 21001 gctcatatct tccatacttc tgataaggag 
atctgggatt atgtaaatca gtttgcaggg + 21061 tttaaccgtt acaccaattc tcctgttgca aactataagg gtgagattta taaccttcct + 21121 tttaatatga atactttcaa taaactctgg ggagttgtaa cgccagcaga agcacaagct + 21181 aagattgagg aacaacgtgc tattttaaat ggtaaaactc ctgaaaattt ggaagaacag + 21241 gcgatttctc ttgtaggtac agacatctac gaaaaattaa tcaaagacta tacagagaaa + 21301 cagtggggca aaccaactac tgaacttcca tcctttatta ttcgccgttt accagtacac + 21361 ctgacctatg ataacaacta ttttaacgat acctatcaag ggattccaat tggtggatac + 21421 actcaaatag ttgaaaaatg tggatcatga aaatattgat gtagaaacaa atgttgattt + 21481 ctttgtgaac aaagagcaat atctgaaaga ttttcctaag attgtcttta ctggtatgat + 21541 tgatgaattc tttgactata agttgggcga actagagtac cgtagtcttc gttttgaaaa + 21601 tgagaccttg gatatggaaa attaccaagg aaatgcagtt gtgaactata cggatgcaga + 21661 aaccccatat actcgcatta ttgaacacaa acattttgag tttgggagtc aagcaaagac + 21721 tatcattacc aaagaacatt ctaaaacatg ggaaaaaggt gatgagcctt attatccagt + 21781 taataatgat cgtaataatc atttgtataa atcatataaa aaacttgctg atgagcaagg + 21841 gaatgttatc tttggtggcc gcttaggaca ctatcgttat tacgatatgc accaagtaat + 21901 tggagcagct ttgcagtgcg tgagaaatga gttagattca tactcaatga aaatcaaaga + 21961 gcaaactagg aagctagcca caggttgctc aaaacactgt tttgaggttg cagatgaaag + 22021 ctgacgcggt ttgaagagat tttcgaagag tataaacaag taaaactgac taccagttat + 22081 tatttagaaa tagtattaaa aattccggct ctttgtcaac tgtagtgggt tgaaaaaaag + 22141 ctaagctcga gaaaggacaa atttcgtcct ttcttttttg atattcaggg cgataaaaat + 22201 ccgttttttg aagttttcaa agttccgaaa accaaaggca ttgcgcttta taagtttgat + 22261 gagattattg gtcgcttcca atttggcgtt tgaatagggt agttgaaggg cgttgacgat + 22321 tttctctttg tcctttagaa aggttttaaa gacagtctga aaaataggat gaacctgctt + 22381 aagattgtcc tcaataagtc cgaaaaattt ctctggttcc ttattctgaa agtgaaacag + 22441 caagagttga tagagctgat agtgatgttt caacccaaat cattcatacc tctctcaact + 22501 agatgtaact tacaaaaccc ctgacctcat gagccacttt cttcctcctc atgaggtcag + 22561 ttttactttc tgctgttcca gtatcgtttt tcctcgctag atttcctcaa aagggcagac + 22621 tcctcccttg gttcgtcaca cgattttttc 
atctcgactg ttctttaatc cccaattatt + 22681 caccccaaat ctaaaaacca tccagaatcc ttgccttagc ttagatcctg gatggttttt + 22741 agatttgggg tgaataattg gggttcaagt cttgtgaata gctcaaaagc ttgtctaaaa + 22801 tctctttatt ggttaaatgc atacgaaaag taggacgata aaatcgctta tcactcagtt + 22861 tacggctatc ctgttgtatg agcttccagt agcgcttgat agccttgtat tcatgggatt + 22921 ttcgatgaaa ctgattcatg atttgaacac gcacacgact catagcacgg ctaagatgtt + 22981 gtacaatgtg aaagcgatcc aacacgattt tagcatacgg gaaaagttgt ctagctaagt + 23041 catagtaagg gctaaacata tccatagtaa taattttgac gcgacatcgg acagctctat + 23101 cgtagcgaag aaagtgattt cgaatgatag cttgtgttct tccctcaaga acagtgatga + 23161 tattgagatt gttaaaatct tgcgcaatga agctcatctt tccctttgta aaagcatact + 23221 catcccaaga cataatctca ggaagacaag aaaaatcatg tttaaagtga aaatcattga + 23281 gcttacgaat aacagttgaa gttgagatgg aaagctgatg ggcaatatca gtcatagaaa + 23341 tcttttcaat taacttttga gcaatctttt ggttgatgat acgagggatt tggtgatttt + 23401 tcttgacgag ggaagtctca gcgaccgcta tttttgagca ctgatagcac ttgaagcgac + 23461 gctttctaag gagaattcta gtaggcatac cagtcgtttc aagataagga attttagaag + 23521 gtttttgaaa gtcatatttc ttcaattggt ttccgcactc agggcaagat ggagcctcat + 23581 aatccagctt agcgataatt tctttgtggg tatccatatt gatgatatct agaatcttga + 23641 tgtttgggtc tttaatgtct agtaattttg tgataaaatg taattgttcc atatgattct + 23701 ttctaatgag ttgttttgtc gcttttcatt atagatctta tgggactttt ttctgcacaa + 23761 aaataggctc cataatatcc ataggggatt tacccactac aaatattata gagccaaaat + 23821 tccttgacta tgtgatatag ttgagggatt tttaaatgat attcatattt tttgcaaaga + 23881 tgttgtttga aaaataattt tcaaaaattc tgaaaattct gttgacatct ttctgaaaag + 23941 agtctataat ggagagaaag ttttaaagga gaaaatgatg aaaagttcaa aactatttgc + 24001 ccttgcgggc gtgacattat tggcggcgac tactttagct gcatgctctg gatcaggttc + 24061 aagcactaaa ggtgagaaga cattctcata catttatgaa acagaccctg ataacctcaa + 24121 ctatttg +// + diff --git a/public/res/serotype_genbank/serotype_8.gb b/public/res/serotype_genbank/serotype_8.gb new file mode 100644 index 0000000..6b2f8b3 --- /dev/null +++ 
b/public/res/serotype_genbank/serotype_8.gb @@ -0,0 +1,708 @@ +LOCUS CR931644 13844 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 573/62 (serotype 8). +ACCESSION CR931644 +VERSION CR931644.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 13844) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 13844) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..13844 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="573/62" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC08_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC08_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI32944.1" + /db_xref="UniProtKB/TrEMBL:Q4JZI8" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVELL" + gene 293..458 + /gene="aliB" + /locus_tag="SPC08_0002" + /pseudo + CDS 293..458 + /gene="aliB" + /locus_tag="SPC08_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(459..1334) + /gene="tnp" + /locus_tag="SPC08_0003" + /pseudo + CDS complement(459..1334) + /gene="tnp" + /locus_tag="SPC08_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature complement(945..1316) + /gene="tnp" + /locus_tag="SPC08_0003" + /note="HMMPfam hit to PF01710, Transposase, score 3.1e-23" + /pseudo + gene 1568..3013 + /gene="wzg" + /locus_tag="SPC08_0004" + CDS 1568..3013 + /gene="wzg" + /locus_tag="SPC08_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI32947.1" + /db_xref="GOA:Q4K2P0" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K2P0" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSLSVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VDQSSSYLVAYKSLIAGETKAIVLNSVFENIIELEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTSRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVLLNFTSFLKMIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EVLKNYSTIINSLQDSIQTNMPIETMIDLVNTQLESGGNYKVNFQDLKGTGRMDLPSY + 
AMPDSNLYMMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1568..1684 + /gene="wzg" + /locus_tag="SPC08_0004" + /note="Signal peptide predicted for SPC0263 by SignalP 2.0 + HMM (Signal peptide probability 0.999) with cleavage site + probability 0.540 between residues 39 and 40" + misc_feature 1772..2119 + /gene="wzg" + /locus_tag="SPC08_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 3.1e-62" + misc_feature 2297..2740 + /gene="wzg" + /locus_tag="SPC08_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 2.3e-67" + gene 3015..3746 + /gene="wzh" + /locus_tag="SPC08_0005" + CDS 3015..3746 + /gene="wzh" + /locus_tag="SPC08_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI32948.1" + /db_xref="GOA:Q9AHA6" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q9AHA6" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAESFLQVREIAKEVADDLVIAYGAEIYYTPDVLDKLGKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGITPVIAHIERYDALGNNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEQNLVHVIASDMHNLDGRPPHMAEAYDFVT + QKYGEAKAQELFIDNPRKIIMDQLI" + misc_feature 3018..3626 + /gene="wzh" + /locus_tag="SPC08_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 2.7e-36" + gene 3752..4447 + /gene="wzd" + /locus_tag="SPC08_0006" + CDS 3752..4447 + /gene="wzd" + /locus_tag="SPC08_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI32949.1" + /db_xref="GOA:Q9AHA5" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q9AHA5" + /translation="MMKEQNTIEIDVFQLFKTLWKRKLMILLVALVTGAGAFAYSTFI + VKPEYTSTTRIYVVNRNQGDKSGLTNQDLQAGSYLVKDYREIILSQDALEKVATNLKL + DMPAKTLASKVQVTVPTDTRIVSISVKDKQPEEASRIANSLREVAVERIVAVTRVSDV + 
TTLEEARPATTPSSPNVRRNSLFGFLGGAVVTVIAVLLIELFDTRVKRPEDVEDVLQI + PLLGLVPDLDKMK" + misc_feature 3752..3868 + /gene="wzd" + /locus_tag="SPC08_0006" + /note="Signal peptide predicted for SPC0265 by SignalP 2.0 + HMM (Signal peptide probability 0.721) with cleavage site + probability 0.467 between residues 39 and 40" + misc_feature 3773..4189 + /gene="wzd" + /locus_tag="SPC08_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 1e-55" + misc_feature 4295..4372 + /gene="wzd" + /locus_tag="SPC08_0006" + /note="PS00217 Sugar transport proteins signature 2." + gene 4457..5146 + /gene="wze" + /locus_tag="SPC08_0007" + CDS 4457..5146 + /gene="wze" + /locus_tag="SPC08_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI32950.1" + /db_xref="GOA:Q9AHA4" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q9AHA4" + /translation="MPTLEISQAKLDFVKKAEEYYNSLCMNLQLSGDGLKVFSITSVK + LGEGKSTTSTNIAWAFARAGYKTLLIDGDIRNSVMLGVFKARDKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRKCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGVVLNKFDTSVNKYGSY + GNYGDYGKNKK" + gene 5161..6528 + /gene="wchA" + /locus_tag="SPC08_0008" + CDS 5161..6528 + /gene="wchA" + /locus_tag="SPC08_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI32951.1" + /db_xref="GOA:Q4K2N6" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K2N6" + /translation="MNGKVVNSSLAIIHSFLVILLTYLLSAVREAEIASATAIALYIL + HYFVFYISDYGQDFFKRGYLIELVQTLKYILFFALAISISNFFLEDRFSISRRGMIYF + LTLHALLVYVLNLFIKWYWKRAYPNFKGSKKILLLTATSRVEKVLDRLIESNEVVGEL + VAVSVLDKPDFQHDCLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + IDVTVNLNAFDRSLARNKQIREMAGLNVVIFSTTFYKTSHVIAKRIIDIVGALVGLIL + 
CGLVSVVLVPLIRKDGGSAIFAQTRIGKNGRHFTFYKFRSMCVDAEDKKRELMEQNTM + QGGMFKVDDDPRITKVGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQVSGRSEIKNFDEVVKLDVAYIDDWTIWKDIEILLKTVKVVLM + KDGAK" + misc_feature 5161..5268 + /gene="wchA" + /locus_tag="SPC08_0008" + /note="Signal peptide predicted for SPC0267 by SignalP 2.0 + HMM (Signal peptide probability 0.810) with cleavage site + probability 0.396 between residues 36 and 37" + misc_feature 5944..6525 + /gene="wchA" + /locus_tag="SPC08_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 5.3e-157" + gene 6533..7012 + /gene="wciQ" + /locus_tag="SPC08_0009" + CDS 6533..7012 + /gene="wciQ" + /locus_tag="SPC08_0009" + /note="member of homology group 220" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase (in conjunction + with wciR) WciQ" + /protein_id="CAI32952.1" + /db_xref="GOA:Q4K2N5" + /db_xref="InterPro:IPR013969" + /db_xref="UniProtKB/TrEMBL:Q4K2N5" + /translation="MKNKKKVCFCASSGGHYEQLMKLEPIMRQQDSYLITEYTDYNKG + ESEKKDINKVFYLLQINRLEFFWIVKLIWISLKSLYILLRIRPKVVICTGVLAMIPFC + LLSKMFGAKLIYIESFAKVTTPTLTGRILYRYADRFYVQWESMLDIYPNAVYKGGLY" + gene 7013..7492 + /gene="wciR" + /locus_tag="SPC08_0010" + CDS 7013..7492 + /gene="wciR" + /locus_tag="SPC08_0010" + /note="member of homology group 221" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase (in conjunction + with wciQ) WciR" + /protein_id="CAI32953.1" + /db_xref="GOA:Q9AHA2" + /db_xref="InterPro:IPR007235" + /db_xref="UniProtKB/TrEMBL:Q9AHA2" + /translation="MIFITVGTQKHPFNRLLKKIDQLIELEVIKEEVFAQIGASDYKP + KYFSYNSFLSSIDMNEKMREASMVITHGGTASIVKALKLRKKIIAVPRLEQFGEHVDN + HQLQIITVLGEEGYILPCFDIEQLGTVYQKAQTFTTKPYISNSYALLEDIRQYIDSL" + misc_feature 7013..7489 + /gene="wciR" + /locus_tag="SPC08_0010" + /note="HMMPfam hit to PF04101, Glycosyltransferase family, + score 4.8e-59" + gene 7505..8569 + /gene="wciS" + /locus_tag="SPC08_0011" + CDS 7505..8569 + /gene="wciS" + /locus_tag="SPC08_0011" + /note="member of 
homology group 222" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase WciS" + /protein_id="CAI32954.1" + /db_xref="GOA:Q9X9A5" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q9X9A5" + /translation="MTKVLQIGPSINLSKGGMSAVIRDLTYSPLLSGDFDITAYQSFI + DGSLVTRLTYSSYALLKFVVHSGNYDIYHIHTATRGSCWRKLLYLKLLKSKNKKAILH + IHGAEFQIFYDSLPEYKKNKVREMLELSDYVIVLSQTWYDFFSNININAKIVIVENGV + DTSFYVEKKKSITSNNFLFLGRMGKRKGAYDLIDAMNQAVAINPNLHLTMAGDGELED + IRQKISNLNLTDHITIYDWVNQRDKKILFQANQTLILPSYNEGLPMAILEAMASGLAI + ISTPVGGIPEIIHEDNGWLIQPGDISQLSNIILEASYNPDVVSLMGSNNHKLVEEKYS + FHSMHGKIKKIYNTLLETKK" + misc_feature 7988..8488 + /gene="wciS" + /locus_tag="SPC08_0011" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 1.3e-33" + gene 8569..10029 + /gene="wzx" + /locus_tag="SPC08_0012" + CDS 8569..10029 + /gene="wzx" + /locus_tag="SPC08_0012" + /note="member of homology group 47" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI32955.1" + /db_xref="GOA:Q9X9A6" + /db_xref="InterPro:IPR002528" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q9X9A6" + /translation="MTKKSITRNFIFNTILTMSSFIFPLISFPYVSRVLMADGLGRVT + FASSIIDYALTFAMLGMPLYGVKVCAGYIKNKEKLSQTVRELLVINLLVGFLVMLLLA + TMVIIIPRFRQEWQLIIITSSTIPLNIIGIEWLYKALEDYSYISIRTLTFKILGFLLM + FLVVRTKDDYMVYAAITVLASHGSFILNFFRSRTFLLENISQRLNLKQHIKPLLILFF + LSVSWTIYKNTDVVMMGFLTSDTEIGYYSTALKIRSIVLSVVTSLGTVVLPRLVKYYK + EGKYNEAKKILNKSSSFIMLSSLYFIGYIVINAREIILFIAGRNYLGAIPTLQVSIFS + AIFVGYSIMYGTNILVSIGKENVTIQASIIGVVLNICLNFIMIPKFAALGAGIATSIG + EAVMVLYEIIYLGKDGWSYFERLNILKIIVVFIFSTFMLYIMKDFFVGYPLFIYIVIS + GVIYSIIYIFGLMILRENLLSSWKISILNRFNIIKE" + misc_feature 8569..8679 + /gene="wzx" + /locus_tag="SPC08_0012" + /note="Signal peptide predicted for SPC0271 by SignalP 2.0 + HMM (Signal peptide probability 0.910) with cleavage site + probability 0.543 between residues 37 and 38" + misc_feature 8584..9393 + /gene="wzx" + /locus_tag="SPC08_0012" + /note="HMMPfam hit to PF01943, 
Polysaccharide biosynthesis + protein, score 1.6e-40" + gene 10042..10770 + /gene="wciT" + /locus_tag="SPC08_0013" + CDS 10042..10770 + /gene="wciT" + /locus_tag="SPC08_0013" + /note="member of homology group 211" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI32956.1" + /db_xref="GOA:Q9AHA0" + /db_xref="InterPro:IPR007577" + /db_xref="UniProtKB/TrEMBL:Q9AHA0" + /translation="MIPKKIHYIWFGGSEKPDVVLKCINSWKKYMPDYEIVEWNEDNF + DLSDSQFAKSAYESRKWAFASDYARFKILSKYGGIYFDTDVELLKTIPDDILAHSSFT + GFEYIGEVNPGLVYACMPDDKIAKYMVQYYEQASFDINHLVTVNTIITDYLLKNNFQK + NNQFQIIDGLAIYPDDYFCGYDQEVKEVRLTERTISIHHYSATWKTRTLKRKVQMIVK + TIIGAENYRKLLYCKRKITNAVSK" + misc_feature 10114..10380 + /gene="wciT" + /locus_tag="SPC08_0013" + /note="HMMPfam hit to PF04488, Glycosyltransferase + sugar-binding regi, score 8.3e-27" + gene 10754..11917 + /gene="wzy" + /locus_tag="SPC08_0014" + CDS 10754..11917 + /gene="wzy" + /locus_tag="SPC08_0014" + /note="member of homology group 223" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI32957.1" + /db_xref="UniProtKB/TrEMBL:Q9X9A8" + /translation="MPYLNNVPQNKFSIRLFDIAIVLLTLKMLVSSIPVFDFVFPQKF + QNILVILGYILIFLHIFEKRKYTLQFIISIILITTLLLYTSIQMQNYVYFTSWFMLIG + TIHYDLRRVIKIIFIVSLSIMFISIFISLLMYIIDYKREILINIRRNETVRAFTFGFI + HPNKFTIVLSNLCLMFIWLIKDRLKYYHVTFCLFIQLFFYFFTQTRTALLVSIVIFAL + LYIYMFVENLELRWIGYSFFCISTFLGVLAFQFYPSNNKFSIFIDNILTGRIKLAAYA + RTFFGYTFWGQYVDKEIVWDPIWGLTSFTFDSFYSFLMSNAGIIWLLILSVLFVKLQK + YLDNKSLILLLAWSMYAVTETDLIFPSYGFQFLFLSILFTNTSTCSTIMLKNN" + gene 11986..13224 + /gene="ugd" + /locus_tag="SPC08_0015" + CDS 11986..13224 + /gene="ugd" + /locus_tag="SPC08_0015" + /note="member of homology group 20" + /codon_start=1 + /transl_table=11 + /product="UDP-glucose 6-dehydrogenase Ugd" + /protein_id="CAI32958.1" + /db_xref="GOA:Q9AH99" + /db_xref="HSSP:1DLJ" + /db_xref="InterPro:IPR001732" + /db_xref="InterPro:IPR006168" + /db_xref="InterPro:IPR008927" + 
/db_xref="InterPro:IPR013328" + /db_xref="InterPro:IPR014026" + /db_xref="InterPro:IPR014027" + /db_xref="InterPro:IPR014028" + /db_xref="InterPro:IPR016040" + /db_xref="InterPro:IPR017476" + /db_xref="UniProtKB/TrEMBL:Q9AH99" + /translation="MKIAVTGTGYVGLSIAVLLAQHHQVIAVDIIPEKVELINQRKSP + IQDDYIEKYLAEKDLNLVATLDAKEAYKDADFVVIAAPTNYDPKKNFFDTSAVESVIE + TVLKYNPDAIMVIKSTVPVGYTESARKKFQTENILFSPEFLRESKALYDNLYPSRIIL + GTDKNNERLVSVAETFAGLLQEGALKEDIDTLYMGFTEAEAVKLFANTYLALRVSYFN + ELDTYSEMKGLDTQAIIDGVGLDPRIGSHYNNPSFGYGGYCLPKDTKQLLANYEDVPE + ELIGAIVRSNSTRKDFIADQVLKMVDYYDYSAHNVFNERVEKDIIIGIYRLTMKSNSD + NFRQSSIQGIMKRIKAKGVRVVIYEPTLESGSTFFGSSIINDLEEFKRLSNAIVANRY + DNSLEDVKEKVYTRDIFERD" + misc_feature 11986..12528 + /gene="ugd" + /locus_tag="SPC08_0015" + /note="HMMPfam hit to PF03721, UDP-glucose/GDP-mannose + dehydrogenase, score 6.7e-53" + misc_feature 11986..12498 + /gene="ugd" + /locus_tag="SPC08_0015" + /note="HMMPfam hit to PF01210, NAD-dependent + glycerol-3-phosphate deh, score 3.4e-05" + misc_feature 11986..12402 + /gene="ugd" + /locus_tag="SPC08_0015" + /note="HMMPfam hit to PF00056, lactate/malate + dehydrogenase, NAD bind, score 0.00018" + misc_feature 11986..12066 + /gene="ugd" + /locus_tag="SPC08_0015" + /note="Signal peptide predicted for SPC0274 by SignalP 2.0 + HMM (Signal peptide probability 0.610) with cleavage site + probability 0.508 between residues 27 and 28" + misc_feature 12571..12852 + /gene="ugd" + /locus_tag="SPC08_0015" + /note="HMMPfam hit to PF00984, UDP-glucose/GDP-mannose + dehydrogenase, score 4.3e-38" + misc_feature 12952..13203 + /gene="ugd" + /locus_tag="SPC08_0015" + /note="HMMPfam hit to PF03720, UDP-glucose/GDP-mannose + dehydrogenase, score 4.9e-06" + gene 13286..13381 + /gene="HG265" + /locus_tag="SPC08_0016" + /pseudo + CDS 13286..13381 + /gene="HG265" + /locus_tag="SPC08_0016" + /note="member of homology group 265" + /pseudo + /codon_start=1 + /transl_table=11 + /product="UDP-galactopyranose mutase (pseudogene)" + gene 13435..13635 + 
/gene="HG266" + /locus_tag="SPC08_0017" + /pseudo + CDS 13435..13635 + /gene="HG266" + /locus_tag="SPC08_0017" + /note="member of homology group 266" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative acetyltransferase (fragment)" + gene 13797..>13844 + /gene="aliA" + /locus_tag="SPC08_0018" + CDS 13797..>13844 + /gene="aliA" + /locus_tag="SPC08_0018" + /codon_start=1 + /transl_table=11 + /protein_id="CAI32961.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ89" + /translation="MMKSSKLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtt tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcata taaaaacaag + 181 ggaggactgt ataaaaagca gaaatccttt gttttttata accaaggttt ataaactttc + 241 attttcgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga agatgaacat + 301 aaagaagcgt gtccttagtg caggcctgac ttttgcatct gctttgcttt tagctgcttg + 361 cggccaatca ggctcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaactat ctattagact attacgctga taatatagtc aattgaaaca agagcaggac + 481 aaaagagcct cgtaaaaggt attgcaactt ggtaatacct ttttgaggtg ctttttgata + 541 tgagcccatg ttttctcaat aggattgtac tcaggtgagt agggaggaag aggtaaaagt + 601 ttacgcctaa actcttcaca caagagttct agcttcccca ttctatggaa tcttgcatta + 661 tccataataa taaccgatgg tgtggttaat gttggtaaga gaaacttctg aaaccaagct + 721 tcaaaaaagt cgctcgtcat cgtctcttcg taagtcattg gagcgattaa ctcaccattc + 781 atttgttaga cctgcaacca aagaaatcct ctgatatctt cttccagata ctttgcctct + 841 tattaactga ttaactgact ttttaatgag cgaccatatt ctcgataaaa ataagtatcg + 901 aatcctgttt catcaatcta aacaggtgct aggtgcttta aactattaaa attcttaaga + 961 aataaggcta ctttttctgg gtcttgttca tagtaggtgt ggttcttttt tcgagtgtag + 1021 cccatagctt tgagcgcata gtggatggta gttggatgac agccaaattc agaagctatt + 1081 tcagtcaaat aagcatctgg attgtcagta agatagtttt taagtctatc tctatcaact + 1141 tttcttggtt ttgttccttt tacttggtgg tttagctctc ctgttttctc ttttagcttt + 1201 aaccagccat aaatggtatt acgtgagatt 
tggaaaacgt gtgatgcttc tgttatacta + 1261 cctgttcgct cacaataaga gagaactttt ttacgaaaat ctattgaata tgccataaga + 1321 agattatacc tcattgtgta ctatagtaga ttgaaactag aatagtacac atctgcttct + 1381 aaaacattgt tagaaatcga tttgactgtc ccgatcgatt tgtcatgttc ttatttcatt + 1441 ttactatatt tttgttttgc gggaagtcta ctaagatact taaagatgca gatagtgaaa + 1501 aaaaggtgta gacattaccg taaaaaagtg atataatcgt aagatgttca atgtataggt + 1561 gttaatcatg agtagacgtt ttaaaaaatc acgttcacag aaagtgaagc gaagtgttaa + 1621 tatagttttg ttgactattt atttattgtt agtttgtttt ttattgttct taatctttaa + 1681 gtacaatatc cttgctttta gatatcttaa tctagtggta actgcgttag tcctactagt + 1741 tgccttggta gggctactct tgattatcta taaaaaagct gaaaaattta ctatttttct + 1801 gttggtgttc tctatccttg tcagctcagt gtcgctcttt gcagtacagc agtttgttgg + 1861 actgaccaat cgtttaaatg cgacttctaa ttactcagaa tattcgctca gtgtcgctgt + 1921 tttagcagat agtgagatcg aaaatgttac gcaactgacg agtgtgacag caccgactgg + 1981 gactgataat gaaaatattc aaaaactact agctgatatc aagtcaagtc agaataccga + 2041 tttgacggtc gaccagagtt cgtcttactt ggttgcttac aagagtttga ttgcagggga + 2101 gactaaggcc attgtcctaa atagtgtctt tgaaaatatc atcgagttag agtatccaga + 2161 ctacgcatcg aagataaaga agatttatac caagggattc actaaaaaag tagaagctcc + 2221 taagacgtct aagaatcagt ctttcaatat ctatgttagt ggaattgaca cctatggacc + 2281 tattagttcg gtgtcgcgat cagatgtcaa tatcctgatg actgtcaatc gtgataccaa + 2341 gaaaatcctc ttgaccacaa cgtcacgtga tgcctatgta ccaatcgcag atggtggaaa + 2401 taatcaaaaa gataaattaa cccatgcggg catttatgga gttgattcgt ccattcacac + 2461 cttagaaaac ctctatggag tggatatcaa ttactatgtg ctattgaact tcacttcttt + 2521 cttgaaaatg attgacttat tgggaggggt agatgttcat aatgatcaag agttttcagc + 2581 tctacatggg aagttccatt tcccagtagg gaatgtccat ctagactctg agcaggctct + 2641 aggttttgta cgtgaacgct actcactagc cgatggagac cgtgaccgtg gtcgcaacca + 2701 acaaaaggtg attgtggcta tccttcaaaa attaacgtca accgaagtac tgaaaaatta + 2761 tagtacgatc attaatagct tgcaagattc tatccaaaca aatatgccga ttgagactat + 2821 gatagattta gtgaatactc agttggaaag tggaggtaat tataaagtaa 
attttcaaga + 2881 tttaaaaggg acaggtcgga tggatcttcc ttcttatgca atgccagaca gtaacctcta + 2941 tatgatggaa atagatgata gtagtttagc tgtagttaaa gcagctatac aggatgtgat + 3001 ggagggtaga tgaaatgata gacatccatt cgcatatcgt ttttgatgta gatgacggtc + 3061 ccaagtcaag agaggaaagc aaggctctct tggcagaatc ctacaggcag ggggtgcgaa + 3121 ccattgtctc tacctctcac cgtcgcaagg gtatgtttga aactccggaa gagaagatag + 3181 cagaaagctt tcttcaggtt cgggaaattg caaaagaagt agcagatgat ttagtcattg + 3241 cttacggggc tgaaatttac tacacaccag atgttctgga taagctggga aaaaagcgga + 3301 ttccgaccct caatgatagt cgttatgcct tgatagagtt tagtatgaac actccttatc + 3361 gcgatattca tagcgccttg agcaagatct tgatgttggg aattactcca gtcattgccc + 3421 acattgagcg ctatgatgct cttggaaata atgaaaaacg cgttcgagaa ctgattgata + 3481 tgggctgtta cacgcaagta aatagttcac atgtcctcaa accaaaactt tttggagaac + 3541 gttataaatt catgaaaaaa agagctcagt attttttaga gcagaatttg gttcatgtca + 3601 ttgcaagtga catgcacaat ctagacggca gacctcctca tatggcagaa gcatatgact + 3661 ttgttaccca aaaatacgga gaagcgaagg ctcaggaact ttttatagac aatcctcgaa + 3721 aaattataat ggatcaacta atttaggaga aatgatgaaa gaacaaaaca cgatagaaat + 3781 cgatgtattt caattattta aaaccttgtg gaaacgcaag ctaatgattt tattagtggc + 3841 acttgtgaca ggtgcggggg cttttgcata tagcactttt attgttaagc cagaatatac + 3901 gagtaccacg cgaatttacg tagtgaatcg caatcaagga gacaagtcgg ggctgacaaa + 3961 tcaggatttg caggcaggat cttatctggt aaaagactac cgtgagatta tcctttcgca + 4021 ggatgcattg gaaaaagtag cgacaaattt gaagttggac atgccagcaa aaacgttagc + 4081 tagcaaagtt caagtgactg taccaactga cactcgtatc gtctcaatct ctgtcaagga + 4141 taaacagcca gaggaagcca gtcgtatcgc taattctcta cgagaagttg ctgtagaaag + 4201 gatcgtcgct gtaacgcgag tatctgatgt aacgacactt gaagaagcgc gaccagctac + 4261 gactccttct tctccaaatg ttcgacgcaa ttccttgttt ggttttcttg gaggagcagt + 4321 tgtaacagta attgctgttc ttttgattga gttgttcgac acccgtgtga aacgtcctga + 4381 agatgttgaa gatgtactgc aaattccact tttagggctc gttccagatt tggacaaaat + 4441 gaaataggag gaagttatgc caacattaga aatctcacag gcaaaattgg attttgtaaa + 4501 aaaggcagag 
gaatattata actctttgtg catgaaccta cagttaagtg gagatggttt + 4561 gaaagtattt tctatcactt ctgtgaaact aggagaagga aaatcaacga cttccaccaa + 4621 tatcgcttgg gcttttgcgc gtgcaggtta caaaacgctg ctgattgatg gagatattcg + 4681 caattctgtt atgttaggtg tctttaaagc aagggataag attacaggcc tgacagaatt + 4741 tttatcagga actacagacc tatcacaagg gctttgtgat accaatatcg aaaatctctt + 4801 tgtaattcag gctggctctg tgtcaccgaa tccgacagct cttcttcaaa gtaagaattt + 4861 cagtacaatg cttgaaacct tgcgtaaata ttttgactac atcattgtag atactgctcc + 4921 tgtcggtgtc gtgattgatg cggctattat tacgcgaaaa tgcgatgctt ctattttagt + 4981 gacggaggca ggtgaaataa atcgacggga tattcaaaaa gcaaaagaac agttggaaca + 5041 cacagggaag ccgtttttgg gagttgtgtt gaataaattc gatacttcag taaacaaata + 5101 cggttcttat ggaaattatg gagattacgg gaaaaataaa aaatagattg agggatagag + 5161 atgaatggaa aagtagtaaa ttcttcattg gccataatcc atagttttct tgttatttta + 5221 ttgacttatc tacttagtgc tgtgagagaa gcggagattg cttcagcaac agctattgca + 5281 ctttatatcc tccattattt tgtcttttat atcagtgatt atggacagga tttctttaaa + 5341 aggggatatt tgattgaact tgtccagaca ttgaaatata tcctattctt tgcactagcg + 5401 attagtattt ctaatttttt cttagaggat cgatttagta tttccagacg aggcatgatt + 5461 tacttcctca cattacatgc tctcttagtc tatgtgctaa acctatttat caagtggtat + 5521 tggaagcggg cttatcccaa ctttaaagga agtaagaaga ttctcctact tacagcaact + 5581 tctcgtgtcg aaaaggtact ggatagatta atagaatcaa atgaggttgt tggggagttg + 5641 gtagccgtca gtgtcttaga taaaccagat tttcagcatg attgtttaaa ggtagtagca + 5701 gagggggaga tagtaaactt tgcgactcat gaggtggtcg atgaagtctt tatcaatctt + 5761 ccaagtgaaa aatacaatat tggagagctt gtctctcagt ttgaaacgat gggaattgat + 5821 gtaacagtca atctaaatgc ttttgatcgt agtttggcac gtaacaagca aattcgtgag + 5881 atggcaggat taaacgttgt gattttttct acaacatttt ataagactag ccacgtgatt + 5941 gctaagcgga ttattgatat cgtgggtgca ttggtagggc tgatactatg tggtctagtc + 6001 agtgttgtac tggtcccttt gattcgaaag gatgggggct ctgctatttt tgctcagacg + 6061 cgtattggaa aaaatggtcg ccacttcact ttttacaagt tccgctccat gtgtgtagat + 6121 gctgaggaca aaaaaagaga actcatggaa 
caaaatacca tgcagggtgg aatgtttaag + 6181 gtggatgatg acccacgtat cacgaaagtt ggtcgtttta tacggaagac tagcttggac + 6241 gagctgccac agttttataa tgttctaaag ggagatatga gtttggttgg tacacgacca + 6301 ccaacagtgg acgagtatga acactatact ccagaacaaa aacgtcgtct aagttttaaa + 6361 cctggtataa caggtttatg gcaggttagt ggacgaagtg agattaagaa tttcgatgaa + 6421 gttgtcaagt tagatgtagc ttatatagat gattggacaa tctggaaaga tattgaaatc + 6481 ttattgaaga cagttaaagt tgtattgatg aaggatggag cgaagtaaag gaatgaaaaa + 6541 taaaaaaaaa gtatgttttt gtgcttcgtc agggggacat tatgagcaac taatgaagct + 6601 tgaaccgatt atgagacaac aagacagcta tttaatcaca gaatatactg attataacaa + 6661 aggagagtct gagaagaaag atataaacaa ggtgttttat cttttgcaaa ttaatcgttt + 6721 ggaatttttt tggatcgtta aattgatttg gatttccttg aaatcacttt atatactgtt + 6781 aagaatacgc ccaaaagtag ttatctgtac aggtgttctt gcaatgatac cgttttgttt + 6841 gctttcaaaa atgtttgggg ctaaattaat ttatattgaa tcttttgcaa aagtgaccac + 6901 tcctacttta acaggtagaa tactataccg ttacgcagat agattctatg tgcaatggga + 6961 gagtatgcta gatatctacc caaatgctgt ttataaaggg gggctttatt aggtgatttt + 7021 tataactgta gggactcaaa aacacccttt taatcgcttg ttaaaaaaaa tagatcaact + 7081 tattgaatta gaagtgataa aggaagaggt gtttgctcag attggagctt ctgattataa + 7141 acctaaatac ttttcttata attcattttt gagttcaatt gatatgaatg agaagatgag + 7201 agaagctagt atggtaatta cacatggtgg gactgctagt attgttaaag ctttgaaatt + 7261 aagaaaaaaa attatagcgg ttccacgatt agagcagttt ggagaacatg tggataatca + 7321 ccaattacaa atcatcacag ttcttggtga ggaaggttat attttgccat gctttgatat + 7381 agagcagtta ggaactgttt atcaaaaagc tcagactttt acaacaaagc catatatttc + 7441 taatagttat gcacttttag aagatatacg acaatacata gatagtcttt gaaaggaaat + 7501 ttagatgaca aaagttttgc aaattgggcc tagtataaat ttatctaaag gtggtatgag + 7561 cgctgttatt agagatttga catatagccc gttattgtca ggtgattttg atataactgc + 7621 ttatcaatct tttattgatg gctctcttgt aacacggtta acctattcta gttatgctct + 7681 tcttaaattt gtagttcatt ctggtaatta tgacatatac catattcaca ctgctacaag + 7741 agggagttgt tggagaaaat tactgtattt gaaattactt aaaagtaaaa 
ataaaaaagc + 7801 tattttgcat attcatggag cagaatttca aatattttat gactcacttc ctgagtataa + 7861 aaaaaataaa gttagagaaa tgttagaatt atctgattat gtgattgtac tttcccaaac + 7921 ttggtatgat tttttttcaa atattaatat aaatgcaaaa attgtaatag ttgaaaatgg + 7981 tgtagacact tctttttatg tagaaaaaaa gaaaagtata acaagcaaca actttctttt + 8041 tttaggaagg atgggcaaaa gaaaaggagc ctatgattta atagatgcca tgaatcaagc + 8101 agtggctata aatcctaatt tgcatttgac aatggctgga gatggagaac ttgaagacat + 8161 acgtcaaaag atatcaaatc tgaatttgac tgatcatatt acaatatatg attgggttaa + 8221 tcagagagat aaaaaaatac tatttcaagc taatcagact ttgatattgc cttcttataa + 8281 tgaggggctc ccgatggcaa tattggaagc tatggcttct ggattagcaa tcatatcaac + 8341 gcctgtaggt ggcatacctg aaattataca cgaggataat ggctggttaa ttcaaccggg + 8401 tgatatttct cagttatcta atattatttt agaagcaagt tacaatcccg atgttgtaag + 8461 tttaatgggg agcaataatc ataagttggt tgaagagaag tatagttttc atagtatgca + 8521 tggtaaaatt aaaaaaattt ataatactct attagaaacg aaaaaataat gactaaaaaa + 8581 tctattacta gaaattttat tttcaataca attctaacta tgtccagttt tatttttcca + 8641 ctcatcagtt tcccatatgt ttcaagggtt ctgatggcag atgggttggg acgagtaacg + 8701 ttcgcttctt caattattga ttatgcccta acatttgcaa tgttagggat gccattatat + 8761 ggtgttaaag tctgtgcagg atatattaaa aataaggaga agctaagtca gactgtcaga + 8821 gaattgttag tcattaattt attagtagga tttcttgtga tgcttctttt agcaactatg + 8881 gtaataataa ttcctcgttt tagacaggaa tggcagctta ttattatcac gtcatctaca + 8941 attcctctca atattatagg aatagagtgg ttatacaaag cattggaaga ctattcgtat + 9001 atttcaatta gaacattgac ttttaaaata ttaggtttcc ttttgatgtt tttagtcgtc + 9061 cgaacaaaag atgactatat ggtatatgcg gcaattacag ttttagctag tcatggttct + 9121 tttattttga atttttttag atctagaact ttcctactag aaaatatctc tcaaagattg + 9181 aatttaaagc aacatataaa gccgttatta attttatttt ttttatctgt atcatggact + 9241 atttataaga atacagatgt cgttatgatg ggatttctaa ctagtgatac agaaattggt + 9301 tactattcaa cagcattaaa aattcgttct atagtgctca gtgtagtaac ttctttaggg + 9361 acagttgtac tacctcgttt agtcaaatat tataaagaag gaaagtataa tgaagcaaag + 9421 aaaatactaa 
acaaaagttc ttcatttatt atgctaagtt ctttatattt tattggctat + 9481 attgtaatta atgccagaga aattattctt tttattgcgg gtaggaatta cttaggggct + 9541 atcccgacac ttcaagtatc tatttttagt gcaatatttg ttggctactc tattatgtat + 9601 ggaaccaata tcctagtatc tataggtaaa gaaaatgtaa ccattcaggc aagtattatt + 9661 ggtgttgttt taaatatttg tttgaatttt attatgatac ccaaatttgc tgcactaggg + 9721 gcaggtattg caacttctat aggagaagct gttatggtat tatatgaaat aatatacttg + 9781 ggaaaggatg gttggagcta ttttgaaaga ttaaatattt taaagattat tgtagtattt + 9841 atatttagta cgtttatgtt atatattatg aaagattttt ttgttggcta tcctttattt + 9901 atttatattg taatttcagg ggttatttat agtattatat atatatttgg tcttatgata + 9961 ctaagagaaa atttgctttc aagttggaaa atatcaatac taaatcggtt taatattatt + 10021 aaagaatgag gagaatatta tatgattcct aaaaaaatcc actatatttg gttcggtgga + 10081 agtgagaaac cagatgttgt cttaaaatgt attaattctt ggaaaaaata tatgccagac + 10141 tatgagattg ttgaatggaa tgaggataat tttgatttat cagattcaca atttgcgaag + 10201 tctgcatatg aatctaggaa atgggcattt gcatcggatt atgctcgttt taaaatttta + 10261 tctaagtatg gtgggatcta ttttgatacg gatgttgagt tgttaaaaac aataccagat + 10321 gatatattag ctcattcatc ttttacaggt tttgaatata ttggtgaagt aaatccagga + 10381 cttgtatatg cttgtatgcc agatgataag atagcaaaat atatggtgca atattatgag + 10441 caagcaagtt ttgatatcaa tcatttggta actgtcaata caattattac agattatcta + 10501 ttaaaaaata actttcaaaa aaataatcag ttccaaataa ttgatggatt agcaatttat + 10561 ccagatgatt acttttgtgg ttatgatcag gaggtcaagg aggttaggct tacggaacgg + 10621 acgattagta ttcatcatta tagtgctact tggaaaacaa gaactttaaa aagaaaagta + 10681 cagatgattg ttaaaacaat tataggagct gagaattata ggaaattatt atattgtaag + 10741 aggaaaataa ccaatgccgt atctaaataa tgtaccgcaa aataaatttt ctataagatt + 10801 atttgatatt gctatagttt tattgacttt aaagatgtta gtttcttcga ttccagtttt + 10861 tgactttgtg tttcctcaaa aatttcaaaa tatccttgtt attttaggtt atatattgat + 10921 ttttttacat atttttgaga aaagaaagta cacattacaa tttataatta gtataattct + 10981 aattactaca ttactgcttt atactagtat acaaatgcaa aattatgttt actttacgag + 11041 ttggtttatg ttgattggta 
cgattcatta tgatttaaga agagtaataa aaattatatt + 11101 tattgtatca ttaagtatta tgttcatatc aatttttata tcacttctta tgtatataat + 11161 tgattataaa cgagaaattc ttattaatat ccgaagaaac gaaactgtca gagcatttac + 11221 atttggtttt atacatccca ataaatttac tattgtacta tctaacttat gtcttatgtt + 11281 tatttggtta atcaaagatc gtttgaaata ttatcatgta actttttgtc tttttattca + 11341 gttattcttt tattttttca cgcagactag aacagctcta ctagtatcta tagtaatttt + 11401 tgctctttta tatatttata tgtttgttga aaatcttgaa cttagatgga taggatactc + 11461 attcttttgt atttctactt ttttaggagt tttggcattt caattttatc cttctaataa + 11521 taagttttca atttttattg ataatatcct gactggacgt attaaattag ctgcatacgc + 11581 aagaaccttt tttggttata cattctgggg tcaatatgtt gataaagaaa ttgtttggga + 11641 tcctatttgg ggattaacta gtttcacttt tgattcgttt tattccttct tgatgagtaa + 11701 tgctggcatc atatggctac ttatcttatc agtcttattt gtaaaactac aaaaatattt + 11761 agacaataaa agtttgattt tattattagc ttggtctatg tatgcggtaa cagaaactga + 11821 tttaatattt ccaagttatg gattccagtt cttattttta agtatacttt ttactaatac + 11881 tagtacatgt tctacaataa tgttaaagaa taattaattg aaggaatcta tatattttct + 11941 aatttgtaga atgataggca aatatatgag gagggaagaa aaagtatgaa aatagcagta + 12001 acaggtacgg gatatgttgg cctatccatt gcggttttat tggctcagca tcatcaagta + 12061 atagcggtgg acattattcc tgagaaggtc gagttaatta atcaaagaaa gtcacctatt + 12121 caagatgact acatagagaa atatctggca gaaaaggatt taaatttagt ggctacattg + 12181 gatgcaaaag aagcatataa agatgcggat tttgttgtga ttgcagctcc aactaactat + 12241 gatccaaaga agaacttctt tgacacttct gctgtagagt ctgtcattga aacggtgctt + 12301 aaatataatc cagatgctat catggtcatt aaaagtacgg ttccagttgg ttatacagag + 12361 tcagctcgaa agaaatttca gactgaaaat atcttattta gtcctgaatt tttgcgtgag + 12421 tcaaaagcac tttacgataa cttatatccc agccgtatta ttttagggac agataaaaat + 12481 aatgaacgct tggtaagtgt tgctgagacg tttgcgggat tgctccaaga aggcgcttta + 12541 aaagaagata ttgatacatt gtacatgggc tttactgaag ctgaggcggt caagcttttt + 12601 gcaaatactt acctagcttt gcgtgtttct tattttaatg agctggatac ttattctgag + 12661 atgaaggggc tagatactca 
agctattatt gatggagttg gtttggatcc acgaatcggc + 12721 tctcactata acaatccttc cttcgggtat ggtggttact gtctccctaa agataccaag + 12781 caacttcttg ccaactatga agatgtacca gaagaactta taggagctat agtacggagc + 12841 aattcgacac gtaaagactt tattgccgat caggttctta agatggtaga ttattatgat + 12901 tattcagccc ataatgtttt taatgagaga gtagaaaaag atattattat tggtatctat + 12961 agattgacca tgaagagtaa tagcgataat tttcgtcaaa gttctattca aggtattatg + 13021 aaacgtataa aagctaaggg agtaagagta gttatttatg aaccaacttt agaaagtggg + 13081 agtacatttt ttggaagttc cattatcaat gatttagagg aattcaaacg actgagtaat + 13141 gccattgttg ctaatcgcta tgataactca ttagaagatg tcaaggaaaa agtctataca + 13201 cgtgatattt ttgaaagaga ttgatttagt ataataaaaa tgtaaaaaat taattgttag + 13261 aagcggtcta tactgagaag caatgggacg cttagcagat tatacatatt acgatatgca + 13321 tgttgtgatt gaacgagcgc tcgaagttat agaaaaagag tttgaaaatg acaaaaatta + 13381 gaatcaattg gatagatttt ggaaaagggt tctcaatatt tttagtttta gtagagcgtc + 13441 tatatcctcc attccccaat ttgtagtatg attctaattc tgatgttgaa agtgggaatt + 13501 agctctactt tacttcatat tgttatcgga attgttttgg gctggcattt atccatccta + 13561 gcaacctata tattgaaaaa aattccattt ttgaatattg ttttattacc acagaagtat + 13621 attaaattaa aataaattat tttggctctt tgtcagctaa catctggaga ggacaatcac + 13681 cgtcttctcc tttttggtct tttcagaata tactaaacta acccaaaaat tctgaaaatt + 13741 ctgttgacat ctttttgaaa agagtctata atggagagaa agttttaaag gagaaaatga + 13801 tgaaaagttc aaaactactt gcccttgcgg gcgtgacatt attg +// + diff --git a/public/res/serotype_genbank/serotype_9A.gb b/public/res/serotype_genbank/serotype_9A.gb new file mode 100644 index 0000000..333c84a --- /dev/null +++ b/public/res/serotype_genbank/serotype_9A.gb @@ -0,0 +1,920 @@ +LOCUS CR931645 20538 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain Wilder (serotype 9a). +ACCESSION CR931645 +VERSION CR931645.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. 
+REFERENCE 1 (bases 1 to 20538) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 20538) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..20538 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="Wilder" + /db_xref="taxon:1313" + gene <1..134 + /gene="dexB" + /locus_tag="SPC09A_0001" + CDS <1..134 + /gene="dexB" + /locus_tag="SPC09A_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI32962.1" + /db_xref="UniProtKB/TrEMBL:Q4JZI8" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVELL" + gene 293..458 + /gene="aliB" + /locus_tag="SPC09A_0002" + /pseudo + CDS 293..458 + /gene="aliB" + /locus_tag="SPC09A_0002" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative oligopeptide-binding protein AliB + (pseudogene)" + gene complement(order(459..995,997..1323)) + /gene="tnp" + /locus_tag="SPC09A_0003" + /pseudo + CDS complement(join(459..995,997..1323)) + /gene="tnp" + /locus_tag="SPC09A_0003" + /note="member of homology group 4" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS630-Spn1 transposase" + misc_feature 
complement(join(933..995,997..1305)) + /gene="tnp" + /locus_tag="SPC09A_0003" + /note="HMMPfam hit to PF01710, Transposase, score 2.2e-23" + /pseudo + gene 1536..2981 + /gene="wzg" + /locus_tag="SPC09A_0004" + CDS 1536..2981 + /gene="wzg" + /locus_tag="SPC09A_0004" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI32965.1" + /db_xref="GOA:Q8KWQ3" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q8KWQ3" + /translation="MSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLLFSILVSSVSLFAVQQFVGLTNR + LNAASNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYGTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRMDLPSY + AMPDSNLYVLEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1536..1652 + /gene="wzg" + /locus_tag="SPC09A_0004" + /note="Signal peptide predicted for SPC0281 by SignalP 2.0 + HMM (Signal peptide probability 0.993) with cleavage site + probability 0.538 between residues 39 and 40" + misc_feature 1740..2087 + /gene="wzg" + /locus_tag="SPC09A_0004" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 3e-61" + misc_feature 2265..2708 + /gene="wzg" + /locus_tag="SPC09A_0004" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 8.4e-70" + gene 2983..3714 + /gene="wzh" + /locus_tag="SPC09A_0005" + CDS 2983..3714 + /gene="wzh" + /locus_tag="SPC09A_0005" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI32966.1" + /db_xref="GOA:Q8KWQ2" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + 
/db_xref="UniProtKB/TrEMBL:Q8KWQ2" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGVTPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEQDLVHVIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQEFFIDNPRKIVMDQLI" + misc_feature 2986..3594 + /gene="wzh" + /locus_tag="SPC09A_0005" + /note="HMMPfam hit to PF02811, PHP domain, score 6.2e-37" + gene 3720..4415 + /gene="wzd" + /locus_tag="SPC09A_0006" + CDS 3720..4415 + /gene="wzd" + /locus_tag="SPC09A_0006" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI32967.1" + /db_xref="GOA:Q4K2H5" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K2H5" + /translation="MMKEQNTIEIDVFQLFKTLWKRKLMILIVALVTGAGAFAYSTFI + VKPEYTSTTRIYVVNHNQGNKLGLTNQDLQAGSYLVKDYREIILSQDVLEKVATNLKL + DMPAKTLASKVQVTVPDDTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGVVVTVIAVLFIELLDTRVKRPEDVEDVLQI + PLLGLVPDLNKMK" + misc_feature 3720..3836 + /gene="wzd" + /locus_tag="SPC09A_0006" + /note="Signal peptide predicted for SPC0283 by SignalP 2.0 + HMM (Signal peptide probability 0.625) with cleavage site + probability 0.411 between residues 39 and 40" + misc_feature 3741..4157 + /gene="wzd" + /locus_tag="SPC09A_0006" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 1.7e-55" + misc_feature 4263..4340 + /gene="wzd" + /locus_tag="SPC09A_0006" + /note="PS00217 Sugar transport proteins signature 2." 
+ gene 4425..5114 + /gene="wze" + /locus_tag="SPC09A_0007" + CDS 4425..5114 + /gene="wze" + /locus_tag="SPC09A_0007" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI32968.1" + /db_xref="GOA:Q8KWQ0" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q8KWQ0" + /translation="MPTLEISQAKLDFVKKAEEYYNALCTNLQLSGDGLKVFSITSVK + LGEGKSTTSINIAWAFARAGYKTLLIDGDIRNSVMLGVFKARDKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRKCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGIVLNKFDTSVDQYGSY + GNYGDYGKNKK" + gene 5129..6496 + /gene="wchA" + /locus_tag="SPC09A_0008" + CDS 5129..6496 + /gene="wchA" + /locus_tag="SPC09A_0008" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI32969.1" + /db_xref="GOA:Q8KWP9" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q8KWP9" + /translation="MNGKILRSSLAIIQSFLVILLTYLLSAVREAEIVSTTAIALYIL + HYFVFYISDYGQAFFKRGYLIELVQTLKYILFFALAISISNFFLEDRFNISRRGMIYF + LTLHALLVYVLNLFIKRYWKRAYPNFKGSKKILLLTATSRVEKVLDRLIESNEVVGEL + IAVSVLDKPDFQHDCLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + IDVTVNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHVIAKRIIDIVGAFVGLIL + CGLVSIVLVPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQISGRSEIKNFDEVVKLDVAYIDGWTIWKDIEILLKTVKVVFM + RDGAK" + misc_feature 5129..5221 + /gene="wchA" + /locus_tag="SPC09A_0008" + /note="Signal peptide predicted for SPC0285 by SignalP 2.0 + HMM (Signal peptide probability 0.938) with cleavage site + probability 0.364 between residues 31 and 32" + misc_feature 5912..6493 + /gene="wchA" + /locus_tag="SPC09A_0008" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 2.4e-159" + gene 
6502..7245 + /gene="wchO" + /locus_tag="SPC09A_0009" + CDS 6502..7245 + /gene="wchO" + /locus_tag="SPC09A_0009" + /note="member of homology group 33" + /codon_start=1 + /transl_table=11 + /product="putative WecB-family glycosyl transferase" + /protein_id="CAI32970.1" + /db_xref="GOA:Q8KWP8" + /db_xref="InterPro:IPR004629" + /db_xref="UniProtKB/TrEMBL:Q8KWP8" + /translation="MNERMQILGIIIDPLTMKETVDAVEQYVLKKHPLHLMGVNADKI + NQCHEDEKIKKIVNESGIINADGASVVLASKFLGTPVPERVAGIDLMQCLLELSNKKG + YSVYFFGAKEEILQDMLKVFKQRYPNLNVVGYRNGYFSPEDEKKIQEDIKGGKPDFVF + VGITSPKKEYIIQSFMDNGINAVFMGVGGSFDVLSGHIKRAPLWMQKLNLEWLFRVVN + EPKRLFKRYFVGNVTFIKRVLDEKRKSKK" + misc_feature 6664..7179 + /gene="wchO" + /locus_tag="SPC09A_0009" + /note="HMMPfam hit to PF03808, Glycosyl transferase + WecB/TagA/CpsF f, score 1.2e-93" + gene 7220..8305 + /gene="wcjA" + /locus_tag="SPC09A_0010" + CDS 7220..8305 + /gene="wcjA" + /locus_tag="SPC09A_0010" + /note="member of homology group 66" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI32971.1" + /db_xref="GOA:Q8KWP7" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q8KWP7" + /translation="MKSENQKNNILHISRTMDIGGAERIVYQLSSDLKDEFDSVHVAS + TGGLWESKLLSKGVQHHKILDVDSKNPLTMVKILSSFYRIIKNNDITIVHTHHRMAAF + YIRLLKIINPKLIHVYTAHNVFKNKLPLYKFSLKKAYCVAVGKAVNDNLKHDVGISDS + TVIYNGVVFEKTDKLVDEIVNYNGIKLGCIARLSEQKGLTYLIDAMSLVKHRDITLFI + VGDGELRDELENKVKQLNLQKSVIFLGYRKDVVECINSFDYLVSSSLYEGLALNVIEA + FMNGKTMVASDIPGINEVVNNKNGILVPVKDDVALARAIEKLATDKKLREKLAYQAKK + DYETKFNYSLFLDNYRRLYRKLTGESK" + misc_feature 7733..8224 + /gene="wcjA" + /locus_tag="SPC09A_0010" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 4e-43" + gene 8302..9390 + /gene="mnaA" + /locus_tag="SPC09A_0011" + CDS 8302..9390 + /gene="mnaA" + /locus_tag="SPC09A_0011" + /EC_number="5.1.3.14" + /note="member of homology group 23" + /codon_start=1 + /transl_table=11 + /product="UDP-N-acetylglucosamine-2-epimerase MnaA" + /protein_id="CAI32972.1" + 
/db_xref="GOA:Q8KWP6" + /db_xref="HSSP:1O6C" + /db_xref="InterPro:IPR003331" + /db_xref="UniProtKB/TrEMBL:Q8KWP6" + /translation="MKKVMLVFGTRPEAIKMCPLVNELKQNDSIKTLVCVTGQHKEML + EQVLEVFKVVPDHDLGIMKANQTLFSITISILDKIQAVLEQEMPDIVLVHGDTTTTFA + TALAAFYMGIKVGHVEAGLRTHNLQSPFPEEFNRQTTSIIADYHFAPTEVAKENLLRE + GRKNIFVTGNTVIDALKTTVQCNYHHPILEWAKGSKLIMLTAHRRENLGEPMENMFNA + VNRILDEFEDVKVVYPIHKNPKVRELASKVFGDNERMKIIEPLEVIDFHNFMDQSYMI + LTDSGGVQEEAPSLGKPVLVMRDTTERPEGVAAGTLKLVGTEEENIYNNFKLLLEDET + EYNKMSKASNPYGDGMTCKRVVDIILEV" + misc_feature 8365..9381 + /gene="mnaA" + /locus_tag="SPC09A_0011" + /note="HMMPfam hit to PF02350, UDP-N-acetylglucosamine + 2-epimerase, score 1.4e-181" + gene 9432..10571 + /gene="wzy" + /locus_tag="SPC09A_0012" + CDS 9432..10571 + /gene="wzy" + /locus_tag="SPC09A_0012" + /note="member of homology group 83" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI32973.1" + /db_xref="InterPro:IPR007016" + /db_xref="UniProtKB/TrEMBL:Q8KWP5" + /translation="MIKRKIYIICVLLSYFLPSFFTVGSMATIFTLLSTVIRLFVTIY + HVPKVFSQYKVTLIDILVVLFLFFQVFVGVQSQTVNLNYIGGQFFFLGLYSFLKYFLL + FDCKTTIESLFLTFILFLCVQVITQLLFPVGFDSLYPTGDNRLYFLGRKNIATPYIIV + GLGSFYLLNKKMNEFISLKEIIFLGLFGILSFLTQSSTAIICYVLFIFMRMLGLKENI + GKPYSLVSITVYICFSFSIIFSQSTILSTFTAIFSKNATFSGRINIWQLAIRIFEENF + WFGKGLNIDFNAWTNGIIVNSAHNTLLDILARTGIFPGILFVVVLLSLFLGKYRVKSK + TLLTMLISFMVYITMEATSVSILLLIIAICVYWSFGEEKLYEQVT" + misc_feature 9432..9506 + /gene="wzy" + /locus_tag="SPC09A_0012" + /note="Signal peptide predicted for SPC0289 by SignalP 2.0 + HMM (Signal peptide probability 0.955) with cleavage site + probability 0.276 between residues 25 and 26" + misc_feature 10194..10379 + /gene="wzy" + /locus_tag="SPC09A_0012" + /note="HMMPfam hit to PF04932, O-Antigen Polymerase, score + 1e-07" + gene 10555..11424 + /gene="wcjB" + /locus_tag="SPC09A_0013" + CDS 10555..11424 + /gene="wcjB" + /locus_tag="SPC09A_0013" + /note="member of homology group 84" + /codon_start=1 + /transl_table=11 
+ /product="putative glycosyl transferase" + /protein_id="CAI32974.1" + /db_xref="GOA:Q8KWP4" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q8KWP4" + /translation="MSKLLNAIYYRLFGLYKKIYLQVFSKKTINILGEKANLENELIV + SFTTIPSRLNYLPSMIKSIFNQTIIPNRFIMYVYKDEFEGINLESILETEIKNGLEIV + YVDENLRSHKKYFYAMKDNPNSIVILVDDDTVYSSNTIEKLVASYRKYPSCISAMRCH + RIKLLTDGSLAPYNEWEYEFFGDIKPSYFNFFTGCGGVLFPPTARTDEFFNISNIMNL + SYLADDVWLNFLAIKNRIKIVKATRCKGTPLTIDDNPEESLVYLNAIYDNNNDRCIKN + MVDFYHIDFSEVD" + gene 11424..12848 + /gene="wzx" + /locus_tag="SPC09A_0014" + CDS 11424..12848 + /gene="wzx" + /locus_tag="SPC09A_0014" + /note="member of homology group 85" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI32975.1" + /db_xref="GOA:Q8KWP3" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q8KWP3" + /translation="MDISNKFKVGILYTALGKYSNVIIQLFVTAVLSRILTPEEYGVV + AVVNVFLVFFQILADSGIGPAIVQNKTLTQNDLNDIFTLTIYSGLILSFVFVLIGYPI + SIVYGNEVYIKLYSLLGMCVLFYTMTIVPQSILTRNMNFKRMNLLSLIANIFSGVIGV + VLAIHDFGVYSLIFSNIMKATILFFVFFSSVELSFKKKIEKTSLVKILNFSKFQFMFN + FLNYFARNLDNLLIGRFINPAALGYYDKAYQLSLYPNQILLQVISPVIHPIMSNFQND + RQKMEEVFAKIFNILLLIGMPISVYLFFNASDVITFMFGNNWFQSVPVFQILSASIWI + QMANSPIGIFYQASNRVDLLFKVGLLASGFNIIAIVIGLLSKSIVTIAAMLIISFIIG + LSLNLYVLSHVVFKNDIIKYLKIILVHLVTVIPYIIFNMIGFRFEQGVVINLVLQGLV + LGLIWSIGIFVTGQYKQLIMMFSR" + misc_feature 11442..12245 + /gene="wzx" + /locus_tag="SPC09A_0014" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 2.4e-21" + gene 12855..14048 + /gene="wcjC" + /locus_tag="SPC09A_0015" + CDS 12855..14048 + /gene="wcjC" + /locus_tag="SPC09A_0015" + /note="member of homology group 86" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI32976.1" + /db_xref="GOA:Q8KWP2" + /db_xref="InterPro:IPR001296" + /db_xref="InterPro:IPR009695" + /db_xref="UniProtKB/TrEMBL:Q8KWP2" + /translation="MKILFVNMFYNEEGGAQKSTKFLAEQLVKEGHEVFAYSDDAIDS + 
DIEEVINGVKVFRRRTPLFSLHYIFSAKKNPAKHFFYKIFETYNVFAKKKFIDIIEEI + QPDIVHFNTISGMSLSIVKEAKKRNIRTIWTLRDYWLEYPWGEKDIALIKLLNRIYRP + FVKKSLKHLDIVTAPSAFTLNNFINKGFINPSSQKCMAIENAVIFSKSKLENIIKRKQ + ETKRNPEKTNFLFVGSILEIKGVFNLVMAFKKLTNPEISLKIVGKGKDLEKLQKEIES + DPRIQYLGFQDTKNLYETYQNSDVLVVPSAWDEPFGRVVIEGNANGLPVITSDRGGLP + EIVQTVGGGEVFTDKSGNTLYSILKKFVEMENYNVYYRCILENIDIYSIEKQSEKFIS + LYREG" + misc_feature 13491..13988 + /gene="wcjC" + /locus_tag="SPC09A_0015" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 1.2e-30" + gene 14049..14714 + /gene="wcjD" + /locus_tag="SPC09A_0016" + CDS 14049..14714 + /gene="wcjD" + /locus_tag="SPC09A_0016" + /note="member of homology group 145" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI32977.1" + /db_xref="GOA:Q8KWP1" + /db_xref="InterPro:IPR011004" + /db_xref="UniProtKB/TrEMBL:Q8KWP1" + /translation="MQVRHLLTYLISLPKTIFFNFKCLPINQAIHLPILVAYNVKLLN + LKKNVIGIETVVKFGLVRIGFSGTEIISSNRSLINLRQGKVIFKGKSVITKGCTISVT + GGTIILGDNFYANRNCLISCTDRLIVGNNVLLGWNVILFDSAGHTLSYDGKKKIKMTE + EIVIGNHVWICAEAHLLKGSKIADGSVVAYSSLVTGYFAEKNCLIGGIPAKTLRKGVS + WEK" + gene complement(14840..16066) + /gene="tnp" + /locus_tag="SPC09A_0017" + /pseudo + CDS complement(14840..16066) + /gene="tnp" + /locus_tag="SPC09A_0017" + /note="member of homology group 146" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative ISIS116-IS110-IS902-like transposase" + misc_feature complement(15047..15379) + /gene="tnp" + /locus_tag="SPC09A_0017" + /note="HMMPfam hit to PF02371, Transposase + IS116/IS110/IS902 family, score 7.4e-11" + /pseudo + gene 16366..17598 + /gene="ugd" + /locus_tag="SPC09A_0018" + CDS 16366..17598 + /gene="ugd" + /locus_tag="SPC09A_0018" + /note="member of homology group 20" + /codon_start=1 + /transl_table=11 + /product="UDP-glucose 6-dehydrogenase Ugd" + /protein_id="CAI32979.1" + /db_xref="GOA:Q8KWP0" + /db_xref="HSSP:1DLJ" + /db_xref="InterPro:IPR001732" + /db_xref="InterPro:IPR008927" + 
/db_xref="InterPro:IPR013328" + /db_xref="InterPro:IPR014026" + /db_xref="InterPro:IPR014027" + /db_xref="InterPro:IPR014028" + /db_xref="InterPro:IPR016040" + /db_xref="InterPro:IPR017476" + /db_xref="UniProtKB/TrEMBL:Q8KWP0" + /translation="MKIAVAGTGYVGLSIAVLLAQHHEIKAVDIVAEKVELINQKKSP + IQDDYIEKYLVEKDLNLEATMDAKYAYEDAEFVVVAAPTNYDSKKNFFDTSAVEAVIQ + QVKKINPKAVIIIKSTIPVGFTESVRKKYQYKNILFSPEFLRESKALYDNLYPSRIIV + GTDLEDTYLKDKANIFASLLKEGAIKEDIDTLFMGVTEAEAVKLFANTYLALRVSYFN + ELDTYAEVKGLDAKAIIDGIGLDPRIGNHYNNPSFGYGGYCLPKDSKQLLANYFDVPQ + NMMTATVESNRTRKDFIAQRILEKAGVSETDSLDAFKNTQDIVIGIYRLTMKSNSDNF + RHSSIQGVMKRLKAKGVTVIIYEPTLKDGETFFGNKVVNNLDKFKEASNVIVANRFEP + SLEDVSNKVYSRDIFKRD" + misc_feature 16366..16986 + /gene="ugd" + /locus_tag="SPC09A_0018" + /note="HMMPfam hit to PF01210, NAD-dependent + glycerol-3-phosphate deh, score 0.00028" + misc_feature 16366..16920 + /gene="ugd" + /locus_tag="SPC09A_0018" + /note="HMMPfam hit to PF03721, UDP-glucose/GDP-mannose + dehydrogenase, score 2e-52" + misc_feature 16951..17232 + /gene="ugd" + /locus_tag="SPC09A_0018" + /note="HMMPfam hit to PF00984, UDP-glucose/GDP-mannose + dehydrogenase, score 1.6e-35" + misc_feature 17326..17577 + /gene="ugd" + /locus_tag="SPC09A_0018" + /note="HMMPfam hit to PF03720, UDP-glucose/GDP-mannose + dehydrogenase, score 1.3e-05" + gene 17810..18843 + /gene="wcjE" + /locus_tag="SPC09A_0019" + CDS join(17810..18532,18532..18843) + /gene="wcjE" + /locus_tag="SPC09A_0019" + /note="member of homology group 18" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI32980.1" + /db_xref="GOA:Q8KWN9" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q8KWN9" + /translation="MKSIGKRINWIDFGKGFAIFSVLVGHVLMGLYESNIFSIANDVL + LLLITQIYIFHIPVFFALSGYFFRPVSDMKEFWHYAKKKTIILGIPYVFYSIIHFCLQ + KVAGASVRVPTTIFNLLNIYKFPLGVSWYLYTLWSILIVYGLLSVVFKNRKSLLLVSV + FAYIFTLFIQTDIFIVQRTLVWGVCFCLGSVLSAIHFDKINLKKFLFFFVLFDFIYMF + AWFLFYEVGSKKDYVSYSNPGLWGIAFIVCVLVAFAIFPKMEKNFPKTFLYFTKYGKD + 
SLGIYILHAPICSMIRILMLKVGINSVFLHVVVGIVLGWYLSILATYILKKIPFLNIV + LLPQKYIKLK" + misc_feature join(17831..18532,18532..18804) + /gene="wcjE" + /locus_tag="SPC09A_0019" + /note="HMMPfam hit to PF01757, Acyltransferase family, + score 6.5e-05" + gene complement(order(18887..19471,19525..20193)) + /gene="tnp" + /locus_tag="SPC09A_0020" + CDS complement(join(18887..19471,19525..20193)) + /gene="tnp" + /locus_tag="SPC09A_0020" + /note="member of homology group 13" + /codon_start=1 + /transl_table=11 + /product="putative IS1167 transposase" + /protein_id="CAI32981.1" + /db_xref="GOA:Q4K2L1" + /db_xref="InterPro:IPR002560" + /db_xref="InterPro:IPR012287" + /db_xref="UniProtKB/TrEMBL:Q4K2L1" + /translation="MEQLHFITKLLDIKDPNIQILDIINKDTHKEIIAKLDYDAPSCP + ECGNQLKKYDFQKPSKIPYLETTGMPTRILLRKRRFKCYHCSKMMVAETSIVKKNHQI + PRIINQKIAQKLIEKISMTDIAHQLSISTSTVIRKLNDFHFKHDFSCLPEIMSWDEYA + FTKGKMSFIAQDFNNLNIITVLEGRTQAVIRDHFLKYDRAVRCRVKIITMDMFSPYYD + LAKQLPNAKIVLDRFHIVQHLSRAMSRVRVQIMNQFHRKSHEYKAIKRYWKLIQQDSR + KLSDKRFYRPTFRMHLTNKEILNKLLSYSEDLKHHYQLYQLLLFHFQNKEPEKFFGLI + EDNLKQVHPIFQTVFKTFLKDKEKLVNTLQLHYSNAKLEATNNLIKLIKRNAFGFRNF + ENFKKRIFIALNIKKERTKFVLSQA" + misc_feature complement(join(19391..19471,19525..19737)) + /gene="tnp" + /locus_tag="SPC09A_0020" + /note="HMMPfam hit to PF01610, Transposase, score 6.7e-44" + misc_feature complement(19777..19842) + /gene="tnp" + /locus_tag="SPC09A_0020" + /note="Predicted helix-turn-helix motif with score + 1860.000, SD 5.52 at aa 118-139, sequence + ISMTDIAHQLSISTSTVIRKLN" + gene 20491..>20538 + /gene="aliA" + /locus_tag="SPC09A_0021" + CDS 20491..>20538 + /gene="aliA" + /locus_tag="SPC09A_0021" + /codon_start=1 + /transl_table=11 + /protein_id="CAI32982.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ89" + /translation="MMKSSKLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaattact ataaatattt tttgcagaaa aatttaaaat tgaaatcata taaaaacaag + 181 
ggaggactgt ataaaaagca gaaatccttt gttttttata accaaggttt ataaactttc + 241 attctcgaaa ttcaattaac tttacaaatt cccactatta aggagaaaga agatgaacat + 301 aaagaagcgt gtccttagtg caggcctgac ttttgcatct gctttgcttt tagctgcttg + 361 cggccaatca ggttcagata caaaaactta ctcatcaacc tttagtggaa atccaactac + 421 atttaactat ctattagact attacgctga taatatagtc aattgaaaca agaacaagac + 481 aaaagagcct cgtaaaaggt attgcaactt ggtaatacct ttttgaggtg ctttttgata + 541 tgaacccatg ttttctcaat aggattgtac tcaggtgaat agggaggaag aggtaaaagt + 601 ttatgcccaa actcttcaca caagagttct agcttcccca ttctatggaa tcttgcatta + 661 tccataataa taaccgatgg tgtggttaat gttggtaaga gaaacttctg aaactaagct + 721 tcaaaaaagt cgctcgtcat cgtctcttcg taagtcattg gagcgattaa ttcaccattt + 781 gttagacctg caaccaaaga aattctctga tatcttcttc cagatacttt gcctcttctt + 841 aactgacctt ttaatgagcg accatattct cgataaaaat aagtatcgaa tcctgtttca + 901 tcaatctaaa caggtgctag gtgctttaaa ctattaaaat tcttaagaaa taaggctact + 961 ttttctgggt cttgttcata gtaggtgtgg ttcttttttt cgagtgtagc ccatagcttt + 1021 gagcgcatag tggatggtag ttggatgaca gccaaattca gaagctattt cagtcaaata + 1081 agcgtctgga ttgtcagtaa gatagttttt aagtctatct ctatcaactt ttcttggttt + 1141 tgttcctttt acttggtggt ttagctctcc tgttttctct tttagcttta accagccata + 1201 aatggtatta cgtgagattt ggaaaacgtg tgacgcttct gttatactat ctgttcgctc + 1261 acaataagag agaacttttt tacgaaaatc tattgaatat gccataaaaa gattatacca + 1321 cattgtgtac tatattagat tgaaactaga atagtacaca tctgcttcta aaacattgtt + 1381 agaaatcgat ttgactgtcc ttatttcatt ttattatatt tttggttcgc gggaagtcta + 1441 ctaagatact taaagatgca gatagtaaaa aaaatgtaga cattaccgta aaaaagtgat + 1501 ataatcgtat gatgttcaag gtataggtgt taatcatgag tagacgtttt aaaaaatcag + 1561 gttcacagaa agtgaagcga agtgttaata tcgttttgct gactatttat ttattgttag + 1621 tttgtttttt attgttctta atctttaagt acaatatcct tgcttttaga tatcttaacc + 1681 tagtggtaac tgcgttagtc ctactagttg ccttggtagg gctactcttg attatctata + 1741 aaaaagctga aaagtttact atttttctgt tgctgttctc tatccttgtc agctctgtgt + 1801 cgctctttgc agtacagcag tttgttggac 
tgaccaatcg tttaaatgcg gcttcgaatt + 1861 actcagaata ttcgatcagt gtcgctgttt tagcagatag tgagatcgaa aatgttacgc + 1921 aactgacgag tgtgacagca ccgactggga ctgataatga aaatattcaa aaactactag + 1981 ctgatatcaa gtcaagtcag aataccgatt tgacggtcaa ccagagttcg tcttacttgg + 2041 cagcttacaa gagtttgatt gcaggggaga ctaaggccat tgtcctaaat agtgtctttg + 2101 aaaatatcat cgagtcagag tatccagact acgcatcgaa gataaagaag atttatacca + 2161 agggattcac taaaaaagta gaagctccta agacgtctaa gaatcagtct ttcaatatct + 2221 atgttagtgg aattgacacc tatggtccta ttagttcggt gtcgcgatca gatgtcaata + 2281 tcctgatgac tgtcaatcga gataccaaga aaatcctctt gaccacaacg ccacgtgatg + 2341 cctatgtacc aatcgcagat ggtggaaata atcaaaaaga taaattaacc catgcgggca + 2401 tttatggagt tgattcgtcc attcacacct tagaaaatct ctatggagtg gatatcaatt + 2461 actatgtgcg attgaacttc acttctttct tgaaattgat tgacttattg ggaggggtag + 2521 atgttcataa tgatcaagag ttttcagctc tacatgggaa gttccatttc ccagtaggga + 2581 atgtccatct agactctgag caagctctag gttttgtacg tgaacgctac tcactagccg + 2641 atggagaccg tgaccgtggt cgcaaccaac aaaaggtgat tgtggctatc cttcaaaaat + 2701 taacgtcaac cgaagcactg aaaaattatg gtacgatcat taatagcttg caagattcta + 2761 tccaaacaaa tatgccactt gagaccatga taaatttggt caatgctcag ttagaaagtg + 2821 gagggaatta taaagtaaat tctcaagatt taaaagggac aggtcggatg gatcttcctt + 2881 cttatgcaat gccagacagt aacctctatg tgctggaaat agatgatagt agtttagctg + 2941 tagttaaagc agctatacag gatgtgatgg agggtagatg aaatgataga catccattcg + 3001 catatcgttt ttgatgtaga tgacggtccc aagtcaagag aggaaagcaa ggctctcttg + 3061 gcagaatcct acaggcaagg ggtgcgaacc attgtctcta cctctcaccg tcgcaagggc + 3121 atgtttgaaa ctccggaaga gaagatagca gaaaactttc ttcaggttcg ggaaatagct + 3181 aaggaagtgg cgagtgactt ggtcattgct tacggggctg aaatttacta cacaccagat + 3241 gttctggata agctggaaaa aaagcggatt ccgaccctca atgatagtcg ttatgccttg + 3301 atagagttta gtatgaacac tccttatcgc gatattcata gcgccttgag caagatcttg + 3361 atgttgggag ttactccagt cattgcccac attgagcgct atgatgctct tgaaaataat + 3421 gaaaaacgcg ttcgagaact gatcgatatg ggctgttaca cgcaagtaaa 
tagttcacat + 3481 gtcctcaaac ccaaactttt tggcgaacgt tataaattca tgaaaaaaag agctcagtat + 3541 tttttagagc aggatttggt tcatgtcatt gcaagtgaca tgcacaatct agacggtaga + 3601 cctcctcata tggcagaagc atatgacctt gttacccaaa aatacggaga agcgaaggct + 3661 caggaatttt ttatagacaa tcctcgaaaa attgtaatgg atcaactaat ttaggagaaa + 3721 tgatgaaaga acaaaacacg atagaaatcg atgtatttca attatttaaa accttgtgga + 3781 aacgcaagct aatgatttta atagtggcac ttgtgacagg tgcgggggct tttgcatata + 3841 gcacttttat tgttaagcca gaatatacga gtaccacgcg aatttacgta gtgaatcaca + 3901 atcaaggaaa caagctgggg ctgacaaatc aggatttgca ggcaggttct tatctggtaa + 3961 aagactaccg tgagattatc ctttcgcagg atgtattgga aaaagtagcg acaaatttga + 4021 agttggatat gccagcaaaa acgttagcca gcaaagttca agtgactgta ccagatgaca + 4081 ctcgtatcgt ctcaatctct gtcaaggata aacagccaga ggaagccagt cgtatcgcta + 4141 attctctacg agaagttgct gcagaaaaga tcgtcgctgt aacgcgagta tctgatgtaa + 4201 cgacacttga agaagcgcga ccagctacga ctccctcttc tccaaatgtt cgacgcaatt + 4261 ccttgtttgg ttttcttgga ggagtagtcg taacagtaat tgctgttctt tttattgagt + 4321 tgctcgacac ccgtgtgaaa cgtcctgaag atgttgaaga tgtactgcaa attccacttt + 4381 tagggctcgt tccagatttg aacaaaatga aataggagga agttatgcca acgttagaaa + 4441 tctcacaggc aaaattggat tttgtaaaaa aggcagagga atattataac gctttgtgca + 4501 cgaacctaca gttaagtgga gatggtttga aagtattttc tatcacttct gtgaaactag + 4561 gagaaggaaa atcaacgact tccatcaata tcgcttgggc ttttgcgcgt gcaggttaca + 4621 aaacgctgct gattgatgga gatattcgca attctgttat gttaggtgtc tttaaagcaa + 4681 gggataagat tacaggcctg acagaatttt tatcaggaac tacagaccta tcacaagggc + 4741 tttgtgatac caatatcgaa aatctctttg taattcaggc tggctctgtg tcaccgaatc + 4801 cgacagctct tcttcaaagt aagaatttca gtacaatgct tgaaaccttg cgtaaatatt + 4861 ttgactacat cattgtagat actgctcctg tcggtgtcgt gattgatgcg gctattatta + 4921 cgcgaaaatg cgatgcttct attttagtga cggaggcagg tgaaataaat cgacgggata + 4981 ttcaaaaagc aaaagaacag ttggaacaca cagggaagcc gtttttggga attgtgttga + 5041 ataaattcga tacttcagta gaccaatacg gttcttatgg aaattatgga gattacggga + 5101 aaaataaaaa 
ataggtcggg ggatagagat gaatgggaaa atattaaggt cttcattggc + 5161 cataatccag agttttcttg ttattttatt gacttatcta cttagtgctg tgagagaagc + 5221 ggagattgtt tcaacaacag ctattgcact ttatatccta cattattttg tcttttatat + 5281 cagtgattat ggacaggctt tctttaaaag gggatatttg attgaacttg tccagacatt + 5341 gaaatatatc ctattctttg cactagcgat tagtatttct aattttttct tagaggatcg + 5401 atttaatatt tccagacgag gcatgattta cttcctcaca ttacatgctc tcttggtcta + 5461 tgtgctaaac ctatttatca agcggtattg gaagcgggct tatcccaact ttaaaggaag + 5521 taagaagatt ctcctactta cagcaacttc tcgtgtcgaa aaggtactgg atagattaat + 5581 agaatcaaat gaggttgttg gggagttgat agccgtcagt gtcttagata aaccagattt + 5641 tcagcatgat tgtttaaagg tagtagcaga gggggagata gtaaactttg cgactcatga + 5701 ggtggtcgat gaagtcttta tcaatcttcc aagtgaaaaa tacaatattg gagagcttgt + 5761 ctctcagttt gaaacgatgg gaattgatgt aacagtcaat ctaaatgctt ttgatcgtag + 5821 tttggcacgt aacaagcaaa ttcgtgagat ggcaggatta aacgttgtga ctttttctac + 5881 aacattttat aagactagtc atgtaattgc taagcggatt attgatatcg tgggtgcatt + 5941 tgtagggctg atattatgtg gtttagttag tattgtactg gttcctttga ttcgaaagga + 6001 tgggggctct gctatttttg ctcagacgcg tataggaaaa aatggtcgtc agttcacttt + 6061 ttataagttt cgctctatgt gtgtagatgc cgaggcgaaa aaaagagaac tcatggaaca + 6121 aaataccatg cagggtggaa tgtttaaggt ggacgatgat cctcgtatca cgaaaattgg + 6181 tcgttttata cggaagacta gcttggacga gctaccacag ttttataatg ttctaaaggg + 6241 agatatgagt ttggttggca cacggccacc aacagtggac gagtatgaac actatacccc + 6301 agaacaaaaa cgtcggctaa gttttaaacc tggtataaca ggcttatggc agatcagtgg + 6361 acgaagtgag attaagaatt ttgatgaagt tgtcaaatta gatgtggcct atattgatgg + 6421 ttggacaatc tggaaagata ttgaaatttt gcttaaaact gttaaagttg tatttatgag + 6481 agatggagcg aagtaattca tatgaatgag agaatgcaaa tattaggaat tattatagat + 6541 ccattaacga tgaaagaaac agtggatgct gttgaacagt atgttttaaa gaagcatcct + 6601 ttgcacttga tgggagttaa cgcagataaa attaatcagt gccatgaaga tgagaaaatc + 6661 aaaaaaatcg ttaatgaatc aggaatcatt aatgcggatg gagcatcagt tgttcttgca + 6721 agtaagtttt taggaacgcc tgttcctgaa 
cgagtagcgg gtattgattt gatgcaatgt + 6781 cttttagagt tgtcaaataa aaaaggatat tcagtttact tttttggagc caaagaagaa + 6841 attttacaag atatgctaaa agtttttaaa caaagatatc ctaatcttaa tgttgttggc + 6901 tatagaaacg gatatttttc acctgaagat gaaaaaaaga ttcaggaaga tattaaagga + 6961 ggcaaaccag attttgtatt tgtagggatt acttctccta aaaaggaata tatcatccaa + 7021 tcattcatgg ataatgggat taatgctgtc tttatgggtg ttggtggcag ttttgatgta + 7081 ttatcaggac acattaaacg agctccatta tggatgcaaa aattgaatct ggaatggttg + 7141 ttccgtgtag ttaatgaacc caaacgtctt tttaagcgtt attttgtagg gaatgttact + 7201 tttattaagc gagttttaga tgaaaagcga aaatcaaaaa aataatattc tacatatttc + 7261 tcgtacaatg gatattggtg gtgcagaacg tattgtatat caattgagtt ctgatttgaa + 7321 agatgaattt gatagtgtcc atgtcgcttc aacaggtgga ctatgggaga gcaaactttt + 7381 atcaaaagga gttcaacatc ataaaatttt agatgttgac agtaagaatc ccctaactat + 7441 ggtaaagatc ctttcaagtt tttatagaat tatcaaaaat aatgatatta ccattgttca + 7501 cactcatcat cggatggctg ccttttatat tcgcttgttg aaaatcatta atcctaagtt + 7561 gatacatgtt tacactgcac ataatgtatt taaaaataaa ttaccattat acaaattttc + 7621 cttaaaaaaa gcgtattgtg tagctgtggg taaagcggtt aatgataatt tgaaacatga + 7681 tgtaggaatc agtgatagta cagtaatcta taatggggtt gtttttgaaa aaactgataa + 7741 gctagttgat gagattgtaa attataacgg aatcaaattg gggtgtattg ctaggttatc + 7801 agagcaaaaa ggattgacct acctaattga tgcgatgtct ttagtgaaac acagggatat + 7861 tacattgttc attgtcggag atggagagct tcgagatgaa cttgaaaaca aggtgaaaca + 7921 attaaatctt caaaaatcag tgatattttt aggttatcga aaagatgttg ttgaatgtat + 7981 caatagtttt gattacttag tgtcatcatc tttatatgag gggttggctc taaatgtaat + 8041 tgaagcattt atgaatggga aaacgatggt tgcatcagat atccccggaa taaatgaagt + 8101 agtcaataac aaaaatggga ttcttgttcc tgttaaggat gatgttgcct tagcgagagc + 8161 gattgaaaag cttgcgactg acaaaaaact tagagaaaaa ctcgcttatc aagcaaaaaa + 8221 agactatgag acaaaattta attattcctt gtttttggat aattatcgga gactttatag + 8281 aaaattaacg ggagaatcaa aatgaaaaaa gtcatgttgg tttttgggac acgtccagag + 8341 gctattaaaa tgtgtcccct agtaaatgaa ctgaaacaaa atgattcaat 
caagacactt + 8401 gtgtgtgtaa ctggtcaaca taaggaaatg ctagagcagg ttttggaggt gttcaaggtt + 8461 gtcccagatc atgatttggg tatcatgaaa gcaaatcaaa ccctattttc cattacgatt + 8521 agtattttgg ataagattca agcagttcta gaacaagaaa tgcctgatat cgttcttgtt + 8581 catggagata caacaacaac atttgcgaca gctttggcag cattttatat gggaatcaaa + 8641 gtgggacacg tcgaagccgg tctcagaacc cacaatctcc aaagtccatt tccagaggag + 8701 ttcaatcgcc agacgacttc tatcattgcc gactatcatt tcgcgccgac tgaagttgca + 8761 aaggaaaatc tactaagaga gggcagaaaa aatatctttg tgacgggaaa tacagtcatt + 8821 gatgctttga agacgactgt tcaatgcaac tatcatcacc caattttgga atgggcaaag + 8881 ggtagtaagt taatcatgct aacggctcat cgacgagaaa atcttgggga accgatggaa + 8941 aacatgttta atgctgttaa tcgaatttta gacgaatttg aagatgtaaa agttgtatat + 9001 cccatccata aaaatcctaa ggttcgagag ttggcaagta aagtttttgg cgataatgaa + 9061 cgaatgaaga tcattgaacc gttagaagtt attgatttcc ataattttat ggatcaaagc + 9121 tatatgattt tgacagattc tggaggtgtg caggaagaag caccttcttt agggaaacct + 9181 gtcttagtga tgcgtgatac aacagagcgt cctgaaggag tcgctgctgg cacattgaag + 9241 ttggtaggta cagaagaaga gaatatttat aataacttta aacttcttct tgaggatgaa + 9301 acagaatata acaagatgag taaagctagc aatccttatg gagatggaat gacttgtaaa + 9361 cgggttgttg atattattct ggaagtataa aaataattca attatgaatg aggaaagaat + 9421 aaattagatt gatgataaaa agaaaaatat atataatctg tgtattactg tcgtattttt + 9481 tacctagttt ttttacagtt ggatcaatgg caactatatt taccctactc tccacagtaa + 9541 ttaggctatt cgtaactata tatcatgttc ctaaagtttt ttcacagtat aaggtaacgc + 9601 tgattgacat tttggttgtt ctgtttttgt tttttcaagt gtttgtgggg gttcaaagtc + 9661 agacagtgaa tcttaactat attggaggac agtttttctt tttaggatta tattcatttt + 9721 tgaaatactt tttattgttt gattgtaaaa caacaattga aagcctcttt ttaaccttta + 9781 tcttgttttt gtgtgttcaa gtaataactc aattgctttt tccggttggt ttcgactctt + 9841 tgtaccctac aggagataat agactttact ttttaggaag aaaaaacata gccaccccat + 9901 atatcattgt tggattaggt agtttttact tattaaataa aaaaatgaat gagtttatat + 9961 cactaaagga gattattttt ttaggattgt tcggaatttt atcattttta acacaatcca + 10021 
gtacagcgat tatatgttat gtgcttttta tttttatgcg tatgttaggt ttaaaggaaa + 10081 atataggaaa accatattct ttagtcagta taactgtgta tatttgtttt agtttttcta + 10141 taattttttc acaaagtaca attttatcaa cttttacagc aattttttcc aaaaatgcaa + 10201 ccttttcagg acgtatcaat atttggcagt tagcgattcg tatttttgaa gaaaattttt + 10261 ggtttggaaa aggacttaat attgatttca atgcttggac aaatgggatt atcgttaact + 10321 ccgcacacaa taccttacta gatatacttg ctcgaacggg tatatttccg ggtattttat + 10381 ttgtagtggt tcttctaagt ctatttcttg gaaaatatag agtaaaatca aaaacgctac + 10441 tgacaatgtt gatttcattc atggtttata ttacgatgga ggctacatct gtaagtattc + 10501 ttctattaat aattgctatt tgtgtgtatt ggtcttttgg agaggagaag ttatatgagc + 10561 aagttactta atgcaatcta ttatcgacta tttggattat ataaaaaaat ttatctacaa + 10621 gtttttagta aaaaaacaat taatatttta ggtgaaaagg ctaatttaga aaatgaacta + 10681 attgtttcgt ttacaacaat tccaagccgt cttaattatt taccaagtat gattaaaagt + 10741 attttcaatc agacaattat ccctaaccgt tttattatgt atgtttataa agatgaattt + 10801 gaaggtatta atttggagag tatcctagaa actgaaatca aaaatggttt ggaaattgtc + 10861 tatgtggacg aaaatcttcg ctcgcataaa aaatattttt atgctatgaa ggataatccg + 10921 aatagtattg taattttggt tgatgatgac actgtctatt catcgaatac catcgaaaag + 10981 ttagttgctt cttacaggaa atacccaagt tgtatttcgg caatgcgatg tcatcgaatt + 11041 aaactgctta ctgatggaag tctggcacca tacaatgagt gggaatatga atttttcggt + 11101 gatattaaac catcttactt taatttcttt acaggttgtg gaggagtact ttttcctcct + 11161 actgctcgaa cagatgaatt ttttaatatt tctaatataa tgaatctcag ttatttagct + 11221 gatgatgtat ggttgaattt tttagcaata aaaaatagaa ttaaaatagt aaaagcaaca + 11281 cgatgtaagg gaacaccatt aactatagat gacaaccctg aagagagttt ggtgtatctg + 11341 aatgctatat atgataataa taatgatagg tgtatcaaga atatggtaga tttttatcat + 11401 attgattttt cagaggttga ttaatggata taagtaataa gtttaaggta ggtatcctat + 11461 atactgcttt aggtaagtat tctaatgtta taattcaatt atttgtaacg gcggtattaa + 11521 gtagaatatt aacacctgaa gagtatggcg ttgtagcggt tgtcaatgtg tttttagtat + 11581 tctttcagat attggcagat tcgggaatag gacctgcaat tgtacaaaat aagacattaa + 11641 
ctcaaaatga tttaaatgat atttttactt taacaattta ttcaggttta attctttcgt + 11701 ttgtttttgt attgataggc tatccaatta gtatagtcta tgggaatgaa gtctatatca + 11761 aactgtactc attattaggt atgtgtgtac tattttatac tatgacaatt gttcctcagt + 11821 caattttaac aagaaacatg aactttaaac ggatgaactt attgagtctg attgccaata + 11881 tttttagtgg agttattggt gttgtgctgg ccatacatga tttcggggta tattctctga + 11941 ttttttctaa tattatgaag gctactatat tattttttgt ttttttttca agtgttgagt + 12001 tgagttttaa gaaaaagata gagaaaactt cgttagttaa aattctaaat ttttctaagt + 12061 ttcaatttat gtttaatttt ctaaactact ttgcaagaaa tttagacaat ctcttgattg + 12121 gtagattcat taatcccgct gcgttgggtt attatgataa ggcttaccag ttatcattat + 12181 atcctaatca gattttattg caggtgattt cacctgtaat tcatccgata atgtcgaatt + 12241 ttcaaaatga tagacaaaaa atggaagaag tttttgcaaa aatttttaat attctacttt + 12301 taataggaat gccaatctca gtgtatttgt ttttcaatgc aagtgatgtg ataacattta + 12361 tgtttggaaa taattggttt cagagcgttc cagtatttca aatactatct gctagcatct + 12421 ggattcaaat ggctaatagt ccaataggaa ttttttatca agcttcgaat cgtgttgatc + 12481 tgttatttaa ggtaggatta ttagcgtcag gatttaatat tatagctatt gtgatagggc + 12541 tattatcgaa aagtatagtg acaattgctg ctatgttaat tatttcattt ataatagggc + 12601 tatcactgaa tctctacgtt ttatcacatg tagtctttaa aaatgatata attaaatatt + 12661 taaaaataat tttagttcac cttgtaacag ttatcccata tattatattc aatatgattg + 12721 gctttagatt tgaacagggt gtagttatca atcttgtgtt gcaaggactg gtattgggac + 12781 taatttggtc tataggaata tttgtaacag gtcaatacaa gcagttaata atgatgttta + 12841 gtaggtgaaa atttatgaaa attttatttg tgaatatgtt ttacaatgaa gaaggaggag + 12901 cacaaaagag caccaaattt ctagctgaac aacttgtaaa agaaggacat gaggtatttg + 12961 catactctga tgatgctatt gattcagata ttgaggaagt tattaatggg gttaaggttt + 13021 ttagaagaag aactccgctt tttagtcttc actatatttt cagtgccaag aagaatccag + 13081 ctaaacattt tttctataaa atatttgaaa cctataatgt atttgcgaaa aaaaaattta + 13141 tcgatatcat tgaggaaata caaccagata ttgttcattt taatacaatt tcaggaatgt + 13201 ctttatcaat agttaaagaa gctaaaaaga gaaatatcag aaccatttgg accttgcgag + 13261 
actattggct agaatatcca tggggggaga aagatattgc tcttattaaa ctgctaaata + 13321 gaatatatag accttttgtt aagaaaagtt taaaacactt agacatagta acagcacctt + 13381 cagcatttac cttgaataat tttatcaata aaggatttat taacccatct tctcaaaaat + 13441 gtatggccat tgaaaatgct gttatatttt caaagagtaa attggaaaat attatcaaac + 13501 gaaagcaaga aacaaaaaga aatccagaaa aaacgaattt tctttttgta ggctctatac + 13561 ttgaaataaa gggcgttttt aacttagtaa tggcttttaa aaaactaact aatccagaaa + 13621 tttctttgaa aattgtagga aaaggaaaag atttagaaaa acttcaaaaa gaaatcgaaa + 13681 gtgatcctag aatacaatat ttaggctttc aagatacaaa aaacctctat gaaacttatc + 13741 aaaattcgga tgtattggtc gttccatcag cttgggatga accgtttggt agagttgtaa + 13801 ttgaaggaaa tgcaaatggc cttccggtca tcacttcaga tagaggtgga ttacctgaaa + 13861 ttgtgcaaac agtaggagga ggggaagttt ttacagacaa atcgggaaat acattatata + 13921 gtattttaaa gaaatttgta gaaatggaaa actacaatgt ctattaccga tgcattcttg + 13981 agaatattga tatttattct atcgaaaaac aaagtgaaaa gtttataagt ttatataggg + 14041 agggatagat gcaggttcga catttattaa cttatctgat ttcgctacct aaaacaatct + 14101 tttttaattt taagtgttta ccaattaatc aggcaattca ccttccaata cttgtagcat + 14161 ataatgtcaa gttgttaaat ttgaaaaaga atgtaattgg tatagaaact gtagtaaaat + 14221 ttggtttagt tcgaattggt ttctcaggta cggagataat atcctctaat cgatcgctca + 14281 taaacttgag acaaggaaaa gttattttta aagggaagtc agtgatcaca aaaggttgca + 14341 caattagtgt tacaggagga accatcattt tgggcgataa cttttatgcg aatagaaatt + 14401 gtcttatatc atgtactgat aggctcattg ttggtaataa tgtactttta ggttggaatg + 14461 ttattctttt tgactcagct ggtcatacac taagctacga tggtaagaaa aagataaaaa + 14521 tgacagaaga aattgtaatt ggtaaccatg tatggatttg tgctgaagca cacttattga + 14581 aaggaagtaa gattgcagat ggttctgtag tagcttattc tagtttagtt acaggttatt + 14641 tcgcagaaaa gaattgcttg attggaggaa tacctgcaaa aacacttaga aaaggagtaa + 14701 gttgggaaaa gtaactttat tttattgatt caaaatatta gaggtggaag tttgaaaaaa + 14761 ataaaagtta gttgattgat tacttctcta aattttgggc acactaaaaa gaggtcttga + 14821 cacctaaact ttaaaattaa agcatattga atccgcgctg ctgtgcgaag cgaatagcgt + 14881 
cttggacgga cattgtctta tctggatttc ttatttctgt aaggccttgt aatcttggat + 14941 tataactctc ctgttttagg aatacatggt agatggcaac caataatctg cgacagatag + 15001 cgatgatagc ttttcgatga ccacgtcgtt tcttgagttt gagatattta tttcgtagtt + 15061 caggatgctt ctctgattta accacggcat tagctatttg aacaagaaaa ggtttgagat + 15121 agtgaccgcc tttcgaaata cgagtagaga atttctttcc tgcactttca ttgttggcag + 15181 gaactaatcc gccccaagaa tagagtttac ctgcagtacc aaagacagtc atatcagctc + 15241 cgatttcaga gagtattctg agggcagata gttcctcttt gaaaccaggc acagtttgga + 15301 tcagtttgac ctgttcttgg tattcgtgac cgagcttccg aatcatggtt tctaaatctt + 15361 ctttacagac ggcaagagca tcatagtgtt ccttgatgat tctgattttc tcagcttgtt + 15421 caggtgtcac ctccccctca atagcgattt tcaagtcttg caccttatcc ttcattctct + 15481 tgtgaatcaa ctgttcaatg tttggtttgt cctctggatt gtcaaggatg ctctgaataa + 15541 tagcctgagc actttttccg aacacgtcgg aaacgacact tgcaatctga aggttagacc + 15601 aagtcagaca gttctggtaa cgatttttct cgctgacttg aagttgtgtt aatttcatgc + 15661 gatagcgaaa aaggtctcgg agttgtctga ttttaagagg gggaataaag ctagaagcaa + 15721 ccaaatcatg cttgaagagg tcggctatcc attgcgcatc tttcttgtcg gttttctttc + 15781 ctctgatagc cttgacatac ttagggtgag ctaagcaaat cttgcaggat ttttcaagga + 15841 tattgaagac aggaatccaa tatttactgg tagattccat acagacatca aatcaagaat + 15901 agtattctag ccaatctcgt agctgtacta acccatttgt aaaagttgag aaacgtttac + 15961 gatggtagct tgtgagtcct tgcttgtcgg tgatggtaac aaccgctaca acaaaggttt + 16021 tatgcacatc aatgccacaa caattaggat agataatttt taacatgagg ggtctccctt + 16081 caccaaattt gagtctgcct atcccttgac tattctttcc tttcacaaac gagtcgctta + 16141 ttcaattata agtttacgtg ctcttagtca cagttcttgt gcttgatgga aagaatgaca + 16201 cctataaata tgcgaggtag tggctgtacc actcacttat tcacctcccc gtgatttgta + 16261 atagtgatag gctttctcac tattattata aaccaaaata aagagcacaa cactttttca + 16321 tgctgtgttg tgccttgagt gaaacgaaag gaatgaatta taaatatgaa aatagcggta + 16381 gcaggaacag gttatgtagg attgtcaatt gccgtgttgt tggcacaaca tcacgaaata + 16441 aaagcagttg atattgttgc tgaaaaagtt gaattaatca atcaaaaaaa atctccaatt + 16501 
caggatgatt atattgaaaa atatttagtg gaaaaagatt taaatttgga agcaactatg + 16561 gatgctaagt atgcttatga agatgcagaa tttgttgttg ttgcagcacc aacaaattat + 16621 gattcgaaaa agaacttttt tgatacatca gcagtagagg cggtcattca acaagtaaaa + 16681 aaaattaatc ccaaagcggt aataattatt aaatctacaa tccctgttgg attcacagag + 16741 tccgttcgaa agaaatatca gtataaaaat atcctattta gtccagaatt tttacgcgaa + 16801 tctaaagcat tatacgataa cctgtatcca agtcgcatca ttgttggaac tgacttagaa + 16861 gatacttatt taaaagacaa agctaatata tttgcttccc tactaaaaga gggggctatt + 16921 aaagaagaca tagatacact tttcatggga gtaacggaag ctgaggcagt taaattattt + 16981 gccaatactt accttgcgtt gcgtgtttct tactttaatg aattggatac ttatgcagag + 17041 gtgaaaggtt tggatgcaaa agccattatt gatggtattg gcctagatcc acgtatagga + 17101 aatcattata acaatccatc ctttggctac ggtgggtatt gtttacctaa agatagtaag + 17161 cagttattag caaattactt tgatgtacca caaaatatga tgacggcaac tgttgaaagc + 17221 aatcgaacgc gtaaggattt tatcgctcaa cggattttag aaaaagctgg agtatctgag + 17281 actgatagtt tagatgcgtt taagaacaca caagatattg ttataggtat ttatcgttta + 17341 acaatgaaaa gtaattcgga taacttccgt cactcctcta ttcaaggtgt tatgaaacga + 17401 ttgaaagcta agggagttac ggttatcatc tatgagccaa ctttgaagga cggggaaaca + 17461 ttctttggta ataaagtggt aaataatcta gataaattta aagaagctag taatgttatt + 17521 gtagccaatc gttttgaacc ttcactagag gatgtgtcta ataaagttta tagtcgggat + 17581 atttttaagc gtgactaata aatatgtcca cgtgacgtaa tatctattaa atggataaaa + 17641 tattaataaa catggcatct atatcttttt ggggataata aaaggcatat gattatctaa + 17701 gttagtttat ataattaagc agttacgtca acttatttta ttatgaatta tatataacat + 17761 gaatatcatt attaaatgag cactaaatag ataacaagag gagaaataaa tgaaatcaat + 17821 cggaaagcga atcaattgga tagattttgg gaaaggattc gcaatatttt cagttctagt + 17881 aggacatgta ttgatggggt tgtatgaatc caatattttt tcaattgcaa atgatgtgtt + 17941 attattattg ataactcaaa tttatatatt tcacatacca gtgttttttg ccctgtcagg + 18001 atactttttt agacctgtat cagatatgaa ggagttttgg cattatgcta aaaagaagac + 18061 gattatttta ggtataccat atgtttttta ttcaattatt cacttttgtc ttcaaaaggt + 18121 
cgctggtgcc tctgtccgag tacccactac gatatttaac ctattgaata tctataaatt + 18181 tcctctggga gtttcatggt atctatatac gttatggtcg atattgatag tttatggttt + 18241 actatctgtt gttttcaaaa atcgtaagtc ccttttgtta gttagtgttt ttgcctatat + 18301 tttcacacta tttattcaaa ctgatatttt tattgtacaa cggacgttgg tttggggtgt + 18361 ttgcttctgt cttggcagtg tattgagcgc aattcacttt gataaaatta atttgaaaaa + 18421 atttcttttt ttctttgtgc tatttgattt tatttatatg ttcgcttggt ttttgtttta + 18481 tgaagtaggg tctaagaagg attatgtaag ctatagcaac ccaggtttgt ggggattgct + 18541 tttattgtct gtgtattagt tgcttttgcg atttttccta aaatggagaa aaattttcct + 18601 aaaactttcc tatatttcac taaatacggg aaagatagtt tagggatcta tattcttcat + 18661 gcaccaattt gtagcatgat tcggattcta atgttgaaag taggaataaa ctcagttttt + 18721 cttcacgttg ttgttgggat tgtgctaggc tggtatttat ccatactagc aacttatata + 18781 ttgaaaaaaa ttccattttt gaatattgtt ttattaccac aaaagtatat taaattaaaa + 18841 taaattattt tcggctcttt gtcaactgta gtgggttgaa aaaaagctaa gcttgagaaa + 18901 ggacaaattt tgtcctttct tttttgatgt tcagagcgat gaaaatccgt tttttgaagt + 18961 tttcaaagtt tcgaaaacca aaggcattgc gcttgataag tttgatgaga ttattggtcg + 19021 cttccagttt ggcgttagaa tagtgtagtt gaagggtgtt gacaagcttt tctttatctt + 19081 tgaggaaggt tttaaagaca gtctgaaaaa taggatgaac ctgcttaaga ttgtcctcaa + 19141 taagtccgaa aaatttctcc ggttccttat tctgaaagtg aaacagcaag agttgataga + 19201 gctgatagtg gtgtttcaag tcttccgaat aactcaaaag cttgtttaaa atctctttat + 19261 tggttaagtg catacgaaaa gtaggacgat aaaatcgctt atcactcagt ttacgactat + 19321 cctgttgtat gagcttccag tagcgcttga tagccttgta ttcatgagac tttcgatgaa + 19381 actgattcat gatttgaaca cgcacacgac tcatagcacg gctaagatgt tgtacaatgt + 19441 gaaagcgatc aagaacgatt ttagcattcg ggagtgaaac agtctgggag actgtttcag + 19501 cctgagccta gaaatttgaa agcgaagctg tttagccaag tcatagtaag gactaaacat + 19561 atccatcgta atgattttga cgcgacatcg gacggctcta tcatatttaa gaaagtgatc + 19621 tcggatgaca gcttgtgttc taccttcaag aacagtgatg atattgagat tgttaaaatc + 19681 ttgcgcaatg aagctcatct ttccctttgt aaaagcatac tcatcccaag acataatctc + 19741 
aggaagacaa gaaaaatcat gtttaaagtg aaaatcattg agcttacgaa taacagttga + 19801 agttgaaatg gaaagctgat gggcaatatc agtcatagaa atcttttcaa ttaacttttg + 19861 agcaatcttt tggttgatga tacgagggat ttggtgattc ttcttgacga tagaagtttc + 19921 agcgaccatc atttttgaac agtgatagca cttgaaacga cgctttctaa ggagaattct + 19981 agtaggcata ccagtcgttt caagataagg aattttagaa ggtttttgaa agtcatattt + 20041 cttcaattgg tttccgcact cagggcaaga tggggcgtcg tagtccagtt tggcgatgat + 20101 ttccttgtgt gtatccttat tgatgatgtc taaaatctgg atattagggt ctttaatgtc + 20161 tagtaatttt gtgataaaat gtaattgttc catatgattc tttctaatga gttgttttgt + 20221 cgcttttcat tataggtcat atgggacttt ttttctacac aaaaataggc tccataatat + 20281 ccatagggga tttacccact acaaatatta tagagcctta ttttagattt ataatgtgtc + 20341 tctttgtcaa ctaacatctg gagaggacaa tcactgtctt ctcctttttt gtcttttcag + 20401 aatataccaa attaacacaa aaattctgaa aattctgttg acaactttct gaaaagagtc + 20461 tataatggag agaaagtttt aaaggagaaa atgatgaaaa gttcaaaact acttgccctt + 20521 gcgggcgtga cattattg +// + diff --git a/public/res/serotype_genbank/serotype_9L.gb b/public/res/serotype_genbank/serotype_9L.gb new file mode 100644 index 0000000..4b57d4a --- /dev/null +++ b/public/res/serotype_genbank/serotype_9L.gb @@ -0,0 +1,807 @@ +LOCUS CR931646 17618 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain T9233/128/68 (serotype 9l). +ACCESSION CR931646 +VERSION CR931646.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 17618) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 
2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 17618) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..17618 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="T9233/128/68" + /db_xref="taxon:1313" + gene <1..137 + /gene="dexB" + /locus_tag="SPC09L_0001" + CDS <1..137 + /gene="dexB" + /locus_tag="SPC09L_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI32983.1" + /db_xref="UniProtKB/TrEMBL:Q4K2K9" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVEMTD + " + gene complement(281..1698) + /gene="tnp" + /locus_tag="SPC09L_0002" + /pseudo + CDS complement(join(281..418,418..1698)) + /gene="tnp" + /locus_tag="SPC09L_0002" + /note="member of homology group 17" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1202 transposase" + misc_feature complement(694..1194) + /gene="tnp" + /locus_tag="SPC09L_0002" + /note="HMMPfam hit to PF00665, Integrase core domain, + score 1.8e-21" + /pseudo + gene 1855..3300 + /gene="wzg" + /locus_tag="SPC09L_0003" + CDS 1855..3300 + /gene="wzg" + /locus_tag="SPC09L_0003" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI32985.1" + /db_xref="GOA:Q4K2K8" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K2K8" + /translation="MSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + 
LNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTETDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGTYKVNSQDLKGTDRMDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1855..1971 + /gene="wzg" + /locus_tag="SPC09L_0003" + /note="Signal peptide predicted for SPC0303 by SignalP 2.0 + HMM (Signal peptide probability 0.993) with cleavage site + probability 0.538 between residues 39 and 40" + misc_feature 2059..2406 + /gene="wzg" + /locus_tag="SPC09L_0003" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 5e-64" + misc_feature 2584..3027 + /gene="wzg" + /locus_tag="SPC09L_0003" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 8.4e-70" + gene 3302..4033 + /gene="wzh" + /locus_tag="SPC09L_0004" + CDS 3302..4033 + /gene="wzh" + /locus_tag="SPC09L_0004" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI32986.1" + /db_xref="GOA:Q4K2J1" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K2J1" + /translation="MIDIHSHIVFDVDDGPKSIEESKALLREAYNQGVRMIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTLDALEKLEKKEIPTLNDS + RYALIEFSMHTSYREIHAGLSNILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QINSYHVLKPKFFGEKYKFMKKRARYFLERDLVHVVASDMHNLDSRPPYMQQAYDIIA + KKYGAKKAKEFFVDNPRKIIMDQLI" + misc_feature 3305..3913 + /gene="wzh" + /locus_tag="SPC09L_0004" + /note="HMMPfam hit to PF02811, PHP domain, score 3.4e-38" + gene 4042..4734 + /gene="wzd" + /locus_tag="SPC09L_0005" + CDS 4042..4734 + /gene="wzd" + /locus_tag="SPC09L_0005" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis 
protein + Wzd" + /protein_id="CAI32987.1" + /db_xref="GOA:Q4K2K6" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K2K6" + /translation="MKEQNTLEIDVLQLFRALWKRKLVILLVAIITSSVAFAYSTFVI + KPEFTSTTRIYVVNRNQEEKSGLTNQDLQAGSYLVKDYREIILSQDVLEEVISDLELD + LTPKGLANKIKVTVPVDTRIVSVSVNDRVPEEASRIANSLREVAAQKIISITRVSDVT + TLEEARPAISPSSPNIKRNTLIGFLAGGIGTSVIVLLLELLDTHVKRPEDIEDTLQMT + LLGVVPNLSKLK" + misc_feature 4060..4476 + /gene="wzd" + /locus_tag="SPC09L_0005" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 1.1e-52" + misc_feature 4582..4659 + /gene="wzd" + /locus_tag="SPC09L_0005" + /note="PS00217 Sugar transport proteins signature 2." + gene 4744..5427 + /gene="wze" + /locus_tag="SPC09L_0006" + CDS 4744..5427 + /gene="wze" + /locus_tag="SPC09L_0006" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI32988.1" + /db_xref="GOA:Q4K2I9" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K2I9" + /translation="MPTLEIAQKKLEFIKKAEEYYNALCTNIQLSGDKLKVISVTSVN + PGEGKTTTSVNIARSFARTGYKTLLIDGDTRNSVISGVFKSREKITGLTEFLSGTADL + SHGLCDTNIENLFVIQSGSVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTAPIGIVI + DAAIITQKCDASILVTAIGEVNKRDVQKAKQQLEQTEKLFLGVVLNKLDISVDKYGVY + GSYGNYGKK" + gene 5443..6810 + /gene="wchA" + /locus_tag="SPC09L_0007" + CDS 5443..6810 + /gene="wchA" + /locus_tag="SPC09L_0007" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI32989.1" + /db_xref="GOA:Q4K2K4" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K2K4" + /translation="MDEKGLKIFLAVLQSIIVILLVYFLSFVRETELERSSMVILYLL + HFFVFYFSSYGNNFFKRGYLVEFNSTIRYIFFFAIAISVLNFFIAERFSISRRGMVYF + LTLEGISLYLLNFLVKKYWKHVFFNLKNSKKILLLTVTKNMEKVLDKLLESDELSWKL + 
VAVSVLDKYDFQHDKIPVIEKEKIIEFATHEVVDEVFVNLPGESYDIGEIISRFETMG + IDVTVNLKAFDKNLGRNKQIHEMVGLNVVTFSTNFYKTSHVISKRILDICGATIGLIL + FAIASLVLVPLIRKDGGPAIFAQTRIGKNGRHFTFYKFRSMRIDAEAIKEQLMDQNTM + QGGMFKIDNDPRVTKIGRFIRKTSLDELPQFWNVFIGDMSLVGTRPPTVDEYDQYTPE + QKRRLSFKPGITGLWQVSGRSKITDFDDVVKLDVAYIDNWTIWKDIEILLKTVKVVFM + RDGAK" + misc_feature 6226..6807 + /gene="wchA" + /locus_tag="SPC09L_0007" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 1.2e-146" + gene 6816..7559 + /gene="wchO" + /locus_tag="SPC09L_0008" + CDS 6816..7559 + /gene="wchO" + /locus_tag="SPC09L_0008" + /note="member of homology group 33" + /codon_start=1 + /transl_table=11 + /product="putative WecB-family glycosyl transferase" + /protein_id="CAI32990.1" + /db_xref="GOA:Q4K2K3" + /db_xref="InterPro:IPR004629" + /db_xref="UniProtKB/TrEMBL:Q4K2K3" + /translation="MNERMQILGVTIDPLTMKETVDAVEQYVLKKHPLHLMGVNADKI + NQCHEDEKIKKIVNESGIINADGASVVLASKFLGTPVPERVAGIDLMQCLLELSNKKG + YSVYFFGAKEEVLQDMLKVFKQRYPNLNVVGYRNGYFSPEDEKKIQEDIKGGKPDFVF + VGITSPKKEYIIQSFMDNGINAVFMGVGGSFDVLSGHIKRAPLWMQKLNLEWLFRVVN + EPKRLFKRYFVGNVTFIKRVLDEKRKSKK" + misc_feature 6978..7493 + /gene="wchO" + /locus_tag="SPC09L_0008" + /note="HMMPfam hit to PF03808, Glycosyl transferase + WecB/TagA/CpsF f, score 5.6e-94" + gene 7534..8619 + /gene="wcjA" + /locus_tag="SPC09L_0009" + CDS 7534..8619 + /gene="wcjA" + /locus_tag="SPC09L_0009" + /note="member of homology group 66" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI32991.1" + /db_xref="GOA:Q4K2K2" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K2K2" + /translation="MKSENQKNNILHISRTMDIGGAERIVYQLSSDLKDEFDSVHVAS + TGGLWESKLLSKGVQHHKILDVDSKNPLTMVKILSSFYRIIKNNDITIVHTHHRMAAF + YIRLLKIINPKLIHVYTAHNVFKNKLPLYKFSLKKAHCVAVGKAVNDNLKHDVGISDS + TVVYNGVVFEKTDKLVDEIVNYNGIKLGCIARLSEQKGLTYLIDAMSLVKHRDITLFI + VGDGELRDELENKVKQLNLQKSVIFLGYRKDVVECINSFDYLVSSSLYEGLALNVIEA + FMNGKTMVASDIPGINEVVNNKNGILVPVKDDVALARAIEKLAIDKKLREKLAYQAKK + 
DYETKFNYSLFLDNYRRLYRKLMGESK" + misc_feature 8047..8538 + /gene="wcjA" + /locus_tag="SPC09L_0009" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 2.1e-42" + gene 8616..9704 + /gene="mnaA" + /locus_tag="SPC09L_0010" + CDS 8616..9704 + /gene="mnaA" + /locus_tag="SPC09L_0010" + /EC_number="5.1.3.14" + /note="member of homology group 23" + /codon_start=1 + /transl_table=11 + /product="UDP-N-acetylglucosamine-2-epimerase MnaA" + /protein_id="CAI32992.1" + /db_xref="GOA:Q4K2K1" + /db_xref="InterPro:IPR003331" + /db_xref="UniProtKB/TrEMBL:Q4K2K1" + /translation="MKKVMLVFGTRPEAIKMCPLVSELKQNDSIKTLVCVTGQHKEML + EQVLEVFKVVPDYDLGIMKSNQTLFTITTSILDKIQAVLEKEKPDLVLVHGDTTTTFA + TALAAFYMGIKVGHVEAGLRTYNLQSPFPEEFNRQTTSIIADYHFAPTEVAKENLLRE + DRKNIFVTGNTVIDALKTTVQDNYHHPILEWAKGSKLIMLTAHRRENLGKPMENMFNA + VNRILNEFEDVKVVYPIHKNPKVRELASKVFGDNERMKIIEPLEVIDFHNFMNQSYMI + LTDSGGVQEEAPSLGKPVLVMRDTTERPEGVVAGTLKLVGTEEENIYSNFKLLLEDET + EYNKMSKASNPYGDGMTCKRIVDIILEV" + misc_feature 8679..9695 + /gene="mnaA" + /locus_tag="SPC09L_0010" + /note="HMMPfam hit to PF02350, UDP-N-acetylglucosamine + 2-epimerase, score 1.5e-185" + gene 9746..10885 + /gene="wzy" + /locus_tag="SPC09L_0011" + CDS 9746..10885 + /gene="wzy" + /locus_tag="SPC09L_0011" + /note="member of homology group 83" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI32993.1" + /db_xref="InterPro:IPR007016" + /db_xref="UniProtKB/TrEMBL:Q4K2K0" + /translation="MIKRKIYIICVLLSYFLPSFFTVGSMATLFALLSTLVKLFVTFD + YIPKVLLQHKVTLIDILVVLFLFFQAFAAFQSQTLYLNYVGGQFFLLGLYSFLKHFLL + LDCKTTIKSLFLTFILFLCVQVITQLLFPVGFDSLHPTGDNRLYFLGRKNIATPYIIV + GLGGFYLLNKKMNEFISLKEIIFLGLFGILSFLTQSSTAIICYGLFIFIRLLGLKENI + GKLYSLVSMAVYVCFSLSIIFSQSTILSTFTAIFSKNATFSGRINIWQLAIRIFEENF + WFGRGLDVNFNAWTNGIIVNSAHNTLLDILARTGIFPGVLFIVLLMNLFLGKYRIESK + TLLAMLASFMIYITMETSSMSILLLIIVLCVYWPRGEEKLHEQVT" + misc_feature 9746..9838 + /gene="wzy" + /locus_tag="SPC09L_0011" + /note="Signal peptide predicted for SPC0311 by 
SignalP 2.0 + HMM (Signal peptide probability 0.993) with cleavage site + probability 0.673 between residues 31 and 32" + misc_feature 10508..10693 + /gene="wzy" + /locus_tag="SPC09L_0011" + /note="HMMPfam hit to PF04932, O-Antigen Polymerase, score + 7.8e-09" + gene 10869..11738 + /gene="wcjB" + /locus_tag="SPC09L_0012" + CDS 10869..11738 + /gene="wcjB" + /locus_tag="SPC09L_0012" + /note="member of homology group 84" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI32994.1" + /db_xref="GOA:Q4K2J9" + /db_xref="UniProtKB/TrEMBL:Q4K2J9" + /translation="MSKLLNTIYYRLFRLYKKIYLQVFSKKTVDILGEKANLENELIV + SFTTIPSRLNYLPSMIKSIFNQTIIPNRFIMYVYKDEFEGINLESILELEIKNGLEIV + YVDENLRSHKKYFYAMKDNPNSIVVLVDDDIIYPRNTIKKLIASYRIYPQCVSAMRCH + RIKLFSDGSLYPYNQWEYEISGATIPSYFNFFTSGGGTLFPPCTRNEDLFNKKNIREL + SFLADDVWLNFLVVKNGIKTVKATRYKGTPLTIDDNPEESLVYLNAVYDNNNDKCIRN + MVEYYQINFTEDK" + gene 11738..13162 + /gene="wzx" + /locus_tag="SPC09L_0013" + CDS 11738..13162 + /gene="wzx" + /locus_tag="SPC09L_0013" + /note="member of homology group 85" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI32995.1" + /db_xref="GOA:Q4K2J8" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K2J8" + /translation="MNVEKNLKRGIFYTAIGKYSNVVIQLLVTAILSRILSPVEYGIV + AVVNVFLLFFQMLADSGIGPAIVQNKELNKSDLISIFSLTIYSGIVLSCIFALLGYPM + GVLYGETIYVSLFPLLGLCVLFYTITIVPQAILMKTMNFKIVNFLTIFSNIASGLVGV + ILAVSHFGVYSLIFSNIVRAMVLFIALYSKAKINFYWKVSKSSIGKIFEFSKFQFLFN + FWNYFARNLDNLLIGRLISPSDLGYYDKAYQLSLYPNQILSQVVTPALHPIMSNFQDN + ISKIGEVYLQISRIFVIVGIPISAYLYFNAQYVVTFMFGDNWSQSVPVFQILAATIWL + QMANSPTGAFYQATNQTRLLFRIGLLTSFINILAIVIGVMLQSIQCVAYMLLISFSLS + LVINTLYLTKKVLNISAQKYIKPILINLTIISPYIVFNLFISDFVNDLILHLSVQFVI + LFLIWGIGMYISGEYRRVFAVIRK" + misc_feature 11756..12559 + /gene="wzx" + /locus_tag="SPC09L_0013" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 1.4e-28" + gene 13175..14377 + /gene="wcjC" + /locus_tag="SPC09L_0014" + CDS 
13175..14377 + /gene="wcjC" + /locus_tag="SPC09L_0014" + /note="member of homology group 86" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI32996.1" + /db_xref="GOA:Q4K2I1" + /db_xref="InterPro:IPR001296" + /db_xref="InterPro:IPR009695" + /db_xref="UniProtKB/TrEMBL:Q4K2I1" + /translation="MKILFVNMFYNEAGGAQKSTKFLAEQLVKEGHEVFAYSDDAIDS + DIDEVINRVKIFRRRTPLFSLHYIFSAKKNPAKHFFYKIFETYNVFAKRKFINIIEEV + QPDIVHFNTISGMSLSIVKEAKKRNIRTVWTLRDYWLEYPWGEKDISLIKLLNRIYRP + FVKKSLRHLDIVTAPSAFTLNNFINKGFINPSSQKCMVIENAVIFSKGKLENIIKQKQ + ETKRNPEKTNFLFVGSILEIKGVFNLVKAFKKLTSPEISLKIVGKGKDLEKLQKEIES + DPRIQYLGFQDTETLYKTYQNSDVLVVPSAWDEPFGRVVIEGNANGLPVITSDRGGLP + EIVQTVGGGEIFTDESGNTLYSLLKKFVEMENYNVYYQCILENIDIYSIEKQSEKFTN + LYLDKEIE" + misc_feature 13811..14308 + /gene="wcjC" + /locus_tag="SPC09L_0014" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 6.6e-31" + gene 14411..15643 + /gene="ugd" + /locus_tag="SPC09L_0015" + CDS 14411..15643 + /gene="ugd" + /locus_tag="SPC09L_0015" + /note="member of homology group 20" + /codon_start=1 + /transl_table=11 + /product="UDP-glucose 6-dehydrogenase Ugd" + /protein_id="CAI32997.1" + /db_xref="GOA:Q4K2J6" + /db_xref="InterPro:IPR001732" + /db_xref="InterPro:IPR008927" + /db_xref="InterPro:IPR013328" + /db_xref="InterPro:IPR014026" + /db_xref="InterPro:IPR014027" + /db_xref="InterPro:IPR014028" + /db_xref="InterPro:IPR016040" + /db_xref="InterPro:IPR017476" + /db_xref="UniProtKB/TrEMBL:Q4K2J6" + /translation="MKIAVAGTGYVGLSIAVLLAQHHEIKAVDIVAEKVELINQKKSP + IQDDYIEKYLVEKDLNLEATMDAKYAYEDAEFVVVAAPTNYDSKKNFFDTSAVEAVIQ + QVKKINPKAVIIIKSTIPVGFTESVQKKYQYKNILFSPEFLRESKALYDNLYPSRIIV + GTDLEDTYLKDKANIFASLLKEGAIKEDIDTLFMGVTEAEAVKLFANTYLALRVSYFN + ELDTYAEVKGLDAKAIIDGIGLDPRIGNHYNNPSFGYGGYCLPKDSKQLLANYFDVPQ + NMMTATVESNRTRKDFIAQRILEKAGVSETDSLDAFKNIQDIVIGIYRLTMKSNSDNF + RHSSIQGVMKRLKAKGVTVIIYEPTLKDGETFFGNKVVNTLDKFKEASNVIVANRFEP + SLEDVSNKVYSRDIFKRD" + misc_feature 14411..15031 + /gene="ugd" + 
/locus_tag="SPC09L_0015" + /note="HMMPfam hit to PF01210, NAD-dependent + glycerol-3-phosphate deh, score 0.00028" + misc_feature 14411..14965 + /gene="ugd" + /locus_tag="SPC09L_0015" + /note="HMMPfam hit to PF03721, UDP-glucose/GDP-mannose + dehydrogenase, score 1.6e-52" + misc_feature 14996..15277 + /gene="ugd" + /locus_tag="SPC09L_0015" + /note="HMMPfam hit to PF00984, UDP-glucose/GDP-mannose + dehydrogenase, score 1.6e-35" + misc_feature 15371..15622 + /gene="ugd" + /locus_tag="SPC09L_0015" + /note="HMMPfam hit to PF03720, UDP-glucose/GDP-mannose + dehydrogenase, score 1e-05" + gene order(15943..16248,16277..16711) + /gene="tnp" + /locus_tag="SPC09L_0016" + CDS join(15943..16248,16277..16711) + /gene="tnp" + /locus_tag="SPC09L_0016" + /note="member of homology group 19" + /codon_start=1 + /transl_table=11 + /product="putative IS1381 transposase" + /protein_id="CAI32998.1" + /db_xref="GOA:Q4K2J5" + /db_xref="InterPro:IPR002559" + /db_xref="UniProtKB/TrEMBL:Q4K2J5" + /translation="MLTVLKTAYQLKHAKGGRKPKLSLEDLLMTTLQYMREYRTYEEI + AADFGIHESNLIHRSQWVEVTLVQSGFTISRTPLSSEDTVMIDATEVKINRPKKTISE + MKAQTIVTSQGRIVSLDITVNYCYDMKLFKMSRRNIGQAGKILADSGYQGLTKIYPQA + QTPRKSSKLKPLTVEDKACNHALSKERSKVENIFAKAKTFKMFSTTYRNHRKRFGYFR + HTIYFLFNYSLLYSKGCGCLCPSTHYDI" + misc_feature 16057..16122 + /gene="tnp" + /locus_tag="SPC09L_0016" + /note="Predicted helix-turn-helix motif with score + 1061.000, SD 2.80 at aa 39-60, sequence + RTYEEIAADFGIHESNLIHRSQ" + misc_feature 16150..16583 + /note="Predicted helix-turn-helix motif with score + 1061.000, SD 2.80 at aa 205-60, sequence + QWVEVTLVQSGFTISRTPLSSEDTVMIDATEVKINRPKKTISEMKAQTIVTSQGRIV + SLDITVNYCYDMKLFKMSRRNIGQAGKILADSGYQGLTKIYPQAQTPRKSSKLKPLT + VEDKACNHALSKERSKVENIFAKAKTFKMFST" + misc_feature join(16189..16248,16277..16657) + /gene="tnp" + /locus_tag="SPC09L_0016" + /note="HMMPfam hit to PF01609, Transposase DDE domain, + score 4.3e-09" + misc_feature 16583..16648 + /gene="tnp" + /locus_tag="SPC09L_0016" + /note="Predicted helix-turn-helix 
motif with score + 1061.000, SD 2.80 at aa 205-226, sequence + TTYRNHRKRFGYFRHTIYFLFN" + gene 16713..17396 + /gene="wcjE" + /locus_tag="SPC09L_0017" + /pseudo + CDS 16713..17396 + /gene="wcjE" + /locus_tag="SPC09L_0017" + /note="member of homology group 18; + This is suspicious. The database match Q8KWN9 suggest that + the sequence match continues into the upstream + transposase" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase (pseudogene)" + gene 17571..>17618 + /gene="aliA" + /locus_tag="SPC09L_0018" + CDS 17571..>17618 + /gene="aliA" + /locus_tag="SPC09L_0018" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33000.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ89" + /translation="MMKSSKLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaaatgac tgactagaat gagcaaacct caagtttttg aagcttgagg ttttttacta + 181 tagtggattg aaactagaat agtgcacctc tgcttctaaa acattgttag aaatcgattt + 241 gactgtcccg atcgatttgt cctattctta tttcattttg ctatacttgt agttgaggag + 301 aattaagctc ctcactagta aactcttcat aatccttttt atttttatga agatattgtt + 361 tgaaagatgt gagtttccac ggatgggttt gtggagggat atacttgcgt ctttcttttt + 421 ttgttctggt tcttgttcaa agtttttcga atagagttca tgatttagta gctcctttgt + 481 gtgatagatt ttgtcagcga tattgaggta gatgtctccg tcaaatgctt ttataactaa + 541 tgctttcgtc tttctgatga aatagacttc ttttccttgt tcggtaggga tatagtaacg + 601 attttggaat cggatatggt gtccactatc gacgactctc tccgccagtc tagccagaat + 661 gagattcctt tcagaggggt taggaacctc ctcgaagaca gagagttttg tcttgtttcc + 721 aaactgttca ttaaaggttt gaatgtagga aagcaggaag gtattggctt cttccaaggt + 781 atgaatattg ttttgttcca gttcgatagg caggcgagat tgtagtgtct gattgagtct + 841 ttcgactctc cctttagctt gagggataga ggttgtctca aggagaatcc ctagttggtg + 901 acaggcgtat ccaaactgtg tatgggtatc gtcctccatt ttcttagagt tggaggcttg + 961 ataggtaaag accgttctct tatctgtttt aatttgaagg ggaatgccgt gattggctaa + 1021 gatttgttcg aggacatgat 
agtaagcatt caagttctct tgtttatcaa aataagcgcc + 1081 taggatattg ccagaagcat catcaatggc taagtgtaag ttagatgttt gggctccaaa + 1141 ctaggcatga gggctggcat ccatttgaat gagttcacca gcaaatttct ttctgggtct + 1201 actaggatgt acttttttag ggtcttcaag gaagttttca gccgtcggta agattggatt + 1261 gtctaggggt tgattcaggt tcagtttagc ttgttttctt actctcttct ttgtctttct + 1321 atgggactta ggcgacagga tatttttctt atagagtatt tttctaacag tagtatcaga + 1381 gagctgaatt ccttcttctt cagctagcaa ttcacagaaa tgaaggacat ttggtttata + 1441 tgtttcatag gagaggtatt tttttaggag acgttctttg atttcatcag ggattgcatg + 1501 ttttggtttt cgatttctgt ttccgtgtct gaaggcttct tttcctttca gttgataggc + 1561 tagtagcaga cgattgattt gtctttcaga aagattgagc tcgacacagg ctcgtttctt + 1621 tgttttcttt ccttgggcta tagcttttat cacaagatat tttttcgttt cattcatatt + 1681 cagttggatc cttttcatat gactattcta ccaaatggga cattttcacg ttcgatttac + 1741 taaagacatt atcacattcg aattacacaa gatgcagata gtgaaaataa aggtgtagac + 1801 attaccgtaa aaaagtgata taattgtatg atgttcaatg tataggtgtt aatcatgagt + 1861 agacgtttta aaaaatcagg ttcacagaaa gtgaagcgaa gtgttaatat cgttttgctg + 1921 actatttatt tattgttagt ttgtttttta ttgttcttaa tctttaagta caatatcctt + 1981 gcttttagat atcttaatct agtggtaact gcgttagtcc tactagttgc cttggtaggg + 2041 ctactcttga ttatctataa aaaagctgaa aagtttacta tttttctgtt ggtgttctct + 2101 atccttgtca gctctgtgtc gctctttgca gtacagcagt ttgttggact gaccaatcgt + 2161 ttaaatgcga cttcgaatta ctcagaatat tcaatcagtg tcgctgtttt agcagatagt + 2221 gagatcgaaa atgttacgca actgacgagt gtgacagcac cgactgagac tgataatgaa + 2281 aatattcaaa aactactagc tgatatcaag tcaagtcaga ataccgattt gacggtcaac + 2341 cagagttcgt cttacttggc agcttacaag agtttgattg caggggagac taaggccatt + 2401 gtcctaaata gtgtctttga aaatatcatc gagtcagagt atccagacta cgcatcgaag + 2461 ataaaaaaga tttataccaa gggattcact aaaaaagtag aagctcctaa gacgtctaaa + 2521 aatcagtctt tcaatatcta tgttagtgga attgacacct atggtcctat tagttcggtg + 2581 tcgcgatcag atgtcaatat cctgatgact gtcaatcgag ataccaagaa aatcctcttg + 2641 accacaacgc cacgtgatgc ctatgtacca atcgcagatg 
gtggaaataa tcaaaaagat + 2701 aaattaaccc atgcgggcat ttatggagtt gattcgtcca ttcataccct agagaacctt + 2761 tatggtgtag atattaatta ttatgttcgt ttgaatttta cctcattttt gaaattgatt + 2821 gacttattgg gaggggtaga tgttcataat gatcaagagt tttcagctct acatgggaag + 2881 ttccatttcc cagtagggaa tgtccatcta gactctgagc aggctctagg ttttgtacgt + 2941 gaacgctact cactagccga tggagaccgt gaccgtggtc gcaaccaaca aaaggtgatt + 3001 gtggctatcc ttcaaaaatt aacgtcaacc gaagcactga aaaattatag tacgatcatt + 3061 aatagcttgc aagattctat ccaaacaaat atgccacttg agactatgat aaatttggtc + 3121 aatgctcagt tagaaagtgg tggaacttac aaagtgaatt ctcaagattt aaaagggaca + 3181 gatcggatgg atcttccttc ttatgcaatg ccagacagta acctctatgt gatggaaata + 3241 gatgatagta gtttagctgt agttaaagca gctatacagg atgtgatgga gggtagatga + 3301 aatgatagac atccattcgc atatcgtttt tgatgtagat gacggtccca agtcaataga + 3361 ggaaagcaag gcacttttaa gagaagctta taatcaagga gttcgaatga ttgtgtctac + 3421 ttcgcatcgt cgaaaaggga tgtttgaaac tccggaagag aagatagcag aaaactttct + 3481 tcaggttcgg gaaattgcaa aagaagtagc agatgattta gtcatagctt atggcgcaga + 3541 gatatactat actctggatg ctctagaaaa gctagaaaaa aaagaaattc ctacccttaa + 3601 tgatagtcgt tatgctttga ttgagtttag catgcatact tcctatcgtg agattcatgc + 3661 gggattgagc aatattttga tgttgggaat cacgccagta attgctcata ttgaacgtta + 3721 tgatgcctta gagaataatg aaaaacgtgt tcgtgaactg attgatatgg ggtgctatac + 3781 tcagataaat agttatcatg ttttaaaacc taagttcttt ggtgaaaaat ataaattcat + 3841 gaaaaagaga gctcggtatt ttttggaacg tgatttagtt catgtagttg caagtgacat + 3901 gcacaattta gacagtagac ctccatatat gcaacaggca tatgatatca ttgctaagaa + 3961 atatggagcg aaaaaagcga aagaattttt tgtagataat cccagaaaaa ttataatgga + 4021 tcaattaatt taggagaaaa tatgaaggaa caaaacactt tggaaatcga tgtattgcaa + 4081 ctattcaggg ctttatggaa aagaaagttg gtcattttat tagtggcaat tataacttct + 4141 tcagttgctt ttgcctacag tacttttgtt atcaaacctg agtttactag tacgactcgg + 4201 atttatgtag ttaaccgtaa tcaggaagag aagtctggtt taaccaatca agacttgcag + 4261 gcaggatcat acttggttaa agactatcgt gaaattatcc tatcgcagga tgttttggag + 4321 
gaagttattt ctgatttgga actagatttg acgccaaaag gtttggctaa taaaattaaa + 4381 gtaacagtac cagttgatac ccgtattgtc tctgtctcag ttaatgatcg agttcctgaa + 4441 gaggcaagcc gtatcgctaa ctctttgaga gaagtagctg ctcaaaaaat tatcagtatt + 4501 actcgtgttt ctgatgtgac aacactggag gaggcaagac cggcgatatc accatcttcg + 4561 ccaaatatta aacgcaatac actaattggt tttttggcag gggggattgg aactagtgtt + 4621 atagttcttc ttcttgaact tttggacact catgtgaaac gtccggaaga tatcgaagat + 4681 acactgcaga tgacactttt gggagttgta ccaaacttga gtaagttgaa ataggagaga + 4741 ggaatgccga cattagaaat agcacaaaaa aaactggagt tcattaagaa ggcagaagaa + 4801 tattacaatg ccttgtgtac aaatatacag ttgagcggag ataaactaaa agtaatttcc + 4861 gttacttctg ttaaccctgg ggaaggaaaa acaactactt ccgtaaatat agcaaggtcg + 4921 tttgcgcgta caggctataa aactcttttg atcgatggcg atactcgaaa ttcagttata + 4981 tcaggagttt ttaaatcgcg tgaaaaaatt acagggctaa cagaattttt atctgggaca + 5041 gctgatttat ctcacggttt atgtgataca aatattgaaa atttatttgt aattcaatcg + 5101 ggatctgtat caccaaaccc tacagccttg ttacaaagta aaaattttaa tgatatgatt + 5161 gaaacattgc gtaaatattt tgattatatc attgttgata cagcacctat tggaattgtt + 5221 attgatgcgg caattatcac tcaaaagtgt gatgcgtcca tcttggtaac agcaataggt + 5281 gaggtgaata aacgtgatgt ccaaaaagcg aaacaacaat tagaacaaac agagaaactg + 5341 ttcctaggag ttgttttaaa taaattggat atctcggttg ataagtatgg agtttacggt + 5401 tcctatggaa attatggtaa aaaataactt aggaaagatt ttatggatga aaaaggattg + 5461 aaaatttttc tagcagtatt acagagtatt attgtcattt tattggttta ttttcttagc + 5521 tttgttagag agacagaact tgaacgttct tcgatggtta tactatacct tctccacttt + 5581 tttgtattct attttagttc ctatggtaac aattttttta aaagagggta cctagttgag + 5641 tttaatagta ctataagata tatttttttc tttgcaatag ctataagtgt attaaacttt + 5701 tttatagcgg aacggtttag tatctctaga agaggaatgg tatacttctt aactttagaa + 5761 ggaatatcct tatacttgtt aaatttctta gtaaagaaat attggaagca tgtgtttttt + 5821 aatctaaaaa atagcaagaa aattttactg ttaacagtaa caaaaaatat ggaaaaagtt + 5881 cttgataaat tgctagaatc tgatgaactt tcatggaaat tggtagcagt aagtgttttg + 5941 gataaatatg attttcaaca 
tgataaaata cctgtaattg aaaaggaaaa aattattgaa + 6001 tttgcaacgc atgaagttgt ggatgaggtg tttgtcaatc ttccaggaga gagctacgat + 6061 attggagaaa ttatctctag gtttgagaca atggggatag atgtaactgt aaatcttaaa + 6121 gcatttgata agaatttggg tcgcaataaa caaattcatg agatggtagg attgaatgta + 6181 gtcactttct ctacaaattt ttataaaact agtcatgtga tttcaaagag aattctcgat + 6241 atttgtggtg ccactattgg ccttattctt tttgctatag ctagtctagt tttagttcca + 6301 ttgattcgta aagatggcgg accagctatt tttgctcaaa ctcgtatagg gaaaaatggt + 6361 cgacatttta ccttttataa attccgttcg atgcggatcg atgctgaagc tatcaaagaa + 6421 cagttgatgg atcaaaatac gatgcaaggt ggtatgttta agatagacaa tgatcctcgt + 6481 gttacaaaaa ttggtcgctt tattcgtaaa accagtttag atgaattgcc gcagttttgg + 6541 aatgtcttta taggagatat gagtttggtg ggaacacgtc cacctacagt agacgagtat + 6601 gatcagtata ctccagaaca gaaacgtcga ctcagcttta aacctggtat tacaggttta + 6661 tggcaggtta gcggccgtag taaaataacc gattttgacg atgttgtaaa attagatgtg + 6721 gcttatattg ataattggac aatctggaaa gatattgaaa ttttgcttaa aactgttaaa + 6781 gttgtattta tgagagatgg agcgaagtaa ttcatatgaa tgagagaatg caaatattag + 6841 gagttactat agatccatta acgatgaaag aaacagtgga tgctgttgaa cagtatgttt + 6901 taaagaagca tcctttgcac ttgatgggag ttaacgcaga taaaattaat cagtgccatg + 6961 aagatgagaa aatcaaaaaa atcgttaatg aatcaggaat tattaatgcg gatggagcat + 7021 cagttgttct tgcaagtaag tttttaggaa cgcctgttcc tgaacgagta gcgggtattg + 7081 atttgatgca atgtctttta gagttgtcaa ataaaaaagg atattcagtt tacttttttg + 7141 gagctaaaga agaagtttta caagatatgc taaaagtttt taaacaaaga tatcctaatc + 7201 ttaatgttgt tggctataga aacggatatt tttcacctga agatgaaaaa aagattcagg + 7261 aagatattaa aggaggaaaa ccagattttg tatttgtagg gattacttct cctaaaaagg + 7321 aatatatcat ccaatcattc atggataatg ggattaatgc tgtctttatg ggtgttggtg + 7381 gcagttttga tgtattatca ggacacatta aacgagctcc attatggatg caaaaattga + 7441 atctggaatg gttgttccgt gtagttaatg aacccaagcg cctttttaag cgttattttg + 7501 tagggaatgt tacttttatt aagcgagttt tagatgaaaa gcgaaaatca aaaaaataat + 7561 attctacata tttctcgtac aatggatatt ggtggtgcag 
aacgtattgt atatcaattg + 7621 agttctgatt tgaaagatga atttgatagt gtccatgtcg cttcaacagg tggactatgg + 7681 gagagcaaac ttttatcaaa aggagttcaa catcataaaa ttttagatgt tgacagtaag + 7741 aatcccctaa ctatggtaaa gatcctttca agtttttata gaattatcaa aaataatgat + 7801 attaccattg ttcacactca tcatcggatg gctgcctttt atattcgctt gttgaaaatc + 7861 attaatccta agttgataca tgtttacact gcacataatg tatttaaaaa taaattacca + 7921 ttatacaaat tttccttaaa aaaagcgcat tgtgtagctg tgggtaaagc ggttaatgat + 7981 aatttgaaac atgatgtagg aatcagtgat agtacagtag tctataatgg ggttgttttt + 8041 gaaaaaactg ataagctagt tgatgagatt gtaaactata acggaatcaa attggggtgt + 8101 attgctaggt tatcagagca aaaaggattg acctacctaa ttgatgcgat gtctttagtg + 8161 aaacacaggg atattacgtt gttcattgtc ggagatggag agcttcgaga tgagcttgaa + 8221 aacaaggtga aacaattaaa tcttcaaaaa tcagtgatat ttttaggtta tcgaaaagat + 8281 gttgttgaat gtatcaatag ttttgattac ttagtgtcat catctttata tgaggggttg + 8341 gctctaaatg taattgaagc atttatgaat gggaaaacga tggttgcatc agatatccca + 8401 ggaataaatg aagtagtcaa taacaaaaat gggattcttg ttcctgttaa ggatgatgtt + 8461 gccttagcga gagcgattga aaagcttgcg attgacaaaa aacttagaga aaaactcgct + 8521 tatcaagcaa aaaaagatta tgagacaaaa tttaattatt ccttgttttt agataattat + 8581 cggagacttt atagaaaatt aatgggagaa tcaaaatgaa aaaagtcatg ttggtttttg + 8641 ggacacgtcc agaagctatt aaaatgtgtc ctttagtaag tgaactgaaa caaaatgatt + 8701 caatcaagac acttgtgtgt gtaactggtc aacataagga aatgttagag caggttttag + 8761 aggtgttcaa ggttgtccca gattatgatt tgggtatcat gaaatcaaat cagaccctat + 8821 ttaccattac gactagtatc ttggataaaa ttcaggcggt tctagagaaa gaaaaaccag + 8881 atcttgttct tgttcatgga gatactacaa caacatttgc gacagcttta gcagcatttt + 8941 atatgggaat caaagtggga cacgtcgaag caggtctcag aacctataat ctccaaagtc + 9001 catttccaga ggaattcaat cgccagacaa cttctatcat tgccgactat cattttgcgc + 9061 cgactgaagt tgcgaaggaa aatctactaa gagaggacag aaaaaatatc tttgtgacgg + 9121 gaaatacagt cattgatgct ttgaagacga ctgttcaaga taactaccat cacccaattt + 9181 tagaatgggc aaagggtagt aagttaatca tgctaacggc tcatcgacga gaaaatcttg + 9241 
ggaaaccgat ggaaaacatg tttaatgctg ttaatcgaat tttaaacgaa ttcgaagatg + 9301 taaaagttgt atatcccatc cataaaaatc ctaaggttcg agaattagca agtaaagttt + 9361 ttggcgataa tgaacgaatg aaaatcattg aaccgttaga ggttattgat tttcataatt + 9421 ttatgaatca aagctatatg attttgacag attctggagg tgtacaggaa gaagcacctt + 9481 ctttaggaaa acctgtcttg gtgatgcgtg atacaacaga gcgtcctgag ggggtcgttg + 9541 ctggcacgtt gaagttggta ggaacagaag aagagaatat ctatagcaac ttcaaacttc + 9601 ttcttgaaga tgaaacagaa tataacaaga tgagcaaagc tagcaaccct tatggagatg + 9661 gaatgacttg taaacggatt gttgatatta ttctggaagt ataaaaataa ttcaattatg + 9721 gatgaggaaa gaataaatta gattgatgat aaaaagaaaa atatatataa tctgtgtatt + 9781 actgtcgtat tttttaccta gtttttttac agttggctca atggcgactt tatttgcttt + 9841 gctttctact ttagttaagc tatttgtgac ttttgattat attcccaaag ttcttttaca + 9901 acataaagta acactgattg atattctagt tgttctattt ttattttttc aagcatttgc + 9961 agcttttcaa agccaaacgt tgtaccttaa ctacgttgga ggtcagtttt tccttttagg + 10021 actatattca tttttgaaac actttttatt gttggattgt aaaacaacaa taaaaagcct + 10081 ctttttaacc tttatcttgt ttttgtgtgt tcaggtaata actcaattgc tttttccggt + 10141 cggtttcgat tctttgcacc ctacaggaga taatagactt tactttttag gaagaaagaa + 10201 catagctacc ccgtatatca ttgttggatt aggtggtttt tacttattaa ataaaaaaat + 10261 gaatgagttc atatcactaa aggagattat ttttttagga ttgttcggaa ttttatcatt + 10321 tttaacacaa tccagtacag cgattatatg ttatgggctt tttattttca tacgtctatt + 10381 gggattaaag gaaaatatag gaaaactata ttctttagtc agtatggctg tatatgtttg + 10441 tttttctctt tctataatct tttcacaaag tacaatttta tcaactttta cagcgatttt + 10501 ttccaaaaat gcaacttttt caggacgtat taatatttgg caattagcga ttcgtatttt + 10561 tgaagagaat ttttggtttg gacgaggcct cgacgttaat tttaatgctt ggacaaatgg + 10621 gattatcgtt aattcagcac acaatacctt attagatata cttgctcgaa ctggcatatt + 10681 tccaggtgtt ttatttatag tgcttcttat gaatctgttt cttggaaaat atagaataga + 10741 atcaaaaaca ctgttggcta tgttagcctc atttatgatt tatattacaa tggagacttc + 10801 atctatgagc atattgctgc taattattgt tctttgtgta tattggccac gtggagagga + 10861 gaagttgcat 
gagcaagtta cttaatacca tctattatcg actatttaga ttatataaaa + 10921 aaatttatct acaagttttt agtaaaaaaa cggttgacat cttgggtgaa aaggctaatt + 10981 tagaaaatga actaattgtt tcgtttacaa caattccaag tcgtcttaat tatttaccaa + 11041 gtatgattaa aagtattttc aatcagacaa ttatccctaa ccgttttatt atgtatgttt + 11101 ataaagatga atttgaaggc attaatttgg agagtattct agaacttgaa atcaaaaatg + 11161 gtttggaaat tgtctatgtg gatgagaatc ttcgttcaca caaaaaatat ttttatgcta + 11221 tgaaagataa tccgaacagt atagttgttc tagttgatga cgatatcatt tatcctcgaa + 11281 atactataaa gaaactgatt gcatcctata gaatttatcc acagtgtgtt tcagcaatgc + 11341 gatgtcatcg aattaagttg ttttctgatg gaagtttata tccatataat caatgggaat + 11401 atgaaatatc aggagctact ataccatcgt attttaattt ttttactagc ggaggtggga + 11461 cattatttcc tccatgtact cgcaatgagg atctttttaa taaaaaaaat atcagggaac + 11521 tcagttttct agctgatgat gtatggttga attttttggt agtcaaaaat ggaattaaaa + 11581 cagtaaaagc aacacgatat aaagggacac cattaactat agatgacaat cctgaggaga + 11641 gtttggtata tttgaatgcc gtatatgata acaacaatga taaatgtatt agaaatatgg + 11701 ttgaatatta tcaaattaat tttacagagg ataaataatg aatgttgaaa aaaatttgaa + 11761 acgtggaatt ttctatactg caatagggaa gtattcgaat gtagttattc aattacttgt + 11821 aacagcaatt cttagccgga ttctctcacc tgtagaatat ggtatcgtag cagtagtaaa + 11881 tgtatttctt ttattttttc aaatgttagc agattcagga ataggacctg ctattgttca + 11941 aaataaagaa ctgaataagt cagatttaat cagcattttc tcattaacga tttatagtgg + 12001 aatcgtactt tcttgtattt ttgctttact aggatatcct atgggggtgt tatacggcga + 12061 aactatttat gttagtttat ttccgctttt aggtctttgt gttttatttt ataccattac + 12121 aattgtaccg caagctattc taatgaaaac gatgaacttt aaaatagtta attttctaac + 12181 tattttttct aacattgcta gtggcttggt gggcgttatt ttagcggtat cacattttgg + 12241 tgtctattct ctaatttttt ctaatattgt aagagcaatg gttttattta tcgctttata + 12301 ttctaaagca aagataaatt tctattggaa agtttcaaaa agttctattg gtaaaatttt + 12361 tgagttttca aaattccaat ttttgtttaa tttttggaat tattttgcta gaaatttaga + 12421 taatttatta attggacgat tgattagccc gtcagatctt ggttattatg ataaggctta + 12481 tcaattatct 
ttgtacccta atcaaatttt atcacaggtt gtgacaccag cattgcatcc + 12541 tattatgtcc aattttcaag ataatatcag taagataggc gaagtttatc ttcagatttc + 12601 tagaatattc gtaatagttg gcatacctat ttcggcttat ttatacttta atgctcaata + 12661 tgttgttaca tttatgtttg gagataattg gtcccaaagc gttccggtgt ttcaaatatt + 12721 agcagcaaca atttggttac aaatggctaa tagtcctact ggtgcatttt accaagcaac + 12781 taatcagaca aggttattgt ttagaattgg cttattgaca tcttttatta atattttagc + 12841 tattgttatt ggtgtaatgt tgcaaagcat ccaatgtgtt gcgtacatgc ttttgatttc + 12901 tttcagtctt agtttagtaa tcaatactct ttacttaaca aaaaaagtat taaatatttc + 12961 tgctcaaaaa tatataaaac cgatattaat taatttgaca attatcagtc cctatattgt + 13021 gtttaatttg tttatctcgg attttgtaaa cgaccttatt ttacatttat cagttcagtt + 13081 tgttatttta tttttaatat ggggaattgg gatgtatatt agcggagagt atcgacgagt + 13141 cttcgcggtt ataagaaaat aaaggagcaa ttttgtgaaa attttatttg tgaatatgtt + 13201 ttataatgaa gcaggaggtg cacaaaagag taccaaattt ctagctgaac aacttgtaaa + 13261 agaaggacat gaggtatttg catactctga tgatgccatt gattcagata ttgatgaagt + 13321 tattaatagg gttaagattt ttagaagaag aactccgctt tttagtcttc actatatttt + 13381 cagtgctaag aagaatccag ctaaacattt tttctataaa atatttgaaa cctataatgt + 13441 atttgcgaaa agaaaattta tcaatatcat tgaggaagta caaccagata ttgttcactt + 13501 taatacaatt tcaggaatgt ctttatcaat agttaaagaa gctaaaaaga gaaatatcag + 13561 gaccgtttgg accttgcgag actattggct agaatatcca tggggtgaga aagatatttc + 13621 tcttatcaaa cttctaaata gaatatatag accttttgtt aagaaaagtt taagacactt + 13681 agacatagta acagcaccat cagcatttac tttgaataat tttatcaata aaggatttat + 13741 taacccatct tctcaaaaat gtatggtcat tgaaaatgct gttatatttt caaagggtaa + 13801 gttggaaaat attatcaaac aaaagcaaga aacaaaaaga aatccagaaa aaacgaattt + 13861 tctttttgta ggttctatac ttgaaataaa gggcgttttt aacttagtaa aggcctttaa + 13921 aaaactaact agtccggaaa tttctttgaa aattgtagga aaaggaaaag atttagaaaa + 13981 acttcaaaaa gaaattgaga gtgatcctag aatacaatat ttaggctttc aagatacaga + 14041 aaccctctat aaaacttatc aaaattcgga tgtattggtc gtcccatctg cttgggatga + 14101 accgtttggt 
agagttgtaa ttgaaggaaa tgcaaatggc cttcctgtca tcacttcaga + 14161 tagaggtgga ttacctgaaa ttgtgcaaac agtaggagga ggagaaattt ttacagatga + 14221 atcgggaaat acattatata gtcttttaaa gaaatttgta gaaatggaaa actacaatgt + 14281 ctattaccaa tgcattcttg agaatattga tatttattct atcgaaaaac aaagtgaaaa + 14341 gttcactaat ctgtatttag ataaagaaat tgaataataa gttgtttttg tagcagtaac + 14401 ggaggtaatt atgaaaatag cggtagcagg aacaggttat gtaggattat caattgctgt + 14461 gttgttggca caacatcacg aaataaaagc agttgatatt gttgctgaaa aagttgaatt + 14521 aatcaatcaa aaaaagtctc caattcagga tgattatatt gaaaaatatt tagtggaaaa + 14581 agatttaaat ttggaagcaa ctatggatgc taagtatgct tatgaagatg cagaatttgt + 14641 tgttgttgca gcaccaacaa attatgattc gaaaaagaac ttttttgata catcagcagt + 14701 agaggcggtc attcaacaag taaaaaaaat taatcccaaa gcggtaataa ttattaaatc + 14761 tacaatccct gttggattca cagagtccgt tcaaaagaaa tatcagtata aaaatatctt + 14821 atttagtcca gaatttttac gcgaatctaa agcattatac gataacctgt atccaagtcg + 14881 catcattgtt ggaactgact tagaagatac ttatttaaaa gacaaagcta atatatttgc + 14941 ttccctacta aaagaggggg ctattaaaga agacatagat acacttttca tgggagtaac + 15001 ggaagctgag gcagttaaat tatttgccaa tacctacctt gcgttgcgtg tttcttactt + 15061 taatgaattg gatacttatg cagaggtgaa aggtttggat gcaaaagcca ttattgatgg + 15121 tattggccta gatccacgta taggaaatca ttataacaat ccatcctttg gctacggtgg + 15181 gtattgttta cctaaagata gtaagcagtt attagcaaat tactttgatg taccacaaaa + 15241 tatgatgaca gcaactgttg aaagcaatcg aacgcgtaag gattttatcg ctcaacggat + 15301 tttagaaaaa gctggagtat ctgagactga tagtttagat gcgtttaaga acatacaaga + 15361 tattgttata ggtatttatc gtttaacaat gaaaagtaat tcggataact tccgtcactc + 15421 ctctattcaa ggcgttatga aacgattgaa agctaaggga gttacggtta tcatctatga + 15481 gccaactttg aaggacgggg aaacattctt tggtaataaa gtggtaaata ctctagataa + 15541 atttaaagaa gctagtaatg ttattgtagc caatcgtttt gaaccttcac tagaggatgt + 15601 ttctaataaa gtttatagtc gagatatatt taagcgtgac taataaatac gtccacgtga + 15661 cgtaatatct attaaatgga taaaatatta ataaacatgg catcgatatc ttttttggac + 15721 ttgaattgtc 
aaattaagtg cacatttttt tcatagaaaa cttcataaga tgttttccgg + 15781 ttaagacatt ttcgtggtct attatctaag ttggtttata taatagactt cctgcgaaac + 15841 aaaatatggt atagtagttc tatgaatgat gaagcaagta aacaactaac tgatgcacga + 15901 tttaagcgtc ttgttggtgt tcagcgcacg acttttgaag agatgttaac tgtattaaaa + 15961 acagcttatc aacttaaaca tgcaaaaggt ggacgaaaac ctaaattaag cctagaagac + 16021 cttcttatga ccactcttca atatatgcga gaataccgca cttatgaaga aattgcggct + 16081 gattttggta ttcacgaaag caacttaatc catcggagcc aatgggttga agtaactctt + 16141 gttcaaagtg gttttacgat ttcaagaact cctctcagtt ctgaggacac ggtaatgatt + 16201 gatgcgacgg aagtaaaaat caatcgccct aaaaaaacaa ttagcgaatt attatggtaa + 16261 aaagaaatgc cacgctatga aggctcaaac gattgtcaca agtcaaggga gaattgtttc + 16321 tttggatatc actgtgaact attgttatga tatgaagttg ttcaaaatga gtcgcagaaa + 16381 tatcggacaa gctggtaaaa tcttggctga cagtggttat caaggactca cgaagatata + 16441 tcctcaagca caaactccac gtaaatccag caaactcaag ccgctaacag ttgaagataa + 16501 agcctgtaac catgcgctat ctaaggagag aagcaaggtt gagaatatct ttgccaaagc + 16561 aaaaacgttt aaaatgtttt caacaaccta tcgaaatcat cgtaaacgct tcggatattt + 16621 taggcatact atatattttt tattcaatta ttcacttttg tattcaaaag gttgcgggtg + 16681 cctctgtccg agtacccact acgatattta acctattgaa tatctataaa tttcctctgg + 16741 gagtttcatg gtatctatat acgttatggt cgatattgat agtttatggt ttactatctg + 16801 ctgttttcaa aaatcgtaga atgttatttt tgataagtgt tttcgcttat tgtttaaccc + 16861 tatttgttca aacagatatt tatattattc aaagaacgct agtttggggg ctttgtttct + 16921 ttcttggcag tgtattgagt gaaattcact ttgataaaat taatttgaaa aaatttcttt + 16981 ttttctttgt gctatttgat tttatttata tgttcgcttg gttcttgttt tatgaagtag + 17041 agtctaagaa ggattatgta agctatagta acccaggttt gtgggggatt gcttttattg + 17101 tctgtgtatt agttgctttt gcgatttttc ctaaaatgga gaaaaatttt cctaaaactt + 17161 tcctatattt cactaaatac gggaaagata gtttagggat ctatattctt catgcaccaa + 17221 tttgtagcat gattcggatt ctaatgttga aagtgggaat aaactcagtt tttcttcacg + 17281 ttgttgttgg gattgtgcta ggctggtatt tatccatact agcaacttat atattgaaaa + 17341 aaattccatt 
tttgaatatt gttttattac cacaaaagta tattaaatta aaataaatta + 17401 ttttagattt ataatgtggc tctttgtcaa ctaacatctg gagaggacaa tcactgtctt + 17461 ctcttttttt gtcttttcag aacataccaa attaacacaa aaattctgaa aattctgttg + 17521 acaactttct gaaaagagtc tataatggag agaaagtttt aaaggagaaa atgatgaaaa + 17581 gttcaaaact acttgccctt gcgggcgtga cattattg +// + diff --git a/public/res/serotype_genbank/serotype_9N.gb b/public/res/serotype_genbank/serotype_9N.gb new file mode 100644 index 0000000..49f0bb4 --- /dev/null +++ b/public/res/serotype_genbank/serotype_9N.gb @@ -0,0 +1,784 @@ +LOCUS CR931647 17619 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 533/62 (serotype 9n). +ACCESSION CR931647 +VERSION CR931647.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 17619) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 17619) + AUTHORS Bentley,S.D. + TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. 
+FEATURES Location/Qualifiers + source 1..17619 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="533/62" + /db_xref="taxon:1313" + gene <1..137 + /gene="dexB" + /locus_tag="SPC09N_0001" + CDS <1..137 + /gene="dexB" + /locus_tag="SPC09N_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI33001.1" + /db_xref="UniProtKB/TrEMBL:Q4K2K9" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVEMTD + " + gene complement(order(281..403,412..1677)) + /gene="tnp" + /locus_tag="SPC09N_0002" + /pseudo + CDS complement(join(281..403,412..1677)) + /gene="tnp" + /locus_tag="SPC09N_0002" + /note="member of homology group 17" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1202 transposase" + misc_feature complement(694..1194) + /gene="tnp" + /locus_tag="SPC09N_0002" + /note="HMMPfam hit to PF00665, Integrase core domain, + score 1.8e-21" + /pseudo + gene 1855..3300 + /gene="wzg" + /locus_tag="SPC09N_0003" + CDS 1855..3300 + /gene="wzg" + /locus_tag="SPC09N_0003" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33003.1" + /db_xref="GOA:Q4K2J2" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q4K2J2" + /translation="MSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGVDVHNDQ + EFSALHRKFLFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGTYKVNSQDLKGTDRMDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1855..1971 + /gene="wzg" + /locus_tag="SPC09N_0003" + /note="Signal peptide predicted for SPC0322 by SignalP 2.0 + HMM (Signal peptide probability 0.993) with 
cleavage site + probability 0.538 between residues 39 and 40" + misc_feature 2059..2406 + /gene="wzg" + /locus_tag="SPC09N_0003" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 2.3e-64" + misc_feature 2584..3027 + /gene="wzg" + /locus_tag="SPC09N_0003" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 8.5e-68" + gene 3302..4033 + /gene="wzh" + /locus_tag="SPC09N_0004" + CDS 3302..4033 + /gene="wzh" + /locus_tag="SPC09N_0004" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33004.1" + /db_xref="GOA:Q4K2J1" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q4K2J1" + /translation="MIDIHSHIVFDVDDGPKSIEESKALLREAYNQGVRMIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTLDALEKLEKKEIPTLNDS + RYALIEFSMHTSYREIHAGLSNILMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QINSYHVLKPKFFGEKYKFMKKRARYFLERDLVHVVASDMHNLDSRPPYMQQAYDIIA + KKYGAKKAKEFFVDNPRKIIMDQLI" + misc_feature 3305..3913 + /gene="wzh" + /locus_tag="SPC09N_0004" + /note="HMMPfam hit to PF02811, PHP domain, score 3.4e-38" + gene 4042..4734 + /gene="wzd" + /locus_tag="SPC09N_0005" + CDS 4042..4734 + /gene="wzd" + /locus_tag="SPC09N_0005" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33005.1" + /db_xref="GOA:Q4JZA0" + /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4JZA0" + /translation="MKEQNTLEIDVLQLFRALWKRKLVILLVAIITSSVAFAYSTFVI + KPEFTSTTRIYVVNRNQEEKSGLTNQDLQAGSYLVKDYREIILSQDVLEEVISDLKLD + LTPKGLANKIKVTVPVDTRIVSVSVNDRVPEEASRIANSLREVAAQKIISITRVSDVT + TLEEARPAISPSSPNIKRNTLIGFLAGGIGTSVIVLLLELLDTHVKRPEDIEDTLQMT + LLGVVPNLSKLK" + misc_feature 4060..4476 + /gene="wzd" + /locus_tag="SPC09N_0005" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 
1.1e-53" + misc_feature 4582..4659 + /gene="wzd" + /locus_tag="SPC09N_0005" + /note="PS00217 Sugar transport proteins signature 2." + gene 4744..5427 + /gene="wze" + /locus_tag="SPC09N_0006" + CDS 4744..5427 + /gene="wze" + /locus_tag="SPC09N_0006" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33006.1" + /db_xref="GOA:Q4K2I9" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q4K2I9" + /translation="MPTLEIAQKKLEFIKKAEEYYNALCTNIQLSGDKLKVISVTSVN + PGEGKTTTSVNIARSFARTGYKTLLIDGDTRNSVISGVFKSREKITGLTEFLSGTADL + SHGLCDTNIENLFVIQSGSVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTAPIGIVI + DAAIITQKCDASILVTAIGEVNKRDVQKAKQQLEQTEKLFLGVVLNKLDISVDKYGVY + GSYGNYGKK" + gene 5443..6810 + /gene="wchA" + /locus_tag="SPC09N_0007" + CDS 5443..6810 + /gene="wchA" + /locus_tag="SPC09N_0007" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI33007.1" + /db_xref="GOA:Q4K2I8" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q4K2I8" + /translation="MDEKGLKIFLAVIQSIIVILLVYFLSFVRETELERSSMVILYLL + HFFVFYFSSYGNNFFKRGYLVEFNSTIRYIFFFAIAISVLNFFIAERFSISRRGMVYF + LTLEGISLYLLNFLVKKYWKHVFFNLKNSKKILLLTVTKNMEKVLDKLLESDELSWKL + VAVSVLDKSDFQHDKIPVIEKEKIIEFATHEVVDEVFVNLPGESYDIGEIISRFETMG + IDVTVNLKAFDKNLGRNKQIHEMVGLNVVTFSTNFYKTSHVISKRILDICGATIGLIL + FAIASLVLVPLIRKDGGSAIFAQTRIGKNGRHFTFYKFRSMRIDAEAIKEQLMDQNTM + QGGMFKIDNDPRVTKIGRFIRKTSLDELPQFWNVFIGDMSLVGTRPPTVDEYDQYTPE + QKRRLSFKPGITGLWQVSGRSKITDFDDVVKLDVAYIDNWTIWKDIEILLKTVKVVFM + RDGAK" + misc_feature 6226..6807 + /gene="wchA" + /locus_tag="SPC09N_0007" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 1.3e-146" + gene 6816..7559 + /gene="wchO" + /locus_tag="SPC09N_0008" + CDS 6816..7559 + /gene="wchO" + /locus_tag="SPC09N_0008" 
+ /note="member of homology group 33" + /codon_start=1 + /transl_table=11 + /product="putative WecB-family glycosyl transferase" + /protein_id="CAI33008.1" + /db_xref="GOA:Q4K2I7" + /db_xref="InterPro:IPR004629" + /db_xref="UniProtKB/TrEMBL:Q4K2I7" + /translation="MNERMQILGVTIDPLTMKETVDAVEQYVLKKHPLHLMGVNADKI + NQCHEDEKIKKIVNESGIINADGASVVLASKFLGTPVPERVAGIDLMQCLLELSNKKG + YSVYFFGAKEEILQDMLKVFKQRYPNLNVVGYRNGYFSPEDEKKIQEDIKGGKPDFVF + VGITSPKKEYIIQSFMDNGINAVFMGVGGSFDVLSGHIKRAPLWMQKLNLEWLFRVVN + EPKRLFKRYFIGNVTFIKRVLDEKRKSKK" + misc_feature 6978..7493 + /gene="wchO" + /locus_tag="SPC09N_0008" + /note="HMMPfam hit to PF03808, Glycosyl transferase + WecB/TagA/CpsF f, score 1.2e-93" + gene 7534..8619 + /gene="wcjA" + /locus_tag="SPC09N_0009" + CDS 7534..8619 + /gene="wcjA" + /locus_tag="SPC09N_0009" + /note="member of homology group 66" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33009.1" + /db_xref="GOA:Q4K2I6" + /db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q4K2I6" + /translation="MKSENQKNNILHISRTMDIGGAERIVYQLSSDLKDEFDSVHVAS + TGGLWESKLLSKGVQHHKILDVDSKNPLTMVKILSSFYRIIKNNDITIVHTHHRMAAF + YIRLLKIINPKLIHVYTAHNVFKNKLPLYKFSLKKAYCVAVSKAVNDNLKHDVGISDS + TVIYNGVVFEKTDKLVGEIVNYNGIKLGCIARLSEQKGLTYLIDAMSLVKHRNITLFI + VGDGELRDELENKVKQLNLQKSVIFLGYRKDIVECINSFDYLVSSSLYEGFGLNAIEA + FMKGKTMVSSDIPGINEVVNNKNGILVPVKDDVALARAIEKLATDKKLREKLAYQAKK + DYETKFNYSLFLDNYRRLYRKLMGESK" + misc_feature 8047..8538 + /gene="wcjA" + /locus_tag="SPC09N_0009" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 6.9e-43" + gene 8616..9704 + /gene="mnaA" + /locus_tag="SPC09N_0010" + CDS 8616..9704 + /gene="mnaA" + /locus_tag="SPC09N_0010" + /EC_number="5.1.3.14" + /note="member of homology group 23" + /codon_start=1 + /transl_table=11 + /product="UDP-N-acetylglucosamine-2-epimerase MnaA" + /protein_id="CAI33010.1" + /db_xref="GOA:Q4K2I5" + /db_xref="InterPro:IPR003331" + /db_xref="UniProtKB/TrEMBL:Q4K2I5" + 
/translation="MKKVMLVFGTRPEAIKMCPLVNELKQNDSIKTLVCVTGQHKEML + EQVLEVFKVVPDYDLGIMKANQTLFTITTSILDKIQAVLEKEKPDLVLVHGDTTTTFA + TALAAFYMGIKVGHVEAGLRTYNLQSPFPEEFNRQTTSIIADYHFAPTEVAKENLLRE + DRKNIFVTGNTVIDALKTTVQDNYHHPILEWAKGSKLIMLTAHRRENLGKPMENMFNA + VNRILNEFEDVKVVYPIHKNPKVRELASKVFGDNERMKIIEPLEVIDFHNFMNQSYMI + LTDSGGVQEEAPSLGKPVLVMRDTTERPEGVVAGTLKLVGTEEENIYSNFKLLLEDET + EYNKMSKASNPYGDGMTCKRIVDIILEV" + misc_feature 8679..9695 + /gene="mnaA" + /locus_tag="SPC09N_0010" + /note="HMMPfam hit to PF02350, UDP-N-acetylglucosamine + 2-epimerase, score 3.6e-185" + gene 9746..10885 + /gene="wzy" + /locus_tag="SPC09N_0011" + CDS 9746..10885 + /gene="wzy" + /locus_tag="SPC09N_0011" + /note="member of homology group 83" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33011.1" + /db_xref="InterPro:IPR007016" + /db_xref="UniProtKB/TrEMBL:Q4K2I4" + /translation="MIKRKIYIICVLLSYFLPSFFTVGSMATLFALLSTLVKLFVTFD + YIPKVLLQHKVTLIDILVVLFLFFQAFAAFQSQTLYLNYVGGQFFLLGLYSFLKHFLL + LDCKTTIKSLFLTFILFLCVQVITQLLFPVGFDSLHPTGDNRLYFLGRKNIATPYIIV + GLGGFYLLNKKMNEFISLKEIIFLGLFGILSFLTQSSTAIICYGLFIFIRLLGLKENI + GKLYSLVSMAVYVCFSLSIIFSQSTILSTFTAIFSKNATFSGRINIWQLAIRIFEENF + WFGRGLNVNFNAWTNGIIVNSAHNTLLDILARTGIFPGVLFIVLLMNLFLGKYRIESK + TLLAMLASFMIYITMETSSMSILLLIIVLCVYWPRGEEKLHEQVT" + misc_feature 9746..9838 + /gene="wzy" + /locus_tag="SPC09N_0011" + /note="Signal peptide predicted for SPC0330 by SignalP 2.0 + HMM (Signal peptide probability 0.993) with cleavage site + probability 0.673 between residues 31 and 32" + misc_feature 10508..10693 + /gene="wzy" + /locus_tag="SPC09N_0011" + /note="HMMPfam hit to PF04932, O-Antigen Polymerase, score + 1.4e-08" + gene 10869..11738 + /gene="wcjB" + /locus_tag="SPC09N_0012" + CDS 10869..11738 + /gene="wcjB" + /locus_tag="SPC09N_0012" + /note="member of homology group 84" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33012.1" + /db_xref="GOA:Q4K2I3" + 
/db_xref="UniProtKB/TrEMBL:Q4K2I3" + /translation="MSKLLNTIYYRLFRLYKKIYLQVFSKKTVDILGEKANLENELIV + SFTTIPSRLNYLPSMIKSIFNQTIIPNRFIMYVYKDEFEGINLESILELEIKNGLEIV + YVDENLRSHKKYFYAMKDNPNSIVVLVDDDIIYPRNTIKKLIASYRIYPQCVSAMRCH + RIKLFSDGSLYPYNQWEYEISGATIPSYFNFFTSGGGTLFPPCTRNEDLFNKKNIREL + SFLADDVWLNFLVVKNGIKTVKATRYKGTPLTIDDNPEESLVYLNTVYDNNNDKCIRN + MVEYYQINFTEDK" + gene 11738..13162 + /gene="wzx" + /locus_tag="SPC09N_0013" + CDS 11738..13162 + /gene="wzx" + /locus_tag="SPC09N_0013" + /note="member of homology group 85" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33013.1" + /db_xref="GOA:Q4K2I2" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q4K2I2" + /translation="MNVEKNLKRGIFYTAIGKYSNVVIQLLVTAILSRILSPVEYGIV + AVVNVFLLFFQMLADSGIGPAIVQNKELNKSDLISIFSLTIYSGIVLSCIFALLGYPM + GVLYGETIYVSLFPLLGLCVLFYTITIVPQAILMKTMNFKIVNFLTIFSNIASGLVGV + ILAVSHFGVYSLIFSNIVKAMVLFIALYSKAKINFYWKVSKSSIGKIFEFSKFQFLFN + FWNYFARNLDNLLIGRLISPSDLGYYDKAYQLSLYPNQILSQVVTPALHPIMSNFQDN + ISKIGEVYLQISRIFVIVGIPISAYLYFNAQYVVTFMFGDNWSQSVPVFQILAATIWL + QMANSPTGAFYQATNQTKLLFRIGLLTSFINILAIVIGVMLQSIQCVAYMLLISFSLS + LVINTLYLTKKVLNISAQKYIKPILINLTIISPYIVFNLFISDFVNDLILHLSVQFVI + LFLIWGIGMYISGEYRRVFAVIRK" + misc_feature 11756..12559 + /gene="wzx" + /locus_tag="SPC09N_0013" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 9.2e-29" + gene 13175..14377 + /gene="wcjC" + /locus_tag="SPC09N_0014" + CDS 13175..14377 + /gene="wcjC" + /locus_tag="SPC09N_0014" + /note="member of homology group 86" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33014.1" + /db_xref="GOA:Q4K2I1" + /db_xref="InterPro:IPR001296" + /db_xref="InterPro:IPR009695" + /db_xref="UniProtKB/TrEMBL:Q4K2I1" + /translation="MKILFVNMFYNEAGGAQKSTKFLAEQLVKEGHEVFAYSDDAIDS + DIDEVINRVKIFRRRTPLFSLHYIFSAKKNPAKHFFYKIFETYNVFAKRKFINIIEEV + QPDIVHFNTISGMSLSIVKEAKKRNIRTVWTLRDYWLEYPWGEKDISLIKLLNRIYRP + 
FVKKSLRHLDIVTAPSAFTLNNFINKGFINPSSQKCMVIENAVIFSKGKLENIIKQKQ + ETKRNPEKTNFLFVGSILEIKGVFNLVKAFKKLTSPEISLKIVGKGKDLEKLQKEIES + DPRIQYLGFQDTETLYKTYQNSDVLVVPSAWDEPFGRVVIEGNANGLPVITSDRGGLP + EIVQTVGGGEIFTDESGNTLYSLLKKFVEMENYNVYYQCILENIDIYSIEKQSEKFTN + LYLDKEIE" + misc_feature 13811..14308 + /gene="wcjC" + /locus_tag="SPC09N_0014" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 6.6e-31" + gene 14411..15643 + /gene="ugd" + /locus_tag="SPC09N_0015" + CDS 14411..15643 + /gene="ugd" + /locus_tag="SPC09N_0015" + /note="member of homology group 20" + /codon_start=1 + /transl_table=11 + /product="UDP-glucose 6-dehydrogenase Ugd" + /protein_id="CAI33015.1" + /db_xref="GOA:Q4K2I0" + /db_xref="InterPro:IPR001732" + /db_xref="InterPro:IPR008927" + /db_xref="InterPro:IPR013328" + /db_xref="InterPro:IPR014026" + /db_xref="InterPro:IPR014027" + /db_xref="InterPro:IPR014028" + /db_xref="InterPro:IPR016040" + /db_xref="InterPro:IPR017476" + /db_xref="UniProtKB/TrEMBL:Q4K2I0" + /translation="MKIAVAGTGYVGLSIAVLLAQHHEIKAVDIVAEKVELINQKKSP + IQDDYIEKYLVEKDLNLEATMDAKYAYEDAEFVVVAAPTNYDSKKNFFDTSAVEAVIQ + QVKKINPKAVIIIKSTIPVGFTESVQKKYQYKNILFSPEFLRESKALYDNLYPSRIIV + GTDLEDTYLKDKANIFASLLKEGAIKEDIDTLFMGVTEAEAVKLFANTYLALRVSYFN + ELDTYAEVKGLDAKAIIDGIGLDPRIGNHYNNPSFGYGGYCLPKDSKQLLANYFDVPQ + NMMTATVESNRTRKDFIAQRILEKAGVSETDSLDAFKNIQDIVIGIYRLTMKSNSDNF + RHSSIQGVMKRLKAKGVTVIIYEPTLKDGETFFGNKVVNNLDKFKEASNVIVANRFEP + SLEDVSNKVYSRDIFKRD" + misc_feature 14411..15031 + /gene="ugd" + /locus_tag="SPC09N_0015" + /note="HMMPfam hit to PF01210, NAD-dependent + glycerol-3-phosphate deh, score 0.00028" + misc_feature 14411..14965 + /gene="ugd" + /locus_tag="SPC09N_0015" + /note="HMMPfam hit to PF03721, UDP-glucose/GDP-mannose + dehydrogenase, score 1.6e-52" + misc_feature 14996..15277 + /gene="ugd" + /locus_tag="SPC09N_0015" + /note="HMMPfam hit to PF00984, UDP-glucose/GDP-mannose + dehydrogenase, score 1.6e-35" + misc_feature 15371..15622 + /gene="ugd" + /locus_tag="SPC09N_0015" + /note="HMMPfam 
hit to PF03720, UDP-glucose/GDP-mannose + dehydrogenase, score 1.3e-05" + gene order(15943..16137,16139..16249,16278..16712) + /gene="tnp" + /locus_tag="SPC09N_0016" + /pseudo + CDS join(15943..16137,16139..16249,16278..16712) + /gene="tnp" + /locus_tag="SPC09N_0016" + /note="member of homology group 19" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1381 transposase" + misc_feature join(16184..16249,16278..16652) + /gene="tnp" + /locus_tag="SPC09N_0016" + /note="HMMPfam hit to PF01609, Transposase DDE domain, + score 3.7e-09" + /pseudo + gene 16705..17397 + /gene="wcjE" + /locus_tag="SPC09N_0017" + /pseudo + CDS 16705..17397 + /gene="wcjE" + /locus_tag="SPC09N_0017" + /note="member of homology group 18; + This is suspicious. The database match Q8KWN9 suggest that + the sequence match continues into the upstream + transposase" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase (pseudogene)" + /db_xref="PSEUDO:CAI33017.1" + gene 17572..>17619 + /gene="aliA" + /locus_tag="SPC09N_0018" + CDS 17572..>17619 + /gene="aliA" + /locus_tag="SPC09N_0018" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33018.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ89" + /translation="MMKSSKLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaaatgac tgactagaat gagcaaacct caagtttttg aagcttgagg ttttttacta + 181 tagtggattg aaactagaat agtgcacctc tgcttctaaa acattgttag aaatcgattt + 241 gactgtcccg atcgatttgt cctattctta tttcattttg ctatacttgt agttgaggag + 301 aattaagctc ctcactagta aactcttcat aatccttttt atttttataa agatattgtt + 361 tgaaagatgt gagtttccac ggatgggttt gtggagggat atacttgcgt ctttcttttt + 421 ttgttctggt tcttgttcaa agtttttcga atagagttca tgatttagta gctcctttgt + 481 gtgatagatt ttgtcagcga tattgaggta gatgtctccg tcaaatgctt ttataactaa + 541 tgctttcgtc tttctgatga aatagacttc ttttccttgt tcggtaggga tatagtaacg + 601 attttggaat 
cggatatggt gtccactatc gacgactctc tccgccagtc tagccagaat + 661 gagattcctt tcagaggggt taggaacctc ctcgaagaca gagagttttg tcttgtttcc + 721 aaactgttca ttaaaggttt gaatgtagga aagcaggaag gtattggctt cttccaaggt + 781 atgaatattg ttttgttcca gttcgatagg caggcgagat tgtagtgtct gattgagtct + 841 ttcgactctc cctttagctt gagggataga ggttgtctca aggagaatcc ctagttggtg + 901 acaggcgtat ccaaactgtg tatgggtatc gtcctccatt ttcttagagt tggaggcttg + 961 ataggtaaag accgttctct tatctgtttt aatttgaagg ggaatgccgt gattggctaa + 1021 gatttgttcg aggacatgat agtaagcatt caagttctct tgtttatcaa aataagcgcc + 1081 taggatattg ccagaagcat catcaatggc taagtgtaag ttagatgttt gggctccaaa + 1141 ctaggcatga gggctggcat ccatttgaat gagttcacca gcaaatttct ttctgggtct + 1201 actaggatgt acttttttag ggtcttcaag gaagttttca gccgtcggta agattggatt + 1261 gtctaggggt tgattcaggt tcagtttagc ttgttttctt actctcttct ttgtctttct + 1321 atgggactta ggcgacagga tatttttctt atagagtatt tttctaacag tagtatcaga + 1381 gagctgaatt ccttcttctt cagctagcaa ttcacagaaa tgaaggacat ttggtttata + 1441 tgtttcatag gagaggtatt tttttaggag acgttctttg atttcatcag ggattgcatg + 1501 ttttggtttt cgatttctgt ttccgtgtct gaaggcttct tttcctttca gttgataggc + 1561 tagtagcaga cgattgattt gtctttcaga aagattgagc tcgacacagg ctcgtttctt + 1621 tgttttcttt ccttgggcta tagcttttat cacaagatat tttttcgttt cattcatatt + 1681 cagttggatc cttttcatat gactattcta ccaaatggga cattttcacg ttcgatttac + 1741 taaagacatt atcacattcg aattacacaa gatgcagata gtgaaaataa aggtgtagac + 1801 attaccgtaa aaaagtgata taattgtatg atgttcaatg tataggtgtt aatcatgagt + 1861 agacgtttta aaaaatcagg ttcacagaaa gtgaagcgaa gtgttaatat cgttttgctg + 1921 actatttatt tattgttagt ttgtttttta ttgttcttaa tctttaagta caatatcctt + 1981 gcttttagat atcttaatct agtggtaact gcgttagtcc tactagttgc cttagtaggg + 2041 ctactcttga ttatctataa aaaagctgaa aagtttacta tttttctgtt ggtgttctct + 2101 atccttgtca gctctgtgtc gctttttgca gtacagcagt ttgttggact gaccaatcgt + 2161 ttaaatgcga cttcgaatta ctcagaatat tcaatcagtg tcgctgtttt agcagatagt + 2221 gagatcgaaa atgttacgca actgacgagt gtgacagcac 
cgactgggac tgataatgaa + 2281 aatattcaaa aactactagc tgatatcaag tcaagtcaga ataccgattt gacggtcaac + 2341 cagagttcgt cttacttggc agcttacaag agtttgattg caggggagac taaggccatt + 2401 gtcctaaata gtgtctttga aaatatcatc gagtcagagt atccagacta cgcatcgaag + 2461 ataaaaaaga tttataccaa gggattcact aaaaaagtag aagctcctaa gacgtctaag + 2521 aatcagtctt tcaatatcta tgttagtgga attgacacct atggtcctat tagttcggtg + 2581 tcgcgatcag atgtcaatat cctgatgact gtcaatcgag ataccaagaa aatcctcttg + 2641 accacaacgc cacgtgatgc ctatgtacca atcgcagatg gtggaaataa tcaaaaagat + 2701 aaattaaccc atgcgggcat ttatggagtt gattcgtcca ttcataccct agagaacctt + 2761 tatggtgtag atattaatta ttatgttcgt ttgaatttta cctcattttt gaaattgatt + 2821 gacttattgg gaggggtaga tgttcataat gatcaagagt tttcagctct acataggaag + 2881 ttccttttcc cagtagggaa tgtccatcta gactctgagc aggctctagg ttttgtacgt + 2941 gaacgctact cactagccga tggagaccgt gaccgtggtc gcaaccaaca aaaggtgatt + 3001 gtggctattc ttcaaaaatt aacgtcaacc gaagcactga aaaattatag tacgatcatt + 3061 aatagcttgc aagattctat ccaaacaaat atgccacttg agactatgat aaatttggtc + 3121 aatgctcagt tagaaagtgg tggaacttac aaagtgaatt ctcaagattt aaaagggaca + 3181 gatcggatgg atcttccttc ttatgcaatg cctgacagta acctctatgt gatggaaata + 3241 gatgatagta gtttagctgt agttaaagca gctatacagg atgtgatgga gggtagatga + 3301 aatgatagac atccattcgc atatcgtttt tgatgtagat gacggtccca agtcaataga + 3361 ggaaagcaag gcacttttaa gagaagctta taatcaagga gttcgaatga ttgtgtctac + 3421 ttcgcatcgt cgaaaaggga tgtttgaaac tccggaagag aagatagcag aaaactttct + 3481 tcaggttcgg gaaattgcaa aagaagtagc agatgattta gtcatagctt atggcgcaga + 3541 gatatactat actctggatg ctctagaaaa gctagaaaaa aaagaaattc ctacccttaa + 3601 tgatagtcgt tatgctttga ttgagtttag catgcatact tcctatcgtg agattcatgc + 3661 gggattgagc aatattttga tgttgggaat cacgccagta attgctcata ttgaacgtta + 3721 tgatgcctta gagaataacg aaaaacgtgt tcgtgaactg attgatatgg ggtgctatac + 3781 tcagataaat agttatcatg ttttaaaacc taagttcttt ggtgaaaaat ataaattcat + 3841 gaaaaagaga gctcggtatt ttttggaacg tgatttagtt catgtagttg caagtgacat + 3901 
gcacaattta gacagtagac ctccatatat gcaacaggca tatgatatca ttgctaagaa + 3961 atatggagcg aaaaaagcga aagaattttt tgtagataat cccagaaaaa ttataatgga + 4021 tcaattaatt taggagaaaa tatgaaggaa caaaacactt tggaaatcga tgtattgcaa + 4081 ctattcaggg ctttatggaa aagaaagttg gtcattttat tagtggcaat tataacttct + 4141 tcagttgctt ttgcctacag tacttttgtt atcaaacctg agtttactag tacgactcgg + 4201 atttatgtag ttaaccgtaa tcaggaagag aagtctggtt taaccaatca agacttgcag + 4261 gcaggatcat acttggttaa agactatcgt gaaattatcc tatcgcagga tgttttggag + 4321 gaagttattt ctgatttgaa actagatttg acgccaaaag gtttggctaa taaaattaaa + 4381 gtaacagtac cagttgatac ccgtattgtc tctgtctcag ttaatgatcg agttcctgaa + 4441 gaggcaagcc gtatcgctaa ctctttgaga gaagtagctg ctcaaaaaat tatcagtatt + 4501 actcgtgttt ctgatgtgac aacactggag gaggcaagac cggcgatatc accatcttcg + 4561 ccaaatatta aacgcaatac actaattggt tttttggcag gggggattgg aactagtgtt + 4621 atagttcttc ttcttgaact tttggacact catgtgaaac gtccggaaga tatcgaagat + 4681 acactgcaga tgacactttt gggagttgta ccaaacttga gtaagttgaa ataggagaga + 4741 ggaatgccga cattagaaat agcacaaaaa aaactggagt tcattaagaa ggcagaagaa + 4801 tattacaatg ccttgtgtac aaatatacag ttgagcggag ataaactaaa agtaatttcc + 4861 gttacttctg ttaaccctgg ggaaggaaaa acaactactt ccgtaaatat agcaaggtcg + 4921 tttgcgcgta caggctataa aactcttttg atcgatggcg atactcgaaa ttcagttata + 4981 tcaggagttt ttaaatcgcg tgaaaaaatt acagggctaa cagaattttt atctgggaca + 5041 gctgatttat ctcacggttt atgtgataca aatattgaaa atttatttgt aattcaatcg + 5101 ggatctgtat caccaaaccc tacagccttg ttacaaagta aaaattttaa tgatatgatt + 5161 gaaacattgc gtaaatattt tgattatatc attgttgata cagcacctat tggaattgtt + 5221 attgatgcgg caattatcac tcaaaagtgt gatgcgtcca tcttggtaac agcaataggt + 5281 gaggtgaata aacgtgatgt ccaaaaagcg aaacaacaat tagaacaaac agagaaactg + 5341 ttcctaggag ttgttttaaa taaattggat atctcggttg ataagtatgg agtttacggt + 5401 tcctatggaa attatggtaa aaaataactt aggaaagatt ttatggatga aaaaggattg + 5461 aaaatttttc tagcagtaat acagagtatt attgtcattt tattggttta ttttcttagc + 5521 tttgttagag agacagaact 
tgaacgttct tcgatggtta tactatacct tctccacttt + 5581 tttgtattct attttagttc ctatggtaac aattttttta aaagagggta cctagttgag + 5641 tttaatagta ctataagata tatttttttc tttgcaatag ctataagtgt attaaacttt + 5701 tttatagcgg aacggtttag tatctctaga agaggaatgg tatacttctt aactttagaa + 5761 ggaatatcct tatacttgtt aaatttctta gtaaagaaat attggaagca tgtgtttttt + 5821 aatctaaaaa atagcaagaa aattttactg ttaacagtaa cgaaaaatat ggaaaaagtt + 5881 cttgataaat tgctagaatc tgatgaactt tcatggaaat tggtagcagt aagtgttttg + 5941 gataaatctg attttcaaca tgataaaata cctgtaattg aaaaggaaaa aattattgaa + 6001 tttgcaacgc atgaagttgt ggatgaggtg tttgtcaatc ttccaggaga gagctacgat + 6061 attggagaaa ttatctctag gtttgagaca atggggatag atgtaactgt aaatcttaaa + 6121 gcatttgata agaatttggg tcgcaataaa caaattcatg agatggtagg attgaatgta + 6181 gtcactttct ctacaaattt ttataaaact agtcatgtga tttcaaagag aattctcgat + 6241 atttgtggtg ccactattgg ccttattctt tttgctatag ctagtctagt tttagttcca + 6301 ttgattcgta aagatggcgg atcagctatt tttgctcaaa ctcgtatagg gaaaaatggt + 6361 cgacatttta ccttttataa attccgttcg atgcgaatcg atgctgaagc tatcaaagaa + 6421 cagttgatgg atcaaaatac gatgcaaggt ggtatgttta agatagacaa tgatcctcgt + 6481 gttacaaaaa ttggtcgctt tattcgtaaa actagtttag atgaattgcc gcagttttgg + 6541 aatgtcttta taggagatat gagtttggtg ggaacacgtc cacctacagt agacgagtat + 6601 gatcagtata ctccagaaca gaaacgtcga ctcagcttta aacctggtat tacaggttta + 6661 tggcaggtta gcggccgtag taaaataacc gattttgacg atgttgtaaa attagatgtg + 6721 gcttatattg ataattggac aatctggaaa gatattgaaa ttttgcttaa aactgttaaa + 6781 gttgtattta tgagagatgg agcgaagtaa ttcatatgaa tgagagaatg caaatattag + 6841 gagttactat agatccatta acgatgaaag aaacagtgga tgctgttgaa cagtatgttt + 6901 taaagaagca tcctttgcac ttgatgggag ttaacgcaga taaaattaat cagtgccatg + 6961 aagatgagaa aatcaaaaaa atcgttaatg aatcaggaat cattaatgcg gatggagcat + 7021 cagttgttct tgcaagtaag tttttaggaa cgcctgttcc tgaacgagta gcgggtattg + 7081 atttgatgca atgtctttta gagttgtcaa ataaaaaagg atattcagtt tacttttttg + 7141 gagctaaaga agaaatttta caagatatgc taaaagtttt 
taaacaaaga tatcctaatc + 7201 ttaatgttgt tggctataga aacggatatt tttcacctga agatgaaaaa aagattcagg + 7261 aagatattaa aggaggaaaa ccagattttg tatttgtagg gattacttct cctaaaaagg + 7321 agtatatcat ccaatcattc atggataatg ggattaatgc tgtctttatg ggtgttggtg + 7381 gcagttttga tgtattatca ggacacatta aacgagctcc attatggatg caaaaattga + 7441 atctggaatg gttgttccgt gtagttaatg aacccaaacg cctttttaag cgttatttta + 7501 tagggaatgt tacttttatt aagcgagttt tagatgaaaa gcgaaaatca aaaaaataat + 7561 attctacata tttctcgtac aatggatatt ggtggtgcag aacgtattgt atatcaattg + 7621 agttctgatt tgaaagatga atttgatagt gtccatgtcg cttcaacagg tggactatgg + 7681 gagagcaaac ttttatcaaa aggagttcaa catcataaaa ttttagatgt tgacagtaag + 7741 aatcccctaa ctatggtaaa gatcctttca agtttttata gaattatcaa aaataatgat + 7801 attaccattg ttcacactca tcatcggatg gctgcctttt atattcgctt gttgaaaatc + 7861 attaatccta agttgataca tgtttacact gcacataatg tatttaaaaa taaattacca + 7921 ttatacaaat tttccttaaa aaaagcgtat tgtgtagctg taagtaaagc ggttaatgat + 7981 aatttgaaac atgatgtagg aatcagtgat agtacagtaa tctataatgg ggttgttttt + 8041 gaaaaaactg ataagctagt tggtgaaatt gtaaactata acggaatcaa attggggtgt + 8101 attgctaggt tatcagagca aaaaggattg acctacctaa ttgatgcgat gtctttagtg + 8161 aaacacagga atattacgtt gttcattgtc ggagatggag agcttcgaga tgagcttgaa + 8221 aacaaggtga aacaattaaa tcttcaaaaa tcagtgatat ttttaggtta tcgaaaagat + 8281 attgttgaat gtatcaatag ttttgattac ttagtgtcat catctttata tgaggggttt + 8341 ggtctaaatg caattgaagc atttatgaag gggaaaacga tggtttcatc agatatccca + 8401 ggaataaatg aagtagtcaa taacaaaaat gggattcttg ttcctgttaa ggatgatgtt + 8461 gccttagcga gagcgattga aaagcttgcg actgacaaaa aacttagaga aaaactcgct + 8521 tatcaagcaa aaaaagatta tgagacaaaa tttaattatt ccttgttttt ggataattat + 8581 cggagacttt atagaaaatt aatgggagaa tcaaaatgaa aaaagtcatg ttggtttttg + 8641 ggacacgtcc agaagctatt aaaatgtgtc ctttagtaaa tgaactgaaa caaaatgatt + 8701 caatcaagac acttgtgtgt gtaactggtc aacataagga aatgttagag caggttttag + 8761 aggtgttcaa ggttgtccca gattatgatt tgggtatcat gaaagcaaat cagaccctat + 8821 
ttaccattac gactagtatc ttggataaaa ttcaggcggt tctagagaaa gaaaaaccag + 8881 atcttgttct tgttcatgga gatactacaa caacatttgc gacagcttta gcagcatttt + 8941 atatgggaat caaagtggga cacgtcgaag caggtctcag aacctataat ctccaaagtc + 9001 catttccaga ggaattcaat cgccagacaa cttctatcat tgccgactat cattttgcgc + 9061 cgactgaagt tgcgaaggaa aatctactaa gagaggacag aaaaaatatc tttgtgacgg + 9121 gaaatacagt cattgatgct ttgaagacga ctgttcaaga taactaccat cacccaattt + 9181 tagaatgggc aaagggtagt aagttaatca tgctaacggc tcatcgacga gaaaatcttg + 9241 ggaaaccgat ggaaaacatg tttaatgctg ttaatcgaat tttaaacgaa ttcgaagatg + 9301 taaaagttgt atatcccatc cataaaaatc ctaaggttcg agaattagca agtaaagttt + 9361 ttggcgataa tgaacgaatg aaaatcattg aaccgttaga ggttattgat tttcataatt + 9421 ttatgaatca aagctatatg attttgacag attctggagg tgtacaggaa gaagcacctt + 9481 ctttaggaaa acctgtcttg gtgatgcgtg atacaacaga gcgtcctgag ggggtcgttg + 9541 ctggcacgtt gaagttggta ggaacagaag aagagaatat ctatagcaac ttcaaacttc + 9601 ttcttgaaga tgaaacagaa tataacaaga tgagcaaagc tagcaaccct tatggagatg + 9661 gaatgacttg taaacggatt gttgatatta ttctggaagt ataaaaataa ttcaattatg + 9721 gatgaggaaa gaataaatta gattgatgat aaaaagaaaa atatatataa tctgtgtatt + 9781 actgtcgtat tttttaccta gtttttttac agttggatca atggcgactt tatttgcttt + 9841 gctttctact ttagttaagc tatttgtaac ttttgattat attcccaaag ttcttttaca + 9901 gcataaagta acactgattg atattctagt tgttctattt ttattttttc aagcatttgc + 9961 agcttttcaa agccaaacgt tgtaccttaa ctatgttgga ggtcagtttt tccttttagg + 10021 actatattca tttttgaaac actttttatt gttggattgt aaaacaacaa taaaaagcct + 10081 ctttttaacc tttatcttgt ttttgtgtgt tcaagtaata actcaattgc tttttccggt + 10141 cggtttcgat tctttgcacc ctacaggaga taatagactt tactttttag gaagaaagaa + 10201 catagctacc ccgtatatca ttgttggatt aggtggtttt tacttattaa ataaaaaaat + 10261 gaatgagttt atatcactaa aggagattat ttttttagga ttgttcggaa ttttatcatt + 10321 tttaacacaa tccagtacag cgattatatg ttatgggctt tttattttca tacgtctatt + 10381 gggattaaag gaaaatatag gaaaactata ttctttagtc agtatggctg tatatgtttg + 10441 tttttctctt 
tctataatct tttcacaaag tacaatttta tcaactttta cagcgatttt + 10501 ttccaaaaat gcaacttttt caggacgtat caatatttgg caattagcga ttcgtatttt + 10561 tgaagagaat ttttggtttg gacgaggcct caacgttaat tttaatgctt ggacaaatgg + 10621 gattatcgtt aattcagcac acaatacctt attagatata cttgctcgaa ctggtatatt + 10681 tccaggtgtt ttatttatag tgcttcttat gaatctgttt cttggaaaat atagaataga + 10741 atcaaaaaca ctgttggcta tgttagcctc atttatgatt tatattacaa tggagacttc + 10801 atctatgagc atattgctgc taattattgt tctttgtgta tattggccac gtggagagga + 10861 gaagttgcat gagcaagtta cttaatacca tctattatcg actatttaga ttatataaaa + 10921 aaatttatct acaagttttt agtaaaaaaa cggttgacat cttgggtgaa aaggctaatt + 10981 tagaaaatga actaattgtt tcgtttacaa caattccaag tcgtcttaat tatttaccaa + 11041 gtatgattaa aagtattttc aatcagacaa ttatccctaa ccgttttatt atgtatgttt + 11101 ataaagatga atttgaaggc attaatttgg agagtattct agaacttgaa atcaaaaatg + 11161 gtttggaaat tgtctatgtg gatgagaatc ttcgttcaca caaaaaatat ttttatgcta + 11221 tgaaggataa tccgaacagt atagttgttc tagttgatga cgatatcatt tatcctcgaa + 11281 atactataaa gaaactgatt gcatcctata gaatttatcc acagtgtgtt tcagcaatgc + 11341 gatgtcatcg aattaagttg ttttctgatg gaagtttata tccatataat caatgggaat + 11401 atgaaatatc aggagctact ataccatcgt attttaattt ttttactagc ggaggtggga + 11461 cattatttcc tccatgtact cgcaatgagg atctttttaa taaaaaaaat atcagggaac + 11521 tcagttttct agctgatgat gtatggttga attttttggt agtcaaaaat ggaattaaaa + 11581 cagtaaaagc aacacgatat aaagggacac cattaactat agatgacaat cctgaggaga + 11641 gtttggtata tttgaatacc gtatatgata acaacaatga taaatgtatt agaaatatgg + 11701 ttgaatatta tcaaattaat tttacagagg ataaataatg aatgttgaaa aaaatttgaa + 11761 acgtggaatt ttctatactg caatagggaa gtattcgaat gtagttattc aattacttgt + 11821 aacagcaatt cttagccgga ttctctcacc tgtagaatat ggtatcgtag cagtagtaaa + 11881 tgtatttctt ttattttttc aaatgttagc agattcagga ataggacctg ctattgttca + 11941 aaataaagaa ctgaataagt cagatttaat cagcattttc tcattaacga tttatagtgg + 12001 aatcgtactt tcttgtattt ttgctttact aggatatcct atgggggtgt tatacggcga + 12061 aactatttat 
gttagtttat ttccgctttt aggtctttgt gttttatttt ataccattac + 12121 aattgtaccg caagctattc taatgaaaac gatgaacttt aaaatagtta attttctaac + 12181 tattttttct aacattgcta gtggcttggt gggcgttatt ctagcggtat cacattttgg + 12241 tgtctattct ctaatttttt ctaatattgt aaaagcaatg gttttattta tcgctttata + 12301 ttctaaagca aagataaatt tctattggaa agtttcaaaa agttctattg gtaaaatttt + 12361 tgagttttca aaattccaat ttttgtttaa tttttggaat tattttgcta gaaatttaga + 12421 taatttatta attggacgat tgattagccc gtcagatctt ggttattatg ataaggctta + 12481 tcaattatct ttgtacccta atcaaatttt atcacaggtt gtgacaccag cattgcatcc + 12541 tattatgtcc aattttcaag ataatatcag taagataggc gaagtttatc ttcagatttc + 12601 tagaatattc gtaatagttg gcatacctat ttcggcttat ttatacttta atgctcaata + 12661 tgttgttaca tttatgtttg gagataattg gtcccaaagc gttccggtgt ttcaaatatt + 12721 agcagcaaca atttggttac aaatggctaa tagccctact ggtgcatttt accaagcaac + 12781 taatcagaca aagttattgt ttagaattgg cttattgaca tcttttatta atattttagc + 12841 tattgttatt ggtgtaatgt tgcaaagcat ccaatgtgtt gcgtacatgc ttttgatttc + 12901 tttcagtctt agtttagtaa tcaatactct ttacttaaca aaaaaagtat taaatatttc + 12961 tgctcaaaaa tatataaaac cgatattaat taatttgaca attatcagtc cctatattgt + 13021 gtttaatttg tttatctcgg attttgtaaa cgaccttatt ttacatttat cagttcagtt + 13081 tgttatttta tttttaatat ggggaattgg gatgtatatt agcggagagt atcgacgagt + 13141 cttcgcggtt ataagaaaat aaaggagcaa ttttgtgaaa attttatttg tgaatatgtt + 13201 ttataatgaa gcaggaggtg cacaaaagag caccaaattt ctagctgaac aacttgtaaa + 13261 agaaggacat gaggtatttg catactctga tgatgccatt gattcagata ttgatgaagt + 13321 tattaatagg gttaagattt ttagaagaag aaccccgctt tttagtcttc actatatttt + 13381 cagtgctaag aagaatccag ctaaacattt tttctataaa atatttgaaa cctataatgt + 13441 atttgcgaaa agaaaattta tcaatatcat tgaggaagta caaccagata ttgttcactt + 13501 taatacaatt tcaggaatgt ctttatcaat agttaaagaa gctaaaaaga gaaatatcag + 13561 gaccgtttgg accttgcgag actattggct agaatatcca tggggtgaga aagatatttc + 13621 tcttatcaaa cttctaaata gaatatatag accttttgtt aagaaaagtt taagacactt + 13681 agacatagta 
acagcaccat cagcatttac tttgaataat tttatcaata aaggatttat + 13741 taacccatct tctcaaaaat gtatggtcat tgaaaatgct gttatatttt caaagggtaa + 13801 gttggaaaat attatcaaac aaaagcaaga aacaaaaaga aatccagaaa aaacgaattt + 13861 tctttttgta ggttctatac ttgaaataaa gggcgttttt aacttagtaa aggcctttaa + 13921 aaaactaact agtccggaaa tttctttgaa aattgtagga aaaggaaaag atttagaaaa + 13981 acttcaaaaa gaaattgaga gtgatcctag aatacaatat ttaggctttc aagatacaga + 14041 aaccctctat aaaacttatc aaaattcgga tgtattggtc gtcccatctg cttgggatga + 14101 accgtttggt agagttgtaa ttgaaggaaa tgcaaatggc cttcctgtca tcacttcaga + 14161 tagaggtgga ttacctgaaa ttgtgcaaac agtaggagga ggagaaattt ttacagatga + 14221 atcgggaaat acattatata gtcttttaaa gaaatttgta gaaatggaaa actacaatgt + 14281 ctattaccaa tgcattcttg agaatattga tatttattct atcgaaaaac aaagtgaaaa + 14341 gttcactaat ctgtatttag ataaagaaat cgaataataa gttgtttttg tagcagtaac + 14401 ggaggtaatt atgaaaatag cggtagcagg aacaggttat gtaggattat caattgctgt + 14461 gttgttggca caacatcacg aaataaaagc agttgatatt gttgctgaaa aagttgaatt + 14521 aatcaatcaa aaaaagtctc caattcagga tgattatatt gaaaaatatt tagtggaaaa + 14581 agatttaaat ttggaagcaa ctatggatgc taagtatgct tatgaagatg cagaatttgt + 14641 tgttgttgca gcaccaacaa attatgattc gaaaaagaac ttttttgata catcagcagt + 14701 agaggcggtc attcaacaag taaaaaaaat taatcccaaa gcggtaataa ttattaaatc + 14761 tacaatccct gttggattca cagagtccgt tcaaaagaaa tatcagtata aaaatatctt + 14821 atttagtcca gaatttttac gcgaatctaa agcattatac gataacctgt atccaagtcg + 14881 catcattgtt ggaactgact tagaagatac ttatttaaaa gacaaagcta atatatttgc + 14941 ttccctacta aaagaggggg ctattaaaga agacatagat acacttttca tgggagtaac + 15001 ggaagctgag gcagttaaat tatttgccaa tacctacctt gcgttgcgtg tttcttactt + 15061 taatgaattg gatacttatg cagaggtgaa aggtttggat gcaaaagcca ttattgatgg + 15121 tattggccta gatccacgta taggaaatca ttataacaat ccatcctttg gctacggtgg + 15181 gtattgttta cctaaagata gtaagcagtt attagcaaat tactttgatg taccacaaaa + 15241 tatgatgaca gcaactgttg aaagcaatcg aacgcgtaag gattttatcg ctcaacggat + 15301 tttagaaaaa 
gctggagtat ctgagactga tagtttagat gcgtttaaga acatacaaga + 15361 tattgttata ggtatttatc gtttaacaat gaaaagtaat tcggataact tccgtcactc + 15421 ctctattcaa ggcgttatga aacgattgaa agctaaggga gttacggtta tcatctatga + 15481 gccaactttg aaggacgggg aaacattctt tggtaataaa gtggtaaata atctagataa + 15541 atttaaagaa gctagtaatg ttattgtagc caatcgtttt gaaccttcac tagaggatgt + 15601 gtctaataaa gtttatagtc gagatatatt taagcgtgac taataaatac gtccacgtga + 15661 cgtaatatct attaaatgaa taaaatatta ataaacatgg catcgatatc ttttttggac + 15721 ttgaattgtc aaattaagtg cacatttttt tcatagaaaa cttcataagg tgttttccgg + 15781 ttaagacatt ttcgtggtct attatctaag ttggtttata taatagactt cctgcgaaac + 15841 aaaatatggt ataatagttc tatgaattat gaagcaagta aacaactaac cgatgtacga + 15901 tttaagcgtc ttgttggtgt tcaacgcacg acttttgaag agatgttagc tgtattaaaa + 15961 acagcttatc aacttaaaca cgcaaaaggt ggacgaaaac ctaaattaag cctagaagac + 16021 tttcttatgg cgactcttca ataagtgcga gaataccgca cttatgaaca aattgcggct + 16081 gattttggta ttcacgaaag caacttaatc cgtcggagct aatgggttga agtaactctt + 16141 gttcaaaggt ggtgttacga tttcaagaac tcctctcagt tctgaggaca cggtaatgat + 16201 tgatgcgacg gaagtaaaaa tcaatcgccc taaaaaaaga attagcgaat tattctggta + 16261 aaaagaaatt tcacgctatg aagactcaag cgattgtcac aagtcaaggg agaattgttt + 16321 ctttggatat cactgtgaac tattgtcatg atatgaagtt gttcaaaatg agtcgcagaa + 16381 atatcggaca agctggtaaa atcttggctg acagtggtta tcaagggctc atgaagatat + 16441 atcctcaagc acaaattcca cgtaaatcca gcaaactcaa gccgctaata gctgaagata + 16501 aagcctataa ccatgcactg tctaaggata gaagcaaggt tgagaacatc cttgccaaag + 16561 taaaaacgtt taaaatgttt tcaacaacct atcgaaatca tcgtaaacgc ttcggatatt + 16621 ttaggcatac tatatatttt ttattcaatt attcactttt gtattcaaaa ggttgcgggt + 16681 gcctctgtcc gagtacccac tatgatattt aacctattga atatctataa atttcctctg + 16741 ggagtttcat ggtatctata tacgttatgg tcgatattga tagtttatgg tttactatct + 16801 gttgttttca aaaatcgtaa gtcccttttg ttagttagtg tttttgccta tattttcaca + 16861 ctatttattc aaactgatat ttttattgtg caacggacgt tggtttgggg gatttgtttc + 16921 tttcttggca 
gtgtattgag tgaaattcac tttgataaaa ttaatttgaa aaaatttctt + 16981 tttttctttg tgttatttga ttttatttat atgttcgctt ggttcttgtt ttatgaagta + 17041 gggtctaaga aggattatgt aagctatatt aacccaggtt tgtgggggat tgcttttatt + 17101 gtctgtgtat tagttgcttt tgcgattttt cctaaaatgg agaaaaattt tcctaaaact + 17161 ttcctatatt tcactaaata cgggaaagat agtttaggga tctatattct tcatgcacca + 17221 atttgtagca tgattcggat tctaatgttg aaagtgggaa taaactcagt ttttcttcac + 17281 gttgttgttg ggattgtgct aggctggtat ttatccatac tagcaactta tatattgaaa + 17341 aaaattccat ttttgaatat tgttttatta ccacaaaagt atattaaatt aaaataaatt + 17401 attttagatt tataatgtgg ctctttgtca actaacatct ggagaggaca atcactgtct + 17461 tctctttttt tgtcttttca gaatatacca aattaacaca aaaattctga aaattctgtt + 17521 gacatctttc tgaaaagagt ttataatgga gagaaagttt taaaggagaa aatgatgaaa + 17581 agttcaaaac tacttgccct tgcgggcgtg acattattg +// + diff --git a/public/res/serotype_genbank/serotype_9V.gb b/public/res/serotype_genbank/serotype_9V.gb new file mode 100644 index 0000000..8fa4eaf --- /dev/null +++ b/public/res/serotype_genbank/serotype_9V.gb @@ -0,0 +1,900 @@ +LOCUS CR931648 20856 bp DNA linear BCT 26-JUL-2016 +DEFINITION Streptococcus pneumoniae strain 980/68 (serotype 9v). +ACCESSION CR931648 +VERSION CR931648.1 +KEYWORDS . +SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 20856) + AUTHORS Bentley,S.D., Aanensen,D.M., Mavroidi,A., Saunders,D., + Rabbinowitsch,E., Collins,M., Donohoe,K., Harris,D., Murphy,L., + Quail,M.A., Samuel,G., Skovsted,I.C., Kaltoft,M.S., Barrell,B., + Reeves,P.R., Parkhill,J. and Spratt,B.G. + TITLE Genetic analysis of the capsular biosynthetic locus from all 90 + pneumococcal serotypes + JOURNAL PLoS Genet. 2 (3), E31 (2006) + PUBMED 16532061 +REFERENCE 2 (bases 1 to 20856) + AUTHORS Bentley,S.D. 
+ TITLE Direct Submission + JOURNAL Submitted (09-DEC-2004) Submitted on behalf of the Pathogen + Sequencing Unit, Sanger Institute, Wellcome Trust Genome Campus, + Hinxton, Cambridge CB10 1SA, E-mail: sdb@sanger.ac.uk +COMMENT NOTE: This sequence was generated from a PCR product representing + the region from dexB to aliA and is not necessarily responsible for + the expressed capsule serotype. For a detailed description of how + CDS products were predicted see the associated publication. +FEATURES Location/Qualifiers + source 1..20856 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="980/68" + /db_xref="taxon:1313" + gene <1..137 + /gene="dexB" + /locus_tag="SPC09V_0001" + CDS <1..137 + /gene="dexB" + /locus_tag="SPC09V_0001" + /codon_start=3 + /transl_table=11 + /protein_id="CAI33019.1" + /db_xref="UniProtKB/TrEMBL:Q4K2K9" + /translation="SNEEQDLTVEGKVKSVLIENTLAQEVFEKQILVPWDAFCVEMTD + " + gene complement(order(284..403,412..1678)) + /gene="tnp" + /locus_tag="SPC09V_0002" + /pseudo + CDS complement(join(284..403,412..1548,1547..1678)) + /gene="tnp" + /locus_tag="SPC09V_0002" + /note="member of homology group 17" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1202 transposase" + misc_feature complement(694..1194) + /gene="tnp" + /locus_tag="SPC09V_0002" + /note="HMMPfam hit to PF00665, Integrase core domain, + score 1.8e-21" + /pseudo + gene 1853..3298 + /gene="wzg" + /locus_tag="SPC09V_0003" + CDS 1853..3298 + /gene="wzg" + /locus_tag="SPC09V_0003" + /note="member of homology group 0" + /codon_start=1 + /transl_table=11 + /product="integral membrane regulatory protein Wzg" + /protein_id="CAI33021.1" + /db_xref="GOA:Q8KWQ3" + /db_xref="InterPro:IPR004190" + /db_xref="InterPro:IPR004474" + /db_xref="UniProtKB/TrEMBL:Q8KWQ3" + /translation="MSRRFKKSGSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLLFSILVSSVSLFAVQQFVGLTNR + LNAASNYSEYSISVAVLADSEIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + 
VNQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKLIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVIVAILQKLTST + EALKNYGTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRMDLPSY + AMPDSNLYVLEIDDSSLAVVKAAIQDVMEGR" + misc_feature 1853..1969 + /gene="wzg" + /locus_tag="SPC09V_0003" + /note="Signal peptide predicted for SPC0341 by SignalP 2.0 + HMM (Signal peptide probability 0.993) with cleavage site + probability 0.538 between residues 39 and 40" + misc_feature 2057..2404 + /gene="wzg" + /locus_tag="SPC09V_0003" + /note="HMMPfam hit to PF02916, DNA polymerase processivity + factor, score 3e-61" + misc_feature 2582..3025 + /gene="wzg" + /locus_tag="SPC09V_0003" + /note="HMMPfam hit to PF03816, Cell envelope-related + transcriptional a, score 8.4e-70" + gene 3300..4031 + /gene="wzh" + /locus_tag="SPC09V_0004" + CDS 3300..4031 + /gene="wzh" + /locus_tag="SPC09V_0004" + /EC_number="3.1.3.48" + /note="member of homology group 1" + /codon_start=1 + /transl_table=11 + /product="protein-tyrosine phosphatase Wzh" + /protein_id="CAI33022.1" + /db_xref="GOA:Q8KWQ2" + /db_xref="InterPro:IPR004013" + /db_xref="InterPro:IPR016667" + /db_xref="UniProtKB/TrEMBL:Q8KWQ2" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVASDLVIAYGAEIYYTPDVLDKLEKKRIPTLNDS + RYALIEFSMNTPYRDIHSALSKILMLGVTPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLKPKLFGERYKFMKKRAQYFLEQDLVHVIASDMHNLDGRPPHMAEAYDLVT + QKYGEAKAQEFFIDNPRKIVMDQLI" + misc_feature 3303..3911 + /gene="wzh" + /locus_tag="SPC09V_0004" + /note="HMMPfam hit to PF02811, PHP domain, score 6.2e-37" + gene 4037..4732 + /gene="wzd" + /locus_tag="SPC09V_0005" + CDS 4037..4732 + /gene="wzd" + /locus_tag="SPC09V_0005" + /note="member of homology group 2" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Wzd" + /protein_id="CAI33023.1" + /db_xref="GOA:Q4K2H5" 
+ /db_xref="InterPro:IPR003856" + /db_xref="InterPro:IPR005701" + /db_xref="UniProtKB/TrEMBL:Q4K2H5" + /translation="MMKEQNTIEIDVFQLFKTLWKRKLMILIVALVTGAGAFAYSTFI + VKPEYTSTTRIYVVNHNQGNKLGLTNQDLQAGSYLVKDYREIILSQDVLEKVATNLKL + DMPAKTLASKVQVTVPDDTRIVSISVKDKQPEEASRIANSLREVAAEKIVAVTRVSDV + TTLEEARPATTPSSPNVRRNSLFGFLGGVVVTVIAVLFIELLDTRVKRPEDVEDVLQI + PLLGLVPDLNKMK" + misc_feature 4037..4153 + /gene="wzd" + /locus_tag="SPC09V_0005" + /note="Signal peptide predicted for SPC0343 by SignalP 2.0 + HMM (Signal peptide probability 0.625) with cleavage site + probability 0.411 between residues 39 and 40" + misc_feature 4058..4474 + /gene="wzd" + /locus_tag="SPC09V_0005" + /note="HMMPfam hit to PF02706, Chain length determinant + protein, score 1.7e-55" + misc_feature 4580..4657 + /gene="wzd" + /locus_tag="SPC09V_0005" + /note="PS00217 Sugar transport proteins signature 2." + gene 4742..5431 + /gene="wze" + /locus_tag="SPC09V_0006" + CDS 4742..5431 + /gene="wze" + /locus_tag="SPC09V_0006" + /EC_number="2.7.10.1" + /note="member of homology group 3" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein kinase Wze" + /protein_id="CAI33024.1" + /db_xref="GOA:Q8KWQ0" + /db_xref="InterPro:IPR002586" + /db_xref="InterPro:IPR005702" + /db_xref="UniProtKB/TrEMBL:Q8KWQ0" + /translation="MPTLEISQAKLDFVKKAEEYYNALCTNLQLSGDGLKVFSITSVK + LGEGKSTTSINIAWAFARAGYKTLLIDGDIRNSVMLGVFKARDKITGLTEFLSGTTDL + SQGLCDTNIENLFVIQAGSVSPNPTALLQSKNFSTMLETLRKYFDYIIVDTAPVGVVI + DAAIITRKCDASILVTEAGEINRRDIQKAKEQLEHTGKPFLGIVLNKFDTSVDQYGSY + GNYGDYGKNKK" + gene 5446..6813 + /gene="wchA" + /locus_tag="SPC09V_0007" + CDS 5446..6813 + /gene="wchA" + /locus_tag="SPC09V_0007" + /note="member of homology group 5" + /codon_start=1 + /transl_table=11 + /product="undecaprenylphosphate glucosephosphotransferase + WchA (initial sugar transferase)" + /protein_id="CAI33025.1" + /db_xref="GOA:Q8KWP9" + /db_xref="InterPro:IPR003362" + /db_xref="InterPro:IPR017475" + /db_xref="UniProtKB/TrEMBL:Q8KWP9" + 
/translation="MNGKILRSSLAIIQSFLVILLTYLLSAVREAEIVSTTAIALYIL + HYFVFYISDYGQAFFKRGYLIELVQTLKYILFFALAISISNFFLEDRFNISRRGMIYF + LTLHALLVYVLNLFIKRYWKRAYPNFKGSKKILLLTATSRVEKVLDRLIESNEVVGEL + IAVSVLDKPDFQHDCLKVVAEGEIVNFATHEVVDEVFINLPSEKYNIGELVSQFETMG + IDVTVNLNAFDRSLARNKQIREMAGLNVVTFSTTFYKTSHVIAKRIIDIVGAFVGLIL + CGLVSIVLVPLIRKDGGSAIFAQTRIGKNGRQFTFYKFRSMCVDAEAKKRELMEQNTM + QGGMFKVDDDPRITKIGRFIRKTSLDELPQFYNVLKGDMSLVGTRPPTVDEYEHYTPE + QKRRLSFKPGITGLWQISGRSEIKNFDEVVKLDVAYIDGWTIWKDIEILLKTVKVVFM + RDGAK" + misc_feature 5446..5538 + /gene="wchA" + /locus_tag="SPC09V_0007" + /note="Signal peptide predicted for SPC0345 by SignalP 2.0 + HMM (Signal peptide probability 0.938) with cleavage site + probability 0.364 between residues 31 and 32" + misc_feature 6229..6810 + /gene="wchA" + /locus_tag="SPC09V_0007" + /note="HMMPfam hit to PF02397, Bacterial sugar + transferase, score 2.4e-159" + gene 6819..7562 + /gene="wchO" + /locus_tag="SPC09V_0008" + CDS 6819..7562 + /gene="wchO" + /locus_tag="SPC09V_0008" + /note="member of homology group 33" + /codon_start=1 + /transl_table=11 + /product="putative WecB-family glycosyl transferase" + /protein_id="CAI33026.1" + /db_xref="GOA:Q8KWP8" + /db_xref="InterPro:IPR004629" + /db_xref="UniProtKB/TrEMBL:Q8KWP8" + /translation="MNERMQILGIIIDPLTMKETVDAVEQYVLKKHPLHLMGVNADKI + NQCHEDEKIKKIVNESGIINADGASVVLASKFLGTPVPERVAGIDLMQCLLELSNKKG + YSVYFFGAKEEILQDMLKVFKQRYPNLNVVGYRNGYFSPEDEKKIQEDIKGGKPDFVF + VGITSPKKEYIIQSFMDNGINAVFMGVGGSFDVLSGHIKRAPLWMQKLNLEWLFRVVN + EPKRLFKRYFVGNVTFIKRVLDEKRKSKK" + misc_feature 6981..7496 + /gene="wchO" + /locus_tag="SPC09V_0008" + /note="HMMPfam hit to PF03808, Glycosyl transferase + WecB/TagA/CpsF f, score 1.2e-93" + gene 7537..8622 + /gene="wcjA" + /locus_tag="SPC09V_0009" + CDS 7537..8622 + /gene="wcjA" + /locus_tag="SPC09V_0009" + /note="member of homology group 66" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33027.1" + /db_xref="GOA:Q8KWP7" + 
/db_xref="InterPro:IPR001296" + /db_xref="UniProtKB/TrEMBL:Q8KWP7" + /translation="MKSENQKNNILHISRTMDIGGAERIVYQLSSDLKDEFDSVHVAS + TGGLWESKLLSKGVQHHKILDVDSKNPLTMVKILSSFYRIIKNNDITIVHTHHRMAAF + YIRLLKIINPKLIHVYTAHNVFKNKLPLYKFSLKKAYCVAVGKAVNDNLKHDVGISDS + TVIYNGVVFEKTDKLVDEIVNYNGIKLGCIARLSEQKGLTYLIDAMSLVKHRDITLFI + VGDGELRDELENKVKQLNLQKSVIFLGYRKDVVECINSFDYLVSSSLYEGLALNVIEA + FMNGKTMVASDIPGINEVVNNKNGILVPVKDDVALARAIEKLATDKKLREKLAYQAKK + DYETKFNYSLFLDNYRRLYRKLTGESK" + misc_feature 8050..8541 + /gene="wcjA" + /locus_tag="SPC09V_0009" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 4e-43" + gene 8619..9707 + /gene="mnaA" + /locus_tag="SPC09V_0010" + CDS 8619..9707 + /gene="mnaA" + /locus_tag="SPC09V_0010" + /EC_number="5.1.3.14" + /note="member of homology group 23" + /codon_start=1 + /transl_table=11 + /product="UDP-N-acetylglucosamine-2-epimerase MnaA" + /protein_id="CAI33028.1" + /db_xref="GOA:Q8KWP6" + /db_xref="HSSP:1O6C" + /db_xref="InterPro:IPR003331" + /db_xref="UniProtKB/TrEMBL:Q8KWP6" + /translation="MKKVMLVFGTRPEAIKMCPLVNELKQNDSIKTLVCVTGQHKEML + EQVLEVFKVVPDHDLGIMKANQTLFSITISILDKIQAVLEQEMPDIVLVHGDTTTTFA + TALAAFYMGIKVGHVEAGLRTHNLQSPFPEEFNRQTTSIIADYHFAPTEVAKENLLRE + GRKNIFVTGNTVIDALKTTVQCNYHHPILEWAKGSKLIMLTAHRRENLGEPMENMFNA + VNRILDEFEDVKVVYPIHKNPKVRELASKVFGDNERMKIIEPLEVIDFHNFMDQSYMI + LTDSGGVQEEAPSLGKPVLVMRDTTERPEGVAAGTLKLVGTEEENIYNNFKLLLEDET + EYNKMSKASNPYGDGMTCKRVVDIILEV" + misc_feature 8682..9698 + /gene="mnaA" + /locus_tag="SPC09V_0010" + /note="HMMPfam hit to PF02350, UDP-N-acetylglucosamine + 2-epimerase, score 1.4e-181" + gene 9746..10888 + /gene="wzy" + /locus_tag="SPC09V_0011" + CDS 9746..10888 + /gene="wzy" + /locus_tag="SPC09V_0011" + /note="member of homology group 83" + /codon_start=1 + /transl_table=11 + /product="oligosaccharide repeat unit polymerase Wzy" + /protein_id="CAI33029.1" + /db_xref="InterPro:IPR007016" + /db_xref="UniProtKB/TrEMBL:Q4K2G9" + /translation="MMIKRKIYIICVLLSYFLPSFFTVGSMATIFTLLSTVIRLFVTI + 
YHVPKVFSQYKVTLIDILVVLFLFFQVFVGVQSQTVNLNYIGGQFFFLGLYSFLKYFL + LFDCKTTIESLFLTFILFLCVQVITQLLFPVGFDSLYPTGDNRLYFLGRKNIATPYII + VGLGSFYLLNKKMNEFISLKEIIFLGLFGILSFLTQSSTAIICYVLFIFMRMLGLKEN + IGKPYSLVSITVYICFSFSIIFSQSTILSTFTAIFSKNATFSGRINIWQLAIRIFEEN + FWFGKGLNIDFNAWTNGIIVNSAHNTLLDILARTGIFPGILFVVVLLSLFLGKYRVKS + KTLLTMLISFMVYITMEATSVSILLLIIAICVYWSFGEEKLYEQVT" + misc_feature 9746..9823 + /gene="wzy" + /locus_tag="SPC09V_0011" + /note="Signal peptide predicted for SPC0349 by SignalP 2.0 + HMM (Signal peptide probability 0.966) with cleavage site + probability 0.281 between residues 26 and 27" + misc_feature 10511..10696 + /gene="wzy" + /locus_tag="SPC09V_0011" + /note="HMMPfam hit to PF04932, O-Antigen Polymerase, score + 1e-07" + gene 10872..11741 + /gene="wcjB" + /locus_tag="SPC09V_0012" + CDS 10872..11741 + /gene="wcjB" + /locus_tag="SPC09V_0012" + /note="member of homology group 84" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33030.1" + /db_xref="GOA:Q4K2G8" + /db_xref="InterPro:IPR001173" + /db_xref="UniProtKB/TrEMBL:Q4K2G8" + /translation="MSKLLNAIYYRLFGLYKKIYLQVFSKKTINILGEKANLENELIV + SFTTIPSRLNYLPSMIKSIFNQTIIPNRFIMYVYKDKFEGINLESILETEIKNGLEIV + YVDENLRSHKKYFYAMKDNPNSIVILVDDDTVYSSNTIEKLVASYRKYPSCISAMRCH + RIKLLTDGSLAPYNEWEYEFFGDIKPSYFNFFTGCGGVLFPPTARTDEFFNISNIMNL + SYLADDVWLNFLAIKNRIKIVKATRCKGTPLTIDDNPEESLVYLNAIYDNNNDRCIKN + MVDFYHIDFSEVD" + gene 11741..13165 + /gene="wzx" + /locus_tag="SPC09V_0013" + CDS 11741..13165 + /gene="wzx" + /locus_tag="SPC09V_0013" + /note="member of homology group 85" + /codon_start=1 + /transl_table=11 + /product="flippase Wzx" + /protein_id="CAI33031.1" + /db_xref="GOA:Q8KWP3" + /db_xref="InterPro:IPR002797" + /db_xref="UniProtKB/TrEMBL:Q8KWP3" + /translation="MDISNKFKVGILYTALGKYSNVIIQLFVTAVLSRILTPEEYGVV + AVVNVFLVFFQILADSGIGPAIVQNKTLTQNDLNDIFTLTIYSGLILSFVFVLIGYPI + SIVYGNEVYIKLYSLLGMCVLFYTMTIVPQSILTRNMNFKRMNLLSLIANIFSGVIGV + VLAIHDFGVYSLIFSNIMKATILFFVFFSSVELSFKKKIEKTSLVKILNFSKFQFMFN + 
FLNYFARNLDNLLIGRFINPAALGYYDKAYQLSLYPNQILLQVISPVIHPIMSNFQND + RQKMEEVFAKIFNILLLIGMPISVYLFFNASDVITFMFGNNWFQSVPVFQILSASIWI + QMANSPIGIFYQASNRVDLLFKVGLLASGFNIIAIVIGLLSKSIVTIAAMLIISFIIG + LSLNLYVLSHVVFKNDIIKYLKIILVHLVTVIPYIIFNMIGFRFEQGVVINLVLQGLV + LGLIWSIGIFVTGQYKQLIMMFSR" + misc_feature 11759..12562 + /gene="wzx" + /locus_tag="SPC09V_0013" + /note="HMMPfam hit to PF01943, Polysaccharide biosynthesis + protein, score 2.4e-21" + gene 13172..14365 + /gene="wcjC" + /locus_tag="SPC09V_0014" + CDS 13172..14365 + /gene="wcjC" + /locus_tag="SPC09V_0014" + /note="member of homology group 86" + /codon_start=1 + /transl_table=11 + /product="putative glycosyl transferase" + /protein_id="CAI33032.1" + /db_xref="GOA:Q8KWP2" + /db_xref="InterPro:IPR001296" + /db_xref="InterPro:IPR009695" + /db_xref="UniProtKB/TrEMBL:Q8KWP2" + /translation="MKILFVNMFYNEEGGAQKSTKFLAEQLVKEGHEVFAYSDDAIDS + DIEEVINGVKVFRRRTPLFSLHYIFSAKKNPAKHFFYKIFETYNVFAKKKFIDIIEEI + QPDIVHFNTISGMSLSIVKEAKKRNIRTIWTLRDYWLEYPWGEKDIALIKLLNRIYRP + FVKKSLKHLDIVTAPSAFTLNNFINKGFINPSSQKCMAIENAVIFSKSKLENIIKRKQ + ETKRNPEKTNFLFVGSILEIKGVFNLVMAFKKLTNPEISLKIVGKGKDLEKLQKEIES + DPRIQYLGFQDTKNLYETYQNSDVLVVPSAWDEPFGRVVIEGNANGLPVITSDRGGLP + EIVQTVGGGEVFTDKSGNTLYSILKKFVEMENYNVYYRCILENIDIYSIEKQSEKFIS + LYREG" + misc_feature 13808..14305 + /gene="wcjC" + /locus_tag="SPC09V_0014" + /note="HMMPfam hit to PF00534, Glycosyl transferases + group, score 1.2e-30" + gene 14366..15031 + /gene="wcjD" + /locus_tag="SPC09V_0015" + CDS 14366..15031 + /gene="wcjD" + /locus_tag="SPC09V_0015" + /note="member of homology group 145" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI33033.1" + /db_xref="GOA:Q8KWP1" + /db_xref="InterPro:IPR011004" + /db_xref="UniProtKB/TrEMBL:Q8KWP1" + /translation="MQVRHLLTYLISLPKTIFFNFKCLPINQAIHLPILVAYNVKLLN + LKKNVIGIETVVKFGLVRIGFSGTEIISSNRSLINLRQGKVIFKGKSVITKGCTISVT + GGTIILGDNFYANRNCLISCTDRLIVGNNVLLGWNVILFDSAGHTLSYDGKKKIKMTE + 
EIVIGNHVWICAEAHLLKGSKIADGSVVAYSSLVTGYFAEKNCLIGGIPAKTLRKGVS + WEK" + gene complement(15157..16383) + /gene="tnp" + /locus_tag="SPC09V_0016" + /pseudo + CDS complement(15157..16383) + /gene="tnp" + /locus_tag="SPC09V_0016" + /note="member of homology group 146" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS116-IS110-IS902-like transposase" + misc_feature complement(15364..15696) + /gene="tnp" + /locus_tag="SPC09V_0016" + /note="HMMPfam hit to PF02371, Transposase + IS116/IS110/IS902 family, score 7.4e-11" + /pseudo + gene 16683..17915 + /gene="ugd" + /locus_tag="SPC09V_0017" + CDS 16683..17915 + /gene="ugd" + /locus_tag="SPC09V_0017" + /note="member of homology group 20" + /codon_start=1 + /transl_table=11 + /product="UDP-glucose 6-dehydrogenase Ugd" + /protein_id="CAI33035.1" + /db_xref="GOA:Q8KWP0" + /db_xref="HSSP:1DLJ" + /db_xref="InterPro:IPR001732" + /db_xref="InterPro:IPR008927" + /db_xref="InterPro:IPR013328" + /db_xref="InterPro:IPR014026" + /db_xref="InterPro:IPR014027" + /db_xref="InterPro:IPR014028" + /db_xref="InterPro:IPR016040" + /db_xref="InterPro:IPR017476" + /db_xref="UniProtKB/TrEMBL:Q8KWP0" + /translation="MKIAVAGTGYVGLSIAVLLAQHHEIKAVDIVAEKVELINQKKSP + IQDDYIEKYLVEKDLNLEATMDAKYAYEDAEFVVVAAPTNYDSKKNFFDTSAVEAVIQ + QVKKINPKAVIIIKSTIPVGFTESVRKKYQYKNILFSPEFLRESKALYDNLYPSRIIV + GTDLEDTYLKDKANIFASLLKEGAIKEDIDTLFMGVTEAEAVKLFANTYLALRVSYFN + ELDTYAEVKGLDAKAIIDGIGLDPRIGNHYNNPSFGYGGYCLPKDSKQLLANYFDVPQ + NMMTATVESNRTRKDFIAQRILEKAGVSETDSLDAFKNTQDIVIGIYRLTMKSNSDNF + RHSSIQGVMKRLKAKGVTVIIYEPTLKDGETFFGNKVVNNLDKFKEASNVIVANRFEP + SLEDVSNKVYSRDIFKRD" + misc_feature 16683..17303 + /gene="ugd" + /locus_tag="SPC09V_0017" + /note="HMMPfam hit to PF01210, NAD-dependent + glycerol-3-phosphate deh, score 0.00028" + misc_feature 16683..17237 + /gene="ugd" + /locus_tag="SPC09V_0017" + /note="HMMPfam hit to PF03721, UDP-glucose/GDP-mannose + dehydrogenase, score 2e-52" + misc_feature 17268..17549 + /gene="ugd" + /locus_tag="SPC09V_0017" + /note="HMMPfam 
hit to PF00984, UDP-glucose/GDP-mannose + dehydrogenase, score 1.6e-35" + misc_feature 17643..17894 + /gene="ugd" + /locus_tag="SPC09V_0017" + /note="HMMPfam hit to PF03720, UDP-glucose/GDP-mannose + dehydrogenase, score 1.3e-05" + gene 18127..19161 + /gene="wcjE" + /locus_tag="SPC09V_0018" + CDS 18127..19161 + /gene="wcjE" + /locus_tag="SPC09V_0018" + /note="member of homology group 18" + /codon_start=1 + /transl_table=11 + /product="putative acetyl transferase" + /protein_id="CAI33036.1" + /db_xref="GOA:Q8KWN9" + /db_xref="InterPro:IPR002656" + /db_xref="UniProtKB/TrEMBL:Q8KWN9" + /translation="MKSIGKRINWIDFGKGFAIFSVLVGHVLMGLYESNIFSIANDVL + LLLITQIYIFHIPVFFALSGYFFRPVSDMKEFWHYAKKKTIILGIPYVFYSIIHFCLQ + KVAGASVRVPTTIFNLLNIYKFPLGVSWYLYTLWSILIVYGLLSVVFKNRKSLLLVSV + FAYIFTLFIQTDIFIVQRTLVWGVCFCLGSVLSAIHFDKINLKKFLFFFVLFDFIYMF + AWFLFYEVGSKKDYVSYSNPGLWGIAFIVCVLVAFAIFPKMEKNFPKTFLYFTKYGKD + SLGIYILHAPICSMIRILMLKVGINSVFLHVVVGIVLGWYLSILATYILKKIPFLNIV + LLPQKYIKLK" + misc_feature 18148..19122 + /gene="wcjE" + /locus_tag="SPC09V_0018" + /note="HMMPfam hit to PF01757, Acyltransferase family, + score 6.5e-05" + gene complement(order(19205..19789,19843..20511)) + /gene="tnp" + /locus_tag="SPC09V_0019" + /pseudo + CDS complement(join(19205..19789,19843..20511)) + /gene="tnp" + /locus_tag="SPC09V_0019" + /note="member of homology group 13" + /pseudo + /codon_start=1 + /transl_table=11 + /product="putative IS1167 transposase" + /db_xref="PSEUDO:CAI33037.1" + misc_feature complement(join(19709..19789,19843..20055)) + /gene="tnp" + /locus_tag="SPC09V_0019" + /note="HMMPfam hit to PF01610, Transposase, score 6.7e-44" + /pseudo + gene 20809..>20856 + /gene="aliA" + /locus_tag="SPC09V_0020" + CDS 20809..>20856 + /gene="aliA" + /locus_tag="SPC09V_0020" + /codon_start=1 + /transl_table=11 + /protein_id="CAI33038.1" + /db_xref="UniProtKB/TrEMBL:Q4JZ89" + /translation="MMKSSKLLALAGVTLL" +ORIGIN + 1 tgtccaatga agagcaagac ttgacagtag aaggaaaagt caaatctgtc ttgattgaaa + 61 acaccctagc tcaagaagtc 
tttgaaaaac aaatcttagt tccatgggat gctttctgtg + 121 tggaaatgac tgactagaat gagcaaacct caagtttttg aagcttgagg ttttttacta + 181 tagtggattg aaactagaat agtgcacctc tgcttctaaa acattgttag aaatcgattt + 241 gactgtcccg atcgatttgt cctattctta tttcattttg ctatacttgt agttgaggag + 301 aattaagctc ctcactagta aactcttcat aatccttttt atttttatga agatattgtt + 361 tgaaagatgt gagtttccac ggatgggttt gtggagggat atacttgcgt ctttcttttt + 421 ttgttctggt tcttgttcaa agtttttcga atagagttca tgatttagta gctcctttgt + 481 gtgatagatt ttgtcagcga tattgaggta gatgtctccg tcaaatgctt ttataactaa + 541 tgctttcgtc tttctgatga aatagacttc ttttccttgt tcggtaggga tatagtaacg + 601 attttggaat cggatatggt gtccactatc gacgactctc tccgccagtc tagccagaat + 661 gagattcctt tcagaggggt taggaacctc ctcgaagaca gagagttttg tcttgtttcc + 721 aaactgttca ttaaaggttt gaatgtagga aagcaggaag gtattggctt cttccaaggt + 781 atgaatattg ttttgttcca gttcgatagg caggcgagat tgtagtgtct gattgagtct + 841 ttcgactctc cctttagctt gagggataga ggttgtctca aggagaatcc ctagttggtg + 901 acaggcgtat ccaaactgtg tatgggtatc gtcctccatt ttcttagagt tggaggcttg + 961 ataggtaaag accgttctct tatctgtttt aatttgaagg ggaatgccgt gattggctaa + 1021 gatttgttcg aggacatgat agtaagcatt caagttctct tgtttatcaa aataagcgcc + 1081 taggatattg ccagaagcat catcaatggc taagtgtaag ttagatgttt gggctccaaa + 1141 ctaggcatga ggactggcat ccatttgaat gagttcacca gcaaatttct ttctgggtct + 1201 actaggatgt acttttttag ggtcttcaag gaagttttca gccgtcggta agattggatt + 1261 gtctaggggt tgattcaggt tcagtttagc ttgttttctt actctcttct ttgtctttct + 1321 atgggactta ggcgacagga tatttttctt atagagtatt tttctaacag tagtatcaga + 1381 gagctgaatt ccttcttctt cagctagcaa ttcacagaaa tgaaggacat ttggtttata + 1441 tgtttcatag gagaggtatt tttttaggag acgttctttg atttcatcag ggattgcatg + 1501 ttttggtttt cgatttctgt ttccgtgtct gaaggcttct ttgtcctttc agttgatagg + 1561 ctagtagcag acgattgatt tgtctttcag aaagattgag ctcgacacag gctcgtttct + 1621 ttgttttctt tccttgggct atagccttta tcacaagata ttttttcgtt tcattcatat + 1681 tcagttggat ccttttcata tgactattct accaaatggg acattttcac gttcgattta 
+ 1741 ctaaagacat tatcacattc gaattacaca agatgcagat agtaaaaaaa atgtagacat + 1801 taccgtaaaa aagtgatata atcgtatgat gttcaaggta taggtgttaa tcatgagtag + 1861 acgttttaaa aaatcaggtt cacagaaagt gaagcgaagt gttaatatcg ttttgctgac + 1921 tatttattta ttgttagttt gttttttatt gttcttaatc tttaagtaca atatccttgc + 1981 ttttagatat cttaacctag tggtaactgc gttagtccta ctagttgcct tggtagggct + 2041 actcttgatt atctataaaa aagctgaaaa gtttactatt tttctgttgc tgttctctat + 2101 ccttgtcagc tctgtgtcgc tctttgcagt acagcagttt gttggactga ccaatcgttt + 2161 aaatgcggct tcgaattact cagaatattc gatcagtgtc gctgttttag cagatagtga + 2221 gatcgaaaat gttacgcaac tgacgagtgt gacagcaccg actgggactg ataatgaaaa + 2281 tattcaaaaa ctactagctg atatcaagtc aagtcagaat accgatttga cggtcaacca + 2341 gagttcgtct tacttggcag cttacaagag tttgattgca ggggagacta aggccattgt + 2401 cctaaatagt gtctttgaaa atatcatcga gtcagagtat ccagactacg catcgaagat + 2461 aaagaagatt tataccaagg gattcactaa aaaagtagaa gctcctaaga cgtctaagaa + 2521 tcagtctttc aatatctatg ttagtggaat tgacacctat ggtcctatta gttcggtgtc + 2581 gcgatcagat gtcaatatcc tgatgactgt caatcgagat accaagaaaa tcctcttgac + 2641 cacaacgcca cgtgatgcct atgtaccaat cgcagatggt ggaaataatc aaaaagataa + 2701 attaacccat gcgggcattt atggagttga ttcgtccatt cacaccttag aaaatctcta + 2761 tggagtggat atcaattact atgtgcgatt gaacttcact tctttcttga aattgattga + 2821 cttattggga ggggtagatg ttcataatga tcaagagttt tcagctctac atgggaagtt + 2881 ccatttccca gtagggaatg tccatctaga ctctgagcaa gctctaggtt ttgtacgtga + 2941 acgctactca ctagccgatg gagaccgtga ccgtggtcgc aaccaacaaa aggtgattgt + 3001 ggctatcctt caaaaattaa cgtcaaccga agcactgaaa aattatggta cgatcattaa + 3061 tagcttgcaa gattctatcc aaacaaatat gccacttgag accatgataa atttggtcaa + 3121 tgctcagtta gaaagtggag ggaattataa agtaaattct caagatttaa aagggacagg + 3181 tcggatggat cttccttctt atgcaatgcc agacagtaac ctctatgtgc tggaaataga + 3241 tgatagtagt ttagctgtag ttaaagcagc tatacaggat gtgatggagg gtagatgaaa + 3301 tgatagacat ccattcgcat atcgtttttg atgtagatga cggtcccaag tcaagagagg + 3361 aaagcaaggc tctcttggca 
gaatcctaca ggcaaggggt gcgaaccatt gtctctacct + 3421 ctcaccgtcg caagggcatg tttgaaactc cggaagagaa gatagcagaa aactttcttc + 3481 aggttcggga aatagctaag gaagtggcga gtgacttggt cattgcttac ggggctgaaa + 3541 tttactacac accagatgtt ctggataagc tggaaaaaaa gcggattccg accctcaatg + 3601 atagtcgtta tgccttgata gagtttagta tgaacactcc ttatcgcgat attcatagcg + 3661 ccttgagcaa gatcttgatg ttgggagtta ctccagtcat tgcccacatt gagcgctatg + 3721 atgctcttga aaataatgaa aaacgcgttc gagaactgat cgatatgggc tgttacacgc + 3781 aagtaaatag ttcacatgtc ctcaaaccca aactttttgg cgaacgttat aaattcatga + 3841 aaaaaagagc tcagtatttt ttagagcagg atttggttca tgtcattgca agtgacatgc + 3901 acaatctaga cggtagacct cctcatatgg cagaagcata tgaccttgtt acccaaaaat + 3961 acggagaagc gaaggctcag gaatttttta tagacaatcc tcgaaaaatt gtaatggatc + 4021 aactaattta ggagaaatga tgaaagaaca aaacacgata gaaatcgatg tatttcaatt + 4081 atttaaaacc ttgtggaaac gcaagctaat gattttaata gtggcacttg tgacaggtgc + 4141 gggggctttt gcatatagca cttttattgt taagccagaa tatacgagta ccacgcgaat + 4201 ttacgtagtg aatcacaatc aaggaaacaa gctggggctg acaaatcagg atttgcaggc + 4261 aggttcttat ctggtaaaag actaccgtga gattatcctt tcgcaggatg tattggaaaa + 4321 agtagcgaca aatttgaagt tggatatgcc agcaaaaacg ttagccagca aagttcaagt + 4381 gactgtacca gatgacactc gtatcgtctc aatctctgtc aaggataaac agccagagga + 4441 agccagtcgt atcgctaatt ctctacgaga agttgctgca gaaaagatcg tcgctgtaac + 4501 gcgagtatct gatgtaacga cacttgaaga agcgcgacca gctacgactc cctcttctcc + 4561 aaatgttcga cgcaattcct tgtttggttt tcttggagga gtagtcgtaa cagtaattgc + 4621 tgttcttttt attgagttgc tcgacacccg tgtgaaacgt cctgaagatg ttgaagatgt + 4681 actgcaaatt ccacttttag ggctcgttcc agatttgaac aaaatgaaat aggaggaagt + 4741 tatgccaacg ttagaaatct cacaggcaaa attggatttt gtaaaaaagg cagaggaata + 4801 ttataacgct ttgtgcacga acctacagtt aagtggagat ggtttgaaag tattttctat + 4861 cacttctgtg aaactaggag aaggaaaatc aacgacttcc atcaatatcg cttgggcttt + 4921 tgcgcgtgca ggttacaaaa cgctgctgat tgatggagat attcgcaatt ctgttatgtt + 4981 aggtgtcttt aaagcaaggg ataagattac aggcctgaca 
gaatttttat caggaactac + 5041 ggacctatca caagggcttt gtgataccaa tatcgaaaat ctctttgtaa ttcaggctgg + 5101 ctctgtgtca ccgaatccga cagctcttct tcaaagtaag aatttcagta caatgcttga + 5161 aaccttgcgt aaatattttg actacatcat tgtagatact gctcctgtcg gtgtcgtgat + 5221 tgatgcggct attattacgc gaaaatgcga tgcttctatt ttagtgacgg aggcaggtga + 5281 aataaatcga cgggatattc aaaaagcaaa agaacagttg gaacacacag ggaagccgtt + 5341 tttgggaatt gtgttgaata aattcgatac ttcagtagac caatacggtt cttatggaaa + 5401 ttatggagat tacgggaaaa ataaaaaata ggtcggggga tagagatgaa tgggaaaata + 5461 ttaaggtctt cattggccat aatccagagt tttcttgtta ttttattgac ttatctactt + 5521 agtgctgtga gagaagcgga gattgtttca acaacagcta ttgcacttta tatcctacat + 5581 tattttgtct tttatatcag tgattatgga caggctttct ttaaaagggg atatttgatt + 5641 gaacttgtcc agacattgaa atatatccta ttctttgcac tagcgattag tatttctaat + 5701 tttttcttag aggatcgatt taatatttcc agacgaggca tgatttactt cctcacatta + 5761 catgctctct tggtctatgt gctaaaccta tttatcaagc ggtattggaa gcgggcttat + 5821 cccaacttta aaggaagtaa gaagattctc ctacttacag caacttctcg tgtcgaaaag + 5881 gtactggata gattaataga atcaaatgag gttgttgggg agttgatagc cgtcagtgtc + 5941 ttagataaac cagattttca gcatgattgt ttaaaggtag tagcagaggg ggagatagta + 6001 aactttgcga ctcatgaggt ggtcgatgaa gtctttatca atcttccaag tgaaaaatac + 6061 aatattggag agcttgtctc tcagtttgaa acgatgggaa ttgatgtaac agtcaatcta + 6121 aatgcttttg atcgtagttt ggcacgtaac aagcaaattc gtgagatggc aggattaaac + 6181 gttgtgactt tttctacaac attttataag actagtcatg taattgctaa gcggattatt + 6241 gatatcgtgg gtgcatttgt agggctgata ttatgtggtt tagttagtat tgtactggtt + 6301 cctttgattc gaaaggatgg gggctctgct atttttgctc agacgcgtat aggaaaaaat + 6361 ggtcgtcagt tcacttttta taagtttcgc tctatgtgtg tagatgccga ggcgaaaaaa + 6421 agagaactca tggaacaaaa taccatgcag ggtggaatgt ttaaggtgga cgatgatcct + 6481 cgtatcacga aaattggtcg ttttatacgg aagactagct tggacgagct accacagttt + 6541 tataatgttc taaagggaga tatgagtttg gttggcacac ggccaccaac agtggacgag + 6601 tatgaacact ataccccaga acaaaaacgt cggctaagtt ttaaacctgg tataacaggc + 6661 
ttatggcaga tcagtggacg aagtgagatt aagaattttg atgaagttgt caaattagat + 6721 gtggcctata ttgatggttg gacaatctgg aaagatattg aaattttgct taaaactgtt + 6781 aaagttgtat ttatgagaga tggagcgaag taattcatat gaatgagaga atgcaaatat + 6841 taggaattat tatagatcca ttaacgatga aagaaacagt ggatgctgtt gaacagtatg + 6901 ttttaaagaa gcatcctttg cacttgatgg gagttaacgc agataaaatt aatcagtgcc + 6961 atgaagatga gaaaatcaaa aaaatcgtta atgaatcagg aatcattaat gcggatggag + 7021 catcagttgt tcttgcaagt aagtttttag gaacgcctgt tcctgaacga gtagcgggta + 7081 ttgatttgat gcaatgtctt ttagagttgt caaataaaaa aggatattca gtttactttt + 7141 ttggagccaa agaagaaatt ttacaagata tgctaaaagt ttttaaacaa agatatccta + 7201 atcttaatgt tgttggctat agaaacggat atttttcacc tgaagatgaa aaaaagattc + 7261 aggaagatat taaaggaggc aaaccagatt ttgtatttgt agggattact tctcctaaaa + 7321 aggaatatat catccaatca ttcatggata atgggattaa tgctgtcttt atgggtgttg + 7381 gtggcagttt tgatgtatta tcaggacaca ttaaacgagc tccattatgg atgcaaaaat + 7441 tgaatctgga atggttgttc cgtgtagtta atgaacccaa acgtcttttt aagcgttatt + 7501 ttgtagggaa tgttactttt attaagcgag ttttagatga aaagcgaaaa tcaaaaaaat + 7561 aatattctac atatttctcg tacaatggat attggtggtg cagaacgtat tgtatatcaa + 7621 ttgagttctg atttgaaaga tgaatttgat agtgtccatg tcgcttcaac aggtggacta + 7681 tgggagagca aacttttatc aaaaggagtt caacatcata aaattttaga tgttgacagt + 7741 aagaatcccc taactatggt aaagatcctt tcaagttttt atagaattat caaaaataat + 7801 gatattacca ttgttcacac tcatcatcgg atggctgcct tttatattcg cttgttgaaa + 7861 atcattaatc ctaagttgat acatgtttac actgcacata atgtatttaa aaataaatta + 7921 ccattataca aattttcctt aaaaaaagcg tattgtgtag ctgtgggtaa agcggttaat + 7981 gataatttga aacatgatgt aggaatcagt gatagtacag taatctataa tggggttgtt + 8041 tttgaaaaaa ctgataagct agttgatgag attgtaaatt ataacggaat caaattgggg + 8101 tgtattgcta ggttatcaga gcaaaaagga ttgacctacc taattgatgc gatgtcttta + 8161 gtgaaacaca gggatattac attgttcatt gtcggagatg gagagcttcg agatgaactt + 8221 gaaaacaagg tgaaacaatt aaatcttcaa aaatcagtga tatttttagg ttatcgaaaa + 8281 gatgttgttg aatgtatcaa 
tagttttgat tacttagtgt catcatcttt atatgagggg + 8341 ttggctctaa atgtaattga agcatttatg aatgggaaaa cgatggttgc atcagatatc + 8401 cccggaataa atgaagtagt caataacaaa aatgggattc ttgttcctgt taaggatgat + 8461 gttgccttag cgagagcgat tgaaaagctt gcgactgaca aaaaacttag agaaaaactc + 8521 gcttatcaag caaaaaaaga ctatgagaca aaatttaatt attccttgtt tttggataat + 8581 tatcggagac tttatagaaa attaacggga gaatcaaaat gaaaaaagtc atgttggttt + 8641 ttgggacacg tccagaggct attaaaatgt gtcccctagt aaatgaactg aaacaaaatg + 8701 attcaatcaa gacacttgtg tgtgtaactg gtcaacataa ggaaatgcta gagcaggttt + 8761 tggaggtgtt caaggttgtc ccagatcatg atttgggtat catgaaagca aatcaaaccc + 8821 tattttccat tacgattagt attttggata agattcaagc agttctagaa caagaaatgc + 8881 ctgatatcgt tcttgttcat ggagatacaa caacaacatt tgcgacagct ttggcagcat + 8941 tttatatggg aatcaaagtg ggacacgtcg aagccggtct cagaacccac aatctccaaa + 9001 gtccatttcc agaggagttc aatcgccaga cgacttctat cattgccgac tatcatttcg + 9061 cgccgactga agttgcaaag gaaaatctac taagagaggg cagaaaaaat atctttgtga + 9121 cgggaaatac agtcattgat gctttgaaga cgactgttca atgcaactat catcacccaa + 9181 ttttggaatg ggcaaagggt agtaagttaa tcatgctaac ggctcatcga cgagaaaatc + 9241 ttggggaacc gatggaaaac atgtttaatg ctgttaatcg aattttagac gaatttgaag + 9301 atgtaaaagt tgtatatccc atccataaaa atcctaaggt tcgagagttg gcaagtaaag + 9361 tttttggcga taatgaacga atgaagatca ttgaaccgtt agaagttatt gatttccata + 9421 attttatgga tcaaagctat atgattttga cagattctgg aggtgtgcag gaagaagcac + 9481 cttctttagg gaaacctgtc ttagtgatgc gtgatacaac agagcgtcct gaaggagtcg + 9541 ctgctggcac attgaagttg gtaggtacag aagaagagaa tatttataat aactttaaac + 9601 ttcttcttga ggatgaaaca gaatataaca agatgagtaa agctagcaat ccttatggag + 9661 atggaatgac ttgtaaacgg gttgttgata ttattctgga agtataaaaa taattcaatt + 9721 atgaatgagg aaagaataaa ttagattgat gataaaaaga aaaatatata taatctgtgt + 9781 attactgtcg tattttttac ctagtttttt tacagttgga tcaatggcaa ctatatttac + 9841 cctactctcc acagtaatta ggctattcgt aactatatat catgttccta aagttttttc + 9901 acagtataag gtaacgctga ttgacatttt ggttgttctg 
tttttgtttt ttcaagtgtt + 9961 tgtgggggtt caaagtcaga cagtgaatct taactatatt ggaggacagt ttttcttttt + 10021 aggattatat tcatttttga aatacttttt attgtttgat tgtaaaacaa caattgaaag + 10081 cctcttttta acctttatct tgtttttgtg tgttcaagta ataactcaat tgctttttcc + 10141 ggttggtttc gactctttgt accctacagg agataataga ctttactttt taggaagaaa + 10201 aaacatagcc accccatata tcattgttgg attaggtagt ttttacttat taaataaaaa + 10261 aatgaatgag tttatatcac taaaggagat tattttttta ggattgttcg gaattttatc + 10321 atttttaaca caatccagta cagcgattat atgttatgtg ctttttattt ttatgcgtat + 10381 gttaggttta aaggaaaata taggaaaacc atattcttta gtcagtataa ctgtgtatat + 10441 ttgttttagt ttttctataa ttttttcaca aagtacaatt ttatcaactt ttacagcaat + 10501 tttttccaaa aatgcaacct tttcaggacg tatcaatatt tggcagttag cgattcgtat + 10561 ttttgaagaa aatttttggt ttggaaaagg acttaatatt gatttcaatg cttggacaaa + 10621 tgggattatc gttaactccg cacacaatac cttactagat atacttgctc gaacgggtat + 10681 atttccgggt attttatttg tagtggttct tctaagtcta tttcttggaa aatatagagt + 10741 aaaatcaaaa acgctactga caatgttgat ttcattcatg gtttatatta cgatggaggc + 10801 tacatctgta agtattcttc tattaataat tgctatttgt gtgtattggt cttttggaga + 10861 ggagaagtta tatgagcaag ttacttaatg caatctatta tcgactattt ggattatata + 10921 aaaaaattta tctacaagtt tttagtaaaa aaacaattaa tattttaggt gaaaaggcta + 10981 atttagaaaa tgaactaatt gtttcgttta caacaattcc aagccgtctt aattatttac + 11041 caagtatgat taaaagtatt ttcaatcaga caattatccc taaccgtttt attatgtatg + 11101 tttataaaga taaatttgaa ggtattaatt tggagagtat cctagaaact gaaatcaaaa + 11161 atggtttgga aattgtctat gtggacgaaa atcttcgctc gcataaaaaa tatttttatg + 11221 ctatgaagga taatccgaat agtattgtaa ttttggttga tgatgacact gtctattcat + 11281 cgaataccat cgaaaagtta gttgcttctt acaggaaata cccaagttgt atttcggcaa + 11341 tgcgatgtca tcgaattaaa ctgcttactg atggaagtct ggcaccatac aatgagtggg + 11401 aatatgaatt tttcggtgat attaaaccat cttactttaa tttctttaca ggttgtggag + 11461 gagtactttt tcctcctact gctcgaacag atgaattttt taatatttct aatataatga + 11521 atctcagtta tttagctgat gatgtatggt tgaatttttt 
agcaataaaa aatagaatta + 11581 aaatagtaaa agcaacacga tgtaagggaa caccattaac tatagatgac aaccctgaag + 11641 agagtttggt gtatctgaat gctatatatg ataataataa tgataggtgt atcaagaata + 11701 tggtagattt ttatcatatt gatttttcag aggttgatta atggatataa gtaataagtt + 11761 taaggtaggt atcctatata ctgctttagg taagtattct aatgttataa ttcaattatt + 11821 tgtaacggcg gtattaagta gaatattaac acctgaagag tatggcgttg tagcggttgt + 11881 caatgtgttt ttagtattct ttcagatatt ggcagattcg ggaataggac ctgcaattgt + 11941 acaaaataag acattaactc aaaatgattt aaatgatatt tttactttaa caatttattc + 12001 aggtttaatt ctttcgtttg tttttgtatt gataggctat ccaattagta tagtctatgg + 12061 gaatgaagtc tatatcaaac tgtactcatt attaggtatg tgtgtactat tttatactat + 12121 gacaattgtt cctcagtcaa ttttaacaag aaacatgaac tttaaacgga tgaacttatt + 12181 gagtctgatt gccaatattt ttagtggagt tattggtgtt gtgctggcca tacatgattt + 12241 cggggtatat tctctgattt tttctaatat tatgaaggct actatattat tttttgtttt + 12301 tttttcaagt gttgagttga gttttaagaa aaagatagag aaaacttcgt tagttaaaat + 12361 tctaaatttt tctaagtttc aatttatgtt taattttcta aactactttg caagaaattt + 12421 agacaatctc ttgattggta gattcattaa tcccgctgcg ttgggttatt atgataaggc + 12481 ttaccagtta tcattatatc ctaatcagat tttattgcag gtgatttcac ctgtaattca + 12541 tccgataatg tcgaattttc aaaatgatag acaaaaaatg gaagaagttt ttgcaaaaat + 12601 ttttaatatt ctacttttaa taggaatgcc aatctcagtg tatttgtttt tcaatgcaag + 12661 tgatgtgata acatttatgt ttggaaataa ttggtttcag agcgttccag tatttcaaat + 12721 actatctgct agcatctgga ttcaaatggc taatagtcca ataggaattt tttatcaagc + 12781 ttcgaatcgt gttgatctgt tatttaaggt aggattatta gcgtcaggat ttaatattat + 12841 agctattgtg atagggctat tatcgaaaag tatagtgaca attgctgcta tgttaattat + 12901 ttcatttata atagggctat cactgaatct ctacgtttta tcacatgtag tctttaaaaa + 12961 tgatataatt aaatatttaa aaataatttt agttcacctt gtaacagtta tcccatatat + 13021 tatattcaat atgattggct ttagatttga acagggtgta gttatcaatc ttgtgttgca + 13081 aggactggta ttgggactaa tttggtctat aggaatattt gtaacaggtc aatacaagca + 13141 gttaataatg atgtttagta ggtgaaaatt tatgaaaatt 
ttatttgtga atatgtttta + 13201 caatgaagaa ggaggagcac aaaagagcac caaatttcta gctgaacaac ttgtaaaaga + 13261 aggacatgag gtatttgcat actctgatga tgctattgat tcagatattg aggaagttat + 13321 taatggggtt aaggttttta gaagaagaac tccgcttttt agtcttcact atattttcag + 13381 tgccaagaag aatccagcta aacatttttt ctataaaata tttgaaacct ataatgtatt + 13441 tgcgaaaaaa aaatttatcg atatcattga ggaaatacaa ccagatattg ttcattttaa + 13501 tacaatttca ggaatgtctt tatcaatagt taaagaagct aaaaagagaa atatcagaac + 13561 catttggacc ttgcgagact attggctaga atatccatgg ggggagaaag atattgctct + 13621 tattaaactg ctaaatagaa tatatagacc ttttgttaag aaaagtttaa aacacttaga + 13681 catagtaaca gcaccttcag catttacctt gaataatttt atcaataaag gatttattaa + 13741 cccatcttct caaaaatgta tggccattga aaatgctgtt atattttcaa agagtaaatt + 13801 ggaaaatatt atcaaacgaa agcaagaaac aaaaagaaat ccagaaaaaa cgaattttct + 13861 ttttgtaggc tctatacttg aaataaaggg cgtttttaac ttagtaatgg cttttaaaaa + 13921 actaactaat ccagaaattt ctttgaaaat tgtaggaaaa ggaaaagatt tagaaaaact + 13981 tcaaaaagaa atcgaaagtg atcctagaat acaatattta ggctttcaag atacaaaaaa + 14041 cctctatgaa acttatcaaa attcggatgt attggtcgtt ccatcagctt gggatgaacc + 14101 gtttggtaga gttgtaattg aaggaaatgc aaatggcctt ccggtcatca cttcagatag + 14161 aggtggatta cctgaaattg tgcaaacagt aggaggaggg gaagttttta cagacaaatc + 14221 gggaaataca ttatatagta ttttaaagaa atttgtagaa atggaaaact acaatgtcta + 14281 ttaccgatgc attcttgaga atattgatat ttattctatc gaaaaacaaa gtgaaaagtt + 14341 tataagttta tatagggagg gatagatgca ggttcgacat ttattaactt atctgatttc + 14401 gctacctaaa acaatctttt ttaattttaa gtgtttacca attaatcagg caattcacct + 14461 tccaatactt gtagcatata atgtcaagtt gttaaatttg aaaaagaatg taattggtat + 14521 agaaactgta gtaaaatttg gtttagttcg aattggtttc tcaggtacgg agataatatc + 14581 ctctaatcga tcgctcataa acttgagaca aggaaaagtt atttttaaag ggaagtcagt + 14641 gatcacaaaa ggttgcacaa ttagtgttac aggaggaacc atcattttgg gcgataactt + 14701 ttatgcgaat agaaattgtc ttatatcatg tactgatagg ctcattgttg gtaataatgt + 14761 acttttaggt tggaatgtta ttctttttga ctcagctggt 
catacactaa gctacgatgg + 14821 taagaaaaag ataaaaatga cagaagaaat tgtaattggt aaccatgtat ggatttgtgc + 14881 tgaagcacac ttattgaaag gaagtaagat tgcagatggt tctgtagtag cttattctag + 14941 tttagttaca ggttatttcg cagaaaagaa ttgcttgatt ggaggaatac ctgcaaaaac + 15001 acttagaaaa ggagtaagtt gggaaaagta actttatttt attgattcaa aatattagag + 15061 gtggaagttt gaaaaaaata aaagttagtt gattgattac ttctctaaat tttgggcaca + 15121 ctaaaaagag gtcttgacac ctaaacttta aaattaaagc atattgaatc cgcgctgctg + 15181 tgcgaagcga atagcgtctt ggacggacat tgtcttatct ggatttctta tttctgtaag + 15241 gccttgtaat cttggattat aactctcctg ttttaggaat acatggtaga tggcaaccaa + 15301 taatctgcga cagatagcga tgatagcttt tcgatgacca cgtcgtttct tgagtttgag + 15361 atatttattt cgtagttcag gatgcttctc tgatttaacc acggcattag ctatttgaac + 15421 aagaaaaggt ttgagatagt gaccgccttt cgaaatacga gtagagaatt tctttcctgc + 15481 actttcattg ttggcaggaa ctaatccgcc ccaagaatag agtttacctg cagtaccaaa + 15541 gacagtcata tcagctccga tttcagagag tattctgagg gcagatagtt cctctttgaa + 15601 accaggcaca gtttggatca gtttgacctg ttcttggtat tcgtgaccga gcttccgaat + 15661 catggtttct aaatcttctt tacagacggc aagagcatca tagtgttcct tgatgattct + 15721 gattttctca gcttgttcag gtgtcacctc cccctcaata gcgattttca agtcttgcac + 15781 cttatccttc attctcttgt gaatcaactg ttcaatgttt ggtttgtcct ctggattgtc + 15841 aaggatgctc tgaataatag cctgagcact ttttccgaac acgtcggaaa cgacacttgc + 15901 aatctgaagg ttagaccaag tcagacagtt ctggtaacga tttttctcgc tgacttgaag + 15961 ttgtgttaat ttcatgcgat agcgaaaaag gtctcggagt tgtctgattt taagaggggg + 16021 aataaagcta gaagcaacca aatcatgctt gaagaggtcg gctatccatt gcgcatcttt + 16081 cttgtcggtt ttctttcctc tgatagcctt gacatactta gggtgagcta agcaaatctt + 16141 gcaggatttt tcaaggatat tgaagacagg aatccaatat ttactggtag attccataca + 16201 gacatcaaat caagaatagt attctagcca atctcgtagc tgtactaacc catttgtaaa + 16261 agttgagaaa cgtttacgat ggtagcttgt gagtccttgc ttgtcggtga tggtaacaac + 16321 cgctacaaca aaggttttat gcacatcaat gccacaacaa ttaggataga taatttttaa + 16381 catgaggggt ctcccttcac caaatttgag tctgcctatc 
ccttgactat tctttccttt + 16441 cacaaacgag tcgcttattc aattataagt ttacgtgctc ttagtcacag ttcttgtgct + 16501 tgatggaaag aatgacacct ataaatatgc gaggtagtgg ctgtaccact cacttattca + 16561 cctccccgtg atttgtaata gtgataggct ttctcactat tattataaac caaaataaag + 16621 agcacaacac tttttcatgc tgtgttgtgc cttgagtgaa acgaaaggaa tgaattataa + 16681 atatgaaaat agcggtagca ggaacaggtt atgtaggatt gtcaattgcc gtgttgttgg + 16741 cacaacatca cgaaataaaa gcagttgata ttgttgctga aaaagttgaa ttaatcaatc + 16801 aaaaaaaatc tccaattcag gatgattata ttgaaaaata tttagtggaa aaagatttaa + 16861 atttggaagc aactatggat gctaagtatg cttatgaaga tgcagaattt gttgttgttg + 16921 cagcaccaac aaattatgat tcgaaaaaga acttttttga tacatcagca gtagaggcgg + 16981 tcattcaaca agtaaaaaaa attaatccca aagcggtaat aattattaaa tctacaatcc + 17041 ctgttggatt cacagagtcc gttcgaaaga aatatcagta taaaaatatc ctatttagtc + 17101 cagaattttt acgcgaatct aaagcattat acgataacct gtatccaagt cgcatcattg + 17161 ttggaactga cttagaagat acttatttaa aagacaaagc taatatattt gcttccctac + 17221 taaaagaggg ggctattaaa gaagacatag atacactttt catgggagta acggaagctg + 17281 aggcagttaa attatttgcc aatacttacc ttgcgttgcg tgtttcttac tttaatgaat + 17341 tggatactta tgcagaggtg aaaggtttgg atgcaaaagc cattattgat ggtattggcc + 17401 tagatccacg tataggaaat cattataaca atccatcctt tggctacggt gggtattgtt + 17461 tacctaaaga tagtaagcag ttattagcaa attactttga tgtaccacaa aatatgatga + 17521 cggcaactgt tgaaagcaat cgaacgcgta aggattttat cgctcaacgg attttagaaa + 17581 aagctggagt atctgagact gatagtttag atgcgtttaa gaacacacaa gatattgtta + 17641 taggtattta tcgtttaaca atgaaaagta attcggataa cttccgtcac tcctctattc + 17701 aaggtgttat gaaacgattg aaagctaagg gagttacggt tatcatctat gagccaactt + 17761 tgaaggacgg ggaaacattc tttggtaata aagtggtaaa taatctagat aaatttaaag + 17821 aagctagtaa tgttattgta gccaatcgtt ttgaaccttc actagaggat gtgtctaata + 17881 aagtttatag tcgggatatt tttaagcgtg actaataaat atgtccacgt gacgtaatat + 17941 ctattaaatg gataaaatat taataaacat ggcatctata tctttttggg gataataaaa + 18001 ggcatatgat tatctaagtt agtttatata attaagcagt 
tacgtcaact tattttatta + 18061 tgaattatat ataacatgaa tatcattatt aaatgagcac taaatagata acaagaggag + 18121 aaataaatga aatcaatcgg aaagcgaatc aattggatag attttgggaa aggattcgca + 18181 atattttcag ttctagtagg acatgtattg atggggttgt atgaatccaa tattttttca + 18241 attgcaaatg atgtgttatt attattgata actcaaattt atatatttca cataccagtg + 18301 ttttttgccc tgtcaggata cttttttaga cctgtatcag atatgaagga gttttggcat + 18361 tatgctaaaa agaagacgat tattttaggt ataccatatg ttttttattc aattattcac + 18421 ttttgtcttc aaaaggtcgc tggtgcctct gtccgagtac ccactacgat atttaaccta + 18481 ttgaatatct ataaatttcc tctgggagtt tcatggtatc tatatacgtt atggtcgata + 18541 ttgatagttt atggtttact atctgttgtt ttcaaaaatc gtaagtccct tttgttagtt + 18601 agtgtttttg cctatatttt cacactattt attcaaactg atatttttat tgtacaacgg + 18661 acgttggttt ggggtgtttg cttctgtctt ggcagtgtat tgagcgcaat tcactttgat + 18721 aaaattaatt tgaaaaaatt tctttttttc tttgtgctat ttgattttat ttatatgttc + 18781 gcttggtttt tgttttatga agtagggtct aagaaggatt atgtaagcta tagcaaccca + 18841 ggtttgtggg ggattgcttt tattgtctgt gtattagttg cttttgcgat ttttcctaaa + 18901 atggagaaaa attttcctaa aactttccta tatttcacta aatacgggaa agatagttta + 18961 gggatctata ttcttcatgc accaatttgt agcatgattc ggattctaat gttgaaagta + 19021 ggaataaact cagtttttct tcacgttgtt gttgggattg tgctaggctg gtatttatcc + 19081 atactagcaa cttatatatt gaaaaaaatt ccatttttga atattgtttt attaccacaa + 19141 aagtatatta aattaaaata aattattttc ggctctttgt caactgtagt gggttgaaaa + 19201 aaagctaagc ttgagaaagg acaaattttg tcctttcttt tttgatgttc agagcgatga + 19261 aaatccgttt tttgaagttt tcaaagtttc gaaaaccaaa ggcattgcgc ttgataagtt + 19321 tgatgagatt attggtcgct tccagtttgg cgttagaata gtgtagttga agggtgttga + 19381 caagcttttc tttatctttg aggaaggttt taaagacagt ctgaaaaata ggatgaacct + 19441 gcttaagatt gtcctcaata agtccgaaaa atttctccgg ttccttattc tgaaagtgaa + 19501 acagcaagag ttgatagagc tgatagtggt gtttcaagtc ttccgaataa ctcaaaagct + 19561 tgtttaaaat ctctttattg gttaagtgca tacgaaaagt aggacgataa aatcgcttat + 19621 cactcagttt acgactatcc tgttgtatga gcttccagta 
gcgcttgata gccttgtatt + 19681 catgagactt tcgatgaaac tgattcatga tttgaacacg cacacgactc atagcacggc + 19741 taagatgttg tacaatgtga aagcgatcaa gaacgatttt agcattcggg agtgaaacag + 19801 tctgggagac tgtttcagcc tgagcctaga aatttgaaag cgaagctgtt tagccaagtc + 19861 atagtaagga ctaaacatat ccatcgtaat gattttgacg cgacatcgga cggctctatc + 19921 atatttaaga aagtgatctc ggatgacagc ttgtgttcta ccttcaagaa cagtgatgat + 19981 attgagattg ttaaaatctt gcgcaatgaa gctcatcttt ccctttgtaa aagcatactc + 20041 atcccaagac ataatctcag gaagacaaga aaaatcatgt ttaaagtgaa aatcattgag + 20101 cttacgaata acagttgaag ttgaaatgga aagctgatgg gcaatatcag tcatagaaat + 20161 cttttcaatt aacttttgag caatcttttg gttgatgata cgagggattt ggtgattctt + 20221 cttgacgata gaagtttcag cgaccatcat ttttgaacag tgatagcact tgaaacgacg + 20281 ctttctaagg agaattctag taggcatacc agtcgtttca agataaggaa ttttagaagg + 20341 tttttgaaag tcatatttct tcaattggtt tccgcactca gggcaagatg gggcgtcgta + 20401 gtccagtttg gcgatgattt ccttgtgtgt atccttattg atgatgtcta aaatctggat + 20461 attagggtct ttaatgtcta gtaattttgt gataaaatgt aattgttcca tatgattctt + 20521 tctaatgagt tgttttgtcg cttttcatta taggtcatat gggacttttt ttctacacaa + 20581 aaataggctc cataatatcc ataggggatt tacccactac aaatattata gagccttatt + 20641 ttagatttat aatgtgtctc tttgtcaact aacatctgga gaggacaatc actgtcttct + 20701 ccttttttgt cttttcagaa tataccaaat taacacaaaa attctgaaaa ttctgttgac + 20761 aactttctga aaagagtcta taatggagag aaagttttaa aggagaaaat gatgaaaagt + 20821 tcaaaactac ttgcccttgc gggcgtgaca ttattg +// + diff --git a/public/res/serotype_genbank/serotype_9X.gb b/public/res/serotype_genbank/serotype_9X.gb new file mode 100755 index 0000000..bb1a123 --- /dev/null +++ b/public/res/serotype_genbank/serotype_9X.gb @@ -0,0 +1,885 @@ +LOCUS MK606437 22233 bp DNA linear BCT 30-SEP-2020 +DEFINITION Streptococcus pneumoniae strain GPS_US_PATH4387 cps gene cluster, + complete sequence. +ACCESSION MK606437 +VERSION MK606437.1 +KEYWORDS . 
+SOURCE Streptococcus pneumoniae + ORGANISM Streptococcus pneumoniae + Bacteria; Bacillota; Bacilli; Lactobacillales; Streptococcaceae; + Streptococcus. +REFERENCE 1 (bases 1 to 22233) + AUTHORS van Tonder,A.J., Gladstone,R.A., Lo,S.W., Nahm,M.H., du Plessis,M., + Cornick,J., Kwambana-Adams,B., Madhi,S.A., Hawkins,P.A., + Benisty,R., Dagan,R., Everett,D., Antonio,M., Klugman,K.P., von + Gottberg,A., Breiman,R.F., McGee,L., Bentley,S.D. and The Global + Pneumococcal Sequencing,C.O. + TITLE Putative novel cps loci in a large global collection of pneumococci + JOURNAL Microb Genom 5 (7) (2019) + PUBMED 31184299 +REFERENCE 2 (bases 1 to 22233) + AUTHORS van Tonder,A.J. + TITLE Direct Submission + JOURNAL Submitted (06-MAR-2019) Parasites and Microbes, Wellcome Sanger + Institute, Wellcome Genome Campus, Hinxton, Cambridge CB10 1SA, + United Kingdom +COMMENT ##Assembly-Data-START## + Assembly Method :: Velvet v. 1.2 + Sequencing Technology :: Illumina + ##Assembly-Data-END## +FEATURES Location/Qualifiers + source 1..22233 + /organism="Streptococcus pneumoniae" + /mol_type="genomic DNA" + /strain="GPS_US_PATH4387" + /isolation_source="nasopharyngeal swab" + /host="Homo sapiens" + /db_xref="taxon:1313" + /geo_loc_name="Ethiopia" + misc_feature 1..22233 + /note="cps gene cluster" + gene 1..1611 + /gene="dexB" + CDS 1..1611 + /gene="dexB" + /EC_number="3.2.1.70" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3280" + /inference="protein motif:CLUSTERS:PRK10933" + /inference="protein motif:Pfam:PF00128.18" + /inference="protein motif:TIGRFAMs:TIGR02403" + /inference="similar to AA sequence:RefSeq:YP_004326655.1" + /inference="similar to AA sequence:UniProtKB:Q99040" + /note="trehalose-6-phosphate hydrolase; maltooligosyl + trehalose synthase; alpha,alpha-phosphotrehalase; alpha + amylase catalytic domain protein" + /codon_start=1 + /transl_table=11 + /product="glucan 1,6-alpha-glucosidase" + /protein_id="QCO92046.1" + 
/translation="MQEKWWHNAVVYQVYPKSFMDSNGDGVGDLPGITSKLDYLAKLG + ITAIWLSPVYDSPMDDNGYDIADYQAIATIFGTMEDMDQLIAEAKKRDIRIIMDLVVN + HTSDEHAWFVEACENTDSPERDYYIWRDEPNDLDSIFSGSAWEYDEKSGQYYLHFFSK + KQPDLNWENEKLRQKIYEMMNFWIDKGIGGFRMDVIDMIGKIPDEKVVNNGPMLHPYL + KEMNQATFGAKDLLTVGETWGATPEIAKLYSDPKGQELSMVFQFEHIGLQYQEGQPKW + HYQKELNIAKLKEIFNKWQTELGVEDGWNSLFWNNHDLPRIVSIWGNDQEYREKSAKA + FAILLHLMRGTPYIYQGEEIGMTNYPFETLDQVEDIESLNYAREALEKSVPIEEIMDS + IRVIGRDNARTPMQWDESKNAGFSTGQPWLAVNPNYEMINVQEALANPDSIFYTYQKL + VQIRKENSWLIRADFELLDTADKVFAYIRKDGDRRFLVVANLSNEEQDLTVEGKVKSV + LIENTLAQEVFEKQILVPWDAFCVEMTD" + gene 2101..3153 + /gene="tnp" + CDS complement(2101..3153) + /gene="tnp" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3415" + /inference="protein motif:Pfam:PF00665.20" + /inference="similar to AA sequence:RefSeq:YP_003878591.1" + /note="integrase core domain protein" + /codon_start=1 + /transl_table=11 + /product="IS transposase" + /protein_id="QCO92047.1" + /translation="MNETKKYLVIKAIAQGKKTKKRACVELNLSERQINRLLLAYQQK + EKEAFRHGNRNRKPKHAIPDEIKERILKKYLSYQTYKPNVRHFCELLAEEEGIQLSDT + TVRKILYKKNILSPKSHRKTKKRVRKQAKLNPKQPLDNPILPTAENFLEDPKKVHPSR + PRKKFAGELIQMDASPHAWFGVETSNLHLAIDDASGNILGAYFDKQETLNAYYHVLEQ + ILANHGIPLQIKTDKRTVFTYQASNSKKMEDDTHTQFGYACHQLGILLETTSIPQAKG + RVERLNQTLQSRLPIELERNNIHTLEEANTFLPSYIQTFNEQFGNKTKLSVFEEAPKP + SERNLILARLAGESRR" + gene 3330..4775 + /gene="wzg" + CDS 3330..4775 + /gene="wzg" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK09379" + /inference="protein motif:Pfam:PF03816.8" + /inference="protein motif:TIGRFAMs:TIGR00350" + /inference="similar to AA sequence:RefSeq:YP_001835063.1" + /inference="similar to AA sequence:UniProtKB:Q7WY78" + /note="putative transcriptional regulator ywtF; + membrane-bound transcriptional regulator LytR; cell + envelope-related function transcriptional attenuator + common domain; cell envelope-related transcriptional + attenuator domain protein" + /codon_start=1 + 
/transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Cps14A" + /protein_id="QCO92048.1" + /translation="MSRRFKKSRSQKVKRSVNIVLLTIYLLLVCFLLFLIFKYNILAF + RYLNLVVTALVLLVALVGLLLIIYKKAEKFTIFLLVFSILVSSVSLFAVQQFVGLTNR + LNATSNYSEYSISVAVLADSDIENVTQLTSVTAPTGTDNENIQKLLADIKSSQNTDLT + VDQSSSYLAAYKSLIAGETKAIVLNSVFENIIESEYPDYASKIKKIYTKGFTKKVEAP + KTSKNQSFNIYVSGIDTYGPISSVSRSDVNILMTVNRDTKKILLTTTPRDAYVPIADG + GNNQKDKLTHAGIYGVDSSIHTLENLYGVDINYYVRLNFTSFLKMIDLLGGVDVHNDQ + EFSALHGKFHFPVGNVHLDSEQALGFVRERYSLADGDRDRGRNQQKVLVAILQKLTST + EALKNYSTIINSLQDSIQTNMPLETMINLVNAQLESGGNYKVNSQDLKGTGRTDLPSY + AMPDSNLYVMEIDDSSLAVVKAAIQDVMEGR" + gene 4777..5508 + /gene="wzh" + CDS 4777..5508 + /gene="wzh" + /EC_number="3.1.3.48" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG4464" + /inference="protein motif:Pfam:PF02811.13" + /inference="similar to AA sequence:RefSeq:YP_002739714.1" + /inference="similar to AA sequence:UniProtKB:Q54518" + /note="capsular polysaccharide biosynthesis protein; PHP + domain protein" + /codon_start=1 + /transl_table=11 + /product="tyrosine-protein phosphatase wzh" + /protein_id="QCO92049.1" + /translation="MIDIHSHIVFDVDDGPKSREESKALLAESYRQGVRTIVSTSHRR + KGMFETPEEKIAENFLQVREIAKEVADDLVIAYGAEIYYTLDVLEKLEKKEIPTLNDS + RYALIEFSMHTSYREIHTGLNNVLMLGITPVIAHIERYDALENNEKRVRELIDMGCYT + QVNSSHVLNPKLFGERYKFMKKRARYFLERDLVHVVASDMHNLDSRPPYMQQAYDIIA + KKYGAKKAKELFVDNPRKMIMDQLI" + gene 5517..6209 + /gene="wzd" + CDS 5517..6209 + /gene="wzd" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3944" + /inference="protein motif:Pfam:PF02706.9" + /inference="protein motif:TIGRFAMs:TIGR01006" + /inference="similar to AA sequence:RefSeq:YP_001835065.1" + /inference="similar to AA sequence:UniProtKB:P72367" + /note="capsular polysaccharide type 8 biosynthesis protein + cap8A; capsular polysaccharide biosynthesis protein; MPA1 + family polysaccharide export protein; chain length + determinant protein" + 
/codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Cps14C" + /protein_id="QCO92050.1" + /translation="MKEQNTLEIDVLQLFRALWKRKLVILLVAIITSSVAFAYSTFVI + KPEFTSTTRIYVVNRNQEEKSGLTNQDLQAGSYLVKDYREIILSQDVLEEVISDLKLD + LTPKGLANKIKVTVPVDTRIVSVSVNDRVPEEASRIANSLREVAAQKIISITRVSDVT + TLEEARPAISPSSPNIKRNTLIGFLAGGIGTSVIVLLLELLDTHVKRPEDIEDTLQMT + LLGVVPNLSKLK" + gene 6219..6902 + /gene="wze" + CDS 6219..6902 + /gene="wze" + /EC_number="2.7.10.2" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3944" + /inference="protein motif:CLUSTERS:PRK11519" + /inference="protein motif:Pfam:PF01656.17" + /inference="protein motif:TIGRFAMs:TIGR01007" + /inference="similar to AA sequence:RefSeq:YP_001835066.1" + /inference="similar to AA sequence:UniProtKB:Q54520" + /note="tyrosine-protein kinase CpsD; tyrosine kinase; + capsular polysaccharide biosynthesis protein; capsular + exopolysaccharide family protein; CobQ/CobB/MinD/ParA + nucleotide binding domain" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + Cps14D" + /protein_id="QCO92051.1" + /translation="MPTLEIAQKKLEFIKKAEEYYNALCTNIQLSGDKLKVISVTSVN + PGEGKTTTSVNIARSFARAGYKTLLIDGDTRNSVMSGFFKSREKITGLTEFLSGTADL + SHGLCDTNIENLFVIQSGSVSPNPTALLQSKNFNDMIETLRKYFDYIIVDTAPIGIVI + DAAIITQKCDASILVTATGEVNKRDVQKAKQQLEQTEKLFLGVILNKFDVQHKKYGSY + GGYGNYGKK" + gene 6918..8285 + /gene="wchA" + CDS 6918..8285 + /gene="wchA" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK15204" + /inference="protein motif:Pfam:PF02397.10" + /inference="protein motif:TIGRFAMs:TIGR03025" + /inference="similar to AA sequence:RefSeq:YP_001835067.1" + /inference="similar to AA sequence:UniProtKB:P71241" + /note="putative colanic biosynthesis UDP-glucose lipid + carrier transferase; undecaprenyl-phosphate galactose + phosphotransferase; exopolysaccharide biosynthesis + polyprenyl glycosylphosphotransferase; Bacterial sugar 
+ transferase" + /codon_start=1 + /transl_table=11 + /product="glucosyl-1-phosphate transferase" + /protein_id="QCO92052.1" + /translation="MDEKGLKIFLAVLQSIIVILLVYFLSFVRETELERSSMVILYLL + HFFVFYFSSYGNNFFKRGHLVEFNSTIRYIFFFAIAISVLNFFIAERFSISRRGMVYF + LTLEGISLYLLNLLVKKYWKHVFFNLKNSKKILLLTVTKNMEKVLDKLLESDELSWKL + VAVSVLDKSDFQHDKIPVIEKEKIIEFATHEVVDEVFVNLPGESYDIGEIISRFETMG + IDVTVNLKAFDKNLGRNKQIHEMVGLNVVTFSTNFYKTSHVISKRILDICGATIGLIL + FAIASLVLVPLIRKDGGPAIFAQTRIGKNGRHFTFYKFRSMRIDAEAIKEQLMDQNTM + QGGMFKIDNDPRVTKIGRFIRKTSLDELPQFWNVFIGDMSLVGTRPPTVDEYDQYTPE + QKRRLSFKPGITGLWQVSGRSKITDFDDVVKLDVAYIDNWTIWKDIEILLKTVKVVFM + RDGAK" + gene 8291..9034 + /gene="wchO" + CDS 8291..9034 + /gene="wchO" + /EC_number="2.4.1.187" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK03692" + /inference="protein motif:Pfam:PF03808.7" + /inference="protein motif:TIGRFAMs:TIGR00696" + /inference="similar to AA sequence:RefSeq:YP_001693870.1" + /inference="similar to AA sequence:UniProtKB:Q7A714" + /note="putative N-acetylmannosaminyltransferase; putative + UDP-N-acetyl-D-mannosaminuronic acid transferase; + WecB/TagA/CpsF family glycosyltransferase" + /codon_start=1 + /transl_table=11 + /product="UDP-N-acetyl-D-mannosamine transferase WchO" + /protein_id="QCO92053.1" + /translation="MNERMQILGITIDPLTMKETVDAVEQYVLKKHPLHLMGVNADKI + NQCHEDEKIKKIVNESGIINADGASVVLASKFLGTPVPERVAGIDLMQCLLELSNKKG + YSVYFFGAKEEILQDMLKVFKQRYPNLNVVGYRNGYFSPEDEKKIQEDIKGGKPDFVF + VGITSPKKEYIIQSFIDNGINAVFMGVGGSFDVLSGHIKRAPLWMQKLNLEWLFRVVN + EPKRLFKRYFVGNVTFIKRVLDEKRKSKK" + gene 9009..10094 + /gene="wcjA" + CDS 9009..10094 + /gene="wcjA" + /EC_number="2.4.1.11" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG0297" + /inference="protein motif:CLUSTERS:PRK09922" + /inference="protein motif:Pfam:PF00534.14" + /inference="protein motif:TIGRFAMs:TIGR03088" + /inference="similar to AA sequence:RefSeq:NP_344886.1" + /inference="similar to AA 
sequence:UniProtKB:O53279" + /note="putative poly(glycerol-phosphate) + alpha-glucosyltransferase; + UDP-D-galactose:(glucosyl)lipopolysaccharide-1, + 6-D-galactosyltransferase; glycogen synthase; + PEP-CTERM/EpsH1 system-associated sugar transferase, ; + glycosyl transferase group 1 protein" + /codon_start=1 + /transl_table=11 + /product="capsular polysaccharide biosynthesis protein + wcjA" + /protein_id="QCO92054.1" + /translation="MKSENQKNNILHISRTMDIGGAERIVYQLSSDLKDEFDSVHVAS + TGGLWESKLLSKGVQHHKILDVDSKNPLTMVKILSSFYRVIKNNDIIIVHTHHRMAAF + YIRLLKIINPKLIHVYTAHNVFKNKLPLYKFSLKKAYCVAVGKAVNDNLKHDVGISDS + TVIYNGVVFEKTDKLVDEIVNYNGIKLGCIARLSEQKGLTYLIDAMSLVKHRDITLFI + VGDGELRDELENKVKQLNLQKSVIFLGYRKDVVECINSFDYLVSSSLYEGLALNVIEA + FMNGKTMVASDIPGINEVVNNKNGILVPVKDDVALARAIEKLATDKKLREKLAYQAKK + DYETKFNYSLFLDNYRRLYRKLMGESK" + gene 10103..11179 + /gene="mnaA" + CDS 10103..11179 + /gene="mnaA" + /EC_number="5.1.3.14" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG0381" + /inference="protein motif:Pfam:PF02350.13" + /inference="protein motif:TIGRFAMs:TIGR00236" + /inference="similar to AA sequence:RefSeq:YP_004622336.1" + /inference="similar to AA sequence:UniProtKB:P39131" + /note="diacylglycerol glucosyltransferase" + /codon_start=1 + /transl_table=11 + /product="UDP-N-acetylglucosamine 2-epimerase" + /protein_id="QCO92055.1" + /translation="MLVFGTRPEAIKMCPLVNELKQNDSIKTLVCVTGQHKEMLEQVL + EVFKVVPDYDLGIMKANQTLFTITTSILDKIQAVLEKEKPDLVLVHGDTTTTFATALA + AFYMGIKVGHVEAGLRTYNLQSPFPEEFNRQTTSIITDYHFAPTEVAKENLLREDRKN + IFVTGNTVIDALKTTVQDNYHHPILEWAKGSKLIMLTAHRRENLGKPMENMFNAVNRI + LNEFEDVKVVYPIHKNPKVRELASKVFGDNERMKIIEPLEVIDFHNFMNQSYMILTDS + GGVQEEAPSLGKPVLVMRDTTERPEGVVAGTLKLVGTEEGNIYSNFKLLLEDETEYNK + MSKASNPYGDGMTCKRIVDIILEV" + gene 11221..12360 + /gene="wzy" + CDS 11221..12360 + /gene="wzy" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3307" + /inference="protein motif:Pfam:PF04932.9" + /note="O-antigen ligase" + 
/codon_start=1 + /transl_table=11 + /product="lipid A core O-antigen ligase-related enzyme" + /protein_id="QCO92056.1" + /translation="MIKRKIYIICVLLSYFLPSFFTVGSMATLFALLSTLVKLFVTFY + YIPKVLLQHKVTLIDILVVLFLFFQAFAAFQSQTLYLNYVGGQFFLLGLYSFLKHFLL + LDCKTTIKSLFLTFILFLCIQVITQLLFPVGFDSLHPTGDNRLYFLGRKNIATPYIIV + GLGSFYLLNKKMNEFISLKEIIFLGLFGILSFLTQSSTAIICYGLFIFIRLLGLKENI + GKLYSLVSMAVYVCFSLSIIFSQSTILSTFTAIFSKNATFSGRINIWQLAIRIFEENF + EFGRGIEVNFNAWTNGIIVNSAHNTLLDILARTGIFPGVLFVVLLLSLFLGKYRVKSK + TLLTMLISFMVYITMEATSVSILLLIIDICVYWPFGEEKLYEKVT" + gene 12344..13213 + /gene="wcjB" + CDS 12344..13213 + /gene="wcjB" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3594" + /codon_start=1 + /transl_table=11 + /product="fucose 4-O-acetylase-related acetyltransferase" + /protein_id="QCO92057.1" + /translation="MRKLLNAIYYRLFGLYKKIYLQVFGKKTINLLGERANLENELIV + SFTTIPSRLNYLPTMIKSIFNQTIIPNRFIMYVYKDEFEGINLESILETEIENGLEIV + YVDENLRSHKKYFYAMKDNPNSIVVLVDDDIIYPRNTIKKLIASYRIYPQCVSAMRCH + RIKLFSDGSLYPYNQWEYEISGATIPSYFNFFTSGGGTLFPPCTRNEDLFNKKNIREL + SFLSDDVWLNFLVVKNGIKTVKATRYKGTPLTIDDNPEESLVYLNAVYDNNNDKCIRN + MVEYYQINFTEAK" + gene 13213..14637 + /gene="wzx" + CDS 13213..14637 + /gene="wzx" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK10459" + /inference="protein motif:Pfam:PF01943.11" + /inference="similar to AA sequence:UniProtKB:P77377" + /note="colanic acid exporter; polysaccharide biosynthesis + protein" + /codon_start=1 + /transl_table=11 + /product="lipopolysaccharide biosynthesis protein Wzx" + /protein_id="QCO92058.1" + /translation="MNVEKNLKRGIFYTAIGKYSNVVIQLLVTAILSRIISPVEYGIV + AVVNVFLLFFQMLADSGIGPAIVQNKELNKSDLISIFSLTIYSGIVLSCIFALLGYPM + GVLYGETIYVSLFPLLGLCVLFYTITIVPQAILMKTMNFKIVNFLTIFSNIASGLVGV + ILAVSHFGVYSLIFSNIVKAMVLFVALYSKAKINFYWKVSKSSVGKIFEFSKFQFLFN + FWNYFARNLDNLLIGRLISPSDLGYYDKAYQLSLYPNQILSQVVTPALHPIMSNFQDN + ISKIGEVYLQISRIFVIVGIPISAYLYFNAQYVVTFMFGDNWSQSVPVFQILAATIWL + 
QMANSPTGAFYQATNQTKLLFRIGLLTSFINILAIVIGVMLQSIQCVAYMLLISFSLS + LVINTLYLTKKVLNISVQKYIKPILINLTIISPYIMFNLFISDFVNDLILHLSVQFVI + LFLIWGIGMYISGEYRRVFAVIRK" + gene 14650..15840 + /gene="wcjC" + CDS 14650..15840 + /gene="wcjC" + /EC_number="2.4.1.-" + /EC_number="2.4.1.11" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG0297" + /inference="protein motif:CLUSTERS:PRK15484" + /inference="protein motif:Pfam:PF00534.14" + /inference="protein motif:TIGRFAMs:TIGR04157" + /inference="similar to AA sequence:RefSeq:YP_815839.1" + /inference="similar to AA sequence:UniProtKB:O53279" + /note="glycogen synthase; lipopolysaccharide + 1,2-N-acetylglucosaminetransferase; glycosyltransferase, + GG-bacteroidales peptide system; glycosyl transferase + group 1 protein" + /codon_start=1 + /transl_table=11 + /product="glycoside hydrolase family protein" + /protein_id="QCO92059.1" + /translation="MKILFVNMFYNEAGGAQKSTKFLAEQLVKEGHEVFAYSDDAIDS + DIDEVINGVKVFRRRTPLFSLHYIFSAKKNPAKHFFYKIFEIYNVFAKRKFINIMEEV + QPDIVHFNTISGMSLSIVKEAKKRNIRTVWTLRDYWLEYPWGEKDISLIKLLNRIYRP + FVKKSLRHLDIVTAPSAFTLNNFINKGFINPSSQKCMVIENAVIFSKGKLENIIKQKQ + ETKRNPEKTNFLFVGSILEIKGVFNLVKAFKKLTSPEISLKIVGKGKDLEKLQKEIES + DPRIQYLGFQDTETLYKTYQNSDVLVVPSAWDEPFGRVVIEGNANGLPVITSDRGGLP + EIVQTVGGGEVFTDESGNTLYSFLKKFVEMENYNVYYQCILENIDIYSIEKQSKKFTN + LYLD" + gene 15918..17150 + /gene="ugd" + CDS 15918..17150 + /gene="ugd" + /EC_number="1.1.1.22" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:CLUSTERS:PRK15057" + /inference="protein motif:Pfam:PF03721.8" + /inference="protein motif:TIGRFAMs:TIGR03026" + /inference="similar to AA sequence:RefSeq:YP_006742606.1" + /inference="similar to AA sequence:UniProtKB:P76373" + /note="nucleotide sugar dehydrogenase; + UDP-glucose/GDP-mannose dehydrogenase family NAD-binding + domain protein" + /codon_start=1 + /transl_table=11 + /product="UDP-glucose 6-dehydrogenase" + /protein_id="QCO92060.1" + 
/translation="MKIAVAGTGYVGLSIAVLLAQHHEIKAVDIVAEKVELINQKKSP + IQDDYIEKYLVEKDLNLEATMDAKYAYEDAEFVVVAAPTNYDSKKNFFDTSAVEAVIQ + QVKKINPKAVIIIKSTIPVGFTESVRKKYQYKNILFSPEFLRESKALYDNLYPSRIIV + GTDLEDTYLKDKANIFASLLKEGAIKEDIDTLFMGVTEAEAVKLFANTYLALRVSYFN + ELDTYAEVKGLDTKAIIDGIGLDPRIGNHYNNPSFGYGGYCLPKDSKQLLANYFDVPQ + NMMTATVESNRTRKDFIAQRILEKAGVSETDSLDAFKNIQDIVIGIYRLTMKSNSDNF + RHSSIQGVMKRLKAKGVTVIIYEPTLKDGETFFGNKVVNNLDKFKEASNVIVANRFEP + SLEDVSNKVYSRDIFKRD" + gene 17369..17752 + /gene="tnp" + CDS 17369..17752 + /gene="tnp" + /inference="ab initio prediction:Prodigal:2.60" + /inference="similar to AA sequence:RefSeq:YP_008084845.1" + /codon_start=1 + /transl_table=11 + /product="mobile element protein" + /protein_id="QCO92061.1" + /translation="MNYEASKQLTDARFKRLVGVQRTIFEEMLAVLKTAYQLKHAKGG + RKPKLSLEDLLMATLQYVREYRTYEQIAADFGIHESNLIRRRQWVEVTLVQSGVTISK + THLSAENTVIVDATEVKINRPKKIN" + gene 17786..18175 + /gene="tnp" + CDS 17786..18175 + /gene="tnp" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3293" + /inference="protein motif:Pfam:PF01609.15" + /inference="similar to AA sequence:RefSeq:YP_003879974.1" + /note="transposase DDE domain protein" + /codon_start=1 + /transl_table=11 + /product="transposase" + /protein_id="QCO92062.1" + /translation="MEPQAIVTSQGRIVSLDIAVNYCHDIKLFKMSRKNIGQAGKILA + DSGYQGLMKIYPQAQTPRKSSKLKPLTAEDKAYNHALSKERSKVENIFAKVKTFKMFS + TTYRNHRKRFGLRMNLIAGIINHELGF" + gene 18316..18555 + /gene="tnp" + CDS 18316..18555 + /gene="tnp" + /inference="ab initio prediction:Prodigal:2.60" + /inference="similar to AA sequence:RefSeq:YP_001836149.1" + /codon_start=1 + /transl_table=11 + /product="IS66 family Orf1" + /protein_id="QCO92063.1" + /translation="MELLLYTISKVKLLEDILMPQPIVPVEIPQSRPFDSKKRNDILL + KIRIGKLELSFFQSLNLEMIEQLLDKVLLYDNSSI" + gene 18536..18859 + /gene="tnp" + CDS 18536..18859 + /gene="tnp" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG3436" + /inference="protein motif:Pfam:PF05717.7" + 
/inference="similar to AA sequence:RefSeq:YP_002037914.1" + /note="transposase IS66 Orf2-like protein" + /codon_start=1 + /transl_table=11 + /product="IS66-Spn1 transposase" + /protein_id="QCO92064.1" + /translation="MTIHLSSLGQVYLVCGKTDMRQGIDSLAYLVKTHFELDSFSGQV + FLFCGGRKDRFKALYWDGQGFWLLYKRFENGRLTWPSTEKDVKALTPEQVDWLMKGFS + ITPKI" + gene 19232..19489 + /gene="tnp" + CDS 19232..19489 + /gene="tnp" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Pfam:PF13005.1" + /inference="similar to AA sequence:RefSeq:YP_002736396.1" + /note="putative helix-turn-helix transposase IS66" + /codon_start=1 + /transl_table=11 + /product="transposase" + /protein_id="QCO92065.1" + /translation="MEMFPVETEEITYKRKKSKGKRQALIAQFDSEEVHHQVEERICP + DCQGDLKEIGATLQRQELVFIPAKLKRIDHIQHAYKCQASR" + gene 20251..22233 + /gene="aliA" + CDS 20251..22233 + /gene="aliA" + /inference="ab initio prediction:Prodigal:2.60" + /inference="protein motif:Cdd:COG4166" + /inference="protein motif:CLUSTERS:PRK15104" + /inference="protein motif:Pfam:PF00496.16" + /inference="protein motif:TIGRFAMs:TIGR02294" + /inference="similar to AA sequence:RefSeq:YP_001835080.1" + /inference="similar to AA sequence:UniProtKB:P31306" + /note="76 kDa cell surface lipoprotein; oligopeptide ABC + transporter substrate-binding protein OppA; ABC-type + oligopeptide transport system, periplasmic component; + nickel ABC transporter, nickel/metallophore periplasmic + binding protein; Bacterial extracellular solute-binding + proteins, family 5 Middle" + /codon_start=1 + /transl_table=11 + /product="oligopeptide ABC transporter + oligopeptide-binding protein AliA" + /protein_id="QCO92066.1" + /translation="MKSSKLFALAGVTLLAATTLAACSGSGSSTKGEKTFSYIYETDP + DNLNYLTTAKAATANITSNVVDGLLENDRYGNFVPSMAEDWSVSKDGLTYTYTIRKDA + KWYTSEGEEYAAVKAQDFVTGLKYAADKKSDALYLVQESIKGLDAYVKGEIKDFSQVG + IKALDEQTVQYTLNKPESFWNSKTTMGVLAPVNEEFLNSKGDDFAKATDPSSLLYNGP + YLLKSIVTKSSVEFAKNPNYWDKDNVHVDKVKLSFWDGQDTSKPAENFKDGSLTAARL + 
YPTSASFAELEKSMKDNIVYTQQDSITYLVGTNIDRQSYKYTSKTSDEQKASTKKALL + NKDFRQAIAFGFDRTAYASQLNGQTGASKILRNIFVPPTFVQADGKNFGDMVKEKLVT + YGDEWKDVNLADSQDGLYNPEKAKAEFAKAKSALQAEGVTFPIHLDMPVDQTATTKVQ + RVQSMKQSLEATLGADNVVIDIQQLQKDEVNNITYFAENAAGEDWDLSDNVGWGPDFA + DPSTYLDIIKPSVGESTKTYLGFDSGEDNVAAKKVGLYDYEKLVTEAGDETTDVAKRY + DKYAAAQAWLTDSALIIPTTSRTGRPILSKMIPFTIPFALSGNKGTSEPILYKYLELQ + DKAVTVDEYQKAQEKWMKEKEESNKKAQEDLAKHVK" +ORIGIN + 1 atgcaagaaa aatggtggca taatgccgta gtctatcaag tctatccaaa gagttttatg + 61 gatagtaatg gagatggagt tggtgattta ccaggtatta ccagtaagtt ggactatcta + 121 gctaagttag gaatcacagc gatttggctt tctcccgttt atgacagccc tatggatgat + 181 aatggctacg atattgctga ttatcaagcg attgcaacga tttttggaac catggaggat + 241 atggatcaac tgattgcgga agctaagaag cgtgacattc gtatcatcat ggacttggtg + 301 gttaatcata cctcagatga acatgcttgg tttgtcgaag cctgtgaaaa tactgatagc + 361 cctgagcgag actactatat ctggcgcgat gaacccaatg acctagattc tatctttagt + 421 gggtctgctt gggaatacga tgaaaagtca ggtcaatact atctccactt tttcagcaag + 481 aaacagccgg atctcaactg ggaaaatgaa aaacttcgcc agaaaattta tgagatgatg + 541 aacttctgga ttgataaagg tattggtggt ttccgtatgg atgttattga catgattggc + 601 aaaattcctg acgagaaggt agtcaataat ggtcctatgc tccatcccta tctcaaggaa + 661 atgaatcagg cgacctttgg agctaaggat ctcttgacag taggggagac ttggggagca + 721 acgccagaga ttgccaagct ctactctgat ccaaaggggc aagaattgtc tatggtcttc + 781 cagtttgaac atatcggtct tcagtatcag gaaggtcaac ctaaatggca ctatcaaaaa + 841 gagctgaata tcgctaagtt aaaagaaatc ttcaacaaat ggcagacaga gttaggagtt + 901 gaggacggct ggaattccct cttctggaac aaccatgacc tccctcgtat tgtctcaatc + 961 tggggaaatg accaagaata ccgcgaaaaa tctgccaaag cctttgcaat cttacttcat + 1021 ctcatgagag gaactcctta tatctaccaa ggtgaggaga ttgggatgac caactatccg + 1081 tttgaaacac tggatcaagt agaagatatt gaatccctca actatgcgcg tgaggctctt + 1141 gaaaaaagtg ttccgattga agaaatcatg gacagtatcc gtgttattgg acgtgacaat + 1201 gcccgtaccc ctatgcaatg ggacgagagc aaaaacgctg gtttctcaac aggtcaacct + 1261 tggttggcgg ttaatccaaa ttacgagatg atcaatgtcc aagaagcgct ggcaaatcca + 
1321 gattctattt tctataccta tcagaaactg gtccaaattc gcaaggagaa tagctggcta + 1381 attcgagctg actttgaatt gcttgatacg gctgataagg tctttgctta tatacgtaag + 1441 gatggcgacc gtcgcttcct agttgtggct aacttgtcca atgaagagca agacttgaca + 1501 gtagaaggaa aagtcaaatc tgtcttgatt gaaaacaccc tagctcaaga agtctttgaa + 1561 aaacaaatct tagttccatg ggatgctttc tgtgtggaaa tgactgacta gaatgagcaa + 1621 acctcaagtt tttgaagctt gaggtttttt actatagtgg attgaaacta gaatagtgca + 1681 cctctgcttc taaaacattg ttagaaatcg atttgactgt cccgatcgat ttgtcctatt + 1741 cttatttcat tttgctatac ttgtagttga ggagaattaa gctcctcact agtaaactct + 1801 tcataatcct ttttattttt atgaagatat tgtttgaaag atgtgagttt ccacggatgg + 1861 gtttgtggag ggatatactt gcgtctttct tttttttgtt ctggttcttg ttcaaagttt + 1921 ttcgaataga gttcatgatt tagtagctcc tttgtgtgat agattttgtc agcgatattg + 1981 aggtagatgt caccatcaaa tgcttttata actaatgctt ttgtctttct gatgaaatag + 2041 acttcttttc cttgctcggt agggatatag caacgatttt ggaatcggat atggtgtcca + 2101 ctatcgacga ctctctcccg ccagtctagc tagaatgaga tttcgttcag agggcttagg + 2161 agcctcctca aagacagaga gttttgtctt gtttccaaac tgttcattaa aggtttggat + 2221 ataggaaggt agaaaggtat tggcttcttc caaggtatga atattgtttc gttccagttc + 2281 gataggcagg cgagattgta gtgtctgatt gagtctttcg actctccctt tagcttgagg + 2341 gatagaggtt gtctcaagga gaattcccag ttggtgacag gcgtatccaa attgtgtatg + 2401 ggtgtcgtcc tccattttct tagagttgga ggcttgatag gtaaaaacag ttctcttatc + 2461 tgttttaatt tgaagaggaa tgccgtggtt ggctaagatt tgttcgagga catgatagta + 2521 agcattcaag gtctcttgtt tgtcaaaata agcgcctagg atattgccag aagcatcatc + 2581 aatggctagg tgtaagttag aggtttctac tccaaaccag gcatgagggc tggcatccat + 2641 ttggatgagt tctccagcaa atttttttct gggtctacta ggatgtacct ttttagggtc + 2701 ttccaggaag ttttcagctg tcggtaagat tggattgtct aggggttgct tggggttcag + 2761 tttagcttgt tttcttactc tcttctttgt ctttctgtga gacttaggcg acaggatatt + 2821 tttcttatag agtatttttc taacagttgt atcagagagc tgaattcctt cttcttcagc + 2881 tagcaattca cagaaatgac ggacatttgg tttatatgtt tgataggaga ggtatttctt + 2941 taggatacgt tctttgattt 
catcagggat tgcatgtttt ggttttcgat ttctgtttcc + 3001 gtgtctgaag gcttcttttt ctttctgttg ataggctagt agcagacgat tgatttgtct + 3061 ttcagaaaga ttgagttcga cacaggcccg tttctttgtt ttctttcctt gggctatagc + 3121 ttttatcaca agatattttt tcgtttcatt catattcagt tggatccttt tcatatgact + 3181 attctaccaa atgggacatt ttcacgttcg atttactaaa gacattatca ccttcgaatc + 3241 acaaagatgc agatagtgaa aataaaggtg tagacattac cgtaaaaaag tgatataatc + 3301 gtatgatgtt caaggtatag gtgttaatca tgagtagacg ttttaaaaaa tcacgttcac + 3361 agaaagtgaa gcgaagtgtt aatatcgttt tgctgactat ttatttattg ttagtttgtt + 3421 ttttattgtt cttaatcttt aagtacaata tccttgcttt tagatatctt aacctagtgg + 3481 taactgcgtt agtcctacta gttgccttgg tagggctact cttgattatc tataaaaaag + 3541 ctgaaaagtt tactattttt ctgttggtgt tctctatcct tgtcagctct gtgtcgctct + 3601 ttgcagtaca gcagtttgtt ggactgacca atcgtttaaa tgcgacttct aattactcag + 3661 aatattcaat cagtgtcgct gttttagcag atagtgatat cgaaaatgtt acgcaactga + 3721 cgagtgtgac agcaccgact gggactgata atgaaaatat tcaaaaacta ctagctgata + 3781 ttaagtcaag tcagaatacc gatttgacgg tcgaccagag ttcgtcttac ttggcagctt + 3841 acaagagttt gattgcaggg gagactaagg ccattgtctt aaatagtgtc tttgaaaata + 3901 tcatcgagtc agagtatcca gactacgcat cgaagataaa aaagatttat accaagggat + 3961 tcactaaaaa agtagaagct cctaagacgt ctaagaatca gtctttcaat atctatgtta + 4021 gtggaattga cacctatggt cctattagtt cggtgtcgcg atcagatgtc aatatcctga + 4081 tgactgtcaa tcgagatacc aagaaaatcc tcttgaccac aacgccacgt gatgcctatg + 4141 taccaatagc agatggtgga aataatcaaa aagataaatt aacccatgcg ggcatttatg + 4201 gagttgattc gtccattcac accttagaaa atctctatgg agtggatatc aattactatg + 4261 tgcgattgaa cttcacttct ttcttgaaaa tgattgactt attgggaggg gtagatgttc + 4321 ataatgatca agagttttca gctctacatg ggaagttcca tttcccagta gggaatgtcc + 4381 atctagactc tgagcaggct ctaggttttg tacgtgaacg ctactcacta gccgatggag + 4441 accgtgaccg tggtcgcaac caacaaaagg tgcttgtggc tatccttcaa aaattaacgt + 4501 caaccgaagc actgaaaaat tatagtacga tcattaatag cttgcaagat tctatccaaa + 4561 caaatatgcc acttgagact atgataaatt tggtcaatgc 
tcagttagaa agtggaggga + 4621 attataaagt aaattctcaa gatttaaaag ggacaggtcg gacggatctt ccttcttatg + 4681 caatgccaga cagtaacctc tatgtgatgg aaatagatga tagtagttta gctgtagtta + 4741 aagcagctat acaggatgtg atggagggta gatgaaatga tagacatcca ttcgcatatc + 4801 gtttttgatg tagatgacgg tcccaagtca agagaagaaa gcaaggctct cttggcagaa + 4861 tcctacaggc agggggtgcg aaccattgtc tctacctctc accgtcgcaa gggcatgttt + 4921 gaaactccgg aagagaagat agcagaaaac tttcttcagg ttcgggaaat tgcaaaagaa + 4981 gtagcagatg atttagtcat tgcttatggc gcagagatat actatactct ggatgttcta + 5041 gaaaagctag aaaaaaaaga aatccctacc cttaatgata gtcgttatgc tttgattgag + 5101 tttagcatgc atacttccta tcgtgagatt catacgggat tgaacaatgt tttgatgttg + 5161 ggaatcacgc cagtcattgc ccacatcgag cgctatgatg ctcttgaaaa taatgaaaaa + 5221 cgcgttcggg aactgatcga tatgggctgt tacacgcaag taaatagttc acatgtcctc + 5281 aaccccaaac tttttggcga acgttataaa ttcatgaaaa agagagctcg gtattttttg + 5341 gaacgtgatt tagttcatgt ggttgcaagt gacatgcaca atttagacag tagacctcca + 5401 tatatgcaac aggcatatga tatcattgct aagaaatatg gagcgaaaaa agcgaaagag + 5461 ctttttgtag ataatcccag aaaaatgata atggatcaat taatttagga gaaaacatga + 5521 aggaacaaaa cactttagaa atcgatgtat tgcaactatt cagagcttta tggaaaagaa + 5581 agttggtcat tttattagtg gcaattataa cttcttcagt tgcttttgcc tacagtactt + 5641 ttgttatcaa acctgagttt actagtacga ctcggattta tgtagttaac cgtaatcagg + 5701 aagagaagtc tggtttaact aatcaagact tgcaggcagg atcatacttg gttaaagact + 5761 atcgtgaaat tatcctatcg caggatgttt tggaggaagt tatttctgat ttgaaactag + 5821 atttgacgcc aaaaggtttg gctaataaaa ttaaagtaac agtaccagtt gatacccgta + 5881 ttgtctctgt ttcagttaat gatcgagttc ctgaagaggc aagccgtatc gctaattctt + 5941 tgagagaagt agctgctcaa aaaattatca gtattactcg tgtttctgat gtgacaacac + 6001 tggaggaggc aagaccggcg atatcaccgt cttcgccaaa tattaaacgc aatacactaa + 6061 ttggtttttt ggcagggggg attggaacta gtgttatagt tcttcttctt gaacttttgg + 6121 acactcatgt gaaacgtccg gaagatatcg aagatacact gcagatgaca cttttgggag + 6181 ttgtaccaaa cttgagtaag ttgaaatagg agagaggaat gccgacatta gaaatagcac + 6241 
aaaaaaaact ggagttcatt aagaaggcag aagaatatta caatgccttg tgtacaaata + 6301 tacagttgag cggagataaa ctaaaagtaa tttccgttac ttctgttaac cctggggaag + 6361 gaaaaacaac tacttccgta aatatagcaa ggtcgtttgc gcgtgcaggc tataaaactc + 6421 ttttgatcga tggcgatact cgaaattcag ttatgtcagg attttttaaa tcgcgtgaaa + 6481 aaattacagg gctaacagaa tttttatctg ggacagctga tttatctcac ggtttatgtg + 6541 atacaaatat tgaaaattta tttgtaattc aatcgggatc tgtatcacca aaccctacag + 6601 ccttgttaca aagtaaaaat tttaatgata tgattgaaac attgcgtaaa tattttgatt + 6661 atatcattgt tgatacagca cctattggaa ttgttattga tgcggcaatt atcactcaaa + 6721 agtgtgatgc gtccatcttg gtaacagcaa caggtgaggt gaataaacgt gatgtccaaa + 6781 aagcgaaaca acaattagaa caaacagaga aactgttttt aggtgtcatt ctcaataaat + 6841 ttgatgttca acataaaaaa tatggttctt acggtggcta tggtaattat ggtaaaaaat + 6901 aacttaggaa agattttatg gatgaaaaag gattgaaaat ttttctggca gtattacaga + 6961 gtattattgt cattttattg gtttattttc ttagctttgt tagagagacg gaacttgaac + 7021 gttcttcgat ggttatacta taccttctcc acttttttgt attctatttt agttcctatg + 7081 gtaacaattt ttttaaaaga gggcacttag ttgagtttaa tagtactata agatatattt + 7141 ttttctttgc aatagctata agtgtattaa acttttttat agcggaacgg tttagtatct + 7201 ctagaagagg aatggtatac ttcttaactt tagaaggaat atccttatac ttgttaaatt + 7261 tattagtaaa gaaatattgg aagcatgtgt tttttaatct aaaaaatagc aagaaaattt + 7321 tactgttaac agtaacaaaa aatatggaaa aagttcttga taaattgcta gaatctgatg + 7381 aactttcatg gaaattggta gcagtaagtg ttttggataa atctgatttt caacatgata + 7441 aaatacctgt aattgaaaag gaaaaaatta ttgaatttgc aacgcatgaa gttgtggatg + 7501 aggtgtttgt caatcttcca ggagagagct acgatattgg agaaattatc tctaggtttg + 7561 agacaatggg gatagatgta actgtaaatc ttaaagcatt tgataagaat ttgggtcgca + 7621 ataaacaaat tcatgagatg gtaggattga atgtagtcac tttctctaca aatttttata + 7681 aaactagtca tgtgatttca aagagaattc tcgatatttg tggtgccact attggcctta + 7741 ttctttttgc tatagctagt ctagttttag ttccattgat tcgtaaagat ggcggaccag + 7801 ctatttttgc tcaaactcgt atagggaaaa atggtcgaca ttttaccttt tataagttcc + 7861 gttcgatgcg gatcgatgct 
gaagctatca aagaacagtt gatggatcaa aatacgatgc + 7921 aaggtggtat gtttaagata gacaatgatc ctcgtgttac aaaaattggt cgctttattc + 7981 gtaaaaccag tttggatgaa ttgccacaat tttggaatgt ctttatagga gatatgagtt + 8041 tggtgggaac acgtccacct acagtagacg agtatgatca gtatactcca gaacagaaac + 8101 gtcgactcag ctttaaacct ggtattacag gtttatggca ggttagcggc cgtagtaaaa + 8161 taaccgattt tgacgatgtt gtaaaattag atgtggctta tattgataat tggacaatct + 8221 ggaaagatat tgaaattttg cttaaaactg ttaaagttgt atttatgaga gatggagcga + 8281 agtaattcat atgaatgaga gaatgcaaat attaggaatt actatagatc cattaacgat + 8341 gaaagaaaca gtggatgctg ttgaacagta tgttttaaag aagcatcctt tgcacttgat + 8401 gggagttaac gcagataaaa ttaatcagtg ccatgaagat gagaaaatca aaaaaatcgt + 8461 taatgaatca ggaatcatta atgcggatgg agcatcagtt gttcttgcaa gtaagttttt + 8521 aggaacgcct gttcctgaac gagtagcggg tattgatttg atgcaatgtc ttttagagtt + 8581 gtcaaataaa aaaggatatt cagtttactt ttttggagcc aaagaagaaa ttttacaaga + 8641 tatgctaaaa gtttttaaac aaagatatcc taatcttaat gttgttggct atagaaacgg + 8701 atatttttca cctgaagatg aaaaaaagat tcaggaagat attaaaggag gaaaaccaga + 8761 ttttgtattt gtagggatta cttctcctaa aaaggaatat atcatccaat cattcataga + 8821 taatgggatt aatgctgtct ttatgggtgt tggtggcagt tttgatgtat tatcaggaca + 8881 cattaaacga gctccattat ggatgcaaaa attgaatctg gaatggttgt tccgtgtagt + 8941 taatgaaccc aaacgccttt ttaagcgtta ttttgtaggg aatgttactt ttattaagcg + 9001 agttttagat gaaaagcgaa aatcaaaaaa ataatattct acatatttct cgtacaatgg + 9061 atattggtgg tgcagaacgt attgtatatc aattgagttc tgatttgaaa gatgaatttg + 9121 atagtgtcca tgtcgcttca acaggtggac tatgggagag caaactttta tcaaaaggag + 9181 ttcaacatca taaaatttta gatgttgaca gtaagaatcc cctaactatg gtaaagatcc + 9241 tttcaagttt ttatagagtt atcaaaaata atgatattat cattgttcac actcatcatc + 9301 ggatggctgc cttttatatt cgcttgttga aaatcattaa tcctaagttg atacatgttt + 9361 acactgcaca taatgtattt aaaaataaat taccattata caaattttcc ttaaaaaaag + 9421 cgtactgtgt agctgtgggt aaagcggtta atgataattt gaaacatgat gtaggaatca + 9481 gtgatagtac agtaatctat aatggggttg tttttgaaaa 
aactgataag ctagttgatg + 9541 agattgtaaa ctataacgga atcaaattgg ggtgtattgc taggttatca gagcaaaaag + 9601 gattgaccta cctaattgat gcgatgtctt tagtgaaaca cagggatatt acgttgttca + 9661 ttgtcggaga tggagagctt cgagatgagc ttgaaaacaa ggtgaaacaa ttaaatcttc + 9721 aaaaatcagt gatattttta ggttatcgaa aagatgttgt tgaatgtatc aatagttttg + 9781 attacttagt gtcatcatct ttatatgagg ggttggctct aaatgtaatt gaagcattta + 9841 tgaatgggaa aacgatggtt gcatcagata tccccggaat aaatgaagta gtcaataaca + 9901 aaaatgggat tcttgttcct gttaaggatg atgttgcctt agcgagagcg attgaaaagc + 9961 ttgcgactga caaaaaactt agagaaaaac tcgcttatca agcaaaaaaa gattatgaga + 10021 caaaatttaa ttattccttg tttttggata attatcggag actttataga aaattaatgg + 10081 gagaatcaaa atgaaaaaag tcatgttggt ttttgggaca cgtccagaag ctattaaaat + 10141 gtgtccttta gtaaatgaac tgaaacaaaa tgattcaatc aagacacttg tgtgtgtaac + 10201 tggtcaacat aaggaaatgt tagagcaggt tttagaggtg ttcaaggttg tcccagatta + 10261 tgatttgggt atcatgaaag caaatcaaac cctatttacc attacgacta gtatcttgga + 10321 taaaattcag gcggttctag agaaagaaaa accagatctt gttcttgttc atggagatac + 10381 gacaacaaca tttgcgacag ctttagcagc attttatatg ggaatcaaag tgggacacgt + 10441 cgaagcaggt ctcagaacct ataatctcca aagtccattt ccagaggaat tcaatcgcca + 10501 gacaacttct atcattaccg actatcattt tgcgccgact gaagttgcga aggaaaatct + 10561 actaagagag gacagaaaaa atatctttgt gacgggaaat acagtcattg atgctttgaa + 10621 gacgactgtt caagataact accatcaccc aattttagaa tgggcaaagg gtagtaagtt + 10681 aatcatgcta acagctcatc gacgagaaaa tcttgggaaa ccgatggaaa acatgtttaa + 10741 tgctgttaat cgaattttaa acgaattcga agatgtaaaa gttgtatatc ccatccataa + 10801 aaatcctaag gttcgagaat tagcaagtaa agtttttggc gataatgaac gaatgaaaat + 10861 cattgaaccg ttagaggtta ttgattttca taattttatg aatcaaagct atatgatttt + 10921 gacagattct ggaggtgtac aggaagaagc accttcttta ggaaaacctg tcttggtgat + 10981 gcgtgataca acagagcgtc ctgaaggggt cgttgctggc acattgaagt tggtaggaac + 11041 agaagaaggg aatatctata gtaacttcaa acttcttctt gaagatgaaa cagaatataa + 11101 caagatgagc aaagctagca acccttatgg agatggaatg 
acttgtaaac ggattgttga + 11161 tattattctg gaagtataaa aataattcaa ttatgaatga ggaaagaata aattagattg + 11221 atgataaaaa gaaaaatata tataatctgt gtattgctgt cgtatttttt acctagtttt + 11281 tttacagttg gatcaatggc gactttattt gctttgcttt ctactttagt taagctattt + 11341 gtgacttttt attatattcc caaagttctt ttacagcata aagtaacact gattgatatt + 11401 ctagttgttc tatttttatt ttttcaagca tttgcagctt ttcaaagcca aacgttgtac + 11461 cttaactacg ttggaggtca gtttttcctt ttaggactat attcattttt aaaacacttt + 11521 ttattgttgg attgtaaaac aacaataaaa agcctctttt taacctttat cttgtttttg + 11581 tgtattcaag taataactca attgcttttt ccggtcggtt tcgattcttt gcaccctaca + 11641 ggagataata gactttactt tttaggaaga aagaacatag ctaccccgta tatcattgtt + 11701 ggattaggta gtttttactt attaaataaa aaaatgaatg agttcatatc actaaaggag + 11761 attatttttt taggattgtt cggaatttta tcatttttaa cacaatccag tacagcgatt + 11821 atatgttatg ggctttttat tttcatacgt ctattgggat taaaggaaaa tataggaaaa + 11881 ctatattctt tagtcagtat ggctgtatat gtttgttttt ctctttctat aattttttca + 11941 caaagtacaa ttttatcaac ttttacagcg attttttcca aaaatgcaac tttttcagga + 12001 cgtatcaata tttggcaatt agcgattcgt atttttgaag agaattttga gtttggacga + 12061 gggatcgaag ttaattttaa tgcttggaca aacgggatta tcgttaactc tgcacacaat + 12121 accttattag atatacttgc tcgaacgggt atatttccag gtgttttatt tgtagtgctt + 12181 cttctaagtt tatttcttgg aaaatataga gtaaaatcaa aaacgctact gacaatgttg + 12241 atttcattca tggtttatat tacgatggag gctacatctg taagtattct tctattaata + 12301 attgatattt gtgtgtattg gccttttgga gaggagaaat tatatgagaa agttacttaa + 12361 tgcaatctat tatcgactat ttggattata taaaaaaatt tatctacaag tttttggtaa + 12421 aaaaacaatt aatcttttgg gcgaaagagc taatttagaa aatgaactaa ttgtttcatt + 12481 tacaacaatt ccaagtcgtc ttaattattt accaactatg attaaaagca tttttaatca + 12541 gacaattatt cctaaccgtt ttattatgta tgtttataaa gatgaatttg aaggtattaa + 12601 tttggagagt atcctagaaa ctgaaatcga aaatggttta gagattgtgt atgtggacga + 12661 aaatcttcgc tcacataaaa aatattttta tgctatgaag gataatccga atagtatagt + 12721 tgttctagtt gatgacgata tcatttatcc tcgaaatact 
ataaagaaac tgattgcatc + 12781 ctatagaatt tatccacagt gtgtttcagc aatgcgatgt catcgaatta agttgttttc + 12841 tgatggaagt ttatatccat ataatcaatg ggaatatgaa atatcaggag ctactatacc + 12901 atcgtatttt aattttttta ctagcggagg tgggacatta tttcctccat gtactcgcaa + 12961 tgaggatctt tttaataaaa aaaatatcag ggaacttagt tttctatctg atgatgtatg + 13021 gttgaatttt ttggtagtca aaaatggaat taaaacagta aaagcaacac gatataaagg + 13081 gacaccatta actatagatg acaatcctga ggagagtttg gtatatttga atgccgtata + 13141 tgataacaac aatgataaat gtattagaaa tatggttgaa tattatcaaa ttaattttac + 13201 agaggctaaa taatgaatgt tgaaaaaaat ttgaaacgtg gaattttcta tactgcaata + 13261 gggaagtatt cgaatgtagt tattcaatta cttgtaacag caattcttag ccggattatc + 13321 tcacctgtag aatatggtat cgtagcagta gtaaatgtat ttcttttatt ttttcaaatg + 13381 ttagcagatt caggaatagg acctgctatt gttcaaaata aagaactgaa taagtcagat + 13441 ttaatcagca ttttctcatt aacgatttat agtggaatcg tactttcttg tatttttgct + 13501 ttactaggat atcctatggg ggtgttatac ggcgaaacta tttatgttag tttatttccg + 13561 cttttaggtc tttgtgtttt attttatacc attacaattg taccgcaagc tattctaatg + 13621 aaaacgatga actttaaaat agttaatttt ctaactattt tttctaacat tgctagtggc + 13681 ttggtgggcg ttattttagc ggtatcacat tttggtgtct attctctaat tttttctaat + 13741 attgtaaaag caatggtttt atttgtcgct ttatattcta aagcaaagat aaatttctat + 13801 tggaaagttt caaaaagttc tgttggtaaa atttttgagt tttcaaaatt ccaatttttg + 13861 tttaattttt ggaattattt tgctagaaat ttagataatt tattaattgg acgattgatt + 13921 agcccgtcag atcttggtta ttatgataag gcttatcaat tatctttgta ccctaatcaa + 13981 attttatcac aggttgtgac accagcattg catcctatta tgtccaattt tcaagataat + 14041 atcagtaaga taggcgaagt ttatcttcag atttctagaa tattcgtaat agttggcata + 14101 cctatttcgg cttatttata ctttaatgct caatatgttg ttacatttat gtttggagat + 14161 aattggtccc aaagcgttcc agtgtttcaa atattagcag caacaatttg gttacaaatg + 14221 gctaatagtc ctactggtgc attttaccaa gcaactaatc agacaaagtt attgtttaga + 14281 attggcttat tgacatcttt tattaatatt ttagctattg ttattggtgt aatgttgcaa + 14341 agcatccaat gtgttgcgta catgcttttg atttctttca 
gtcttagttt agtaatcaat + 14401 actctttact taacaaaaaa agtattaaat atttctgttc aaaaatatat aaaaccgata + 14461 ttaattaatt tgacaattat cagtccctat attatgttta atttgtttat ctcggatttt + 14521 gtaaacgacc ttattttaca tttatcagtt cagtttgtta ttttattttt aatatgggga + 14581 attgggatgt atattagcgg agagtatcga cgagtcttcg cggttataag aaaataaagg + 14641 agcgattttg tgaaaatttt atttgtgaat atgttttata atgaagcagg aggtgcacaa + 14701 aagagtacca aatttctagc tgaacaactt gtaaaagaag gacatgaggt atttgcatac + 14761 tctgatgatg ccattgattc agatattgat gaagttatta atggggttaa ggtttttaga + 14821 agaagaactc cgctttttag tcttcactat atttttagtg ctaagaagaa tccagctaaa + 14881 cattttttct ataaaatatt tgaaatctat aatgtatttg cgaaaagaaa atttatcaat + 14941 atcatggagg aagtacaacc agatattgtt cactttaata caatttcagg aatgtcttta + 15001 tcaatagtta aagaagctaa aaagagaaat atcaggaccg tttggacctt gcgagactat + 15061 tggctagaat atccatgggg tgagaaagat atttctctta tcaaacttct aaatagaata + 15121 tatagacctt ttgttaagaa aagtttaaga cacttagaca tagtaacagc accatcagca + 15181 tttactttga ataattttat caataaagga tttattaacc catcttctca aaaatgtatg + 15241 gtcattgaaa atgctgttat attttcaaag ggtaagttgg aaaatattat caaacaaaag + 15301 caagaaacaa aaagaaatcc agaaaaaacg aattttcttt ttgtaggttc tatacttgaa + 15361 ataaagggcg tttttaactt agtaaaggcc tttaaaaaac taactagtcc ggaaatttct + 15421 ttgaaaattg taggaaaagg aaaagattta gaaaaacttc aaaaagaaat tgagagtgat + 15481 cctagaatac aatatttagg ctttcaagat acagaaaccc tctataaaac ttatcaaaat + 15541 tcggatgtat tggtcgtccc atctgcttgg gatgaaccgt ttggtagagt tgtaattgaa + 15601 ggaaatgcaa atggccttcc tgtcatcact tcagatagag gtggattacc tgaaattgtg + 15661 caaacagtag gaggaggaga agtttttaca gatgaatcgg gaaatacatt atatagtttt + 15721 ttaaagaaat ttgtagaaat ggaaaactac aatgtctatt accaatgcat tcttgagaat + 15781 attgatattt attctatcga aaaacaaagt aaaaagttta ctaatctgta tttagattga + 15841 caaaaaagtt tactaatctg tatttagata aagaaatcga ataataagtt gtttttgtag + 15901 cagtaacgga ggtaattatg aaaatagcgg tagcaggaac aggttatgta ggattatcaa + 15961 ttgctgtgtt gttggcacaa catcacgaaa taaaagcagt 
tgatattgtt gctgaaaaag + 16021 ttgaattaat caatcaaaaa aagtctccaa ttcaggatga ttatattgaa aaatatttag + 16081 tggaaaaaga tttaaatttg gaagcaacta tggatgctaa gtatgcttat gaagatgcag + 16141 aatttgttgt tgttgcagca ccaacaaatt atgattcgaa aaagaacttt tttgatacat + 16201 cagcagtaga ggcggtcatt caacaagtaa aaaaaattaa tcccaaagcg gtaataatta + 16261 ttaaatctac aatccctgtt ggattcacag agtccgttcg aaagaaatat cagtataaaa + 16321 atatcctatt tagtccagaa tttttacgtg aatctaaagc attatacgat aacctgtatc + 16381 caagtcgcat cattgttgga actgacttag aagatactta tttaaaagac aaagctaata + 16441 tatttgcttc cctactaaaa gagggggcta ttaaagaaga catagataca cttttcatgg + 16501 gagtaacgga agctgaggca gttaaattat ttgccaatac ctaccttgcg ttgcgtgttt + 16561 cttactttaa tgaattggat acttatgcag aggtgaaagg tttggataca aaagccatta + 16621 ttgatggtat tggcctagat ccacgtatag gaaatcatta taacaatcca tcctttggct + 16681 acggtgggta ttgtttacct aaagatagta agcagttatt agcaaattac tttgatgtac + 16741 cacaaaatat gatgacggca actgttgaaa gcaatcgaac gcgtaaggat tttatcgctc + 16801 aacggatttt agaaaaagct ggagtatctg agactgatag tttagatgcg tttaagaaca + 16861 tacaagatat tgttataggt atttatcgtt taacaatgaa aagtaattcg gataacttcc + 16921 gtcactcatc tattcaaggc gttatgaaac gattgaaagc taagggagtt acggttatca + 16981 tctatgagcc aactttgaag gacggggaaa cattctttgg taataaagta gtaaataatc + 17041 tagataaatt taaagaagct agtaatgtta ttgtagccaa tcgttttgaa ccttcactag + 17101 aggatgtgtc taataaagtt tatagtcggg atatatttaa gcgtgactaa taaatacgtc + 17161 cacgtgacgt aatatctatt aaatggataa aatattaata aacatggcat ctatatcttt + 17221 tttggacttg aattgttaaa ttaagtgcac atttttttca tagaaaactt cataaggtgt + 17281 tttccggtta agacattttc gtggtctatt atctaagtta gtttatataa tagacttcct + 17341 gcgaaacaaa atatggtata gtagttctat gaattatgaa gcaagtaaac aactaactga + 17401 tgcacgattt aagcgtcttg ttggtgttca gcgtaccatt tttgaagaga tgttagctgt + 17461 attaaaaaca gcttatcaac ttaaacacgc aaaaggtgga cgaaaaccta aattaagcct + 17521 agaagacctt cttatggcca ctcttcaata tgtgcgagaa tatcgaactt atgaacaaat + 17581 tgcggctgat tttggtatcc acgaaagcaa cttaatccgt 
cggagacaat gggttgaagt + 17641 aactcttgtt caaagtggtg ttacgatttc aaaaactcat cttagtgctg agaatacggt + 17701 gattgtggat gcaacagagg taaaaataaa tcgtcctaaa aaaatcaact agccaattat + 17761 tctggtaaaa tagaaatgtc attctatgga acctcaagcg attgtcacaa gtcaagggag + 17821 aattgtttct ttggatatcg ctgtgaacta ttgtcatgat ataaagttgt tcaaaatgag + 17881 tcgcaaaaat atcggacaag ctggtaaaat cttggctgac agtggttatc aagggctcat + 17941 gaagatatat cctcaagcac aaactccacg taaatccagc aaactcaagc cgctaacagc + 18001 tgaagataaa gcctataacc atgcgctatc caaggagaga agcaaggttg agaacatctt + 18061 tgccaaagta aaaacgttta aaatgttttc aacaacctat cgaaatcatc gtaaacgctt + 18121 cggattacga atgaatttga ttgctggtat tatcaatcat gaactaggat tctagttttg + 18181 caggaagtct attaaattaa aataaattat tttagattta taatgtggct ctttgtcaac + 18241 taacatctgg agaggacaat cactgtcttc tccttttttg tctgtaagcg cgtcataaca + 18301 aggtatctat cattcatgga gctcctcctg tatactatta gtaaagtaaa actattggag + 18361 gatattttaa tgccacaacc tattgttcct gtagagattc cacaatctcg tccttttgat + 18421 tctaaaaaga gaaatgatat tctgcttaaa attcgtattg gcaagcttga actaagtttt + 18481 tttcaatctc tcaatctcga aatgatagaa cagcttttgg ataaggtgtt gctctatgac + 18541 aattcatcta tctagcctag ggcaggtcta tctcgtatgt gggaaaacgg atatgaggca + 18601 aggcattgat tcactggctt atctcgttaa aacccacttt gaattggatt ctttctcagg + 18661 tcaagttttt ctcttttgtg gtggacgtaa agaccgcttt aaagcccttt actgggatgg + 18721 tcaaggattt tggctactat ataaacgctt tgagaacggc agactgactt ggcccagtac + 18781 agaaaaggat gtcaaagctc tcacaccaga acaagtagac tggcttatga agggcttttc + 18841 tatcactcca aaaatatagt agattgaaac tagaatagta cacctctact tctaaaacat + 18901 tgttagaaat cgatttgact gtcctgatcg atttgtcctg ttattatttc attttactat + 18961 aaatccatca gaaagttgtg atttctattg aaatgaggac tttcttttta gtataataaa + 19021 ggtagaaaac aaggagggga agcccatgga agaagattga aaatcattca acaacagagt + 19081 gctacaattg atagtctcac caatgaactt gcccttctgc gtgaacaagt agcttatctg + 19141 actcaaaagc tctatggaaa atcctctgag aaaagtgttt gcccatctgg acaactcaac + 19201 ctttttgagg aagagtctcc atctgaggaa gatggagatg 
ttcccagttg aaacagagga + 19261 aattacctac aaacgtaaga aatctaaagg gaaacgccaa gctcttattg cccaatttga + 19321 ttcagaagaa gttcatcatc aagtagaaga gaggatttgc cctgattgtc agggagatct + 19381 aaaagagatt ggagcaaccc ttcaacgaca agaattagtc tttattcctg cgaaattaaa + 19441 acgaatagat catatccaac acgcttataa gtgccaagca agcagataaa tcatccttag + 19501 gagctaaagg tttagcttat tgtgatcagt tattttccct ggaaagagac tgggaggctt + 19561 tgccagctga tgaacgacta cagaaacgtc aagaacatct ccagccctta atggaagact + 19621 tctttgctta gtgccgccgt cagtcagttt tagcaggttc aaaactagga agggcaattg + 19681 aatacagcct caagtataaa gaaaccttta agaccatttt aaaagacgga catctggtcc + 19741 tttccaataa tctagctgaa cgcgccatta aatcattggt tatgggacgg agtaaaagag + 19801 tccagtggac tcttttagcc tgagctcagt ttaaaaaagc gagggtggtt attttctcaa + 19861 agttttgaag gagctaaagc aacagctatt attataagct tgttggaaac agctaaacgt + 19921 cagcaattaa atagcgagaa atatctatcc tatcttctag aatgtcttcc aaacgaggaa + 19981 actctcgtaa acaaagaggt tttagaggcc tatttaccgt ggactaaagt tgtacaagaa + 20041 aagtgcaaat aagaaatctc cagattagga actatccgtg agttctctag tctggagatt + 20101 tttcaatata cttcgttatt ggacggttac gatattcata ttttttgcaa agatgttgtt + 20161 tgaaaaataa ttttcaaaaa ttctgaaaat tctgttgaca tctttctgaa aagagtctat + 20221 aatggagaga aagttttaaa ggagaaaatg atgaaaagtt caaaactatt tgcccttgcg + 20281 ggcgtgacat tattggcggc gactacttta gctgcatgct ctggatcagg ttcaagtact + 20341 aaaggtgaga agacattctc atacatttat gagacagacc ctgataacct caactatttg + 20401 acaactgcta aggctgcgac agcaaatatt accagtaacg tggttgatgg tttgctagaa + 20461 aatgatcgct acgggaactt tgtgccgtct atggctgagg attggtctgt atccaaggat + 20521 ggattgactt acacttatac tatccgtaag gatgcaaaat ggtatacttc tgaaggtgaa + 20581 gaatacgcgg cagtcaaagc tcaagacttt gtaacaggac taaaatatgc tgctgataaa + 20641 aaatcagatg ctctttacct tgttcaagaa tcaatcaaag ggttggatgc ctatgtaaaa + 20701 ggggaaatca aagatttctc acaagtagga attaaggctc tggatgaaca gacagttcag + 20761 tacactttga acaaaccaga aagcttctgg aattctaaga caaccatggg tgtgcttgcg + 20821 ccagttaatg aagagttttt gaattcaaaa ggagatgatt 
ttgccaaagc tacggatcca + 20881 agtagtctct tgtataacgg tccttatttg ttgaaatcca ttgtgaccaa atcctctgtt + 20941 gaatttgcga aaaatccgaa ctactgggat aaggacaatg tgcatgttga caaagttaaa + 21001 ttgtcattct gggatggtca agataccagc aaacctgcag aaaactttaa agatggtagc + 21061 cttacagcag ctcgtctcta tccaacaagt gcaagtttcg cagagcttga gaagagtatg + 21121 aaggacaata ttgtctatac tcaacaagac tctattacgt atctagttgg tacaaatatt + 21181 gaccgtcagt cctataaata cacatctaag accagcgacg aacaaaaggc atcgactaaa + 21241 aaggctctct taaacaagga tttccgtcag gctattgcct ttggatttga ccgtacagcc + 21301 tatgcctctc agttgaatgg acaaactgga gcaagcaaaa tcttacgtaa tatctttgtt + 21361 ccaccaacat ttgttcaagc agatggtaaa aactttggcg atatggtcaa agagaaattg + 21421 gtcacttatg gggatgaatg gaaggatgtt aatcttgcag attctcagga tggtctttac + 21481 aatccagaaa aagccaaggc tgaatttgct aaagctaaat cagccttaca agcagaaggt + 21541 gtgactttcc caattcattt ggatatgcca gttgaccaga cagcaactac aaaagttcag + 21601 cgcgtccaat ctatgaaaca atccttggaa gcaactttag gagcggataa tgtagtcatt + 21661 gatattcaac aactacaaaa agacgaagta aacaatatta catattttgc tgaaaatgct + 21721 gctggcgaag actgggattt atcagataat gtcggttggg gtccagactt tgccgatcca + 21781 tcaacctacc ttgatatcat caaaccatct gtaggagaaa gtactaaaac atatttaggg + 21841 tttgactcag gggaagataa tgtagctgct aaaaaagtag gtctatatga ctacgaaaaa + 21901 ttggttactg aggctggtga tgagactaca gatgttgcta aacgctatga taaatacgct + 21961 gcagcccaag cttggttgac agatagtgct ttgattattc caactacatc tcgtacaggg + 22021 cgtccaatct tgtctaagat gataccattt acaataccat ttgcattgtc aggaaataaa + 22081 ggtacaagtg aaccaatctt atataaatac ttggaacttc aagacaaggc agtcactgta + 22141 gatgaatacc aaaaagctca ggaaaaatgg atgaaagaaa aagaagagtc taataaaaag + 22201 gctcaagaag atctcgcaaa acatgtgaaa taa +// + diff --git a/src/components/CapacityBuilding.js b/src/components/CapacityBuilding.js index ce4d76c..65a9e70 100644 --- a/src/components/CapacityBuilding.js +++ b/src/components/CapacityBuilding.js @@ -1,15 +1,24 @@ +import LocalSequencing from "./LocalSequencing" +import LocalDataAnalysis from 
"./LocalDataAnalysis" +import OneToOneTraining from "./OneToOneTraining" + import { TitleText, Section } from "./Common" import content from '../content/capacityBuildingContent' const CapacityBuilding = () => ( -
-
- +
+
+
+ +
+ {content.sections.map( (props, index) => +
+ )}
- {content.sections.map( (props, index) => -
- )} +
+
+
) diff --git a/src/components/Common.js b/src/components/Common.js index 3f1a29f..bcdddc4 100644 --- a/src/components/Common.js +++ b/src/components/Common.js @@ -137,7 +137,7 @@ const PublicationCard = ({cards}) => ( {card.youtube_id ? : null}
{card.buttons.map((button, index) => ( - ↓ {button.text} + {button.text} ))}
@@ -156,6 +156,27 @@ const Carousel = ({photos}) => (
) +const Timeline = ({items}) => ( + +) + const SectionContent = ({type, content}) => { switch (type) { case 'md': @@ -184,6 +205,8 @@ const SectionContent = ({type, content}) => { return
{content.alt}
case 'html': return
+ case 'timeline': + return default: return } @@ -226,7 +249,7 @@ const ParseTable = ({content}) => { return tableData } -const Table = ({columns, data, pageSizeOverride}) => { +const Table = ({columns, data, pageSizeOverride, heroContent=false}) => { const [columnFilters, setColumnFilters] = useState([]) const defaultColumn = useMemo(() => ({enableColumnFilter: false}), []) @@ -326,18 +349,18 @@ const Table = ({columns, data, pageSizeOverride}) => { ) return ( -
+
{pageSelector} {recordCountSelector}
-
+
{table.getHeaderGroups().map(headerGroup => ( {headerGroup.headers.map(header => ( - {table.getRowModel().rows.map(row => ( - + {row.getVisibleCells().map(cell => ( -
+
{flexRender( header.column.columnDef.header, @@ -353,7 +376,7 @@ const Table = ({columns, data, pageSizeOverride}) => { type="text" value={(header.column.getFilterValue() ?? '')} onChange={event => header.column.setFilterValue(event.target.value)} - placeholder={header.column.columnDef.meta && header.column.columnDef.meta.searchPlaceHolder ? header.column.columnDef.meta.searchPlaceHolder : 'Search...' } + placeholder={header.column.columnDef.meta?.searchPlaceHolder ? header.column.columnDef.meta.searchPlaceHolder : 'Search...' } />
: @@ -366,9 +389,9 @@ const Table = ({columns, data, pageSizeOverride}) => {
+ {flexRender( cell.column.columnDef.cell, cell.getContext() diff --git a/src/components/Content.js b/src/components/Content.js index 87bcd29..1bffacb 100644 --- a/src/components/Content.js +++ b/src/components/Content.js @@ -3,6 +3,8 @@ import { Routes, Route } from "react-router-dom" import Home from "./Home" import About from "./About" import Resources from "./Resources" +import SeroBAnk from "./SeroBAnk" +import GPSC from "./GPSC" import Publications from "./Publications" import CapacityBuilding from "./CapacityBuilding" import Training from "./Training" @@ -15,6 +17,8 @@ const Content = () => ( } /> } /> } /> + } /> + } /> } /> } /> } /> diff --git a/src/components/GPSC.js b/src/components/GPSC.js new file mode 100644 index 0000000..7a2bce2 --- /dev/null +++ b/src/components/GPSC.js @@ -0,0 +1,15 @@ +import Lineages from "./Lineages" +import GPSCSTLookupTable from "./GPSCSTLookupTable" +import PMENClones from "./PMENClones" +import GPSCTopTrumps from "./GPSCTopTrumps" + +const GPSC = () => ( +
+
+
+
+
+
+) + +export default GPSC \ No newline at end of file diff --git a/src/components/GPSCSTLookupTable.js b/src/components/GPSCSTLookupTable.js index 72045d6..9c98ebc 100644 --- a/src/components/GPSCSTLookupTable.js +++ b/src/components/GPSCSTLookupTable.js @@ -39,7 +39,7 @@ const GPSCSTLookupTable = () => { {content.sections.map( (props, index) =>
)} - +
) } diff --git a/src/components/GPSPipeline.js b/src/components/GPSPipeline.js new file mode 100644 index 0000000..0645edc --- /dev/null +++ b/src/components/GPSPipeline.js @@ -0,0 +1,16 @@ +import { TitleText, Section } from "./Common" + +import content from '../content/gpsPipelineContent' + +const GPSPipline = () => ( +
+
+ +
+ {content.sections.map( (props, index) => +
+ )} +
+) + +export default GPSPipline diff --git a/src/components/LocalDataAnalysis.js b/src/components/LocalDataAnalysis.js new file mode 100644 index 0000000..d8584b7 --- /dev/null +++ b/src/components/LocalDataAnalysis.js @@ -0,0 +1,16 @@ +import { TitleText, Section } from "./Common" + +import content from '../content/localDataAnalysisContent' + +const LocalDataAnalysis = () => ( +
+
+ +
+ {content.sections.map( (props, index) => +
+ )} +
+) + +export default LocalDataAnalysis diff --git a/src/components/LocalSequencing.js b/src/components/LocalSequencing.js new file mode 100644 index 0000000..471109b --- /dev/null +++ b/src/components/LocalSequencing.js @@ -0,0 +1,16 @@ +import { TitleText, Section } from "./Common" + +import content from '../content/localSequencingContent' + +const LocalSequencing = () => ( +
+
+ +
+ {content.sections.map( (props, index) => +
+ )} +
+) + +export default LocalSequencing diff --git a/src/components/Navbar.js b/src/components/Navbar.js index 59a2933..40bc1f7 100644 --- a/src/components/Navbar.js +++ b/src/components/Navbar.js @@ -112,7 +112,7 @@ const Navbar = () => ( -
    +
    diff --git a/src/components/OneToOneTraining.js b/src/components/OneToOneTraining.js new file mode 100644 index 0000000..0814848 --- /dev/null +++ b/src/components/OneToOneTraining.js @@ -0,0 +1,16 @@ +import { TitleText, Section } from "./Common" + +import content from '../content/oneToOneTrainingContent' + +const OneToOneTraining = () => ( +
    +
    + +
    + {content.sections.map( (props, index) => +
    + )} +
    +) + +export default OneToOneTraining diff --git a/src/components/PMENClones.js b/src/components/PMENClones.js index d3bee68..a4b2356 100644 --- a/src/components/PMENClones.js +++ b/src/components/PMENClones.js @@ -22,6 +22,9 @@ const PMENClones = () => { header: "Clone", accessorKey: "clone", enableColumnFilter: true, + meta: { + className: "sticky left-0 glass z-10" + }, cell: props => { const value = props.getValue() diff --git a/src/components/Resources.js b/src/components/Resources.js index 7339482..ec6e985 100644 --- a/src/components/Resources.js +++ b/src/components/Resources.js @@ -1,22 +1,15 @@ import Overview from "./Overview" import Countries from "./Countries" -import Lineages from "./Lineages" -import GPSCSTLookupTable from "./GPSCSTLookupTable" -import Serortypes from "./Serotypes" -import PMENClones from "./PMENClones" +import GPSPipline from "./GPSPipeline" import IsolateBankRequest from "./IsolateBankRequest" -import GPSCTopTrumps from "./GPSCTopTrumps" + const Resources = () => (
    -
    -
    -
    -
    +
    -
    ) diff --git a/src/components/SeroBAnk.js b/src/components/SeroBAnk.js new file mode 100644 index 0000000..d5c0cea --- /dev/null +++ b/src/components/SeroBAnk.js @@ -0,0 +1,13 @@ +import Serotypes from "./Serotypes" +import VaccineInformation from "./VaccineInformation" +import VaccineHistory from "./VaccineHistory" + +const SeroBAnk = () => ( +
    +
    +
    +
    +
    +) + +export default SeroBAnk \ No newline at end of file diff --git a/src/components/Serotypes.js b/src/components/Serotypes.js index e8ae2ed..10a39d3 100644 --- a/src/components/Serotypes.js +++ b/src/components/Serotypes.js @@ -19,6 +19,9 @@ const Serortype = () => { header: "Serotype", accessorKey: "serotype", enableColumnFilter: true, + meta: { + className: "sticky left-0 glass z-10" + }, cell: props => { const cellValue = props.getValue() const commentvalue = props.row.original.comments @@ -89,41 +92,143 @@ const Serortype = () => { } } }, + { + header: , + accessorKey: "otherSerum", + meta: { + className: "!align-middle" + }, + cell: props => { + const otherSerumValue = props.getValue() + const otherSerumValueRemark = props.row.original.otherSerumRemark + const poolSerumValue = props.row.original.poolSerum + const typeSerumValue = props.row.original.typeSerum + const groupSerumValue = props.row.original.groupSerum + const factorSerumValue = props.row.original.factorSerum + const antiserumNote = props.row.original.antiserumNote + + if (otherSerumValue === '-' && poolSerumValue === '-' && typeSerumValue === '-' && groupSerumValue === '-' && factorSerumValue === '-' ){ + return
    No Serological Profile
    + } + + return ( +
    + { + antiserumNote === '-' ? null : + } + { + poolSerumValue === '-' ? null : poolSerumValue.split(",").map((val) =>
    {val}
    ) + } + { + typeSerumValue === '-' ? null : typeSerumValue.split(",").map((val) =>
    {val}
    ) + } + { + groupSerumValue === '-' ? null : groupSerumValue.split(",").map((val) =>
    {val}
    ) + } + { + factorSerumValue === '-' ? null : factorSerumValue.split(",").map((val) =>
    {val}
    ) + } + { + otherSerumValue === '-' + ? + null + : + otherSerumValue.indexOf(",") === -1 + ? + + : + otherSerumValue.split(',').map((element, index) => + + ) + } +
    + ) + } + }, { header: , accessorKey: "cpsImage", + meta: { + className: "!align-middle" + }, cell: props => { const cellValue = props.getValue() const serotypeValue = props.row.original.serotype const remarkValue = props.row.original.cpsRemark if (cellValue === '-'){ - return
    -
    - } else if (remarkValue === '-') { + return
    {remarkValue === '-' ? "No Sequence Available" : remarkValue}
    + } else { return ( -
    +
    {`Chart + {remarkValue === "-" ? null :
    {remarkValue}
    }
    ) + } + } + }, + { + header: , + accessorKey: "capsularStructureImage", + meta: { + className: "!align-middle" + }, + cell: props => { + const cellValue = props.getValue() + const serotypeValue = props.row.original.serotype + const remarkValue = props.row.original.capsularStructureRemark + + if (cellValue === '-'){ + return
    {remarkValue === '-' ? "No Structure Available" : remarkValue}
    } else { return ( -
    +
    {`Chart -
    {remarkValue}
    + {remarkValue === "-" ? null :
    {remarkValue}
    }
    ) } } }, - + { + header: "Annotation (.gb)", + accessorKey: "genBankFile", + meta: { + className: "!align-middle" + }, + cell: props => { + const cellValue = props.getValue() + if (cellValue === '-'){ + return
    -
    + } else { + return ( +
    + + + +
    + + ) + } + } + }, ], []) return ( diff --git a/src/components/VaccineHistory.js b/src/components/VaccineHistory.js new file mode 100644 index 0000000..c07c114 --- /dev/null +++ b/src/components/VaccineHistory.js @@ -0,0 +1,16 @@ +import { TitleText, Section } from "./Common" + +import content from '../content/vaccineHistoryContent' + +const VaccineHistory = () => ( +
    +
    + +
    + {content.sections.map( (props, index) => +
    + )} +
    +) + +export default VaccineHistory diff --git a/src/components/VaccineInformation.js b/src/components/VaccineInformation.js new file mode 100644 index 0000000..4f012c1 --- /dev/null +++ b/src/components/VaccineInformation.js @@ -0,0 +1,16 @@ +import { TitleText, Section } from "./Common" + +import content from '../content/vaccineInformationContent' + +const VaccineInformation = () => ( +
    +
    + +
    + {content.sections.map( (props, index) => +
    + )} +
    +) + +export default VaccineInformation diff --git a/src/content/capacityBuildingContent.js b/src/content/capacityBuildingContent.js index 3c5797e..90f00d8 100644 --- a/src/content/capacityBuildingContent.js +++ b/src/content/capacityBuildingContent.js @@ -9,153 +9,6 @@ const content = { }, ] }, - { - subtitle: { - content: 'Sustainable Local Sequencing' - }, - content: [ - { - type: 'md', - content: 'At the beginning of GPS2, the GPS team engaged with key partners to discuss the feasibility of local data generation and resources required, identifying 8 institutes in 6 LMIC countries with which the GPS project is now working to establish decentralised data generation and analysis:' - }, - { - type: 'md', - content: '- Bangladesh ([CHRF](https://chrfbd.org/))' - }, - { - type: 'md', - content: '- India ([CMC](https://www.cmch-vellore.edu/) and [KIMS](https://www.kimsbangalore.edu.in/))' - }, - { - type: 'md', - content: '- Malawi ([MLW](https://www.mlw.mw/))' - }, - { - type: 'md', - content: '- Pakistan ([AKU](https://www.aku.edu/) and [LUMS](https://lums.edu.pk/))' - }, - { - type: 'md', - content: '- South Africa ([NICD](https://www.nicd.ac.za/))' - }, - { - type: 'md', - content: '- The Gambia ([LSHTM MRC Unit The Gambia](https://www.mrc.gm/))' - }, - ] - }, - { - subtitle: { - content: 'Enhancing Local Capacity for Data Analysis' - }, - content: [ - { - type: 'md', - content: 'A key aim of GPS2 is to support the development of skills of local researchers who become confident to independently analyse genomic data. Supporting the development of bioinformatics expertise is achieved through a multi-faceted approach, through a combination of online training, in person workshops and ongoing mentoring.' 
- }, - { - type: 'carousel', - content: [ - { - url: 'img/advanced_bioinformatics_workshop_colombia.jpg', - alt: 'Advanced Bioinformatics Workshop in Colombia' - }, - { - url: 'img/advanced_bioinformatics_workshop_gambia.jpg', - alt: 'Advanced Bioinformatics Workshop in the Gambia' - }, - { - url: 'img/advanced_bioinformatics_workshop_india.jpg', - alt: 'Advanced Bioinformatics Workshop in India' - }, - { - url: 'img/advanced_bioinformatics_workshop_turkey.jpg', - alt: 'Advanced Bioinformatics Workshop in Turkey' - }, - ] - }, - { - type: 'md', - content: '###### Participants and trainers in Advanced Bioinformatics Training Workshops in different locations' - }, - { - type: 'md', - content: 'In 2019, collaborators from six LMIC countries joined the GPS team at the Wellcome Sanger institute for an intensive week focused on analysis and drafting of country analysis papers for publication, [many of which have since been published](https://www.microbiologyresearch.org/content/global-pneumococcal-sequencing-collection/). After a hiatus owing to the COVID-19 pandemic, in person bioinformatics workshop have since been resumed in 2023.' - }, - { - type: 'md', - content: 'In addition, free [online training](https://training.bactgen.sanger.ac.uk/) resources have been developed by the GPS and JUNO training lead Jolynne Mokaya and we are working with colleagues from Wellcome Connecting Science (WCS) to develop and deploy face-to-face and virtual 5 day bioinformatics courses to supplement the existing online courses. [Other free courses](https://www.futurelearn.com/partners/wellcome-genome-campus) from WCS, in partnership with FutureLearn are currently available online for anyone to take in their own time. Some of these courses offer [continuing professional development](https://cpduk.co.uk/explained) (CPD) credits.' - }, - { - type: 'md', - content: "Below is some feedback from two of our partners who attended the writers workshop. 
You can also find out more about [Samanta Almeida's](https://www.microbiologyresearch.org/content/journal/mgen/10.1099/mgen.0.000635) and [Paula Gagetti's](https://www.microbiologyresearch.org/content/journal/mgen/10.1099/mgen.0.000636) in-depth country level *S. pneumoniae* genomic analysis work through their publications in Microbial Genomics." - }, - { - type: 'quoteCard', - content: { - photo: 'img/samanta_almeida.jpg', - name: 'Samanta Almeida, Center of Bacteriology, Adolfo Lutz Institute, São Paulo, Brazil', - quotes: ["The participation in the GPS project was an experience analysing WGS data and meeting the challenge of handling a large volume of data. The GPS team made a great effort to help me with the analysis and to address difficulties. In my opinion, it is a project that goes far beyond data generation, as there is a real effort to build capacity by sharing knowledge and providing bioinformatics training. During my participation, I received many incentives to develop studies and opportunities to present these results. I presented abstracts in the most important pneumococcus international events, the International Symposium on Pneumococcal and Pneumococcal Diseases (ISPPD), Australia (2018), and Toronto (2020) editions."] - } - }, - { - type: 'quoteCard', - content: { - photo: 'img/paula_gagetti.jpg', - name: 'Paula Gagetti (National Reference Laboratory on AMR of the National Institute of Infectious Diseases, Buenos Aires, Argentina)', - quotes: ["The most exciting thing was that prestigious professionals in the pneumococcal area dedicated a week of their time to sit down with us, discuss our results and draw conclusions about the impact of vaccines in different regions of the world. That was really amazing. Added to the human warmth of each of them that also allowed us to share beautiful moments drinking a beer in the pubs of Hinxton and Cambridge.", "From there, a very important link was generated. 
I worked a lot with Steph, whom I thank for the recognition and respect for our work and for answering all my questions immediately. Working with such a prestigious group of experts with the highest level of responsibility gives us the confidence to do other works in the future."] - } - }, - ] - }, - { - subtitle: { - content: 'One-to-One Training' - }, - content: [ - { - type: 'md', - content: "Nida Javaid is a PhD student from a partner group in the Department of Biology, Lahore University of Management Sciences, Pakistan. Nida obtained an 8 months research fellowship funded by Higher Education Commission in Pakistan and joined the Bentley group the Wellcome Sanger Institute for hands-on training in genomic analyses of *S. pneumoniae*. Unfortunately, Nida's arrival coincided with the UK national lockdown and the switch to working from home. Despite these challenges, Nida quickly integrated with the team, and learnt how to apply key tools used for characterising the genomic epidemiology of pneumococci to datasets from South Africa and Pakistan. Dr. Stephanie Lo is Nida's main mentor and together they made a great mentor-mentee team. As the lockdown restrictions started easing, Nida started having weekly in-person meetings with Stephanie, and joined occasional get-togethers with other team members." - }, - { - type: 'imageHalfWidth', - content: { - url: 'img/steph_and_nida.jpg', - alt: 'Nida Javaid and Stephanie Lo at the Wellcome Genome Campus' - } - }, - { - type: 'md', - content: '###### Nida Javaid and Stephanie Lo at the Wellcome Genome Campus' - }, - { - type: 'md', - content: "Find out more about Nida's work with the Bentley team:" - }, - { - type: 'quoteCard', - content: { - name: 'Nida Javid (Department of Biology, Lahore University of Management Sciences, Pakistan)', - quotes: ["The original plan was that I will be working on the population genomics analysis of pneumococcal isolates from Pakistan. 
However, due to the lockdown, sequencing of isolates from Pakistan was delayed and I started working on the country analysis of pneumococcal carriage isolates from South Africa. I started with running quality control analysis of the sequenced data, followed by *in silico* serotyping, genotyping, prediction of antimicrobial resistance and phylogenetic analysis from pneumococcal genomes using a wide range of command-line tools such as SeroBA and PopPUNK. I then visualized the output using Microreact, a tool that allows me to interactively explore the phylogeny with temporal and geographical data. Now almost a year and a half later, this manuscript is ready for submission. I would like to thank Dr. Shabbir Madhi for allowing me to work on his dataset.", "After a few months, pneumococcal isolates from Pakistan were sequenced. I then analysed these data using the approach and tools that I had learnt during my first few months at Sanger, and am working towards publication of my Pakistan country analysis. We also presented our preliminary results at the ABPHM online conference. Although I am back in Pakistan now, I am still actively working with Stephanie and attend the team meetings regularly. I would like to thank Stephen, Stephanie, and the team for their support and kindness. I would also like to thank my PhD advisor, Dr. Shaper Mirza, for her support and guidance through my PhD."] - } - }, - ] - }, - { - subtitle: { - content: 'GPS Pipeline: A Portable Pipeline to Reduce the Bioinformatics Burden' - }, - content: [ - { - type: 'md', - content: "Ensuring quality control of sequence data and generating succinct, reliable data characterising genomes can be time consuming and require substantial bioinformatic training. During GPS2, a portable pipeline named GPS Pipeline is being developed which will enable collaborators to easily input whole genome sequencing data and generate the *in silico* typing data required for downstream analysis. 
Although the pipeline is still under active development, its latest version is available on GitHub for testing: [https://github.com/sanger-bentley-group/gps-pipeline/](https://github.com/sanger-bentley-group/gps-pipeline/)" - }, - { - type: 'md', - content: '![GPS Pipeline Flowchart](img/gps_pipeline_flowchart.drawio.png)' - }, - ] - }, ] } diff --git a/src/content/commandLineContent.js b/src/content/commandLineContent.js index 12486a6..3624e05 100644 --- a/src/content/commandLineContent.js +++ b/src/content/commandLineContent.js @@ -184,7 +184,7 @@ const content = { }, { type: 'md', - content: '- GPSC235;9 is an exception. This lineage is a mixture of GPSC9 and GPSC235, but do not indicate the merging of GPSC9 and GPSC235 lineages.', + content: '- GPSC235;9 is an exception. This lineage is a mixture of GPSC9 and GPSC235, but do not indicate the merging of GPSC9 and GPSC235 lineages based on current evidence.', }, ] } diff --git a/src/content/gpsPipelineContent.js b/src/content/gpsPipelineContent.js new file mode 100644 index 0000000..641707c --- /dev/null +++ b/src/content/gpsPipelineContent.js @@ -0,0 +1,22 @@ +const content = { + title: "GPS Pipeline", + sections: [ + { + subtitle: { + content: 'A Portable Pipeline to Reduce the Bioinformatics Burden' + }, + content: [ + { + type: 'md', + content: "Ensuring quality control of sequence data and generating succinct, reliable data characterising genomes can be time consuming and require substantial bioinformatic training. During GPS2, a portable pipeline named GPS Pipeline is being developed which will enable collaborators to easily input whole genome sequencing data and generate the *in silico* typing data required for downstream analysis. 
The pipeline is still under active development, its latest version is available on GitHub: [https://github.com/GlobalPneumoSeq/gps-pipeline](https://github.com/GlobalPneumoSeq/gps-pipeline)" + }, + { + type: 'md', + content: '![GPS Pipeline Flowchart](img/gps_pipeline_flowchart.drawio.png)' + }, + ] + }, + ] +} + +export default content diff --git a/src/content/localDataAnalysisContent.js b/src/content/localDataAnalysisContent.js new file mode 100644 index 0000000..75c1bd1 --- /dev/null +++ b/src/content/localDataAnalysisContent.js @@ -0,0 +1,68 @@ +const content = { + title: 'Enhancing Local Capacity for Data Analysis', + sections: [ + { + content: [ + { + type: 'md', + content: 'A key aim of GPS2 is to support the development of skills of local researchers who become confident to independently analyse genomic data. Supporting the development of bioinformatics expertise is achieved through a multi-faceted approach, through a combination of online training, in person workshops and ongoing mentoring.' 
+ }, + { + type: 'carousel', + content: [ + { + url: 'img/advanced_bioinformatics_workshop_colombia.jpg', + alt: 'Advanced Bioinformatics Workshop in Colombia' + }, + { + url: 'img/advanced_bioinformatics_workshop_gambia.jpg', + alt: 'Advanced Bioinformatics Workshop in the Gambia' + }, + { + url: 'img/advanced_bioinformatics_workshop_india.jpg', + alt: 'Advanced Bioinformatics Workshop in India' + }, + { + url: 'img/advanced_bioinformatics_workshop_turkey.jpg', + alt: 'Advanced Bioinformatics Workshop in Turkey' + }, + ] + }, + { + type: 'md', + content: '###### Participants and trainers in Advanced Bioinformatics Training Workshops in different locations' + }, + { + type: 'md', + content: 'In 2019, collaborators from six LMIC countries joined the GPS team at the Wellcome Sanger institute for an intensive week focused on analysis and drafting of country analysis papers for publication, [many of which have since been published](https://www.microbiologyresearch.org/content/global-pneumococcal-sequencing-collection/). After a hiatus owing to the COVID-19 pandemic, in person bioinformatics workshop have since been resumed in 2023.' + }, + { + type: 'md', + content: 'In addition, free [online training](https://training.bactgen.sanger.ac.uk/) resources have been developed by the GPS and JUNO training lead Jolynne Mokaya and we are working with colleagues from Wellcome Connecting Science (WCS) to develop and deploy face-to-face and virtual 5 day bioinformatics courses to supplement the existing online courses. [Other free courses](https://www.futurelearn.com/partners/wellcome-genome-campus) from WCS, in partnership with FutureLearn are currently available online for anyone to take in their own time. Some of these courses offer [continuing professional development](https://cpduk.co.uk/explained) (CPD) credits.' + }, + { + type: 'md', + content: "Below is some feedback from two of our partners who attended the writers workshop. 
You can also find out more about [Samanta Almeida's](https://doi.org/10.1099/mgen.0.000635) and [Paula Gagetti's](https://doi.org/10.1099/mgen.0.000636) in-depth country level *S. pneumoniae* genomic analysis work through their publications in Microbial Genomics." + }, + { + type: 'quoteCard', + content: { + photo: 'img/samanta_almeida.jpg', + name: 'Samanta Almeida, Center of Bacteriology, Adolfo Lutz Institute, São Paulo, Brazil', + quotes: ["The participation in the GPS project was an experience analysing WGS data and meeting the challenge of handling a large volume of data. The GPS team made a great effort to help me with the analysis and to address difficulties. In my opinion, it is a project that goes far beyond data generation, as there is a real effort to build capacity by sharing knowledge and providing bioinformatics training. During my participation, I received many incentives to develop studies and opportunities to present these results. I presented abstracts in the most important pneumococcus international events, the International Symposium on Pneumococcal and Pneumococcal Diseases (ISPPD), Australia (2018), and Toronto (2020) editions."] + } + }, + { + type: 'quoteCard', + content: { + photo: 'img/paula_gagetti.jpg', + name: 'Paula Gagetti (National Reference Laboratory on AMR of the National Institute of Infectious Diseases, Buenos Aires, Argentina)', + quotes: ["The most exciting thing was that prestigious professionals in the pneumococcal area dedicated a week of their time to sit down with us, discuss our results and draw conclusions about the impact of vaccines in different regions of the world. That was really amazing. Added to the human warmth of each of them that also allowed us to share beautiful moments drinking a beer in the pubs of Hinxton and Cambridge.", "From there, a very important link was generated. I worked a lot with Steph, whom I thank for the recognition and respect for our work and for answering all my questions immediately. 
Working with such a prestigious group of experts with the highest level of responsibility gives us the confidence to do other works in the future."] + } + }, + ] + } + ] +} + +export default content diff --git a/src/content/localSequencingContent.js b/src/content/localSequencingContent.js new file mode 100644 index 0000000..c237502 --- /dev/null +++ b/src/content/localSequencingContent.js @@ -0,0 +1,39 @@ +const content = { + title: 'Sustainable Local Sequencing', + sections: [ + { + content: [ + { + type: 'md', + content: 'At the beginning of GPS2, the GPS team engaged with key partners to discuss the feasibility of local data generation and resources required, identifying 8 institutes in 6 LMIC countries with which the GPS project is now working to establish decentralised data generation and analysis:' + }, + { + type: 'md', + content: '- Bangladesh ([CHRF](https://chrfbd.org/))' + }, + { + type: 'md', + content: '- India ([CMC](https://www.cmch-vellore.edu/) and [KIMS](https://www.kimsbangalore.edu.in/))' + }, + { + type: 'md', + content: '- Malawi ([MLW](https://www.mlw.mw/))' + }, + { + type: 'md', + content: '- Pakistan ([AKU](https://www.aku.edu/) and [LUMS](https://lums.edu.pk/))' + }, + { + type: 'md', + content: '- South Africa ([NICD](https://www.nicd.ac.za/))' + }, + { + type: 'md', + content: '- The Gambia ([LSHTM MRC Unit The Gambia](https://www.mrc.gm/))' + }, + ] + } + ] +} + +export default content diff --git a/src/content/navbarContent.js b/src/content/navbarContent.js index 8b8c621..a3d3374 100644 --- a/src/content/navbarContent.js +++ b/src/content/navbarContent.js @@ -34,28 +34,57 @@ const content = [ url: '/resources#countries', }, { - title: 'Lineages', - url: '/resources#lineages', + title: 'GPS Pipeline', + url: '/resources#gps-pipeline', }, { - title: 'GPSC-ST Lookup Table', - url: '/resources#gpsc-st-lookup-table', + title: 'Isolate Bank Request', + url: '/resources#isolate-bank-request', }, + { + title: 'GPS Visualiser', + url: 
'./gps-visualiser/', + external: true + }, + ] + }, + { + title: 'SeroBAnk', + url: '/serobank', + submenu: [ { title: 'Serotypes', - url: '/resources#serotypes', + url: '/serobank#serotypes', }, { - title: 'PMEN Clones', - url: '/resources#pmen-clones', + title: 'Vaccine Information', + url: '/serobank#vaccine-information', }, { - title: 'Isolate Bank Request', - url: '/resources#isolate-bank-request', + title: 'Vaccine History', + url: '/serobank#vaccine-history', + } + ] + }, + { + title: 'GPSC', + url: '/gpsc', + submenu: [ + { + title: 'Lineages', + url: '/gpsc#lineages', + }, + { + title: 'GPSC-ST Lookup Table', + url: '/gpsc#gpsc-st-lookup-table', + }, + { + title: 'PMEN Clones', + url: '/gpsc#pmen-clones', }, { title: 'GPSC Top Trumps', - url: '/resources#gpsc-top-trumps', + url: '/gpsc#gpsc-top-trumps', }, ] }, @@ -65,7 +94,21 @@ const content = [ }, { title: 'Capacity Building', - url: '/capacity-building' + url: '/capacity-building', + submenu: [ + { + title: 'Local Sequencing', + url: '/capacity-building#local-sequencing', + }, + { + title: 'Local Data Analysis', + url: '/capacity-building#local-data-analysis', + }, + { + title: 'One-to-One Training', + url: '/capacity-building#one-to-one-training', + }, + ] }, { title: 'Training', @@ -94,11 +137,6 @@ const content = [ url: './gps-database-overview/', external: true }, - { - title: 'GPS Visualiser', - url: './gps-visualiser/', - external: true - }, ] export default content \ No newline at end of file diff --git a/src/content/oneToOneTrainingContent.js b/src/content/oneToOneTrainingContent.js new file mode 100644 index 0000000..19acaea --- /dev/null +++ b/src/content/oneToOneTrainingContent.js @@ -0,0 +1,37 @@ +const content = { + title: 'One-to-One Training', + sections: [ + { + content: [ + { + type: 'md', + content: "Nida Javaid is a PhD student from a partner group in the Department of Biology, Lahore University of Management Sciences, Pakistan. 
Nida obtained an 8-month research fellowship funded by the Higher Education Commission in Pakistan and joined the Bentley group at the Wellcome Sanger Institute for hands-on training in genomic analyses of *S. pneumoniae*. Unfortunately, Nida's arrival coincided with the UK national lockdown and the switch to working from home. Despite these challenges, Nida quickly integrated with the team, and learnt how to apply key tools used for characterising the genomic epidemiology of pneumococci to datasets from South Africa and Pakistan. Dr. Stephanie Lo is Nida's main mentor and together they made a great mentor-mentee team. As the lockdown restrictions started easing, Nida started having weekly in-person meetings with Stephanie, and joined occasional get-togethers with other team members." + }, + { + type: 'imageHalfWidth', + content: { + url: 'img/steph_and_nida.jpg', + alt: 'Nida Javaid and Stephanie Lo at the Wellcome Genome Campus' + } + }, + { + type: 'md', + content: '###### Nida Javaid and Stephanie Lo at the Wellcome Genome Campus' + }, + { + type: 'md', + content: "Find out more about Nida's work with the Bentley team:" + }, + { + type: 'quoteCard', + content: { + name: 'Nida Javaid (Department of Biology, Lahore University of Management Sciences, Pakistan)', + quotes: ["The original plan was that I will be working on the population genomics analysis of pneumococcal isolates from Pakistan. However, due to the lockdown, sequencing of isolates from Pakistan was delayed and I started working on the country analysis of pneumococcal carriage isolates from South Africa. I started with running quality control analysis of the sequenced data, followed by *in silico* serotyping, genotyping, prediction of antimicrobial resistance and phylogenetic analysis from pneumococcal genomes using a wide range of command-line tools such as SeroBA and PopPUNK. 
I then visualized the output using Microreact, a tool that allows me to interactively explore the phylogeny with temporal and geographical data. Now almost a year and a half later, this manuscript is ready for submission. I would like to thank Dr. Shabbir Madhi for allowing me to work on his dataset.", "After a few months, pneumococcal isolates from Pakistan were sequenced. I then analysed these data using the approach and tools that I had learnt during my first few months at Sanger, and am working towards publication of my Pakistan country analysis. We also presented our preliminary results at the ABPHM online conference. Although I am back in Pakistan now, I am still actively working with Stephanie and attend the team meetings regularly. I would like to thank Stephen, Stephanie, and the team for their support and kindness. I would also like to thank my PhD advisor, Dr. Shaper Mirza, for her support and guidance through my PhD."] + } + }, + ] + } + ] +} + +export default content diff --git a/src/content/outlineContent.js b/src/content/outlineContent.js index 5525c13..9da6eb9 100644 --- a/src/content/outlineContent.js +++ b/src/content/outlineContent.js @@ -23,7 +23,7 @@ const content = { }, { type: 'md', - content: 'Pneumococcal conjugate vaccines (PCVs) target the protective capsule surrounding pneumococcal cells and have proven to be very effective in reducing pneumococcal disease since their first introduction in 2000. However, there are at least [100 different forms of capsule](../resources#serotypes), each giving rise to a distinct "serotype" determined based on interactions between antibodies and antigens on the capsule. Current PCVs only target some serotypes, and the overall pneumococcus population can evolve through a process known as "serotype switching" to evade the vaccines. This creates an arms race between the vaccines and the pneumococcus.' 
+ content: 'Pneumococcal conjugate vaccines (PCVs) target the protective capsule surrounding pneumococcal cells and have proven to be very effective in reducing pneumococcal disease since their first introduction in 2000. However, there are at least [100 different forms of capsule](../serobank), each giving rise to a distinct "serotype" determined based on interactions between antibodies and antigens on the capsule. Current PCVs only target some serotypes, and the overall pneumococcus population can evolve through a process known as "serotype switching" to evade the vaccines. This creates an arms race between the vaccines and the pneumococcus.' }, { type: 'md', @@ -62,7 +62,7 @@ const content = { }, { type: 'md', - content: 'GPS sequence data confirmed that after the introduction of vaccines, pneumococci with vaccine serotypes were replaced by those with non-vaccine serotypes. Importantly, with such large-scale genome data, we were able to classify all the strains circulating globally, for the first time. Pneumococcal strains could be defined at high-resolution by taking genome-wide DNA variations into account ([Gladstone and Lo *et al* 2019](https://doi.org/10.1016/j.ebiom.2019.04.021)). This robust typing method is coupled with a coherent and dynamic naming system known as [global pneumococcal sequence clusters (GPSCs)](../resources#lineages), which enable collaborations in the tracking of pneumococcal lineages across geographical regions and over time, especially before and after the roll-out of PCVs.' + content: 'GPS sequence data confirmed that after the introduction of vaccines, pneumococci with vaccine serotypes were replaced by those with non-vaccine serotypes. Importantly, with such large-scale genome data, we were able to classify all the strains circulating globally, for the first time. 
Pneumococcal strains could be defined at high-resolution by taking genome-wide DNA variations into account ([Gladstone and Lo *et al* 2019](https://doi.org/10.1016/j.ebiom.2019.04.021)). This robust typing method is coupled with a coherent and dynamic naming system known as [global pneumococcal sequence clusters (GPSCs)](../gpsc#lineages), which enable collaborations in the tracking of pneumococcal lineages across geographical regions and over time, especially before and after the roll-out of PCVs.' }, { type: 'md', @@ -81,7 +81,7 @@ const content = { content: [ { type: 'md', - content: 'The GPS project generates a rich source of genome and epidemiological data for tracking pneumococcal transmission and evolution on both national and international levels. The genome data are deposited in [ENA](https://www.ebi.ac.uk/ena/data/view/PRJEB3084). High-level analyses are interactively presented by [countries](../resources#countries) and by [strains](../resources#lineages) using [Microreact](https://microreact.org/) and [Phandango](https://jameshadfield.github.io/phandango/#/GPS). Illustrations of how to use these resources are summarised in a publication ([Gladstone *et al* 2020](https://doi.org/10.1099/mgen.0.000357)) and videos on the [Resources pages](../resources#overview). ' + content: 'The GPS project generates a rich source of genome and epidemiological data for tracking pneumococcal transmission and evolution on both national and international levels. The genome data are deposited in [ENA](https://www.ebi.ac.uk/ena/data/view/PRJEB3084). High-level analyses are interactively presented by [countries](../resources#countries) and by [strains](../gpsc#lineages) using [Microreact](https://microreact.org/) and [Phandango](https://jameshadfield.github.io/phandango/#/GPS). Illustrations of how to use these resources are summarised in a publication ([Gladstone *et al* 2020](https://doi.org/10.1099/mgen.0.000357)) and videos on the [Resources pages](../resources#overview). 
' }, ] }, diff --git a/src/content/serotypeTableContent.tsv b/src/content/serotypeTableContent.tsv index bb3ec75..19805e4 100644 --- a/src/content/serotypeTableContent.tsv +++ b/src/content/serotypeTableContent.tsv @@ -1,119 +1,123 @@ -count serotype accessionNumber comments reference referenceUrl cpsImage cpsRemark -1 1 CR931632 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_1_cps.svg - -2 2 CR931633 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_2_cps.svg - -3 3 CR931634 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_3_cps.svg - -4 4 CR931635 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_4_cps.svg - -5 5 CR931637 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_5_cps.svg - -6 6A CR931638 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_6A_cps.svg - -- 6E(6A) - Genetic variant of 6A Park et al 2017 Genome Announc https://doi.org/10.1128/genomeA.01728-16 - - -7 6B CR931639 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_6B_cps.svg - -- 6E(6B) KU168827 Genetic variant of 6B Burton et al 2016 J Clin Microbiol https://doi.org/10.1128/JCM.03194-15 - - -8 6C "EF538714,EF538715,EF538716,EF538717,EF538718" - "Park et al 2007 J Clin Microbiol,Park et al 2007 Infect Immun" "https://doi.org/10.1128/JCM.02199-06,https://doi.org/10.1128/iai.00510-07" img/serotype_cps/serotype_6C_cps.svg - -9 6D HM448897 - Nahm et al 2011 J Med Microbiol https://doi.org/10.1099%2Fjmm.0.023853-0 img/serotype_cps/serotype_6D_cps.svg - -10 6H KF597302 - Park et al 2015 Clin Vaccine Immunol https://doi.org/10.1128/CVI.00647-14 img/serotype_cps/serotype_6H_cps.svg Partial sequence only -11 7A CR931640 - Bentley et al 
2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_7A_cps.svg - -12 7B CR931641 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_7B_cps.svg - -13 7C CR931642 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_7C_cps.svg - -14 7D - - Kjeldsen et al 2018 Carbohydr Res https://doi.org/10.1016/j.carres.2018.04.011 - - -15 7F CR931643 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_7F_cps.svg - -16 8 CR931644 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_8_cps.svg - -17 9A CR931645 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_9A_cps.svg - -18 9L CR931646 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_9L_cps.svg - -19 9N CR931647 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_9N_cps.svg - -20 9V CR931648 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_9V_cps.svg - -21 10A CR931649 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_10A_cps.svg - -22 10B CR931650 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_10B_cps.svg - -23 10C CR931651 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_10C_cps.svg - -24 10D ERR051587 - Ganaie et al 2020 mBio https://doi.org/10.1128/mBio.00937-20 img/serotype_cps/serotype_10D_cps.svg - -25 10F CR931652 - "Bentley et al 2006 PloS Genet,Yang et al 2011 J Biol Chem" "https://doi.org/10.1371/journal.pgen.0020031,https://doi.org/10.1074/jbc.M111.255422" img/serotype_cps/serotype_10F_cps.svg - -26 11A CR931653 - 
Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_11A_cps.svg - -27 11B CR931654 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_11B_cps.svg - -28 11C CR931655 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_11C_cps.svg - -29 11D CR931656 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_11D_cps.svg - -30 11E - - Calix et al 2010 J Infect Dis https://doi.org/10.1086/653123 img/serotype_cps/serotype_11E_cps.svg - -- 11Av - A serovariant which is an intermediate variant of 11A and 11E Camilli et al 2014 PloS ONE https://doi.org/10.1371/journal.pone.0100722 - - -31 11F CR931657 - Calix et al 2011 J Bacteriology https://doi.org/10.1128/JB.05034-11 img/serotype_cps/serotype_11F_cps.svg - -32 11F_like MF140334 - Manna et al 2018 Clin Microbiol Infect https://doi.org/10.1016%2Fj.cmi.2017.06.031 img/serotype_cps/serotype_11F_like_cps.svg - -33 12A CR931658 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_12A_cps.svg - -34 12B CR931659 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_12B_cps.svg - -35 12F CR931660 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_12F_cps.svg - -36 13 CR931661 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_13_cps.svg - -37 14 CR931662 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_14_cps.svg - -38 15A CR931663 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_15A_cps.svg - -39 15B CR931664 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_15B_cps.svg - -40 15C 
CR931665 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_15C_cps.svg - -41 15D SAMN14150919 - Pimenta et al 2021 J Clin Microbiol https://doi.org/10.1128/jcm.00329-21 img/serotype_cps/serotype_15D_cps.svg - -42 15F CR931666 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_15F_cps.svg - -43 16A CR931667 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_16A_cps.svg - -44 16F CR931668 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_16F_cps.svg - -45 17A CR931669 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_17A_cps.svg - -46 17F CR931670 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_17F_cps.svg - -47 18A CR931671 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_18A_cps.svg - -48 18B CR931672 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_18B_cps.svg - -49 18C CR931673 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_18C_cps.svg - -50 18F CR931674 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_18F_cps.svg - -51 19A CR931675 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_19A_cps.svg - -52 19B CR931676 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_19B_cps.svg - -53 19C CR931677 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_19C_cps.svg - -54 19F CR931678 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 
img/serotype_cps/serotype_19F_cps.svg - -55 20A JQ653094 - Calix et al 2012 J Biol Chem https://doi.org/10.1074/jbc.M112.380451 img/serotype_cps/serotype_20A_cps.svg - -56 20B JQ653093 - Calix et al 2012 J Biol Chem https://doi.org/10.1074/jbc.M112.380451 img/serotype_cps/serotype_20B_cps.svg - -57 21 CR931680 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_21_cps.svg - -58 22A CR931681 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_22A_cps.svg - -59 22F CR931682 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_22F_cps.svg - -60 23A CR931683 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_23A_cps.svg - -61 23B CR931684 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_23B_cps.svg - -62 23F CR931685 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_23F_cps.svg - -63 24A CR931686 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_24A_cps.svg - -64 24B CR931687 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_24B_cps.svg - -65 24C MW683298 - Ganaie et al 2021 J Clin Microbiol https://doi.org/10.1128/JCM.00540-21 img/serotype_cps/serotype_24C_cps.svg - -66 24F CR931688 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_24F_cps.svg - -67 25A CR931689 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_25A_cps.svg - -68 25F CR931690 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_25F_cps.svg - -69 27 CR931691 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 
img/serotype_cps/serotype_27_cps.svg - -70 28A CR931692 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_28A_cps.svg - -71 28F CR931693 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_28F_cps.svg - -72 29 CR931694 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_29_cps.svg - -73 31 CR931695 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_31_cps.svg - -74 32A CR931696 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_32A_cps.svg - -75 32F CR931697 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_32F_cps.svg - -76 33A CR931698 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_33A_cps.svg - -77 33B CR931699 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_33B_cps.svg - -78 33C CR931700 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_33C_cps.svg - -79 33D CR931701 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_33D_cps.svg - -80 33E SAMEA2203953 - Ganaie et al 2023 J Biol Chem https://doi.org/10.1016/j.jbc.2023.105085 img/serotype_cps/serotype_33E_cps.svg - -81 33F CR931702 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_33F_cps.svg - -82 33G OR509570 - Manna et al 2023 Microbiol Spectr https://doi.org/10.1128%2Fspectrum.03579-23 img/serotype_cps/serotype_33G_cps.svg - -83 34 CR931703 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_34_cps.svg - -84 35A CR931704 - Bentley et al 2006 PloS Genet 
https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_35A_cps.svg - -85 35B CR931705 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_35B_cps.svg - -86 35C CR931706 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_35C_cps.svg - -87 35D KY084476 various disruptive mutations in wciG "Geno et al 2017 J Clin Microbiol,Lo et al 2018 J Clin Microbiol" "https://doi.org/10.1128/JCM.00054-17,https://doi.org/10.1128/jcm.00228-18" img/serotype_cps/serotype_35D_cps.svg - -88 35F CR931707 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_35F_cps.svg - -89 36A CR931708 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_36A_cps.svg - -90 36B MK606436 - Ganaie et al 2023 J Clin Microbiol https://doi.org/10.1128/jcm.00024-23 img/serotype_cps/serotype_36B_cps.svg - -91 37 CR931709 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_37_cps.svg - -92 38 CR931710 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_38_cps.svg - -93 39 CR931711 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_39_cps.svg - -94 40 CR931712 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_40_cps.svg - -95 41A CR931713 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_41A_cps.svg - -96 41F CR931714 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_41F_cps.svg - -97 42 CR931715 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_42_cps.svg - -98 43 CR931716 - Bentley et al 2006 PloS Genet 
https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_43_cps.svg - -99 44 CR931717 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_44_cps.svg - -100 45 CR931718 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_45_cps.svg - -101 46 CR931719 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_46_cps.svg - -102 47A CR931720 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_47A_cps.svg - -103 47F CR931721 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_47F_cps.svg - -104 48 CR931722 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_48_cps.svg - -- 9X MK606437 putative novel serotype based on nucleotide sequence encoding pneumococcal capsule van Tonder et al 2019 Mgen https://doi.org/10.1099/mgen.0.000274 img/serotype_cps/serotype_9X_cps.svg - -- 11X MK606429 putative novel serotype based on nucleotide sequence encoding pneumococcal capsule van Tonder et al 2019 Mgen https://doi.org/10.1099/mgen.0.000274 img/serotype_cps/serotype_11X_cps.svg - -- 16X MK606430 putative novel serotype based on nucleotide sequence encoding pneumococcal capsule van Tonder et al 2019 Mgen https://doi.org/10.1099/mgen.0.000274 img/serotype_cps/serotype_16X_cps.svg - -- 18X1 MK606431 putative novel serotype based on nucleotide sequence encoding pneumococcal capsule van Tonder et al 2019 Mgen https://doi.org/10.1099/mgen.0.000274 img/serotype_cps/serotype_18X1_cps.svg - -- 18X2 MK606432 putative novel serotype based on nucleotide sequence encoding pneumococcal capsule van Tonder et al 2019 Mgen https://doi.org/10.1099/mgen.0.000274 img/serotype_cps/serotype_18X2_cps.svg - -- 18X3 MK606433 putative novel serotype based on nucleotide sequence encoding pneumococcal 
capsule van Tonder et al 2019 Mgen https://doi.org/10.1099/mgen.0.000274 img/serotype_cps/serotype_18X3_cps.svg - -- 29X MK606434 putative novel serotype based on nucleotide sequence encoding pneumococcal capsule van Tonder et al 2019 Mgen https://doi.org/10.1099/mgen.0.000274 img/serotype_cps/serotype_29X_cps.svg - -- 33X MK606435 putative novel serotype based on nucleotide sequence encoding pneumococcal capsule van Tonder et al 2019 Mgen https://doi.org/10.1099/mgen.0.000274 img/serotype_cps/serotype_33X_cps.svg - -- 36X MK606436 putative novel serotype based on nucleotide sequence encoding pneumococcal capsule van Tonder et al 2019 Mgen https://doi.org/10.1099/mgen.0.000274 img/serotype_cps/serotype_36X_cps.svg - -- Group I nonencapsulated - do not produce capsule due to mutations or deletion of genes encoding capsule Hathaway et al 2014 J Bacteriology https://doi.org/10.1128/JB.186.12.3721-3729.2004 - - -- Group II nonencapsulated - do not produce capsule due to novel genes in place of genes encoding capsule "Park et al 2012 mBio,Salter et al 2012 Microbiology" "https://doi.org/10.1128/mBio.00035-12,https://doi.org/10.1099%2Fmic.0.056580-0" - - \ No newline at end of file +count serotype accessionNumber comments reference referenceUrl cpsImage cpsRemark genBankFile poolSerum typeSerum groupSerum factorSerum otherSerum otherSerumRemark antiserumNote capsularStructureImage capsularStructureRemark +1 1 CR931632 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_1_cps.svg - res/serotype_genbank/serotype_1.gb "A,P" 1 - - - - - img/serotype_capsular_structure/serotype_1_capsular_structure.svg - +2 2 CR931633 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_2_cps.svg - res/serotype_genbank/serotype_2.gb "A,T" 2 - - - - - img/serotype_capsular_structure/serotype_2_capsular_structure.svg - +3 3 CR931634 - Bentley et al 2006 PloS Genet 
https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_3_cps.svg - res/serotype_genbank/serotype_3.gb "B,R" 3 - - - - - img/serotype_capsular_structure/serotype_3_capsular_structure.svg - +4 4 CR931635 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_4_cps.svg - res/serotype_genbank/serotype_4.gb "A,R" 4 - - - - - img/serotype_capsular_structure/serotype_4_capsular_structure.svg - +5 5 CR931637 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_5_cps.svg - res/serotype_genbank/serotype_5.gb "A,S" 5 - - - - - img/serotype_capsular_structure/serotype_5_capsular_structure.svg - +6 6A CR931638 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_6A_cps.svg - res/serotype_genbank/serotype_6A.gb "B,Q" - 6 6b - - - img/serotype_capsular_structure/serotype_6A_capsular_structure.svg - +- 6E(6A) - Genetic variant of 6A Park et al 2017 Genome Announc https://doi.org/10.1128/genomeA.01728-16 - - - "B,Q" - 6 6b - - - - - +7 6B CR931639 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_6B_cps.svg - res/serotype_genbank/serotype_6B.gb "B,Q" - 6 6c - - - img/serotype_capsular_structure/serotype_6B_capsular_structure.svg - +- 6E(6B) LT594599 Genetic variant of 6B Kapatai et al 2016 PeerJ https://doi.org/10.7717%2Fpeerj.2477 - - res/serotype_genbank/serotype_6E_6B.gb "B,Q" - 6 6c - - - - - +8 6C "EF538714,EF538715,EF538716,EF538717,EF538718" - "Park et al 2007 J Clin Microbiol,Park et al 2007 Infect Immun" "https://doi.org/10.1128/JCM.02199-06,https://doi.org/10.1128/iai.00510-07" img/serotype_cps/serotype_6C_cps.svg - res/serotype_genbank/serotype_6C.gb "B,Q" - 6 6d - - - img/serotype_capsular_structure/serotype_6C_capsular_structure.svg - +9 6D HM448897 - Nahm et al 2011 J Med Microbiol https://doi.org/10.1099%2Fjmm.0.023853-0 
img/serotype_cps/serotype_6D_cps.svg - res/serotype_genbank/serotype_6D.gb "B,Q" - 6 "6c,6d" - - - img/serotype_capsular_structure/serotype_6D_capsular_structure.svg - +10 6F KC832410 - Oliver et al 2013 J Biol Chem https://doi.org/10.1074%2Fjbc.M113.480152 img/serotype_cps/serotype_6F_cps.svg - res/serotype_genbank/serotype_6F.gb - - - - - - - - 6A + 6C +11 6G KC832411 - Oliver et al 2013 J Biol Chem https://doi.org/10.1074%2Fjbc.M113.480152 img/serotype_cps/serotype_6G_cps.svg - res/serotype_genbank/serotype_6G.gb - - - - - - - - 6B + 6D +12 6H KF597302 - Park et al 2015 Clin Vaccine Immunol https://doi.org/10.1128/CVI.00647-14 img/serotype_cps/serotype_6H_cps.svg Partial sequence only res/serotype_genbank/serotype_6H.gb - - - - - - - - 6A + 6B +13 7A CR931640 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_7A_cps.svg - res/serotype_genbank/serotype_7A.gb "C,P" - 7 "7b,7c" - - - img/serotype_capsular_structure/serotype_7A_capsular_structure.svg - +14 7B CR931641 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_7B_cps.svg - res/serotype_genbank/serotype_7B.gb "C,P" - 7 7e - - - img/serotype_capsular_structure/serotype_7B_capsular_structure.svg - +15 7C CR931642 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_7C_cps.svg - res/serotype_genbank/serotype_7C.gb "C,P" - 7 7f - - - img/serotype_capsular_structure/serotype_7C_capsular_structure.svg - +16 7D - - Kjeldsen et al 2018 Carbohydr Res https://doi.org/10.1016/j.carres.2018.04.011 - - - - - - - - - - - 7B (1X) + 7C (5X) +17 7F CR931643 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_7F_cps.svg - res/serotype_genbank/serotype_7F.gb "C,P" - 7 7b - - - img/serotype_capsular_structure/serotype_7F_capsular_structure.svg - +18 8 CR931644 - Bentley et al 2006 PloS Genet 
https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_8_cps.svg - res/serotype_genbank/serotype_8.gb "B,S" 8 - - - - - img/serotype_capsular_structure/serotype_8_capsular_structure.svg - +19 9A CR931645 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_9A_cps.svg - res/serotype_genbank/serotype_9A.gb "D,R" - 9 9d - - - img/serotype_capsular_structure/serotype_9A_capsular_structure.svg - +20 9L CR931646 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_9L_cps.svg - res/serotype_genbank/serotype_9L.gb "D,R" - 9 9b - - - img/serotype_capsular_structure/serotype_9L_capsular_structure.svg - +21 9N CR931647 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_9N_cps.svg - res/serotype_genbank/serotype_9N.gb "D,R" - 9 "9b,9e" - - - img/serotype_capsular_structure/serotype_9N_capsular_structure.svg - +22 9V CR931648 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_9V_cps.svg - res/serotype_genbank/serotype_9V.gb "D,R" - 9 "9d,9g" - - - img/serotype_capsular_structure/serotype_9V_capsular_structure.svg - +23 10A CR931649 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_10A_cps.svg - res/serotype_genbank/serotype_10A.gb "E,S" - 10 10d - - - img/serotype_capsular_structure/serotype_10A_capsular_structure.svg - +24 10B CR931650 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_10B_cps.svg - res/serotype_genbank/serotype_10B.gb "E,S" - 10 "10b,10d" - - - img/serotype_capsular_structure/serotype_10B_capsular_structure.svg - +25 10C CR931651 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_10C_cps.svg - res/serotype_genbank/serotype_10C.gb "E,S" - 10 "10b,10f" - - - 
img/serotype_capsular_structure/serotype_10C_capsular_structure.svg - +26 10D ERR051587 - Ganaie et al 2020 mBio https://doi.org/10.1128/mBio.00937-20 img/serotype_cps/serotype_10D_cps.svg - res/serotype_genbank/serotype_10D.gb - - - - - - - img/serotype_capsular_structure/serotype_10D_capsular_structure.svg - +27 10F CR931652 - "Bentley et al 2006 PloS Genet,Yang et al 2011 J Biol Chem" "https://doi.org/10.1371/journal.pgen.0020031,https://doi.org/10.1074/jbc.M111.255422" img/serotype_cps/serotype_10F_cps.svg - res/serotype_genbank/serotype_10F.gb "E,S" - 10 10b - - - img/serotype_capsular_structure/serotype_10F_capsular_structure.svg - +28 11A CR931653 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_11A_cps.svg - res/serotype_genbank/serotype_11A.gb "D,T" - 11 11c - - - img/serotype_capsular_structure/serotype_11A_capsular_structure.svg - +29 11B CR931654 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_11B_cps.svg - res/serotype_genbank/serotype_11B.gb "D,T" - 11 "11b,11f,11g" - - - img/serotype_capsular_structure/serotype_11B_capsular_structure.svg - +30 11C CR931655 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_11C_cps.svg - res/serotype_genbank/serotype_11C.gb "D,T" - 11 "11b,11c,11f" - - - img/serotype_capsular_structure/serotype_11C_capsular_structure.svg - +31 11D CR931656 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_11D_cps.svg - res/serotype_genbank/serotype_11D.gb "D,T" - 11 "11b,11c" - - - img/serotype_capsular_structure/serotype_11D_capsular_structure.svg - +32 11E - - Calix et al 2010 J Infect Dis https://doi.org/10.1086/653123 img/serotype_cps/serotype_11E_cps.svg - res/serotype_genbank/serotype_11E.gb - - - - - - - img/serotype_capsular_structure/serotype_11E_capsular_structure.svg - +- 11Av - A serovariant which is an 
intermediate variant of 11A and 11E Camilli et al 2014 PloS ONE https://doi.org/10.1371/journal.pone.0100722 - - - - - - - - - - - - +33 11F CR931657 - Calix et al 2011 J Bacteriology https://doi.org/10.1128/JB.05034-11 img/serotype_cps/serotype_11F_cps.svg - res/serotype_genbank/serotype_11F.gb "D,T" - 11 "11b,11g" - - - img/serotype_capsular_structure/serotype_11F_capsular_structure.svg - +_ 11F-like MF140334 Genetic variant of 11A Manna et al 2018 Clin Microbiol Infect https://doi.org/10.1016%2Fj.cmi.2017.06.031 img/serotype_cps/serotype_11F-like_cps.svg - res/serotype_genbank/serotype_11F-like.gb - - - - - - - - - +34 12A CR931658 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_12A_cps.svg - res/serotype_genbank/serotype_12A.gb "E,R" - 12 12c - - - img/serotype_capsular_structure/serotype_12A_capsular_structure.svg - +35 12B CR931659 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_12B_cps.svg - res/serotype_genbank/serotype_12B.gb "E,R" - 12 "12b,12c,12e" - - - - - +36 12F CR931660 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_12F_cps.svg - res/serotype_genbank/serotype_12F.gb "E,R" - 12 12b - - - img/serotype_capsular_structure/serotype_12F_capsular_structure.svg - +37 13 CR931661 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_13_cps.svg - res/serotype_genbank/serotype_13.gb H 13 - - - - - img/serotype_capsular_structure/serotype_13_capsular_structure.svg - +38 14 CR931662 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_14_cps.svg - res/serotype_genbank/serotype_14.gb "H,P" 14 - - - - - img/serotype_capsular_structure/serotype_14_capsular_structure.svg - +39 15A CR931663 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_15A_cps.svg - 
res/serotype_genbank/serotype_15A.gb "H,S" - 15 15c - - - img/serotype_capsular_structure/serotype_15A_capsular_structure.svg - +40 15B CR931664 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_15B_cps.svg - res/serotype_genbank/serotype_15B.gb "H,S" - 15 "15b,15e,15h" - - - img/serotype_capsular_structure/serotype_15B_capsular_structure.svg - +41 15C CR931665 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_15C_cps.svg - res/serotype_genbank/serotype_15C.gb "H,S" - 15 15e - - - img/serotype_capsular_structure/serotype_15C_capsular_structure.svg - +42 15D SAMN14150919 - Pimenta et al 2021 J Clin Microbiol https://doi.org/10.1128/jcm.00329-21 img/serotype_cps/serotype_15D_cps.svg - res/serotype_genbank/serotype_15D.gb "H,S" - 15 "15b,15c" "15bf,15g" "Antiserum available at CDC,Antiserum available at CDC" Cannot be identified only by SSI Antiseria img/serotype_capsular_structure/serotype_15F_capsular_structure.svg Predicted +43 15F CR931666 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_15F_cps.svg - res/serotype_genbank/serotype_15F.gb "H,S" - 15 "15b,15c" - - - img/serotype_capsular_structure/serotype_15F_capsular_structure.svg - +44 16A CR931667 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_16A_cps.svg - res/serotype_genbank/serotype_16A.gb D - 16 16c - - - img/serotype_capsular_structure/serotype_16A_capsular_structure.svg - +45 16F CR931668 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_16F_cps.svg - res/serotype_genbank/serotype_16F.gb D - 16 16b - - - img/serotype_capsular_structure/serotype_16F_capsular_structure.svg - +46 17A CR931669 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_17A_cps.svg - res/serotype_genbank/serotype_17A.gb 
"F,S" - 17 17c - - - img/serotype_capsular_structure/serotype_17A_capsular_structure.svg - +47 17F CR931670 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_17F_cps.svg - res/serotype_genbank/serotype_17F.gb "F,S" - 17 17b - - - img/serotype_capsular_structure/serotype_17F_capsular_structure.svg - +48 18A CR931671 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_18A_cps.svg - res/serotype_genbank/serotype_18A.gb "A,Q" - 18 18d - - - img/serotype_capsular_structure/serotype_18A_capsular_structure.svg - +49 18B CR931672 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_18B_cps.svg - res/serotype_genbank/serotype_18B.gb "A,Q" - 18 18e - - - img/serotype_capsular_structure/serotype_18B_capsular_structure.svg - +50 18C CR931673 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_18C_cps.svg - res/serotype_genbank/serotype_18C.gb "A,Q" - 18 "18c,18e" - - - img/serotype_capsular_structure/serotype_18C_capsular_structure.svg - +51 18F CR931674 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_18F_cps.svg - res/serotype_genbank/serotype_18F.gb "A,Q" - 18 "18c,18e,18f" - - - img/serotype_capsular_structure/serotype_18F_capsular_structure.svg - +52 19A CR931675 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_19A_cps.svg - res/serotype_genbank/serotype_19A.gb "B,P" - 19 19c - - - img/serotype_capsular_structure/serotype_19A_capsular_structure.svg - +53 19B CR931676 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_19B_cps.svg - res/serotype_genbank/serotype_19B.gb "B,P" - 19 7h - - - img/serotype_capsular_structure/serotype_19B_capsular_structure.svg - +54 19C CR931677 - Bentley et al 2006 PloS Genet 
https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_19C_cps.svg - res/serotype_genbank/serotype_19C.gb "B,P" - 19 "19f,7h" - - - img/serotype_capsular_structure/serotype_19C_capsular_structure.svg - +55 19F CR931678 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_19F_cps.svg - res/serotype_genbank/serotype_19F.gb "B,P" - 19 19b - - - img/serotype_capsular_structure/serotype_19F_capsular_structure.svg - +56 20A JQ653094 - Calix et al 2012 J Biol Chem https://doi.org/10.1074/jbc.M112.380451 img/serotype_cps/serotype_20A_cps.svg - res/serotype_genbank/serotype_20A.gb - - - - - - - img/serotype_capsular_structure/serotype_20A_capsular_structure.svg - +57 20B JQ653093 - Calix et al 2012 J Biol Chem https://doi.org/10.1074/jbc.M112.380451 img/serotype_cps/serotype_20B_cps.svg - res/serotype_genbank/serotype_20B.gb - - - - - - - img/serotype_capsular_structure/serotype_20B_capsular_structure.svg - +58 20C ERR980181 - Yu et al 2024 Microbiol Spectr https://doi.org/10.1128/spectrum.02443-24 img/serotype_cps/serotype_20C_cps.svg - res/serotype_genbank/serotype_20C.gb - - - - - - - img/serotype_capsular_structure/serotype_20C_capsular_structure.svg - +59 21 CR931680 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_21_cps.svg - res/serotype_genbank/serotype_21.gb E 21 - - - - - - - +60 22A CR931681 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_22A_cps.svg - res/serotype_genbank/serotype_22A.gb "F,T" - 22 22c - - - img/serotype_capsular_structure/serotype_22A_capsular_structure.svg - +61 22F CR931682 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_22F_cps.svg - res/serotype_genbank/serotype_22F.gb "F,T" - 22 22b - - - img/serotype_capsular_structure/serotype_22F_capsular_structure.svg - +62 23A CR931683 - Bentley et al 2006 PloS Genet 
https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_23A_cps.svg - res/serotype_genbank/serotype_23A.gb "H,Q" - 23 23c - - - img/serotype_capsular_structure/serotype_23A_capsular_structure.svg - +63 23B CR931684 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_23B_cps.svg - res/serotype_genbank/serotype_23B.gb "H,Q" - 23 23d - - - img/serotype_capsular_structure/serotype_23B_capsular_structure.svg - +64 23F CR931685 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_23F_cps.svg - res/serotype_genbank/serotype_23F.gb "H,Q" - 23 23b - - - img/serotype_capsular_structure/serotype_23F_capsular_structure.svg - +65 24A CR931686 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_24A_cps.svg - res/serotype_genbank/serotype_24A.gb C - 24 "24c,24d" - - - img/serotype_capsular_structure/serotype_24A_capsular_structure.svg - +66 24B CR931687 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_24B_cps.svg - res/serotype_genbank/serotype_24B.gb C - 24 24e - - - img/serotype_capsular_structure/serotype_24B_capsular_structure.svg - +67 24C MW683298 - Ganaie et al 2021 J Clin Microbiol https://doi.org/10.1128/JCM.00540-21 img/serotype_cps/serotype_24C_cps.svg - res/serotype_genbank/serotype_24C.gb - - - - - - - - 24B + 24F +68 24F CR931688 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_24F_cps.svg - res/serotype_genbank/serotype_24F.gb C - 24 24d - - - img/serotype_capsular_structure/serotype_24F_capsular_structure.svg - +69 25A CR931689 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_25A_cps.svg - res/serotype_genbank/serotype_25A.gb I - 25 25c - - - - - +70 25F CR931690 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 
img/serotype_cps/serotype_25F_cps.svg - res/serotype_genbank/serotype_25F.gb I - 25 25b - - - - - +71 27 CR931691 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_27_cps.svg - res/serotype_genbank/serotype_27.gb F 27 - - - - - img/serotype_capsular_structure/serotype_27_capsular_structure.svg - +72 28A CR931692 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_28A_cps.svg - res/serotype_genbank/serotype_28A.gb H - 28 28c - - - img/serotype_capsular_structure/serotype_28A_capsular_structure.svg - +73 28F CR931693 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_28F_cps.svg - res/serotype_genbank/serotype_28F.gb H - 28 28b - - - img/serotype_capsular_structure/serotype_28F_capsular_structure.svg - +74 29 CR931694 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_29_cps.svg - res/serotype_genbank/serotype_29.gb G 29 - - - - - img/serotype_capsular_structure/serotype_29_capsular_structure.svg - +75 31 CR931695 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_31_cps.svg - res/serotype_genbank/serotype_31.gb C 31 - - - - - img/serotype_capsular_structure/serotype_31_capsular_structure.svg - +76 32A CR931696 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_32A_cps.svg - res/serotype_genbank/serotype_32A.gb F - 32 "32a,32b" - - - img/serotype_capsular_structure/serotype_32A_capsular_structure.svg - +77 32F CR931697 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_32F_cps.svg - res/serotype_genbank/serotype_32F.gb F - 32 32a - - - img/serotype_capsular_structure/serotype_32F_capsular_structure.svg - +78 33A CR931698 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 
img/serotype_cps/serotype_33A_cps.svg - res/serotype_genbank/serotype_33A.gb "E,T" - 33 "33b,20b" - - - img/serotype_capsular_structure/serotype_33A_capsular_structure.svg - +79 33B CR931699 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_33B_cps.svg - res/serotype_genbank/serotype_33B.gb "E,T" - 33 33f - - - img/serotype_capsular_structure/serotype_33B_capsular_structure.svg - +80 33C CR931700 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_33C_cps.svg - res/serotype_genbank/serotype_33C.gb "E,T" - 33 33e(33f) - - - img/serotype_capsular_structure/serotype_33C_capsular_structure.svg - +81 33D CR931701 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_33D_cps.svg - res/serotype_genbank/serotype_33D.gb "E,T" - 33 "33f,6a" - - - img/serotype_capsular_structure/serotype_33D_capsular_structure.svg - +82 33E SAMEA2203953 - Ganaie et al 2023 J Biol Chem https://doi.org/10.1016/j.jbc.2023.105085 img/serotype_cps/serotype_33E_cps.svg - res/serotype_genbank/serotype_33E.gb - - - - - - - img/serotype_capsular_structure/serotype_33E_capsular_structure.svg - +83 33F CR931702 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_33F_cps.svg - res/serotype_genbank/serotype_33F.gb "E,T" - 33 33b - - - img/serotype_capsular_structure/serotype_33F_capsular_structure.svg - +84 33G OR509570 - Manna et al 2023 Microbiol Spectr https://doi.org/10.1128%2Fspectrum.03579-23 img/serotype_cps/serotype_33G_cps.svg - res/serotype_genbank/serotype_33G.gb - - - - - - - img/serotype_capsular_structure/serotype_33G_capsular_structure.svg - +85 34 CR931703 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_34_cps.svg - res/serotype_genbank/serotype_34.gb G 34 - - - - - img/serotype_capsular_structure/serotype_34_capsular_structure.svg - 
+86 35A CR931704 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_35A_cps.svg - res/serotype_genbank/serotype_35A.gb G - 35 "35a,35c" - - - img/serotype_capsular_structure/serotype_35A_capsular_structure.svg - +87 35B CR931705 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_35B_cps.svg - res/serotype_genbank/serotype_35B.gb G - 35 "35a,35c,29b" - - - img/serotype_capsular_structure/serotype_35B_capsular_structure.svg - +88 35C CR931706 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_35C_cps.svg - res/serotype_genbank/serotype_35C.gb G - 35 "35a,35c,42a" - - - img/serotype_capsular_structure/serotype_35C_capsular_structure.svg - +89 35D KY084476 various disruptive mutations in wciG "Geno et al 2017 J Clin Microbiol,Lo et al 2018 J Clin Microbiol" "https://doi.org/10.1128/JCM.00054-17,https://doi.org/10.1128/jcm.00228-18" img/serotype_cps/serotype_35D_cps.svg - res/serotype_genbank/serotype_35D.gb G - - - "fs29b,fs35c" "Antiserum available at Nahm Lab,Antiserum available at Nahm Lab" Can be differentiated from 35B by SSI antisera based on the absence of reaction with SSI Factor Serum 35a img/serotype_capsular_structure/serotype_35D_capsular_structure.svg - +90 35F CR931707 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_35F_cps.svg - res/serotype_genbank/serotype_35F.gb G - 35 "35a,35b" - - - img/serotype_capsular_structure/serotype_35F_capsular_structure.svg - +91 36A CR931708 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_36A_cps.svg - res/serotype_genbank/serotype_36A.gb D 36 - 9e - - - img/serotype_capsular_structure/serotype_36A_capsular_structure.svg - +92 36B MK606436 - Ganaie et al 2023 J Clin Microbiol https://doi.org/10.1128/jcm.00024-23 img/serotype_cps/serotype_36B_cps.svg - 
res/serotype_genbank/serotype_36B.gb D 36 - - - - - img/serotype_capsular_structure/serotype_36B_capsular_structure.svg - +93 37 CR931709 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_37_cps.svg - res/serotype_genbank/serotype_37.gb D 37 - - - - - img/serotype_capsular_structure/serotype_37_capsular_structure.svg - +94 38 CR931710 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_38_cps.svg - res/serotype_genbank/serotype_38.gb I 38 - - - - - img/serotype_capsular_structure/serotype_38_capsular_structure.svg - +95 39 CR931711 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_39_cps.svg - res/serotype_genbank/serotype_39.gb E 39 - - - - - img/serotype_capsular_structure/serotype_39_capsular_structure.svg - +96 40 CR931712 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_40_cps.svg - res/serotype_genbank/serotype_40.gb C 40 - - - - - - - +97 41A CR931713 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_41A_cps.svg - res/serotype_genbank/serotype_41A.gb F - 41 41a - - - img/serotype_capsular_structure/serotype_41A_capsular_structure.svg - +98 41F CR931714 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_41F_cps.svg - res/serotype_genbank/serotype_41F.gb F - 41 "41a,41b" - - - img/serotype_capsular_structure/serotype_41F_capsular_structure.svg - +99 42 CR931715 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_42_cps.svg - res/serotype_genbank/serotype_42.gb G 42 - - - - - img/serotype_capsular_structure/serotype_42_capsular_structure.svg - +100 43 CR931716 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_43_cps.svg - 
res/serotype_genbank/serotype_43.gb I 43 - - - - - - - +101 44 CR931717 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_44_cps.svg - res/serotype_genbank/serotype_44.gb I 44 - - - - - - - +102 45 CR931718 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_45_cps.svg - res/serotype_genbank/serotype_45.gb I 45 - - - - - img/serotype_capsular_structure/serotype_45_capsular_structure.svg - +103 46 CR931719 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_46_cps.svg - res/serotype_genbank/serotype_46.gb I 46 - - - - - - - +104 47A CR931720 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_47A_cps.svg - res/serotype_genbank/serotype_47A.gb G - 47 "47a,43b" - - - img/serotype_capsular_structure/serotype_47A_capsular_structure.svg - +105 47F CR931721 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_47F_cps.svg - res/serotype_genbank/serotype_47F.gb G - 47 47a - - - img/serotype_capsular_structure/serotype_47F_capsular_structure.svg - +106 48 CR931722 - Bentley et al 2006 PloS Genet https://doi.org/10.1371/journal.pgen.0020031 img/serotype_cps/serotype_48_cps.svg - res/serotype_genbank/serotype_48.gb I 48 - - - - - - - +- 9X MK606437 putative novel serotype based on nucleotide sequence encoding pneumococcal capsule van Tonder et al 2019 Mgen https://doi.org/10.1099/mgen.0.000274 img/serotype_cps/serotype_9X_cps.svg - res/serotype_genbank/serotype_9X.gb - - - - - - - - - +- 11X MK606429 putative novel serotype based on nucleotide sequence encoding pneumococcal capsule van Tonder et al 2019 Mgen https://doi.org/10.1099/mgen.0.000274 img/serotype_cps/serotype_11X_cps.svg - res/serotype_genbank/serotype_11X.gb - - - - - - - - - +- 16X MK606430 putative novel serotype based on nucleotide sequence encoding 
pneumococcal capsule van Tonder et al 2019 Mgen https://doi.org/10.1099/mgen.0.000274 img/serotype_cps/serotype_16X_cps.svg - res/serotype_genbank/serotype_16X.gb - - - - - - - - - +- 18X1 MK606431 putative novel serotype based on nucleotide sequence encoding pneumococcal capsule van Tonder et al 2019 Mgen https://doi.org/10.1099/mgen.0.000274 img/serotype_cps/serotype_18X1_cps.svg - res/serotype_genbank/serotype_18X1.gb - - - - - - - - - +- 18X2 MK606432 putative novel serotype based on nucleotide sequence encoding pneumococcal capsule van Tonder et al 2019 Mgen https://doi.org/10.1099/mgen.0.000274 img/serotype_cps/serotype_18X2_cps.svg - res/serotype_genbank/serotype_18X2.gb - - - - - - - - - +- 18X3 MK606433 putative novel serotype based on nucleotide sequence encoding pneumococcal capsule van Tonder et al 2019 Mgen https://doi.org/10.1099/mgen.0.000274 img/serotype_cps/serotype_18X3_cps.svg - res/serotype_genbank/serotype_18X3.gb - - - - - - - - - +- 29X MK606434 putative novel serotype based on nucleotide sequence encoding pneumococcal capsule van Tonder et al 2019 Mgen https://doi.org/10.1099/mgen.0.000274 img/serotype_cps/serotype_29X_cps.svg - res/serotype_genbank/serotype_29X.gb - - - - - - - - - +- Group I nonencapsulated - do not produce capsule due to mutations or deletion of genes encoding capsule Hathaway et al 2014 J Bacteriology https://doi.org/10.1128/JB.186.12.3721-3729.2004 - - - - - - - - - - - N/A - Nonencapsulated +- Group II nonencapsulated - NCC1 pspK JF489996 do not produce capsule due to novel genes in place of genes encoding capsule Park et al 2012 mBio https://doi.org/10.1128/mbio.00035-12 img/serotype_cps/group_II_nonencapsulated-NCC1_pspK.svg - - - - - - - - - - N/A - Nonencapsulated +- Group II nonencapsulated - NCC2 aliC aliD HE651292 do not produce capsule due to novel genes in place of genes encoding capsule "Park et al 2012 mBio,Salter et al 2012 Microbiology (Reading)" 
"https://doi.org/10.1128/mbio.00035-12,https://doi.org/10.1099/mic.0.056580-0" img/serotype_cps/group_II_nonencapsulated-NCC2_aliC_aliD.svg - - - - - - - - - - N/A - Nonencapsulated +- Group II nonencapsulated - NCC2 S. mitis aliC aliD HE651274 do not produce capsule due to novel genes in place of genes encoding capsule "Park et al 2012 mBio,Salter et al 2012 Microbiology (Reading)" "https://doi.org/10.1128/mbio.00035-12,https://doi.org/10.1099/mic.0.056580-0" img/serotype_cps/group_II_nonencapsulated-NCC2_S_mitis_aliC_aliD.svg - - - - - - - - - - N/A - Nonencapsulated +- Group II nonencapsulated - NCC3 aliD JF490008 do not produce capsule due to novel genes in place of genes encoding capsule Park et al 2012 mBio https://doi.org/10.1128/mbio.00035-12 img/serotype_cps/group_II_nonencapsulated-NCC3_aliD.svg - - - - - - - - - - N/A - Nonencapsulated \ No newline at end of file diff --git a/src/content/substudiesContent.js b/src/content/substudiesContent.js index 30c8222..f11b348 100644 --- a/src/content/substudiesContent.js +++ b/src/content/substudiesContent.js @@ -75,7 +75,7 @@ const content = { title: 'Diversity of ribosomal mutations associated with MLS resistance', authors: 'Paulina Hawkins', affiliations: 'Centers for Disease Control and Prevention', - details: 'Macrolide has increasingly been used as empirical treatment for respiratory tract infection. After PCV13, rising macrolide resistance was observed in pneumococci with non-vaccine serotype ([Lo *et al* 2019](https://www.thelancet.com/journals/laninf/article/PIIS1473-3099(19)30297-X/fulltext)). This study will improve our understanding of the genetic diversity of ribosomal mutations related to macrolide resistance in *S. pneumoniae.*' + details: 'Macrolide has increasingly been used as empirical treatment for respiratory tract infection. After PCV13, rising macrolide resistance was observed in pneumococci with non-vaccine serotype ([Lo *et al* 2019](https://doi.org/10.1016/s1473-3099(19)30297-x)). 
This study will improve our understanding of the genetic diversity of ribosomal mutations related to macrolide resistance in *S. pneumoniae.*' }, { title: 'Genetic diversity and distribution of the pneumococcal ABC transporter proteins and implications on potential protein-based vaccines', @@ -93,13 +93,13 @@ const content = { title: 'Global distribution and evolution of major penicillin binding proteins that determine β-lactam resistance in *Streptococcus pneumoniae*', authors: 'Yuan Li, Benjamin Metcalf, Lesley McGee, Bernard Beall, Stephen Bentley, Rebecca Gladstone', affiliations: 'Centers for Disease Control and Prevention', - details: '[CDC Strep Lab](https://www.cdc.gov/streplab/index.html) has a strong expertise in using genomic data to predict antibiotic resistance in *S. pneumoniae*. This project will appreciate the genetic diversity and evolution of the penicillin binding protein, that confer resistance to the first-line antibiotic, β-lactam, in treating pneumococcal disease.' + details: '[CDC Strep Lab](https://www.cdc.gov/strep-lab/) has a strong expertise in using genomic data to predict antibiotic resistance in *S. pneumoniae*. This project will appreciate the genetic diversity and evolution of the penicillin binding protein, that confer resistance to the first-line antibiotic, β-lactam, in treating pneumococcal disease.' }, { title: 'Global distribution and evolution of Streptococcus pneumoniae GPSC3 (PMEN33)', authors: 'Stephanie Lo', affiliations: 'Wellcome Sanger Institute', - details: 'GPS headline paper on [Lancet Infectious Diseases](https://www.thelancet.com/journals/laninf/article/PIIS1473-3099(19)30297-X/fulltext) has pointed out that GPSC3 is a major pneumococcal strain expressing non-vaccine serotype after PCV13. Using a global collection, we will investigate the evolutionary history of this important lineage and shed light on its secret of success.' 
+ details: 'GPS headline paper on [Lancet Infectious Diseases](https://doi.org/10.1016/s1473-3099(19)30297-x) has pointed out that GPSC3 is a major pneumococcal strain expressing non-vaccine serotype after PCV13. Using a global collection, we will investigate the evolutionary history of this important lineage and shed light on its secret of success.' }, { title: 'Global distribution and genomic diversity of serotype 5 in context of PCVs', @@ -111,7 +111,7 @@ const content = { title: 'Global diversity of *Streptococcus pneumoniae* serotype 3 isolates; changes in the pre and post PCV eras in comparison with the changes observed in a local collection set in Hong Kong', authors: 'Pak-Leung Ho, Pierra Law', affiliations: 'University of Hong Kong', - details: "[Ho *et al*](https://www.ncbi.nlm.nih.gov/pmc/articles/PMC6422485/pdf/khvi-15-02-1526555.pdf) has importantly reported that serotype 3 emerged after PCV13 in Hong Kong and its increase was due to a regional-specific lineage that replaced the common serotype 3 clone CC180. This study will elucidate the circulating serotype 3 strains in Hong Kong and understand this emerging strain's pathogenicity." + details: "[Ho *et al*](https://doi.org/10.1080/21645515.2018.1526555) has importantly reported that serotype 3 emerged after PCV13 in Hong Kong and its increase was due to a regional-specific lineage that replaced the common serotype 3 clone CC180. This study will elucidate the circulating serotype 3 strains in Hong Kong and understand this emerging strain's pathogenicity." 
}, { title: 'Global emergence and population dynamics of *Streptococcus pneumoniae* serotype 19A/F CC320 (GPSC1)', @@ -153,7 +153,7 @@ const content = { title: 'PneumoCaT2: an investigation into 19A-like cps from serotype 19F pneumococcal isolates', authors: 'Carmen Sheppard, Stephanie Lo', affiliations: 'Public Health of England and Wellcome Sanger Institute', - details: 'PHE developed a WGS-based tool [PneumoCaT](https://pubmed.ncbi.nlm.nih.gov/27672516/) to infer serotype from genome data. This study will harness the global collection in the GPS project to understand a 19F divergent. The knowledge learned will ultimately be integrated into a new version of PneumoCaT.' + details: 'PHE developed a WGS-based tool [PneumoCaT](https://doi.org/10.7717/peerj.2477) to infer serotype from genome data. This study will harness the global collection in the GPS project to understand a 19F divergent. The knowledge learned will ultimately be integrated into a new version of PneumoCaT.' }, { title: 'Population genomics of mobile genetic elements', @@ -183,7 +183,7 @@ const content = { title: 'Validation and improvement of predicting β-Lactam minimum inhibitory concentration of *Streptococcus pneumoniae* using whole-genome sequencing and PBP typing', authors: 'Yuan Li, Benjamin Metcalf, Lesley McGee, Bernard Beall, Mignon du Plessis, Anne von Gottberg', affiliations: 'Centers for Disease Control and Prevention', - details: 'The current machine learning model for prediction of β-Lactam MIC was built and validated using a pneumococcal dataset from the USA (Li *et al* [2016](https://mbio.asm.org/content/7/3/e00756-16) and [2017](https://www.ncbi.nlm.nih.gov/pmc/articles/PMC5558719/)). This study will validate and improve the prediction model using genome data from South Africa.' 
+ details: 'The current machine learning model for prediction of β-Lactam MIC was built and validated using a pneumococcal dataset from the USA (Li *et al* [2016](https://doi.org/10.1128/mbio.00756-16) and [2017](https://doi.org/10.1186%2Fs12864-017-4017-7)). This study will validate and improve the prediction model using genome data from South Africa.' }, ] } diff --git a/src/content/vaccineHistoryContent.js b/src/content/vaccineHistoryContent.js new file mode 100644 index 0000000..c827807 --- /dev/null +++ b/src/content/vaccineHistoryContent.js @@ -0,0 +1,105 @@ +const content = { + title: 'Vaccine History', + sections: [ + { + content: [ + { + type: 'timeline', + content: [ + { + time: '1881', + content: "First independently discovered by Louis Pasteur (who called it *microbe septicemique de la salive*) in France from the saliva of a rabies patient, and by George M. Sternberg in the U.S. (who named it *Micrococcus pasteuri*)", + reference: "https://doi.org/10.1093/clinids/17.5.913" + }, + { + time: '1886', + content: "Renamed 'pneumococcus' for its close association with pneumonia", + reference: "https://maidenlab.zoo.ox.ac.uk/history-and-biology-istreptococcus-pneumoniaei" + }, + { + time: '1911', + content: "Start of efforts to develop an effective pneumococcal vaccine", + reference: "https://doi.org/10.1016/S0140-6736(01)56449-1" + }, + { + time: '1920', + content: "Renamed as *Diplococcus pneumoniae* since it was typically observed in pairs", + reference: "https://doi.org/10.1128%2Fjb.5.3.191-229.1920" + }, + { + time: '1928', + content: "The transformation of life was demonstrated by Frederick Griffith, where harmless pneumococci were turned into a lethal form through the co-inoculation of live harmless pneumococci with heat-killed virulent pneumococci in a mouse; This experiment played a vital role in identifying DNA as the genetic material", + reference: "https://doi.org/10.1017%2Fs0022172400031879" + }, + { + time: '1929', + content: "The first 32 
serotypes were described by Georgia Cooper", + reference: "https://doi.org/10.1084/jem.49.3.461" + }, + { + time: '1939', + content: "Danish Prince Valdemar died of pneumonia and his failed treatment with serogroup 9 antisera revealed additional diversity in serogroup 9, allowing for the identification of serotype 9V", + reference: "https://doi.org/10.4049/jimmunol.37.4.359" + }, + { + time: '1960s', + content: "Start of efforts to develop a polyvalent pneumococcal vaccine", + reference: "https://www.cdc.gov/pinkbook/hcp/table-of-contents/index.html" + }, + { + time: '1974', + content: "Renamed *Streptococcus pneumoniae* for its similarity in chain formation to other *Streptococcus spp.*", + reference: "https://maidenlab.zoo.ox.ac.uk/history-and-biology-istreptococcus-pneumoniaei" + }, + { + time: '1977', + content: "First pneumococcal polysaccharide vaccine licensed in U.S., which contained antigens from 14 serotypes of pneumococci", + reference: "https://www.cdc.gov/pinkbook/hcp/table-of-contents/index.html" + }, + { + time: '1983', + content: "The 23-valent polysaccharide vaccine was licensed (PPSV23), replacing the 14-valent", + reference: "https://www.cdc.gov/pinkbook/hcp/table-of-contents/index.html" + }, + { + time: '2000', + content: "First conjugate pneumococcal vaccine licensed in U.S., covering 7 serotypes (PCV7)", + reference: "https://www.cdc.gov/pinkbook/hcp/table-of-contents/index.html" + }, + { + time: '2010', + content: "Introduction of 13-valent pneumococcal conjugate vaccine (PCV13), covering 6 more serotypes in addition to PCV7", + reference: "https://www.cdc.gov/pinkbook/hcp/table-of-contents/index.html" + }, + { + time: '2020', + content: "The 100th serotype, 10D, is identified", + reference: "https://doi.org/10.1128/mBio.00937-20" + }, + { + time: '2022', + content: "PCV15 is licensed for use in children in the US", + reference: "https://www.cdc.gov/acip/evidence-to-recommendations/pneumo-pcv15-child-etr.html" + }, + { + time: 
'2023', + content: "PCV20 is licensed for use in children in the US", + reference: "https://www.cdc.gov/acip/evidence-to-recommendations/pcv20-child-etr.html" + }, + { + time: '2024', + content: "PCV20 is licensed for use in children in Europe", + reference: "https://www.ema.europa.eu/en/medicines/human/EPAR/prevenar-20" + }, + ] + }, + { + type: 'md', + content: '###### The above timeline is based on the [curation](https://pneumococcalcapsules.github.io/serotypes/) of Chessley B. Blacklock, Daniel M. Weinberger, Stephanie Perniciaro, and Anne L. Wyllie at the Yale School of Public Health' + }, + ] + } + ] +} + +export default content diff --git a/src/content/vaccineInformationContent.js b/src/content/vaccineInformationContent.js new file mode 100644 index 0000000..172dee7 --- /dev/null +++ b/src/content/vaccineInformationContent.js @@ -0,0 +1,19 @@ +const content = { + title: 'Vaccine Information', + sections: [ + { + content: [ + { + type: 'md', + content: '![Current PCV formulations](img/PCV_formulation.png)' + }, + { + type: 'md', + content: '###### The table above shows the serotypes covered by different pneumococcal vaccines. A blue block in the table indicates the serotype of its column is covered by that vaccine of its row. The shade of the colour represents how frequently that serotype is being covered across all vaccines. The darker the colour, the more frequently the serotype is being covered.' + }, + ] + } + ] +} + +export default content