Skip to content
Snippets Groups Projects
Commit f1c3439c authored by Simeon's avatar Simeon
Browse files

Working minimal test

parent fc911927
Branches
No related tags found
No related merge requests found
Showing
with 261737 additions and 10 deletions
.Rhistory
.nextflow.log
Source diff could not be displayed: it is too large. Options to address this: view the blob.
Source diff could not be displayed: it is too large. Options to address this: view the blob.
/home/nibio/Documents/Git/DivGene-genome-annotation/work/85/b8dd0ed5e01210eb04be69f4e0a434/MidP1831_erik_interpro.gff3
\ No newline at end of file
/home/nibio/Documents/Git/DivGene-genome-annotation/work/85/b8dd0ed5e01210eb04be69f4e0a434/MidP1831_erik_interpro.json
\ No newline at end of file
/home/nibio/Documents/Git/DivGene-genome-annotation/work/85/b8dd0ed5e01210eb04be69f4e0a434/MidP1831_erik_interpro.tsv
\ No newline at end of file
/home/nibio/Documents/Git/DivGene-genome-annotation/work/85/b8dd0ed5e01210eb04be69f4e0a434/MidP1831_erik_interpro.xml
\ No newline at end of file
/home/nibio/Documents/Git/DivGene-genome-annotation/work/e7/a068fcec054038bf87119d1ee6337f/MidP1831_erik_protein.fa
\ No newline at end of file
/home/nibio/Documents/Git/DivGene-genome-annotation/work/70/b78113120a64510c00c77fa6634cdb/fixed.gff
\ No newline at end of file
Submit-block ::= {
contact {
contact {
name name {
last "Lysoe",
first "Erik",
middle "",
initials "",
suffix "",
title ""
},
affil std {
affil "NIBIO",
div "Molecular plant biology",
city "Aas",
country "Norway",
street "Hogskoleveien 8",
email "erik.lysoe@nibio.no",
postal-code "1432"
}
}
},
cit {
authors {
names std {
{
name name {
last "Lysoe",
first "Erik",
middle "",
initials "",
suffix "",
title ""
}
}
},
affil std {
affil "NIBIO",
div "Molecular plant biology",
city "Aas",
country "Norway",
street "Hogskoleveien 8",
postal-code "1432"
}
}
},
subtype new
}
Seqdesc ::= pub {
pub {
gen {
cit "unpublished",
authors {
names std {
{
name name {
last "Lysoe",
first "Erik",
middle "",
initials "",
suffix "",
title ""
}
}
}
},
title "MP1831 genome"
}
}
}
Seqdesc ::= user {
type str "DBLink",
data {
{
label str "BioProject",
num 1,
data strs {
"PRJNA1101761"
}
},
{
label str "BioSample",
num 1,
data strs {
"SAMN41003021"
}
}
}
}
Seqdesc ::= user {
type str "Submission",
data {
{
label str "AdditionalComment",
data str "ALT EMAIL:erik.lysoe@nibio.no"
}
}
}
Seqdesc ::= user {
type str "Submission",
data {
{
label str "AdditionalComment",
data str "Submission Title:None"
}
}
}
>contig_2213
GGCCAAACAGTGGTAATTCTTACTAAAGAATTCTTTGTAGTGTTTCCCGGGTCCGAATACCTAAACTCCAACACAGCGAT
GCGGGGGCCAACCCGCACGAAATAGTAGCCGAATGTATTGATGTGTTGGTGACTTGGAAAATTGGAAAGTGAGTGCCTTG
GGAGACCGTGAGTCTGGTGCTAACCAGCCCGTGCTCGCCAAGGTGAACCCAAAGAGAGAGAGGCAGACTGTCGTAGACAG
ACTGCTGAGAATGTACATGCAACGCACCAAAGGAAACATGCAGTTGGGCTTACTAAATCCTAATACATCTTGGTAAGGCA
ACTTGCTCACCAAGATCACAGAGCTGTACCCATTGTCCATAGAGGAATGCCGTCGGACACATGCGGGTACTTCTGTGATC
TTCACTGTCGACATCTCTCGGTTACTGAGCCCGCCGCTCAGCACCAGATCTGGATGTCTGTCAACCAGCTCGAAGTTCCA
CTGCGGTGAATCCAAGCTGGAAAACCCGGAATCCATTACAACGCTGTTCGACTGCGTTGCTGCACAAATCACAACGACAG
GTTCGACGCTGGGCCGTCAAACTGACACATCTGAAGTTCCGACGTGTGCGAAGGATATTCGAATGAAGTATGGCGCTGGA
GCAAAGCCAAACACTTCGTCGTCGTATCTTTCGTACTCCTGCAGTAGCTTATTCTGTTCGGTATAGGAGAATGATCGGAT
TTTGGTCACGACTTCTCCGTCATACAATAGAGAGTCCTCTGAGCACGCCATGGAAGACGCTCGAGCGCGGACAAGGTCGC
TATTCAGACCCGCAAGAATGACGTTGTCGTATGTAGAGCAGCTAACGGAAGGAGCTATACGAGAACCCATGTTGTCGCGA
TCATCGTCGCTGAGGGATGATTCAGCTTGTTTAAAGGAATGTAGCAAGCATTCCAGTGGCTTCGGAAGCGACAGGAAGCC
GAAATGTGTAAAATCGTTGTCCTTATGGGGATCTCGCCTCGTTTTCCACGACGAGCGCTGCTACAGATATTTCCACATTT
ATCGCCAGGTTTACGAACGGTGCGAGCTCCATTATCTATGGGGTGAGCTATGGAACGGTGCTGGTTGAGCGTTTGATGCA
CTTAAGCCCGCCAAGTGTGGTTGGATACGTTCTAGATGGCATTGCTACCACTTCAGGAGCCTCGGGTAACGAATTCCAGT
ACTTCGACGCTGACTTTGGCAAAGTGGGCGATCACTTCATGGAACTATGTGCGCTAGACGTTGCATGCAATACGCATTTC
AAGGCAACGAGTCTCTCTGAAACACTTCAGCATGTTATAACGCGAATGGATAACGACCCCAACTCAACGTGTGCTTCCTT
AATGAGCATGTTGGGTGACGCTCCACCATCACTTGAGCTACGATCGACTCTAGGTCTACTCGTGAAGGATTCAACAGCGC
GAGTGCTTGTTCCACCGCTGATCTACAGACTTAACCGCTGCGATGCCAACGATGTGGACACCCTGACCCAACTGCTCACC
GCTGTAAACACCTTCGAATTGGGTACAAGCCAGGACGATGCCCTCCAATCGACATTGCTGTACTATCTCATCATCTTCTC
AGAAATGTGGGAGACGCCAGCTCCTACCAGCTCCGAAATGGATTCGCGATTTTCCCATGCAAGTATGGCGGATGGAGTAT
ATCAATACAATTCGCTGTATTGCGCTTTCTCGAAAGAGAAGTCTCCAGCATGCGACGGGTTAAACGTCAGCAACTACGAA
GGCGAAGGAATCATTTACCAGCGTGACCAGTACTGGAACAAGAGCGCTTCAGTACCCACTAAGGCCAGTGGCTGCTCATG
AGTGGGAAACTCGATCCGGTGACGCCTAACAAATACGCAGAGTATCTGGTCGATTCTCTTGCCGGCTCGAACAAAGAGCT
CGTCACATTCGATTACGCTACCCACGGTACTCTAATGTTCACCCCGTTTAAGGATAAGAGTGGGGTCATTCGAAACTGTG
GCATGGAACTACTGGTATCCTATGTCAGCAATAATGGTAACCTCAAGCGTTTGGACCGGTCATGCATGAATGAAATGCCC
GCCTTCAATTTGGAGGTGCCAATTGAGTATGCGCAACACTTTTTCGGTACCGAGAACGCGTACGACGGTGTCTACAACGC
TAGCTTAGCGCAAGCCGCTTAAACGAGACAACGAAGGTAAGAATTCATAACAAGAAACTGCCATTTAGAAACCATTTTCA
CTTGGAGAGCTCGAAGCTTTGGGGCCGGTTCAAGTCAAAACAGAAAAACAAATATGGTCCCCGTACAATGAATGTACTGC
AATATTACTAACTACACCACCTAGCGCGCCCCACCTTTTATTCGTGACTCGCATCAGCCGGCATCGTTTAAGAATTCAAG
CCGCTGCCATGAAATTCCCCACTTCTCTCTTCACTCGAGTGGAATTGCCGAGCGATTTCACCTGTGACAAAGGTCGAACG
CTCCCCATCGTCGGAATCTTTGAGCCTCCAGGACGCTCTCGTACGTTAAAGTCAAAGTCTTCTGGTCCTTCCTGCTGCAT
CTGTCGCAATCTCTCTTGAAATCGCTCCTCTTCTGCAAACTCTCGAATCTTCTCAATCGCATCTGACAGCTTCATACGCT
CAGACGGTTCAAAAGCACACATCTTCTCCACCAATTCCCACTCAGCGTCATTACTAAACGCCTTTGGACGAAGCAAGAAC
TTCCTGCGGGTCACATGAAACTTCACGACTGGGTCTGGTACGTGCTGACCCCACGGCACGTCGCCCGTCACCGCCTCCAC
AATGCACATACCGAATGAATACACGTCCGAAACCACATTAGGAGCCACAGGGCTGTCCTTGCGGATCACCTCGGGCGCTT
TCCATCGAATCGCGCCAACCGTTTTCTCATCTTCGCTCTGCTCGGTCGTCAAGAAGCTCAGTCCGAAATCCGTCAGCATA
GCCACACCGTCCCTGCTCACTAAGATCTGGTTACACTTGAGATCTGTATGCACAATGTGTCGTTCATGCAAGAAGTGCAG
ACCGAGAGCAGCGTCCAACAACTTCCGCCAGACCAGAGATCGTCCCTCTTGTCTTGCGTGGTACAGATAGTCGAGTAATT
TGCCATTCTTGGCCTCTTCACACACGAAGAAATACGTCGCGCCTTCGTCACAAGCTCCGAAGAATGGCACGATGTTCGGG
TGTCTGGCTTTTTGCCAGATACGCGCTTCTCGATGGAAGGTGCGAGTTTCTTGTTCAGTGGCTACAGTGACCGTCTTGAC
GACGACGCGAGTACTCAACCACCAGCCTCGGTACACTTTCCCGAACGATCCTGCAGAAAAAGGTTCCTGATCCTTCCGCA
CCTCGCGACTCGGGATGAACCAATCCGGTTTCGTTAGCCTCGTGGCAACAGTGTTTGATATCCCGCTCGCTTCACTTGTA
TGAGCGCAAAATTCGCCAGACCTCGTACCTGCAATTGATACGAGCCAATTCAGCTGCTGTTCGCCCCGAGCTGCTGACAA
TCTCGGCGTCTGCATTGCTGTCCAGTAGCAGCCGAACGATCTCGTCGTGTCCTCTGTAAGCAGCTTTCATCAACGGTGTT
TGGATGTCCACATCCACTACGTTCACGTCCGCATGATGCTCCAAAAGCAGCCGGACGATCTCCAAATGCCCTTCTTCGGC
AGCGTACATCAGAGCTGTCCGCTGTTCACTTGTTCGTGCATCTACAGTAGCACTTTCCTCAACAAAGAGAGTGACAATAC
CCCCATAGCCACGCTGAGAAGCCACCGTCAGTGGCGACCACCCCATCACATTGACTGCGTTCACATCAGCTCTATGCTCC
AGCAGCAACCGTGCTATCTCGAGACGTCCGTGCAGAACAGCTTCATGGAGCACGAAATCTCCGTCGCTGTCTGCAGTGTT
GCTCGTCCCACCTCTAGCCAATAAAAGCCGCACTAGCTCCAGATGACCTTTAAATACTGCGCTTTGCAAGGCCGAGCAAT
TGTTTCTGCCAGCCAAGTTGACGTCCGCGCCGCAATCTAACAGCAAGCGAGCACACTTGACGCTATCTGCATAACCGACT
AAGCGCAGCGCAGTCTCCCCGCTATGAGTCTTGGCGTCTACAGCTGCACCAGCGCTTAACAGCAACTCCACCACCTCCAC
ATACTGACACTGGACTGCCAGCATCAACGGCGTTTTACCGGACGAGTCTGCCAAGTCTACATTCGCGCCGTGTTTCAGTA
AAACACGGATCGTTTCTGTCTTTCCGAAGAGCGCTGCCATCATGACGGCAGACGACCCATCGTCCAACGTGGCGTCAACG
GCAGCTCCATACTCAATCAGAACCTCGATAACTTCGGGGTGCAGCCGTGCTGAGAATTGTCAATCCGCCAAAAAACAAAA
CGTTCTTGACACGTCAGCCCCTTTCTTCAATAGGAGACGTACAAGCTCTACAAGACCGCTGCCAGCAGCAGCTTCGAGAG
CAGAAATTCTTTTTTCTTGTAGATTGTCAACGACTGCTCCATTGTCGAGCAATAGACGAGCAATGTCCACATAGCCTAGA
GAACAGCTCGCGGCAAGAGGCATGCTGCCGTCAGGGGTCAAGTGGTCAATGTCCGCTCCGTTTTCTAATACAAGACGCAC
ACATTCGATATGGTCGTTTAGTGCAGCGTAGTTGAGAGCAGTGTACCCGTCGTTATCGGTCTTGTCAACGCTGGCTCCCT
TCTCTATCAGCAGACGCGCTGTCTCGACGTGACCGGATGATACTGCAGCAATGAGCGGTGTTGATCCCTCGCTATCTGCT
GCATTAATCATAGCTCCTCTCTTTAGGAGAAGACGTGCCACCTCCACATGGCCGTGTTCAGCAGCGTATATCAGTGCCGT
AGCACCTTTGCAGCTTTTAAAATCGACCTCAGCTCCGTTTATCAACAGCAGACCCACTGTCTCAGTGTATCCTCTCTCTG
CAGCCAGAATCAAAGGCGTGGATCCTAGATGCGCCGCCATGTTGACGTCAGCTCCTCTCCTTAACAACTGTCGGACAGCA
TCTACATTGCCTTTGATAGAGGCATACATGAGCGCTGTGTATGTAGTCAGTTGGGGTTTTCTTCTTGATGTCGGACCCAC
CATCTAGCAAGACGCCAACAACTTCGTCATAGCCATACCCAGCAGCCTGCATTAAAGGTGTCAATCCCTCCTCTGCAGCT
ACATCTACGACAGCTCCCTCCTCCAATAGAAGCTTAACTACGTCCAAATGTCCGTTTGTAGCAGCCCACGTAAGCGCAGT
ACCGCCAGTATCATTTGTGGCATGGATATCGGCTCCTTGGTCCAGTAAGAGCCTCACAACATCCACTTGACCACGTAAAG
CAGCATACAGAAGTGGCGTGTACCCGTCGTTGGTGGCCAAGTCTACAGTAGCCCCCTGTTCCACTAGAAGCTCAACTACT
TTAACGTAGCCACATTCTGCAGCCCACAAAAGAGCAGTAGACCCAAATTGGTTGGTTCGGTTAATGTCTGCCCCGTGCTG
TAGTAGCATCTGCACGACTTTAAGTTGCCCACTTTTGGCTGCACAGATCAACGCGGTGTTCCCATCTTTACCCTTTTGCT
CAACGTCGTCCTTATTTTCAAATAGGCTTTGGACAATCTCCACATGGCCCTCAGTAGCTGCGATGATCAGTGGAGTGTCT
CCTTCTGGGTCGGATTTATTGATATCTGCCCCCTTTTCCACTAAAAGCTGGACGAGTTGCGTGTGGCTTATACGGTACTC
GGAAAGGAGAGCGGTGAGACGATGGACGTCGATGCAGTTGATCTTGGTCGTGTCGGCGTCTTCATCACTAGCAGCAGCGA
CCCGAGACTTGAGAGACGCGGTGGTGGTCATGCTTGCTATGGAGCTCAAATCTTTACCGCCTTCAACAACGAAGAACAAC
ATTTTTTTTTTTTTGTACCCATCAGTACTTATCCTGTCCTTATCCTCCTTTCGACAGCATAAAATGACCTTATCCTACTT
TCTACAGTATATAATGACATTTTTGTAAAGGAAGCGTACGCTGTGATTGGCCAAAACCGAACCTTGTGAGCTCAATTATC
TGCCAATCCCACCAAACATTCTCAAGCTGTAGTACAGATACGCGGACCAGAATTGAGAAGTACGGCCATTTAACCAGCTC
CCCTGTCCCTGCATCGTGTTCACGGCGCTAACTGAAGCGTGCTTACTACTCATACACATGCATGCTCCCAAAGGGTCGTA
CTGGAATCGGTTGCGGTGGCTTCTGCGGTTTCAGAGCCCCGGGATTCTCGAACTGCATCCGTGGGGTCTCCTGGCTGCTC
TACTGCGATCTCCCAGTCGGCTGTTAGACGGCGTGACGGCCTCACATCATCGATATTTAGACCGCGCTGCGGCTGCAGTG
ACGCAGAACCCAGTGCTGTTCCCGAATGGGTTTTTCTCGGATGGGTGGGGAGATCTCAACACCCCAAAACGAATCCGAGA
ACTACTACAGAGTCGACGCATGAGTGACGTTGTGTCACTAAGAGACGGAGAACCGAATTGGAGCAGCGTCAGGAAGCTGT
CGGTGGCTAAAGTGGCGTTGCGAGAGGGCAAATTCAGCAGCTCATTGGACAATGCGCAACAGTTGCTACCCGCAGAGAGT
CAGGACGCTTTTTGTGAACTAGTGACGCCGCTGGAGTGGGAACGAGAAGATCAGCGTATTCCACAAGGGAGACAGGACCG
ACCTCTTGTGGGTAAGTGGATTTCTAAATTTTATCGAAAGAACAGTGGTGAATAACCATGTGGAGTGACGTAGTGCTTCT
ACCGGGGACGGGGGAGCACGGATTTCTACATCGGAGAGCGTCCATTGCTATCCCACTAGCCAAAAGGGGAGTAGCCACTT
TGGTACGTTGAATTAACAAGGTTTATTATCATTGAAGTACTAATTATTGGACACTTGCTGCAGATTCTGGAAGGACCTTT
TTACGGGAAGCGCAAACCATCGAAACAGAAGGGATCCAAGCTACGCAGGTACGCTCTGCCCGTTTTTTTGTGTCGTCTAA
GGTACTGAGTAATTTTTTAATGGGTCTGGTGTTTCACAGGGTAAGCGACTTGCCCATCCTAGGTCAAGCAACCATCGAGG
AGGCCAAGTCGTTGCTGGAACACTTTCGAGATTGCCACGGGTACTCGCAATTAGTAGTTGCAGGCAGTAGCATGGGTGGA
CTACATGCTGCTATGGTCGCATCAGTGTTTCCTGGAGATGTGGGAGCTACGGCCTGGTTGGCGCCACCCTCCGCTGTGCC
TGTGTTCGCAGATGGATTGCTGTCTGGATCTTGCAACTGGCGATCGCTATACAAGCAGCACGAACTTCAAATGCTTGATA
AAATGCTGACCGGTCATGCAGCTGCTGAATCTTACGAAAAGCTGCTCGGTGCTGCAGTTGACGACGAAAAAGAACGAGCT
GAATGCTCTGAATTGGAGCTGGATCCGGTCCAAGAAGCCAAGAAGCGCATGAGACTCTTCCTCTCGATCACCGATATTGA
CAATTTCTTACCTCCACGAAAATCCGATGCTGTTGTGTTCGTGTATGGAACTGAAGACGAATATATCGGCTTCACTGAAC
CGCAGTGGCAGGTAGTGTGCATCCATTTTCACGCGCATTCTTGCATTTAGAAGTTCTTACGGCTCGGTTATTTTTTTTTA
ATATTTTTCAGCGTATGCGTGAGCAGTGGAGACCAGCTCACATTAGAACTATCAAAACGGGTCATGTCAGTGGGATTTTA
CTGGAGCAAGAAGCCTACCGCAAGACGATATTGGAGGTTGTGGATCTTTTGAAGAAGCGAGAGACAACAGCAGACCTATC
GTCAGGAATCGCTGTTGGATCTGCGTGAAATGTTCTTTATAAATATTTCAACAGATCAGAAAATATCTGCATCGTGCACA
GCTACCGTGACCGAATGAAGATCAGGTGCTTGTGATCAACTATCGCATTCAGCTACTGTGACACTGTTACTAGCATACTG
TGCTTGTATCTATTACATGTATACATGTAGTACACTGGAAAGTGTACTGCCGACCTGTCTCTGTTGAGTGTTGTACGAAT
GTTATCCCAGGTTACGCTTACTAGCTTAAAAAAAGTGCTTTCGCTAAAGATAGCTATTTCAGATAATATTTACCTGGAAA
ACAGGCTTTAGTACAAATCGCAAAAGCTAAGCGTCTTTTGCGTACCGGTATTCGAAGTTAAATATCCGAGAGGATATACT
GGGAATTCCGAAGTATGAGGGATGGACAGCCCCAGCGGATTAATGTAACGGTACTTATGAGTTTGTAGGTTTGGCGCCGT
CTCAAATAAACTTGATTTTTGTAAAGCATGAGAGTGTTTACTACACTCCGACCCGAATTAATCTCTGCAGGACTTCGTAC
CAAATCACTACCAGTAAAACGATTGCGATACTAAGGCAAAACCACAACTCTCCTGGTTTTAATTACAGAAGTAGGAAGTT
CCATAATGCCAAATAACTCAATCGTTTGTTTATTGAACTCTTCTTCTGCGCGACTTTCACAGCTAACACAAGTCAAAATT
GTCTTTCTTGCCGTCGTCGTCATCGTCTCCCTCTTCATCGCTTTCGTCTTCTTCCTCGCCGTGCCCAGCTCCACCTACCG
CCTTCCTCATGCCTCTCACTGTCTTCGAAGTCCTCGACATCGGCGACGATCTTGACGTTCGTAAGAGGCGATTCTGAGTA
TCTCCATCAAGCGGTTGAAAAAGCTGTGGTGATCCTATGTGCAAGACGCCAGCTTGATTGTCGGTCACAGCGGCAGATAT
CGCGATTCCGTTTCCAAGGAGGGCAGCTGCAGCAGAAACCACGAGAACAAAAGGTAGGCGCATATTTTTGTTGCTGGAAG
TGGGTGTTGCAGCGGAGAAAGTAAACTGAGGAATAGCAATGCACATGCTTGGGCACGATCGGCAAATCGACCGAGAATAT
TATCCTACACGAAGGGCGAATTTTTAGGACGATGGGCACACAAATACATGTATCTAAATTTTTAAACCATTTGTGTATTG
GTTATTTTCAATCTGGCATCTTAAGTTGATATTTACAAAACAAACCTGTTTTGTTGATCATTCTCTTATTAATAGGCACA
GCTGGCCGACCACGTAATTTGTAGATCGGAAAATATCCCGTTAAACCACGTGCTTCGGGCTGAGTTCGCAGAACATCTCG
TACCTGCTGAAGTATTGGCCTTCCGAGAATGTGCTACACCGTGGCTACGTATCTCTTGCATAGGCTAGTCGTTGACGGCA
ATTTAGCTGCGAACGAGCAGGTATTGGAAAGCTCAGCTCAACAAGTGTCTCGTTAGTTAACAAAAAATCGAAGTTACGGT
ATTGTACCGATACTATATTGTCCGCTAAAAATTTCTTTTCAGAATAACAACGGATGCTATTCAATTATGCCTGCCGTTAC
TTGACGGAAGCTCTAGTTTATGTCGCAGTTTCATATAACATGTGCTACCTAATTCGTAGGCTTACTCAAGAACTACCCGA
CGCATAAAAAAAACAGCTGGACCTCGTCAGCTTCTAAACAAGTACTGTACATTGTATACAGTGTACGCCCTACTGACTTT
AAACTGACAATGACGCGTTCGTAATCTACAAAGTTGGGCATAATCCGCGTGACTTGCTCCTTGGAGTGATCCAATGGAGA
CTATGTTTTATAGTACTAACGCTATAATTGACAGTTGAAGGCTTACAGTAGTTAATGTGGTGGTGTACTTCTCCGTGCTC
TTATTTTTTAACTCACCCTCCTCCACTAAAGTCTCTCATTACTCAAGCACCATGCGCAAGACGTTTCTCCTTCTGATTGT
TACCCTCCTCGGTAACGGAAGTACCATATCTGCAACCACGACCGGAAACCAAGCTGCCATCTCTACCCTGGAATCGCCAG
TTCTGCTCACTCACGATACTCAAAAGCGTTTTCTGCGGAGCCACAGCGAAGCGGAAGAAGGCAGTGAAGAAGACGAATTT
GGAAACGCTGAAGAGAGAAAAGTAGGGGCGAACCTTTTCGCGGATTCGAAGCTCGCGCAAATGTTGAACTCTCGTAAAAC
GTTCCCGAGGTTTGCGAGGTGGAAACGCGAAGGGTTCATCCCCAGCACTCTTAGAACGAAACTAGAGAAACTTGGTCTCT
GGACAAAATACAGTGGCCTCCACACGATGTACTCAAACAACTACTACGTACACCATCGAGAAGGCCAAACCGTCAAAGTA
CGCGTAGATCTGGCGATAATCCACTCGAGGAGAAATACAAATGGAGGGTCTTAATCGATTGTTAAGTATTCACGTAGTTT
TTGACCTATTCTACAAGCAGGGATCATTAAACAGTTCTCCACACAGCTTCATGAATGTAGATAGCTTGCTAATAATTCAA
AAGTATTTGACATCTCAGCATTCTTTGTACCATGTTGGTATGAAGTTCACTCGTGAGGACAGCACACGATGGTATCTTAC
TTCGTGCTCATGACAATGCGAAGCTCGCCACGTGAAAGGTTCTGAAGCCACATGATCTCTTCGATGTGGCGTTCTCCATG
GAAATAAACGCATACTGAAGCAGGTCATAAACTCCCCATCTTCACCGTCACAGCATCCATTAGAGTTGAAGACAATTTCA
CACCCGTTTAGCACCACATGTGCGCTCCCGACTCTTCCAGTACATGGAATACTCGCTTGAGGTCATTATTCGCTAGTACA
CTTTTCCCTAACGAAACACCGATTAGCGTTTGCGACCACCGTCAACGATCCGCCTTCCCGTTAAGATGCAGGTGCATCAG
CACTCGATGCACTATTAGCTTCCGCGTTACTCGTAAAACTACTGCCACTGCTTGTTCGTGTGGCCACCGCTGCACTTGGA
GCATCTCCACCCTGTAAACAGTAGTGGCTGCGGCAAATGCGGTAACTAACTTTTGCCAATTAAAATATCTATCTTAGAAA
GATGAATACTAATCTATTAGAAATGAATTTTCTTTAATTTCGAAAAAAAATAAACTACTTCATCCCCTGTTTTCTAAAAG
GGTTGGGTTTGTGAAACGTCTGAGATACGGTGACTGCGTAATTTATGCTGCACATGTTTGTGTCATGTACAAACATGGGC
AATCATATTCACAGTTCGGCTTAAGAATGGCACCACAATCGCTGCATCGGAAGCGTGAGTCACCATTATATGGTATGGCC
AAGCTACTTGTTGTCATGGCCTAAGTCATGCAGCCATGCCAGAGTATTCACACAACTAAAAAAAATAACATGCATGACAT
GGAGAAGAAGTGAAAGGTGCGGCTATTCAGCAACAGTCTCCACTCTTCGCGTCGCTAAAGTCCACAATTGTTTTCAGAAG
ATCCTATAGCCGGCGCAACAGCCCTGTCTCCGTATAGTCTCTTCATGCCGGCTACTGATAGCATTCCCCGTGTGCTGAAG
GCAAAATATCCAGGGACGGAAAATTTCGCTACAGAGGTGTAGCGAAGCACGATCTGGTGTGTGACGGGGTCACGCCGCAT
CTTGCACAGAGGAAGTGGTTAAGGGCATATACTACCTGAGTGAACGTTAGCTCACGTGTTCCCGGCCTCAAAGGGAACGG
TTTGCTACTTAGAAGAGTAGATGTAAGATGGATGAATTTGTAAGTAAGCTAAGCTTGGGCTCTTTACAAACTGGAGCTTA
CCTATAGTGGAGCTATGTAGTCATGCTCTGACTGGCTCCTAGAGCACCTGGTACCGTGTGCCAGGTGTCCACAAGACTCT
TTTTTTAGCCTGGGACACACTGGACTGTACCCGTTACATACTTCCCCACTTTACTGAGAATCGCCTGATTCTCCAATCAC
AACTGATTCTCCAATCAGAAGTGAGAGAATTAAAACACCCAAAGGTGAATTCTCACACTGAGTAGCCACGAGACTGGCTC
GGCTGTCATTCACACCCACAGTGCCTTTTCTTCCTTAAGCTCACTGGGATTTGCATCCCTATGCTCACAACTGTGTTGGC
CGCAAAGACTACGCTCAGAGCTGCCTTAGCTCCTGCGCTGGCCCGCGTACGGTGCTTTGGCACAGGATGCAATGGCATCC
AAACGTGTGACATTCGCCCACTGCTCGCACCAGAGGGCACGACAGTCCTCGCGAACGCGGCCGGAGCATGGTGTCTCGTC
GCGAGGGACGACCCCGAGAAGGGCAACACCTGCACCAGCACTAGGGGGAGCTCTCAGCTCACCTGGGGCCATTCCTTTGT
CTCCCGCAAGGATGGATCCTTGCGGGCGGAGCTTTTGCCTCGCTCTCTTCGTGTCTTGGCCGTCATTCCAACGGCGCGTA
GGTGTCCTTCATCGACACCGTGTACCGTGATGGTACTCAGTCGAGATGCAGGTGTCTCCCATCGACACCATGTACCTTCC
GCTACTAACCTTTGGTGCGACACGCCCACCACAAGGTTGCCATGTTTGGCGGCAACAGCTTCTGCGGTGCTGTCGCCTGA
ACTGATTCATGGCCAGTGCTCGCATCATGCACGATGCATGTGCAAGCACAGTGTACATGTCCATGGGCCCGTACACGAGA
AACGCTGTGTACGACAAGTACCACAGATACCAGAAGTGCACCGTCATGTTTGTCATGCACGACGAGTTCATTACGCGGAA
CTCCCGACAGGCCGCTCCACAGCAGCCTGTGCCGATGCACGGTACGTGCGCTGACTCACAGCGCATACGCTCAAAACAAC
ATCGGGTCGTGGTATGGCGCAGACCATTTGCACCCATGCCAGTGTCTGTCATAGACACCATGTACCTTGATGGTACTCGA
CCGTGGTGGGGTGTATCTCACCACCATGTCACTGCGGCGTTGGTGTCTGGCATTGACACCGAGTACCCATGCGGTACCGA
ACCATGGTGAGGCAAGCAGCCATCACCACGGTGTGATGCTCGGCGCGGCACCAGTTACGACTGCGTGCGTTGCCTCGACC
ACCACCTCGTCAGTTGTGTGTGCACTCATGCACCACACTTGGGTTATAGGGTCCACGGTCCATTCTACCCGCCGCGTTGC
GTATATTACGTACTACAACCGCTTTGTCAGCGGGTGAGACTTTTCGTTCACCCTGCTCGACATTCATGACCAAGGGATCT
ACGCGGTGATTGCACCACGTCCATGCTTTGCCTCGTGTGTGGTTGATTGCAACACAACACTGCTAATTCGCTCAGCGATT
CCGAGGCAACTAGCGCCAGTGGATTCCGTCGCTACGCTGGCTTGTTTGGCTCGAGCTATCGCAGCTCTAGCCCGTCTGTA
TGCCTCTAGCCTGCGGTCGATGTAAATCGACGCCTGTTTCCGTAAGAAGCTTGGTGTTACCTCAAGACCAGGGACGAAAT
GTATTTCTGAGCCTCTCTCTCACTTAAACTTGGGATTATTGAGTCTCTCGTGGCTTGTGATAGCCACTGGAAGCACGACG
GCTACTTCGCTCATGCAAAGCAAGGGAGGAAAGATATTCCCGACCCCATCCCCACTTAACCTTGAGACTATAGAGTCTCT
CGCGGCTCGTGATAGCCACTGGCAAGCACGACGGCTCTCCGCCTCGTTCACTGCGCTGGTATGAACGCCTGCGTCAGCCG
TGCCAACCAAAGACATCCAGCCTTTGCGTCAGCAGTTTAAGTCTGTGTGACTCAACGTCGAGCGAGCTGCTCATGTCTGG
CGAGGCCAAGACAGCCTCGCGTCTAGCGCCAATGACTCTGTGTATGATACTATGTTACCCGCCTTGGTTGTGGAACTCTG
TTACCCACATTGGTTGCGGAACTGGCGTTACCCGCCTTCGTTGTATGGAACTATGATATCCACCTTGGTTGCAGCGCTGT
GCTACCCGCCTTGATGTGTGGAGCTATGTTACCCACACCGGAAGCGCATACAGCGACTTCCTTATCAGTTATGGTCTGAG
TGACCTTGCGTGGAACTCTGCTACCCACGCTCGGAGCACCGAATGTCGGTCTCCTTAAGCAGTTTCGATGCTTGCGGAAC
TTGTTATCCGCAATGTGGACCTATGTTTCTCACCTGGTGAATACCCTTCGGCACCACCACTGTCGAAGCCCGTACAGCGC
GAGGAACTTCGGCGTTGGACGCTGCAGGTGTAGCAGGTCACACGCCGGGCAAAAGATTCATACCAGTGGCGTTACAGCGG
AACATGTTCTTGTTGTACGAAACGCTGTCGGCGCTGACAGCTCCGTGACGCTTCTGCGTCCGGGCGGTCTGTATTAGACG
CCCAAGTCATGACGGAGGTGGGAACATGACTCAGCAATGCTCCGTCATATGCTTGGACGGGCAGGTCCTTCCAAGCCTTG
CCACACGAAAGTCCGGGCTGTGCCTTATGTTCGGCACAGCCATGTTGTTTATGGCGAGAACTGCGAGCGACACCGCGGTG
CGTGAGTTCATTGAGCCCCAATGTTCAGGTCCGTTAAGGACCGTTGATACTTCCTTCACCGTACCAAAGAGCAGTCCCCT
AAGATCAACCCACGACCGGCAGTCTGCCAAAGAGTGCAGTCGGATGTCGCTACGCCAAGCGACGTTCCGGCGACGTATCA
GCGCCCCAGAACTCATCAAACGTTCGAAGGGTACCGTACACCCGTACACCGAGTGTACTACCAGCAGCCCATCAGTGCCC
TTCACTGGTTTGAGAGTACCACGTCTTTTTGGGCTAAGCCACTTGGTGTGCACAGCCTGCGCACCCATCACAAAGGCTTC
GCGCTCTTCAATAGAGAATACCGCATCTACAGGTGGCCGGGGAGTCTTCAACCACCGGTCCATGGCCTACGCCATCGGAC
CTTGGGCTCACGGGCTGGCTTCTTCCCGAGGACTGGCGAGGACATACCCGCTGGTAGTGTACATGTCCGCCGCATCCGTA
GCAGCGAACGAAGCTCTCGGCTGAGCTTAAGGCCTTGGTCCCGGGCTCGCTGTGCACACTAGTATCAACGGGCTGCGTAG
CAGCAGGAGCAATAGCGTCATTGCTGCGATGCCCGCCTCACGAGGAACGCCATCCTTATCGTGGCGATGTTCCTCTCCCC
GAGAAGTACCAGCCTGCTTGTGGTTGTACCCTTCTTGAAGGGCGATTCGAACCTCCTCCTCCATAGCTGTCGCTAGCACC
CGAAATAGCTGGGTGCGAGCAGGACTCACCTTCAGGCTGTTCATGAAGACTGTTGTCTTGATGTCTTCAGGCAGAGGATA
CCTGCCAGAGAATCCACCAACGTGCGCATCTCTTACACGTACGCCTGCAGCTCACGTTTACCTTGCTTACACGCGAGAAA
GCGTGAGCGCTGGCGGAATTCGTTGTTTGACGGTAGGAACGCGGCTCGAAGCTGTTCACACAGCTGAGATCAGAATGCAT
AACATCCAGGAGATGTCGTCTCCCTGGTGGATGTCCAGTGCTTGGCACGTCCACCAAGGTTCGACAGGGCAAACGCCACC
CGAAGTAGCTCGTCCGAGATGATACCCACCTTCATGGCAATCTCCACCCCACGGAACCAGAAGTGAAGGTTCTCCTCTTC
CTATCTCTCAAAATCGTAGGCCTGACAGAGCGTTTCCACCGCTCATGGAAAGCCTGTGAACGGATAATATCATACATCAA
CCGTGACTTTGTCACTGGCAATTGTCAGTTGCTACGCTCTGATCAAGAAGCAATAGTGCGAGTACGTGTATCCATCATTC
CTACCACTAGTTGCTGGCATCTCTGTTTTTGTCAGATTCGCTGTGAGCAGCCGACAATGAAGAATCGGCTACGGCTTACA
GGCTGATAATTCCCAGACGGTATCCGTATATATTATGGATACAGTACCTACTGGGTTATCTGCTTCACTCATCGTATTTT
CACGGCCTTGCACATTAGAAACATTATTGCCTGCCATTCAAACTGGTATTGAATTATTCGTGCAACATTTAATATTACAA
TATGCGTACTTAACCACGAGGGCGACGGTACATGTAACCTTTGTATAGCTAATGAACTAAATTCGGGTATAAATTTCCAA
GTCCATCACTGTGCATCCTCACACTTTATCTGTATTAACGCCTACTCGGATAGCCTATAATATTACGGAAATTGAAACGC
CACCCGAATCCCCCTTAACTCTGAAAACCAATTCAGAGAAGTGCACAGTCGTCTGTAGACCTGTCGAATCTAAGGCCGCG
TCTGGTCATGGCTACCCCTCCAGGAGAAACCCAGCCAAAATGGAAGGAGAGACTGCAGACATAGTCTCCGAGGTGGTGTC
GGGCTTAGCAACCCCTAAAACGCAAGTAAAGCCCTTATTGTTCTGACAACCCATCATGGCGGCAGCGAGATCACAACGCA
GGCAGCATACTTCAACGAAGTCCTGATCACTATTTCCCAAATTAAATCGGAAGCAGCGCCGTCCAAAAGGACCCTAGAAT
AAACCGAAGCCTGTTCAACTCATCGCCAAACGATACCGGCCGACAGAACAAATGTCAGCGCCGCAAAGCCGCAGCATCAC
GTGCAGGGGAAAAACTAACGAGGGCCCTCCTAGAGAGGGCCCTCACACAAAACGGGCAGAGGTATTACCGGTACTGTTAT
CGGTACAGCGTTACCGTACTGTAACCGGTACAGCGTTGCCAACCAGACGAAAGGTTGTTAACATATTGAAAGGTTGTAAG
AGTACCATTACTGTGGATGGGGTTGCCGTACGCGAATGGCTGGCGTGTACAGGAGCTCAGTAGCGAGTACCACAAACCAA
GTTACCGTACAATGGAGAAGGAGAAACCCCCGCTCTTTTTAATTCCACCTCCACCTGAAGCCAACTACTCGTCTCATGAC
GAAGCAGAAGCCGCAGTACATGCATGGACCTTAAGCCACGGCTTTAATGTATCTCGACGCCGTGTACGCTACAACATCAA
ACAAGTTGAAGTGTTCAAAACACTTCAACAAAGTCTATAGAAAATTGAATAAAAAATATTATAAAAATCACAAAATAAAT
TGAATTGAGCTATTGGGTTAAGAGTGTTTGCGGCTAATGTGACTCCTCAAACTACTTTTCACTGCAAACGATTTTTGGCA
CAGATCACACGAGTAGGTTCCCTTTGCGTTCTGTAGTTGCTGCCGAATCACCCGGTGTTGTTGTCCGACTGGGTTAGATA
AGCAAAAGTAGCGATGGTTACGCATTCGATTGGAAGATGCATCAGCGTAACCAGTATTGACAGTTAAAACTTGAGGTTAA
AGCAGACATGACAATATCAGGTACCCACGAAACACCTTCAAATTGCAAGTAGCAGTGGACTCTGTAGTTGTGCTGTGAAT
AGCTTACTCCAGCGTGAAGAAGATCGCCCCGAAAAACAATGCAGTAACCAATAGGGATATCCACCAACCGGGATCGCTCC
TCGCGTGCCACAGTGTAACATCCGGCGTAAACTCTTAATTGTGTACCACTTTCGAGCGCGACGACGACACTAGCTGGAAT
GCTGCGGGGAAAACGCATCTTGACAGCTTCCACGTCGCTACTTGTGAAGTCTGCATGCGGTCCTTGCTCAGGCCCACCAG
GGCGCGAGTACAAAAATGAATAAACTTGTGCTCGAAAGTTTGCATCAACTAGTGTAACCACCTCCTCAATTTTCCTGTGG
AGCTTTTTCATCTGTGGCGAAAGACAATTTTGACGTGATTGGCTTCGGAATGTGTCGTCTTCTTCGCCACCCACCTCACG
GAAAACACTAATATATACAGATCGTCTTGCTTGTCGAAGCACACATGAAATAGTTGCTTGCGTGAGATTGAGGGGCAGCA
CTAGATAGCCGTCGGGCGGAAACTCAAGTCTTGGGTTGGAAGCCATTTGAAGACTGAAGCTGTTTTCGTTCAGATAGCAC
TTTGGAAGATCTATTTACGTCACAAGCTGTGAATTGCATCACTAACGATTTTTTTGCATCACTAACGGTCTTTTTGCATC
ACTAACGGCTGCGTCACTAACGGTCTATTTGCAGCACTAACGGTAATACCTCTGCCCGTTTTGTGTGAGGGCCCTCTCTA
GGAGGGCCCTCGTTAGTTTTTCCCACGTGCAGGCGCAGCCTTGAACAAGGTAAACGGACGAGGCTACAGCGGCTGTAGCA
CCCCAACTCATTCAAAATGCAGACGCCGAGAATCCCATACCCACTGTACATGCAAGGGTGCCCTTCACATCAGACGGCTC
CACGTTGTCCAACGCCAGGTTAGCATCTCCGACACACACCATAGCCACGGAGCCTGTCACAACTACACGACAAGCGAAGT
GATCTCTACCATCGGTTTTATCATTGTACGTGGACACGCTGGTGGCGTTTTCATCAGCGAAGGAAGGATTCATCACCCAA
ACGAAGAAGTATGTAGGCGTCCGAAACGCTTTCCTGGTTGGGAGAGTCTGTCGGGTGCTGAAACAGTCCTTGTTTCAGAT
CAACTAGCTGATCTCGCAGTTCCAAAGCCATGTCAAGACGTTAGACCTCGGCGCAGTGCAACGAGGAAACGCAAATTATT
GCTCACTACACGGACGATCTACTGAGTTGGGTTAGGGACGGTTGTGCGCAGCTGATGATGGCGAAGTTTATGTCGATGAC
GATACAGACATTTTGGGAGCGGTACTTGGAGCCGTTCGATCCTGTGACGGAGCTTACGCTTCGCTAGCAGAGGTAGAAGC
GATCAAAAACATTCGCTTTGATCCTGAAAGCCAGTGTGATGCTCCAGCAGACCTGTATCAACACTCTGACGAATCTACAG
AGACGCGATTACGGCCAGAATGCAAACATATCTTCCAGCATTGGACCTCCGCAAGTTTTTTTCGCTTACATTCCGGTCTC
GGTTTTGGCACCAGGTTATCGGTGAAACAAATGCATATGCGCGCCTACATAACGTCGCAGTCGGTAAGACCTTTTCACTT
GATGAAGTGATGACATTTTTGGGGATCTCGCTGTTTTTGTCTCTGGTTGACAAAGCAGAATACGCTAACTATTGGGGACA
CAAGTGGAGAAAACGAAATACTGGGTTAAACATCCAGCGCGCTTTATAATGTGACGACTCTGCATCGGTTTAAGGAACTG
AGGAAGGCGTTCTGCTTTCAATGCGTGGAGGCGAATTCGGATATCCAGGATCAAGCTGCAAGGATTCGTCCGTTACTGAA
CTTGCTAAAGACTACCGGATCGAAATATGTGGAAATCGGTCGCAGTGTTGCTCTGACAGAAGCAAGCGGTGCGTGTCGGT
CAAAGTATGGAAAACCACTACTTGTCTATAATCCAATGAAGCCGACAAGGGAAGTATCACTTCCGGATTTACATGTTATG
CTGTTCTTGCGATGTGATTATCGCCACTGAATCAACGAATTTGGATCGGTTGAGAACAATCAACACTAGTTTTGCCAATA
ACACGAGTCTAGTAAAAGCGCTGTTCATTGTACTGCTGTTGAACAAGCTGAATATCGGTGAATTTTCGACTGCATTGTGC
TAGTAATACCTCGGAGCGATTGGGTGGCGTTTTATCGCCGCAAGAAGAACAGGCGTTGAGCGACGAAGCTGCGGAGTTGT
CTGCGATACGGAAATGCGTACTAGAAGCGGCTCGGCCCCTGTATGGTATTTGTCGGATGATCAACACGGACAATCAGTAC
ACTTCGGTGCAATTGCTGATGGCGCTACCTTTCAAGGGTCTCTATGCTCGCAATGCTGTGCAAAAGACTAGCTCGCACTT
GCCTTGCTATGTACTTTTGAAAAACAAAATGATTACTTCCGTGGCGTCTCTCGACAAGGCGTTTCCGCCGACCACTCGCT
GGCTGCGGCGTCATGGTATGCCAGCTCTATGGTGACGGTGATATCGAACGCGAATTTATCAACCCTCACTACGGTAACGC
GTCAGGTTCGAGCTGAAAAATGAAACTATTCAGCCCCATCATGTATCAAGGAATACAATGCGAATATGCAGGGTATTGAT
CATCTTGATCATGTGTGTGCTCGGGTCTCTCTATCGGACGGCCACGCTTCCAAAACAAATGGCATATTAAGCTTGCATTA
GCTCTTATCGATGTGGCCGGAGCTAATGCATATTTGACCCGAAGACTGGCACCGGAGCTGAACAAGGCACGGAATTCTCT
TCGAGCCTTCGTAGCTGAGCTGTGCTCCGAGCCTGTTTAAGAGAAATGGAAGAAGCAGCCGAGTGAACGGCTGGTGTTCT
ACGCTTATACTGCGGTGGGCGAGGTGTTTCCGGATCGCGCGTCTCCGTCGAGCACAGTCTGGATTGCTCGACCAATTGGT
GGAATGCCATGCTCTGAAAGCCCTAAAACAAAATGCTCCGCTATTTCCTCGAAAGCAGTTCGATACAGACAGGAATCGCA
AACGCAAAAAGTGAGTTGGGTGTTGTTGGGAAGATCGCTATGGGAATAAAGTTACGGACGTCAGTCTCTGCCAGAATGTA
CGCGTCTCGATCAAGCCATACGCCTTCCCTGAAACTACCTGGACCCGTAGGGAGAAGCACCATCTTTTCTACCTACCGAA
AAAAAAACCTTCTCACAGAGAGGGATGGTGCGTACGAGCTGTGAGCTGTGCAAGCTGAAGCGCAGTCAGCGTACAACTGA
TGGTCAAGACGAGCAAATGATGGTGAAGGATTTGGCGCTACTGGCGAGACCAGAACGGTTGTAAGGTCTATCGCTCTATG
AATGTTGACAGTTATCTTGATCTACGCTTAAAAAAATTGTATTGAGTGTAATTACGTATAAGACTGGCAAGTCCCTTAAA
CAAAGTATGGAAATGTGAAAGACCAAAACATGTATTGCGTTGAATTCGTTATGTACTTATGCTTATAGTGCCTCGTACAC
AAACATTTGTTGGAGATCGGTCTTCCAGCTGCACGGTAGGTCCAACACTTTCTCCAATTTTAAAGCTTGATAGAACGGGT
TGTGACACAGGCATCAATGCCTTGCGCAGAAATTCAGAGAACTCACCGGTGTTTTTTAACAGCAACGTTTTAGAGAGCCC
TTCCTTGACGATCTCGACAACCTGTGGTTCAAACAGAATATTGTTCCAAAACACTACTGTTGCGTCGGCGTACGGTTGGG
TCGTCAAAATGCGATGTATGTCAGTCATGGCTTGGCAAACAAGTTGGGCTCGCCGGAGGGGCCGTCTAGACCCTCGTGTG
ATTTGCCATCATCTTCATTCCAAGGTTTATGAAATTACGGCGAATCTCGATCTCAATTACCTTGTTCACACTTGTCGCCA
GCGCCACTTGGGCAACCACGTTCCCCACCCTGGAACCGATATCTAGGAAGGTATCATTCCGGTCGAGTCCACCCAATTCA
CGAAGCAGTGTGGAAATTCCTCTCGGCATCAGTCACCCGGCGTTGCGATGCGACAGGTTGCTGGCGCCTTGTACAACCTC
TTCGCAAAGAATGTCAGCAAAAACGCCGCGACAGCTCGCTCGCCACTAGAAAGGGGCATTGGCGGCGATCCATCTTCCTC
AGGAAGGCCAGGAGAGCTTACAGAACGAATGCTCTCACTTAGAGAGCCCACCATGTCTTCGGCGTCGGCAGACTGGGTGA
TGGAAGTAACGTCGGGATACATTTTCACAGAACTTGTCAAAAGCAGCGTGTGGACCGTAGCCGGAGCCTCAGAGCCTCAG
GCTTGCTACATGTGTCACCGGTGGCGTTGGTGCTGGAGATTCTGCAAGCGCTGAAGGCGCTTGTGTAGCTGGGGGTACCG
TACTCGCTGACGCTTCAGTGATAGGAGGATCTTAAAATTGCTGGATGCCCCTGTGTTGCTGGAAGTACTTGATTAACGGG
AGGTACTTGGATTGATGGAGGCACGACAGACACAGGAGACGTTGGAAGTGCTTGAGTGGCTAAAGATGAGGCACCTTACT
CGCTGTAGACGGTAGCGGGTGTTGCTGGGGCCAGAACCCAACACGATCACGTTGTGAGTCAGCTGCTTGCCGCTGTAGAG
GTGGGCGTACCGCAACACTTGCACCTGGACGCTGTGGCCGCACCGAATCATCTCCAGCCGAGCTTTGTTGTTGCACCGAA
GGTCCTGTTCTGCGCTGTCGCTGTTGCGTAGTGTGAACATATTGAACCAACTGACGCGCCACCCTGGGTGGTCGACCGCG
TGGCCGTTGCACCGGCGTGAAGAAGCTTGCCCCCCCTCCCCACGTTTTTTAGCGTCCGAAGGCGCTACTGCAGTGCTCCT
CTGGCATTGTGGCCTGTATGCTGCACGCTGGGCAATATCTGCCCACGCCATTCGCGTACCTGCGTCTACATGGGCGGACG
CTAGCTGAACCATTTCTTTGTCGTCTTCTAAAGTGAACGTAGTTGTCATTGATACTGTGTCAAGAAGGCAACTGACTAAG
TATTTGTAAGGAAATTGTATAAATGGCAACTGGCTAAACTTTTGTGTGACAATTCTGTCGAAACGGACATGCAAGTAATG
GTGCGAAGATGGGGTACGTACCGCATTATGCTGGCGCATCAGCAAAATTACGTACTTAGTATGCAAAATGCTGACGCAAT
CTCAATAATTTTCGCACCTACGCGCGTATTTTACGTGGTGCGGCAACCATCACGTAAAATATGGGAGGTTGGCAACCGAC
CGGATTGGTTGTAATAAGAGAAGGTGATGGATGTGCTGGTTAAACCTCTGTCAAGTGGGTCAAAATGACCCCCGTCATAG
CCATTTGCAGCAAAGTTCTCAAAACATGCATTAACGGGGCTCTAAAGGGCTAATAACTTATCTGAGTGTGAGGTAGCTGA
ATGAACTGCGAAATCGAAGTACATGTAAAAAAAAAGCTGGGCGTATGCCGAAAGAGCAACGCTGTGCTAAAAAGACGTTG
TCGCTTGGGCCATAACGATAGATATTTTAGATGGAGCGAAACTAACTTATATGTGCTGGTAACAATTGCTACTATAAGCG
AATTGAACTCGACCTTTGTATTCTAAAAGTTGTTTAGACAGCAAAAACTGATACTACTAACCTGGCGAACGTCTCGCCGA
CAAGGGCGTAGGATAAAGTTTTAAATGGAGTGGAAAGACAACGACACAACATGCGATGCGTAAATTAAGTAGACCCCAGA
AAGAAAGGGTAATACATCTGAAGCCTAAACGACGCTTAATTACCCTGGAATCATCGCTAAAGATAAAATAAAACGCACTA
CCGTCAACAACAGCAGCAGCAAGGCGTTTTGCGACACATTATCCAAATGCTTTAATAATAAGTTTCACACAGTCGAGTAT
CTGATAACCAATTCCGAATCAGCACAAAACGAACGCTACATGCATAAAAATACTTAATTTTCAAAAACTTCAAGCTTTCA
TTGAGTTTGGTATGAGAAGTGAGTAATATTTAGTTACTACAAGGTCAAATAGGCAGTACAAGCGGGTACGTAGTGCAAGC
TGGACAGGCCCTTACTATCTTTTACGTTAATGTGAGCTAAGTTTCATAGCGGCTCAGAAATGGCCAGTAATATCGTGCAC
GACGCTAAACTAATAAAAATAATATTGTGTAGCGTTTGTATAAATGTTATTTGAAATGCAGGTGTTTTTAGGTAGAATAT
GAAGATACAGTGATAGCCAACAATGATAACGAGATTGCATCAAGAACCTTGATTCAAGATTATTAGAAAATCAGGTAGGC
ATGATGCTGACACAGATTTATGAAATTACACTAGTACAATTGTGTACGTACAGAATAGTCTACTCGTTCATTTGCAAACT
TTGTAATTACATTGCTCTGCTGGTTTTTTTGTGTGATCTGGTGTGACGGGGTCACACAGCACCTTGCGCTAGAGGAAGTT
GGCCTCCGAGTACAAACTCTCAGTGAGCGGCAGTCCACAGGTCTTTTTGCCTAAGGGAGCGAAGTGACCAATTTAAGGTA
AGTTGTAAGCTGAGTATATTTATAGGTATGCTAAGCTTGAGTTAAATATACAAACTATAAGTAACCTATAGAAAACAAAT
GTCATCAGCCAATGGTTGGCCTCGGACGACCCTGGTACTATGTACCAGATATTCCGAAGTGTGACGTGTCATACTTCATG
TACATAGGGGGTACACTTGAGGCTATGTACCCCGTTACATCCTTCTCTGCTTAGGTTCGGTTTACCGACCAATCAGAATG
AGGAAGTGTACGTCACAAACTCTCATTCTTAAAGTCGAAACCCATCGACTTGGCCGCGCGAGCGCGGCGGAGGCTCACTT
CCCAGTTAGAGCCTCGAGCAGCAGTGTGCGCGCTTCTTCTAGGTCTCCACTTCGACCGTTTACCATGCCTCGTGGCACGG
CCAAGAGCGGTGCGAGGACACGCTCCAAGGCTGCTGCCGGAAAGGCGCGAGCCAAGACCGCTAAGCCTCGCAGCAAAGGC
TCTGCACTCCTGGAGGATACTAAGGTGGCCTCGGAGGCGATCGGCTCATCTAGTGACGCGTCTGCGAGCAAGCGTGCAAG
CAAGCGCCACAGTCCGTCGCCTTAGCCGTCCGAACCCACGACTCGCTGAACGTGAGTTAAATTCGGGCAGTGAGGACGAG
GCCGAGTCCGGGAGCACTCACGATGCTCCTGTGGGCTTCGTGGAAGGGTACATTCCAGTGCCCAGCGAGCACGATGGCGA
GAGCGTGCACTCGCTCGCTAGTGATCACTGTGATCGCAGTCTCAGGACGTTTCTGGGTTCTGAGAGTCCTGCCATCTAGG
CTAAGGGCTCTCCCAAAGCTGGCGATGACGACGAAGAGAAACCTCTCAAATATCTCTCGCTCGCCGAGGGCCTTCCGCGT
GCCAAGGCTGCAAAGGCCACAGCCGAAAACGCCAAGCCCACTAAGAAGTGTACGGCTTCGAAGTCTCTACTCCGCTAGGA
GGGGGAGGCTGGGTACTCCTATCGAAACCTCTTCGGTTCCTCGGATGAAGAGGAGGAGGAGGGTGCTATTCCTGAGCCCC
GGGAGATCCATAACGGCCTCGACCAGCAGCAGGAGGACTTCGAAGCTGCTCGGCGCACGCGTGGTGGTCCGGTGGTGGCA
CCCGTTAGCCGGGGAGCTGCAATCAACTCAAGAAGTTATTGGTCTACCGAGAAAAGCTCTGGGGCTGACCTCTTCTTGAA
GATCCTCGTCGCTCCTCGTGGCCTTGTCGGCGGCGACACTTCTAAGGGCGCTCTCAAACGTGCCCTGTTCCAGAATAAAT
AGATGTATGTTGACGACTTGGAGGCGGCCCGGTGCGTGCTTCTCGCGCCGCGCCGAATCCCTCTGAAGGACTTCACGACT
TGTCGTAAGAAGCCCGAGAGCCGGGGTGGTATCTACCCTCTCTGGGGCTACTTCTGTGTTCTTTCCGAGAGCTGTCCCAA
CTGGAGTTCTTGTGCGGACATGTTCTGGGCTTGGGTGGAGTCTCTCAAGTACGCACCCTCGGAGTTACGGGAACTCCAGG
AAGATCAGCTGCTGCCCCGCATCCTGGACCAGCGAGATCTCCGTATTCGGTTTGACCACATGGTCAGCAAGTCCATGCTG
CCAAAAGACATTCTGAAGCGCGCGGCTTCTAGCGCTTACGATGAGCGCGGGTACGGAGTGTCGTCAACGTCCGTACCCCG
TTCGGCCAAGAAGGCCCGGACTATTTATGACGCTACCGCCGCTTCTATTACCAGATTGCGACAGCCTTCGGGCGGTCTAT
CAGGAGCCGCTCAATCGGCTCCCACGAGTTCTCGGAGTGGGCATAACACCTCCACTTCACGAGGAGCTGTCGCATATCGC
GACGCCGTTGCTCCTGGATAATTTGCTCCATGTGATAGTGTACTTCTCTGTTCCGGCCAAGCAGGGGTGGAGGTGCCCTC
GTACGAGTACGAGTACTCGGCGCCTCCGGAACGCGATTCTCGTCCGAGTGCTTCTCCGTCGGGACCGATGCAGGGCCCCG
TGTTTTACCGCCTTCGTCAACGCGTCATCGAGCTTGAGATTGCACTGGGCCGTGGAGTTGGCGGAGATGCTGCCGCCCAG
GCCGGGAATCAGGGCGTGCTCGCTCGTCTTGCGAGCTGCCTGGACTTGTTGACGCGGGCGGTCTCAAGCCGGCTTCTGCG
GGTCTCTTCGTCCGATCTTGACGAAACCTTCTGCATAATCCGACGTGTTGAGGCTCTACTGCCACGTCGGAGCCAATTTC
GGCGCACGCCTAGTCGTACGCGTATGGTGCGTACCCGACGTATTCGACGTACTCGGTGTATGGCTCTGGGGTCCATTCGT
ACGGGGCCTCTCCGGCGTACGGTCTCGACCGCAGCCTTGCTGTTCAGCGCGAAGATTGGGTACCTGTTCAGACGCCCTCG
TCGACGTCTGTGGCCGGCCCTCGCTTCGAGGAGTTGGGCCAAGGTGGGTCTGCGAGTCAGCAACCCCCTGCGGAACATAG
TACCGGCAAAGACGTCCAGCGTAGAGCGTCGGGTGCGTCGCCATTGACATCGGCAGGTCGATAGCGTACGACGCACCATG
CCTGTCCAGAACTGCGAACGGTCCAATAAAGCGGTGCTTCAGCTTGTTGTTGCCGACCGAGCTTACAGTGTCTAGATATA
GGCTCCTCGTGTCCAATAACACTAATTCACCCATTTTAAATACACTTAAGTTTTCTCTTCCATGTACTCCTTCTAACGCT
GTCATGGCATCGCGTACCATCGATTCCTTCTTCGCTGCGAAGGCAGGCGTGGCGGGAGTCAAATTCCCCGCACTCGACGC
CAACTTTCTGCGTTCGGGAGCCGAGCTGGAAGTGGCGTCTAGTTCATGCATATAACAAGCTGAACAACGCGACGGAGCCG
GCCCAGACACCAATCCCACCAAAGGATTGTTGTTGAACAATATGACCGGAAGCGTACTGGACAGTGCGTTGGATTTGGTA
GACGGATACTACCAGATCATGATGCGCAAAAGAGACATCCCGCTCACCGCGGTTAACACTCTAAGTGGCATGTTTTGGGA
GTGGTTCGTCATGCCGCAGCGCCTGTTTAACGCCCCGGCGACATTCAGCCGCCTGGTGACGCAACTGTTCAGGCTATTGC
GCGGCTTCGTACAAACCTACTACGACGACAGCTTCGTCCATAGTCGTGCCGAAGGAGGCAAGACGGTCATGGAGGTGCAT
TTGGGGCACCTCCGTCGAGTTTTGGACGTGATGCGAGCGAACAAAATCAACGTCAACATCGACAAGTATGTCTTCGCGTC
AACAGAGATCAAGGTTCTCGATGGCTTCGTAAGCAACGTGGCTGTTCGGGCTGACCCAGACTAGGTCAAGGCCATAGCAG
CATGGCCAGCACCCCGATCTTAAAAGGATCTTCGAACGTGGTTGGACTTGGCCAACTACCTCCACAAGTACAGTGCAGGG
TACGCGGGTCTCGCTAAGCCCTTGTCGGGCCTCCTTCAGAATGACGCCGACTGGCGCTGGGAGCAAGAGCATCAGGATGC
CTTTGACAGCAACAAGGCCAGTCTCCAAGAGGCTCCTGTCCTGGCCTTGCCGGACGAGACGAAGCCGTTCAGCGTCGTCT
GCGATGCCTCCGATTACACCATCGGGTGTGCATTGCTGCAGACTGACACGGCTGGACATGAACGAGTCATCTCGTTCCAG
TCCAGGCAGCTCAAAGCCGCCGAACGGAAGTACCCTGTACACGATAAGGAGCTTCTGGCAATGCAATATGCCCTTGTGAA
GTTTCGTGTTCACCTTCTGGGCTCCCGGCCCTTCGTGATCTACACAAACCACGCATCCTTGAGGACGTCGACCAACTCGC
CTCACCTCTCCCTAAGGATGGCGATGTGGCTGTCCTTCTTCGCGGAGTACAACTTCCGCGTCGAGTACAAGCCGGGCAAG
CTCAACGTGCTTGCGGACGCCCTCTCTCGGCGTCCTGACTACGAGTTGGCCCACATCACACGGGAGCCAACGGATCTATA
TGATAGGATACGCATGGCGTATCGGGACGATGAGGCTGTAGCGCCTATCGTCAATCTCCTCACGGCACGAGCGAGCGCGA
AGTCCGACTGGCTCTCGTCGCGACAGCGCTCACGGCTCCATCGATATGAGTTGAAGGATGGCCTCCTCTATTACCGGGTG
GAGCCCAATGAACCTCCACGGGTGGTCGTACCCAACGACGAGGATCTGAAGCTCGATATCCTCGCGGAGGCGCACGGCGC
ACCCTCCATCGGCCACTTGGGTCGCGAGAAGACCTTCCTATCGGTTTCTCAGGCCTTCTGGTGGACATACATGTACAAGT
GGGTCGCACGTTATGTGAACACATGTGTAACATGTCAACGGGTTAAACCCGCCGGGGACGCTTCGGCTCCGCTACAGAGC
TTGCCCGTCCCGGCTGACTGTTGGAAGTCGATGGGGTTTGCCTTCATCTTTGGCCTTCCCGCCGATGGACACGGCAACAC
CGGGATTTTGGTGCTCGTGTGTCGGCAGAGTATGATGTACCATCCTGCTCCAGTACCCGTTACCGTCACTGGCGAACAGA
CCGCGAGGTTGTTCGTCGATGGCGTGCTCCGCTATTACGGTCACTCGCGGTTCAAGGCCGCGTGTTGGAAAACGCTGTTT
CCTTTAATGGGAACCCGTCTCGGAAAACGCTGTTTCCTATACTACAGACTCGTCTCCCAGTAAAGGAAACAGCGTTTTCC
AACACGCGGCCTGAACCGCGAGTCTTCGTCCGAGACAATTGTCTCAACTGGAAGCTGCGTCGACCACGTACGTGTGTGCG
CGGAAGCCCCACGTACGTGGTCGACGCAGCTTCCAGTTGTTAAAACTGCGCTCATCAACGCGGTGCACGCGTTCGCAGGG
TTCACGCCGTTTTACCGGAATGGCTTCCCTCACCCCAGAGGACCTCTCACTCTTCGAGGAGACACTGCATCCTCTATGCT
AGGTGGGGAAGAGGCTCGGAAAGCTCTTTCCCAGATAAGAGCCCGGTTTCGCTGCGGAAACAAGTGAAATCCGTTGTGGA
TACCAAGCTGAGCGTGATCAGCAGGACCTCGCACCATTCGCGTGGAAGAAGCCATTGTCTCGTGACACAGTACTTTGTGC
CAGGCACGAGATCGATCTGATGCCGTACGCCTCGATCCGGTGGGAGTTGGGTCGGTGGGTGTTTATTAACGACAACCCGT
CACCAAAGGATACACCGGTTCCTTGGCGTTCTTAAGGATCTCAAAACCCAAGCGCGTCTGACGCTGCTTGCTCAGCTCTT
CCCGGACGTCCTCGGCCAAGACAGAGGAGTCATTCAACTCCTCCCGAGTGGCCTCTGGTCTTATGAGCACCATCTCGGCA
ATCTCCCCAGGCTTGAGGCTTGCCAGGAAAGACGCGACTATCATTTTACTCGAGGTTCAGTATCTCTGCAACCTCTGGCA
ACGGTTCCACGTAGATACCAGATGCCTTGACGGTAATCCGGTCTCGCCATCGGAGACGGTATGTGATCAAGCTCTTCCAC
CGGCCGTGTCGGAAGAGTCCGGTCCCTGGACTCCGAGTCGCTTGAAGCGACGTCGTCGACGGCGTCCGTGACGTGTAACT
TCGTTATCCACGTCAGGGGATGTCGTGGTGCTGACATTCGAGGCACTCGAGGCCTTGTGTGGCTCTATGTTACCCGCACA
AGAAGCGCATCCAGCGCCTTCCTCTTCCGTTATGGTCTGGACGACCTCGTGTGGTACTGTGTTAGCACACACAAGAAGCG
TATCCGATAATTCCCTCTTCAGTTGAGGTCTGGACGAACGCGTGTGGAACTCTGTTAACCACCTTGGACAAGCTATTACC
AGCGCTCGTGGCTGCTGCCACTGTCTGCGGAGCTGTGTTACCCGCTTGTGGACCTAAGTTACCCACTTGGTCAGCGCCTC
CTAGAGCCGCCGCCACCATCGAAGCGTCCTCGGAGTCGTCATATACGTCGACGACTCCCAAGCATCTGCCGAATGCTTGG
GTACCCCGGCAGCCCTTACGGGCGCCCCGGGTCCTGACAGAGGTGGGAACATGACTCACCAATGCTCTGTCGGACTCCGC
GGCACCGATTGCCTTGCCCTGCCAGTCAACCCAGGGCTCGTGCTACTCGAGCCTGGGCATGCCCATGATCATATTGTAGA
GATCCATGTCGAGAACAGTAAGCTGCTCGAGGATGTCAAAGTCTTCAAACTTGACGGCCAGATCTACTTTGATGTTGGGA
ACAGTGACGACCTTCCCGTCGGCCAGTCGCACTGACACCGTCTCGTTGCCTTTGATTTCTCTCATAGCATCAGACAACTT
GTTGCGATTACGAGCAACCGTCTGGCGGCGCGCAAAATTCTTCGACGCCCCAGAATCGATTAAGATTCTAAAGGGGTGAT
CGTATCCTGTACACATCCGTGTACTACGATTAGTCCGCCACCGCCCTTCGCCGATTCGAGAGTGCGAAGACTCTTAGGGG
CTAGGACTACGTGGTACGCGCCACCCGTGCACCCCTCACGATCCTTAGCTCTTCCCTAGTAGGGTGTCCCGCCCCTACTG
GTCTCCGGTGTTCCCCTATCCCCGAAATTCCTGGTTTCTACCAGCGACCCTTGAGGACGGACTTGGGGAAAGTCCGCCTG
TGGTGTCTATCCGCGGGGAGTCGCGCTTGAAGTGTCCCCGATTCCCGCAGCCGAAGCAGCGAATATCTCGCTGCTCGGCG
GACACGAGCTCCTTGGGAATGGGTCCGGTGGGATTTGCTCGACCTGGATTCGACACAGAATTCCCTGGCCATGCTGAGGC
CGGCTTGGGCGCCTGGCGATGGATGTATTCTTCCTGAAGGGCCACTTGAATCGCCTCTTCGAGGGTGCTTGACTGCACCC
GAAAAAGCTGAGTGCGCGCCGGGCCCACTCGAAGGCCGTCCATGAACACAGTCATCTTGACGTGTTCGTTGAGTGGGCTT
CCCACTAGGGACGCCGTGAGCTCCCGCATCTCTTGGGCATACCCGTGCGGCGCGCCTTCCTTGCTTGCATGAGACGGATT
GCGAACGCTGCCGGTACTCATTGTTCGCTGGGAGTAACGCGGCTCGGTGCTGTTCGCACAGCTGAGCCCAGAATATGAAA
CATTCAGGGTATTTCGCCTCCCGCTTGTACAGCCAACTCCGAGCACGACCGCTAAGGTTGGAGAGTGCAAAAGCAACACG
GAGTTGCTCGGTCGAGATCAGAGTCGCGTCCAGCGCGAGGTCTACCTCTCGAACCCAGAAGTGAAGGTTCTCACTTCCCT
TCCCTTGATACGGCTTAACTTTCTGCCGTATTGGCTTCGGGTGGGGCGGGTTTGTTTCCGCCGCCGGAGCATGCAAGTTT
TCCCACACATGTGCGATGATCCCGTGATCGTCAGCGTCAAACGCATTGACTCGCTCGAGCTGCTCGGTCGGTGCTGACGC
CACCAGGCTCTGCAGGACCTCCATCCCGAAGATGCCAGCCATCCTTCGAACCGACTCTAACTGTGAGTCGTTCAGATGGG
AGAAGTCGTTCCTATCCATGGCGACCAACTTCAGACAGGTTCAGGCAGTCTACCCGCGTTGGCGTGGATTGACTACAAGT
GCTACCAAGTGTGATGGGAACACACAGCACCTTGCGCTAGAGGAAGTTGGCCTCCGAGTACAAACTCTCAGTGAGCGGCA
GTCCCCGGGCCCCTTTTTGCCTAAGGGAGCGAAGTGACAAATTTAAGGTAAGCTGTAAGCTGAGTATATTTATAGGTAGG
CTAAGCTTGAGTTAAATGTACAAAGTATGAGTCACCTAGATACAAGCACGACCCTGGTACTATGTACCAATTATCCCGAA
GCGTGACGTGTCACACTTCATGTAACTAGGGCTGCACTTGAGGCTATGTACCCCGTTACATCTGGAAGCACATCCATGTT
TTACTACCACATTTAAGTATTAACAAGGTTGAGCTCATAAATGACTTAGATCTGTATAGTATACTTGACGAAGGAAGCTT
GCGAAAGTGTTAAACGAAAGCTAACTGAAACCTAAGAAATATGCAAATTAGCTACCGCTTCGAAGTCGCATATAAGACTT
CTTTAGGTAAAGAAAAAAATTAAAAATAGAGCGCCTCTAAACGTGCATATAACTAATATGCATTAACATAGTACATGTAC
TCAAAGCTCTTCTGACTGACTGACGTTAACTTATGTGTTATTTATAAACTAATTGCGCCTTTCTGCCAAAAAGTATACTA
GAAACTCGGTCCCTGAAAGTGGCTGGTGAAGATGACCTAAAGGAGCAGGTCTCGCGGATTATGACAGATTACGAGCGCGT
AATTGTACTATAGAAAGTGGCTCTAAAAGCGTACGGGGTCTTGTCAATTACGACCTGAAGTCCTTCTTCGTAACGTTTAT
GTAACGTCATTTATTATTTTGATAACTAAGCGCTCGGTTGTATTAAAAGTTAGGGGTTACACGAGGAGGGATGACCTCCC
TACTTTAGTCTCTCGAATCGTGACAGTGGCAGACTGAACGTGGCTAACGCAAAGTGTCCAAGAAGCGTCCTTCTACTATT
TAATGCATCGGATAGGTAGCACAAGCTGTTTGAAATTGTGCCCGCTCCAAATAAACTAGAACTCTCGTTTGGACATATGT
AATTGGTTAAGTTAGTCTGAAAAGATGTATTGGTATTTTTATCTAGTGAAGCACAGACTACTACAGTACTGTACTAATAC
TGTAAAATACTACTGGATCAACGACTAGTCTATGCTAAAGTCGTCGCCTGTGCTGCACATTCGGGAGGCCAATTTTTCAG
CAGGTGAATGGTGTTTTACGAACTCTGTTCAAAGCAAGAGATTTAAAGATGTGGAGATTGTGCCAGACGACAACGTGGAC
ACAACGGCGACCAACCCCGACAACTGGGCCGACAGCAGCAGCGAATGTGCGACACGGAAAGATCAAGCAGCGTCAACAAC
AATACTGCATAATCAGCCGCGTCAGCAGCACGTAAGGCAAGGGGGACGCTGTCACAGTGCACGCCATCTAAGGGTGAAGG
ATTAAAATGGTAAAACCCTCACTCAATAGATATGTTCGCTCCATAAATGGGACATTTTCTGCTGTGGTCATACAACTGCG
CTTATAAAAATATACTTCGAAGTAAGCTTTGAATTGGGTTTGCCGATTGCAAAGGGGACGACTTTGCCTAGATCCGTGCT
CTCACTTTTCAACTCACCCTCCTCCACTAAAGTCTAATTACTCCAGCACTATGCGCAAGGCTTTTTTCCCTCTGATTGTT
ACTCTCCTCGGCAACGGAAGTGCGATGCCTGCCATATCTGCCACCACGACCGGCAACCAAGCTACCATCTCTACCCTGGA
ATCGCCAGTTCTGCTCGCGTCCGATACTCAAAAGCGTTTTCTGCGGAGCCACAACCAAGCGGAAGAAGACAGTGAAGAAG
ACGAATTCGGAAACGGTGAAGAGAGAAAAGTAGGGGACCGACTTTTCGCGGATTGGAAGCTCGAGCAAATGTTGAACTCT
CATTAAAACGTTCAAGAGGTTTGCGAGATGGAAACGCAAAGGGTTCACCCCCAGCACTCTTCAAACAAAACTAGAGAAGA
TTGGATACTGGGAAAAGTACAAAGACCTCCACACGTTGTACTCAACCAACTACTTCACCATCGCTAAGGCTTATCCATCA
AAGTACACGTAGATGTGGCGATAATCCGCTGAAGGAGTAATGCAAGTGGGGCATATTATTGCGAAGTCTTTATTTGTTTG
TCAATGTTATTAACGTAGCTTGGGACTATTTTGCTAGCAGGAATCATCTCTGGCCATAAGATAGTTCAATGCAAGCTTCA
CATGACTTTGTCAATGTCATTGGCTTCGCTAGCAACGTAGTAGCTGTACTCGACACTTTCAACACTCTTTTCGTTTCAAA
TTCACTCGTGAAGACAGCATACAATGATATCCTGATACGTGCTCATGACAGTGCGCAGTTCGCCACGTGAAAGGTTCTCC
CGCCACATAATCTCTTCGATGTGGTGTTCTCCATGGAAATAGACGCATAGTCTCTTAAACAGCGTAAACACTGAGTTGGG
CTTGGCAATTTTGGCCAAATACGCACGCTCCTGGTCTGTAAACAACAATTGGGTCGCCACACTCATCACTTGAGCCATTG
GTACTGTACTACCCCCACGTGCGTCGGTAGCAGGATTATCATCCAGCAGTGCTGGCACAGGGGACGGCGCCATGTCTGCT
GGGTTCATAGGCGGGATCTGAGCTATAGGCAAACTACCCGGCGCACTGGTGTTTGTTGCGCTACTATTGACTCGTTGTCG
ACGGAAACTTGACACCAGTAACGCAGGAGAGGAGCTACCAACCGATGACGCGCCGTTACCGAGCTCAGCTGCGTAGTCTC
CGTCGGACGGGATCATAAAGTATATGAAGCGGTGGAGCTGTACAATAAATCGTTGTTGCAGTAGCCAGATGAGCATGTGG
ACGTACTCAGTCTTCTTCGCAGTCGACAAGGTCTTCATGTACTCTCCAATACGTCGAGAGCCCGAAAACGTCGACAAGAC
TTCGCCTAGCTCGTACGGAGCGAATTTGCGTCTGAATTCCAACGCCAGAGGCGACGTGATGTGCAGATCTGCCTTGGCAT
TGACTTGATAAATATTGTACAAAGTGATGGCATCCACAATACGACCGAAGCCCCAGTAAACGAGATGTGCAGCCAGTCGA
AAGACCTGATGAATCGGAACTCCCGTCTCTAATGCAATATCCTGGAAGCTCTTTAGAGGGTTTACACTCTCCACCAGATC
GCGCAGTTGTCGCGCATGATCAACTGGGAGTTTGTTGAGGATTTCGTCTTTATCAGCCAATAGCAGAAGCGTGTGATACG
GTCGTAAACTCGCCATCTTCACCGTTACAGCATCCGTTAGAGTTAGCGACAATTTCACCCACCCGTTAAGCACCACATGT
GCAGCTCCCGACTCTTCTAGACCATGGAATACTCGCTTGAGGTCATTGGCTAGCACACACTTCCCTAACGAAACGTCGAT
TAGAGTTTGGGGATCCACCTCCACCGTCGACGATCCGTTTTCCCCGTCCTTCCTGTGGTGATGCAGGTGCATCAGACTCG
ACCCACTTGATGCAGTATTAGCTCCCGTATTACTCGTAAGACTACTGCCACTAGTCGCTCCTGCGGCCACCGCGGCGCTT
AGACTGTTACCACTGGTAACACCTGCATTGTTACTACCTGCATTCCGCTCACTTTGAGCCAATTCGTCTCTTAACTGTAA
CAATTCTCGCACTTCTTTCGACACAAAACCCACGCGAAGTTCCTCGTGTAACAGTCCGTTCGCCAACTGTGCGGCTACGG
TATGGAAAGCTTGAGCGCTGCTGCGTCTTCTGGCTAAAAGTTCCTCCTCGTCTGCTTGTTGCAAAGGTAACATTTGTGTG
TCAACTGAGCCATCTGTAGCGTCAGGAGTGCTAGACACTTGTGGAGGACGATCTTCTAGCGCAAAAATGATGTTAAACAT
GGTTGTCTCATTCCCCATGGCGCCCGTAGAGTTGTTGGTAGACTGCTCTACAGCTGTAGGGGATGCTCCTGTAGCCGATG
TTAAGCTGTTCTGCGCTATAAAACTCCCTCCAGGGCCATCCGCAGGTGCTGCTGCTGGTAGTCGACGCGACACTAGCACC
GGGTGACTCACGAAGCGCAGATCATCCACCACAAGCTCGAAACTGGCGTTACAGAGCGCGTTCTTGGGCCGGAAGAGCTT
GGCCAGTAGAGGAGCTGGAAGGGAGTGGAAGCTCGACGCTCTCTCGCTGGGTGGAGCAGGGTATCGGAAGGCTAGGTTGC
AGCCCTTACTGATGTCGTCCACCACGAGCGCTACGCCCAGGAGCCGGCAACTGCCAGTCAGCCGGACACTCGAACCGTTC
ATCAAGTTTGAAGCTCGTGCGGATTCCGAAAACACTGTATTCGGAATACCGTACAATAGAAAACGCTGTATTCGGAATAC
CGTACAATAGAAAACGCTGTATTCGGAATACCGTACAATACCGTATTGGAAACCGCTATCCTACCGGTTTGTTATCTTAG
CCCTTAAATTAATCGGAAGATCCTTTTTAAAGAGACGCAGAGATTTGACAGGCAAGTCTCAGCATGGCTCTACTAGCGAC
ACTTCTAGCGGTATGTGGACTTTTGGGCTTCACGTGGTGGCTACTAGCTCATTACAAAGATGCCAAAGTGCCCACAGTAG
TCCACGCCGCCGTGTTCTCGACTTGGGTGTTGGGCTTCCTGGGATTGCTCTTGCTGCCGATGGATCTGGCCACCAACGGC
CTCGTCACGAGCTCCCAATCTGTCGGTAACATCACGGAGGAGAAAACGACGTTTAGAGAGTATCTGCTCGTATGGAGACT
ACTGTACTGGACTACGTTCCTTATGAGCTGGGTAGGGCTGCCGTTCCTGGTGGAATTCCGCCAGAACGGAGAGCTCGAAT
TGGACAAACGCGTGTTGAGCTCAATGAGACACCTGGTCTTCCATTGGACGGTGTTGGCCGGTGGACTGTGTATTGTGGCA
TTGTACTTGATCTTAGTGGATCATTTGTCATTGTATGGCGTGCTGGGACTCGCTATGGCAGCCAGTAACACTTACGGATT
GCTATGGGTCATCGCTCTACTGGGGTACGGACTCGTGGAGATCCCAAGAGGATTCTGGGTTCGACGACTGGATGGAGCAC
AGCTTCAGATACTGCACTTTCAAGCAGGCCAATTGCAGGATGAACGGATGGAAGCGAGGTTTGAATACGACGATGTAATC
GCGGATGTTCGCGACGCTTATCAGCGTATGATGCAGGCCGAGAGCGGCGCTATCATCCTTACCAGCGACATGCAGTACAT
CAAGACTTGTCTTCTTCAAGTCGTAGCTCTGATCGAGACGAACAAACCCGCTTTCACCAGTCTAGACGCCTCTGCTGACA
CGAAGCGAGGCGCCAAATCAGCGTCATTTACTGATGTTCCTAGTAAATTAAAACGTGGACTCAGTAACCTCGCTCGAGCC
TTTCGGAAAGCTCCGACGCTTCCGGAAACAGTGAAGCTGCATCGACGTGTGCGTATCGCACAACTGGAGCTACGTCGATG
TGACCAAGCCTTCTTGGAGCTCTGTATCAACGTCGATGTACTACAAGACCGCTGTTCCCAACGTGCGCTACCAGCAAGTA
GTTCGTACCCGGAGACATCAACACTCAACCGCTTGCACAACATGTTTCTGGATACACGACACCAAGTTCGTCAGTGGGCT
ACGTCTCCTGTGGCTGTCACCTGTGCTGTCATTACGGGATTTCTATCGCTCTGTGTAGTATGGGGTGAGCTGACAATGGG
TTGGCGTAGATCGTCGCTATCTCTGTTCCGCTTCTTGATCGCTGTCGAGGTTAAGGAGACGAGTAGTAGTCTACGTAGTG
CAACGGAGCTCGTATCAGCGTTGCTACTCGTGTACTTGGCTGTGTGTTGCTACACAAGTCTCTTTACTCTTCGATTACCT
GGGAAATACTCGCTACGTGCACACGGTAACTCGACGGAGTTGTGTCTACTGAAGACGTCAATTTACCAGTGTAGACTACA
ATTTGCGTTGGGACAGAACGCACTGCTCCTACTTCGA
##gff-version 3
contig_2213 AUGUSTUS gene 2396 5871 . - . ID=g6366
contig_2213 AUGUSTUS mRNA 2396 5871 . - . ID=g6366.t1;Parent=g6366
contig_2213 AUGUSTUS exon 5121 5871 . - . ID=g6366.t1.exon4;Parent=g6366.t1
contig_2213 AUGUSTUS exon 4439 5041 . - . ID=g6366.t1.exon3;Parent=g6366.t1
contig_2213 AUGUSTUS exon 3469 4369 . - . ID=g6366.t1.exon2;Parent=g6366.t1
contig_2213 AUGUSTUS exon 2399 3398 . - . ID=g6366.t1.exon1;Parent=g6366.t1
contig_2213 AUGUSTUS CDS 5121 5871 . - 0 ID=g6366.t1.cds;Parent=g6366.t1
contig_2213 AUGUSTUS CDS 4439 5041 . - 2 ID=g6366.t1.cds;Parent=g6366.t1
contig_2213 AUGUSTUS CDS 3469 4369 . - 2 ID=g6366.t1.cds;Parent=g6366.t1
contig_2213 AUGUSTUS CDS 2399 3398 . - 1 ID=g6366.t1.cds;Parent=g6366.t1
###
contig_2213 AUGUSTUS gene 6218 7868 . + . ID=g6367
contig_2213 AUGUSTUS mRNA 6218 7868 . + . ID=g6367.t1;Parent=g6367
contig_2213 AUGUSTUS exon 6218 6731 . + . ID=g6367.t1.exon1;Parent=g6367.t1
contig_2213 AUGUSTUS exon 6794 6882 . + . ID=g6367.t1.exon2;Parent=g6367.t1
contig_2213 AUGUSTUS exon 6944 7008 . + . ID=g6367.t1.exon3;Parent=g6367.t1
contig_2213 AUGUSTUS exon 7080 7611 . + . ID=g6367.t1.exon4;Parent=g6367.t1
contig_2213 AUGUSTUS exon 7692 7865 . + . ID=g6367.t1.exon5;Parent=g6367.t1
contig_2213 AUGUSTUS CDS 6218 6731 . + 0 ID=g6367.t1.cds;Parent=g6367.t1
contig_2213 AUGUSTUS CDS 6794 6882 . + 2 ID=g6367.t1.cds;Parent=g6367.t1
contig_2213 AUGUSTUS CDS 6944 7008 . + 0 ID=g6367.t1.cds;Parent=g6367.t1
contig_2213 AUGUSTUS CDS 7080 7611 . + 1 ID=g6367.t1.cds;Parent=g6367.t1
contig_2213 AUGUSTUS CDS 7692 7865 . + 0 ID=g6367.t1.cds;Parent=g6367.t1
###
contig_2213 AGAT gene 9719 10294 . + . ID=agat-gene-503;Name=agat-gene-503;Target={'target_id': "{'target_id':", 'start': "'contig_2213_17',", 'end': "'start':", 'strand': '1,'};identity=1.0000;positive=1.0000;rank=1
contig_2213 miniprot mRNA 9719 10294 973.0 + . ID=MP000503;Parent=agat-gene-503;Target={'target_id': "{'target_id':", 'start': "'contig_2213_17',", 'end': "'start':", 'strand': '1,'};identity=1.0000;positive=1.0000;rank=1
contig_2213 AGAT exon 9719 10294 . + . ID=agat-exon-503;Parent=MP000503;Target={'target_id': "{'target_id':", 'start': "'contig_2213_17',", 'end': "'start':", 'strand': '1,'};identity=1.0000;rank=1
contig_2213 miniprot CDS 9719 10294 973.0 + 0 ID=agat-cds-503;Parent=MP000503;Target={'target_id': "{'target_id':", 'start': "'contig_2213_17',", 'end': "'start':", 'strand': '1,'};identity=1.0000;rank=1
contig_2213 miniprot stop_codon 10292 10294 0.0 + 0 ID=agat-stop_codon-501;Parent=MP000503;rank=1
###
contig_2213 AUGUSTUS gene 33762 35762 . - . ID=g6368
contig_2213 AUGUSTUS mRNA 33762 35762 . - . ID=g6368.t1;Parent=g6368
contig_2213 AUGUSTUS exon 33765 35762 . - . ID=g6368.t1.exon1;Parent=g6368.t1
contig_2213 AUGUSTUS CDS 33765 35762 . - 0 ID=g6368.t1.cds;Parent=g6368.t1
###
contig_2213 AUGUSTUS gene 35984 37434 . + . ID=g6369
contig_2213 AUGUSTUS mRNA 35984 37434 . + . ID=g6369.t1;Parent=g6369
contig_2213 AUGUSTUS exon 35984 37337 . + . ID=g6369.t1.exon1;Parent=g6369.t1
contig_2213 AUGUSTUS exon 37415 37431 . + . ID=g6369.t1.exon2;Parent=g6369.t1
contig_2213 AUGUSTUS CDS 35984 37337 . + 0 ID=g6369.t1.cds;Parent=g6369.t1
contig_2213 AUGUSTUS CDS 37415 37431 . + 2 ID=g6369.t1.cds;Parent=g6369.t1
Submit-block ::= {
contact {
contact {
name name {
last "Lysoe",
first "Erik",
middle "",
initials "",
suffix "",
title ""
},
affil std {
affil "NIBIO",
div "Molecular plant biology",
city "Aas",
country "Norway",
street "Hogskoleveien 8",
email "erik.lysoe@nibio.no",
postal-code "1432"
}
}
},
cit {
authors {
names std {
{
name name {
last "Lysoe",
first "Erik",
middle "",
initials "",
suffix "",
title ""
}
}
},
affil std {
affil "NIBIO",
div "Molecular plant biology",
city "Aas",
country "Norway",
street "Hogskoleveien 8",
postal-code "1432"
}
}
},
subtype new
}
Seqdesc ::= pub {
pub {
gen {
cit "unpublished",
authors {
names std {
{
name name {
last "Lysoe",
first "Erik",
middle "",
initials "",
suffix "",
title ""
}
}
}
},
title "MP1831 genome"
}
}
}
Seqdesc ::= user {
type str "DBLink",
data {
{
label str "BioProject",
num 1,
data strs {
"PRJNA1101761"
}
},
{
label str "BioSample",
num 1,
data strs {
"SAMN41003021"
}
}
}
}
Seqdesc ::= user {
type str "Submission",
data {
{
label str "AdditionalComment",
data str "ALT EMAIL:erik.lysoe@nibio.no"
}
}
}
Seqdesc ::= user {
type str "Submission",
data {
{
label str "AdditionalComment",
data str "Submission Title:None"
}
}
}
---
title: "Untitled"
output: github_document
---
```{r setup, include=FALSE}
knitr::opts_chunk$set(echo = TRUE)
library("Biostrings")
library("tidyverse")
library("ape")
```
```{r cars}
# Reduce the genome FASTA to the sequences that are referenced by the GFF
# annotation (presumably to keep the test data set small -- confirm).
path <- "Mid_test_data"
geno <- "MidP1831_erik"
gff_file <- file.path(path, paste0(geno, ".gff"))
fasta_file <- file.path(path, paste0(geno, ".fsa"))

gff <- read.gff(gff_file)
geno_fa <- readDNAStringSet(fasta_file)

# Coerce to character so the subset below is always done by sequence name,
# never by factor level codes.
contigs <- as.character(unique(gff$seqid))

# Fail early with a readable message when the GFF names sequences that are
# absent from the FASTA, instead of a generic subscript error.
missing_contigs <- setdiff(contigs, names(geno_fa))
if (length(missing_contigs) > 0) {
  stop(
    "GFF seqids not found in ", fasta_file, ": ",
    paste(missing_contigs, collapse = ", ")
  )
}

geno_fa_red <- geno_fa[contigs]

# NOTE: this writes to the same path the FASTA was read from, i.e. the input
# file is overwritten in place with the reduced sequence set.
writeXStringSet(geno_fa_red, fasta_file)
```
\ No newline at end of file
// Pipeline parameters: genome basename and the project directory that holds
// the "<genome>.gff" / "<genome>.fsa" inputs.
// NOTE(review): params.genome is assigned twice below; this looks like the
// removed/added pair of a diff shown together -- confirm which value is live.
params.genome = "MP1831"
params.genome = "MidP1831_erik"
params.project = "/home/nibio/Documents/Git/DivGene-genome-annotation/Mid_test_data"
// "conda" profile: sets one conda environment for all processes.
// NOTE(review): the environment path is machine-specific.
profiles {
conda {
process.conda = '/home/nibio/miniconda3/envs/funannotate/'
}
}
......@@ -2,29 +2,90 @@
1. Parse genome to protein using gff2prot util from funannotate
2. Remove everything after stop codon in protein fasta with:
seqkit -> sed
3. */
3. Search and annotate with eggNOG-mapper
4. Search and annotate with InterProScan
5. Integrate custom annotation
6. Run funannotate, integrating the eggNOG and InterPro results
*/
// NOTE(review): the assignments below appear to be before/after pairs from a
// diff (absolute project path vs. placeholder, path concatenation without vs.
// with a "/" separator) -- confirm which lines are live.
// Script parameters
params.project = "/home/nibio/Documents/Erik_NCBI_tbl_test/Simeon_annotering/table2asn/"
// Script parameters, some modified in nextflow.config
params.project = "project_path"
params.genome = "genome_basename"
// Input files are derived from the project directory and the genome basename.
params.genomeGFF = "${params.project}${params.genome}.gff"
params.genomeFasta = "${params.project}${params.genome}.fsa"
params.genomeGFF = "${params.project}/${params.genome}.gff"
params.genomeFasta = "${params.project}/${params.genome}.fsa"
// fixGFF: runs agat_sp_manage_IDs.pl on the input GFF and emits the result as
// "fixed.gff", published (as a symlink) under <params.project>/nextflow_results.
process fixGFF {
    publishDir "${params.project}/nextflow_results", mode: 'symlink'
    // NOTE(review): machine-specific conda environment path.
    conda '/home/nibio/miniconda3/envs/funannotate'

    input:
    path gff

    output:
    path "fixed.gff"

    // Explicit section label: the implicit (unlabelled) script form is only
    // valid when a process has no other sections.
    script:
    """
    agat_sp_manage_IDs.pl --gff $gff -o "fixed.gff"
    """
}
// extractProteins: translates the annotated genome to protein sequences and
// writes them to "<params.genome>_protein.fa".
// NOTE(review): this block appears to contain both sides of a diff (the
// genomeGFF input and command next to the fixedGFF input and command) --
// confirm which input declaration and which command line are live; the
// workflow's fixGFF-based call passes two arguments.
process extractProteins {
publishDir "${params.project}/nextflow_results", mode: 'symlink'
input:
path genomeFasta
path genomeGFF
path fixedGFF
output:
path "${params.genome}_protein.fa"
// Command chain: funannotate gff2prot | seqkit seq -w 0 | sed.
// The Groovy escape "\\" yields a single backslash, so sed receives
// 's/\*.*//' and deletes everything from the first literal '*' to the end of
// each line.
"""
funannotate util gff2prot -g $genomeGFF -f $genomeFasta --no_stop | seqkit seq -w 0 | sed 's/\\*.*//' > "${params.genome}_protein.fa"
funannotate util gff2prot -g $fixedGFF -f $genomeFasta --no_stop | seqkit seq -w 0 | sed 's/\\*.*//' > "${params.genome}_protein.fa"
"""
}
// searchAndAnnotateEggnogg: runs emapper.py on the protein FASTA and emits
// every file whose name starts with "<params.genome>_em".
process searchAndAnnotateEggnogg {
    // Directives belong at the top of the process body, before input/output.
    publishDir "${params.project}/nextflow_results", mode: 'symlink'

    input:
    path proteinFasta

    output:
    path "${params.genome}_em*"

    // Explicit section label: the implicit (unlabelled) script form is only
    // valid when a process has no other sections.
    // NOTE(review): --data_dir is a machine-specific database location.
    script:
    """
    emapper.py -i $proteinFasta -o "${params.genome}_em" --data_dir /home/nibio/funannotate_db --cpu 0 --tax_scope Peronosporales
    """
}
// searchAndAnnotateInterPro: runs interproscan.sh on the protein FASTA and
// emits every file whose name starts with "<params.genome>_interpro".
process searchAndAnnotateInterPro {
    // Directives belong at the top of the process body, before input/output.
    publishDir "${params.project}/nextflow_results", mode: 'symlink'

    input:
    path proteinFasta

    output:
    path "${params.genome}_interpro*"

    // Explicit section label: the implicit (unlabelled) script form is only
    // valid when a process has no other sections.
    // NOTE(review): the InterProScan install path is user- and version-specific.
    script:
    """
    ~/interproscan-5.68-100.0/interproscan.sh -i $proteinFasta -b "${params.genome}_interpro"
    """
}
/*
process funannotateIntegration{
}
*/
// Entry workflow: passes the GFF through fixGFF, extracts proteins, then runs
// the eggNOG and InterPro searches on the extracted protein FASTA.
// NOTE(review): extractProteins is invoked twice and both genome_ch and gff_ch
// are defined; this looks like removed and added diff lines shown together --
// confirm which statements are live.
workflow {
def genome_ch = Channel.fromPath(params.genomeFasta)
extractProteins(genome_ch, params.genomeGFF)
def gff_ch = Channel.fromPath(params.genomeGFF)
fixGFF(gff_ch)
// The genome FASTA is passed as a plain parameter value here, not a channel.
extractProteins(params.genomeFasta, fixGFF.out)
// Both searches consume the same extractProteins output.
searchAndAnnotateEggnogg(extractProteins.out)
searchAndAnnotateInterPro (extractProteins.out)
}
\ No newline at end of file
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Please register or to comment