LOCUS V037286 8128 bp DNA circular SYN 01-JAN-1980 DEFINITION synthetic circular DNA. ACCESSION V037286 VERSION V037286 KEYWORDS . SOURCE . ORGANISM . . FEATURES Location/Qualifiers LTR 234..414 /note="truncated 5' long terminal repeat (LTR) from HIV-1" /label="5' LTR (truncated)" misc_feature 458..583 /note="packaging signal of human immunodeficiency virus type 1" /label="HIV-1 Ψ" misc_feature 1076..1309 /note="The Rev response element (RRE) of HIV-1 allows for Rev-dependent mRNA export from the nucleus to the cytoplasm." /label="RRE" CDS 1493..1537 /codon_start=1 /note="recognized by the 2H10 single-chain llama nanobody" /product="antigenic peptide corresponding to amino acids 655 to 669 of the HIV envelope protein gp41 (Lutje Hulsik et al., 2013)" /transl_table=1 /translation="KNEQELLELDKWASL" /label="gp41 peptide" misc_feature 1804..1921 /note="central polypurine tract and central termination sequence of HIV-1" /label="cPPT/CTS" promoter 1966..2177 /note="core promoter for human elongation factor EF-1α" /label="EF-1α core promoter" LTR 2190..2458 /note="truncated 5' long terminal repeat (LTR) from human T-cell leukemia virus (HTLV) type 1" /label="5' LTR (truncated)" CDS 2492..3376 /label="MXI1(NM_130439)" /note="MXI1(NM_130439)" /gene="MXI1" CDS 3386..3439 /codon_start=1 /note="Eukaryotic ribosomes fail to insert a peptide bond between the Gly and Pro residues, yielding separate polypeptides." /product="2A peptide from Thosea asigna virus capsid protein" /protein_id="" /transl_table=1 /translation="EGRGSLLTCGDVEENPGP" /label="T2A" CDS 3470..4132 /codon_start=1 /product="green fluorescent protein 2 from Pontellina plumata, also known as ppluGFP2 (Shagin et al., 2004)" /transl_table=1 /translation="PAMEIECRITGTLNGVEFELVGGGEGTPKQGRMTNKMKSTKGALT FSPYLLSHVMGYGFYHFGTYPSGYENPFLHAINNGGYTNTRIEKYEDGGVLHVSFSYRY EAGRVIGDFKVVGTGFPEDSVIFTDKIIRSNATVEHLHPMGDNVLVGSFARTFSLRDGG YYSFVVDSHMHFKSAIHPSILQNGGPMFAFRRVEELHSNTELGIVEYQHAFKTPIAFA" /label="CopGFP" misc_feature 4223..4811 /note="woodchuck hepatitis virus posttranscriptional regulatory element" /label="WPRE" LTR 4885..5118 /note="self-inactivating 3' long terminal repeat (LTR) from HIV-1" /label="3' LTR (ΔU3)" polyA_signal 5190..5311 /note="SV40 polyadenylation signal" /label="SV40 poly(A) signal" rep_origin 5330..5465 /note="SV40 origin of replication" /label="SV40 ori" primer_bind complement(5503..5519) /note="common sequencing primer, one of multiple similar variants" /label="M13 rev" protein_bind 5527..5543 /bound_moiety="lac repressor encoded by lacI" /note="The lac repressor binds to the lac operator to inhibit transcription in E. coli. This inhibition can be relieved by adding lactose or isopropyl-β-D-thiogalactopyranoside (IPTG)." /label="lac operator" promoter complement(5551..5581) /note="promoter for the E. coli lac operon" /label="lac promoter" protein_bind 5596..5617 /bound_moiety="E. coli catabolite activator protein" /note="CAP binding activates transcription in the presence of cAMP." /label="CAP binding site" rep_origin complement(5905..6493) /direction=LEFT /note="high-copy-number ColE1/pMB1/pBR322/pUC origin of replication" /label="ori" CDS complement(6664..7524) /codon_start=1 /gene="bla" /note="confers resistance to ampicillin, carbenicillin, and related antibiotics" /product="β-lactamase" /transl_table=1 /translation="MSIQHFRVALIPFFAAFCLPVFA,HPETLVKVKDAEDQLGARVGY IELDLNSGKILESFRPEERFPMMSTFKVLLCGAVLSRIDAGQEQLGRRIHYSQNDLVEY SPVTEKHLTDGMTVRELCSAAITMSDNTAANLLLTTIGGPKELTAFLHNMGDHVTRLDR WEPELNEAIPNDERDTTMPVAMATTLRKLLTGELLTLASRQQLIDWMEADKVAGPLLRS ALPAGWFIADKSGAGERGSRGIIAALGPDGKPSRIVVIYTTGSQATMDERNRQIAEIGA SLIKHW*" /label="AmpR" promoter complement(7525..7629) /gene="bla" /label="AmpR promoter" primer_bind 8103..8119 /note="common sequencing primer, one of multiple similar variants" /label="M13 fwd" ORIGIN 1 acgcgtgtag tcttatgcaa tactcttgta gtcttgcaac atggtaacga tgagttagca 61 acatgcctta caaggagaga aaaagcaccg tgcatgccga ttggtggaag taaggtggta 121 cgatcgtgcc ttattaggaa ggcaacagac gggtctgaca tggattggac gaaccactga 181 attgccgcat tgcagagata ttgtatttaa gtgcctagct cgatacaata aacgggtctc 241 tctggttaga ccagatctga gcctgggagc tctctggcta actagggaac ccactgctta 301 agcctcaata aagcttgcct tgagtgcttc aagtagtgtg tgcccgtctg ttgtgtgact 361 ctggtaacta gagatccctc agaccctttt agtcagtgtg gaaaatctct agcagtggcg 421 cccgaacagg gacctgaaag cgaaagggaa accagagctc tctcgacgca ggactcggct 481 tgctgaagcg cgcacggcaa gaggcgaggg gcggcgactg gtgagtacgc caaaaatttt 541 gactagcgga ggctagaagg agagagatgg gtgcgagagc gtcagtatta agcgggggag 601 aattagatcg cgatgggaaa aaattcggtt aaggccaggg ggaaagaaaa aatataaatt 661 aaaacatata gtatgggcaa gcagggagct agaacgattc gcagttaatc ctggcctgtt 721 agaaacatca gaaggctgta gacaaatact gggacagcta caaccatccc ttcagacagg 781 atcagaagaa cttagatcat tatataatac agtagcaacc ctctattgtg tgcatcaaag 841 gatagagata aaagacacca aggaagcttt agacaagata gaggaagagc aaaacaaaag 901 taagaccacc gcacagcaag cggccactga tcttcagacc tggaggagga gatatgaggg 961 acaattggag aagtgaatta tataaatata aagtagtaaa aattgaacca ttaggagtag 1021 cacccaccaa ggcaaagaga agagtggtgc agagagaaaa aagagcagtg ggaataggag 1081 ctttgttcct tgggttcttg ggagcagcag gaagcactat gggcgcagcc tcaatgacgc 1141 tgacggtaca ggccagacaa ttattgtctg gtatagtgca gcagcagaac aatttgctga 1201 gggctattga ggcgcaacag catctgttgc aactcacagt ctggggcatc aagcagctcc 1261 aggcaagaat cctggctgtg gaaagatacc taaaggatca acagctcctg gggatttggg 1321 gttgctctgg aaaactcatt tgcaccactg ctgtgccttg gaatgctagt tggagtaata 1381 aatctctgga acagattgga atcacacgac ctggatggag tgggacagag aaattaacaa 1441 ttacacaagc ttaatacact ccttaattga agaatcgcaa aaccagcaag aaaagaatga 1501 acaagaatta ttggaattag ataaatgggc aagtttgtgg aattggttta acataacaaa 1561 ttggctgtgg tatataaaat tattcataat gatagtagga ggcttggtag gtttaagaat 1621 agtttttgct gtactttcta tagtgaatag agttaggcag ggatattcac cattatcgtt 1681 tcagacccac ctcccaaccc cgaggggacc cgacaggccc gaaggaatag aagaagaagg 1741 tggagagaga gacagagaca gatccattcg attagtgaac ggatctcgac ggtatcggtt 1801 aacttttaaa agaaaagggg ggattggggg gtacagtgca ggggaaagaa tagtagacat 1861 aatagcaaca gacatacaaa ctaaagaatt acaaaaacaa attacaaaaa ttcaaaattt 1921 tatcgatact agtaaggatc tgcgatcgct ccggtgcccg tcagtgggca gagcgcacat 1981 cgcccacagt ccccgagaag ttggggggag gggtcggcaa ttgaacgggt gcctagagaa 2041 ggtggcgcgg ggtaaactgg gaaagtgatg tcgtgtactg gctccgcctt tttcccgagg 2101 gtgggggaga accgtatata agtgcagtag tcgccgtgaa cgttcttttt cgcaacgggt 2161 ttgccgccag aacacagctg aagcttcgag gggctcgcat ctctccttca cgcgcccgcc 2221 gccctacctg aggccgccat ccacgccggt tgagtcgcgt tctgccgcct cccgcctgtg 2281 gtgcctcctg aactgcgtcc gccgtctagg taagtttaaa gctcaggtcg agaccgggcc 2341 tttgtccggc gctcccttgg agcctaccta gactcagccg gctctccacg ctttgcctga 2401 ccctgcttgc tcaactctac gtctttgttt cgttttctgt tctgcgccgt tacagatcca 2461 agctgtgacc ggcgcctact ctagagccac catgggcaaa cgcgggcggc cgcgcaagga 2521 ggcgcgctgc gagggcgcgg ggctggcccc cgccgcgccc ccggctgtgc cccccgccgt 2581 ggccgcgccc cagcccccgg ccctgcccga ggaccccgct ggggccaagc ccaggtgccc 2641 cttctcagac attttcaaca ccagcgagaa ctcgatggag aagcacatca acacttttct 2701 gcagaacgtg cagattctgc tcgaggccgc cagctacctg gagcagatcg agaaagaaaa 2761 caaaaagtgt gaacatggct acgcctcttc attcccgtcc atgccgagcc cccgactgca 2821 gcattcaaag cccccacgga ggttgagccg ggcacagaaa cacagcagcg ggagcagcaa 2881 caccagcact gccaacagat ctacacacaa tgagctggaa aagaatcgac gagctcatct 2941 gcgcctttgt ttagaacgct taaaagttct gattccacta ggaccagact gcacccggca 3001 cacaacactt ggtttgctca acaaagccaa agcacacatc aagaaacttg aagaagctga 3061 aagaaaaagc cagcaccagc tcgagaattt ggaacgagaa cagagatttt taaagtggcg 3121 actggaacag ctgcagggtc ctcaggagat ggaacgaata cgaatggaca gcattggatc 3181 aactatttct tcagatcgtt ctgattcaga gcgagaggag attgaagtgg atgttgaaag 3241 cacagagttc tcccatggag aagtggacaa tataagtacc accagcatca gtgacattga 3301 tgaccacagc agcctgccga gtattgggag tgacgagggt tactccagtg ccagtgtcaa 3361 actttcattc acttcagcgg ccgctgaggg cagaggaagt cttctaacat gcggtgacgt 3421 ggaggagaat cccggccctt ccggaatgga gagcgacgag agcggcctgc ccgccatgga 3481 gatcgagtgc cgcatcaccg gcaccctgaa cggcgtggag ttcgagctgg tgggcggcgg 3541 agagggcacc cccaagcagg gccgcatgac caacaagatg aagagcacca aaggcgccct 3601 gaccttcagc ccctacctgc tgagccacgt gatgggctac ggcttctacc acttcggcac 3661 ctaccccagc ggctacgaga accccttcct gcacgccatc aacaacggcg gctacaccaa 3721 cacccgcatc gagaagtacg aggacggcgg cgtgctgcac gtgagcttca gctaccgcta 3781 cgaggccggc cgcgtgatcg gcgacttcaa ggtggtgggc accggcttcc ccgaggacag 3841 cgtgatcttc accgacaaga tcatccgcag caacgccacc gtggagcacc tgcaccccat 3901 gggcgataac gtgctggtgg gcagcttcgc ccgcaccttc agcctgcgcg acggcggcta 3961 ctacagcttc gtggtggaca gccacatgca cttcaagagc gccatccacc ccagcatcct 4021 gcagaacggg ggccccatgt tcgccttccg ccgcgtggag gagctgcaca gcaacaccga 4081 gctgggcatc gtggagtacc agcacgcctt caagaccccc atcgccttcg ccagatcccg 4141 cgctcagtcg tccaattctg ccgtggacgg caccgccgga cccggctcca ccggatctcg 4201 ctagagctga atctaagtcg acaatcaacc tctggattac aaaatttgtg aaagattgac 4261 tggtattctt aactatgttg ctccttttac gctatgtgga tacgctgctt taatgccttt 4321 gtatcatgct attgcttccc gtatggcttt cattttctcc tccttgtata aatcctggtt 4381 gctgtctctt tatgaggagt tgtggcccgt tgtcaggcaa cgtggcgtgg tgtgcactgt 4441 gtttgctgac gcaaccccca ctggttgggg cattgccacc acctgtcagc tcctttccgg 4501 gactttcgct ttccccctcc ctattgccac ggcggaactc atcgccgcct gccttgcccg 4561 ctgctggaca ggggctcggc tgttgggcac tgacaattcc gtggtgttgt cggggaaatc 4621 atcgtccttt ccttggctgc tcgcctgtgt tgccacctgg attctgcgcg ggacgtcctt 4681 ctgctacgtc ccttcggccc tcaatccagc ggaccttcct tcccgcggcc tgctgccggc 4741 tctgcggcct cttccgcgtc ttcgccttcg ccctcagacg agtcggatct ccctttgggc 4801 cgcctccccg cctggtacct ttaagaccaa tgacttacaa ggcagctgta gatcttagcc 4861 actttttaaa agaaaagggg ggactggaag ggctaattca ctcccaacga aaataagatc 4921 tgctttttgc ttgtactggg tctctctggt tagaccagat ctgagcctgg gagctctctg 4981 gctaactagg gaacccactg cttaagcctc aataaagctt gccttgagtg cttcaagtag 5041 tgtgtgcccg tctgttgtgt gactctggta actagagatc cctcagaccc ttttagtcag 5101 tgtggaaaat ctctagcagt agtagttcat gtcatcttat tattcagtat ttataacttg 5161 caaagaaatg aatatcagag agtgagagga acttgtttat tgcagcttat aatggttaca 5221 aataaagcaa tagcatcaca aatttcacaa ataaagcatt tttttcactg cattctagtt 5281 gtggtttgtc caaactcatc aatgtatctt atcatgtctg gctctagcta tcccgcccct 5341 aactccgccc agttccgccc attctccgcc ccatggctga ctaatttttt ttatttatgc 5401 agaggccgag gccgcctcgg cctctgagct attccagaag tagtgaggag gcttttttgg 5461 aggcctagac ttttgcagag acggcccaaa ttcgtaatca tggtcatagc tgtttcctgt 5521 gtgaaattgt tatccgctca caattccaca caacatacga gccggaagca taaagtgtaa 5581 agcctggggt gcctaatgag tgagctaact cacattaatt gcgttgcgct cactgcccgc 5641 tttccagtcg ggaaacctgt cgtgccagct gcattaatga atcggccaac gcgcggggag 5701 aggcggtttg cgtattgggc gctcttccgc ttcctcgctc actgactcgc tgcgctcggt 5761 cgttcggctg cggcgagcgg tatcagctca ctcaaaggcg gtaatacggt tatccacaga 5821 atcaggggat aacgcaggaa agaacatgtg agcaaaaggc cagcaaaagg ccaggaaccg 5881 taaaaaggcc gcgttgctgg cgtttttcca taggctccgc ccccctgacg agcatcacaa 5941 aaatcgacgc tcaagtcaga ggtggcgaaa cccgacagga ctataaagat accaggcgtt 6001 tccccctgga agctccctcg tgcgctctcc tgttccgacc ctgccgctta ccggatacct 6061 gtccgccttt ctcccttcgg gaagcgtggc gctttctcat agctcacgct gtaggtatct 6121 cagttcggtg taggtcgttc gctccaagct gggctgtgtg cacgaacccc ccgttcagcc 6181 cgaccgctgc gccttatccg gtaactatcg tcttgagtcc aacccggtaa gacacgactt 6241 atcgccactg gcagcagcca ctggtaacag gattagcaga gcgaggtatg taggcggtgc 6301 tacagagttc ttgaagtggt ggcctaacta cggctacact agaaggacag tatttggtat 6361 ctgcgctctg ctgaagccag ttaccttcgg aaaaagagtt ggtagctctt gatccggcaa 6421 acaaaccacc gctggtagcg gtggtttttt tgtttgcaag cagcagatta cgcgcagaaa 6481 aaaaggatct caagaagatc ctttgatctt ttctacgggg tctgacgctc agtggaacga 6541 aaactcacgt taagggattt tggtcatgag attatcaaaa aggatcttca cctagatcct 6601 tttaaattaa aaatgaagtt ttaaatcaat ctaaagtata tatgagtaaa cttggtctga 6661 cagttaccaa tgcttaatca gtgaggcacc tatctcagcg atctgtctat ttcgttcatc 6721 catagttgcc tgactccccg tcgtgtagat aactacgata cgggagggct taccatctgg 6781 ccccagtgct gcaatgatac cgcgagaccc acgctcaccg gctccagatt tatcagcaat 6841 aaaccagcca gccggaaggg ccgagcgcag aagtggtcct gcaactttat ccgcctccat 6901 ccagtctatt aattgttgcc gggaagctag agtaagtagt tcgccagtta atagtttgcg 6961 caacgttgtt gccattgcta caggcatcgt ggtgtcacgc tcgtcgtttg gtatggcttc 7021 attcagctcc ggttcccaac gatcaaggcg agttacatga tcccccatgt tgtgcaaaaa 7081 agcggttagc tccttcggtc ctccgatcgt tgtcagaagt aagttggccg cagtgttatc 7141 actcatggtt atggcagcac tgcataattc tcttactgtc atgccatccg taagatgctt 7201 ttctgtgact ggtgagtact caaccaagtc attctgagaa tagtgtatgc ggcgaccgag 7261 ttgctcttgc ccggcgtcaa tacgggataa taccgcgcca catagcagaa ctttaaaagt 7321 gctcatcatt ggaaaacgtt cttcggggcg aaaactctca aggatcttac cgctgttgag 7381 atccagttcg atgtaaccca ctcgtgcacc caactgatct tcagcatctt ttactttcac 7441 cagcgtttct gggtgagcaa aaacaggaag gcaaaatgcc gcaaaaaagg gaataagggc 7501 gacacggaaa tgttgaatac tcatactctt cctttttcaa tattattgaa gcatttatca 7561 gggttattgt ctcatgagcg gatacatatt tgaatgtatt tagaaaaata aacaaatagg 7621 ggttccgcgc acatttcccc gaaaagtgcc acctgacgtc taagaaacca ttattatcat 7681 gacattaacc tataaaaata ggcgtatcac gaggcccttt cgtctcgcgc gtttcggtga 7741 tgacggtgaa aacctctgac acatgcagct cccggagacg gtcacagctt gtctgtaagc 7801 ggatgccggg agcagacaag cccgtcaggg cgcgtcagcg ggtgttggcg ggtgtcgggg 7861 ctggcttaac tatgcggcat cagagcagat tgtactgaga gtgcaccata tgcggtgtga 7921 aataccgcac agatgcgtaa ggagaaaata ccgcatcagg cgccattcgc cattcaggct 7981 gcgcaactgt tgggaagggc gatcggtgcg ggcctcttcg ctattacgcc agctggcgaa 8041 agggggatgt gctgcaaggc gattaagttg ggtaacgcca gggttttccc agtcacgacg 8101 ttgtaaaacg acggccagtg ccaagctg //