LOCUS NW_006238919 18563 bp DNA UNK 01-JAN-1980 DEFINITION Capsella rubella cultivar Monte Gargano unplaced genomic scaffold, Caprub1_0 scaffold_5, whole genome shotgun sequence. ACCESSION NW_006238919 VERSION NW_006238919.1 KEYWORDS . SOURCE . ORGANISM . . FEATURES Location/Qualifiers cluster 1..18563 /note="Cluster number: 30" /note="Detection rule(s) for this cluster type: plants/plant: (minimum(4,[NAD_binding_4, FAE1_CUT1_RppA, HAD_RAM2_N, Orn_DAP_Arg_deC,Pyridoxal_deC,BBE,FA_hydroxylase,CER1-like_ C,ECH_2,Oxidored_FMN,3Beta_HSD,Glyco_hydro_1,ADH_N,ADH_N_2, Abhydrolase_3,Aldo_ket_red,cMT,nMT,oMT,adh_short,Chal_sti_s ynt_C,Chal_sti_synt_N,COesterase,UDPGT,Glyco_transf_28,Glyc os_transf_1,Glycos_transf_2,Lycopene_cycl,NAD_binding_1,p45 0,SQHop_cyclase_C,SQHop_cyclase_N,Prenyltrans,Terpene_synth _C,Terpene_synth,Transferase,Aminotran_1_2,AMP-binding,DIOX _N,Dirigent,Bet_v_1,Cu_amine_oxid,Str_synth,Trp_syntA,His_b iosynth,adh_short_C2,Peptidase_S10,Prenyltransf,Epimerase,2 OG-FeII_Oxy,Aminotran_3,Methyltransf_2,Methyltransf_3,Methy ltransf_7,PRISE,Cellulose_synt,Chalcone,ERG4_ERG24,FA_desat urase,FA_desaturase_2,Methyltransf_11,polyprenyl_synt,SE,SQ S_PSY,TPMT,UbiA,Lipoxygenase,Lyase_aromatic,HMGL-like,Chalc one_3,Chalcone_2,Acetyltransf_1,UDPGT_2,GMC_oxred_N,GMC_oxr ed_C,Amino_oxidase,DAHP_synth_1,DAHP_synth_2],[])); plants/saccharide: (minimum(3,[NAD_binding_4, FAE1_CUT1_RppA, HAD_RAM2_N, Orn_DAP_Arg_deC,Pyridoxal_deC,BBE,FA_hydroxylase,CER1-like_ C,ECH_2,Oxidored_FMN,3Beta_HSD,Glyco_hydro_1,ADH_N,ADH_N_2, Abhydrolase_3,Aldo_ket_red,cMT,nMT,oMT,adh_short,Chal_sti_s ynt_C,Chal_sti_synt_N,COesterase,UDPGT,Glyco_transf_28,Glyc os_transf_1,Glycos_transf_2,Lycopene_cycl,NAD_binding_1,p45 0,SQHop_cyclase_C,SQHop_cyclase_N,Prenyltrans,Terpene_synth _C,Terpene_synth,Transferase,Aminotran_1_2,AMP-binding,DIOX _N,Dirigent,Bet_v_1,Cu_amine_oxid,Str_synth,Trp_syntA,His_b iosynth,adh_short_C2,Peptidase_S10,Prenyltransf,Epimerase,2 OG-FeII_Oxy,Aminotran_3,Methyltransf_2,Methyltransf_3,Methy ltransf_7,PRISE,Cellulose_synt,Chalcone,ERG4_ERG24,FA_desat urase,FA_desaturase_2,Methyltransf_11,polyprenyl_synt,SE,SQ S_PSY,TPMT,UbiA,Lipoxygenase,Lyase_aromatic,HMGL-like,Chalc one_3,Chalcone_2,Acetyltransf_1,UDPGT_2,GMC_oxred_N,GMC_oxr ed_C,Amino_oxidase,DAHP_synth_1,DAHP_synth_2],[Glycos_trans f_1/Glycos_transf_2/Glycos_transf_28/UDPGT/UDPGT_2/Glyco_hy dro_1/Cellulose_synt]));" /cutoff=17925 /extension=3585 /product="saccharide" /clusterblast="1. CM032902.1_c153 Arabidopsis suecica isolate As9502 chromosome 3, whole gen... (100% of genes show similarity)" /clusterblast="2. LR999455.1_c163 Arabidopsis arenosa genome assembly, chromosome: 5 (87% of genes show similarity)" /clusterblast="3. NC_003074.8_c155 Arabidopsis thaliana chromosome 3, partial sequence (100% of genes show similarity)" /clusterblast="4. CM032915.1_c156 Arabidopsis thaliana x Arabidopsis arenosa isolate Allo738... (100% of genes show similarity)" /clusterblast="5. NW_003302551.1_c141 Arabidopsis lyrata subsp. lyrata unplaced genomic scaf... (87% of genes show similarity)" /clusterblast="6. OZ185640.1_c145 Arabidopsis halleri genome assembly, chromosome: 5 (87% of genes show similarity)" /clusterblast="7. CM032909.1_c400 Arabidopsis suecica isolate As9502 chromosome 10, whole ge... (87% of genes show similarity)" /clusterblast="9. NC_025690.1_c144 Camelina sativa cultivar DH55 chromosome 6, Cs, whole gen... (87% of genes show similarity)" /clusterblast="10. NC_025688.1_c87 Camelina sativa cultivar DH55 chromosome 4, Cs, whole gen... (87% of genes show similarity)" /clusterblast="11. JBANAX010000649.1_c190 Cardamine amara subsp. amara voucher SAV:0018104 c... (87% of genes show similarity)" gene complement(1328..3357) /gene="LOC17885200" /note="Derived by automated computational analysis using gene prediction method: Gnomon." /db_xref="GeneID:17885200" mRNA complement(join(1328..1637,1733..1853,1934..1980, 2069..2108,2309..2396,2483..2665,3161..3357)) /gene="LOC17885200" /product="vacuolar protein-sorting-associated protein 37 homolog 1" /note="Derived by automated computational analysis using gene prediction method: Gnomon. Supporting evidence includes similarity to: 4 Proteins, and 100% coverage of the annotated genomic feature by RNAseq alignments, including 15 samples with support for all annotated introns" /transcript_id="XM_006292241.2" /db_xref="GeneID:17885200" CDS complement(join(1477..1637,1733..1853,1934..1980, 2069..2108,2309..2396,2483..2665,3161..3174)) /gene="LOC17885200" /note="Derived by automated computational analysis using gene prediction method: Gnomon." /codon_start=1 /product="vacuolar protein-sorting-associated protein 37 homolog 1" /protein_id="XP_006292303.1" /db_xref="GeneID:17885200" /translation="MFNFWGSKEQQQGTSRPPEASSQSPWYSPSLVSSPSSSRPQTSGQ IPANVSPGEAAGIIAFLKDKSVDELRKLLSDKDAYQQFLLSLDQVKIQNNIKEELRRET LQIARENLEKEPQIMELRNQCRIIRTTELAAAQEKLNELERQKEEILKFYSPGSLLHKL QEAMNQVDEESEALQEKFLEKEIDTAAFVQKFKKLRTTYHRRALIHLAAKTSNI" /kmer_dict="{'MFN': [0], 'FNF': [1], 'NFW': [2], 'FWG': [3], 'WGS': [4], 'GSK': [5], 'SKE': [6], 'KEQ': [7], 'EQQ': [8], 'QQQ': [9], 'QQG': [10], 'QGT': [11], 'GTS': [12], 'TSR': [13], 'SRP': [14, 37], 'RPP': [15], 'PPE': [16], 'PEA': [17], 'EAS': [18], 'ASS': [19], 'SSQ': [20], 'SQS': [21], 'QSP': [22], 'SPW': [23], 'PWY': [24], 'WYS': [25], 'YSP': [26, 153], 'SPS': [27, 33], 'PSL': [28], 'SLV': [29], 'LVS': [30], 'VSS': [31], 'SSP': [32], 'PSS': [34], 'SSS': [35], 'SSR': [36], 'RPQ': [38], 'PQT': [39], 'QTS': [40], 'TSG': [41], 'SGQ': [42], 'GQI': [43], 'QIP': [44], 'IPA': [45], 'PAN': [46], 'ANV': [47], 'NVS': [48], 'VSP': [49], 'SPG': [50, 154], 'PGE': [51], 'GEA': [52], 'EAA': [53], 'AAG': [54], 'AGI': [55], 'GII': [56], 'IIA': [57], 'IAF': [58], 'AFL': [59], 'FLK': [60], 'LKD': [61], 'KDK': [62], 'DKS': [63], 'KSV': [64], 'SVD': [65], 'VDE': [66, 169], 'DEL': [67], 'ELR': [68, 98, 119], 'LRK': [69], 'RKL': [70], 'KLL': [71], 'LLS': [72, 83], 'LSD': [73], 'SDK': [74], 'DKD': [75], 'KDA': [76], 'DAY': [77], 'AYQ': [78], 'YQQ': [79], 'QQF': [80], 'QFL': [81], 'FLL': [82], 'LSL': [84], 'SLD': [85], 'LDQ': [86], 'DQV': [87], 'QVK': [88], 'VKI': [89], 'KIQ': [90], 'IQN': [91], 'QNN': [92], 'NNI': [93], 'NIK': [94], 'IKE': [95], 'KEE': [96, 146], 'EEL': [97], 'LRR': [99], 'RRE': [100], 'RET': [101], 'ETL': [102], 'TLQ': [103], 'LQI': [104], 'QIA': [105], 'IAR': [106], 'ARE': [107], 'REN': [108], 'ENL': [109], 'NLE': [110], 'LEK': [111, 181], 'EKE': [112, 182], 'KEP': [113], 'EPQ': [114], 'PQI': [115], 'QIM': [116], 'IME': [117], 'MEL': [118], 'LRN': [120], 'RNQ': [121], 'NQC': [122], 'QCR': [123], 'CRI': [124], 'RII': [125], 'IIR': [126], 'IRT': [127], 'RTT': [128, 198], 'TTE': [129], 'TEL': [130], 'ELA': [131], 'LAA': [132, 209], 'AAA': [133], 'AAQ': [134], 'AQE': [135], 'QEK': [136, 177], 'EKL': [137], 'KLN': [138], 'LNE': [139], 'NEL': [140], 'ELE': [141], 'LER': [142], 'ERQ': [143], 'RQK': [144], 'QKE': [145], 'EEI': [147], 'EIL': [148], 'ILK': [149], 'LKF': [150], 'KFY': [151], 'FYS': [152], 'PGS': [155], 'GSL': [156], 'SLL': [157], 'LLH': [158], 'LHK': [159], 'HKL': [160], 'KLQ': [161], 'LQE': [162, 176], 'QEA': [163], 'EAM': [164], 'AMN': [165], 'MNQ': [166], 'NQV': [167], 'QVD': [168], 'DEE': [170], 'EES': [171], 'ESE': [172], 'SEA': [173], 'EAL': [174], 'ALQ': [175], 'EKF': [178], 'KFL': [179], 'FLE': [180], 'KEI': [183], 'EID': [184], 'IDT': [185], 'DTA': [186], 'TAA': [187], 'AAF': [188], 'AFV': [189], 'FVQ': [190], 'VQK': [191], 'QKF': [192], 'KFK': [193], 'FKK': [194], 'KKL': [195], 'KLR': [196], 'LRT': [197], 'TTY': [199], 'TYH': [200], 'YHR': [201], 'HRR': [202], 'RRA': [203], 'RAL': [204], 'ALI': [205], 'LIH': [206], 'IHL': [207], 'HLA': [208], 'AAK': [210], 'AKT': [211], 'KTS': [212], 'TSN': [213]}" /ripp_evidence="{}" /top_kmer_word="ELR" /top_kmer_hits=68 /top_kmer_hits=98 /top_kmer_hits=119 /table="ELR" /table="ELR" /table="ELR" gene 3555..6333 /gene="LOC17887227" /note="Derived by automated computational analysis using gene prediction method: Gnomon." /db_xref="GeneID:17887227" mRNA join(3555..4083,4254..4550,4639..4836,4928..5029, 5131..5271,5341..5448,5598..5680,5773..5935,6042..6333) /gene="LOC17887227" /product="carotene epsilon-monooxygenase, chloroplastic" /note="Derived by automated computational analysis using gene prediction method: Gnomon. Supporting evidence includes similarity to: 3 Proteins, and 100% coverage of the annotated genomic feature by RNAseq alignments, including 13 samples with support for all annotated introns" /transcript_id="XM_023782454.1" /db_xref="GeneID:17887227" CDS join(3586..4083,4254..4550,4639..4836,4928..5029, 5131..5271,5341..5448,5598..5680,5773..5935,6042..6071) /gene="LOC17887227" /note="Derived by automated computational analysis using gene prediction method: Gnomon." /codon_start=1 /product="carotene epsilon-monooxygenase, chloroplastic" /protein_id="XP_023638222.1" /db_xref="GeneID:17887227" /translation="MESSLFSPSSSSIFTAKSTLLSSPKPKFFSFSIKSSIEKPKPKPK LETSSSKSQSWVSPDWLTSLTRTLSSGKNDDSGIPIASAKLDDVSDLLGGALFLPLYKW MNEYGPIYRLAAGPRNFVVVSDPAIAKHVLRNYPKYAKGLVAEVSEFLFGSGFAIAEGP LWTARRKAVVPSLHRRYLSVIVERVFCKSAERLVEKLQPYAKDGSAVNMEEKFSQLTLD VIGLSLFNYNFDSLTTDSPVIEAVYTALKEAELRSTDLLPYWKIDALCKIIPRQVKAEK AVTLIRETVEDLISKCKEIVEREGERINDEEYVNDADPSILRFLLASREEVSSVQLRDD LLSMLVAGHETTGSVLTWTLYLLSKNSSALAKAQEEVDRVLEGRNPAFEDIKELKYITR CINESMRLYPHPPVLIRRAQVPDILPGNYKVNTGQDIMISVYNIHRSSEVWEKAEEFLP ERFELEGAIPNETNTDFKFIPFSGGPRKCVGDQFALMEAIVALAVFLQRLNVELVPDQT ISMTTGATIHTTNGLYMKVSQR" /domain_record="plants/p450 (E-value: 6.9e-84, bitscore: 281.4, seeds: 50)" /sec_met="Type: saccharide" /sec_met="Domains detected: p450 (E-value: 6.9e-84, bitscore: 281.4, seeds: 50)" /sec_met="Kind: biosynthetic" /sec_met="Percentage identity: LOC17886373=32.258,LOC17887019=40.0,LOC17884861=29.167" /kmer_dict="{'MES': [0], 'ESS': [1], 'SSL': [2], 'SLF': [3, 226], 'LFS': [4], 'FSP': [5], 'SPS': [6], 'PSS': [7], 'SSS': [8, 9, 48], 'SSI': [10, 34], 'SIF': [11], 'IFT': [12], 'FTA': [13], 'TAK': [14], 'AKS': [15], 'KST': [16], 'STL': [17], 'TLL': [18], 'LLS': [19, 340, 361], 'LSS': [20, 68], 'SSP': [21], 'SPK': [22], 'PKP': [23, 39, 41], 'KPK': [24, 38, 40, 42], 'PKF': [25], 'KFF': [26], 'FFS': [27], 'FSF': [28], 'SFS': [29], 'FSI': [30], 'SIK': [31], 'IKS': [32], 'KSS': [33], 'SIE': [35], 'IEK': [36], 'EKP': [37], 'PKL': [43], 'KLE': [44], 'LET': [45], 'ETS': [46], 'TSS': [47], 'SSK': [49], 'SKS': [50], 'KSQ': [51], 'SQS': [52], 'QSW': [53], 'SWV': [54], 'WVS': [55], 'VSP': [56], 'SPD': [57], 'PDW': [58], 'DWL': [59], 'WLT': [60], 'LTS': [61], 'TSL': [62], 'SLT': [63, 234], 'LTR': [64], 'TRT': [65], 'RTL': [66], 'TLS': [67], 'SSG': [69], 'SGK': [70], 'GKN': [71], 'KND': [72], 'NDD': [73], 'DDS': [74], 'DSG': [75], 'SGI': [76], 'GIP': [77], 'IPI': [78], 'PIA': [79], 'IAS': [80], 'ASA': [81], 'SAK': [82], 'AKL': [83], 'KLD': [84], 'LDD': [85], 'DDV': [86], 'DVS': [87], 'VSD': [88, 123], 'SDL': [89], 'DLL': [90, 258, 339], 'LLG': [91], 'LGG': [92], 'GGA': [93], 'GAL': [94], 'ALF': [95], 'LFL': [96], 'FLP': [97, 455], 'LPL': [98], 'PLY': [99], 'LYK': [100], 'YKW': [101], 'KWM': [102], 'WMN': [103], 'MNE': [104], 'NEY': [105], 'EYG': [106], 'YGP': [107], 'GPI': [108], 'PIY': [109], 'IYR': [110], 'YRL': [111], 'RLA': [112], 'LAA': [113], 'AAG': [114], 'AGP': [115], 'GPR': [116, 482], 'PRN': [117], 'RNF': [118], 'NFV': [119], 'FVV': [120], 'VVV': [121], 'VVS': [122], 'SDP': [124], 'DPA': [125], 'PAI': [126], 'AIA': [127, 157], 'IAK': [128], 'AKH': [129], 'KHV': [130], 'HVL': [131], 'VLR': [132], 'LRN': [133], 'RNY': [134], 'NYP': [135], 'YPK': [136], 'PKY': [137], 'KYA': [138], 'YAK': [139, 202], 'AKG': [140], 'KGL': [141], 'GLV': [142], 'LVA': [143, 344], 'VAE': [144], 'AEV': [145], 'EVS': [146, 330], 'VSE': [147], 'SEF': [148], 'EFL': [149, 454], 'FLF': [150], 'LFG': [151], 'FGS': [152], 'GSG': [153], 'SGF': [154], 'GFA': [155], 'FAI': [156], 'IAE': [158], 'AEG': [159], 'EGP': [160], 'GPL': [161], 'PLW': [162], 'LWT': [163], 'WTA': [164], 'TAR': [165], 'ARR': [166], 'RRK': [167], 'RKA': [168], 'KAV': [169, 280], 'AVV': [170], 'VVP': [171], 'VPS': [172], 'PSL': [173], 'SLH': [174], 'LHR': [175], 'HRR': [176], 'RRY': [177], 'RYL': [178], 'YLS': [179], 'LSV': [180], 'SVI': [181], 'VIV': [182], 'IVE': [183, 299], 'VER': [184, 300], 'ERV': [185], 'RVF': [186], 'VFC': [187], 'FCK': [188], 'CKS': [189], 'KSA': [190], 'SAE': [191], 'AER': [192], 'ERL': [193], 'RLV': [194], 'LVE': [195], 'VEK': [196], 'EKL': [197], 'KLQ': [198], 'LQP': [199], 'QPY': [200], 'PYA': [201], 'AKD': [203], 'KDG': [204], 'DGS': [205], 'GSA': [206], 'SAV': [207], 'AVN': [208], 'VNM': [209], 'NME': [210], 'MEE': [211], 'EEK': [212], 'EKF': [213], 'KFS': [214], 'FSQ': [215], 'SQL': [216], 'QLT': [217], 'LTL': [218], 'TLD': [219], 'LDV': [220], 'DVI': [221], 'VIG': [222], 'IGL': [223], 'GLS': [224], 'LSL': [225], 'LFN': [227], 'FNY': [228], 'NYN': [229], 'YNF': [230], 'NFD': [231], 'FDS': [232], 'DSL': [233], 'LTT': [235], 'TTD': [236], 'TDS': [237], 'DSP': [238], 'SPV': [239], 'PVI': [240], 'VIE': [241], 'IEA': [242], 'EAV': [243], 'AVY': [244], 'VYT': [245], 'YTA': [246], 'TAL': [247], 'ALK': [248], 'LKE': [249], 'KEA': [250], 'EAE': [251], 'AEL': [252], 'ELR': [253], 'LRS': [254], 'RST': [255], 'STD': [256], 'TDL': [257], 'LLP': [259], 'LPY': [260], 'PYW': [261], 'YWK': [262], 'WKI': [263], 'KID': [264], 'IDA': [265], 'DAL': [266], 'ALC': [267], 'LCK': [268], 'CKI': [269], 'KII': [270], 'IIP': [271], 'IPR': [272], 'PRQ': [273], 'RQV': [274], 'QVK': [275], 'VKA': [276], 'KAE': [277, 451], 'AEK': [278], 'EKA': [279, 450], 'AVT': [281], 'VTL': [282], 'TLI': [283], 'LIR': [284, 413], 'IRE': [285], 'RET': [286], 'ETV': [287], 'TVE': [288], 'VED': [289], 'EDL': [290], 'DLI': [291], 'LIS': [292], 'ISK': [293], 'SKC': [294], 'KCK': [295], 'CKE': [296], 'KEI': [297], 'EIV': [298], 'ERE': [301], 'REG': [302], 'EGE': [303], 'GER': [304], 'ERI': [305], 'RIN': [306], 'IND': [307], 'NDE': [308], 'DEE': [309], 'EEY': [310], 'EYV': [311], 'YVN': [312], 'VND': [313], 'NDA': [314], 'DAD': [315], 'ADP': [316], 'DPS': [317], 'PSI': [318], 'SIL': [319], 'ILR': [320], 'LRF': [321], 'RFL': [322], 'FLL': [323], 'LLA': [324], 'LAS': [325], 'ASR': [326], 'SRE': [327], 'REE': [328], 'EEV': [329, 374], 'VSS': [331], 'SSV': [332], 'SVQ': [333], 'VQL': [334], 'QLR': [335], 'LRD': [336], 'RDD': [337], 'DDL': [338], 'LSM': [341], 'SML': [342], 'MLV': [343], 'VAG': [345], 'AGH': [346], 'GHE': [347], 'HET': [348], 'ETT': [349], 'TTG': [350, 520], 'TGS': [351], 'GSV': [352], 'SVL': [353], 'VLT': [354], 'LTW': [355], 'TWT': [356], 'WTL': [357], 'TLY': [358], 'LYL': [359], 'YLL': [360], 'LSK': [362], 'SKN': [363], 'KNS': [364], 'NSS': [365], 'SSA': [366], 'SAL': [367], 'ALA': [368, 499], 'LAK': [369], 'AKA': [370], 'KAQ': [371], 'AQE': [372], 'QEE': [373], 'EVD': [375], 'VDR': [376], 'DRV': [377], 'RVL': [378], 'VLE': [379], 'LEG': [380, 462], 'EGR': [381], 'GRN': [382], 'RNP': [383], 'NPA': [384], 'PAF': [385], 'AFE': [386], 'FED': [387], 'EDI': [388], 'DIK': [389], 'IKE': [390], 'KEL': [391], 'ELK': [392], 'LKY': [393], 'KYI': [394], 'YIT': [395], 'ITR': [396], 'TRC': [397], 'RCI': [398], 'CIN': [399], 'INE': [400], 'NES': [401], 'ESM': [402], 'SMR': [403], 'MRL': [404], 'RLY': [405], 'LYP': [406], 'YPH': [407], 'PHP': [408], 'HPP': [409], 'PPV': [410], 'PVL': [411], 'VLI': [412], 'IRR': [414], 'RRA': [415], 'RAQ': [416], 'AQV': [417], 'QVP': [418], 'VPD': [419, 512], 'PDI': [420], 'DIL': [421], 'ILP': [422], 'LPG': [423], 'PGN': [424], 'GNY': [425], 'NYK': [426], 'YKV': [427], 'KVN': [428], 'VNT': [429], 'NTG': [430], 'TGQ': [431], 'GQD': [432], 'QDI': [433], 'DIM': [434], 'IMI': [435], 'MIS': [436], 'ISV': [437], 'SVY': [438], 'VYN': [439], 'YNI': [440], 'NIH': [441], 'IHR': [442], 'HRS': [443], 'RSS': [444], 'SSE': [445], 'SEV': [446], 'EVW': [447], 'VWE': [448], 'WEK': [449], 'AEE': [452], 'EEF': [453], 'LPE': [456], 'PER': [457], 'ERF': [458], 'RFE': [459], 'FEL': [460], 'ELE': [461], 'EGA': [463], 'GAI': [464], 'AIP': [465], 'IPN': [466], 'PNE': [467], 'NET': [468], 'ETN': [469], 'TNT': [470], 'NTD': [471], 'TDF': [472], 'DFK': [473], 'FKF': [474], 'KFI': [475], 'FIP': [476], 'IPF': [477], 'PFS': [478], 'FSG': [479], 'SGG': [480], 'GGP': [481], 'PRK': [483], 'RKC': [484], 'KCV': [485], 'CVG': [486], 'VGD': [487], 'GDQ': [488], 'DQF': [489], 'QFA': [490], 'FAL': [491], 'ALM': [492], 'LME': [493], 'MEA': [494], 'EAI': [495], 'AIV': [496], 'IVA': [497], 'VAL': [498], 'LAV': [500], 'AVF': [501], 'VFL': [502], 'FLQ': [503], 'LQR': [504], 'QRL': [505], 'RLN': [506], 'LNV': [507], 'NVE': [508], 'VEL': [509], 'ELV': [510], 'LVP': [511], 'PDQ': [513], 'DQT': [514], 'QTI': [515], 'TIS': [516], 'ISM': [517], 'SMT': [518], 'MTT': [519], 'TGA': [521], 'GAT': [522], 'ATI': [523], 'TIH': [524], 'IHT': [525], 'HTT': [526], 'TTN': [527], 'TNG': [528], 'NGL': [529], 'GLY': [530], 'LYM': [531], 'YMK': [532], 'MKV': [533], 'KVS': [534], 'VSQ': [535]}" /ripp_evidence="{}" /top_kmer_word="KPK" /top_kmer_hits=24 /top_kmer_hits=38 /top_kmer_hits=40 /top_kmer_hits=42 /table="KPK" /table="KPK" /table="KPK" /table="KPK" gene 7000..9072 /gene="LOC17886373" /note="Derived by automated computational analysis using gene prediction method: Gnomon." /db_xref="GeneID:17886373" mRNA join(7000..7419,7750..8086,8189..8253,8660..9072) /gene="LOC17886373" /product="caffeic acid 3-O-methyltransferase" /note="Derived by automated computational analysis using gene prediction method: Gnomon. Supporting evidence includes similarity to: 1 Protein, and 100% coverage of the annotated genomic feature by RNAseq alignments, including 13 samples with support for all annotated introns" /transcript_id="XM_006291309.2" /db_xref="GeneID:17886373" CDS join(7042..7419,7750..8086,8189..8253,8660..8959) /gene="LOC17886373" /note="Derived by automated computational analysis using gene prediction method: Gnomon." /codon_start=1 /product="caffeic acid 3-O-methyltransferase" /protein_id="XP_006291371.1" /db_xref="GeneID:17886373" /translation="MEKESSESRNRARLAIMELANMISVPMSLNAAVRLGIADAIWNGG ANSPLSASEILPRLLIPSATTTGGDPENLQRILRMLTSYGVFSEHLVGSSERKFSLTDV GKTLVTDSDGLSYAAYILQHHQEALMRAWPLVHTAVVEPETEPYVKANGEAAYVQYGKS EEMNSLMLKAMSGVSVPFMKAILEGYEGFKSVERLVDVGGSAGDCLRMILQHFPNVREG INFDLPEVVAKAPNIPGVSHVGGDMFQSVPSGDAIFMKWVLTTWTDEECKEIMKNCYNA LPVGGKLIACEPVLPKETDDSHRTRALLEGDIFVMTIYRTKGKHRTEEEFKELGLSAGF PTFRPFYIDYFYTILEFQK" /domain_record="plants/Methyltransf_2 (E-value: 5.3e-52, bitscore: 175.4, seeds: 9); plants/Dimerisation (E-value: 7.2e-08, bitscore: 31.5, seeds: 30)" /sec_met="Type: saccharide" /sec_met="Domains detected: Methyltransf_2 (E-value: 5.3e-52, bitscore: 175.4, seeds: 9);Dimerisation (E-value: 7.2e-08, bitscore: 31.5, seeds: 30)" /sec_met="Kind: biosynthetic" /sec_met="Percentage identity: LOC17887227=32.258,LOC17887019=53.846,LOC17884861=42.857" /kmer_dict="{'MEK': [0], 'EKE': [1], 'KES': [2], 'ESS': [3], 'SSE': [4, 93], 'SES': [5], 'ESR': [6], 'SRN': [7], 'RNR': [8], 'NRA': [9], 'RAR': [10], 'ARL': [11], 'RLA': [12], 'LAI': [13], 'AIM': [14], 'IME': [15], 'MEL': [16], 'ELA': [17], 'LAN': [18], 'ANM': [19], 'NMI': [20], 'MIS': [21], 'ISV': [22], 'SVP': [23, 177, 249], 'VPM': [24], 'PMS': [25], 'MSL': [26], 'SLN': [27], 'LNA': [28], 'NAA': [29], 'AAV': [30], 'AVR': [31], 'VRL': [32], 'RLG': [33], 'LGI': [34], 'GIA': [35], 'IAD': [36], 'ADA': [37], 'DAI': [38, 254], 'AIW': [39], 'IWN': [40], 'WNG': [41], 'NGG': [42], 'GGA': [43], 'GAN': [44], 'ANS': [45], 'NSP': [46], 'SPL': [47], 'PLS': [48], 'LSA': [49, 335], 'SAS': [50], 'ASE': [51], 'SEI': [52], 'EIL': [53], 'ILP': [54], 'LPR': [55], 'PRL': [56], 'RLL': [57], 'LLI': [58], 'LIP': [59], 'IPS': [60], 'PSA': [61], 'SAT': [62], 'ATT': [63], 'TTT': [64], 'TTG': [65], 'TGG': [66], 'GGD': [67, 243], 'GDP': [68], 'DPE': [69], 'PEN': [70], 'ENL': [71], 'NLQ': [72], 'LQR': [73], 'QRI': [74], 'RIL': [75], 'ILR': [76], 'LRM': [77, 208], 'RML': [78], 'MLT': [79], 'LTS': [80], 'TSY': [81], 'SYG': [82], 'YGV': [83], 'GVF': [84], 'VFS': [85], 'FSE': [86], 'SEH': [87], 'EHL': [88], 'HLV': [89], 'LVG': [90], 'VGS': [91], 'GSS': [92], 'SER': [94], 'ERK': [95], 'RKF': [96], 'KFS': [97], 'FSL': [98], 'SLT': [99], 'LTD': [100], 'TDV': [101], 'DVG': [102, 199], 'VGK': [103], 'GKT': [104], 'KTL': [105], 'TLV': [106], 'LVT': [107], 'VTD': [108], 'TDS': [109], 'DSD': [110], 'SDG': [111], 'DGL': [112], 'GLS': [113, 334], 'LSY': [114], 'SYA': [115], 'YAA': [116], 'AAY': [117, 154], 'AYI': [118], 'YIL': [119], 'ILQ': [120, 211], 'LQH': [121, 212], 'QHH': [122], 'HHQ': [123], 'HQE': [124], 'QEA': [125], 'EAL': [126], 'ALM': [127], 'LMR': [128], 'MRA': [129], 'RAW': [130], 'AWP': [131], 'WPL': [132], 'PLV': [133], 'LVH': [134], 'VHT': [135], 'HTA': [136], 'TAV': [137], 'AVV': [138], 'VVE': [139], 'VEP': [140], 'EPE': [141], 'PET': [142], 'ETE': [143], 'TEP': [144], 'EPY': [145], 'PYV': [146], 'YVK': [147], 'VKA': [148], 'KAN': [149], 'ANG': [150], 'NGE': [151], 'GEA': [152], 'EAA': [153], 'AYV': [155], 'YVQ': [156], 'VQY': [157], 'QYG': [158], 'YGK': [159], 'GKS': [160], 'KSE': [161], 'SEE': [162], 'EEM': [163], 'EMN': [164], 'MNS': [165], 'NSL': [166], 'SLM': [167], 'LML': [168], 'MLK': [169], 'LKA': [170], 'KAM': [171], 'AMS': [172], 'MSG': [173], 'SGV': [174], 'GVS': [175, 238], 'VSV': [176], 'VPF': [178], 'PFM': [179], 'FMK': [180, 257], 'MKA': [181], 'KAI': [182], 'AIL': [183], 'ILE': [184, 353], 'LEG': [185, 308], 'EGY': [186], 'GYE': [187], 'YEG': [188], 'EGF': [189], 'GFK': [190], 'FKS': [191], 'KSV': [192], 'SVE': [193], 'VER': [194], 'ERL': [195], 'RLV': [196], 'LVD': [197], 'VDV': [198], 'VGG': [200, 242, 283], 'GGS': [201], 'GSA': [202], 'SAG': [203, 336], 'AGD': [204], 'GDC': [205], 'DCL': [206], 'CLR': [207], 'RMI': [209], 'MIL': [210], 'QHF': [213], 'HFP': [214], 'FPN': [215], 'PNV': [216], 'NVR': [217], 'VRE': [218], 'REG': [219], 'EGI': [220], 'GIN': [221], 'INF': [222], 'NFD': [223], 'FDL': [224], 'DLP': [225], 'LPE': [226], 'PEV': [227], 'EVV': [228], 'VVA': [229], 'VAK': [230], 'AKA': [231], 'KAP': [232], 'APN': [233], 'PNI': [234], 'NIP': [235], 'IPG': [236], 'PGV': [237], 'VSH': [239], 'SHV': [240], 'HVG': [241], 'GDM': [244], 'DMF': [245], 'MFQ': [246], 'FQS': [247], 'QSV': [248], 'VPS': [250], 'PSG': [251], 'SGD': [252], 'GDA': [253], 'AIF': [255], 'IFM': [256], 'MKW': [258], 'KWV': [259], 'WVL': [260], 'VLT': [261], 'LTT': [262], 'TTW': [263], 'TWT': [264], 'WTD': [265], 'TDE': [266], 'DEE': [267], 'EEC': [268], 'ECK': [269], 'CKE': [270], 'KEI': [271], 'EIM': [272], 'IMK': [273], 'MKN': [274], 'KNC': [275], 'NCY': [276], 'CYN': [277], 'YNA': [278], 'NAL': [279], 'ALP': [280], 'LPV': [281], 'PVG': [282], 'GGK': [284], 'GKL': [285], 'KLI': [286], 'LIA': [287], 'IAC': [288], 'ACE': [289], 'CEP': [290], 'EPV': [291], 'PVL': [292], 'VLP': [293], 'LPK': [294], 'PKE': [295], 'KET': [296], 'ETD': [297], 'TDD': [298], 'DDS': [299], 'DSH': [300], 'SHR': [301], 'HRT': [302, 324], 'RTR': [303], 'TRA': [304], 'RAL': [305], 'ALL': [306], 'LLE': [307], 'EGD': [309], 'GDI': [310], 'DIF': [311], 'IFV': [312], 'FVM': [313], 'VMT': [314], 'MTI': [315], 'TIY': [316], 'IYR': [317], 'YRT': [318], 'RTK': [319], 'TKG': [320], 'KGK': [321], 'GKH': [322], 'KHR': [323], 'RTE': [325], 'TEE': [326], 'EEE': [327], 'EEF': [328], 'EFK': [329], 'FKE': [330], 'KEL': [331], 'ELG': [332], 'LGL': [333], 'AGF': [337], 'GFP': [338], 'FPT': [339], 'PTF': [340], 'TFR': [341], 'FRP': [342], 'RPF': [343], 'PFY': [344], 'FYI': [345], 'YID': [346], 'IDY': [347], 'DYF': [348], 'YFY': [349], 'FYT': [350], 'YTI': [351], 'TIL': [352], 'LEF': [354], 'EFQ': [355]}" /ripp_evidence="{'.L.Y..Y': [113]}" /top_kmer_word="SVP" /top_kmer_hits=23 /top_kmer_hits=177 /top_kmer_hits=249 /table="SVP" /table="SVP" /table="SVP" /cyclopeptide_analysis="////MEKESSESRNRARLAIMELANMISVPMSLNA AVRLGIADAIWNGGANSPLSASEILPRLLIPSATTTGGDPENLQRILRMLTSYGVFSEH LVGSSERKFSLTDVGKTLVTDSDGLSYAAYILQHHQEALMRAWPLVHTAVVEPETEPYV KANGEAAYVQYGKSEEMNSLMLKAMSGVSVPFMKAILEGYEGFKSVERLVDVGGSAGDC LRMILQHFPNVREGINFDLPEVVAKAPNIPGVSHVGGDMFQSVPSGDAIFMKWVLTTWT DEECKEIMKNCYNALPVGGKLIACEPVLPKETDDSHRTRALLEGDIFVMTIYRTKGKHR TEEEFKELGLSAGFPTFRPFYIDYFYTILEFQK//CDS//9815577|9817495//LO C17886373//.L.Y..Y//[113]" gene complement(8985..10789) /gene="LOC17887019" /note="Derived by automated computational analysis using gene prediction method: Gnomon." /db_xref="GeneID:17887019" mRNA complement(8985..10789) /gene="LOC17887019" /product="UDP-glycosyltransferase 73D1" /note="Derived by automated computational analysis using gene prediction method: Gnomon. Supporting evidence includes similarity to: 4 Proteins, and 74% coverage of the annotated genomic feature by RNAseq alignments" /transcript_id="XM_006292180.2" /db_xref="GeneID:17887019" CDS complement(9221..10789) /gene="LOC17887019" /note="Derived by automated computational analysis using gene prediction method: Gnomon." /codon_start=1 /product="UDP-glycosyltransferase 73D1" /protein_id="XP_006292242.2" /db_xref="GeneID:17887019" /translation="MRKHLLNPKMETAIDSKAKGLHFVLIPLMAQGHLIPMVDISKILA RQGNIVTIVTTPQNASRFVKTVDRARSEAGLEINVVTFPIPYKDFGLPKDCETLDTLPS KDLLRRFYDALDKLQDPLERFLEQQDIPPSCIISDKCLVWTSKTAKRFKIPRIVFHGMC CFSLLSSHNLHLHSPHLSVSSASEPFSIPAMPHRIEIARAQLPGAFEKLANMDDVRDKM RESESEAFGVIVNSFQELEPGYAEAYAEAINMKVWFVGPVSLCNDRMADLFDRGNNCNI AISKTECLHFLDSMRPRSVLYVCLGSLCRLIPNQLIELGLGLEESGKPFIWVIKTEEKH MNELDEWLKQENFEERVRGRGIVIKGWSPQAMILSHGSTGGFLSHCGWNSTIEAICFGV PMITWPLFAEQFLNEKLIVEILKIGVRVGVEIPVRWGDEEKVGVLVTKQRVVKAIKLLM DEDCQRVDDDVHSEFVRRRRRIQELAVMAKKAVNDKGSSSINVSILMQDVLEHLSLDRV EKFSL" /domain_record="plants/UDPGT_2 (E-value: 2.5e-72, bitscore: 243.6, seeds: 248)" /sec_met="Type: saccharide" /sec_met="Domains detected: UDPGT_2 (E-value: 2.5e-72, bitscore: 243.6, seeds: 248)" /sec_met="Kind: biosynthetic" /sec_met="Percentage identity: LOC17887227=40.0,LOC17886373=53.846,LOC17884861=45.639" /kmer_dict="{'MRK': [0], 'RKH': [1], 'KHL': [2], 'HLL': [3], 'LLN': [4], 'LNP': [5], 'NPK': [6], 'PKM': [7], 'KME': [8], 'MET': [9], 'ETA': [10], 'TAI': [11], 'AID': [12], 'IDS': [13], 'DSK': [14], 'SKA': [15], 'KAK': [16], 'AKG': [17], 'KGL': [18], 'GLH': [19], 'LHF': [20, 288], 'HFV': [21], 'FVL': [22], 'VLI': [23], 'LIP': [24, 33, 310], 'IPL': [25], 'PLM': [26], 'LMA': [27], 'MAQ': [28], 'AQG': [29], 'QGH': [30], 'GHL': [31], 'HLI': [32], 'IPM': [34], 'PMV': [35], 'MVD': [36], 'VDI': [37], 'DIS': [38], 'ISK': [39, 282], 'SKI': [40], 'KIL': [41], 'ILA': [42], 'LAR': [43], 'ARQ': [44], 'RQG': [45], 'QGN': [46], 'GNI': [47], 'NIV': [48], 'IVT': [49, 52], 'VTI': [50], 'TIV': [51], 'VTT': [53], 'TTP': [54], 'TPQ': [55], 'PQN': [56], 'QNA': [57], 'NAS': [58], 'ASR': [59], 'SRF': [60], 'RFV': [61], 'FVK': [62], 'VKT': [63], 'KTV': [64], 'TVD': [65], 'VDR': [66], 'DRA': [67], 'RAR': [68], 'ARS': [69], 'RSE': [70], 'SEA': [71, 226], 'EAG': [72], 'AGL': [73], 'GLE': [74, 321], 'LEI': [75], 'EIN': [76], 'INV': [77, 498], 'NVV': [78], 'VVT': [79], 'VTF': [80], 'TFP': [81], 'FPI': [82], 'PIP': [83], 'IPY': [84], 'PYK': [85], 'YKD': [86], 'KDF': [87], 'DFG': [88], 'FGL': [89], 'GLP': [90], 'LPK': [91], 'PKD': [92], 'KDC': [93], 'DCE': [94], 'CET': [95], 'ETL': [96], 'TLD': [97], 'LDT': [98], 'DTL': [99], 'TLP': [100], 'LPS': [101], 'PSK': [102], 'SKD': [103], 'KDL': [104], 'DLL': [105], 'LLR': [106], 'LRR': [107], 'RRF': [108], 'RFY': [109], 'FYD': [110], 'YDA': [111], 'DAL': [112], 'ALD': [113], 'LDK': [114], 'DKL': [115], 'KLQ': [116], 'LQD': [117], 'QDP': [118], 'DPL': [119], 'PLE': [120], 'LER': [121], 'ERF': [122], 'RFL': [123], 'FLE': [124], 'LEQ': [125], 'EQQ': [126], 'QQD': [127], 'QDI': [128], 'DIP': [129], 'IPP': [130], 'PPS': [131], 'PSC': [132], 'SCI': [133], 'CII': [134], 'IIS': [135], 'ISD': [136], 'SDK': [137], 'DKC': [138], 'KCL': [139], 'CLV': [140], 'LVW': [141], 'VWT': [142], 'WTS': [143], 'TSK': [144], 'SKT': [145, 283], 'KTA': [146], 'TAK': [147], 'AKR': [148], 'KRF': [149], 'RFK': [150], 'FKI': [151], 'KIP': [152], 'IPR': [153], 'PRI': [154], 'RIV': [155], 'IVF': [156], 'VFH': [157], 'FHG': [158], 'HGM': [159], 'GMC': [160], 'MCC': [161], 'CCF': [162], 'CFS': [163], 'FSL': [164], 'SLL': [165], 'LLS': [166], 'LSS': [167], 'SSH': [168], 'SHN': [169], 'HNL': [170], 'NLH': [171], 'LHL': [172], 'HLH': [173], 'LHS': [174], 'HSP': [175], 'SPH': [176], 'PHL': [177], 'HLS': [178, 510], 'LSV': [179], 'SVS': [180], 'VSS': [181], 'SSA': [182], 'SAS': [183], 'ASE': [184], 'SEP': [185], 'EPF': [186], 'PFS': [187], 'FSI': [188], 'SIP': [189], 'IPA': [190], 'PAM': [191], 'AMP': [192], 'MPH': [193], 'PHR': [194], 'HRI': [195], 'RIE': [196], 'IEI': [197], 'EIA': [198], 'IAR': [199], 'ARA': [200], 'RAQ': [201], 'AQL': [202], 'QLP': [203], 'LPG': [204], 'PGA': [205], 'GAF': [206], 'AFE': [207], 'FEK': [208], 'EKL': [209, 413], 'KLA': [210], 'LAN': [211], 'ANM': [212], 'NMD': [213], 'MDD': [214], 'DDV': [215, 466], 'DVR': [216], 'VRD': [217], 'RDK': [218], 'DKM': [219], 'KMR': [220], 'MRE': [221], 'RES': [222], 'ESE': [223, 225], 'SES': [224], 'EAF': [227], 'AFG': [228], 'FGV': [229, 396], 'GVI': [230], 'VIV': [231], 'IVN': [232], 'VNS': [233], 'NSF': [234], 'SFQ': [235], 'FQE': [236], 'QEL': [237, 480], 'ELE': [238], 'LEP': [239], 'EPG': [240], 'PGY': [241], 'GYA': [242], 'YAE': [243, 247], 'AEA': [244, 248], 'EAY': [245], 'AYA': [246], 'EAI': [249, 392], 'AIN': [250], 'INM': [251], 'NMK': [252], 'MKV': [253], 'KVW': [254], 'VWF': [255], 'WFV': [256], 'FVG': [257], 'VGP': [258], 'GPV': [259], 'PVS': [260], 'VSL': [261], 'SLC': [262, 306], 'LCN': [263], 'CND': [264], 'NDR': [265], 'DRM': [266], 'RMA': [267], 'MAD': [268], 'ADL': [269], 'DLF': [270], 'LFD': [271], 'FDR': [272], 'DRG': [273], 'RGN': [274], 'GNN': [275], 'NNC': [276], 'NCN': [277], 'CNI': [278], 'NIA': [279], 'IAI': [280], 'AIS': [281], 'KTE': [284, 334], 'TEC': [285], 'ECL': [286], 'CLH': [287], 'HFL': [289], 'FLD': [290], 'LDS': [291], 'DSM': [292], 'SMR': [293], 'MRP': [294], 'RPR': [295], 'PRS': [296], 'RSV': [297], 'SVL': [298], 'VLY': [299], 'LYV': [300], 'YVC': [301], 'VCL': [302], 'CLG': [303], 'LGS': [304], 'GSL': [305], 'LCR': [307], 'CRL': [308], 'RLI': [309], 'IPN': [311], 'PNQ': [312], 'NQL': [313], 'QLI': [314], 'LIE': [315], 'IEL': [316], 'ELG': [317], 'LGL': [318, 320], 'GLG': [319], 'LEE': [322], 'EES': [323], 'ESG': [324], 'SGK': [325], 'GKP': [326], 'KPF': [327], 'PFI': [328], 'FIW': [329], 'IWV': [330], 'WVI': [331], 'VIK': [332, 362], 'IKT': [333], 'TEE': [335], 'EEK': [336, 437], 'EKH': [337], 'KHM': [338], 'HMN': [339], 'MNE': [340], 'NEL': [341], 'ELD': [342], 'LDE': [343], 'DEW': [344], 'EWL': [345], 'WLK': [346], 'LKQ': [347], 'KQE': [348], 'QEN': [349], 'ENF': [350], 'NFE': [351], 'FEE': [352], 'EER': [353], 'ERV': [354], 'RVR': [355], 'VRG': [356], 'RGR': [357], 'GRG': [358], 'RGI': [359], 'GIV': [360], 'IVI': [361], 'IKG': [363], 'KGW': [364], 'GWS': [365], 'WSP': [366], 'SPQ': [367], 'PQA': [368], 'QAM': [369], 'AMI': [370], 'MIL': [371], 'ILS': [372], 'LSH': [373, 382], 'SHG': [374], 'HGS': [375], 'GST': [376], 'STG': [377], 'TGG': [378], 'GGF': [379], 'GFL': [380], 'FLS': [381], 'SHC': [383], 'HCG': [384], 'CGW': [385], 'GWN': [386], 'WNS': [387], 'NST': [388], 'STI': [389], 'TIE': [390], 'IEA': [391], 'AIC': [393], 'ICF': [394], 'CFG': [395], 'GVP': [397], 'VPM': [398], 'PMI': [399], 'MIT': [400], 'ITW': [401], 'TWP': [402], 'WPL': [403], 'PLF': [404], 'LFA': [405], 'FAE': [406], 'AEQ': [407], 'EQF': [408], 'QFL': [409], 'FLN': [410], 'LNE': [411], 'NEK': [412], 'KLI': [414], 'LIV': [415], 'IVE': [416], 'VEI': [417, 428], 'EIL': [418], 'ILK': [419], 'LKI': [420], 'KIG': [421], 'IGV': [422], 'GVR': [423], 'VRV': [424], 'RVG': [425], 'VGV': [426, 440], 'GVE': [427], 'EIP': [429], 'IPV': [430], 'PVR': [431], 'VRW': [432], 'RWG': [433], 'WGD': [434], 'GDE': [435], 'DEE': [436], 'EKV': [438], 'KVG': [439], 'GVL': [441], 'VLV': [442], 'LVT': [443], 'VTK': [444], 'TKQ': [445], 'KQR': [446], 'QRV': [447, 462], 'RVV': [448], 'VVK': [449], 'VKA': [450], 'KAI': [451], 'AIK': [452], 'IKL': [453], 'KLL': [454], 'LLM': [455], 'LMD': [456], 'MDE': [457], 'DED': [458], 'EDC': [459], 'DCQ': [460], 'CQR': [461], 'RVD': [463], 'VDD': [464], 'DDD': [465], 'DVH': [467], 'VHS': [468], 'HSE': [469], 'SEF': [470], 'EFV': [471], 'FVR': [472], 'VRR': [473], 'RRR': [474, 475, 476], 'RRI': [477], 'RIQ': [478], 'IQE': [479], 'ELA': [481], 'LAV': [482], 'AVM': [483], 'VMA': [484], 'MAK': [485], 'AKK': [486], 'KKA': [487], 'KAV': [488], 'AVN': [489], 'VND': [490], 'NDK': [491], 'DKG': [492], 'KGS': [493], 'GSS': [494], 'SSS': [495], 'SSI': [496], 'SIN': [497], 'NVS': [499], 'VSI': [500], 'SIL': [501], 'ILM': [502], 'LMQ': [503], 'MQD': [504], 'QDV': [505], 'DVL': [506], 'VLE': [507], 'LEH': [508], 'EHL': [509], 'LSL': [511], 'SLD': [512], 'LDR': [513], 'DRV': [514], 'RVE': [515], 'VEK': [516], 'EKF': [517], 'KFS': [518]}" /ripp_evidence="{}" /top_kmer_word="LIP" /top_kmer_hits=24 /top_kmer_hits=33 /top_kmer_hits=310 /table="LIP" /table="LIP" /table="LIP" /subgroup_hmm="D_Triterpenoid(oleananes),flavonoid-7-O- (E=1.5e-178, bitscore=585.1);M (E=7.6e-86, bitscore=279.2);A_glycosidic_branch_elongating (E=1.3e-82, bitscore=268.4)" /subgroup_tree="{('D_Triterpenoid(oleananes),flavonoid-7-O- ',): 1}" /subgroup="D_Triterpenoid(oleananes),flavonoid-7-O-" /substrates="oleananes" /substrates="flavonoid" gene complement(13279..15063) /gene="LOC17884861" /note="Derived by automated computational analysis using gene prediction method: Gnomon." /db_xref="GeneID:17884861" mRNA complement(join(13279..14393,14508..15063)) /gene="LOC17884861" /product="UDP-glycosyltransferase 73C7, transcript variant X3" /note="Derived by automated computational analysis using gene prediction method: Gnomon. Supporting evidence includes similarity to: 100% coverage of the annotated genomic feature by RNAseq alignments, including 1 sample with support for all annotated introns" /transcript_id="XM_023783253.1" /db_xref="GeneID:17884861" mRNA complement(join(13279..14408,14508..15063)) /gene="LOC17884861" /product="UDP-glycosyltransferase 73C7, transcript variant X2" /note="Derived by automated computational analysis using gene prediction method: Gnomon. Supporting evidence includes similarity to: 100% coverage of the annotated genomic feature by RNAseq alignments, including 3 samples with support for all annotated introns" /transcript_id="XM_006291014.2" /db_xref="GeneID:17884861" mRNA complement(13279..15063) /gene="LOC17884861" /product="UDP-glycosyltransferase 73C7, transcript variant X1" /note="Derived by automated computational analysis using gene prediction method: Gnomon. Supporting evidence includes similarity to: 11 Proteins, and 100% coverage of the annotated genomic feature by RNAseq alignments" /transcript_id="XM_023783252.1" /db_xref="GeneID:17884861" CDS complement(join(13488..14393,14508..14978)) /gene="LOC17884861" /note="Derived by automated computational analysis using gene prediction method: Gnomon." /codon_start=1 /product="UDP-glycosyltransferase 73C7 isoform X3" /protein_id="XP_023639021.1" /db_xref="GeneID:17884861" /translation="MCSDDPLHFVVIPFMAQGHMIPLVDISRLLSQRQGVTVSIITTTQ NVAKIKTSLSSSSSFPTINIVEVKFPSRQAGLQEGCESVDMLASMVDMVKFFDVANSLE EQVEKAMKKMVQPRPSCIIGDMSLPFTSRLAKKFKIPKLLFHGFSCFSLMCIQPLEGNM KESTVKIIEADNDSYGVIVNSFEELEVDYAREYRKARTGKVWCVGPVSLCNKLELKNAE RGDKASIGQDQCLQWLDSQGTGSVLYVCLGSLCNLPLAQLKELGLGLEESNKPFIWVIR EWGKYEDLAKWMQQSGFEERIRDRGLLIKGWAPQVFILSHASIGGFLTHCGWNSTLEGI TAGVPLLTWPLSAEQFLNEKLIVKILKSGLKIGVETLMKYGKEEEIGVTVSRETVRKAV GELMGDSQEAEERRRRVRELSDLANKALEQGGSSDANITLLIQDIMEQSQHQRGLKDCY " /domain_record="plants/UDPGT_2 (E-value: 5.8e-64, bitscore: 216.0, seeds: 248)" /sec_met="Type: saccharide" /sec_met="Domains detected: UDPGT_2 (E-value: 5.8e-64, bitscore: 216.0, seeds: 248)" /sec_met="Kind: biosynthetic" /sec_met="Percentage identity: LOC17887227=29.167,LOC17886373=42.857,LOC17887019=45.639" /kmer_dict="{'MCS': [0], 'CSD': [1], 'SDD': [2], 'DDP': [3], 'DPL': [4], 'PLH': [5], 'LHF': [6], 'HFV': [7], 'FVV': [8], 'VVI': [9], 'VIP': [10], 'IPF': [11], 'PFM': [12], 'FMA': [13], 'MAQ': [14], 'AQG': [15], 'QGH': [16], 'GHM': [17], 'HMI': [18], 'MIP': [19], 'IPL': [20], 'PLV': [21], 'LVD': [22], 'VDI': [23], 'DIS': [24], 'ISR': [25], 'SRL': [26, 131], 'RLL': [27], 'LLS': [28], 'LSQ': [29], 'SQR': [30], 'QRQ': [31], 'RQG': [32], 'QGV': [33], 'GVT': [34, 386], 'VTV': [35, 387], 'TVS': [36, 388], 'VSI': [37], 'SII': [38], 'IIT': [39], 'ITT': [40], 'TTT': [41], 'TTQ': [42], 'TQN': [43], 'QNV': [44], 'NVA': [45], 'VAK': [46], 'AKI': [47], 'KIK': [48], 'IKT': [49], 'KTS': [50], 'TSL': [51], 'SLS': [52], 'LSS': [53], 'SSS': [54, 55, 56], 'SSF': [57], 'SFP': [58], 'FPT': [59], 'PTI': [60], 'TIN': [61], 'INI': [62], 'NIV': [63], 'IVE': [64], 'VEV': [65], 'EVK': [66], 'VKF': [67, 93], 'KFP': [68], 'FPS': [69], 'PSR': [70], 'SRQ': [71], 'RQA': [72], 'QAG': [73], 'AGL': [74], 'GLQ': [75], 'LQE': [76], 'QEG': [77], 'EGC': [78], 'GCE': [79], 'CES': [80], 'ESV': [81], 'SVD': [82], 'VDM': [83, 90], 'DML': [84], 'MLA': [85], 'LAS': [86], 'ASM': [87], 'SMV': [88], 'MVD': [89], 'DMV': [91], 'MVK': [92], 'KFF': [94], 'FFD': [95], 'FDV': [96], 'DVA': [97], 'VAN': [98], 'ANS': [99], 'NSL': [100], 'SLE': [101], 'LEE': [102, 268], 'EEQ': [103], 'EQV': [104], 'QVE': [105], 'VEK': [106], 'EKA': [107], 'KAM': [108], 'AMK': [109], 'MKK': [110], 'KKM': [111], 'KMV': [112], 'MVQ': [113], 'VQP': [114], 'QPR': [115], 'PRP': [116], 'RPS': [117], 'PSC': [118], 'SCI': [119], 'CII': [120], 'IIG': [121], 'IGD': [122], 'GDM': [123], 'DMS': [124], 'MSL': [125], 'SLP': [126], 'LPF': [127], 'PFT': [128], 'FTS': [129], 'TSR': [130], 'RLA': [132], 'LAK': [133, 288], 'AKK': [134], 'KKF': [135], 'KFK': [136], 'FKI': [137], 'KIP': [138], 'IPK': [139], 'PKL': [140], 'KLL': [141], 'LLF': [142], 'LFH': [143], 'FHG': [144], 'HGF': [145], 'GFS': [146], 'FSC': [147], 'SCF': [148], 'CFS': [149], 'FSL': [150], 'SLM': [151], 'LMC': [152], 'MCI': [153], 'CIQ': [154], 'IQP': [155], 'QPL': [156], 'PLE': [157], 'LEG': [158, 336], 'EGN': [159], 'GNM': [160], 'NMK': [161], 'MKE': [162], 'KES': [163], 'EST': [164], 'STV': [165], 'TVK': [166], 'VKI': [167, 362], 'KII': [168], 'IIE': [169], 'IEA': [170], 'EAD': [171], 'ADN': [172], 'DND': [173], 'NDS': [174], 'DSY': [175], 'SYG': [176], 'YGV': [177], 'GVI': [178], 'VIV': [179], 'IVN': [180], 'VNS': [181], 'NSF': [182], 'SFE': [183], 'FEE': [184, 297], 'EEL': [185], 'ELE': [186], 'LEV': [187], 'EVD': [188], 'VDY': [189], 'DYA': [190], 'YAR': [191], 'ARE': [192], 'REY': [193], 'EYR': [194], 'YRK': [195], 'RKA': [196, 395], 'KAR': [197], 'ART': [198], 'RTG': [199], 'TGK': [200], 'GKV': [201], 'KVW': [202], 'VWC': [203], 'WCV': [204], 'CVG': [205], 'VGP': [206], 'GPV': [207], 'PVS': [208], 'VSL': [209], 'SLC': [210, 252], 'LCN': [211, 253], 'CNK': [212], 'NKL': [213], 'KLE': [214], 'LEL': [215], 'ELK': [216], 'LKN': [217], 'KNA': [218], 'NAE': [219], 'AER': [220], 'ERG': [221], 'RGD': [222], 'GDK': [223], 'DKA': [224], 'KAS': [225], 'ASI': [226, 321], 'SIG': [227, 322], 'IGQ': [228], 'GQD': [229], 'QDQ': [230], 'DQC': [231], 'QCL': [232], 'CLQ': [233], 'LQW': [234], 'QWL': [235], 'WLD': [236], 'LDS': [237], 'DSQ': [238, 404], 'SQG': [239], 'QGT': [240], 'GTG': [241], 'TGS': [242], 'GSV': [243], 'SVL': [244], 'VLY': [245], 'LYV': [246], 'YVC': [247], 'VCL': [248], 'CLG': [249], 'LGS': [250], 'GSL': [251], 'CNL': [254], 'NLP': [255], 'LPL': [256], 'PLA': [257], 'LAQ': [258], 'AQL': [259], 'QLK': [260], 'LKE': [261], 'KEL': [262], 'ELG': [263], 'LGL': [264, 266], 'GLG': [265], 'GLE': [267], 'EES': [269], 'ESN': [270], 'SNK': [271], 'NKP': [272], 'KPF': [273], 'PFI': [274], 'FIW': [275], 'IWV': [276], 'WVI': [277], 'VIR': [278], 'IRE': [279], 'REW': [280], 'EWG': [281], 'WGK': [282], 'GKY': [283], 'KYE': [284], 'YED': [285], 'EDL': [286], 'DLA': [287, 420], 'AKW': [289], 'KWM': [290], 'WMQ': [291], 'MQQ': [292], 'QQS': [293], 'QSG': [294], 'SGF': [295], 'GFE': [296], 'EER': [298, 409], 'ERI': [299], 'RIR': [300], 'IRD': [301], 'RDR': [302], 'DRG': [303], 'RGL': [304, 451], 'GLL': [305], 'LLI': [306, 438], 'LIK': [307], 'IKG': [308], 'KGW': [309], 'GWA': [310], 'WAP': [311], 'APQ': [312], 'PQV': [313], 'QVF': [314], 'VFI': [315], 'FIL': [316], 'ILS': [317], 'LSH': [318], 'SHA': [319], 'HAS': [320], 'IGG': [323], 'GGF': [324], 'GFL': [325], 'FLT': [326], 'LTH': [327], 'THC': [328], 'HCG': [329], 'CGW': [330], 'GWN': [331], 'WNS': [332], 'NST': [333], 'STL': [334], 'TLE': [335], 'EGI': [337], 'GIT': [338], 'ITA': [339], 'TAG': [340], 'AGV': [341], 'GVP': [342], 'VPL': [343], 'PLL': [344], 'LLT': [345], 'LTW': [346], 'TWP': [347], 'WPL': [348], 'PLS': [349], 'LSA': [350], 'SAE': [351], 'AEQ': [352], 'EQF': [353], 'QFL': [354], 'FLN': [355], 'LNE': [356], 'NEK': [357], 'EKL': [358], 'KLI': [359], 'LIV': [360], 'IVK': [361], 'KIL': [363], 'ILK': [364], 'LKS': [365], 'KSG': [366], 'SGL': [367], 'GLK': [368, 452], 'LKI': [369], 'KIG': [370], 'IGV': [371, 385], 'GVE': [372], 'VET': [373], 'ETL': [374], 'TLM': [375], 'LMK': [376], 'MKY': [377], 'KYG': [378], 'YGK': [379], 'GKE': [380], 'KEE': [381], 'EEE': [382], 'EEI': [383], 'EIG': [384], 'VSR': [389], 'SRE': [390], 'RET': [391], 'ETV': [392], 'TVR': [393], 'VRK': [394], 'KAV': [396], 'AVG': [397], 'VGE': [398], 'GEL': [399], 'ELM': [400], 'LMG': [401], 'MGD': [402], 'GDS': [403], 'SQE': [405], 'QEA': [406], 'EAE': [407], 'AEE': [408], 'ERR': [410], 'RRR': [411, 412], 'RRV': [413], 'RVR': [414], 'VRE': [415], 'REL': [416], 'ELS': [417], 'LSD': [418], 'SDL': [419], 'LAN': [421], 'ANK': [422], 'NKA': [423], 'KAL': [424], 'ALE': [425], 'LEQ': [426], 'EQG': [427], 'QGG': [428], 'GGS': [429], 'GSS': [430], 'SSD': [431], 'SDA': [432], 'DAN': [433], 'ANI': [434], 'NIT': [435], 'ITL': [436], 'TLL': [437], 'LIQ': [439], 'IQD': [440], 'QDI': [441], 'DIM': [442], 'IME': [443], 'MEQ': [444], 'EQS': [445], 'QSQ': [446], 'SQH': [447], 'QHQ': [448], 'HQR': [449], 'QRG': [450], 'LKD': [453], 'KDC': [454]}" /ripp_evidence="{}" /top_kmer_word="SSS" /top_kmer_hits=54 /top_kmer_hits=55 /top_kmer_hits=56 /table="SSS" /table="SSS" /table="SSS" /subgroup_hmm="D_Triterpenoid(oleananes),flavonoid-7-O- (E=1.3e-125, bitscore=410.5);E (E=7.6e-70, bitscore=226.5);E_small_phenolic (E=1.3e-69, bitscore=225.4)" /subgroup_tree="{('D_Triterpenoid(oleananes),flavonoid-7-O- ',): 1}" /subgroup="D_Triterpenoid(oleananes),flavonoid-7-O-" /substrates="oleananes" /substrates="flavonoid" CDS complement(join(13488..14408,14508..14978)) /gene="LOC17884861" /note="Derived by automated computational analysis using gene prediction method: Gnomon." /codon_start=1 /product="LOC17884_67" /protein_id="XP_006291076.1" /db_xref="GeneID:17884861" /translation="MCSDDPLHFVVIPFMAQGHMIPLVDISRLLSQRQGVTVSIITTTQ NVAKIKTSLSSSSSFPTINIVEVKFPSRQAGLQEGCESVDMLASMVDMVKFFDVANSLE EQVEKAMKKMVQPRPSCIIGDMSLPFTSRLAKKFKIPKLLFHGFSCFSLMCIQVSVLQP LEGNMKESTVKIIEADNDSYGVIVNSFEELEVDYAREYRKARTGKVWCVGPVSLCNKLE LKNAERGDKASIGQDQCLQWLDSQGTGSVLYVCLGSLCNLPLAQLKELGLGLEESNKPF IWVIREWGKYEDLAKWMQQSGFEERIRDRGLLIKGWAPQVFILSHASIGGFLTHCGWNS TLEGITAGVPLLTWPLSAEQFLNEKLIVKILKSGLKIGVETLMKYGKEEEIGVTVSRET VRKAVGELMGDSQEAEERRRRVRELSDLANKALEQGGSSDANITLLIQDIMEQSQHQRG LKDCY" /locus_tag="LOC17884_67" /domain_record="plants/UDPGT_2 (E-value: 5.3e-64, bitscore: 216.1, seeds: 248)" /kmer_dict="{'MCS': [0], 'CSD': [1], 'SDD': [2], 'DDP': [3], 'DPL': [4], 'PLH': [5], 'LHF': [6], 'HFV': [7], 'FVV': [8], 'VVI': [9], 'VIP': [10], 'IPF': [11], 'PFM': [12], 'FMA': [13], 'MAQ': [14], 'AQG': [15], 'QGH': [16], 'GHM': [17], 'HMI': [18], 'MIP': [19], 'IPL': [20], 'PLV': [21], 'LVD': [22], 'VDI': [23], 'DIS': [24], 'ISR': [25], 'SRL': [26, 131], 'RLL': [27], 'LLS': [28], 'LSQ': [29], 'SQR': [30], 'QRQ': [31], 'RQG': [32], 'QGV': [33], 'GVT': [34, 391], 'VTV': [35, 392], 'TVS': [36, 393], 'VSI': [37], 'SII': [38], 'IIT': [39], 'ITT': [40], 'TTT': [41], 'TTQ': [42], 'TQN': [43], 'QNV': [44], 'NVA': [45], 'VAK': [46], 'AKI': [47], 'KIK': [48], 'IKT': [49], 'KTS': [50], 'TSL': [51], 'SLS': [52], 'LSS': [53], 'SSS': [54, 55, 56], 'SSF': [57], 'SFP': [58], 'FPT': [59], 'PTI': [60], 'TIN': [61], 'INI': [62], 'NIV': [63], 'IVE': [64], 'VEV': [65], 'EVK': [66], 'VKF': [67, 93], 'KFP': [68], 'FPS': [69], 'PSR': [70], 'SRQ': [71], 'RQA': [72], 'QAG': [73], 'AGL': [74], 'GLQ': [75], 'LQE': [76], 'QEG': [77], 'EGC': [78], 'GCE': [79], 'CES': [80], 'ESV': [81], 'SVD': [82], 'VDM': [83, 90], 'DML': [84], 'MLA': [85], 'LAS': [86], 'ASM': [87], 'SMV': [88], 'MVD': [89], 'DMV': [91], 'MVK': [92], 'KFF': [94], 'FFD': [95], 'FDV': [96], 'DVA': [97], 'VAN': [98], 'ANS': [99], 'NSL': [100], 'SLE': [101], 'LEE': [102, 273], 'EEQ': [103], 'EQV': [104], 'QVE': [105], 'VEK': [106], 'EKA': [107], 'KAM': [108], 'AMK': [109], 'MKK': [110], 'KKM': [111], 'KMV': [112], 'MVQ': [113], 'VQP': [114], 'QPR': [115], 'PRP': [116], 'RPS': [117], 'PSC': [118], 'SCI': [119], 'CII': [120], 'IIG': [121], 'IGD': [122], 'GDM': [123], 'DMS': [124], 'MSL': [125], 'SLP': [126], 'LPF': [127], 'PFT': [128], 'FTS': [129], 'TSR': [130], 'RLA': [132], 'LAK': [133, 293], 'AKK': [134], 'KKF': [135], 'KFK': [136], 'FKI': [137], 'KIP': [138], 'IPK': [139], 'PKL': [140], 'KLL': [141], 'LLF': [142], 'LFH': [143], 'FHG': [144], 'HGF': [145], 'GFS': [146], 'FSC': [147], 'SCF': [148], 'CFS': [149], 'FSL': [150], 'SLM': [151], 'LMC': [152], 'MCI': [153], 'CIQ': [154], 'IQV': [155], 'QVS': [156], 'VSV': [157], 'SVL': [158, 249], 'VLQ': [159], 'LQP': [160], 'QPL': [161], 'PLE': [162], 'LEG': [163, 341], 'EGN': [164], 'GNM': [165], 'NMK': [166], 'MKE': [167], 'KES': [168], 'EST': [169], 'STV': [170], 'TVK': [171], 'VKI': [172, 367], 'KII': [173], 'IIE': [174], 'IEA': [175], 'EAD': [176], 'ADN': [177], 'DND': [178], 'NDS': [179], 'DSY': [180], 'SYG': [181], 'YGV': [182], 'GVI': [183], 'VIV': [184], 'IVN': [185], 'VNS': [186], 'NSF': [187], 'SFE': [188], 'FEE': [189, 302], 'EEL': [190], 'ELE': [191], 'LEV': [192], 'EVD': [193], 'VDY': [194], 'DYA': [195], 'YAR': [196], 'ARE': [197], 'REY': [198], 'EYR': [199], 'YRK': [200], 'RKA': [201, 400], 'KAR': [202], 'ART': [203], 'RTG': [204], 'TGK': [205], 'GKV': [206], 'KVW': [207], 'VWC': [208], 'WCV': [209], 'CVG': [210], 'VGP': [211], 'GPV': [212], 'PVS': [213], 'VSL': [214], 'SLC': [215, 257], 'LCN': [216, 258], 'CNK': [217], 'NKL': [218], 'KLE': [219], 'LEL': [220], 'ELK': [221], 'LKN': [222], 'KNA': [223], 'NAE': [224], 'AER': [225], 'ERG': [226], 'RGD': [227], 'GDK': [228], 'DKA': [229], 'KAS': [230], 'ASI': [231, 326], 'SIG': [232, 327], 'IGQ': [233], 'GQD': [234], 'QDQ': [235], 'DQC': [236], 'QCL': [237], 'CLQ': [238], 'LQW': [239], 'QWL': [240], 'WLD': [241], 'LDS': [242], 'DSQ': [243, 409], 'SQG': [244], 'QGT': [245], 'GTG': [246], 'TGS': [247], 'GSV': [248], 'VLY': [250], 'LYV': [251], 'YVC': [252], 'VCL': [253], 'CLG': [254], 'LGS': [255], 'GSL': [256], 'CNL': [259], 'NLP': [260], 'LPL': [261], 'PLA': [262], 'LAQ': [263], 'AQL': [264], 'QLK': [265], 'LKE': [266], 'KEL': [267], 'ELG': [268], 'LGL': [269, 271], 'GLG': [270], 'GLE': [272], 'EES': [274], 'ESN': [275], 'SNK': [276], 'NKP': [277], 'KPF': [278], 'PFI': [279], 'FIW': [280], 'IWV': [281], 'WVI': [282], 'VIR': [283], 'IRE': [284], 'REW': [285], 'EWG': [286], 'WGK': [287], 'GKY': [288], 'KYE': [289], 'YED': [290], 'EDL': [291], 'DLA': [292, 425], 'AKW': [294], 'KWM': [295], 'WMQ': [296], 'MQQ': [297], 'QQS': [298], 'QSG': [299], 'SGF': [300], 'GFE': [301], 'EER': [303, 414], 'ERI': [304], 'RIR': [305], 'IRD': [306], 'RDR': [307], 'DRG': [308], 'RGL': [309, 456], 'GLL': [310], 'LLI': [311, 443], 'LIK': [312], 'IKG': [313], 'KGW': [314], 'GWA': [315], 'WAP': [316], 'APQ': [317], 'PQV': [318], 'QVF': [319], 'VFI': [320], 'FIL': [321], 'ILS': [322], 'LSH': [323], 'SHA': [324], 'HAS': [325], 'IGG': [328], 'GGF': [329], 'GFL': [330], 'FLT': [331], 'LTH': [332], 'THC': [333], 'HCG': [334], 'CGW': [335], 'GWN': [336], 'WNS': [337], 'NST': [338], 'STL': [339], 'TLE': [340], 'EGI': [342], 'GIT': [343], 'ITA': [344], 'TAG': [345], 'AGV': [346], 'GVP': [347], 'VPL': [348], 'PLL': [349], 'LLT': [350], 'LTW': [351], 'TWP': [352], 'WPL': [353], 'PLS': [354], 'LSA': [355], 'SAE': [356], 'AEQ': [357], 'EQF': [358], 'QFL': [359], 'FLN': [360], 'LNE': [361], 'NEK': [362], 'EKL': [363], 'KLI': [364], 'LIV': [365], 'IVK': [366], 'KIL': [368], 'ILK': [369], 'LKS': [370], 'KSG': [371], 'SGL': [372], 'GLK': [373, 457], 'LKI': [374], 'KIG': [375], 'IGV': [376, 390], 'GVE': [377], 'VET': [378], 'ETL': [379], 'TLM': [380], 'LMK': [381], 'MKY': [382], 'KYG': [383], 'YGK': [384], 'GKE': [385], 'KEE': [386], 'EEE': [387], 'EEI': [388], 'EIG': [389], 'VSR': [394], 'SRE': [395], 'RET': [396], 'ETV': [397], 'TVR': [398], 'VRK': [399], 'KAV': [401], 'AVG': [402], 'VGE': [403], 'GEL': [404], 'ELM': [405], 'LMG': [406], 'MGD': [407], 'GDS': [408], 'SQE': [410], 'QEA': [411], 'EAE': [412], 'AEE': [413], 'ERR': [415], 'RRR': [416, 417], 'RRV': [418], 'RVR': [419], 'VRE': [420], 'REL': [421], 'ELS': [422], 'LSD': [423], 'SDL': [424], 'LAN': [426], 'ANK': [427], 'NKA': [428], 'KAL': [429], 'ALE': [430], 'LEQ': [431], 'EQG': [432], 'QGG': [433], 'GGS': [434], 'GSS': [435], 'SSD': [436], 'SDA': [437], 'DAN': [438], 'ANI': [439], 'NIT': [440], 'ITL': [441], 'TLL': [442], 'LIQ': [444], 'IQD': [445], 'QDI': [446], 'DIM': [447], 'IME': [448], 'MEQ': [449], 'EQS': [450], 'QSQ': [451], 'SQH': [452], 'QHQ': [453], 'HQR': [454], 'QRG': [455], 'LKD': [458], 'KDC': [459]}" /ripp_evidence="{}" /top_kmer_word="SSS" /top_kmer_hits=54 /top_kmer_hits=55 /top_kmer_hits=56 /table="SSS" /table="SSS" /table="SSS" CDS complement(13488..14978) /gene="LOC17884861" /note="Derived by automated computational analysis using gene prediction method: Gnomon." /codon_start=1 /product="LOC17884_68" /protein_id="XP_023639020.1" /db_xref="GeneID:17884861" /translation="MCSDDPLHFVVIPFMAQGHMIPLVDISRLLSQRQGVTVSIITTTQ NVAKIKTSLSSSSSFPTINIVEVKFPSRQAGLQEGCESVDMLASMVDMVKFFDVANSLE EQVEKAMKKMVQPRPSCIIGDMSLPFTSRLAKKFKIPKLLFHGFSCFSLMCIQVVRESG ILKFIESNDEYFDLPGLPDRVEFTKPQVSVLQPLEGNMKESTVKIIEADNDSYGVIVNS FEELEVDYAREYRKARTGKVWCVGPVSLCNKLELKNAERGDKASIGQDQCLQWLDSQGT GSVLYVCLGSLCNLPLAQLKELGLGLEESNKPFIWVIREWGKYEDLAKWMQQSGFEERI RDRGLLIKGWAPQVFILSHASIGGFLTHCGWNSTLEGITAGVPLLTWPLSAEQFLNEKL IVKILKSGLKIGVETLMKYGKEEEIGVTVSRETVRKAVGELMGDSQEAEERRRRVRELS DLANKALEQGGSSDANITLLIQDIMEQSQHQRGLKDCY" /locus_tag="LOC17884_68" /domain_record="plants/UDPGT_2 (E-value: 6.8e-80, bitscore: 268.5, seeds: 248)" /kmer_dict="{'MCS': [0], 'CSD': [1], 'SDD': [2], 'DDP': [3], 'DPL': [4], 'PLH': [5], 'LHF': [6], 'HFV': [7], 'FVV': [8], 'VVI': [9], 'VIP': [10], 'IPF': [11], 'PFM': [12], 'FMA': [13], 'MAQ': [14], 'AQG': [15], 'QGH': [16], 'GHM': [17], 'HMI': [18], 'MIP': [19], 'IPL': [20], 'PLV': [21], 'LVD': [22], 'VDI': [23], 'DIS': [24], 'ISR': [25], 'SRL': [26, 131], 'RLL': [27], 'LLS': [28], 'LSQ': [29], 'SQR': [30], 'QRQ': [31], 'RQG': [32], 'QGV': [33], 'GVT': [34, 424], 'VTV': [35, 425], 'TVS': [36, 426], 'VSI': [37], 'SII': [38], 'IIT': [39], 'ITT': [40], 'TTT': [41], 'TTQ': [42], 'TQN': [43], 'QNV': [44], 'NVA': [45], 'VAK': [46], 'AKI': [47], 'KIK': [48], 'IKT': [49], 'KTS': [50], 'TSL': [51], 'SLS': [52], 'LSS': [53], 'SSS': [54, 55, 56], 'SSF': [57], 'SFP': [58], 'FPT': [59], 'PTI': [60], 'TIN': [61], 'INI': [62], 'NIV': [63], 'IVE': [64], 'VEV': [65], 'EVK': [66], 'VKF': [67, 93], 'KFP': [68], 'FPS': [69], 'PSR': [70], 'SRQ': [71], 'RQA': [72], 'QAG': [73], 'AGL': [74], 'GLQ': [75], 'LQE': [76], 'QEG': [77], 'EGC': [78], 'GCE': [79], 'CES': [80], 'ESV': [81], 'SVD': [82], 'VDM': [83, 90], 'DML': [84], 'MLA': [85], 'LAS': [86], 'ASM': [87], 'SMV': [88], 'MVD': [89], 'DMV': [91], 'MVK': [92], 'KFF': [94], 'FFD': [95], 'FDV': [96], 'DVA': [97], 'VAN': [98], 'ANS': [99], 'NSL': [100], 'SLE': [101], 'LEE': [102, 306], 'EEQ': [103], 'EQV': [104], 'QVE': [105], 'VEK': [106], 'EKA': [107], 'KAM': [108], 'AMK': [109], 'MKK': [110], 'KKM': [111], 'KMV': [112], 'MVQ': [113], 'VQP': [114], 'QPR': [115], 'PRP': [116], 'RPS': [117], 'PSC': [118], 'SCI': [119], 'CII': [120], 'IIG': [121], 'IGD': [122], 'GDM': [123], 'DMS': [124], 'MSL': [125], 'SLP': [126], 'LPF': [127], 'PFT': [128], 'FTS': [129], 'TSR': [130], 'RLA': [132], 'LAK': [133, 326], 'AKK': [134], 'KKF': [135], 'KFK': [136], 'FKI': [137], 'KIP': [138], 'IPK': [139], 'PKL': [140], 'KLL': [141], 'LLF': [142], 'LFH': [143], 'FHG': [144], 'HGF': [145], 'GFS': [146], 'FSC': [147], 'SCF': [148], 'CFS': [149], 'FSL': [150], 'SLM': [151], 'LMC': [152], 'MCI': [153], 'CIQ': [154], 'IQV': [155], 'QVV': [156], 'VVR': [157], 'VRE': [158, 453], 'RES': [159], 'ESG': [160], 'SGI': [161], 'GIL': [162], 'ILK': [163, 402], 'LKF': [164], 'KFI': [165], 'FIE': [166], 'IES': [167], 'ESN': [168, 308], 'SND': [169], 'NDE': [170], 'DEY': [171], 'EYF': [172], 'YFD': [173], 'FDL': [174], 'DLP': [175], 'LPG': [176], 'PGL': [177], 'GLP': [178], 'LPD': [179], 'PDR': [180], 'DRV': [181], 'RVE': [182], 'VEF': [183], 'EFT': [184], 'FTK': [185], 'TKP': [186], 'KPQ': [187], 'PQV': [188, 351], 'QVS': [189], 'VSV': [190], 'SVL': [191, 282], 'VLQ': [192], 'LQP': [193], 'QPL': [194], 'PLE': [195], 'LEG': [196, 374], 'EGN': [197], 'GNM': [198], 'NMK': [199], 'MKE': [200], 'KES': [201], 'EST': [202], 'STV': [203], 'TVK': [204], 'VKI': [205, 400], 'KII': [206], 'IIE': [207], 'IEA': [208], 'EAD': [209], 'ADN': [210], 'DND': [211], 'NDS': [212], 'DSY': [213], 'SYG': [214], 'YGV': [215], 'GVI': [216], 'VIV': [217], 'IVN': [218], 'VNS': [219], 'NSF': [220], 'SFE': [221], 'FEE': [222, 335], 'EEL': [223], 'ELE': [224], 'LEV': [225], 'EVD': [226], 'VDY': [227], 'DYA': [228], 'YAR': [229], 'ARE': [230], 'REY': [231], 'EYR': [232], 'YRK': [233], 'RKA': [234, 433], 'KAR': [235], 'ART': [236], 'RTG': [237], 'TGK': [238], 'GKV': [239], 'KVW': [240], 'VWC': [241], 'WCV': [242], 'CVG': [243], 'VGP': [244], 'GPV': [245], 'PVS': [246], 'VSL': [247], 'SLC': [248, 290], 'LCN': [249, 291], 'CNK': [250], 'NKL': [251], 'KLE': [252], 'LEL': [253], 'ELK': [254], 'LKN': [255], 'KNA': [256], 'NAE': [257], 'AER': [258], 'ERG': [259], 'RGD': [260], 'GDK': [261], 'DKA': [262], 'KAS': [263], 'ASI': [264, 359], 'SIG': [265, 360], 'IGQ': [266], 'GQD': [267], 'QDQ': [268], 'DQC': [269], 'QCL': [270], 'CLQ': [271], 'LQW': [272], 'QWL': [273], 'WLD': [274], 'LDS': [275], 'DSQ': [276, 442], 'SQG': [277], 'QGT': [278], 'GTG': [279], 'TGS': [280], 'GSV': [281], 'VLY': [283], 'LYV': [284], 'YVC': [285], 'VCL': [286], 'CLG': [287], 'LGS': [288], 'GSL': [289], 'CNL': [292], 'NLP': [293], 'LPL': [294], 'PLA': [295], 'LAQ': [296], 'AQL': [297], 'QLK': [298], 'LKE': [299], 'KEL': [300], 'ELG': [301], 'LGL': [302, 304], 'GLG': [303], 'GLE': [305], 'EES': [307], 'SNK': [309], 'NKP': [310], 'KPF': [311], 'PFI': [312], 'FIW': [313], 'IWV': [314], 'WVI': [315], 'VIR': [316], 'IRE': [317], 'REW': [318], 'EWG': [319], 'WGK': [320], 'GKY': [321], 'KYE': [322], 'YED': [323], 'EDL': [324], 'DLA': [325, 458], 'AKW': [327], 'KWM': [328], 'WMQ': [329], 'MQQ': [330], 'QQS': [331], 'QSG': [332], 'SGF': [333], 'GFE': [334], 'EER': [336, 447], 'ERI': [337], 'RIR': [338], 'IRD': [339], 'RDR': [340], 'DRG': [341], 'RGL': [342, 489], 'GLL': [343], 'LLI': [344, 476], 'LIK': [345], 'IKG': [346], 'KGW': [347], 'GWA': [348], 'WAP': [349], 'APQ': [350], 'QVF': [352], 'VFI': [353], 'FIL': [354], 'ILS': [355], 'LSH': [356], 'SHA': [357], 'HAS': [358], 'IGG': [361], 'GGF': [362], 'GFL': [363], 'FLT': [364], 'LTH': [365], 'THC': [366], 'HCG': [367], 'CGW': [368], 'GWN': [369], 'WNS': [370], 'NST': [371], 'STL': [372], 'TLE': [373], 'EGI': [375], 'GIT': [376], 'ITA': [377], 'TAG': [378], 'AGV': [379], 'GVP': [380], 'VPL': [381], 'PLL': [382], 'LLT': [383], 'LTW': [384], 'TWP': [385], 'WPL': [386], 'PLS': [387], 'LSA': [388], 'SAE': [389], 'AEQ': [390], 'EQF': [391], 'QFL': [392], 'FLN': [393], 'LNE': [394], 'NEK': [395], 'EKL': [396], 'KLI': [397], 'LIV': [398], 'IVK': [399], 'KIL': [401], 'LKS': [403], 'KSG': [404], 'SGL': [405], 'GLK': [406, 490], 'LKI': [407], 'KIG': [408], 'IGV': [409, 423], 'GVE': [410], 'VET': [411], 'ETL': [412], 'TLM': [413], 'LMK': [414], 'MKY': [415], 'KYG': [416], 'YGK': [417], 'GKE': [418], 'KEE': [419], 'EEE': [420], 'EEI': [421], 'EIG': [422], 'VSR': [427], 'SRE': [428], 'RET': [429], 'ETV': [430], 'TVR': [431], 'VRK': [432], 'KAV': [434], 'AVG': [435], 'VGE': [436], 'GEL': [437], 'ELM': [438], 'LMG': [439], 'MGD': [440], 'GDS': [441], 'SQE': [443], 'QEA': [444], 'EAE': [445], 'AEE': [446], 'ERR': [448], 'RRR': [449, 450], 'RRV': [451], 'RVR': [452], 'REL': [454], 'ELS': [455], 'LSD': [456], 'SDL': [457], 'LAN': [459], 'ANK': [460], 'NKA': [461], 'KAL': [462], 'ALE': [463], 'LEQ': [464], 'EQG': [465], 'QGG': [466], 'GGS': [467], 'GSS': [468], 'SSD': [469], 'SDA': [470], 'DAN': [471], 'ANI': [472], 'NIT': [473], 'ITL': [474], 'TLL': [475], 'LIQ': [477], 'IQD': [478], 'QDI': [479], 'DIM': [480], 'IME': [481], 'MEQ': [482], 'EQS': [483], 'QSQ': [484], 'SQH': [485], 'QHQ': [486], 'HQR': [487], 'QRG': [488], 'LKD': [491], 'KDC': [492]}" /ripp_evidence="{}" /top_kmer_word="SSS" /top_kmer_hits=54 /top_kmer_hits=55 /top_kmer_hits=56 /table="SSS" /table="SSS" /table="SSS" gene complement(15330..17596) /gene="LOC17886706" /note="Derived by automated computational analysis using gene prediction method: Gnomon." /db_xref="GeneID:17886706" mRNA complement(join(15330..15561,15642..15746,15875..16958, 17052..17596)) /gene="LOC17886706" /product="pentatricopeptide repeat-containing protein At3g53170, transcript variant X2" /note="Derived by automated computational analysis using gene prediction method: Gnomon. Supporting evidence includes similarity to: 2 Proteins, and 100% coverage of the annotated genomic feature by RNAseq alignments, including 6 samples with support for all annotated introns" /transcript_id="XM_023783254.1" /db_xref="GeneID:17886706" mRNA complement(join(15333..15561,15642..15752,15875..16958, 17052..17596)) /gene="LOC17886706" /product="pentatricopeptide repeat-containing protein At3g53170, transcript variant X1" /note="Derived by automated computational analysis using gene prediction method: Gnomon. Supporting evidence includes similarity to: 4 Proteins, and 100% coverage of the annotated genomic feature by RNAseq alignments, including 10 samples with support for all annotated introns" /transcript_id="XM_006290906.2" /db_xref="GeneID:17886706" CDS complement(join(15724..15746,15875..16958,17052..17426)) /gene="LOC17886706" /note="Derived by automated computational analysis using gene prediction method: Gnomon." /codon_start=1 /product="pentatricopeptide repeat-containing protein At3g53170 isoform X2" /protein_id="XP_023639022.1" /db_xref="GeneID:17886706" /translation="MELIQNPIQGINSAYAIENIKLCFSRQHIPSTVCSRRVASVSTTP TTCSTKIPNDGTGKMGSGLISTRHRVDPKKELSRILRAESAVKGIERKANSEKYLTLWP KAVLEALDEAIKENRWQSALKIFNLLRKQHWYEPRCKTYTKLFKVLGNCKQPDQASLLF EVMLSEGLKPTIDVYTSLIAVYGKSGLLDKAFSTLEYMKSASDCKPDVFTFTVLISCCC KLGRFDLVKSIVLEMSYLGVGCSTVTYNTIIDGYGKAGMFEEMENVLADMIEDGDSLPD VFTLNSIIGSYGNGGDTKKMESWYNRFQLMGVQPDITTFNILILSFGKAGMYKKMCSVM EFMEKRFFSLTTVTYNIVIETFGKAGRIEKMDDIFRKMKYQGVKPNSITYCSLVNAYSK VGLLVKIDSILRQIVNSDVILDTPFFNCIINSYGQAGDLATMKELYIQMEERKCKPDKV TFATMIKTYTAHGIFDAVHELEKQMISTGKKRLME" /kmer_dict="{'MEL': [0], 'ELI': [1], 'LIQ': [2], 'IQN': [3], 'QNP': [4], 'NPI': [5], 'PIQ': [6], 'IQG': [7], 'QGI': [8], 'GIN': [9], 'INS': [10, 428], 'NSA': [11], 'SAY': [12], 'AYA': [13], 'YAI': [14], 'AIE': [15], 'IEN': [16], 'ENI': [17], 'NIK': [18], 'IKL': [19], 'KLC': [20], 'LCF': [21], 'CFS': [22], 'FSR': [23], 'SRQ': [24], 'RQH': [25], 'QHI': [26], 'HIP': [27], 'IPS': [28], 'PST': [29], 'STV': [30, 244], 'TVC': [31], 'VCS': [32], 'CSR': [33], 'SRR': [34], 'RRV': [35], 'RVA': [36], 'VAS': [37], 'ASV': [38], 'SVS': [39], 'VST': [40], 'STT': [41], 'TTP': [42], 'TPT': [43], 'PTT': [44], 'TTC': [45], 'TCS': [46], 'CST': [47, 243], 'STK': [48], 'TKI': [49], 'KIP': [50], 'IPN': [51], 'PND': [52], 'NDG': [53], 'DGT': [54], 'GTG': [55], 'TGK': [56, 485], 'GKM': [57], 'KMG': [58], 'MGS': [59], 'GSG': [60], 'SGL': [61, 187], 'GLI': [62], 'LIS': [63, 216], 'IST': [64, 483], 'STR': [65], 'TRH': [66], 'RHR': [67], 'HRV': [68], 'RVD': [69], 'VDP': [70], 'DPK': [71], 'PKK': [72], 'KKE': [73], 'KEL': [74, 441], 'ELS': [75], 'LSR': [76], 'SRI': [77], 'RIL': [78], 'ILR': [79, 408], 'LRA': [80], 'RAE': [81], 'AES': [82], 'ESA': [83], 'SAV': [84], 'AVK': [85], 'VKG': [86], 'KGI': [87], 'GIE': [88], 'IER': [89], 'ERK': [90, 449], 'RKA': [91], 'KAN': [92], 'ANS': [93], 'NSE': [94], 'SEK': [95], 'EKY': [96], 'KYL': [97], 'YLT': [98], 'LTL': [99], 'TLW': [100], 'LWP': [101], 'WPK': [102], 'PKA': [103], 'KAV': [104], 'AVL': [105], 'VLE': [106, 233], 'LEA': [107], 'EAL': [108], 'ALD': [109], 'LDE': [110], 'DEA': [111], 'EAI': [112], 'AIK': [113], 'IKE': [114], 'KEN': [115], 'ENR': [116], 'NRW': [117], 'RWQ': [118], 'WQS': [119], 'QSA': [120], 'SAL': [121], 'ALK': [122], 'LKI': [123], 'KIF': [124], 'IFN': [125], 'FNL': [126], 'NLL': [127], 'LLR': [128], 'LRK': [129], 'RKQ': [130], 'KQH': [131], 'QHW': [132], 'HWY': [133], 'WYE': [134], 'YEP': [135], 'EPR': [136], 'PRC': [137], 'RCK': [138], 'CKT': [139], 'KTY': [140, 464], 'TYT': [141, 465], 'YTK': [142], 'TKL': [143], 'KLF': [144], 'LFK': [145], 'FKV': [146], 'KVL': [147], 'VLG': [148], 'LGN': [149], 'GNC': [150], 'NCK': [151], 'CKQ': [152], 'KQP': [153], 'QPD': [154, 313], 'PDQ': [155], 'DQA': [156], 'QAS': [157], 'ASL': [158], 'SLL': [159], 'LLF': [160], 'LFE': [161], 'FEV': [162], 'EVM': [163], 'VML': [164], 'MLS': [165], 'LSE': [166], 'SEG': [167], 'EGL': [168], 'GLK': [169], 'LKP': [170], 'KPT': [171], 'PTI': [172], 'TID': [173], 'IDV': [174], 'DVY': [175], 'VYT': [176], 'YTS': [177], 'TSL': [178], 'SLI': [179], 'LIA': [180], 'IAV': [181], 'AVY': [182], 'VYG': [183], 'YGK': [184, 255], 'GKS': [185], 'KSG': [186], 'GLL': [188, 400], 'LLD': [189], 'LDK': [190], 'DKA': [191], 'KAF': [192], 'AFS': [193], 'FST': [194], 'STL': [195], 'TLE': [196], 'LEY': [197], 'EYM': [198], 'YMK': [199], 'MKS': [200], 'KSA': [201], 'SAS': [202], 'ASD': [203], 'SDC': [204], 'DCK': [205], 'CKP': [206, 452], 'KPD': [207, 453], 'PDV': [208, 279], 'DVF': [209, 280], 'VFT': [210, 281], 'FTF': [211], 'TFT': [212], 'FTV': [213], 'TVL': [214], 'VLI': [215], 'ISC': [217], 'SCC': [218], 'CCC': [219], 'CCK': [220], 'CKL': [221], 'KLG': [222], 'LGR': [223], 'GRF': [224], 'RFD': [225], 'FDL': [226], 'DLV': [227], 'LVK': [228, 402], 'VKS': [229], 'KSI': [230], 'SIV': [231], 'IVL': [232], 'LEM': [234], 'EMS': [235], 'MSY': [236], 'SYL': [237], 'YLG': [238], 'LGV': [239], 'GVG': [240], 'VGC': [241], 'GCS': [242], 'TVT': [245, 351], 'VTY': [246, 352], 'TYN': [247, 353], 'YNT': [248], 'NTI': [249], 'TII': [250], 'IID': [251], 'IDG': [252], 'DGY': [253], 'GYG': [254], 'GKA': [256, 327, 362], 'KAG': [257, 328, 363], 'AGM': [258, 329], 'GMF': [259], 'MFE': [260], 'FEE': [261], 'EEM': [262], 'EME': [263], 'MEN': [264], 'ENV': [265], 'NVL': [266], 'VLA': [267], 'LAD': [268], 'ADM': [269], 'DMI': [270], 'MIE': [271], 'IED': [272], 'EDG': [273], 'DGD': [274], 'GDS': [275], 'DSL': [276], 'SLP': [277], 'LPD': [278], 'FTL': [282], 'TLN': [283], 'LNS': [284], 'NSI': [285, 385], 'SII': [286], 'IIG': [287], 'IGS': [288], 'GSY': [289], 'SYG': [290, 430], 'YGN': [291], 'GNG': [292], 'NGG': [293], 'GGD': [294], 'GDT': [295], 'DTK': [296], 'TKK': [297], 'KKM': [298, 333], 'KME': [299], 'MES': [300], 'ESW': [301], 'SWY': [302], 'WYN': [303], 'YNR': [304], 'NRF': [305], 'RFQ': [306], 'FQL': [307], 'QLM': [308], 'LMG': [309], 'MGV': [310], 'GVQ': [311], 'VQP': [312], 'PDI': [314], 'DIT': [315], 'ITT': [316], 'TTF': [317], 'TFN': [318], 'FNI': [319], 'NIL': [320], 'ILI': [321], 'LIL': [322], 'ILS': [323], 'LSF': [324], 'SFG': [325], 'FGK': [326, 361], 'GMY': [330], 'MYK': [331], 'YKK': [332], 'KMC': [334], 'MCS': [335], 'CSV': [336], 'SVM': [337], 'VME': [338], 'MEF': [339], 'EFM': [340], 'FME': [341], 'MEK': [342], 'EKR': [343], 'KRF': [344], 'RFF': [345], 'FFS': [346], 'FSL': [347], 'SLT': [348], 'LTT': [349], 'TTV': [350], 'YNI': [354], 'NIV': [355], 'IVI': [356], 'VIE': [357], 'IET': [358], 'ETF': [359], 'TFG': [360], 'AGR': [364], 'GRI': [365], 'RIE': [366], 'IEK': [367], 'EKM': [368], 'KMD': [369], 'MDD': [370], 'DDI': [371], 'DIF': [372], 'IFR': [373], 'FRK': [374], 'RKM': [375], 'KMK': [376], 'MKY': [377], 'KYQ': [378], 'YQG': [379], 'QGV': [380], 'GVK': [381], 'VKP': [382], 'KPN': [383], 'PNS': [384], 'SIT': [386], 'ITY': [387], 'TYC': [388], 'YCS': [389], 'CSL': [390], 'SLV': [391], 'LVN': [392], 'VNA': [393], 'NAY': [394], 'AYS': [395], 'YSK': [396], 'SKV': [397], 'KVG': [398], 'VGL': [399], 'LLV': [401], 'VKI': [403], 'KID': [404], 'IDS': [405], 'DSI': [406], 'SIL': [407], 'LRQ': [409], 'RQI': [410], 'QIV': [411], 'IVN': [412], 'VNS': [413], 'NSD': [414], 'SDV': [415], 'DVI': [416], 'VIL': [417], 'ILD': [418], 'LDT': [419], 'DTP': [420], 'TPF': [421], 'PFF': [422], 'FFN': [423], 'FNC': [424], 'NCI': [425], 'CII': [426], 'IIN': [427], 'NSY': [429], 'YGQ': [431], 'GQA': [432], 'QAG': [433], 'AGD': [434], 'GDL': [435], 'DLA': [436], 'LAT': [437], 'ATM': [438, 460], 'TMK': [439], 'MKE': [440], 'ELY': [442], 'LYI': [443], 'YIQ': [444], 'IQM': [445], 'QME': [446], 'MEE': [447], 'EER': [448], 'RKC': [450], 'KCK': [451], 'PDK': [454], 'DKV': [455], 'KVT': [456], 'VTF': [457], 'TFA': [458], 'FAT': [459], 'TMI': [461], 'MIK': [462], 'IKT': [463], 'YTA': [466], 'TAH': [467], 'AHG': [468], 'HGI': [469], 'GIF': [470], 'IFD': [471], 'FDA': [472], 'DAV': [473], 'AVH': [474], 'VHE': [475], 'HEL': [476], 'ELE': [477], 'LEK': [478], 'EKQ': [479], 'KQM': [480], 'QMI': [481], 'MIS': [482], 'STG': [484], 'GKK': [486], 'KKR': [487], 'KRL': [488], 'RLM': [489]}" /ripp_evidence="{}" /top_kmer_word="GKA" /top_kmer_hits=256 /top_kmer_hits=327 /top_kmer_hits=362 /table="GKAGMFEEM" /table="GKAGMYKKM" /table="GKAGRIEKM" /pattern="GKAG[MR][FYI][EK][EK]M" /has_repeat=True /cyclopeptide_analysis="GKAG[MR][FYI][EK][EK]M//GKAGMFEEM|G KAGMYKKM|GKAGRIEKM//MELIQNPIQGINSAYAIENIKLCFSRQHIPSTVCSRRVA SVSTTPTTCSTKIPNDGTGKMGSGLISTRHRVDPKKELSRILRAESAVKGIERKANSEK YLTLWPKAVLEALDEAIKENRWQSALKIFNLLRKQHWYEPRCKTYTKLFKVLGNCKQPD QASLLFEVMLSEGLKPTIDVYTSLIAVYGKSGLLDKAFSTLEYMKSASDCKPDVFTFTV LISCCCKLGRFDLVKSIVLEMSYLGVGCSTVTYNTIIDGYGKAGMFEEMENVLADMIED GDSLPDVFTLNSIIGSYGNGGDTKKMESWYNRFQLMGVQPDITTFNILILSFGKAGMYK KMCSVMEFMEKRFFSLTTVTYNIVIETFGKAGRIEKMDDIFRKMKYQGVKPNSITYCSL VNAYSKVGLLVKIDSILRQIVNSDVILDTPFFNCIINSYGQAGDLATMKELYIQMEERK CKPDKVTFATMIKTYTAHGIFDAVHELEKQMISTGKKRLME//CDS//9824259|982 5962//LOC17886706////" CDS complement(join(15724..15752,15875..16958,17052..17426)) /gene="LOC17886706" /note="Derived by automated computational analysis using gene prediction method: Gnomon." /codon_start=1 /product="LOC17886_149" /protein_id="XP_006290968.1" /db_xref="GeneID:17886706" /translation="MELIQNPIQGINSAYAIENIKLCFSRQHIPSTVCSRRVASVSTTP TTCSTKIPNDGTGKMGSGLISTRHRVDPKKELSRILRAESAVKGIERKANSEKYLTLWP KAVLEALDEAIKENRWQSALKIFNLLRKQHWYEPRCKTYTKLFKVLGNCKQPDQASLLF EVMLSEGLKPTIDVYTSLIAVYGKSGLLDKAFSTLEYMKSASDCKPDVFTFTVLISCCC KLGRFDLVKSIVLEMSYLGVGCSTVTYNTIIDGYGKAGMFEEMENVLADMIEDGDSLPD VFTLNSIIGSYGNGGDTKKMESWYNRFQLMGVQPDITTFNILILSFGKAGMYKKMCSVM EFMEKRFFSLTTVTYNIVIETFGKAGRIEKMDDIFRKMKYQGVKPNSITYCSLVNAYSK VGLLVKIDSILRQIVNSDVILDTPFFNCIINSYGQAGDLATMKELYIQMEERKCKPDKV TFATMIKTYTAHGIFDAVHELEKQMISTDIGKKRLME" /locus_tag="LOC17886_149" /kmer_dict="{'MEL': [0], 'ELI': [1], 'LIQ': [2], 'IQN': [3], 'QNP': [4], 'NPI': [5], 'PIQ': [6], 'IQG': [7], 'QGI': [8], 'GIN': [9], 'INS': [10, 428], 'NSA': [11], 'SAY': [12], 'AYA': [13], 'YAI': [14], 'AIE': [15], 'IEN': [16], 'ENI': [17], 'NIK': [18], 'IKL': [19], 'KLC': [20], 'LCF': [21], 'CFS': [22], 'FSR': [23], 'SRQ': [24], 'RQH': [25], 'QHI': [26], 'HIP': [27], 'IPS': [28], 'PST': [29], 'STV': [30, 244], 'TVC': [31], 'VCS': [32], 'CSR': [33], 'SRR': [34], 'RRV': [35], 'RVA': [36], 'VAS': [37], 'ASV': [38], 'SVS': [39], 'VST': [40], 'STT': [41], 'TTP': [42], 'TPT': [43], 'PTT': [44], 'TTC': [45], 'TCS': [46], 'CST': [47, 243], 'STK': [48], 'TKI': [49], 'KIP': [50], 'IPN': [51], 'PND': [52], 'NDG': [53], 'DGT': [54], 'GTG': [55], 'TGK': [56], 'GKM': [57], 'KMG': [58], 'MGS': [59], 'GSG': [60], 'SGL': [61, 187], 'GLI': [62], 'LIS': [63, 216], 'IST': [64, 483], 'STR': [65], 'TRH': [66], 'RHR': [67], 'HRV': [68], 'RVD': [69], 'VDP': [70], 'DPK': [71], 'PKK': [72], 'KKE': [73], 'KEL': [74, 441], 'ELS': [75], 'LSR': [76], 'SRI': [77], 'RIL': [78], 'ILR': [79, 408], 'LRA': [80], 'RAE': [81], 'AES': [82], 'ESA': [83], 'SAV': [84], 'AVK': [85], 'VKG': [86], 'KGI': [87], 'GIE': [88], 'IER': [89], 'ERK': [90, 449], 'RKA': [91], 'KAN': [92], 'ANS': [93], 'NSE': [94], 'SEK': [95], 'EKY': [96], 'KYL': [97], 'YLT': [98], 'LTL': [99], 'TLW': [100], 'LWP': [101], 'WPK': [102], 'PKA': [103], 'KAV': [104], 'AVL': [105], 'VLE': [106, 233], 'LEA': [107], 'EAL': [108], 'ALD': [109], 'LDE': [110], 'DEA': [111], 'EAI': [112], 'AIK': [113], 'IKE': [114], 'KEN': [115], 'ENR': [116], 'NRW': [117], 'RWQ': [118], 'WQS': [119], 'QSA': [120], 'SAL': [121], 'ALK': [122], 'LKI': [123], 'KIF': [124], 'IFN': [125], 'FNL': [126], 'NLL': [127], 'LLR': [128], 'LRK': [129], 'RKQ': [130], 'KQH': [131], 'QHW': [132], 'HWY': [133], 'WYE': [134], 'YEP': [135], 'EPR': [136], 'PRC': [137], 'RCK': [138], 'CKT': [139], 'KTY': [140, 464], 'TYT': [141, 465], 'YTK': [142], 'TKL': [143], 'KLF': [144], 'LFK': [145], 'FKV': [146], 'KVL': [147], 'VLG': [148], 'LGN': [149], 'GNC': [150], 'NCK': [151], 'CKQ': [152], 'KQP': [153], 'QPD': [154, 313], 'PDQ': [155], 'DQA': [156], 'QAS': [157], 'ASL': [158], 'SLL': [159], 'LLF': [160], 'LFE': [161], 'FEV': [162], 'EVM': [163], 'VML': [164], 'MLS': [165], 'LSE': [166], 'SEG': [167], 'EGL': [168], 'GLK': [169], 'LKP': [170], 'KPT': [171], 'PTI': [172], 'TID': [173], 'IDV': [174], 'DVY': [175], 'VYT': [176], 'YTS': [177], 'TSL': [178], 'SLI': [179], 'LIA': [180], 'IAV': [181], 'AVY': [182], 'VYG': [183], 'YGK': [184, 255], 'GKS': [185], 'KSG': [186], 'GLL': [188, 400], 'LLD': [189], 'LDK': [190], 'DKA': [191], 'KAF': [192], 'AFS': [193], 'FST': [194], 'STL': [195], 'TLE': [196], 'LEY': [197], 'EYM': [198], 'YMK': [199], 'MKS': [200], 'KSA': [201], 'SAS': [202], 'ASD': [203], 'SDC': [204], 'DCK': [205], 'CKP': [206, 452], 'KPD': [207, 453], 'PDV': [208, 279], 'DVF': [209, 280], 'VFT': [210, 281], 'FTF': [211], 'TFT': [212], 'FTV': [213], 'TVL': [214], 'VLI': [215], 'ISC': [217], 'SCC': [218], 'CCC': [219], 'CCK': [220], 'CKL': [221], 'KLG': [222], 'LGR': [223], 'GRF': [224], 'RFD': [225], 'FDL': [226], 'DLV': [227], 'LVK': [228, 402], 'VKS': [229], 'KSI': [230], 'SIV': [231], 'IVL': [232], 'LEM': [234], 'EMS': [235], 'MSY': [236], 'SYL': [237], 'YLG': [238], 'LGV': [239], 'GVG': [240], 'VGC': [241], 'GCS': [242], 'TVT': [245, 351], 'VTY': [246, 352], 'TYN': [247, 353], 'YNT': [248], 'NTI': [249], 'TII': [250], 'IID': [251], 'IDG': [252], 'DGY': [253], 'GYG': [254], 'GKA': [256, 327, 362], 'KAG': [257, 328, 363], 'AGM': [258, 329], 'GMF': [259], 'MFE': [260], 'FEE': [261], 'EEM': [262], 'EME': [263], 'MEN': [264], 'ENV': [265], 'NVL': [266], 'VLA': [267], 'LAD': [268], 'ADM': [269], 'DMI': [270], 'MIE': [271], 'IED': [272], 'EDG': [273], 'DGD': [274], 'GDS': [275], 'DSL': [276], 'SLP': [277], 'LPD': [278], 'FTL': [282], 'TLN': [283], 'LNS': [284], 'NSI': [285, 385], 'SII': [286], 'IIG': [287], 'IGS': [288], 'GSY': [289], 'SYG': [290, 430], 'YGN': [291], 'GNG': [292], 'NGG': [293], 'GGD': [294], 'GDT': [295], 'DTK': [296], 'TKK': [297], 'KKM': [298, 333], 'KME': [299], 'MES': [300], 'ESW': [301], 'SWY': [302], 'WYN': [303], 'YNR': [304], 'NRF': [305], 'RFQ': [306], 'FQL': [307], 'QLM': [308], 'LMG': [309], 'MGV': [310], 'GVQ': [311], 'VQP': [312], 'PDI': [314], 'DIT': [315], 'ITT': [316], 'TTF': [317], 'TFN': [318], 'FNI': [319], 'NIL': [320], 'ILI': [321], 'LIL': [322], 'ILS': [323], 'LSF': [324], 'SFG': [325], 'FGK': [326, 361], 'GMY': [330], 'MYK': [331], 'YKK': [332], 'KMC': [334], 'MCS': [335], 'CSV': [336], 'SVM': [337], 'VME': [338], 'MEF': [339], 'EFM': [340], 'FME': [341], 'MEK': [342], 'EKR': [343], 'KRF': [344], 'RFF': [345], 'FFS': [346], 'FSL': [347], 'SLT': [348], 'LTT': [349], 'TTV': [350], 'YNI': [354], 'NIV': [355], 'IVI': [356], 'VIE': [357], 'IET': [358], 'ETF': [359], 'TFG': [360], 'AGR': [364], 'GRI': [365], 'RIE': [366], 'IEK': [367], 'EKM': [368], 'KMD': [369], 'MDD': [370], 'DDI': [371], 'DIF': [372], 'IFR': [373], 'FRK': [374], 'RKM': [375], 'KMK': [376], 'MKY': [377], 'KYQ': [378], 'YQG': [379], 'QGV': [380], 'GVK': [381], 'VKP': [382], 'KPN': [383], 'PNS': [384], 'SIT': [386], 'ITY': [387], 'TYC': [388], 'YCS': [389], 'CSL': [390], 'SLV': [391], 'LVN': [392], 'VNA': [393], 'NAY': [394], 'AYS': [395], 'YSK': [396], 'SKV': [397], 'KVG': [398], 'VGL': [399], 'LLV': [401], 'VKI': [403], 'KID': [404], 'IDS': [405], 'DSI': [406], 'SIL': [407], 'LRQ': [409], 'RQI': [410], 'QIV': [411], 'IVN': [412], 'VNS': [413], 'NSD': [414], 'SDV': [415], 'DVI': [416], 'VIL': [417], 'ILD': [418], 'LDT': [419], 'DTP': [420], 'TPF': [421], 'PFF': [422], 'FFN': [423], 'FNC': [424], 'NCI': [425], 'CII': [426], 'IIN': [427], 'NSY': [429], 'YGQ': [431], 'GQA': [432], 'QAG': [433], 'AGD': [434], 'GDL': [435], 'DLA': [436], 'LAT': [437], 'ATM': [438, 460], 'TMK': [439], 'MKE': [440], 'ELY': [442], 'LYI': [443], 'YIQ': [444], 'IQM': [445], 'QME': [446], 'MEE': [447], 'EER': [448], 'RKC': [450], 'KCK': [451], 'PDK': [454], 'DKV': [455], 'KVT': [456], 'VTF': [457], 'TFA': [458], 'FAT': [459], 'TMI': [461], 'MIK': [462], 'IKT': [463], 'YTA': [466], 'TAH': [467], 'AHG': [468], 'HGI': [469], 'GIF': [470], 'IFD': [471], 'FDA': [472], 'DAV': [473], 'AVH': [474], 'VHE': [475], 'HEL': [476], 'ELE': [477], 'LEK': [478], 'EKQ': [479], 'KQM': [480], 'QMI': [481], 'MIS': [482], 'STD': [484], 'TDI': [485], 'DIG': [486], 'IGK': [487], 'GKK': [488], 'KKR': [489], 'KRL': [490], 'RLM': [491]}" /ripp_evidence="{}" /top_kmer_word="GKA" /top_kmer_hits=256 /top_kmer_hits=327 /top_kmer_hits=362 /table="GKAGMFEEM" /table="GKAGMYKKM" /table="GKAGRIEKM" /pattern="GKAG[MR][FYI][EK][EK]M" /has_repeat=True /cyclopeptide_analysis="GKAG[MR][FYI][EK][EK]M//GKAGMFEEM|G KAGMYKKM|GKAGRIEKM//MELIQNPIQGINSAYAIENIKLCFSRQHIPSTVCSRRVA SVSTTPTTCSTKIPNDGTGKMGSGLISTRHRVDPKKELSRILRAESAVKGIERKANSEK YLTLWPKAVLEALDEAIKENRWQSALKIFNLLRKQHWYEPRCKTYTKLFKVLGNCKQPD QASLLFEVMLSEGLKPTIDVYTSLIAVYGKSGLLDKAFSTLEYMKSASDCKPDVFTFTV LISCCCKLGRFDLVKSIVLEMSYLGVGCSTVTYNTIIDGYGKAGMFEEMENVLADMIED GDSLPDVFTLNSIIGSYGNGGDTKKMESWYNRFQLMGVQPDITTFNILILSFGKAGMYK KMCSVMEFMEKRFFSLTTVTYNIVIETFGKAGRIEKMDDIFRKMKYQGVKPNSITYCSL VNAYSKVGLLVKIDSILRQIVNSDVILDTPFFNCIINSYGQAGDLATMKELYIQMEERK CKPDKVTFATMIKTYTAHGIFDAVHELEKQMISTDIGKKRLME//CDS//9824259|9 825962//LOC17886706////" assembly_gap 18286..18385 /estimated_length=unknown /gap_type="within scaffold" /linkage_evidence="map" ORIGIN 1 taagtaagat gacaaatgat agtgggatat gtaccttagt aaatatatac aattcagctg 61 tgtttttttt gtatagagcc ctttattttg ataggacatg tctgtgtgtc aacgatgatg 121 aatctgtctt cactgctgaa agctgtacta aagatgggtt atttcattat cttagtggct 181 gttagtctaa attaaaggaa attatgttgc tttttcgttc ttgtgccaat tttgattgtt 241 ttcttgtgtt attgaccttc tttctgacag gttctacttt tctcggcaac ttttaatgaa 301 actgtcaaag attttgtggc aaggacagtc aaggatccta atcaattgtt tgtcaaaaga 361 gaggatctgg ctttggactc ggtaaagcag tttaaagttc tttgcccgaa ggagcaaaac 421 aagatcgaag tcattaagga tcagattatg gaacttgggg atattgggca aaccattatc 481 tttgtgaaaa caaaagtgtc tgctaacaag gtccacaaag cccttgcaga aatgggatat 541 gatgtcacca gtgtccatgg tagtatgtct gaagtggaca gggataagat agttaaggag 601 ttcaaagact gccttactca agtgctaatt gctactgatg tcattgcaag aggttttgac 661 caacagcggg taaatattat catttggccc ttttactctc ttctcctttt tccccaatgg 721 tgcttcgtag ttaatgcctc ttgctggttt tatacaatac ttgcaggtga atttggttgt 781 caattacaat cttcccacca aatatgagac cggagagcca gattatgagg tgtaccttca 841 cagggttggg agagctggcc ggtttggtcg taaaggttag ttttgattcg tccatttttt 901 taaactcaag tgttgccaca agttgtcata agtttctgaa ctatgtattt gtattgtagg 961 agcggtattt aacctgctgt tagacgatgg gtgggataaa gaggtgatgg agaagatcga 1021 gaagtatttt ggagcaaatg ttaaggaggt ataataagat ttatgaaaac tgctaattat 1081 ctttctatag tgtttgtgaa aacagtatcc aatgatttta aactttactg cagatcaagt 1141 cgtggaactc agaggacgaa tacaagggtg cgttaaagga agctggcctg ctcgacgagt 1201 gagaaagagg gacaaaatgt gttcaaaaag tttgaaggac tgtcgtctgt ttttttgaga 1261 ttgttgaaga aagaaacttg tatacgtctt tgggttttct tgtaatcttt ctatcagatt 1321 gctgagattt tcagactttg tagtttttta taaaggaaaa aacaaacata attttgatgt 1381 caatgtcaat cacttttaca acatcggata aggagtcata agacacaaaa ccaagacttt 1441 ggtttgtgat gagttcaatg tgcaaggctt attaattcag atatttgagg ttttagcagc 1501 aaggtgaatc aatgctcttc gatgatatgt agttcgcagc ttcttgaatt tctgtacaaa 1561 tgctgctgta tcaatctcct tctctaggaa tttctcttgc agcgcttcag attcttcatc 1621 cacctgattc atagcctctg caaaaacagt aaaatgtgtt tacaaatgtt gacacaagaa 1681 cagttgagaa gaagagacga gtggaaaatc catagcaatg gaaatttgtt accttggagt 1741 ttatgaagaa gagaaccagg ggagtagaat ttgaggatct cttctttttg cctctcaagc 1801 tcattaagct tttcttgcgc ggctgcgagc tcagttgtac ggataattct gcactgtaaa 1861 agaagtaagg attggtaaat aagagatatc aaaaaggtac actgaacaag aaaagttggt 1921 tcttgataca cacttggttc ctgagctcca ttatctgtgg ctccttctcc aagttctctc 1981 ctgtttcatg tgatcacatg aacaattatt agaatcctgg attgaactaa agtttcttgt 2041 agaatgacat caaccataga gaacttacta gctatctgca atgtttctct gcggagctcc 2101 tcttttatct gatggacaga aacaaacaag gaacaattaa cgtccagaga ctataaaaaa 2161 gaactagaaa gctctaatta ctggcaacat ataaaagatg atgctatgat aaaaaggcta 2221 aaatcaccac ataactaact aagctacagt cttaaaacta aagacaatac gcgttattaa 2281 gaaacaacag actgttctaa agacttacat tgttctgtat tttgacctgg tcaagtgaaa 2341 gcagaaattg ctgatacgca tctttgtcag agagaagctt cctaagctcg tccacgctac 2401 agaaaagtat acgctaacgc tatttaaaaa aaaaaaacag acaaaaaacc gcattacacg 2461 agaagcatag taaacagcga accttttatc tttcaagaag gcaataatgc cagctgcttc 2521 cccaggcgac acatttgctg gaatctgacc tgaagtttga ggccgggatg agcttggcga 2581 gctgactaaa gaaggtgagt accatggcga ttgtgaagaa gcttccggag gacgagatgt 2641 cccttgttgt tgttcttttg atccccttga tgtacacaac aaaaagaaac gtcatcaatt 2701 actaaacaca aaggcgatgc tacaacatcc aagacataaa tttgaatagg tgcttaaggg 2761 cacagctaaa agaacaaaaa atacttcttc tgatcagatt cacatcactg aaacaaccaa 2821 gatgcaaaac atagagactc atcaacctaa ctctcacatg aactacaaca ttttaaatcc 2881 aataacagca actatgaacc tcaaatcagt aactgagcaa ataatctaca ctaaagtgct 2941 cttagaaaaa cgcactcttc aattgttgat cacagctcaa atttttttgg cgaaccaact 3001 ttacataaca acctaataat atccttaatc gtgaacagat ctaatttccg tagctcaagt 3061 atccgaattt cataaaaatc aaacagagca tatatgaaac agattgcgaa aaattcgcac 3121 aatcacggaa acacaataag attgtaagag ttggtattac cagaaattga acatcgtttc 3181 aagaaatcgc cgaccaaatc aaaggagaat tgactttcgt attgagcaaa actcgaatct 3241 ttctacttcc ttcttcctta gcagatcgac aaaaatatta acaacttaaa tcccgaaacc 3301 agagacctcc gtgtttaaga gagtttcaac gaaaattcca attcttcgat cttctccgtt 3361 tcatttcagt tttttttttt ttttggttcc tgctctctaa aaggcccaaa tacgaatatt 3421 ttaggcccat attaactctt tttttttggt tgaataggcc catattaact gtccaagcgg 3481 taccgtttcg aacatcgtcg tccttatcca cgtctaacgg ctcgcgtttc ctatatagta 3541 catacacaga gtcttcaccg aagcttcgaa aagagctcct catcaatgga gtcttctctc 3601 ttttctccat cttcctcttc tatattcact gcaaaatcta cgcttctttc ttctccaaaa 3661 cccaaattct tctctttctc tatcaaatct tcaatagaga aacctaaacc caagcccaaa 3721 ctagagacaa gttcatcaaa atcccagtca tgggtcagcc ccgattggct cacatctctt 3781 actcgtaccc tttcctcagg taaaaacgac gattcgggca taccaatcgc gagcgcgaag 3841 ctcgacgacg tctctgacct cctcggagga gctctcttct tacctctata caaatggatg 3901 aacgagtacg gacccattta ccgtctcgct gctggtcctc gaaatttcgt ggtcgtgagt 3961 gacccagcga tcgctaaaca cgttttgagg aactatccta agtacgctaa aggcttagtc 4021 gctgaagtct ctgagttcct ttttggttcg ggtttcgcaa tcgctgaagg tcctctttgg 4081 acggtaattt catcttcttc aatctctatt atgatattag tggaatcatt gaagtaatgt 4141 ggcactctct tgtgttataa gtaaccttga atctggaatt aggttccaat cttctcaatt 4201 ggtatcagtt ttgtaccaat ttgaaccatt gaattctgat ttttgatata taggcgaggc 4261 gaaaagcggt ggttccgtcc cttcacagga ggtatttgtc tgtgattgtg gagagagtat 4321 tctgcaaaag tgcagagagg cttgttgaga agctgcagcc ttatgcaaag gatggaagtg 4381 ctgtgaacat ggaagagaag ttctctcagt tgacacttga tgttattggc ttgtcacttt 4441 ttaactacaa ttttgattct ttgactaccg atagtcctgt cattgaagct gtttacactg 4501 ctcttaaaga agctgagctt cgttctactg atcttttacc atattggaag gcaagttttg 4561 tgtgttttta catgtggttt gttgattgcg gcacatttgg attcttgtca atttagaggc 4621 tttggttgtt tttttcagat cgatgcattg tgtaagatta taccgagaca ggtgaaagct 4681 gaaaaggctg taactttgat aagggaaact gtggaagacc ttatttccaa gtgcaaagaa 4741 attgttgaaa gagaaggcga aagaatcaat gatgaggaat acgtaaatga tgctgaccct 4801 agtatccttc gtttcttgct cgcaagcaga gaagaggttt aacttttttc ccttcattcc 4861 attagcaagc ttggccattc attattgcaa actgaagctg atattagatt gtaccgggtt 4921 ttttcaggtg tcaagtgtgc agttacgaga tgatcttctc tccatgcttg tcgcgggtca 4981 tgagaccacc ggatctgttc tcacttggac actttatctc ctaagtaagg taccttttgg 5041 tatcttatac tttgccactt gaaagggagc ttctctgatc tcattgatgg gtaaatgttt 5101 gcctctttaa acttatatat gtgcatatag aactcatctg cattggcgaa agcacaagaa 5161 gaagtagacc gagttttaga gggaagaaac ccggcttttg aggatataaa ggagttgaag 5221 tacattactc gttgtataaa cgagtcaatg cgtctctacc ctcatcctcc tgtaagcaat 5281 caagctcatt tctcgaatta ttcatgaact aaatttactg attgctttat ttcctggtag 5341 gtcttgatta gaagagctca agttccagac attcttccag ggaactacaa ggttaatacc 5401 ggacaagaca ttatgatttc agtctataac atccatcgtt cttccgaggt acagttctct 5461 ttccttcatt taggggatcc cattctggta tcagtttgga tttttcggtt cttgttttgg 5521 ttaggatata taacttgcat ggacacccct aatattacat tcatgcccac aattcttatg 5581 tgtttgtaat tacgaaggta tgggaaaaag ccgaggaatt tctgcctgaa cgattcgaat 5641 tagaaggcgc aatccctaac gaaacaaaca ccgatttcaa gtaaactcac tagtactctt 5701 gtttcgacaa actattaaaa agcaaggtaa tattgggatt acaaatgtta aagatgattt 5761 gcatttcacc agatttatac cgttcagtgg agggcctaga aaatgtgtag gcgatcagtt 5821 tgcattgatg gaggcaattg tggcactcgc ggtgtttctc cagcggttaa acgtggagct 5881 ggttcctgat cagaccatta gcatgaccac tggagcaacc attcacacca ccaatgtatg 5941 acaatgttca ccgactaaag aaaattaatc agactctgtt tcttttttga tatagaatca 6001 ttccaagttt tctgatgctg aatttttttc tttaattgca gggattgtat atgaaagtga 6061 gccaaaggta aaaccaggat gtagaggatg aaattgattt ctgcttttat ctgtctttat 6121 gatcattgat tgttttttgt taacaccttt attatttgtt gttgatggat atgttttata 6181 tacaagtata gtagtctaga tataacgaca aacagaatta tggagttttg gagttcgaga 6241 gaaaaacaaa acaaaacaac tcaattgtat catatcggga atgtgaaaac agtgtatgtg 6301 actgtgctac cagtcatagt atttatcgga aaatgtgaaa gttgaacagt gatatgctac 6361 aattaccagt aaagttttgg taattgtttt atcatttcaa aaccaagtgc catacaacac 6421 aacttggtgt gtttttctgt ttccttgcac taccaatatg gagtatctgt tttgttcgtt 6481 ttcatcaatc agtctcataa ttactaaatc atatactacc atttctttca ttgcactcac 6541 aacattatta ctatagtata actgtttttt ttttatatat atcgtttgta aaacactttt 6601 aaacttgaag accaaaccag tttaactagt gtataaaact ttttccctgg gaaatttatt 6661 atagtgtgta atgtatcata gattcataga tctaatacgt tttatcgaag ctttcaattg 6721 attgagaaag tacaaaatgt aaaaacaata aaagaaggta acaaaaatat atttatcaag 6781 gcaaaatatc tagattctag caataattaa ttttaaacac ccaggccaaa agtatactat 6841 tttaaagctt tttcaataac ttcaataata taattacttt agaatattaa ataaaactgt 6901 aagaaactaa agtataacta aaacccacta ggaccatata tgtaatatta tcctcagtcc 6961 tttacgtatg aacgtatcat ataaaaccat tactagtggt cctttagcgg agtgaggtga 7021 ttcactttca cggacgggaa aatggagaag gaaagctcgg aaagcagaaa cagagctcgt 7081 ctcgccatta tggagctggc caacatgatt agcgttccca tgtccctcaa cgctgccgtg 7141 agactaggca tcgccgacgc tatttggaac ggcggggcca actctcctct ctccgcctcc 7201 gagatcctcc ctcgcctcct tatcccatct gccactacca ccggcggcga tcctgagaat 7261 ctccaacgta tacttcgaat gctcaccagc tacggtgtct tctctgaaca ccttgttggc 7321 tccagcgaga ggaaattttc tcttacggac gttggaaaga ctctcgtcac tgactctgat 7381 ggcctctctt acgcagccta catcctccaa caccaccagg tctcttcatt tttaatggtt 7441 tttgttttgt tgttttagtt tatgtttatc actaccattt tggttggttt gtttggttgg 7501 ctaatgttac atgggaaccc aaatatcata tccttcacaa atctcgtgat tagtctagat 7561 ttcggtatga atgctccggt tatatttttt aagtggtttt cgtttcgttg tttttagttt 7621 acctctacca tttttaggat tggctaatgc tttatatggc taatgcttta tatgggaata 7681 tattacattt tcacgaatct cgagattagt ctagatatga tatttgtgtg taaaaatgac 7741 atattgtagg aagcgttgat gcgagcatgg ccgctagttc acacggcggt ggtggagccc 7801 gagacggagc cgtacgtgaa agccaacggc gaggcggcat acgtgcagta tgggaaaagc 7861 gaggagatga acagtctgat gctcaaggca atgtccgggg tatccgtacc gttcatgaaa 7921 gctatattgg aaggctacga agggtttaag agcgttgagc gtttggtgga cgtaggaggt 7981 agcgcagggg attgtctccg catgatcctt caacactttc ctaatgtccg tgaagggatt 8041 aattttgatt tgcctgaagt tgttgccaaa gcccccaata ttcctggtaa gtttaatatc 8101 tgtaataaaa taagaaaaaa gaatctctgt cttttgtaac gtagtaatta ataatggatg 8161 gatgatattt tttttttgta ttgtatagga gtgagtcacg tgggtgggga tatgttccaa 8221 tcagttccta gcggtgacgc tatcttcatg aaggtttgtg gtatacatta tttgtcacga 8281 gaataccaac ctagctacta ttttttccat ataggacgaa tactgatttc tatatataga 8341 cagtctgttt aaggttagtt tagtttaggc atacatatat attgtataag ctggtcgcac 8401 aaaaaatcat ataagtccct aggggcaata tgtttggtac tatacatatt tggcttagac 8461 gtttatcgtt agatcatgcg actggtcacc tatatttatg taagatcgtt ttaaaaacta 8521 atacatatat ttgtcaaacc aaaaacttgt gatgtagcta aaagcctaga atcatgcatg 8581 gatatgatgt gattgtttgt tgaaattaaa gaacaatata atataataca aacaaataaa 8641 cacatttctt aatgcacagt gggtattaac gacatggacg gatgaagaat gcaaggagat 8701 aatgaagaat tgctacaacg cattacccgt tggaggaaag ctaatcgcgt gtgagcctgt 8761 cttgcctaag gaaaccgatg atagccaccg gactcgtgcc ttgttagaag gcgacatctt 8821 cgtcatgacc atctatagaa ccaaaggtaa gcataggacc gaagaagagt ttaaagagct 8881 tggtctctct gcgggattcc ctactttccg acctttctac attgattact tctacaccat 8941 cttggagttt cagaagtaat attatcaaaa gatttatctt tcggtttttt ttttaaaaga 9001 ataaactttg aaataataaa tcaaggaggg aggcgtcttt gttgagatct ctaataaaat 9061 acattttcat catcaagatg taataaggga taatctaata gtctatttct attttttttg 9121 agtgcatctt tcgagaaaag gaattaaaaa aaaaaaaact ctttgatgat ttaatttcaa 9181 gttcgataca agatatgtga cttattaatt ttatatcaac ttataaacta aatttttcta 9241 cccgatcgag actcaaatgc tctaaaacat cttgcattaa aattgaaacg ttaatactcg 9301 aagatccctt atcattcaca gcctttttcg ccattactgc aagttcttga atacgtctcc 9361 ttcgtctcac aaattcactg tgaacatcat catctacacg ttgacaatct tcgtccatca 9421 aaagctttat agctttcaca actctttgtt tcgtgaccaa cactccaact ttctcctcgt 9481 ctccccatct caccggaatc tccaccccaa ccctaacccc tatcttcaat atctccacga 9541 ttagtttctc attgaggaat tgttcagcga acaatggcca tgtgatcatt ggtacaccaa 9601 aacatatcgc ttctattgta gagttccaac cacagtgaga caaaaaacct ccggttgagc 9661 catgtgagag tatcatagcc tgaggactcc aaccttttat cactatccct cttcctctaa 9721 ctctctcttc aaaattttct tgttttagcc attcatctag ctcattcatg tgtttttcct 9781 cggtcttgat tacccaaata aaaggttttc ccgactcttc taaccctaaa cctagttcta 9841 tcaattgatt aggtattagt cgacatagac tacctagaca aacatataac actgaccttg 9901 gtctcatcga atctagaaag tgcaagcact cggtcttgct tatcgcgata ttacagttgt 9961 ttcctctatc aaataggtca gccatacggt cgttgcataa agaaacgggt ccaacgaacc 10021 ataccttcat attgatggcc tcagcgtagg cttctgcata gccaggctcc aattcttgga 10081 agctattaac gataacccca aaggcttctg attcagattc acgcatcttg tcgcgtacgt 10141 catccatatt tgctaacttc tcaaacgcac ctggtaactg agctctggct atctcaatcc 10201 tatgtggcat tgccggtata gagaatggct ctgaggctga agaaaccgag aggtgcgggc 10261 tatgaagatg gaggttgtgc gaactcaaaa gagagaagca acacattcca tggaacacga 10321 tcctcgggat cttaaacctc tttgcggttt tcgacgtcca aacaaggcat ttatcggaga 10381 ttatgcaact tggagggatg tcttgttgct caagaaaccg ttccaaggga tcctgaagtt 10441 tatccagagc gtcatagaat ctccgtagaa ggtctttgga tgggagagtg tcgagagtct 10501 cacaatcttt gggaagaccg aagtctttgt aaggaattgg aaacgtaacg acgttgattt 10561 cgagaccagc ctcggatctt gctcggtcaa ctgtcttcac aaacctagaa gcattttgag 10621 gggttgtaac tatggttacg atgttgcctt gtcgcgctag aatcttggat atgtcgacca 10681 tagggatcaa atgcccttga gccataagag ggatcaaaac aaagtgaagt cctttggctt 10741 ttgaatctat ggctgtttcc atttttgggt ttagcaaatg tttacgcata tagaaggtaa 10801 acaaaattct caaacaacat atatatgtgt ggatgcatct ggtgagagat ctaactaaat 10861 taattgggaa agtcgtcaaa agctgtatat attgactttg aacaagtcat ttaaaacaaa 10921 aactattgtt tcgagaacca aatcatgtat tccttgtttt aaaaatttta gtcgctgacg 10981 gtggtgagtt acgtcattat accatgacaa tgaaatccta aaatatatgt ttatcgagtt 11041 gcataagaat tcgaaaaact tcaaggaaaa tatgtggaag tttaaattct aaaatgatga 11101 atatatccag ttctatatac gtaactttaa gttaaaataa gcttatgtta ttttaagttt 11161 gttaattagt attacacatc taaaatattc aatatataca aacacaacta gataaaaata 11221 ctgttatcct tttagtttac tttctgataa tgattgctat attgtttatt gtgatttcgg 11281 tttaagaagt gcaagtaggt caagctaatt atggtttaag agttccatat tgattatggt 11341 tttgtccccg cgccacgata tagatcagtg gtttggttat cacatgattg attattcaca 11401 tcgttaatat ttacatagaa gtttaattta tttagttttc tttccggtct agtgttcaag 11461 agattgtttt gttaataatc gaataaaatt ccaacataat ttctacaaga gttcacgttg 11521 agtttttaga ttagacaaaa gaagtaaaat ggaaccatct tcatatataa agtgtggttt 11581 aaattgatac attgttgtct atcagaatat atgtatacta gaaatatttt ttcaacggct 11641 aattaaaaac aagatatatc taatacattt tagataaaat aatattatat cttgttctta 11701 attagccgtt gaaatcacat tatatctttt ctaatccaag aaatccaaga aatgctagaa 11761 aagatgtatg aaacaaagaa aaaatggatt tgaagacggt tcttttctta tcatacattt 11821 tagaaactat atatttgaaa ccaaagcatt tctaccaact cattttaaat acataaaccc 11881 caaacttcac ggcatatatg ttcgtagttt cctttttgtt ttaaatgagt tctgtttgaa 11941 aaggacattt gtcttttctt tgtttgcatg aaaaagactc tttgaaacgt tcaatatgtg 12001 cgtatgcagt ggtgaacaaa ctaacgtaga ctagttcaaa ttttgggagt tctcgagact 12061 ttgagcattg acgtatatac tcacaccatt tggttactgt attttttgtt tacatttttc 12121 ttttcttttc gttttggttc ttgtaatcaa tcatttgatt gtttcgttca tgtatttgtt 12181 ttttttttaa agaactagct actaaacact tttatatata actttttttg cggaacacat 12241 tagtaattaa catggacata taattacaaa cgaaaagcaa agtccactca agttgaaact 12301 attaaccacg aagtttcgaa aattttgaga atatataagc aaataaatat acacatacgc 12361 acacaagctt gtatcatcaa ttatgcatag agggtacttt acaactatct tttgtagtta 12421 aagttaattc tatcatgcat gacgattgtt tttgcgtcta cgtatacaat tcatgttgtt 12481 ttttttttgt tttgttaaaa gatataacaa ttcatgttgt tttgattaaa gcatgcctct 12541 tttttgctac cacaaagtct tactcatgta taatatgtcc ccatgttact gttttacaag 12601 atcttcatat ttgactactt gagacgaatc aatttgtaaa cttcttacag ttttaaactc 12661 ttaatcaaca aaactaaaga agtttctttt tttttgtttt catctcatga gaatccaaag 12721 ccacgtccaa atgtcaaaac tcaaatcaga aaacttgcat aagaagattc aaagaagttc 12781 ccgtgatctt ctcttaccca aaaggactag tctatcatca tttaatctta tcaaaatcga 12841 tgatttatag aaaaatctta ttcaacactt tagcatgcag ataaggattt cctttatctt 12901 tccttttttg cagaaaactg aatatagtaa tatttaagcg aagaaaaatc gatttcacta 12961 caaagtcatt cttggataat aatcctcaca ctagtcgtct ttggaatatt ggttgtaaaa 13021 attccttaac aactaaagct ttcgatttcc aaattccaat ccccaatata tcttatttct 13081 tcgtctgatt tgacatcatc ctcttttgtc tctcaatgta tgtaaccatg catgttaatt 13141 aagatcactc tgtatattat atggtttgat gtttctgaat taacaaaata ttagttttgg 13201 gcttagtttc acaagagaaa cctaacttac aaaaaaaaaa aaaaaagggt ccaaaagtat 13261 gataattttt ttgtctaaat gatatattgt ggacacataa gtacaaaagc acctttgagg 13321 ctactaaaaa ccagagtctg tctcaacgtc aaacaagacc agctcaatta tttcagagac 13381 attgtgcctg tatttttgaa ttaaaagagt ttgagtatta tttttattag ctatggtttt 13441 tattatacaa acctctttat tctaacatgg aaaagaaaat atcaatccta ataacaatct 13501 ttgagacccc tttgatgttg ggattgctcc ataatgtctt gaatgagcaa tgtgatatta 13561 gcatctgaag atcctccttg ttccaaagcc ttatttgcca agtcactaag ttccctgact 13621 cttcttcttc tctcttctgc ttcttggcta tcacccatta gctcacccac tgcttttctc 13681 acagtttctc tactcaccgt cactcctatc tcctcttcct ttccatattt catcaatgtc 13741 tccactccta tctttaaccc tgattttagt atcttcacaa ttaacttctc gttcaagaat 13801 tgttcagcag acaaaggcca tgtcaataac ggaactcctg cagtgattcc ttctagagtc 13861 gagttccatc cgcagtgagt caaaaaccct ccgatggatg cgtgtgagag gatgaaaact 13921 tgcggcgccc aacctttgat caaaagtcct ctatctctta tccgctcttc gaatccgctt 13981 tgctgcatcc actttgctaa atcctcatat tttccccact ctcttataac ccatataaaa 14041 ggtttattag attcctcaag gcctagtcct agctctttga gctgagccaa gggaagatta 14101 cataaactgc caaggcaaac atagagcacc gaaccagttc cttgagagtc gagccattga 14161 agacattggt cttgaccaat ggaagccttg tctcctcttt cagcattttt tagttctaac 14221 ttattgcaca aggaaacagg tccaacgcac caaacttttc cagtccttgc tttcctatat 14281 tctcttgcat agtcaacctc taactcctca aaactgttca caataacacc ataagagtca 14341 ttatcagctt caataatctt gactgtactc tctttcatat ttccttcaag aggctgcaac 14401 acagagacct gaggtttagt gaactcaact ctatcaggca agccaggtaa atcgaaatac 14461 tcgtcgttag attctataaa ttttaagatc ccgctttctc gaaccacctg tatgcacatg 14521 aggctgaaac aagaaaatcc atggaagaga agtttgggga tcttgaattt ctttgcaagt 14581 cttgaagtga aaggaaggct catgtctcca atgatgcagc tcggccgcgg ctgaaccatc 14641 ttcttcatag ctttctctac ttgctcctca agcgagttgg ccacgtcaaa gaacttcacc 14701 atgtcgacca ttgaagccaa catatctaca ctctcgcacc cttcttgcaa acccgcttgt 14761 cgagacggaa acttaacttc aacgatgttg atggtcggaa aggaagagga agaggagagt 14821 gaagtcttga tcttggctac attttgagta gttgtgatga tagagacggt cacgccttga 14881 cgctgggaca agagtctaga gatatcgacc aatgggatca tatggccttg ggccataaag 14941 ggtattacga cgaagtgaag aggatcatca gaacacattg tagaagatct tacgacgaag 15001 tgaagaggat catgacatct ctatataact acgatagcgt ttagatcaaa aaaagaggtt 15061 tgaccagtct aaagagcctg cgtaaggaaa ttatataaga caacttcaaa tttgagtttt 15121 gattccagag tctggacaac tgtcccaaga ctcccaacct aagtgataat attttctaat 15181 atgtatgaca attagtctga tcgtttgtgt taatgttata ttcgtgtcat catctgtatt 15241 gacaccttgg aataatgaat tagaagcatc atgaaatgag tcaaaaagat aatagttaat 15301 aaaaagaggt ggcgggtcaa acaatgtctg ctgaatattt ttgagaattt ggtatataac 15361 tttatttgac atgatatcag tcgtagatgt atctgttgat ttctttgttt tgttcattta 15421 gtgacacagc tacaaatgat ggcttctaat acttacagtt acccgaatca ttacgttttg 15481 atttggtaga tttcggaact ggccaaattc tcatcagtaa tgaccatgcc gctcttggaa 15541 ccttggtatc cccccaatca cctgaacaga cagttccata acttacttac aggcatgtgt 15601 ctccagttta tcttaaagtt acgagtaagc ggaacagtta cctcaagtga tccacttagt 15661 gtgaacattt cccaacttcc aaaattcttc tgcattagat tgctcaattc acaacccaaa 15721 gcctcactcc ataagcctct tcttgcctat atctttaaac acaataaaag gaacaccgtt 15781 tagaaacaaa tacaatcacc aaatagagct gtaatactca gcatatatct cttatcttaa 15841 ttatagtttt ctaagaggaa atttgaattc tcaccagtgg aaatcatttg tttctcgagt 15901 tcatggactg catcgaatat tccatgagca gtgtaggttt tgatcatagt agcaaaagtg 15961 actttatcag gcttacattt tctctcttcc atttgtatgt ataattcttt cattgtagcc 16021 aaatcaccag cctgaccgta tgaattgatt atacaattga agaatggagt atccagtatc 16081 acatctgaat tcacaatttg cctcaaaatc gaatctatct tcacgagaag accaactttg 16141 ctatacgcgt taacaagcga acaataagtg atcgagtttg gtttcactcc ttgatacttc 16201 attttcctga atatatcatc cattttctcg attcttccag cttttccaaa cgtctcgatc 16261 actatattgt aagtgacagt ggtcagggag aagaaccttt tctccatgaa ttccataacc 16321 gagcacatct tcttatacat tccagctttt ccaaatgaca ggatcagtat gttaaacgta 16381 gtgatgtctg gctgcactcc catgagctgg aaccgattat accagctctc catcttcttc 16441 gtgtcaccac cattcccata tgacccaatg atcgagttaa gtgtgaaaac atccggaaga 16501 gaatctccat cctcgatcat atcagccaga acattttcca tttcctcaaa cataccagcc 16561 tttccatacc catcaataat agtattgtaa gtaaccgtgc tgcatccaac tccaagatac 16621 gacatctcaa gaacgatact tttaaccaga tcaaaccgac caagtttgca gcaacaactg 16681 atgagaacag taaaggtgaa cacatctggc ttacagtcac tagccgattt catatattca 16741 agcgtggaaa acgccttgtc tagaagtcca cttttgccat aaacagctat aagagatgta 16801 tacacatcaa tggtgggttt taatccttca gacaacatta cttcaaaaag caagctagct 16861 tgatcaggct gcttgcaatt cccaagcact ttaaacagct ttgtgtatgt tttgcatctt 16921 ggttcatacc aatgctgctt cctaagaaga ttgaaaatct ataaagtaga gaaatgggca 16981 aatgaattct attgaacctt atggaaaatt cagtgtaaag agttagaaag gaataaaagg 17041 gggaagtgta ccttcaatgc agactgccat cgattctctt tgatagcttc atcaagtgct 17101 tcaagaacag cttttggcca taaagttaag tacttttcag aattggcttt cctctcgatg 17161 cctttgacag ctgactctgc tctcagaatc cgagacaact ctttcttagg atctactcgg 17221 tgtcttgttg agatcagacc ggatcccatt ttcccagtac cgtcattggg gatttttgtc 17281 gaacatgttg tgggcgttgt tgaaacagag gctacacgcc gagaacaaac cgtggagggt 17341 atatgttgcc gagaaaagca gagttttata ttttcaatgg cgtatgcgga attaatccct 17401 tgaataggat tctgtatcaa ttccatcgaa gagaaatgcg agaaagataa ggggaagacg 17461 acgatgcaac ttcggtgtgt aggaggagga gctagaagac gacacagttg ttcggcttca 17521 tctatttcgg tttagctcga ttgggcgggt tcggttttca aaattaatcg gtttgtctga 17581 tatatagaat ggtatgatgt ggttttggtt ttgaatttta ttatattttc aaaaggtcta 17641 agcttcaatc agttttgttt tttttccaat gttatgtaat ctgaaaaatt agaaaaaacc 17701 aaatgaaaaa ttttctccaa ttttgacttt gttttatcat ttaatattgg actcacttga 17761 atgacaacga accgaaaatt ggaaatgtga cgtgaaccgg aactgaaaaa tggaaaaatg 17821 caagaaagtt atccgcacaa ttaaggacac gtggagccta actgtaggcc acgtggccac 17881 gtgctcatca ctctcctcct agtcgccgcc gtgaacttaa ggtcagacgt atcggccacc 17941 gaccaaatca gacaacaacg aagagtcaaa agatttaatg gatacttcac ttatgtttta 18001 taaaccttcc tgtagtaaac tgtgaagact gtaagaagaa caacacgaat caagtaatcg 18061 aaagtatact tttaatttag agagagagag agagagagag agagagagag agagagagag 18121 agagagagag agagagagag agagagagag agagagagag agagagagag agagagagag 18181 agagagagag agagagagag agagagagag agagagagag agagagagag agagagagag 18241 agagagagag agagagagag agagagagag agagagagat ggagtnnnnn nnnnnnnnnn 18301 nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn 18361 nnnnnnnnnn nnnnnnnnnn nnnnngagag agagagagag agagagagag agagagagag 18421 agagagagat ggagttggag tttaaggagt taaaagaagc aatagaagaa gtagagctcg 18481 ttgatgctca tggacacaac cttgtcgctc ttgactcttc ttttccgttc gtcggaactt 18541 tctccgaggc taacggcgac gcg //