Commit 6f204617 by re

特征工程

parents
# Default ignored files
# Default ignored files
/shelf/
/workspace.xml
# Editor-based HTTP Client requests
/httpRequests/
# Datasource local storage ignored files
/dataSources/
/dataSources.local.xml
<component name="InspectionProjectProfileManager">
<component name="InspectionProjectProfileManager">
<profile version="1.0">
<option name="myName" value="Project Default" />
<inspection_tool class="PyUnresolvedReferencesInspection" enabled="true" level="WARNING" enabled_by_default="true">
<option name="ignoredIdentifiers">
<list>
<option value="tensorflow.compat" />
</list>
</option>
</inspection_tool>
</profile>
</component>
\ No newline at end of file
<component name="InspectionProjectProfileManager">
<component name="InspectionProjectProfileManager">
<settings>
<option name="USE_PROJECT_PROFILE" value="false" />
<version value="1.0" />
</settings>
</component>
\ No newline at end of file
<?xml version="1.0" encoding="UTF-8"?>
<?xml version="1.0" encoding="UTF-8"?>
<project version="4">
<component name="ProjectRootManager" version="2" project-jdk-name="Python 3.11 (GoT2G-F-main) (2)" project-jdk-type="Python SDK" />
</project>
\ No newline at end of file
<?xml version="1.0" encoding="UTF-8"?>
<?xml version="1.0" encoding="UTF-8"?>
<project version="4">
<component name="ProjectModuleManager">
<modules>
<module fileurl="file://$PROJECT_DIR$/.idea/特征工程.iml" filepath="$PROJECT_DIR$/.idea/特征工程.iml" />
</modules>
</component>
</project>
\ No newline at end of file
<?xml version="1.0" encoding="US-ASCII"?>
<?xml version="1.0" encoding="US-ASCII"?>
<!DOCTYPE BlastOutput PUBLIC "-//NCBI//NCBI BlastOutput/EN" "http://www.ncbi.nlm.nih.gov/dtd/NCBI_BlastOutput.dtd">
<BlastOutput>
<BlastOutput_program>blastp</BlastOutput_program>
<BlastOutput_version>BLASTP 2.17.0+</BlastOutput_version>
<BlastOutput_reference>Stephen F. Altschul, Thomas L. Madden, Alejandro A. Sch&amp;auml;ffer, Jinghui Zhang, Zheng Zhang, Webb Miller, and David J. Lipman (1997), &quot;Gapped BLAST and PSI-BLAST: a new generation of protein database search programs&quot;, Nucleic Acids Res. 25:3389-3402.</BlastOutput_reference>
<BlastOutput_db>nr</BlastOutput_db>
<BlastOutput_query-ID>Query_613691</BlastOutput_query-ID>
<BlastOutput_query-def>lcl|1 unnamed protein product</BlastOutput_query-def>
<BlastOutput_query-len>93</BlastOutput_query-len>
<BlastOutput_param>
<Parameters>
<Parameters_matrix>BLOSUM62</Parameters_matrix>
<Parameters_expect>0.05</Parameters_expect>
<Parameters_gap-open>11</Parameters_gap-open>
<Parameters_gap-extend>1</Parameters_gap-extend>
<Parameters_filter>F</Parameters_filter>
</Parameters>
</BlastOutput_param>
<BlastOutput_iterations>
<Iteration>
<Iteration_iter-num>1</Iteration_iter-num>
<Iteration_query-ID>Query_613691</Iteration_query-ID>
<Iteration_query-def>lcl|1 unnamed protein product</Iteration_query-def>
<Iteration_query-len>93</Iteration_query-len>
<Iteration_hits>
<Hit>
<Hit_num>1</Hit_num>
<Hit_id>pdb|7KAE|A</Hit_id>
<Hit_def>Chain A, Regulatory protein rop [Escherichia coli] &gt;pdb|7KAE|B Chain B, Regulatory protein rop [Escherichia coli]</Hit_def>
<Hit_accession>7KAE_A</Hit_accession>
<Hit_len>65</Hit_len>
<Hit_hsps>
<Hsp>
<Hsp_num>1</Hsp_num>
<Hsp_bit-score>53.1434</Hsp_bit-score>
<Hsp_score>126</Hsp_score>
<Hsp_evalue>1.67188e-06</Hsp_evalue>
<Hsp_query-from>1</Hsp_query-from>
<Hsp_query-to>93</Hsp_query-to>
<Hsp_hit-from>1</Hsp_hit-from>
<Hsp_hit-to>65</Hsp_hit-to>
<Hsp_query-frame>0</Hsp_query-frame>
<Hsp_hit-frame>0</Hsp_hit-frame>
<Hsp_identity>41</Hsp_identity>
<Hsp_positive>51</Hsp_positive>
<Hsp_gaps>28</Hsp_gaps>
<Hsp_align-len>93</Hsp_align-len>
<Hsp_qseq>MGHHHHHHGTPEEKQALQMAKQIKQQAQEIQKQTEELLKKVQELLKKLHQLGAPEMAKIAEELHKHAEALKQAAEEFYKHAEELHKAAEARWG</Hsp_qseq>
<Hsp_hseq>MGHHHHHHGTKQEKTALNMARFIQNQ--------------TQTLLEKLNELDADEQADIAESLH--------------DHADELYRSALARWG</Hsp_hseq>
<Hsp_midline>MGHHHHHHGT +EK AL MA+ I+ Q Q LL+KL++L A E A IAE LH HA+EL+++A ARWG</Hsp_midline>
</Hsp>
</Hit_hsps>
</Hit>
<Hit>
<Hit_num>2</Hit_num>
<Hit_id>ref|WP_068840410.1|</Hit_id>
<Hit_def>Rop family plasmid primer RNA-binding protein [Salmonella enterica] &gt;gb|OCT02482.1| hypothetical protein A7B04_25020 [Salmonella enterica subsp. enterica]</Hit_def>
<Hit_accession>WP_068840410</Hit_accession>
<Hit_len>63</Hit_len>
<Hit_hsps>
<Hsp>
<Hsp_num>1</Hsp_num>
<Hsp_bit-score>45.0542</Hsp_bit-score>
<Hsp_score>105</Hsp_score>
<Hsp_evalue>0.00198286</Hsp_evalue>
<Hsp_query-from>10</Hsp_query-from>
<Hsp_query-to>93</Hsp_query-to>
<Hsp_hit-from>2</Hsp_hit-from>
<Hsp_hit-to>57</Hsp_hit-to>
<Hsp_query-frame>0</Hsp_query-frame>
<Hsp_hit-frame>0</Hsp_hit-frame>
<Hsp_identity>30</Hsp_identity>
<Hsp_positive>40</Hsp_positive>
<Hsp_gaps>28</Hsp_gaps>
<Hsp_align-len>84</Hsp_align-len>
<Hsp_qseq>TPEEKQALQMAKQIKQQAQEIQKQTEELLKKVQELLKKLHQLGAPEMAKIAEELHKHAEALKQAAEEFYKHAEELHKAAEARWG</Hsp_qseq>
<Hsp_hseq>TKQEKTALNMARIIKTQ--------------TRTLLKKLNKLDADEQADICESLH--------------DHADELYRSCLARFG</Hsp_hseq>
<Hsp_midline>T +EK AL MA+ IK Q + LLKKL++L A E A I E LH HA+EL+++ AR+G</Hsp_midline>
</Hsp>
</Hit_hsps>
</Hit>
<Hit>
<Hit_num>3</Hit_num>
<Hit_id>ref|WP_105178307.1|</Hit_id>
<Hit_def>Rop family plasmid primer RNA-binding protein [Klebsiella pneumoniae] &gt;gb|PPJ97315.1| Rop family plasmid primer RNA-binding protein [Klebsiella pneumoniae]</Hit_def>
<Hit_accession>WP_105178307</Hit_accession>
<Hit_len>63</Hit_len>
<Hit_hsps>
<Hsp>
<Hsp_num>1</Hsp_num>
<Hsp_bit-score>43.1282</Hsp_bit-score>
<Hsp_score>100</Hsp_score>
<Hsp_evalue>0.0120913</Hsp_evalue>
<Hsp_query-from>10</Hsp_query-from>
<Hsp_query-to>93</Hsp_query-to>
<Hsp_hit-from>2</Hsp_hit-from>
<Hsp_hit-to>57</Hsp_hit-to>
<Hsp_query-frame>0</Hsp_query-frame>
<Hsp_hit-frame>0</Hsp_hit-frame>
<Hsp_identity>29</Hsp_identity>
<Hsp_positive>39</Hsp_positive>
<Hsp_gaps>28</Hsp_gaps>
<Hsp_align-len>84</Hsp_align-len>
<Hsp_qseq>TPEEKQALQMAKQIKQQAQEIQKQTEELLKKVQELLKKLHQLGAPEMAKIAEELHKHAEALKQAAEEFYKHAEELHKAAEARWG</Hsp_qseq>
<Hsp_hseq>TKQEKTALNMARFIRSQ--------------TLTLLEKLHELDADEQADICESLH--------------DHADELYRSCLARFG</Hsp_hseq>
<Hsp_midline>T +EK AL MA+ I+ Q LL+KLH+L A E A I E LH HA+EL+++ AR+G</Hsp_midline>
</Hsp>
</Hit_hsps>
</Hit>
</Iteration_hits>
<Iteration_stat>
<Statistics>
<Statistics_db-num>936828191</Statistics_db-num>
<Statistics_db-len>355460431291</Statistics_db-len>
<Statistics_hsp-len>0</Statistics_hsp-len>
<Statistics_eff-space>0</Statistics_eff-space>
<Statistics_kappa>0.041</Statistics_kappa>
<Statistics_lambda>0.267</Statistics_lambda>
<Statistics_entropy>0.14</Statistics_entropy>
</Statistics>
</Iteration_stat>
</Iteration>
</BlastOutput_iterations>
</BlastOutput>
>9CFS_1|Chains A, B|Long regulatory protein rop|Escherichia coli (562)
>9CFS_1|Chains A, B|Long regulatory protein rop|Escherichia coli (562)
MGHHHHHHGTPEEKQALQMAKQIKQQAQEIQKQTEELLKKVQELLKKLHQLGAPEMAKIAEELHKHAEALKQAAEEFYKHAEELHKAAEARWG
This source diff could not be displayed because it is too large. You can view the blob instead.
Unnamed
Unnamed
Chem3D Core 21.010272417003D
55 57 0 0 0 0 0 0 0 0999 V2000
-5.7857 1.9733 -1.0316 C 0 0 0 0 0 0 0 0 0 0 0 0
-6.0640 0.6117 -0.9700 C 0 0 0 0 0 0 0 0 0 0 0 0
-5.0178 -0.2959 -0.8280 C 0 0 0 0 0 0 0 0 0 0 0 0
-3.6902 0.1696 -0.7480 C 0 0 0 0 0 0 0 0 0 0 0 0
-3.3983 1.5375 -0.8089 C 0 0 0 0 0 0 0 0 0 0 0 0
-4.4620 2.4205 -0.9508 C 0 0 0 0 0 0 0 0 0 0 0 0
-2.5904 -0.6658 -0.6061 C 0 0 0 0 0 0 0 0 0 0 0 0
-1.3187 -0.2308 -0.5289 N 0 0 0 0 0 0 0 0 0 0 0 0
-1.1654 1.0983 -0.5987 C 0 0 0 0 0 0 0 0 0 0 0 0
-2.1444 2.0067 -0.7352 N 0 0 0 0 0 0 0 0 0 0 0 0
-6.7957 2.8660 -1.1697 O 0 0 0 0 0 0 0 0 0 0 0 0
-7.3433 0.1721 -1.0475 O 0 0 0 0 0 0 0 0 0 0 0 0
0.0187 1.5409 -0.5293 N 0 0 0 0 0 0 0 0 0 0 0 0
1.1446 0.6077 -0.3792 C 0 0 0 0 0 0 0 0 0 0 0 0
2.4496 1.3907 -0.3210 C 0 0 0 0 0 0 0 0 0 0 0 0
3.6161 0.4239 -0.1656 C 0 0 0 0 0 0 0 0 0 0 0 0
4.8585 1.1694 -0.1101 N 0 0 0 0 0 0 0 0 0 0 0 0
6.0486 0.5070 0.0284 C 0 0 0 0 0 0 0 0 0 0 0 0
6.0674 -0.9989 0.1233 C 0 0 0 0 0 0 0 0 0 0 0 0
6.7041 -1.4265 1.4400 C 0 0 0 0 0 0 0 0 0 0 0 0
7.9392 -2.2142 0.9971 C 0 0 0 0 0 0 0 0 0 0 0 0
7.5117 -2.6464 -0.3974 C 0 0 0 0 0 0 0 0 0 0 0 0
6.8390 -1.5330 -0.9214 O 0 0 0 0 0 0 0 0 0 0 0 0
7.0837 1.1281 0.0746 O 0 0 0 0 0 0 0 0 0 0 0 0
-8.0339 2.2113 -1.2306 C 0 0 0 0 0 0 0 0 0 0 0 0
-7.3951 -1.2265 -0.9651 C 0 0 0 0 0 0 0 0 0 0 0 0
-2.7961 -1.9135 -0.5456 N 0 0 0 0 0 0 0 0 0 0 0 0
0.2677 2.9880 -0.5986 C 0 0 0 0 0 0 0 0 0 0 0 0
-5.2273 -1.3746 -0.7784 H 0 0 0 0 0 0 0 0 0 0 0 0
-4.2580 3.5003 -1.0009 H 0 0 0 0 0 0 0 0 0 0 0 0
1.0200 0.0249 0.5607 H 0 0 0 0 0 0 0 0 0 0 0 0
1.1680 -0.0879 -1.2478 H 0 0 0 0 0 0 0 0 0 0 0 0
2.5742 1.9736 -1.2610 H 0 0 0 0 0 0 0 0 0 0 0 0
2.4262 2.0863 0.5476 H 0 0 0 0 0 0 0 0 0 0 0 0
3.4915 -0.1589 0.7744 H 0 0 0 0 0 0 0 0 0 0 0 0
3.6394 -0.2717 -1.0341 H 0 0 0 0 0 0 0 0 0 0 0 0
4.8459 2.1793 -0.1737 H 0 0 0 0 0 0 0 0 0 0 0 0
5.0195 -1.3686 0.0605 H 0 0 0 0 0 0 0 0 0 0 0 0
6.0110 -2.0701 2.0266 H 0 0 0 0 0 0 0 0 0 0 0 0
6.9512 -0.5671 2.1027 H 0 0 0 0 0 0 0 0 0 0 0 0
8.8466 -1.5705 0.9665 H 0 0 0 0 0 0 0 0 0 0 0 0
8.2213 -3.0511 1.6744 H 0 0 0 0 0 0 0 0 0 0 0 0
6.8325 -3.5265 -0.3448 H 0 0 0 0 0 0 0 0 0 0 0 0
8.3759 -2.9532 -1.0282 H 0 0 0 0 0 0 0 0 0 0 0 0
-8.8466 2.9634 -1.3438 H 0 0 0 0 0 0 0 0 0 0 0 0
-8.0449 1.5199 -2.1027 H 0 0 0 0 0 0 0 0 0 0 0 0
-8.1932 1.6314 -0.2941 H 0 0 0 0 0 0 0 0 0 0 0 0
-8.4538 -1.5637 -1.0309 H 0 0 0 0 0 0 0 0 0 0 0 0
-6.8126 -1.6689 -1.8040 H 0 0 0 0 0 0 0 0 0 0 0 0
-6.9602 -1.5572 0.0046 H 0 0 0 0 0 0 0 0 0 0 0 0
-3.7756 -2.2875 -0.6027 H 0 0 0 0 0 0 0 0 0 0 0 0
-1.9872 -2.5744 -0.4384 H 0 0 0 0 0 0 0 0 0 0 0 0
-0.6998 3.5265 -0.7112 H 0 0 0 0 0 0 0 0 0 0 0 0
0.7713 3.3225 0.3359 H 0 0 0 0 0 0 0 0 0 0 0 0
0.9199 3.2106 -1.4726 H 0 0 0 0 0 0 0 0 0 0 0 0
1 2 2 0
1 6 1 0
1 11 1 0
3 2 1 0
2 12 1 0
4 3 2 0
3 29 1 0
5 4 1 0
7 4 1 0
6 5 2 0
5 10 1 0
6 30 1 0
8 7 2 0
7 27 1 0
9 8 1 0
10 9 2 0
9 13 1 0
11 25 1 0
12 26 1 0
13 14 1 0
13 28 1 0
14 15 1 0
14 31 1 0
14 32 1 0
15 16 1 0
15 33 1 0
15 34 1 0
16 17 1 0
16 35 1 0
16 36 1 0
17 18 1 0
17 37 1 0
18 19 1 0
18 24 2 0
19 20 1 0
23 19 1 0
19 38 1 0
20 21 1 0
20 39 1 0
20 40 1 0
21 22 1 0
21 41 1 0
21 42 1 0
23 22 1 0
22 43 1 0
22 44 1 0
25 45 1 0
25 46 1 0
25 47 1 0
26 48 1 0
26 49 1 0
26 50 1 0
27 51 1 0
27 52 1 0
28 53 1 0
28 54 1 0
28 55 1 0
M END
$$$$
++ "a/\347\211\271\345\276\201\345\267\245\347\250\213/__init__.py"
This source diff could not be displayed because it is too large. You can view the blob instead.
<?xml version="1.0" encoding="US-ASCII"?>
<?xml version="1.0" encoding="US-ASCII"?>
<!DOCTYPE BlastOutput PUBLIC "-//NCBI//NCBI BlastOutput/EN" "http://www.ncbi.nlm.nih.gov/dtd/NCBI_BlastOutput.dtd">
<BlastOutput>
<BlastOutput_program>blastp</BlastOutput_program>
<BlastOutput_version>BLASTP 2.17.0+</BlastOutput_version>
<BlastOutput_reference>Stephen F. Altschul, Thomas L. Madden, Alejandro A. Sch&amp;auml;ffer, Jinghui Zhang, Zheng Zhang, Webb Miller, and David J. Lipman (1997), &quot;Gapped BLAST and PSI-BLAST: a new generation of protein database search programs&quot;, Nucleic Acids Res. 25:3389-3402.</BlastOutput_reference>
<BlastOutput_db>nt</BlastOutput_db>
<BlastOutput_query-ID>Query_3881555</BlastOutput_query-ID>
<BlastOutput_query-def>unnamed protein product</BlastOutput_query-def>
<BlastOutput_query-len>93</BlastOutput_query-len>
<BlastOutput_param>
<Parameters>
<Parameters_matrix>BLOSUM62</Parameters_matrix>
<Parameters_expect>10</Parameters_expect>
<Parameters_gap-open>11</Parameters_gap-open>
<Parameters_gap-extend>1</Parameters_gap-extend>
<Parameters_filter>F</Parameters_filter>
</Parameters>
</BlastOutput_param>
<BlastOutput_iterations>
<Iteration>
<Iteration_iter-num>1</Iteration_iter-num>
<Iteration_query-ID>Query_3881555</Iteration_query-ID>
<Iteration_query-def>unnamed protein product</Iteration_query-def>
<Iteration_query-len>93</Iteration_query-len>
<Iteration_hits>
</Iteration_hits>
<Iteration_stat>
<Statistics>
<Statistics_db-num>0</Statistics_db-num>
<Statistics_db-len>0</Statistics_db-len>
<Statistics_hsp-len>0</Statistics_hsp-len>
<Statistics_eff-space>0</Statistics_eff-space>
<Statistics_kappa>-1</Statistics_kappa>
<Statistics_lambda>-1</Statistics_lambda>
<Statistics_entropy>-1</Statistics_entropy>
</Statistics>
</Iteration_stat>
</Iteration>
</BlastOutput_iterations>
</BlastOutput>
LOCUS NC_000913 4641652 bp DNA circular CON 09-MAR-2022
LOCUS NC_000913 4641652 bp DNA circular CON 09-MAR-2022
DEFINITION Escherichia coli str. K-12 substr. MG1655, complete genome.
ACCESSION NC_000913
VERSION NC_000913.3
DBLINK BioProject: PRJNA57779
BioSample: SAMN02604091
KEYWORDS RefSeq.
SOURCE Escherichia coli str. K-12 substr. MG1655
ORGANISM Escherichia coli str. K-12 substr. MG1655
Bacteria; Pseudomonadati; Pseudomonadota; Gammaproteobacteria;
Enterobacterales; Enterobacteriaceae; Escherichia.
REFERENCE 1 (bases 1 to 4641652)
AUTHORS Riley,M., Abe,T., Arnaud,M.B., Berlyn,M.K., Blattner,F.R.,
Chaudhuri,R.R., Glasner,J.D., Horiuchi,T., Keseler,I.M., Kosuge,T.,
Mori,H., Perna,N.T., Plunkett,G. III, Rudd,K.E., Serres,M.H.,
Thomas,G.H., Thomson,N.R., Wishart,D. and Wanner,B.L.
TITLE Escherichia coli K-12: a cooperatively developed annotation
snapshot--2005
JOURNAL Nucleic Acids Res. 34 (1), 1-9 (2006)
PUBMED 16397293
REMARK Publication Status: Online-Only
REFERENCE 2 (bases 1 to 4641652)
AUTHORS Hayashi,K., Morooka,N., Yamamoto,Y., Fujita,K., Isono,K., Choi,S.,
Ohtsubo,E., Baba,T., Wanner,B.L., Mori,H. and Horiuchi,T.
TITLE Highly accurate genome sequences of Escherichia coli K-12 strains
MG1655 and W3110
JOURNAL Mol. Syst. Biol. 2, 2006 (2006)
PUBMED 16738553
REFERENCE 3 (bases 1 to 4641652)
AUTHORS Blattner,F.R., Plunkett,G. III, Bloch,C.A., Perna,N.T., Burland,V.,
Riley,M., Collado-Vides,J., Glasner,J.D., Rode,C.K., Mayhew,G.F.,
Gregor,J., Davis,N.W., Kirkpatrick,H.A., Goeden,M.A., Rose,D.J.,
Mau,B. and Shao,Y.
TITLE The complete genome sequence of Escherichia coli K-12
JOURNAL Science 277 (5331), 1453-1462 (1997)
PUBMED 9278503
REFERENCE 4 (bases 1 to 4641652)
AUTHORS Arnaud,M., Berlyn,M.K.B., Blattner,F.R., Galperin,M.Y.,
Glasner,J.D., Horiuchi,T., Kosuge,T., Mori,H., Perna,N.T.,
Plunkett,G. III, Riley,M., Rudd,K.E., Serres,M.H., Thomas,G.H. and
Wanner,B.L.
TITLE Workshop on Annotation of Escherichia coli K-12
JOURNAL Unpublished
REMARK Woods Hole, Mass., on 14-18 November 2003 (sequence corrections)
REFERENCE 5 (bases 1 to 4641652)
AUTHORS Glasner,J.D., Perna,N.T., Plunkett,G. III, Anderson,B.D.,
Bockhorst,J., Hu,J.C., Riley,M., Rudd,K.E. and Serres,M.H.
TITLE ASAP: Escherichia coli K-12 strain MG1655 version m56
JOURNAL Unpublished
REMARK ASAP download 10 June 2004 (annotation updates)
REFERENCE 6 (bases 1 to 4641652)
AUTHORS Hayashi,K., Morooka,N., Mori,H. and Horiuchi,T.
TITLE A more accurate sequence comparison between genomes of Escherichia
coli K12 W3110 and MG1655 strains
JOURNAL Unpublished
REMARK GenBank accessions AG613214 to AG613378 (sequence corrections)
REFERENCE 7 (bases 1 to 4641652)
AUTHORS Perna,N.T.
TITLE Escherichia coli K-12 MG1655 yqiK-rfaE intergenic region, genomic
sequence correction
JOURNAL Unpublished
REMARK GenBank accession AY605712 (sequence corrections)
REFERENCE 8 (bases 1 to 4641652)
AUTHORS Rudd,K.E.
TITLE A manual approach to accurate translation start site annotation: an
E. coli K-12 case study
JOURNAL Unpublished
REFERENCE 9 (bases 1 to 4641652)
CONSRTM NCBI Genome Project
TITLE Direct Submission
JOURNAL Submitted (08-MAR-2022) National Center for Biotechnology
Information, NIH, Bethesda, MD 20894, USA
REFERENCE 10 (bases 1 to 4641652)
AUTHORS Blattner,F.R. and Plunkett,G. III.
TITLE Direct Submission
JOURNAL Submitted (30-JUL-2014) Laboratory of Genetics, University of
Wisconsin, 425G Henry Mall, Madison, WI 53706-1580, USA
REMARK Protein update by submitter
REFERENCE 11 (bases 1 to 4641652)
AUTHORS Blattner,F.R. and Plunkett,G. III.
TITLE Direct Submission
JOURNAL Submitted (15-NOV-2013) Laboratory of Genetics, University of
Wisconsin, 425G Henry Mall, Madison, WI 53706-1580, USA
REMARK Protein update by submitter
REFERENCE 12 (bases 1 to 4641652)
AUTHORS Blattner,F.R. and Plunkett,G. III.
TITLE Direct Submission
JOURNAL Submitted (26-SEP-2013) Laboratory of Genetics, University of
Wisconsin, 425G Henry Mall, Madison, WI 53706-1580, USA
REMARK Sequence update by submitter
REFERENCE 13 (bases 1 to 4641652)
AUTHORS Rudd,K.E.
TITLE Direct Submission
JOURNAL Submitted (06-FEB-2013) Department of Biochemistry and Molecular
Biology, University of Miami Miller School of Medicine, 118 Gautier
Bldg., Miami, FL 33136, USA
REMARK Sequence update by submitter
REFERENCE 14 (bases 1 to 4641652)
AUTHORS Rudd,K.E.
TITLE Direct Submission
JOURNAL Submitted (24-APR-2007) Department of Biochemistry and Molecular
Biology, University of Miami Miller School of Medicine, 118 Gautier
Bldg., Miami, FL 33136, USA
REMARK Annotation update from ecogene.org as a multi-database collaboration
REFERENCE 15 (bases 1 to 4641652)
AUTHORS Plunkett,G. III.
TITLE Direct Submission
JOURNAL Submitted (07-FEB-2006) Laboratory of Genetics, University of
Wisconsin, 425G Henry Mall, Madison, WI 53706-1580, USA
REMARK Protein updates by submitter
REFERENCE 16 (bases 1 to 4641652)
AUTHORS Plunkett,G. III.
TITLE Direct Submission
JOURNAL Submitted (10-JUN-2004) Laboratory of Genetics, University of
Wisconsin, 425G Henry Mall, Madison, WI 53706-1580, USA
REMARK Sequence update by submitter
REFERENCE 17 (bases 1 to 4641652)
AUTHORS Plunkett,G. III.
TITLE Direct Submission
JOURNAL Submitted (13-OCT-1998) Laboratory of Genetics, University of
Wisconsin, 425G Henry Mall, Madison, WI 53706-1580, USA
REFERENCE 18 (bases 1 to 4641652)
AUTHORS Blattner,F.R. and Plunkett,G. III.
TITLE Direct Submission
JOURNAL Submitted (02-SEP-1997) Laboratory of Genetics, University of
Wisconsin, 425G Henry Mall, Madison, WI 53706-1580, USA
REFERENCE 19 (bases 1 to 4641652)
AUTHORS Blattner,F.R. and Plunkett,G. III.
TITLE Direct Submission
JOURNAL Submitted (16-JAN-1997) Laboratory of Genetics, University of
Wisconsin, 425G Henry Mall, Madison, WI 53706-1580, USA
COMMENT PROVISIONAL REFSEQ: This record has not yet been subject to final
NCBI review. The reference sequence is identical to U00096.
On Nov 3, 2013 this sequence version replaced NC_000913.2.
Changes to proteins and annotation made on March 7, 2022. Current
U00096 annotation updates are derived from EcoCyc
https://ecocyc.org/. Suggestions for updates can be sent to
biocyc-support@ai.sri.com. These updates are being generated from a
collaboration that includes EcoCyc, the University of Wisconsin,
UniProtKB/Swiss-Prot, and the National Center for Biotechnology
Information (NCBI).
COMPLETENESS: full length.
FEATURES Location/Qualifiers
source 1..4641652
/organism="Escherichia coli str. K-12 substr. MG1655"
/mol_type="genomic DNA"
/strain="K-12"
/sub_strain="MG1655"
/db_xref="taxon:511145"
CONTIG join(U00096.3:1..4641652)
//
This source diff could not be displayed because it is too large. You can view the blob instead.
This source diff could not be displayed because it is too large. You can view the blob instead.
This source diff could not be displayed because it is too large. You can view the blob instead.
>seq1 first
>seq1 first
ATGCGA
>seq2 second
GGGCCC
>9CFS_1|Chains A, B|Long regulatory protein rop|Escherichia coli (562)
>9CFS_1|Chains A, B|Long regulatory protein rop|Escherichia coli (562)
MGHHHHHHGTPEEKQALQMAKQIKQQAQEIQKQTEELLKKVQELLKKLHQLGAPEMAKIA
EELHKHAEALKQAAEEFYKHAEELHKAAEARWG
>gene1
>gene1
ATGGCCATTGTAATGGGCCGCTGAAAGGGTGCCCGATAG
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment