test_SProt

testing sp001...
*Using SequenceParser
Q13454
N33_HUMAN
N33 PROTEIN.
Seq('MGARGAPSRRRQAGRRLRYLPTGSFPFLLLLLLLCIQLGGGQKKKENLLAEKVE...DFE', ProteinAlphabet())
*Using RecordParser
N33_HUMAN
['Q13454', 'Q14911', 'Q14912']
['Eukaryota', 'Metazoa', 'Chordata', 'Craniata', 'Vertebrata', 'Mammalia', 'Eutheria', 'Primates', 'Catarrhini', 'Hominidae', 'Homo']
(348, 39676, '75818910')
***Features:
('TRANSMEM', 20, 40, 'POTENTIAL.', '')
('TRANSMEM', 197, 217, 'POTENTIAL.', '')
('TRANSMEM', 222, 242, 'POTENTIAL.', '')
('TRANSMEM', 277, 297, 'POTENTIAL.', '')
('TRANSMEM', 313, 333, 'POTENTIAL.', '')
('VARSPLIC', 344, 348, 'DLDFE -> FLIK (IN FORM 2).', '')
***References:
authors: MACGROGAN D., LEVY A., BOVA G.S., ISAACS W.B., BOOKSTEIN R.;
title: "Structure and methylation-associated silencing of a gene within a
homozygously deleted region of human chromosome band 8p22.";
references: [('MEDLINE', '96299740')]

testing sp002...
*Using SequenceParser
P54101
CSP_MOUSE
CYSTEINE STRING PROTEIN (CSP).
Seq('MADQRQRSLSTSGESLYHVLGLDKNATSDDIKKSYRKLALKYHPDKNPDNPEAA...GFN', ProteinAlphabet())
*Using RecordParser
CSP_MOUSE
['P54101']
['Eukaryota', 'Metazoa', 'Chordata', 'Craniata', 'Vertebrata', 'Mammalia', 'Eutheria', 'Rodentia', 'Sciurognathi', 'Muridae', 'Murinae', 'Mus']
(198, 22100, '9DF0142B')
***Features:
('DOMAIN', 13, 82, 'DNAJ-LIKE.', '')
('DOMAIN', 118, 128, 'POLY-CYS.', '')
***References:
authors: QIN N., LIN T., BIRNBAUMER L.;
title: 
references: []
authors: MASTROGIACOMO A., GUNDERSEN C.B.;
title: "The nucleotide and deduced amino acid sequence of a rat cysteine
string protein.";
references: [('MEDLINE', '95223109')]
authors: BRAUN J.E., SCHELLER R.H.;
title: "Cysteine string protein, a DnaJ family member, is present on diverse
secretory vesicles.";
references: [('MEDLINE', '96188189')]

testing sp003...
*Using SequenceParser
P42655
143E_HUMAN
14-3-3 PROTEIN EPSILON (MITOCHONDRIAL IMPORT STIMULATION FACTOR L
SUBUNIT) (PROTEIN KINASE C INHIBITOR PROTEIN-1) (KCIP-1) (14-3-3E).
Seq('MDDREDLVYQAKLAEQAERYDEMVESMKKVAGMDVELTVEERNLLSVAYKNVIG...ENQ', ProteinAlphabet())
*Using RecordParser
143E_HUMAN
['P42655', 'P29360', 'Q63631']
['EUKARYOTA', 'METAZOA', 'CHORDATA', 'VERTEBRATA', 'MAMMALIA', 'EUTHERIA', 'PRIMATES', 'CATARRHINI', 'HOMINIDAE', 'HOMO']
(255, 29174, '40A43E62')
***Features:
('MOD_RES', 1, 1, 'ACETYLATION.', '')
('CONFLICT', 73, 73, 'K -> T (IN REF. 8).', '')
('CONFLICT', 120, 120, 'F -> S (IN REF. 8).', '')
('CONFLICT', 123, 123, 'K -> Y (IN REF. 8).', '')
('CONFLICT', 129, 129, 'H -> Y (IN REF. 13).', '')
***References:
authors: CONKLIN D.S., GALAKTIONOV K., BEACH D.;
title: "14-3-3 proteins associate with cdc25 phosphatases.";
references: [('MEDLINE', '95372385')]
authors: LUK S.C.W., LEE C.Y., WAYE M.M.Y.;
title: 
references: []
authors: JIN D.Y., LYU M.S., KOZAK C.A., JEANG K.T.;
title: "Function of 14-3-3 proteins.";
references: [('MEDLINE', '96300316')]
authors: CHONG S.S., TANIGAMI A., ROSCHKE A.V., LEDBETTER D.H.;
title: "14-3-3 epsilon has no homology to LIS1 and lies telomeric to it on
chromosome 17p13.3 outside the Miller-Dieker syndrome chromosome
region.";
references: [('MEDLINE', '97011338')]
authors: TANIGAMI A., CHONG S.S., LEDBETTER D.H.;
title: "14-3-3 epsilon genomic sequence.";
references: []
authors: ROSEBOOM P.H., WELLER J.L., BABILA T., AITKEN A., SELLERS L.A.,
MOFFET J.R., NAMBOODIRI M.A., KLEIN D.C.;
title: "Cloning and characterization of the epsilon and zeta isoforms of the
14-3-3 proteins.";
references: [('MEDLINE', '94296566')]
authors: ALAM R., HACHIYA N., SAKAGUCHI M., SHUN-ICHIRO K., IWANAGA S.,
KITAJIMA M., MIHARA K., OMURA T.;
title: "cDNA cloning and characterization of mitochondrial import
stimulation factor (MSF) purified from rat liver cytosol.";
references: [('MEDLINE', '95122474')]
authors: GAO L., GU X.B., YU D.S., YU R.K., ZENG G.;
title: "Association of a 14-3-3 protein with CMP-NeuAc:GM1 alpha 2,3-
sialyltransferase.";
references: [('MEDLINE', '96280718')]
authors: MCCONNELL J.E., ARMSTRONG J.F., BARD J.B.;
title: "The mouse 14-3-3 epsilon isoform, a kinase regulator whose
expression pattern is modulated in mesenchyme and neuronal
differentiation.";
references: [('MEDLINE', '95269876')]
authors: TAKIHARA Y., IRIE K., NOMURA M., MOTALEB M., MATSUMOTO K.,
SHIMADA K.;
title: 
references: []
authors: JONES J.M., NIIKURA T., PINKE R.M., GUO W., MOLDAY L., LEYKAM J.,
MCCONNELL D.G.;
title: "Expression of 14-3-3 proteins in bovine retinal photoreceptors.";
references: []
authors: TOKER A., SELLERS L.A., AMESS B., PATEL Y., HARRIS A., AITKEN A.;
title: "Multiple isoforms of a protein kinase C inhibitor (KCIP-1/14-3-3)
from sheep brain. Amino acid sequence of phosphorylated forms.";
references: [('MEDLINE', '92283271')]
authors: TOKER A., ELLIS C.A., SELLERS L.A., AITKEN A.;
title: "Protein kinase C inhibitor proteins. Purification from sheep brain
and sequence similarity to lipocortins and 14-3-3 protein.";
references: [('MEDLINE', '90345949')]

testing sp004...
*Using SequenceParser
P23082
NDOA_PSEPU
NAPHTHALENE 1,2-DIOXYGENASE SYSTEM FERREDOXIN COMPONENT.
Seq('TVKWIEAVALSDILEGDVLGVTVEGKELALYEVEGEIYATDNLCTHGSARMSDG...DLS', ProteinAlphabet())
*Using RecordParser
NDOA_PSEPU
['P23082', 'Q52123', 'O07829']
['Bacteria', 'Proteobacteria', 'gamma subdivision', 'Pseudomonas group', 'Pseudomonas']
(103, 11315, '9F91B3C8')
***Features:
('INIT_MET', 0, 0, '', '')
('METAL', 44, 44, 'IRON-SULFUR (2FE-2S) (POTENTIAL).', '')
('METAL', 46, 46, 'IRON-SULFUR (2FE-2S) (POTENTIAL).', '')
('METAL', 63, 63, 'IRON-SULFUR (2FE-2S) (POTENTIAL).', '')
('METAL', 66, 66, 'IRON-SULFUR (2FE-2S) (POTENTIAL).', '')
('VARIANT', 2, 2, 'V -> E (IN STRAIN G7).', '')
('VARIANT', 14, 14, 'L -> P (IN STRAIN G7).', '')
('VARIANT', 48, 48, 'S -> A (IN STRAIN G7).', '')
('VARIANT', 76, 76, 'K -> R (IN STRAIN G7).', '')
('VARIANT', 84, 84, 'Q -> E (IN STRAIN G7).', '')
('VARIANT', 90, 90, 'P -> A (IN STRAIN G7).', '')
('VARIANT', 103, 103, 'S -> GEF (IN STRAIN G7).', '')
***References:
authors: KURKELA S., LEHVAESLAIHO H., PALVA E.T., TEERI T.H.;
title: "Cloning, nucleotide sequence and characterization of genes encoding
naphthalene dioxygenase of Pseudomonas putida strain NCIB9816.";
references: [('MEDLINE', '89211973')]
authors: SIMON M.J., OSSLUND T.D., SAUNDERS R., ENSLEY B.D., SUGGS S.,
HARCOURT A.A., SUEN W.-C., CRUDEN D.L., GIBSON D.T., ZYLSTRA G.J.;
title: "Sequences of genes encoding naphthalene dioxygenase in Pseudomonas
putida strains G7 and NCIB 9816-4.";
references: [('MEDLINE', '93252277')]
authors: DENOME S.A., STANLEY D.C., OLSON E.S., YOUNG K.D.;
title: "Metabolism of dibenzothiophene and naphthalene in Pseudomonas
strains: complete DNA sequence of an upper naphthalene catabolic
pathway.";
references: [('MEDLINE', '94042852')]
authors: HAMANN C.;
title: 
references: []

testing sp005...
*Using SequenceParser
P24973
NU3M_BALPH
NADH-UBIQUINONE OXIDOREDUCTASE CHAIN 3 (EC 1.6.5.3).
Seq('MNLLLTLLTNTTLALLLVFIAFWLPQLNVYAEKTSPYECGFDPMGSARLPFSMK...WAE', ProteinAlphabet())
*Using RecordParser
NU3M_BALPH
['P24973']
['Eukaryota', 'Metazoa', 'Chordata', 'Craniata', 'Vertebrata', 'Mammalia', 'Eutheria', 'Cetartiodactyla', 'Cetacea', 'Mysticeti', 'Balaenopteridae', 'Balaenoptera']
(115, 13022, 'ACF02965')
***Features:
***References:
authors: ARNASON U., GULLBERG A., WIDEGREN B.;
title: "The complete nucleotide sequence of the mitochondrial DNA of the fin
whale, Balaenoptera physalus.";
references: [('MEDLINE', '92139449')]
authors: ARNASON U., GULLBERG A.;
title: "Comparison between the complete mtDNA sequences of the blue and the
fin whale, two species that can hybridize in nature.";
references: [('MEDLINE', '94141932')]

testing sp006...
*Using SequenceParser
P39896
TCMO_STRGA
TETRACENOMYCIN POLYKETIDE SYNTHESIS 8-O-METHYL TRANSFERASE TCMO
(EC 2.1.1.-).
Seq('MTPHTHVRGPGDILQLTMAFYGSRALISAVELDLFTLLAGKPLPLGELCERAGI...KPR', ProteinAlphabet())
*Using RecordParser
TCMO_STRGA
['P39896']
['BACTERIA', 'FIRMICUTES', 'ACTINOBACTERIA', 'ACTINOBACTERIDAE', 'ACTINOMYCETALES', 'STREPTOMYCINEAE', 'STREPTOMYCETACEAE', 'STREPTOMYCES']
(339, 37035, '848B7337')
***Features:
***References:
authors: SUMMERS R.G., WENDT-PIENKOWSKI E., MOTAMEDI H., HUTCHINSON C.R.;
title: "Nucleotide sequence of the tcmII-tcmIV region of the tetracenomycin
C biosynthetic gene cluster of Streptomyces glaucescens and evidence
that the tcmN gene encodes a multifunctional
cyclase-dehydratase-O-methyl transferase.";
references: [('MEDLINE', '92193265')]

testing sp007...
*Using SequenceParser
O95832
CLD1_HUMAN
CLAUDIN-1 (SENESCENCE-ASSOCIATED EPITHELIAL MEMBRANE PROTEIN).
Seq('MANAGLQLLGFILAFLGWIGAIVSTALPQWRIYSYAGDNIVTAQAMYEGLWMSC...DYV', ProteinAlphabet())
*Using RecordParser
CLD1_HUMAN
['O95832']
['Eukaryota', 'Metazoa', 'Chordata', 'Craniata', 'Vertebrata', 'Mammalia', 'Eutheria', 'Primates', 'Catarrhini', 'Hominidae', 'Homo']
(211, 22744, '07269000E6C214F0')
***Features:
('TRANSMEM', 8, 28, 'POTENTIAL.', '')
('TRANSMEM', 82, 102, 'POTENTIAL.', '')
('TRANSMEM', 116, 136, 'POTENTIAL.', '')
('TRANSMEM', 164, 184, 'POTENTIAL.', '')
('CONFLICT', 62, 62, 'I -> V (IN REF. 2).', '')
('CONFLICT', 135, 135, 'V -> A (IN REF. 2).', '')
***References:
authors: Swisshelm K.L., Machl A., Planitzer S., Robertson R., Kubbies M.,
Hosier S.;
title: "SEMP1, a senescence-associated cDNA isolated from human mammary
epithelial cells, is a member of an epithelial membrane protein
superfamily.";
references: [('MEDLINE', '99132301')]
authors: Mitic L.M., Anderson J.M.;
title: "Human claudin-1 isolated from Caco-2 mRNA.";
references: []

testing sp008...
*Using SequenceParser
P01892
1A02_HUMAN
HLA CLASS I HISTOCOMPATIBILITY ANTIGEN, A-2 ALPHA CHAIN PRECURSOR.
Seq('MAVMAPRTLVLLLSGALALTQTWAGSHSMRYFFTSVSRPGRGEPRFIAVGYVDD...CKV', ProteinAlphabet())
*Using RecordParser
1A02_HUMAN
['P01892', 'P06338', 'P30514', 'P30444', 'P30445', 'P30446', 'Q29680', 'Q29899', 'Q95352', 'Q29837', 'Q95380']
['Eukaryota', 'Metazoa', 'Chordata', 'Craniata', 'Vertebrata', 'Mammalia', 'Eutheria', 'Primates', 'Catarrhini', 'Hominidae', 'Homo']
(365, 40922, 'B54A97B24B337C08')
***Features:
('SIGNAL', 1, 24, '', '')
('CHAIN', 25, 365, 'HLA CLASS I HISTOCOMPATIBILITY ANTIGEN, A-2 ALPHA CHAIN.', '')
('DOMAIN', 25, 114, 'EXTRACELLULAR ALPHA-1.', '')
('DOMAIN', 115, 206, 'EXTRACELLULAR ALPHA-2.', '')
('DOMAIN', 207, 298, 'EXTRACELLULAR ALPHA-3.', '')
('DOMAIN', 299, 308, 'CONNECTING PEPTIDE.', '')
('TRANSMEM', 309, 332, '', '')
('DOMAIN', 333, 365, 'CYTOPLASMIC TAIL.', '')
('CARBOHYD', 110, 110, '', '')
('DISULFID', 125, 188, '', '')
('DISULFID', 227, 283, '', '')
('STRAND', 27, 36, '', '')
('STRAND', 45, 52, '', '')
('TURN', 53, 54, '', '')
('STRAND', 55, 61, '', '')
('TURN', 62, 63, '', '')
('STRAND', 70, 71, '', '')
('HELIX', 74, 76, '', '')
('TURN', 77, 78, '', '')
('HELIX', 81, 108, '', '')
('TURN', 109, 110, '', '')
('TURN', 113, 114, '', '')
('STRAND', 118, 127, '', '')
('TURN', 129, 130, '', '')
('STRAND', 133, 142, '', '')
('TURN', 143, 144, '', '')
('STRAND', 145, 150, '', '')
('TURN', 152, 153, '', '')
('STRAND', 157, 159, '', '')
('TURN', 163, 163, '', '')
('HELIX', 164, 173, '', '')
('TURN', 174, 175, '', '')
('HELIX', 176, 185, '', '')
('TURN', 186, 186, '', '')
('HELIX', 187, 198, '', '')
('TURN', 199, 199, '', '')
('HELIX', 200, 203, '', '')
('TURN', 204, 204, '', '')
('STRAND', 207, 207, '', '')
('STRAND', 210, 219, '', '')
('TURN', 220, 221, '', '')
('STRAND', 222, 233, '', '')
('STRAND', 238, 243, '', '')
('TURN', 244, 245, '', '')
('STRAND', 246, 247, '', '')
('HELIX', 249, 251, '', '')
('STRAND', 253, 254, '', '')
('STRAND', 258, 259, '', '')
('STRAND', 265, 274, '', '')
('TURN', 275, 276, '', '')
('HELIX', 278, 280, '', '')
('STRAND', 281, 286, '', '')
('TURN', 288, 289, '', '')
('STRAND', 294, 297, '', '')
('VARIANT', 33, 33, 'F -> Y (IN A*0205, A*0206, A*0208, A*0210 AND A*0221). /FTId=VAR_004334.', 'VAR_004334')
('VARIANT', 54, 54, 'D -> N (IN A*0221). /FTId=VAR_004335.', 'VAR_004335')
('VARIANT', 67, 67, 'Q -> R (IN A*0202, A*0205, AND A*0208). /FTId=VAR_004336.', 'VAR_004336')
('VARIANT', 90, 90, 'K -> N (IN A*0208 AND A*0220). /FTId=VAR_004337.', 'VAR_004337')
('VARIANT', 97, 98, 'TH -> ID (IN A*0211). /FTId=VAR_004338.', 'VAR_004338')
('VARIANT', 119, 119, 'V -> L (IN A*0202, A*0205, A*0208 AND A*0217). /FTId=VAR_004339.', 'VAR_004339')
('VARIANT', 121, 121, 'R -> M (IN A*0204 AND A*0217). /FTId=VAR_004340.', 'VAR_004340')
('VARIANT', 123, 123, 'Y -> C (IN A*0207 AND A*0218). /FTId=VAR_004341.', 'VAR_004341')
('VARIANT', 123, 123, 'Y -> F (IN A*0210 AND A*0217). /FTId=VAR_004342.', 'VAR_004342')
('VARIANT', 131, 131, 'W -> G (IN A*0210). /FTId=VAR_004343.', 'VAR_004343')
('VARIANT', 162, 162, 'M -> K (IN A*0218). /FTId=VAR_004344.', 'VAR_004344')
('VARIANT', 173, 173, 'A -> T (IN A*0203). /FTId=VAR_004345.', 'VAR_004345')
('VARIANT', 176, 176, 'V -> E (IN A*0203 AND A*0213). /FTId=VAR_004346.', 'VAR_004346')
('VARIANT', 180, 180, 'L -> W (IN A*0202, A*0203, A*0205 AND A*0208). /FTId=VAR_004347.', 'VAR_004347')
('VARIANT', 180, 180, 'L -> Q (IN A*0212 AND A*0213). /FTId=VAR_004348.', 'VAR_004348')
('VARIANT', 187, 187, 'T -> E (IN A*0216). /FTId=VAR_004349.', 'VAR_004349')
('VARIANT', 260, 260, 'A -> E (IN A*0209). /FTId=VAR_004350.', 'VAR_004350')
***References:
authors: Koller B.H., Orr H.T.;
title: "Cloning and complete sequence of an HLA-A2 gene: analysis of two
HLA-A alleles at the nucleotide level.";
references: [('MEDLINE', '85132727')]
authors: Cianetti L., Testa U., Scotto L., la Valle R., Simeone A.,
Boccoli G., Giannella G., Peschle C., Boncinelli E.;
title: "Three new class I HLA alleles: structure of mRNAs and alternative
mechanisms of processing.";
references: [('MEDLINE', '89122144')]
authors: Ennis P.D., Zemmour J., Salter R.D., Parham P.;
title: "Rapid cloning of HLA-A,B cDNA by using the polymerase chain
reaction: frequency and nature of errors produced in amplification.";
references: [('MEDLINE', '90207291')]
authors: Belich M.P., Madrigal J.A., Hildebrand W.H., Zemmour J.,
Williams R.C., Luz R., Petzl-Erler M.L., Parham P.;
title: "Unusual HLA-B alleles in two tribes of Brazilian Indians.";
references: [('MEDLINE', '92269955')]
authors: Krangel M.S.;
title: "Unusual RNA splicing generates a secreted form of HLA-A2 in a
mutagenized B lymphoblastoid cell line.";
references: [('MEDLINE', '85230571')]
authors: Orr H.T., Lopez de Castro J.A., Parham P., Ploegh H.L.,
Strominger J.L.;
title: "Comparison of amino acid sequences of two human histocompatibility
antigens, HLA-A2 and HLA-B7: location of putative alloantigenic
sites.";
references: [('MEDLINE', '80056745')]
authors: Lopez de Castro J.A., Strominger J.L., Strong D.M., Orr H.T.;
title: "Structure of crossreactive human histocompatibility antigens HLA-A28
and HLA-A2: possible implications for the generation of HLA
polymorphism.";
references: [('MEDLINE', '82247941')]
authors: Mattson D.H., Handy D.E., Bradley D.A., Coligan J.E., Cowan E.P.,
Biddison W.E.;
title: "DNA sequences of the genes that encode the CTL-defined HLA-A2
variants M7 and DK1.";
references: [('MEDLINE', '87306734')]
authors: Holmes N., Ennis P., Wan A.M., Denney D.W., Parham P.;
title: "Multiple genetic mechanisms have contributed to the generation of
the HLA-A2/A28 family of class I MHC molecules.";
references: [('MEDLINE', '87252273')]
authors: Domena J.D.;
title: 
references: []
authors: Castano A.R., Lopez de Castro J.A.;
title: "Structure of the HLA-A*0204 antigen, found in South American
Indians. Spatial clustering of HLA-A2 subtype polymorphism.";
references: [('MEDLINE', '92039809')]
authors: Watkins D.I., McAdam S.N., Liu X., Stang C.R., Milford E.L.,
Levine C.G., Garber T.L., Dogon A.L., Lord C.I., Ghim S.H.,
Troup G.M., Hughes A.L., Letvin N.L.;
title: "New recombinant HLA-B alleles in a tribe of South American
Amerindians indicate rapid evolution of MHC class I loci.";
references: [('MEDLINE', '92269956')]
authors: Parham P., Lawlor D.A., Lomen C.E., Ennis P.D.;
title: "Diversity and diversification of HLA-A,B,C alleles.";
references: [('MEDLINE', '89235215')]
authors: Ezquerra A., Domenech N., van der Poel J., Strominger J.L., Vega M.A.,
Lopez de Castro J.A.;
title: "Molecular analysis of an HLA-A2 functional variant CLA defined by
cytolytic T lymphocytes.";
references: [('MEDLINE', '86305811')]
authors: Domenech N., Ezquerra A., Castano R., Lopez de Castro J.A.;
title: "Structural analysis of HLA-A2.4 functional variant KNE. Implications
for the mapping of HLA-A2-specific T-cell epitopes.";
references: [('MEDLINE', '88113844')]
authors: Domenech N., Castano R., Goulmy E., Lopez de Castro J.A.;
title: "Molecular analysis of HLA-A2.4 functional variant KLO: close
structural and evolutionary relatedness to the HLA-A2.2 subtype.";
references: [('MEDLINE', '88314183')]
authors: Castano R., Ezquerra A., Domenech N., Lopez de Castro J.A.;
title: "An HLA-A2 population variant with structural polymorphism in the
alpha 3 region.";
references: [('MEDLINE', '88186100')]
authors: Epstein H., Kennedy L., Holmes N.;
title: "An Oriental HLA-A2 subtype is closely related to a subset of
Caucasoid HLA-A2 alleles.";
references: [('MEDLINE', '89122133')]
authors: Castano A.R., Lopez de Castro J.A.;
title: "Structure of the HLA-A*0211 (A2.5) subtype: further evidence for
selection-driven diversification of HLA-A2 antigens.";
references: [('MEDLINE', '92218010')]
authors: Barber D.F., Fernandez J.M., Lopez de Castro J.A.;
title: "Primary structure of a new HLA-A2 subtype: HLA-A*0213.";
references: [('MEDLINE', '94222455')]
authors: Barouch D., Krausa P., Bodmer J., Browning M.J., McMichael A.J.;
title: "Identification of a novel HLA-A2 subtype, HLA-A*0216.";
references: [('MEDLINE', '95278976')]
authors: Selvakumar A., Granja C.B., Salazar M., Alosco S.M., Yunis E.J.,
Dupont B.;
title: "A novel subtype of A2 (A*0217) isolated from the South American
Indian B-cell line AMALA.";
references: [('MEDLINE', '95381236')]
authors: Kashiwase K., Tokunaga K., Ishikawa Y., Oohashi H., Hashimoto M.,
Akaza T., Tadokoro K., Juji T.;
title: "A new A2 sequence HLA-A2K from Japanese.";
references: []
authors: Fleischhauer K., Zino E., Mazzi B., Severini G.M., Benazzi E.,
Bordignon C.;
title: "HLA-A*02 subtype distribution in Caucasians from northern Italy:
identification of A*0220.";
references: [('MEDLINE', '97161038')]
authors: Szmania S., Baxter-Lowe L.A.;
title: "Nucleotide sequence of a novel HLA-A2 gene.";
references: []
authors: Bjorkman P.J., Saper M.A., Samraoui B., Bennett W.S.,
Strominger J.L., Wiley D.C.;
title: "Structure of the human class I histocompatibility antigen, HLA-A2.";
references: [('MEDLINE', '88014204')]
authors: Saper M.A., Bjorkman P.J., Wiley D.C.;
title: "Refined structure of the human histocompatibility antigen HLA-A2 at
2.6-A resolution.";
references: [('MEDLINE', '91245570')]

testing sp009...
*Using SequenceParser
O23729
CHS3_BROFI
CHALCONE SYNTHASE 3 (EC 2.3.1.74) (NARINGENIN-CHALCONE SYNTHASE 3).
Seq('MAPAMEEIRQAQRAEGPAAVLAIGTSTPPNALYQADYPDYYFRITKSEHLTELK...GAE', ProteinAlphabet())
*Using RecordParser
CHS3_BROFI
['O23729']
['Eukaryota', 'Viridiplantae', 'Embryophyta', 'Tracheophyta', 'Spermatophyta', 'Magnoliophyta', 'Liliopsida', 'Asparagales', 'Orchidaceae', 'Bromheadia']
(394, 42941, '2F8D14AF4870BBB2')
***Features:
('ACT_SITE', 165, 165, 'BY SIMILARITY.', '')
***References:
authors: Liew C.F., Lim S.H., Loh C.S., Goh C.J.;
title: "Molecular cloning and sequence analysis of chalcone synthase cDNAs of
Bromheadia finlaysoniana.";
references: []

testing sp010...
*Using SequenceParser
Q13639
5H4_HUMAN
5-HYDROXYTRYPTAMINE 4 RECEPTOR (5-HT-4) (SEROTONIN RECEPTOR) (5-HT4).
Seq('MDKLDANVSSEEGFGSVEKVVLLTFLSTVILMAILGNLLVMVAVCWDRQLRKIK...SDT', ProteinAlphabet())
*Using RecordParser
5H4_HUMAN
['Q13639', 'Q9UBM6', 'Q9UQR6', 'Q9UE22', 'Q9UE23', 'Q9UBT4', 'Q9NY73']
['Eukaryota', 'Metazoa', 'Chordata', 'Craniata', 'Vertebrata', 'Euteleostomi', 'Mammalia', 'Eutheria', 'Primates', 'Catarrhini', 'Hominidae', 'Homo']
(388, 43761, '7FCFEC60E7BDF560')
***Features:
('DOMAIN', 1, 19, 'EXTRACELLULAR (POTENTIAL).', '')
('TRANSMEM', 20, 40, '1 (POTENTIAL).', '')
('DOMAIN', 41, 58, 'CYTOPLASMIC (POTENTIAL).', '')
('TRANSMEM', 59, 79, '2 (POTENTIAL).', '')
('DOMAIN', 80, 93, 'EXTRACELLULAR (POTENTIAL).', '')
('TRANSMEM', 94, 116, '3 (POTENTIAL).', '')
('DOMAIN', 117, 137, 'CYTOPLASMIC (POTENTIAL).', '')
('TRANSMEM', 138, 158, '4 (POTENTIAL).', '')
('DOMAIN', 159, 192, 'EXTRACELLULAR (POTENTIAL).', '')
('TRANSMEM', 193, 213, '5 (POTENTIAL).', '')
('DOMAIN', 214, 260, 'CYTOPLASMIC (POTENTIAL).', '')
('TRANSMEM', 261, 281, '6 (POTENTIAL).', '')
('DOMAIN', 282, 294, 'EXTRACELLULAR (POTENTIAL).', '')
('TRANSMEM', 295, 315, '7 (POTENTIAL).', '')
('DOMAIN', 316, 388, 'CYTOPLASMIC (POTENTIAL).', '')
('CARBOHYD', 7, 7, 'N-LINKED (GLCNAC...) (POTENTIAL).', '')
('DISULFID', 93, 184, 'BY SIMILARITY.', '')
('LIPID', 329, 329, 'PALMITATE (BY SIMILARITY).', '')
('VARSPLIC', 169, 169, 'L -> LERSLNQGLGQDFHA (IN ISOFORM 5- HT4(F)).', '')
('VARSPLIC', 359, 388, 'RDAVECGGQWESQCHPPATSPLVAAQPSDT -> SGCSPVSSFLLLFCNRPVPV (IN ISOFORM 5-HT4(E)).', '')
('VARSPLIC', 359, 388, 'RDAVECGGQWESQCHPPATSPLVAAQPSDT -> SSGTETDRRNFGIRKRRLTKPS (IN ISOFORM 5-HT4(D)).', '')
('VARSPLIC', 360, 388, 'DAVECGGQWESQCHPPATSPLVAAQPSDT -> F (IN ISOFORM 5-HT4(C)).', '')
('VARSPLIC', 360, 388, 'DAVECGGQWESQCHPPATSPLVAAQPSDT -> YTVLHRGHHQELEKLPIHNDPESLESCF (IN ISOFORM 5- HT4(A)).', '')
***References:
authors: Blondel O., Gastineau M., Dahmoune Y., Langlois M., Fischmeister R.;
title: "Cloning, expression, and pharmacology of four human 5-
hydroxytryptamine receptor isoforms produced by alternative splicing
in the carboxyl terminus.";
references: [('PubMed', '9603189')]
authors: Van den Wyngaert I., Gommeren W., Jurzak M., Verhasselt P., Gordon R.,
Leysen J., Luyten W., Bender E.;
title: "Cloning and expression of 5-HT4 receptor species and splice
variants.";
references: []
authors: Claeysen S., Faye P., Sebben M., Lemaire S., Bockaert J., Dumuis A.;
title: "Cloning and expression of human 5-HT4S receptors. Effect of receptor
density on their coupling to adenylyl cyclase.";
references: [('PubMed', '9351641')]
authors: Claeysen S., Sebben M., Becamel C., Bockaert J., Dumuis A.;
title: "Novel brain-specific 5-HT4 receptors splice variants show marked
constitutive activity: role of the c-terminal intracellular domain.";
references: []
authors: Bender E., Pindon A., van Oers I., Zhang Y.B., Gommeren W.,
Verhasselt P., Jurzak M., Leysen J., Luyten W.;
title: "Structure of the human serotonin 5-HT4 receptor gene and cloning of a
novel 5-HT4 splice variant.";
references: [('PubMed', '10646498')]
authors: Ullmer C., Schmuck K., Kalkman H.O., Lubbert H.;
title: "Expression of serotonin receptor mRNAs in blood vessels.";
references: [('MEDLINE', '95385798'), ('PubMed', '7656980')]

testing sp011...
*Using SequenceParser
P16235
LSHR_RAT
LUTROPIN-CHORIOGONADOTROPIC HORMONE RECEPTOR PRECURSOR (LH/CG-R)
(LSH-R) (LUTEINIZING HORMONE RECEPTOR).
Seq('MGRRVPALRQLLVLAVLLLKPSQLQSRELSGSRCPEPCDCAPDGALRCPGPRAG...LTH', ProteinAlphabet())
*Using RecordParser
LSHR_RAT
['P16235', 'P70646', 'Q63807', 'Q63808', 'Q63809']
['Eukaryota', 'Metazoa', 'Chordata', 'Craniata', 'Vertebrata', 'Euteleostomi', 'Mammalia', 'Eutheria', 'Rodentia', 'Sciurognathi', 'Muridae', 'Murinae', 'Rattus']
(700, 78035, '31807E73BAC94F1F')
***Features:
('SIGNAL', 1, 26, '', '')
('CHAIN', 27, 700, 'LUTROPIN-CHORIOGONADOTROPIC HORMONE RECEPTOR.', '')
('DOMAIN', 27, 362, 'EXTRACELLULAR (POTENTIAL).', '')
('TRANSMEM', 363, 390, '1 (POTENTIAL).', '')
('DOMAIN', 391, 399, 'CYTOPLASMIC (POTENTIAL).', '')
('TRANSMEM', 400, 422, '2 (POTENTIAL).', '')
('DOMAIN', 423, 443, 'EXTRACELLULAR (POTENTIAL).', '')
('TRANSMEM', 444, 466, '3 (POTENTIAL).', '')
('DOMAIN', 467, 486, 'CYTOPLASMIC (POTENTIAL).', '')
('TRANSMEM', 487, 509, '4 (POTENTIAL).', '')
('DOMAIN', 510, 529, 'EXTRACELLULAR (POTENTIAL).', '')
('TRANSMEM', 530, 551, '5 (POTENTIAL).', '')
('DOMAIN', 552, 574, 'CYTOPLASMIC (POTENTIAL).', '')
('TRANSMEM', 575, 598, '6 (POTENTIAL).', '')
('DOMAIN', 599, 609, 'EXTRACELLULAR (POTENTIAL).', '')
('TRANSMEM', 610, 631, '7 (POTENTIAL).', '')
('DOMAIN', 632, 700, 'CYTOPLASMIC (POTENTIAL).', '')
('REPEAT', 52, 75, 'LRR 1.', '')
('REPEAT', 126, 150, 'LRR 2.', '')
('REPEAT', 152, 175, 'LRR 3.', '')
('REPEAT', 176, 200, 'LRR 4.', '')
('REPEAT', 202, 224, 'LRR 5.', '')
('REPEAT', 225, 248, 'LRR 6.', '')
('REPEAT', 250, 271, 'LRR 7.', '')
('DISULFID', 443, 518, 'BY SIMILARITY.', '')
('CARBOHYD', 103, 103, 'N-LINKED (GLCNAC...) (POTENTIAL).', '')
('CARBOHYD', 178, 178, 'N-LINKED (GLCNAC...) (POTENTIAL).', '')
('CARBOHYD', 199, 199, 'N-LINKED (GLCNAC...) (POTENTIAL).', '')
('CARBOHYD', 295, 295, 'N-LINKED (GLCNAC...) (POTENTIAL).', '')
('CARBOHYD', 303, 303, 'N-LINKED (GLCNAC...) (POTENTIAL).', '')
('CARBOHYD', 317, 317, 'N-LINKED (GLCNAC...) (POTENTIAL).', '')
('VARSPLIC', 83, 132, 'MISSING (IN ISOFORM 1950).', '')
('VARSPLIC', 133, 157, 'MISSING (IN ISOFORM 1759).', '')
('VARSPLIC', 184, 700, 'MISSING (IN ISOFORM C2).', '')
('VARSPLIC', 232, 251, 'DISSTKLQALPSHGLESIQT -> PCRATGWSPFRRSSPCLPTH (IN ISOFORM 2075).', '')
('VARSPLIC', 232, 293, 'MISSING (IN ISOFORM E/A2, ISOFORM EB AND ISOFORM B1).', '')
('VARSPLIC', 252, 700, 'MISSING (IN ISOFORM 2075).', '')
('VARSPLIC', 294, 367, 'QNFSFSIFENFSKQCESTVRKADNETLYSAIFEENELSGWDYDYGFCSPKTLQCAPEPDAFNPCEDIMGYAFLR -> IFHFPFLKTSPNNAKAQLEKQITRRFIPPSLRRMNSVAGIMIMASVHPRHSNVLQNQMLSTPVKILWAMPSLGS (IN ISOFORM B1 AND ISOFORM B3).', '')
('VARSPLIC', 294, 294, 'Q -> P (IN ISOFORM C1).', '')
('VARSPLIC', 295, 700, 'MISSING (IN ISOFORM C1).', '')
('VARSPLIC', 321, 342, 'YSAIFEENELSGWDYDYGFCSP -> LHGALPAAHCLRGLPNKRPVL (IN ISOFORM 1834, ISOFORM 1759 AND ISOFORM EB).', '')
('VARSPLIC', 343, 700, 'MISSING (IN ISOFORMS 1834, ISOFORM 1759 AND ISOFORM EB).', '')
('VARSPLIC', 368, 700, 'MISSING (IN ISOFORM B1 AND ISOFORM B3).', '')
('VARIANT', 82, 82, 'I -> M (IN ISOFORM 1950).', '')
('VARIANT', 179, 179, 'E -> G (IN ISOFORM 1759).', '')
('VARIANT', 233, 233, 'I -> T (IN ISOFORM 1950).', '')
('VARIANT', 646, 646, 'G -> S (IN ISOFORM 1950).', '')
('MUTAGEN', 409, 409, 'D->N: SIGNIFICANT REDUCTION OF BINDING.', '')
('MUTAGEN', 436, 436, 'D->N: NO CHANGE IN BINDING OR CAMP PROD.', '')
('MUTAGEN', 455, 455, 'E->Q: NO CHANGE IN BINDING OR CAMP PROD.', '')
('MUTAGEN', 582, 582, 'D->N: NO CHANGE IN BINDING OR CAMP PROD.', '')
('CONFLICT', 33, 33, 'R -> L (IN REF. 7).', '')
***References:
authors: McFarland K.C., Sprengel R., Phillips H.S., Koehler M.,
Rosemblit N., Nikolics K., Segaloff D.L., Seeburg P.H.;
title: "Lutropin-choriogonadotropin receptor: an unusual member of the G
protein-coupled receptor family.";
references: [('MEDLINE', '89332512'), ('PubMed', '2502842')]
authors: Aatsinki J.T., Pietila E.M., Lakkakorpi J.T., Rajaniemi H.J.;
title: "Expression of the LH/CG receptor gene in rat ovarian tissue is
regulated by an extensive alternative splicing of the primary
transcript.";
references: [('MEDLINE', '92347604'), ('PubMed', '1353463')]
authors: Koo Y.B., Slaughter R.G., Ji T.H.;
title: "Structure of the luteinizing hormone receptor gene and multiple
exons of the coding sequence.";
references: [('MEDLINE', '91209270'), ('PubMed', '2019252')]
authors: Bernard M.P., Myers R.V., Moyle W.R.;
title: "Cloning of rat lutropin (LH) receptor analogs lacking the soybean
lectin domain.";
references: [('MEDLINE', '91006819'), ('PubMed', '1976554')]
authors: Segaloff D.L., Sprengel R., Nikolics K., Ascoli M.;
title: "Structure of the lutropin/choriogonadotropin receptor.";
references: [('MEDLINE', '91126285'), ('PubMed', '2281186')]
authors: Tsai-Morris C.H., Buczko E., Wang W., Dufau M.L.;
title: "Intronic nature of the rat luteinizing hormone receptor gene defines
a soluble receptor subspecies with hormone binding activity.";
references: [('MEDLINE', '91060531'), ('PubMed', '2174034')]
authors: Roche P.C., Ryan R.J.;
title: "Purification, characterization, and amino-terminal sequence of rat
ovarian receptor for luteinizing hormone/human choriogonadotropin.";
references: [('MEDLINE', '89174723'), ('PubMed', '2925659')]
authors: Ji I., Ji T.H.;
title: "Asp383 in the second transmembrane domain of the lutropin receptor
is important for high affinity hormone binding and cAMP production.";
references: [('MEDLINE', '91332007'), ('PubMed', '1714448')]

testing sp012...
*Using SequenceParser
Q9Y736
Q9Y736
UBIQUITIN.
Seq('MQIFVKTLTGKTITLEVESSDTIDNVKTKIQDKEGIPPDQQRLIFAGKQLEDGR...GGN', ProteinAlphabet())
*Using RecordParser
Q9Y736
['Q9Y736']
['Eukaryota', 'Fungi', 'Ascomycota', 'Pezizomycotina', 'Eurotiomycetes', 'Onygenales', 'Arthrodermataceae', 'mitosporic Arthrodermataceae', 'Trichophyton']
(153, 17238, '01153CF30C2DEDFF')
***Features:
***References:
authors: Kano R., Nakamura Y., Watanabe S., Hasegawa A.;
title: "Trichophyton mentagrophytes mRNA for ubiquitin.";
references: []
authors: Kano R.;
title: "Microsporum canis mRNA for ubiquitin, complete cds.";
references: []

testing sp013...
*Using SequenceParser
P82909
P82909
MITOCHONDRIAL 28S RIBOSOMAL PROTEIN S36 (MRP-S36).
Seq('MGSKMASASRVVQVVKPHTPLIRFPDRRDNPKPNVSEALRSAGLPSHSSVISQH...GPE', ProteinAlphabet())
*Using RecordParser
P82909
['P82909']
['Eukaryota', 'Metazoa', 'Chordata', 'Craniata', 'Vertebrata', 'Euteleostomi', 'Mammalia', 'Eutheria', 'Primates', 'Catarrhini', 'Hominidae', 'Homo']
(102, 11335, '83EF107B42E2FCFD')
***Features:
***References:
authors: Strausberg R.;
title: 
references: []
authors: Koc E.C., Burkhart W., Blackburn K., Moseley A., Spremulli L.L.;
title: "The small subunit of the mammalian mitochondrial ribosome.
Identification of the full complement ribosomal proteins present.";
references: []

testing sp014...
*Using SequenceParser
P12166
PSBL_ORYSA
PHOTOSYSTEM II REACTION CENTER L PROTEIN (PSII 5 KDA PROTEIN).
Seq('TQSNPNEQNVELNRTSLYWGLLLIFVLAVLFSNYFFN', ProteinAlphabet())
*Using RecordParser
PSBL_ORYSA
['P12166', 'P12167', 'Q34007']
['Eukaryota', 'Viridiplantae', 'Embryophyta', 'Tracheophyta', 'Spermatophyta', 'Magnoliophyta', 'Liliopsida', 'Poales', 'Poaceae', 'Ehrhartoideae', 'Oryzeae', 'Oryza']
(37, 4366, 'CC537AEC50B2C784')
***Features:
('INIT_MET', 0, 0, '', '')
***References:
authors: Sugiura M.;
title: 
references: []
authors: Hiratsuka J., Shimada H., Whittier R., Ishibashi T., Sakamoto M.,
Mori M., Kondo C., Honji Y., Sun C.-R., Meng B.-Y., Li Y.-Q.,
Kanno A., Nishizawa Y., Hirai A., Shinozaki K., Sugiura M.;
title: "The complete sequence of the rice (Oryza sativa) chloroplast genome:
intermolecular recombination between distinct tRNA genes accounts for
a major plastid DNA inversion during the evolution of the cereals.";
references: [('MEDLINE', '89364698'), ('PubMed', '2770692')]
authors: Sugiura M.;
title: 
references: []
authors: Shinozaki K., Ohme M., Tanaka M., Wakasugi T., Hayashida N.,
Matsubayashi T., Zaita N., Chunwongse J., Obokata J.,
Yamaguchi-Shinozaki K., Ohto C., Torazawa K., Meng B.Y., Sugita M.,
Deno H., Kamogashira T., Yamada K., Kusuda J., Takaiwa F., Kato A.,
Tohdoh N., Shimada H., Sugiura M.;
title: "The complete nucleotide sequence of the tobacco chloroplast genome:
its gene organization and expression.";
references: []
authors: Chaudhuri S., Maliga P.;
title: "Sequences directing C to U editing of the plastid psbL mRNA are
located within a 22 nucleotide segment spanning the editing site.";
references: [('MEDLINE', '97076156'), ('PubMed', '8918473')]
authors: Chakhmakhcheva O.G., Andreeva A.V., Buryakova A.A., Reverdatto S.V.,
Efimov V.A.;
title: "Nucleotide sequence of the barley chloroplast psbE, psbF genes and
flanking regions.";
references: [('MEDLINE', '89240046'), ('PubMed', '2654886')]
authors: Efimov V.A., Andreeva A.V., Reverdatto S.V., Chakhmakhcheva O.G.;
title: "Photosystem II of rye. Nucleotide sequence of the psbB, psbC, psbE,
psbF, psbH genes of rye and chloroplast DNA regions adjacent to
them.";
references: [('MEDLINE', '92207253'), ('PubMed', '1804121')]
authors: Webber A.N., Hird S.M., Packman L.C., Dyer T.A., Gray J.C.;
title: "A photosystem II polypeptide is encoded by an open reading frame
co-transcribed with genes for cytochrome b-559 in wheat chloroplast
DNA.";
references: []
authors: Kudla J., Igloi G.L., Metzlaff M., Hagemann R., Koessel H.;
title: "RNA editing in tobacco chloroplasts leads to the formation of a
translatable psbL mRNA by a C to U substitution within the initiation
codon.";
references: [('MEDLINE', '92191997'), ('PubMed', '1547774')]
authors: Zolotarev A.S., Kolosov V.L.;
title: "Nucleotide sequence of the rye chloroplast DNA fragment, comprising
psbE and psbF genes.";
references: [('MEDLINE', '89160331'), ('PubMed', '2646599')]
authors: Kolosov V.L., Klezovich O.N., Abdulaev N.G., Zolotarev A.S.;
title: "Photosystem II of rye. Nucleotide sequence of genes psbE, psbF, psbL
and OPC40 of chloroplast DNA.";
references: [('MEDLINE', '90073796'), ('PubMed', '2686655')]
authors: Haley J., Bogorad L.;
title: 
references: []
authors: Maier R.M., Neckermann K., Igloi G.L., Koessel H.;
title: "Complete sequence of the maize chloroplast genome: gene content,
hotspots of divergence and fine tuning of genetic information by
transcript editing.";
references: [('MEDLINE', '95395841'), ('PubMed', '7666415')]
authors: Willey D.L., Gray J.C.;
title: "Two small open reading frames are co-transcribed with the pea
chloroplast genes for the polypeptides of cytochrome b-559.";
references: [('MEDLINE', '89354671'), ('PubMed', '2766383')]
authors: Bock R., Hagemann R., Koessel H., Kudla J.;
title: "Tissue- and stage-specific modulation of RNA editing of the psbF and
psbL transcript from spinach plastids -- a new regulatory mechanism?";
references: [('MEDLINE', '93360903'), ('PubMed', '8355656')]
authors: Hermann R.G., Alt J., Schiller B., Widger W.R., Cramer W.A.;
title: "Nucleotide sequence of the gene for apocytochrome b-559 on the
spinach plastid chromosome: implications for the structure of the
membrane protein.";
references: []
authors: Kuntz M., Camara B., Weil J.-H., Schantz R.;
title: "The psbL gene from bell pepper (Capsicum annuum): plastid RNA
editing also occurs in non-photosynthetic chromoplasts.";
references: [('MEDLINE', '93099270'), ('PubMed', '1463853')]
authors: Forsthoefel N.R., Cushman J.C.;
title: "Characterization and expression of photosystem II genes (psbE, psbF,
and psbL) from the facultative crassulacean acid metabolism plant
Mesembryanthemum crystallinum.";
references: [('MEDLINE', '94345017'), ('PubMed', '8066140')]
authors: Kubo T., Yanai Y., Kinoshita T., Mikami T.;
title: "The chloroplast trnP-trnW-petG gene cluster in the mitochondrial
genomes of Beta vulgaris, B. trigyna and B. webbiana: evolutionary
aspects.";
references: [('MEDLINE', '95254673'), ('PubMed', '7736615')]
authors: Naithani S.;
title: 
references: []
authors: Ikeuchi M., Takio K., Inoue Y.;
title: "N-terminal sequencing of photosystem II low-molecular-mass proteins.
5 and 4.1 kDa components of the O2-evolving core complex from higher
plants.";
references: [('MEDLINE', '89121082'), ('PubMed', '2644131')]
authors: Zheleva D., Sharma J., Panico M., Morris H.R., Barber J.;
title: "Isolation and characterization of monomeric and dimeric
CP47-reaction center photosystem II complexes.";
references: [('MEDLINE', '98298118'), ('PubMed', '9632665')]

testing sp015...
*Using SequenceParser
IPI00383150
IPI00383150.2

Seq('MSFQAPRRLLELAGQSLLRDQALAISVLDELPRELFPRLFVEAFTSRRCEVLKV...TPC', ProteinAlphabet())
*Using RecordParser
IPI00383150.2
['IPI00383150']
['Eukaryota', 'Metazoa', 'Chordata', 'Craniata', 'Vertebrata', 'Euteleostomi', 'Mammalia', 'Eutheria', 'Primates', 'Catarrhini', 'Hominidae', 'Homo']
(457, 52856, '5C3151AAADBDE232')
***Features:
***References:
