~ubuntu-branches/ubuntu/hoary/bioperl/hoary

« back to all changes in this revision

Viewing changes to t/data/interpro_short.xml

  • Committer: Bazaar Package Importer
  • Author(s): Matt Hope
  • Date: 2004-04-18 14:24:11 UTC
  • mfrom: (1.2.1 upstream) (2.1.1 warty)
  • Revision ID: james.westby@ubuntu.com-20040418142411-gr92uexquw4w8liq
Tags: 1.4-1
* New upstream release
* Examples and working code are installed by default to usr/bin,
  this has been moved to usr/share/doc/bioperl/bin

Show diffs side-by-side

added added

removed removed

Lines of Context:
 
1
<?xml version="1.0" encoding="ISO-8859-1"?>
 
2
<!-- edited with XML Spy v4.4 U (http://www.xmlspy.com) by LYNN WHITE (EMBL OUTSTATION THE EBI) -->
 
3
<!DOCTYPE interprodb SYSTEM "interpro.dtd">
 
4
<interprodb>
 
5
  <release>
 
6
    <dbinfo dbname="INTERPRO" version="5.1" entry_count="5630" file_date="12-JUL-2002 00:00:00"/>
 
7
    <dbinfo dbname="SWISS" version="40.22" entry_count="110823" file_date="24-JUN-2002 00:00:00"/>
 
8
    <dbinfo dbname="TREMBL" version="21.2" entry_count="671586" file_date="05-JUL-2002 00:00:00"/>
 
9
    <dbinfo dbname="PRINTS" version="33.0" entry_count="1650" file_date="24-JAN-2002 00:00:00"/>
 
10
    <dbinfo dbname="PREFILE" version="N/A" entry_count="252" file_date="18-JUL-2001 00:00:00"/>
 
11
    <dbinfo dbname="PROSITE" version="17.5" entry_count="1565" file_date="21-JUN-2002 00:00:00"/>
 
12
    <dbinfo dbname="PFAM" version="7.3" entry_count="3865" file_date="17-MAY-2002 00:00:00"/>
 
13
    <dbinfo dbname="PRODOM" version="2001.3" entry_count="1346" file_date="28-JAN-2002 00:00:00"/>
 
14
    <dbinfo dbname="SMART" version="3.1" entry_count="509" file_date="16-NOV-2000 00:00:00"/>
 
15
    <dbinfo dbname="TIGRFAMs" version="1.2" entry_count="814" file_date="03-AUG-2001 00:00:00"/>
 
16
  </release>
 
17
  <interpro id="IPR000001" type="Domain" short_name="Kringle" protein_count="129">
 
18
    <name>Kringle</name>
 
19
    <abstract>
 
20
Kringles are autonomous structural domains, found throughout the blood 
 
21
               clotting and fibrinolytic proteins.
 
22
Kringle domains are believed to play a role in binding mediators (e.g., membranes,
 
23
other proteins or phospholipids), and in the regulation of proteolytic activity
 
24
<cite idref="PUB00002414"/>, <cite idref="PUB00001541"/>, <cite idref="PUB00003257"/>. 
 
25
Kringle domains <cite idref="PUB00003400"/>, <cite idref="PUB00000803"/>, <cite idref="PUB00001620"/> are characterised by a triple loop, 3-disulphide bridge structure, whose  conformation is defined by a number of hydrogen bonds and small pieces of  anti-parallel beta-sheet. They are found in a varying number  of  copies,  in some serine proteases and
 
26
plasma proteins.</abstract>
 
27
    <example_list>
 
28
      <example><db_xref dbkey="P00748" db="SWISS"/>Blood coagulation factor XII (Hageman factor) (1 copy)</example>
 
29
      <example><db_xref dbkey="P00749" db="SWISS"/>Urokinase-type plasminogen activator (1 copy)</example>
 
30
      <example><db_xref dbkey="Q08048" db="SWISS"/>Hepatocyte growth factor (HGF) (4 copies)</example>
 
31
      <example><db_xref dbkey="Q04756" db="SWISS"/>Hepatocyte growth factor activator <cite idref="PUB00003400"/> (1 copy) <cite idref="PUB00002776"/></example>
 
32
      <example>
 
33
                                <db_xref dbkey="P06867" db="SWISS"/>
 
34
Plasminogen (5 copies)
 
35
      </example>
 
36
      <example>
 
37
                                <db_xref dbkey="P26927" db="SWISS"/>
 
38
Hepatocyte growth factor like protein (4 copies) <cite idref="PUB00000355"/>
 
39
                        </example>
 
40
      <example>
 
41
                                <db_xref dbkey="P00735" db="SWISS"/>
 
42
Thrombin (2 copies)
 
43
      </example>
 
44
      <example>
 
45
                                <db_xref dbkey="P15638" db="SWISS"/>
 
46
Tissue plasminogen activator (TPA) (2 copies)
 
47
      </example>
 
48
      <example>
 
49
                                <db_xref dbkey="P08519" db="SWISS"/>
 
50
Apolipoprotein A (38 copies)
 
51
      </example>
 
52
    </example_list>
 
53
    <pub_list>
 
54
      <publication id="PUB00002414">
 
55
        <author_list>Fujikawa K., McMullen B.A.</author_list>
 
56
        <title>Primary structure of the heavy chain of human factor XIIa.</title>
 
57
        <db_xref db="MEDLINE" dbkey="85182674"/>
 
58
        <journal>J. Biol. Chem.</journal>
 
59
        <location firstpage="5328" lastpage="5341" volume="260"/>
 
60
        <year>1985</year>
 
61
      </publication>
 
62
      <publication id="PUB00001541">
 
63
        <author_list>Patthy L., Trexler M., Vali V., Banyai L., Varadi A.</author_list>
 
64
        <title>Kringles: Modules specialized for protein binding.</title>
 
65
        <db_xref db="MEDLINE" dbkey="84208845"/>
 
66
        <journal>FEBS Lett.</journal>
 
67
        <location firstpage="131" lastpage="136" volume="171"/>
 
68
        <year>1984</year>
 
69
      </publication>
 
70
      <publication id="PUB00003257">
 
71
        <author_list>Atkinson R.A., Williams R.J.P.</author_list>
 
72
        <title>Solution structure of the kringle 4 domain from human plasminogen by 1H nuclear magnetic resonance spectroscopy and distance geometry.</title>
 
73
        <db_xref db="MEDLINE" dbkey="90219023"/>
 
74
        <journal>J. Mol. Biol.</journal>
 
75
        <location firstpage="541" lastpage="552" volume="212"/>
 
76
        <year>1990</year>
 
77
      </publication>
 
78
      <publication id="PUB00003400">
 
79
        <author_list>Castellino F.J., Beals J.M.</author_list>
 
80
        <title>The genetic relationships between the kringle domains of human plasminogen, prothrombin, tissue plasminogen activator, urokinase, and coagulation factor XII.</title>
 
81
        <db_xref db="MEDLINE" dbkey="88230478"/>
 
82
        <journal>J. Mol. Evol.</journal>
 
83
        <location firstpage="358" lastpage="369" volume="26"/>
 
84
        <year>1987</year>
 
85
      </publication>
 
86
      <publication id="PUB00000803">
 
87
        <author_list>Patthy L.</author_list>
 
88
        <title>Evolution of the proteases of blood coagulation and fibrinolysis by assembly from modules.</title>
 
89
        <db_xref db="MEDLINE" dbkey="85228216"/>
 
90
        <journal>Cell</journal>
 
91
        <location firstpage="657" lastpage="663" volume="41"/>
 
92
        <year>1985</year>
 
93
      </publication>
 
94
      <publication id="PUB00001620">
 
95
        <author_list>Takahashi K., Ikeo K., Gojobori T.</author_list>
 
96
        <title>Evolutionary origin of numerous kringles in human and simian apolipoprotein(a).</title>
 
97
        <db_xref db="MEDLINE" dbkey="91348198"/>
 
98
        <journal>FEBS Lett.</journal>
 
99
        <location firstpage="146" lastpage="148" volume="287"/>
 
100
        <year>1991</year>
 
101
      </publication>
 
102
      <publication id="PUB00000355">
 
103
        <author_list>Friezner Degen S.J., Stuart L.A., Han S., Jamison C.S.</author_list>
 
104
        <title>Characterization of the mouse cDNA and gene coding for a hepatocyte growth factor-like protein: expression during development.</title>
 
105
        <db_xref db="MEDLINE" dbkey="92002017"/>
 
106
        <journal>Biochemistry</journal>
 
107
        <location firstpage="9781" lastpage="9791" volume="30"/>
 
108
        <year>1991</year>
 
109
      </publication>
 
110
      <publication id="PUB00002776">
 
111
        <author_list>Miyazawa K., Shimomura T., Kitamura A., Kondo J., Morimoto Y., Kitamura N.</author_list>
 
112
        <title>Molecular cloning and sequence analysis of the cDNA for a human serine protease reponsible for activation of hepatocyte growth factor. Structural similarity of the protease precursor to blood coagulation factor XII.</title>
 
113
        <db_xref db="MEDLINE" dbkey="93252878"/>
 
114
        <journal>J. Biol. Chem.</journal>
 
115
        <location firstpage="10024" lastpage="10028" volume="268"/>
 
116
        <year>1993</year>
 
117
      </publication>
 
118
    </pub_list>
 
119
    <member_list>
 
120
      <db_xref protein_count="91" db="PRINTS" dbkey="PR00018" name="KRINGLE"/>
 
121
      <db_xref protein_count="126" db="PROFILE" dbkey="PS50070" name="KRINGLE_2"/>
 
122
      <db_xref protein_count="161" db="PROSITE" dbkey="PS00021" name="KRINGLE_1"/>
 
123
      <db_xref protein_count="128" db="PFAM" dbkey="PF00051" name="kringle"/>
 
124
      <db_xref protein_count="126" db="PRODOM" dbkey="PD000395" name="Kringle"/>
 
125
      <db_xref protein_count="115" db="SMART" dbkey="SM00130" name="KR"/>
 
126
    </member_list>
 
127
    <external_doc_list>
 
128
      <db_xref db="BLOCKS" dbkey="IPB000001"/>
 
129
      <db_xref db="PDOC" dbkey="PDOC00020"/>
 
130
    </external_doc_list>
 
131
  </interpro>
 
132
  <interpro id="IPR000002" type="Domain" short_name="Fizzy" protein_count="57">
 
133
    <name>Cdc20/Fizzy</name>
 
134
    <abstract>
 
135
&lt;p&gt;The Cdc20/Fizzy region is almost always associated with the G-protein beta WD-40 repeat (<db_xref db="INTERPRO" dbkey="IPR001680"/>). Ubiquitin-mediated proteolysis due to the anaphase-promoting complex/cyclosome
 
136
 (APC/C) is essential for separation of sister chromatids, requiring degradation of the anaphase inhibitor Pds1, and for exit from mitosis, requiring inactivation of cyclin B  Cdk1 kinases <cite idref="PUB00006167"/>. In <taxon tax_id="4890">yeast</taxon> Cdc20 is required for two microtubule-dependent processes, nuclear movements prior to anaphase and chromosome separation. APC(Cdc20) allows activation of Cdc14 and promotes exit from mitosis by mediating proteolysis of Pds1  and the S phase cyclin Clb5 in the yeast <taxon tax_id="4932">Saccharomyces cerevisiae</taxon>. &lt;/p&gt;
 
137
&lt;p&gt;This domain is also found in a number of, as yet, uncharacterised proteins. These include a <taxon tax_id="40674">mammalian</taxon> protein, p55CDC, that is present in dividing cells and is
 
138
      associated with protein kinase activity.&lt;/p&gt;
 
139
</abstract>
 
140
    <example_list>
 
141
      <example>
 
142
                                <db_xref dbkey="P26309" db="SWISS"/>Cell division control protein (Cdc20) from S. cerevisiae
 
143
      </example>
 
144
      <example>
 
145
                                <db_xref dbkey="Q09786" db="SWISS"/>A hypothetical protein from S. pombe
 
146
      </example>
 
147
    </example_list>
 
148
    <pub_list>
 
149
      <publication id="PUB00006167">
 
150
        <author_list>Shirayama M., Toth A., Galova M., Nasmyth K.</author_list>
 
151
        <title>APC(Cdc20) promotes exit from mitosis by destroying the anaphase inhibitor Pds1 and cyclin Clb5.</title>
 
152
        <db_xref db="MEDLINE" dbkey="20110935"/>
 
153
        <journal>Nature</journal>
 
154
        <location firstpage="203" lastpage="207" volume="402" issue="6758"/>
 
155
        <year>1999</year>
 
156
      </publication>
 
157
    </pub_list>
 
158
    <member_list>
 
159
      <db_xref protein_count="59" db="PREFILE" dbkey="PS50218" name="FIZZY_DOMAIN"/>
 
160
      <db_xref protein_count="55" db="PRODOM" dbkey="PD004563" name="Fizzy"/>
 
161
    </member_list>
 
162
    <external_doc_list>
 
163
      <db_xref db="QDOC" dbkey="QDOC50218"/>
 
164
    </external_doc_list>
 
165
  </interpro>
 
166
  <interpro id="IPR000003" type="Family" short_name="RtnoidX_receptor" protein_count="75">
 
167
    <name>Retinoid X receptor</name>
 
168
    <abstract>
 
169
Steroid or nuclear hormone receptors (4A nuclear receptor, NRs) constitute an important superfamily of transcription regulators that are involved in widely diverse physiological functions, including control of embryonic development, cell differentiation and homeostasis. Members of the superfamily include the steroid hormone receptors and receptors for thyroid hormone, retinoids, 1,25-dihydroxy-vitamin D3 and a variety of other ligands. The proteins function as dimeric molecules in nuclei to regulate the transcription of target genes in a ligand-responsive manner <cite idref="PUB00004464"/>, <cite idref="PUB00006168"/>. In addition to C-terminal ligand-binding domains, these nuclear receptors contain a highly-conserved, N-terminal zinc-finger that mediates specific binding to target DNA sequences, termed ligand-responsive elements. In the absence of ligand, steroid hormone receptors are thought to be weakly associated with nuclear components; hormone binding greatly increases receptor affinity.
 
170
 
 
171
NRs are extremely important in medical research, a large number of them being implicated in diseases such as cancer, diabetes, hormone resistance syndromes, etc. While several NRs act as ligand-inducible transcription factors, many do not yet have a defined ligand and are accordingly termed "orphan" receptors. During the last decade, more than 300 NRs have been described, many of which are orphans, which cannot easily be named due to current nomenclature confusions in the literature. However, a new system has recently been introduced in an attempt to rationalise the increasingly complex set of names used to describe superfamily members.
 
172
 
 
173
 
 
174
&lt;p&gt;The retinoic acid (retinoid X) receptor consists of 3 functional and 
 
175
               structural domains: an N-terminal (modulatory) domain; a DNA binding domain
 
176
               that mediates specific binding to target DNA sequences (ligand-responsive
 
177
               elements); and a hormone binding domain. The N-terminal domain differs 
 
178
               between retinoic acid isoforms; the small highly-conserved DNA-binding
 
179
               domain (~65 residues) occupies the central portion of the protein; and 
 
180
               the ligand binding domain lies at the receptor C-terminus.&lt;/p&gt;
 
181
&lt;p&gt;Synonym(s): 2B nuclear receptor&lt;/p&gt;
 
182
</abstract>
 
183
    <class_list>
 
184
      <classification id="GO:0003677" class_type="GO">
 
185
        <category>Molecular Function</category>
 
186
        <description>DNA binding</description>
 
187
      </classification>
 
188
      <classification id="GO:0004879" class_type="GO">
 
189
        <category>Molecular Function</category>
 
190
        <description>ligand-dependent nuclear receptor</description>
 
191
      </classification>
 
192
      <classification id="GO:0005496" class_type="GO">
 
193
        <category>Molecular Function</category>
 
194
        <description>steroid binding</description>
 
195
      </classification>
 
196
      <classification id="GO:0005634" class_type="GO">
 
197
        <category>Cellular Component</category>
 
198
        <description>nucleus</description>
 
199
      </classification>
 
200
      <classification id="GO:0006355" class_type="GO">
 
201
        <category>Biological Process</category>
 
202
        <description>regulation of transcription</description>
 
203
      </classification>
 
204
    </class_list>
 
205
    <example_list>
 
206
      <example>
 
207
                                <db_xref dbkey="Q06726" db="SWISS"/>
 
208
                        </example>
 
209
      <example>
 
210
                                <db_xref dbkey="P81559" db="SWISS"/>
 
211
                        </example>
 
212
      <example>
 
213
                                <db_xref dbkey="Q64104" db="SWISS"/>
 
214
                        </example>
 
215
      <example>
 
216
                                <db_xref dbkey="Q91766" db="SWISS"/>
 
217
                        </example>
 
218
      <example>
 
219
                                <db_xref dbkey="P28701" db="SWISS"/>
 
220
                        </example>
 
221
      <example>
 
222
                                <db_xref dbkey="O75454" db="SWISS"/>
 
223
                        </example>
 
224
    </example_list>
 
225
    <pub_list>
 
226
      <publication id="PUB00004464">
 
227
        <author_list>Nishihara T., Nishikawa J.-I., Kitaura M., Imagawa M.</author_list>
 
228
        <title>Vitamin D receptor contains multiple dimerisation interfaces that are functionally different.</title>
 
229
        <db_xref db="MEDLINE" dbkey="95206940"/>
 
230
        <journal>Nucleic Acids Res.</journal>
 
231
        <location firstpage="606" lastpage="611" volume="23"/>
 
232
        <year>1995</year>
 
233
      </publication>
 
234
      <publication id="PUB00006168">
 
235
        <author_list>Schmitt J., De Vos P., Verhoeven G., Stunnenberg H.G.</author_list>
 
236
        <title>Human androgen receptor expressed in HeLa cells activates transcription in vitro.</title>
 
237
        <db_xref db="MEDLINE" dbkey="94218237"/>
 
238
        <journal>Nucleic Acids Res.</journal>
 
239
        <location firstpage="1161" lastpage="1166" volume="22" issue="7"/>
 
240
        <year>1994</year>
 
241
      </publication>
 
242
    </pub_list>
 
243
    <parent_list>
 
244
      <rel_ref ipr_ref="IPR001723"/>
 
245
    </parent_list>
 
246
    <contains>
 
247
      <rel_ref ipr_ref="IPR000536"/>
 
248
    </contains>
 
249
    <member_list>
 
250
      <db_xref protein_count="75" db="PRINTS" dbkey="PR00545" name="RETINOIDXR"/>
 
251
    </member_list>
 
252
  </interpro>
 
253
  <interpro id="IPR000004" type="Domain" short_name="SapB" protein_count="135">
 
254
    <name>Saposin type B</name>
 
255
    <abstract>
 
256
Saposins are small lysosomal proteins that serve as activators of various
 
257
lysosomal lipid-degrading enzymes <cite idref="PUB00005747"/>. They probably act by isolating the
 
258
lipid substrate from the membrane surroundings, thus making it more 
 
259
accessible to the soluble degradative enzymes. All <taxon tax_id="40674">mammalian</taxon> saposins
 
260
are synthesized as a single precursor molecule (prosaposin) which contains
 
261
four Saposin-B domains, yielding the active saposins after proteolytic
 
262
cleavage, and two Saposin-A domains that are removed in the activation
 
263
reaction. 
 
264
The Saposin-B domains also occur in other 
 
265
proteins, many of them active in the lysis of membranes <cite idref="PUB00005721"/>, <cite idref="PUB00005765"/>. &lt;p&gt;The 3D-structure of NK-lysin has recently been determined <cite idref="PUB00005798"/> and found to
 
266
be very different from the one predicted in <cite idref="PUB00005747"/>.
 
267
A group of <taxon tax_id="3193">plant</taxon> aspartic proteases related to cyprosin. These proteins
 
268
have a peculiar SAP-B domain where the two halves are 'swapped' <cite idref="PUB00005742"/>.&lt;/p&gt;
 
269
</abstract>
 
270
    <example_list>
 
271
      <example>
 
272
                                <db_xref dbkey="P28039" db="SWISS"/>Mammalian Acyloxyacyl-hydrolase
 
273
      </example>
 
274
      <example>
 
275
                                <db_xref dbkey="P42210" db="SWISS"/>Plant aspartic proteinase
 
276
      </example>
 
277
      <example>
 
278
                                <db_xref dbkey="P17405" db="SWISS"/>Mammalian acid sphingomyelinase
 
279
      </example>
 
280
      <example>
 
281
                                <db_xref dbkey="Q07831" db="SWISS"/>Nonpathogenic pore-forming peptide from entamoeba
 
282
      </example>
 
283
      <example>
 
284
                                <db_xref dbkey="P10960" db="SWISS"/>Saposins Sap-A, Sap-B, Sap-C, Sap-D
 
285
      </example>
 
286
    </example_list>
 
287
    <pub_list>
 
288
      <publication id="PUB00005747">
 
289
        <author_list>O'Hara P.J., Munford R.S., Sheppard P.O.</author_list>
 
290
        <title>Saposin-like proteins (SAPLIP) carry out diverse functions on a common backbone structure.</title>
 
291
        <db_xref db="MEDLINE" dbkey="96048294"/>
 
292
        <journal>J. Lipid Res.</journal>
 
293
        <location firstpage="1653" lastpage="1663" volume="36" issue="8"/>
 
294
        <year>1995</year>
 
295
      </publication>
 
296
      <publication id="PUB00005721">
 
297
        <author_list>Ponting C.P.</author_list>
 
298
        <title>Acid sphingomyelinase possesses a domain homologous to its activator proteins: saposins B and D.</title>
 
299
        <db_xref db="MEDLINE" dbkey="94272336"/>
 
300
        <journal>Protein Sci.</journal>
 
301
        <location firstpage="359" lastpage="361" volume="3" issue="2"/>
 
302
        <year>1994</year>
 
303
      </publication>
 
304
      <publication id="PUB00005765">
 
305
        <author_list>Hofmann K., Tschopp J.</author_list>
 
306
        <title>Cytotoxic T cells: more weapons for new targets?</title>
 
307
        <db_xref db="MEDLINE" dbkey="97021725"/>
 
308
        <journal>Trends Microbiol.</journal>
 
309
        <location firstpage="91" lastpage="94" volume="4" issue="3"/>
 
310
        <year>1996</year>
 
311
      </publication>
 
312
      <publication id="PUB00005798">
 
313
        <author_list>Liepinsh E., Otting G., Andersson M., Ruysschaert J.M.</author_list>
 
314
        <title>Saposin fold revealed by the NMR structure of NK-lysin.</title>
 
315
        <db_xref db="MEDLINE" dbkey="97475218"/>
 
316
        <journal>Nat. Struct. Biol.</journal>
 
317
        <location firstpage="793" lastpage="795" volume="4" issue="10"/>
 
318
        <year>1997</year>
 
319
      </publication>
 
320
      <publication id="PUB00005742">
 
321
        <author_list>Ponting C.P., Russell R.B.</author_list>
 
322
        <title>Swaposins: circular permutations within genes encoding saposin homologues.</title>
 
323
        <db_xref db="MEDLINE" dbkey="95334819"/>
 
324
        <journal>Trends Biochem. Sci.</journal>
 
325
        <location firstpage="179" lastpage="180" volume="20" issue="5"/>
 
326
        <year>1995</year>
 
327
      </publication>
 
328
    </pub_list>
 
329
    <child_list>
 
330
      <rel_ref ipr_ref="IPR003258"/>
 
331
    </child_list>
 
332
    <member_list>
 
333
      <db_xref protein_count="133" db="PREFILE" dbkey="PS50015" name="SAP_B"/>
 
334
      <db_xref protein_count="71" db="PRODOM" dbkey="PD001732" name="SapB"/>
 
335
      <db_xref protein_count="109" db="SMART" dbkey="SM00118" name="SAPB"/>
 
336
    </member_list>
 
337
    <external_doc_list>
 
338
      <db_xref db="QDOC" dbkey="QDOC50015"/>
 
339
    </external_doc_list>
 
340
  </interpro>
 
341
  <interpro id="IPR000005" type="Domain" short_name="HTHAraC" protein_count="765">
 
342
    <name>Helix-turn-helix, AraC type </name>
 
343
    <abstract>
 
344
&lt;p&gt;Many bacterial transcription regulation proteins bind DNA through a
 
345
'helix-turn-helix' (HTH) motif. One major subfamily of these proteins <cite idref="PUB00004444"/>, <cite idref="PUB00003566"/> is related to the arabinose 
 
346
operon regulatory protein AraC <cite idref="PUB00004444"/>, <cite idref="PUB00003566"/>.
 
347
Except for celD <cite idref="PUB00001933"/>, all of these proteins seem to be positive transcriptional factors.&lt;/p&gt;
 
348
 
 
349
&lt;p&gt;Although the sequences belonging to this family differ somewhat in length, in nearly every case the HTH motif is situated towards the C-terminus in the third quarter of most of the sequences. The minimal DNA binding domain spans roughly 100 residues and comprises two HTH subdomains; the classical HTH domain and another HTH subdomain with similarity to the classical HTH domain but with an insertion of one residue in the turn-region. The  N-terminal and  central regions of these proteins are presumed
 
350
            to interact  with  effector molecules and may be involved in dimerization <cite idref="PUB00004817"/>.&lt;/p&gt;
 
351
 
 
352
&lt;p&gt;The known structure of MarA (<db_xref db="SWISSPROT" dbkey="P27246"/>) shows that the AraC domain is alpha helical and shows the two HTH subdomains both bind the major groove of the DNA. The two HTH subdomains are separated by only 27
 
353
angstroms, which causes the cognate DNA to bend.&lt;/p&gt;
 
354
</abstract>
 
355
    <class_list>
 
356
      <classification id="GO:0003700" class_type="GO">
 
357
        <category>Molecular Function</category>
 
358
        <description>transcription factor</description>
 
359
      </classification>
 
360
      <classification id="GO:0005622" class_type="GO">
 
361
        <category>Cellular Component</category>
 
362
        <description>intracellular</description>
 
363
      </classification>
 
364
      <classification id="GO:0006355" class_type="GO">
 
365
        <category>Biological Process</category>
 
366
        <description>regulation of transcription</description>
 
367
      </classification>
 
368
    </class_list>
 
369
    <example_list>
 
370
      <example>
 
371
                                <db_xref dbkey="Q04248" db="SWISS"/>Virulence regulon transcriptional activator
 
372
      </example>
 
373
      <example>
 
374
                                <db_xref dbkey="P28809" db="SWISS"/>mmsAB peron regulatory  protein
 
375
      </example>
 
376
      <example>
 
377
                                <db_xref dbkey="Q48413" db="SWISS"/>
 
378
                        </example>
 
379
      <example>
 
380
                                <db_xref dbkey="P35319" db="SWISS"/>Transcription regulator
 
381
      </example>
 
382
      <example>
 
383
                                <db_xref dbkey="Q52620" db="SWISS"/>Regulatory factor of blood coagulation
 
384
      </example>
 
385
      <example>
 
386
                                <db_xref dbkey="P17410" db="SWISS"/>CelD, the Escherichia coli cel operon repressor.
 
387
      </example>
 
388
      <example>
 
389
                                <db_xref dbkey="P19219" db="SWISS"/>AdaA, a Bacillus subtilis  bifunctional protein  that   acts  both  as  a transcriptional activator of the ada operon and as a methylphosphotriester-DNA alkyltransferase.
 
390
      </example>
 
391
      <example>
 
392
                                <db_xref dbkey="P03021" db="SWISS"/>AraC, the arabinose operon regulatory  protein, which activates the transcription of the araBAD genes.
 
393
      </example>
 
394
      <example>
 
395
                                <db_xref dbkey="P27246" db="SWISS"/>MarA,  which  may  be  a transcriptional activator of genes involved in the multiple antibiotic resistance (mar) phenotype.
 
396
      </example>
 
397
    </example_list>
 
398
    <pub_list>
 
399
      <publication id="PUB00004444">
 
400
        <author_list>Gallegos M.-T., Michan C., Ramos J.L.</author_list>
 
401
        <title>The XylS/AraC family of regulators.</title>
 
402
        <db_xref db="MEDLINE" dbkey="93197143"/>
 
403
        <journal>Nucleic Acids Res.</journal>
 
404
        <location firstpage="807" lastpage="810" volume="21"/>
 
405
        <year>1993</year>
 
406
      </publication>
 
407
      <publication id="PUB00003566">
 
408
        <author_list>Henikoff S., Wallace J.C., Brown J.P.</author_list>
 
409
        <title>Finding protein similarities with nucleotide sequence databases.</title>
 
410
        <db_xref db="MEDLINE" dbkey="90190362"/>
 
411
        <journal>Meth. Enzymol.</journal>
 
412
        <location firstpage="111" lastpage="132" volume="183"/>
 
413
        <year>1990</year>
 
414
      </publication>
 
415
      <publication id="PUB00001933">
 
416
        <author_list>Parker L.L., Hall B.G.</author_list>
 
417
        <title>Characterisation and nucleotide sequence of the cryptic cel operon of Escherichia coli K12.</title>
 
418
        <db_xref db="MEDLINE" dbkey="90185127"/>
 
419
        <journal>Genetics</journal>
 
420
        <location firstpage="455" lastpage="471" volume="124"/>
 
421
        <year>1990</year>
 
422
      </publication>
 
423
      <publication id="PUB00004817">
 
424
        <author_list>Bustos S.A., Schleif R.F.</author_list>
 
425
        <title>Functional domains of the AraC protein.</title>
 
426
        <db_xref db="MEDLINE" dbkey="93296193"/>
 
427
        <journal>Proc. Natl. Acad. Sci. U.S.A.</journal>
 
428
        <location firstpage="5638" lastpage="5642" volume="90"/>
 
429
        <year>1993</year>
 
430
      </publication>
 
431
    </pub_list>
 
432
    <member_list>
 
433
      <db_xref protein_count="478" db="PRINTS" dbkey="PR00032" name="HTHARAC"/>
 
434
      <db_xref protein_count="762" db="PROFILE" dbkey="PS01124" name="HTH_ARAC_FAMILY_2"/>
 
435
      <db_xref protein_count="855" db="PROSITE" dbkey="PS00041" name="HTH_ARAC_FAMILY_1"/>
 
436
      <db_xref protein_count="747" db="PFAM" dbkey="PF00165" name="HTH_AraC"/>
 
437
      <db_xref protein_count="683" db="SMART" dbkey="SM00342" name="HTH_ARAC"/>
 
438
    </member_list>
 
439
    <external_doc_list>
 
440
      <db_xref db="BLOCKS" dbkey="IPB000005"/>
 
441
      <db_xref db="PDOC" dbkey="PDOC00040"/>
 
442
    </external_doc_list>
 
443
  </interpro>
 
444
        <interpro id="IPR000010" type="Family" short_name="Cystatin" protein_count="219">
 
445
                <name>Cysteine proteases inhibitor</name>
 
446
                <abstract>
 
447
Members of this family are inhibitors of cysteine  proteases <cite idref="PUB00005324"/>, <cite idref="PUB00003412"/>, <cite idref="PUB00001614"/>, which are found in the tissues and body fluids of <taxon tax_id="33208">animals</taxon>, as well as in <taxon tax_id="3193">plants</taxon>. They can be grouped into three distinct but related families. These are the type 1 cystatins (or stefins), type 2 cystatins, and the kininogens.
 
448
&lt;p&gt;Kininogen is the precursor  of  the  active  peptide  bradykinin that  plays a role in blood coagulation by  helping  to  position optimally prekallikrein and factor XI next  to factor XII. They  are  also  inhibitors  of  cysteine  proteases. Structurally,  kininogens  are  made  of  three  contiguous type-2 cystatin domains, followed  by an  additional  domain  (of  variable  length)  which contains  the  sequence of bradykinin.  The  first  of  the  three cystatin domains seems to have lost its inhibitory activity.&lt;/p&gt;
 
449
</abstract>
 
450
                <class_list>
 
451
                        <classification id="GO:0004869" class_type="GO">
 
452
                                <category>Molecular Function</category>
 
453
                                <description>cysteine protease inhibitor</description>
 
454
                        </classification>
 
455
                </class_list>
 
456
                <example_list>
 
457
                        <example>
 
458
                                <db_xref dbkey="P09229" db="SWISS"/>Cysteine proteinase inhibitor of rice
 
459
      </example>
 
460
                        <example>
 
461
                                <db_xref dbkey="P29701" db="SWISS"/>Mammalian fetuin
 
462
      </example>
 
463
                        <example>
 
464
                                <db_xref dbkey="P28325" db="SWISS"/>Type 2 cystatin
 
465
      </example>
 
466
                        <example>
 
467
                                <db_xref dbkey="P37842" db="SWISS"/>Potato  multicystatin, an eight-domain cysteine proteinase inhibitor
 
468
      </example>
 
469
                        <example>
 
470
                                <db_xref dbkey="P01045" db="SWISS"/>Kininogen
 
471
      </example>
 
472
                        <example>
 
473
                                <db_xref dbkey="Q28986" db="SWISS"/>Type 1 cystatin
 
474
      </example>
 
475
                        <example>
 
476
                                <db_xref dbkey="P31727" db="SWISS"/>Sarcocystatin A from the flesh fish
 
477
      </example>
 
478
                </example_list>
 
479
                <pub_list>
 
480
                        <publication id="PUB00005324">
 
481
                                <author_list>Barrett A.J.</author_list>
 
482
                                <journal>Trends Biochem. Sci.</journal>
 
483
                                <location firstpage="193" lastpage="196" volume="12"/>
 
484
                                <year>1987</year>
 
485
                        </publication>
 
486
                        <publication id="PUB00003412">
 
487
                                <author_list>Rawlings N.D., Barrett A.J.</author_list>
 
488
                                <title>Evolution of proteins of the cystatin superfamily.</title>
 
489
                                <db_xref db="MEDLINE" dbkey="90189177"/>
 
490
                                <journal>J. Mol. Evol.</journal>
 
491
                                <location firstpage="60" lastpage="71" volume="30"/>
 
492
                                <year>1990</year>
 
493
                        </publication>
 
494
                        <publication id="PUB00001614">
 
495
                                <author_list>Bode W., Turk V.</author_list>
 
496
                                <title>The cystatins: protein inhibitors of cysteine proteinases.</title>
 
497
                                <db_xref db="MEDLINE" dbkey="91309737"/>
 
498
                                <journal>FEBS Lett.</journal>
 
499
                                <location firstpage="213" lastpage="219" volume="285"/>
 
500
                                <year>1991</year>
 
501
                        </publication>
 
502
                </pub_list>
 
503
                <child_list>
 
504
                        <rel_ref ipr_ref="IPR001363"/>
 
505
                        <rel_ref ipr_ref="IPR001713"/>
 
506
                        <rel_ref ipr_ref="IPR003243"/>
 
507
                        <rel_ref ipr_ref="IPR003244"/>
 
508
                </child_list>
 
509
                <member_list>
 
510
                        <db_xref protein_count="199" db="PROSITE" dbkey="PS00287" name="CYSTATIN"/>
 
511
                        <db_xref protein_count="209" db="PFAM" dbkey="PF00031" name="cystatin"/>
 
512
                        <db_xref protein_count="205" db="SMART" dbkey="SM00043" name="CY"/>
 
513
                </member_list>
 
514
                <external_doc_list>
 
515
                        <db_xref db="BLOCKS" dbkey="IPB000010"/>
 
516
                        <db_xref db="PDOC" dbkey="PDOC00259"/>
 
517
                </external_doc_list>
 
518
                <sec_list>
 
519
                        <sec_ac acc="IPR000078"/>
 
520
                </sec_list>
 
521
        </interpro>
 
522
        <interpro id="IPR000413" type="Family" short_name="Integrin_alpha" protein_count="126">
 
523
                <name>Integrins alpha chain</name>
 
524
                <abstract>
 
525
Integrins <cite idref="PUB00000811"/>, <cite idref="PUB00001505"/> are a large family of cell surface receptors that mediate cell
 
526
to cell as well as cell to matrix adhesion. Some integrins recognize the R-G-D
 
527
sequence in their extracellular matrix protein ligand. Structurally, integrins
 
528
consist of a dimer of an alpha and a beta chain.  Each  subunit  has  a  large
 
529
N-terminal extracellular domain followed by a transmembrane domain and a short
 
530
C-terminal cytoplasmic  region.    Some    alpha  subunits   are cleaved post-
 
531
translationally to produce  a  heavy  and a  light chain linked by a disulfide
 
532
bond. Integrin alpha chains  share a  conserved sequence which is found at
 
533
the  beginning  of  the  cytoplasmic  domain,  just   after  the  end  of  the
 
534
transmembrane region. The exact pairing of alpha- and beta-subunits determines
 
535
ligand specificity, localisation and function. Within the N-terminal domain of alpha subunits, seven sequence repeats, each
 
536
of approximately 60 amino acids, have been found <cite idref="PUB00006166"/>. It has been predicted 
 
537
that these repeats assume a beta-propeller fold. The domains contain seven 
 
538
four-stranded beta-sheets arranged in a torus around a pseudosymmetry axis
 
539
<cite idref="PUB00005772"/>. Integrin ligands and a putative Mg&lt;sup&gt;2+&lt;/sup&gt; ion are predicted to bind to the
 
540
upper face of the propeller, in a manner analogous to the way in which the
 
541
trimeric G-protein beta subunit (G beta) (which also has a beta-propeller
 
542
fold) binds the G protein alpha subunit <cite idref="PUB00005772"/>.
 
543
</abstract>
 
544
                <class_list>
 
545
                        <classification id="GO:0004895" class_type="GO">
 
546
                                <category>Molecular Function</category>
 
547
                                <description>cell adhesion receptor</description>
 
548
                        </classification>
 
549
                        <classification id="GO:0007155" class_type="GO">
 
550
                                <category>Biological Process</category>
 
551
                                <description>cell adhesion</description>
 
552
                        </classification>
 
553
                        <classification id="GO:0007160" class_type="GO">
 
554
                                <category>Biological Process</category>
 
555
                                <description>cell-matrix adhesion</description>
 
556
                        </classification>
 
557
                        <classification id="GO:0008305" class_type="GO">
 
558
                                <category>Cellular Component</category>
 
559
                                <description>integrin</description>
 
560
                        </classification>
 
561
                </class_list>
 
562
                <example_list>
 
563
                        <example>
 
564
                                <db_xref dbkey="P23229" db="SWISS"/>The alpha-6 chain (VLA-6) which,  with  the beta-1  chain, forms a platelet laminin receptor.
 
565
      </example>
 
566
                        <example>
 
567
                                <db_xref dbkey="P53708" db="SWISS"/>The alpha-8 chain which, with the  beta-1 chain  plays  a  possible role in cell-cell interactions during axon-growth and fasciculation.
 
568
      </example>
 
569
                        <example>
 
570
                                <db_xref dbkey="P08648" db="SWISS"/>The alpha-5 chain (VLA-5) (CD49e) which,  with  the beta-1 chain,  forms  a receptor specific to fibronectin.
 
571
      </example>
 
572
                        <example>
 
573
                                <db_xref dbkey="P12080" db="SWISS"/>The Drosophila position-specific antigen 2 alpha chain (PS2).
 
574
      </example>
 
575
                        <example>
 
576
                                <db_xref dbkey="P26006" db="SWISS"/>The alpha-3 chain (VLA-3) (Galactoprotein B3).
 
577
      </example>
 
578
                        <example>
 
579
                                <db_xref dbkey="P56199" db="SWISS"/>The alpha-1 chain (VLA-1) (CD49a)  which,  with the beta-1 chain, acts as a receptor for laminin and collagen.
 
580
      </example>
 
581
                        <example>
 
582
                                <db_xref dbkey="P13612" db="SWISS"/>The alpha-4 chain (VLA-4) (CD49d)  which,  with the beta-1 chain, interacts with vascular cell adhesion protein 1 (VCAM-1).
 
583
      </example>
 
584
                        <example>
 
585
                                <db_xref dbkey="P17301" db="SWISS"/>The alpha-2 chain (VLA-2) (CD49b)  which,  with the beta-1 chain, acts as a receptor that binds collagen.
 
586
      </example>
 
587
                </example_list>
 
588
                <pub_list>
 
589
                        <publication id="PUB00000811">
 
590
                                <author_list>Hynes R.O.</author_list>
 
591
                                <title>Integrins: a family of cell surface receptors.</title>
 
592
                                <db_xref db="MEDLINE" dbkey="87131067"/>
 
593
                                <journal>Cell</journal>
 
594
                                <location firstpage="549" lastpage="554" volume="48"/>
 
595
                                <year>1987</year>
 
596
                        </publication>
 
597
                        <publication id="PUB00001505">
 
598
                                <author_list>Albelda S.M., Buck C.A.</author_list>
 
599
                                <title>Integrins and other cell adhesion molecules.</title>
 
600
                                <db_xref db="MEDLINE" dbkey="90337122"/>
 
601
                                <journal>FASEB J.</journal>
 
602
                                <location firstpage="2868" lastpage="2880" volume="4"/>
 
603
                                <year>1990</year>
 
604
                        </publication>
 
605
                        <publication id="PUB00006166">
 
606
                                <author_list>Springer T.A., Corbi A.L., Miller L.J., O'Connor K., Larson R.S.</author_list>
 
607
                                <title>cDNA cloning and complete primary structure of the alpha subunit of a leukocyte adhesion glycoprotein, p150,95.</title>
 
608
                                <db_xref db="MEDLINE" dbkey="88166645"/>
 
609
                                <journal>EMBO J.</journal>
 
610
                                <location firstpage="4023" lastpage="4028" volume="6" issue="13"/>
 
611
                                <year>1987</year>
 
612
                        </publication>
 
613
                        <publication id="PUB00005772">
 
614
                                <author_list>Springer T.A.</author_list>
 
615
                                <title>Folding of the N-terminal, ligand-binding region of integrin alpha-subunits into a beta-propeller domain.</title>
 
616
                                <db_xref db="MEDLINE" dbkey="97144395"/>
 
617
                                <journal>Proc. Natl. Acad. Sci. U.S.A.</journal>
 
618
                                <location firstpage="65" lastpage="72" volume="94" issue="1"/>
 
619
                                <year>1997</year>
 
620
                        </publication>
 
621
                </pub_list>
 
622
                <member_list>
 
623
                        <db_xref protein_count="79" db="PRINTS" dbkey="PR01185" name="INTEGRINA"/>
 
624
                        <db_xref protein_count="112" db="PREFILE" dbkey="PS50107" name="INTEGRIN_ALPHA_2"/>
 
625
                        <db_xref protein_count="104" db="PROSITE" dbkey="PS00242" name="INTEGRIN_ALPHA"/>
 
626
                        <db_xref protein_count="75" db="PFAM" dbkey="PF00357" name="integrin_A"/>
 
627
                        <db_xref protein_count="117" db="PFAM" dbkey="PF01839" name="FG-GAP"/>
 
628
                        <db_xref protein_count="110" db="SMART" dbkey="SM00191" name="Int_alpha"/>
 
629
                </member_list>
 
630
                <external_doc_list>
 
631
                        <db_xref db="BLOCKS" dbkey="IPB000413"/>
 
632
                        <db_xref db="PDOC" dbkey="PDOC00215"/>
 
633
                        <db_xref db="PROPRO" dbkey="integrins_alpha"/>
 
634
                </external_doc_list>
 
635
                <sec_list>
 
636
                        <sec_ac acc="IPR002458"/>
 
637
                        <sec_ac acc="IPR002476"/>
 
638
                </sec_list>
 
639
        </interpro>
 
640
  <deleted_entries>
 
641
    <del_ref id="IPR000001"/>
 
642
    <del_ref id="IPR000005"/>
 
643
    <del_ref id="IPR000019"/>
 
644
    <del_ref id="IPR000027"/>
 
645
    <del_ref id="IPR000078"/>
 
646
  </deleted_entries>
 
647
</interprodb>