create_index.sgml 11.5 KB
Newer Older
1
<!--
2
$Header: /cvsroot/pgsql/doc/src/sgml/ref/create_index.sgml,v 1.13 2000/05/02 20:02:03 thomas Exp $
3 4 5
Postgres documentation
-->

6 7
<refentry id="SQL-CREATEINDEX">
 <refmeta>
8
  <refentrytitle id="sql-createindex-title">
9
   CREATE INDEX
10 11 12 13 14
  </refentrytitle>
  <refmiscinfo>SQL - Language Statements</refmiscinfo>
 </refmeta>
 <refnamediv>
  <refname>
15
   CREATE INDEX
16 17
  </refname>
  <refpurpose>
18
   Constructs a secondary index
19
  </refpurpose>
20
 </refnamediv>
21 22
 <refsynopsisdiv>
  <refsynopsisdivinfo>
23
   <date>1999-07-20</date>
24 25
  </refsynopsisdivinfo>
  <synopsis>
26
CREATE [ UNIQUE ] INDEX <replaceable class="parameter">index_name</replaceable> ON <replaceable class="parameter">table</replaceable>
27
    [ USING <replaceable class="parameter">acc_name</replaceable> ] ( <replaceable class="parameter">column</replaceable> [ <replaceable class="parameter">ops_name</replaceable> ] [, ...] )
28
CREATE [ UNIQUE ] INDEX <replaceable class="parameter">index_name</replaceable> ON <replaceable class="parameter">table</replaceable>
29
    [ USING <replaceable class="parameter">acc_name</replaceable> ] ( <replaceable class="parameter">func_name</replaceable>( <replaceable class="parameter">column</replaceable> [, ... ]) [ <replaceable class="parameter">ops_name</replaceable> ] )
30 31 32 33 34 35 36
  </synopsis>

  <refsect2 id="R2-SQL-CREATEINDEX-1">
   <refsect2info>
    <date>1998-09-09</date>
   </refsect2info>
   <title>
37
    Inputs
38 39 40 41 42 43 44 45 46 47 48
   </title>
   <para>

    <variablelist>
     <varlistentry>
      <term>UNIQUE</term>
      <listitem>
       <para>
	Causes the system to check for
	duplicate values in the table when the index is created (if data
	already exist) and each time data is added. Attempts to
T
Thomas G. Lockhart 已提交
49 50
	insert or update data which would result in duplicate entries
	will generate an error.
51 52 53
       </para>
      </listitem>
     </varlistentry>
54

55 56 57 58 59 60 61 62
     <varlistentry>
      <term><replaceable class="parameter">index_name</replaceable></term>
      <listitem>
       <para>
	The name of the index to be created.
       </para>
      </listitem>
     </varlistentry>
63

64 65 66 67 68 69 70 71
     <varlistentry>
      <term><replaceable class="parameter">table</replaceable></term>
      <listitem>
       <para>
	The name of the table to be indexed.
       </para>
      </listitem>
     </varlistentry>
72

73 74 75 76
     <varlistentry>
      <term><replaceable class="parameter">acc_name</replaceable></term>
      <listitem>
       <para>
77
	The name of the access method to be used for
78
	the index. The default access method is BTREE.
79
	Postgres provides three access methods for indexes:
80

81 82 83 84 85
	<variablelist>
	 <varlistentry>
	  <term>BTREE</term>
	  <listitem>
	   <para>
86
	    an implementation of Lehman-Yao
87 88 89 90
	    high-concurrency btrees.
	   </para>
	  </listitem>
	 </varlistentry>
91

92 93 94 95 96 97 98 99
	 <varlistentry>
	  <term>RTREE</term>
	  <listitem>
	   <para>implements standard rtrees using Guttman's
	    quadratic split algorithm.
	   </para>
	  </listitem>
	 </varlistentry>
100

101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121
	 <varlistentry>
	  <term>HASH</term>
	  <listitem>
	   <para>
	    an implementation of Litwin's linear hashing.
	   </para>
	  </listitem>
	 </varlistentry>
	</variablelist>
       </para>
      </listitem>
     </varlistentry>

     <varlistentry>
      <term><replaceable class="parameter">column</replaceable></term>
      <listitem>
       <para>
	The name of a column of the table.
       </para>
      </listitem>
     </varlistentry>
122

123 124 125 126
     <varlistentry>
      <term><replaceable class="parameter">ops_name</replaceable></term>
      <listitem>
       <para>
127
	An associated operator class. See below for details.
128 129 130
       </para>
      </listitem>
     </varlistentry>
131

132 133 134 135
     <varlistentry>
      <term><replaceable class="parameter">func_name</replaceable></term>
      <listitem>
       <para>
136
	A function, which returns a value that can be indexed.
137 138 139
       </para>
      </listitem>
     </varlistentry>
140 141
    </variablelist>
   </para>
142 143 144 145 146 147 148
  </refsect2>

  <refsect2 id="R2-SQL-CREATEINDEX-2">
   <refsect2info>
    <date>1998-09-09</date>
   </refsect2info>
   <title>
149
    Outputs
150 151
   </title>
   <para>
T
Thomas G. Lockhart 已提交
152

153 154 155 156 157 158 159 160 161 162 163
    <variablelist>
     <varlistentry>
      <term><computeroutput>
CREATE
       </computeroutput></term>
      <listitem>
       <para>
	The message returned if the index is successfully created.
       </para>
      </listitem>
     </varlistentry>
T
Thomas G. Lockhart 已提交
164

165 166 167 168 169 170
     <varlistentry>
      <term><computeroutput>
ERROR: Cannot create index: 'index_name' already exists.
       </computeroutput></term>
      <listitem>
       <para>
171 172 173 174 175 176
	This error occurs if it is impossible to create the index.
       </para>
      </listitem>
     </varlistentry>
    </variablelist>
   </para>
177 178 179 180 181 182 183 184
  </refsect2>
 </refsynopsisdiv>

 <refsect1 id="R1-SQL-CREATEINDEX-1">
  <refsect1info>
   <date>1998-09-09</date>
  </refsect1info>
  <title>
185
   Description
186 187
  </title>
  <para>
188
   <command>CREATE INDEX</command> constructs an index 
189 190
   <replaceable class="parameter">index_name</replaceable>
   on the specified <replaceable class="parameter">table</replaceable>.
191

192 193 194 195 196 197 198
   <tip>
    <para>
     Indexes are primarily used to enhance database performance.
     But inappropriate use will result in slower performance.
    </para>
   </tip>
  </para>
199

200
  <para>
201 202 203 204
   In the first syntax shown above, the key field(s) for the
   index are specified as column names.
   Multiple fields can be specified if the index access method supports
   multi-column indexes.
205
  </para>
206

207
  <para>
208
   In the second syntax shown above, an index is defined
209
   on the result of a user-specified function
210
   <replaceable class="parameter">func_name</replaceable> applied
211 212 213
   to one or more attributes of a single class.
   These <firstterm>functional indices</firstterm>
   can be used to obtain fast access to data
214 215 216 217
   based on operators that would normally require some
   transformation to apply them to the base data.
  </para>

218 219
  <para>
   Postgres provides btree, rtree and hash access methods for
220 221
   indices.  The btree access method is an implementation of
   Lehman-Yao high-concurrency btrees.  The rtree access method
222 223 224 225 226 227 228 229
   implements standard rtrees using Guttman's quadratic split algorithm.
   The hash access method is an implementation of Litwin's linear
   hashing.  We mention the algorithms used solely to indicate that all
   of these access methods are fully dynamic and do not have to be
   optimized periodically (as is the case with, for example, static hash
   access methods).
  </para>

230 231 232 233 234
  <para>
   Use <xref linkend="sql-dropindex-title" endterm="sql-dropindex-title">
   to remove an index.
  </para>

235 236 237 238 239
  <refsect2 id="R2-SQL-CREATEINDEX-3">
   <refsect2info>
    <date>1998-09-09</date>
   </refsect2info>
   <title>
240
    Notes
241
   </title>
242 243

   <para>
244 245 246
    The <productname>Postgres</productname>
    query optimizer will consider using a btree index whenever
    an indexed attribute is involved in a comparison using one of:
247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279

    <simplelist type="inline">
     <member>&lt;</member>
     <member>&lt;=</member>
     <member>=</member>
     <member>&gt;=</member>
     <member>&gt;</member>
    </simplelist>
   </para>

   <para>
    The <productname>Postgres</productname>
    query optimizer will consider using an rtree index whenever
    an indexed attribute is involved in a comparison using one of:

    <simplelist type="inline">
     <member>&lt;&lt;</member>
     <member>&amp;&lt;</member>
     <member>&amp;&gt;</member>
     <member>&gt;&gt;</member>
     <member>@</member>
     <member>~=</member>
     <member>&amp;&amp;</member>
    </simplelist>
   </para>

   <para>
    The <productname>Postgres</productname>
    query optimizer will consider using a hash index whenever
    an indexed attribute is involved in a comparison using
    the <literal>=</literal> operator.
   </para>

280
   <para>
281 282 283
    Currently, only the btree access method supports multi-column
    indexes. Up to 16 keys may be specified by default (this limit
    can be altered when building Postgres).
284
   </para>
285

286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327
  <para>
   An <firstterm>operator class</firstterm> can be specified for each
   column of an index.  The operator class identifies the operators to
   be used by the index for that column.  For example, a btree index on
   four-byte integers would use the <literal>int4_ops</literal> class;
   this operator class includes comparison functions for four-byte
   integers.  In practice the default operator class for the field's
   datatype is usually sufficient.  The main point of having operator classes
   is that for some datatypes, there could be more than one meaningful
   ordering.  For example, we might want to sort a complex-number datatype
   either by absolute value or by real part.  We could do this by defining
   two operator classes for the datatype and then selecting the proper
   class when making an index.  There are also some operator classes with
   special purposes:

   <itemizedlist>
    <listitem>
     <para>
      The operator classes <literal>box_ops</literal> and
      <literal>bigbox_ops</literal> both support rtree indices on the
      <literal>box</literal> datatype.
      The difference between them is that <literal>bigbox_ops</literal>
      scales box coordinates down, to avoid floating point exceptions from
      doing multiplication, addition, and subtraction on very large
      floating-point coordinates.  If the field on which your rectangles lie
      is about 20,000 units square or larger, you should use
      <literal>bigbox_ops</literal>.
     </para>
    </listitem>

    <listitem>
     <para>
      The <literal>int24_ops</literal>
      operator class is useful for constructing indices on int2 data, and
      doing comparisons against int4 data in query qualifications.
      Similarly, <literal>int42_ops</literal>
      support indices on int4 data that is to be compared against int2 data
      in queries.
     </para>
    </listitem>
   </itemizedlist>
  </para>
328 329

   <para>
330
    The following query shows all defined operator classes:
331 332 333 334 335 336 337 338 339 340 341 342 343

    <programlisting>
SELECT am.amname AS acc_name,
       opc.opcname AS ops_name,
       opr.oprname AS ops_comp
    FROM pg_am am, pg_amop amop,
         pg_opclass opc, pg_operator opr
    WHERE amop.amopid = am.oid AND
          amop.amopclaid = opc.oid AND
          amop.amopopr = opr.oid
    ORDER BY acc_name, ops_name, ops_comp
    </programlisting>
   </para>
344
  </refsect2>
345 346
 </refsect1>

347 348
 <refsect1 id="R1-SQL-CREATEINDEX-2">
  <title>
349
   Usage
350 351
  </title>
  <para>To create a btree index on the field <literal>title</literal>
352
   in the table <literal>films</literal>:
353 354
  </para>
  <programlisting>
355 356
CREATE UNIQUE INDEX title_idx
    ON films (title);
357
  </programlisting>
358 359 360 361 362

<!--
<comment>
Is this example correct?
</comment>
363 364 365 366 367 368
  <para>
   To create a rtree index on a point attribute so that we
   can efficiently use box operators on the result of the
   conversion function:
  </para>
  <programlisting>
369 370 371 372
CREATE INDEX pointloc
    ON points USING RTREE (point2box(location) box_ops);
SELECT * FROM points
    WHERE point2box(points.pointloc) = boxes.box;
373
  </programlisting>
374 375
-->

376
 </refsect1>
377
 
378 379
 <refsect1 id="R1-SQL-CREATEINDEX-3">
  <title>
380
   Compatibility
381
  </title>
382
  
383 384 385 386 387
  <refsect2 id="R2-SQL-CREATEINDEX-4">
   <refsect2info>
    <date>1998-09-09</date>
   </refsect2info>
   <title>
388
    SQL92
389 390
   </title>
   <para>
391
    CREATE INDEX is a <productname>Postgres</productname> language extension.
392
   </para>
393
   <para>
394
    There is no <command>CREATE INDEX</command> command in SQL92.
395 396 397
   </para>
  </refsect2>
 </refsect1>
398
</refentry>
399 400 401 402

<!-- Keep this comment at the end of the file
Local variables:
mode: sgml
403
sgml-omittag:nil
404 405 406 407 408 409 410 411 412 413 414 415
sgml-shorttag:t
sgml-minimize-attributes:nil
sgml-always-quote-attributes:t
sgml-indent-step:1
sgml-indent-data:t
sgml-parent-document:nil
sgml-default-dtd-file:"../reference.ced"
sgml-exposed-tags:nil
sgml-local-catalogs:"/usr/lib/sgml/catalog"
sgml-local-ecat-files:nil
End:
-->