improve some of the documentation around target data layout strings.

[oota-llvm.git] / docs / LangRef.html
diff --git a/docs/LangRef.html b/docs/LangRef.html

index dce39c5ac31f4ac300562ce02957c68bb8bf0a12..8e54f3c433a8550d5b24c825a9efcf21bbf3ed2e 100644 (file)
--- a/docs/LangRef.html
+++ b/docs/LangRef.html
@@ -35,7 +35,7 @@
            <li><a href="#linkage_externweak">'<tt>extern_weak</tt>' Linkage</a></li>
            <li><a href="#linkage_linkonce_odr">'<tt>linkonce_odr</tt>' Linkage</a></li>
            <li><a href="#linkage_weak">'<tt>weak_odr</tt>' Linkage</a></li>
-          <li><a href="#linkage_external">'<tt>externally visible</tt>' Linkage</a></li>
+          <li><a href="#linkage_external">'<tt>external</tt>' Linkage</a></li>
            <li><a href="#linkage_dllimport">'<tt>dllimport</tt>' Linkage</a></li>
            <li><a href="#linkage_dllexport">'<tt>dllexport</tt>' Linkage</a></li>
          </ol>
@@ -202,6 +202,7 @@
            <li><a href="#i_select">'<tt>select</tt>' Instruction</a></li>
            <li><a href="#i_call">'<tt>call</tt>'  Instruction</a></li>
            <li><a href="#i_va_arg">'<tt>va_arg</tt>'  Instruction</a></li>
+          <li><a href="#i_landingpad">'<tt>landingpad</tt>' Instruction</a></li>
          </ol>
        </li>
      </ol>
@@ -274,9 +275,10 @@
        </li>
        <li><a href="#int_debugger">Debugger intrinsics</a></li>
        <li><a href="#int_eh">Exception Handling intrinsics</a></li>
-      <li><a href="#int_trampoline">Trampoline Intrinsic</a>
+      <li><a href="#int_trampoline">Trampoline Intrinsics</a>
          <ol>
            <li><a href="#int_it">'<tt>llvm.init.trampoline</tt>' Intrinsic</a></li>
+          <li><a href="#int_at">'<tt>llvm.adjust.trampoline</tt>' Intrinsic</a></li>
          </ol>
        </li>
        <li><a href="#int_atomics">Atomic intrinsics</a>
@@ -645,7 +647,7 @@ define i32 @main() {   <i>; i32()* </i>&nbsp;
        be merged with equivalent globals.  These linkage types are otherwise the
        same as their non-<tt>odr</tt> versions.</dd>
  
-  <dt><tt><b><a name="linkage_external">externally visible</a></b></tt>:</dt>
+  <dt><tt><b><a name="linkage_external">external</a></b></tt>:</dt>
    <dd>If none of the above identifiers are used, the global is externally
        visible, meaning that it participates in linkage and can be used to
        resolve external symbol references.</dd>
@@ -678,8 +680,8 @@ define i32 @main() {   <i>; i32()* </i>&nbsp;
     declarations), they are accessible outside of the current module.</p>
  
  <p>It is illegal for a function <i>declaration</i> to have any linkage type
-   other than "externally visible", <tt>dllimport</tt>
-   or <tt>extern_weak</tt>.</p>
+   other than <tt>external</tt>, <tt>dllimport</tt>
+  or <tt>extern_weak</tt>.</p>
  
  <p>Aliases can have only <tt>external</tt>, <tt>internal</tt>, <tt>weak</tt>
     or <tt>weak_odr</tt> linkages.</p>
@@ -1161,14 +1163,6 @@ define void @f() optsize { ... }
        function into callers whenever possible, ignoring any active inlining size
        threshold for this caller.</dd>
  
-  <dt><tt><b>hotpatch</b></tt></dt>
-  <dd>This attribute indicates that the function should be 'hotpatchable',
-      meaning the function can be patched and/or hooked even while it is
-      loaded into memory. On x86, the function prologue will be preceded
-      by six bytes of padding and will begin with a two-byte instruction.
-      Most of the functions in the Windows system DLLs in Windows XP SP2 or
-      higher were compiled in this fashion.</dd>
-
    <dt><tt><b>nonlazybind</b></tt></dt>
    <dd>This attribute suppresses lazy symbol binding for the function. This
        may make calls to the function faster, at the cost of extra program
@@ -1260,6 +1254,11 @@ define void @f() optsize { ... }
        the ELF x86-64 abi, but it can be disabled for some compilation
        units.</dd>
  
+  <dt><tt><b><a name="returns_twice">returns_twice</a></b></tt></dt>
+  <dd>This attribute indicates that this function can return
+  twice. The C <code>setjmp</code> is an example of such a function.
+  The compiler disables some optimizations (like tail calls) in the caller of
+  these functions.</dd>
  </dl>
  
  </div>
@@ -1320,6 +1319,13 @@ target datalayout = "<i>layout specification</i>"
        the bits with the least significance have the lowest address
        location.</dd>
  
+  <dt><tt>S<i>size</i></tt></dt>
+  <dd>Specifies the natural alignment of the stack in bits. Alignment promotion
+      of stack variables is limited to the natural stack alignment to avoid
+      dynamic stack realignment. The stack alignment must be a multiple of
+      8-bits. If omitted, the natural stack alignment defaults to "unspecified",
+      which does not prevent any alignment promotions.</dd>
+
    <dt><tt>p:<i>size</i>:<i>abi</i>:<i>pref</i></tt></dt>
    <dd>This specifies the <i>size</i> of a pointer and its <i>abi</i> and
        <i>preferred</i> alignments. All sizes are in bits. Specifying
@@ -1400,6 +1406,22 @@ target datalayout = "<i>layout specification</i>"
        implemented in terms of 64 &lt;2 x double&gt;, for example.</li>
  </ol>
  
+<p>The function of the data layout string may not be what you expect.  Notably,
+   this is not a specification from the frontend of what alignment the code
+   generator should use.</p>
+
+<p>Instead, if specified, the target data layout is required to match what the 
+   ultimate <em>code generator</em> expects.  This string is used by the 
+   mid-level optimizers to
+   improve code, and this only works if it matches what the ultimate code 
+   generator uses.  If you would like to generate IR that does not embed this
+   target-specific detail into the IR, then you don't have to specify the 
+   string.  This will disable some optimizations that require precise layout
+   information, but this also prevents those optimizations from introducing
+   target specificity into the IR.</p>
+
+
+
  </div>
  
  <!-- ======================================================================= -->
@@ -1496,6 +1518,9 @@ or to register signal handlers. Nonetheless, there are platform-specific
  ways to create them, and we define LLVM IR's behavior in their presence. This
  model is inspired by the C++0x memory model.</p>
  
+<p>For a more informal introduction to this model, see the
+<a href="Atomics.html">LLVM Atomic Instructions and Concurrency Guide</a>.
+
  <p>We define a <i>happens-before</i> partial order as the least partial order
  that</p>
  <ul>
@@ -1532,7 +1557,12 @@ any write to the same byte, except:</p>
  
  <p>Given that definition, <var>R<sub>byte</sub></var> is defined as follows:
  <ul>
-  <li>If there is no write to the same byte that happens before
+  <li>If <var>R</var> is volatile, the result is target-dependent. (Volatile
+      is supposed to give guarantees which can support
+      <code>sig_atomic_t</code> in C/C++, and may be used for accesses to
+      addresses which do not behave like normal memory.  It does not generally
+      provide cross-thread synchronization.)
+  <li>Otherwise, if there is no write to the same byte that happens before
      <var>R<sub>byte</sub></var>, <var>R<sub>byte</sub></var> returns 
      <tt>undef</tt> for that byte.
    <li>Otherwise, if <var>R<sub>byte</sub></var> may see exactly one write,
@@ -1575,27 +1605,30 @@ as if it writes to the relevant surrounding bytes.
  </div>
  
  <!-- ======================================================================= -->
-<div class="doc_subsection">
+<h3>
        <a name="ordering">Atomic Memory Ordering Constraints</a>
-</div>
+</h3>
  
-<div class="doc_text">
+<div>
  
  <p>Atomic instructions (<a href="#i_cmpxchg"><code>cmpxchg</code></a>,
-<a href="#i_atomicrmw"><code>atomicrmw</code></a>, and
-<a href="#i_fence"><code>fence</code></a>) take an ordering parameter
+<a href="#i_atomicrmw"><code>atomicrmw</code></a>,
+<a href="#i_fence"><code>fence</code></a>,
+<a href="#i_load"><code>atomic load</code></a>, and
+<a href="#i_store"><code>atomic store</code></a>) take an ordering parameter
  that determines which other atomic instructions on the same address they
  <i>synchronize with</i>.  These semantics are borrowed from Java and C++0x,
  but are somewhat more colloquial. If these descriptions aren't precise enough,
-check those specs.  <a href="#i_fence"><code>fence</code></a> instructions
+check those specs (see spec references in the
+<a href="Atomic.html#introduction">atomics guide</a>).
+<a href="#i_fence"><code>fence</code></a> instructions
  treat these orderings somewhat differently since they don't take an address.
  See that instruction's documentation for details.</p>
  
-<!-- FIXME Note atomic load+store here once those get added. -->
+<p>For a simpler introduction to the ordering constraints, see the
+<a href="Atomics.html">LLVM Atomic Instructions and Concurrency Guide</a>.</p>
  
  <dl>
-<!-- FIXME: unordered is intended to be used for atomic load and store;
-it isn't allowed for any instruction yet. -->
  <dt><code>unordered</code></dt>
  <dd>The set of values that can be read is governed by the happens-before
  partial order. A value cannot be read unless some operation wrote it.
@@ -1619,18 +1652,21 @@ address's modification order. This disallows reordering of
  <code>monotonic</code> (or stronger) operations on the same address. If an
  address is written <code>monotonic</code>ally by one thread, and other threads
  <code>monotonic</code>ally read that address repeatedly, the other threads must
-eventually see the write. This is intended to model C++'s relaxed atomic
-variables.</dd>
+eventually see the write. This corresponds to the C++0x/C1x
+<code>memory_order_relaxed</code>.</dd>
  <dt><code>acquire</code></dt>
-<dd>In addition to the guarantees of <code>monotonic</code>, if this operation
-reads a value written by a <code>release</code> atomic operation, it
-<i>synchronizes-with</i> that operation.</dd>
-<dt><code>release</code></dt>
  <dd>In addition to the guarantees of <code>monotonic</code>,
-a <i>synchronizes-with</i> edge may be formed by an <code>acquire</code>
-operation.</dd>
+a <i>synchronizes-with</i> edge may be formed with a <code>release</code>
+operation. This is intended to model C++'s <code>memory_order_acquire</code>.</dd>
+<dt><code>release</code></dt>
+<dd>In addition to the guarantees of <code>monotonic</code>, if this operation
+writes a value which is subsequently read by an <code>acquire</code> operation,
+it <i>synchronizes-with</i> that operation.  (This isn't a complete
+description; see the C++0x definition of a release sequence.) This corresponds
+to the C++0x/C1x <code>memory_order_release</code>.</dd>
  <dt><code>acq_rel</code> (acquire+release)</dt><dd>Acts as both an
-<code>acquire</code> and <code>release</code> operation on its address.</dd>
+<code>acquire</code> and <code>release</code> operation on its address.
+This corresponds to the C++0x/C1x <code>memory_order_acq_rel</code>.</dd>
  <dt><code>seq_cst</code> (sequentially consistent)</dt><dd>
  <dd>In addition to the guarantees of <code>acq_rel</code>
  (<code>acquire</code> for an operation which only reads, <code>release</code>
@@ -1638,9 +1674,8 @@ for an operation which only writes), there is a global total order on all
  sequentially-consistent operations on all addresses, which is consistent with
  the <i>happens-before</i> partial order and with the modification orders of
  all the affected addresses. Each sequentially-consistent read sees the last
-preceding write to the same address in this global order. This is intended
-to model C++'s sequentially-consistent atomic variables and Java's volatile
-shared variables.</dd>
+preceding write to the same address in this global order. This corresponds
+to the C++0x/C1x <code>memory_order_seq_cst</code> and Java volatile.</dd>
  </dl>
  
  <p id="singlethread">If an atomic operation is marked <code>singlethread</code>,
@@ -2032,20 +2067,22 @@ in signal handlers).</p>
    
  <p>Structures may optionally be "packed" structures, which indicate that the 
    alignment of the struct is one byte, and that there is no padding between
-  the elements.  In non-packed structs, padding between field types is defined
-  by the target data string to match the underlying processor.</p>
-
-<p>Structures can either be "anonymous" or "named".  An anonymous structure is
-  defined inline with other types (e.g. <tt>{i32, i32}*</tt>) and a named types
-  are always defined at the top level with a name.  Anonmyous types are uniqued
-  by their contents and can never be recursive since there is no way to write
-  one.  Named types can be recursive.
+  the elements.  In non-packed structs, padding between field types is inserted
+  as defined by the TargetData string in the module, which is required to match
+  what the underlying processor expects.</p>
+
+<p>Structures can either be "literal" or "identified".  A literal structure is
+  defined inline with other types (e.g. <tt>{i32, i32}*</tt>) whereas identified
+  types are always defined at the top level with a name.  Literal types are
+  uniqued by their contents and can never be recursive or opaque since there is
+  no way to write one.  Identified types can be recursive, can be opaqued, and are
+  never uniqued.
  </p>
    
  <h5>Syntax:</h5>
  <pre>
-  %T1 = type { &lt;type list&gt; }     <i>; Named normal struct type</i>
-  %T2 = type &lt;{ &lt;type list&gt; }&gt;   <i>; Named packed struct type</i>
+  %T1 = type { &lt;type list&gt; }     <i>; Identified normal struct type</i>
+  %T2 = type &lt;{ &lt;type list&gt; }&gt;   <i>; Identified packed struct type</i>
  </pre>
    
  <h5>Examples:</h5>
@@ -3256,6 +3293,17 @@ IfUnequal:
     instruction, control is interrupted and continued at the dynamically nearest
     "exception" label.</p>
  
+<p>The '<tt>exception</tt>' label is a
+   <i><a href="ExceptionHandling.html#overview">landing pad</a></i> for the
+   exception. As such, '<tt>exception</tt>' label is required to have the
+   "<a href="#i_landingpad"><tt>landingpad</tt></a>" instruction, which contains
+   the information about about the behavior of the program after unwinding
+   happens, as its first non-PHI instruction. The restrictions on the
+   "<tt>landingpad</tt>" instruction's tightly couples it to the
+   "<tt>invoke</tt>" instruction, so that the important information contained
+   within the "<tt>landingpad</tt>" instruction can't be lost through normal
+   code motion.</p>
+
  <h5>Arguments:</h5>
  <p>This instruction requires several arguments:</p>
  
@@ -3372,17 +3420,18 @@ that the invoke/unwind semantics are likely to change in future versions.</p>
     successors.</p>
  
  <h5>Arguments:</h5>
-<p>The '<tt>resume</tt>' instruction's argument must have the same type as the
-   result of any '<tt>landingpad</tt>' instruction in the same function.</p>
+<p>The '<tt>resume</tt>' instruction requires one argument, which must have the
+   same type as the result of any '<tt>landingpad</tt>' instruction in the same
+   function.</p>
  
  <h5>Semantics:</h5>
  <p>The '<tt>resume</tt>' instruction resumes propagation of an existing
     (in-flight) exception whose unwinding was interrupted with
-   a landingpad instruction.</p>
+   a <a href="#i_landingpad"><tt>landingpad</tt></a> instruction.</p>
  
  <h5>Example:</h5>
  <pre>
- resume { i8*, i32 } %exn
+  resume { i8*, i32 } %exn
  </pre>
  
  </div>
@@ -4559,8 +4608,8 @@ that the invoke/unwind semantics are likely to change in future versions.</p>
  
  <h5>Syntax:</h5>
  <pre>
-  &lt;result&gt; = load &lt;ty&gt;* &lt;pointer&gt;[, align &lt;alignment&gt;][, !nontemporal !&lt;index&gt;]
-  &lt;result&gt; = volatile load &lt;ty&gt;* &lt;pointer&gt;[, align &lt;alignment&gt;][, !nontemporal !&lt;index&gt;]
+  &lt;result&gt; = load [volatile] &lt;ty&gt;* &lt;pointer&gt;[, align &lt;alignment&gt;][, !nontemporal !&lt;index&gt;]
+  &lt;result&gt; = load atomic [volatile] &lt;ty&gt;* &lt;pointer&gt; [singlethread] &lt;ordering&gt;, align &lt;alignment&gt;
    !&lt;index&gt; = !{ i32 1 }
  </pre>
  
@@ -4575,6 +4624,19 @@ that the invoke/unwind semantics are likely to change in future versions.</p>
     number or order of execution of this <tt>load</tt> with other <a
     href="#volatile">volatile operations</a>.</p>
  
+<p>If the <code>load</code> is marked as <code>atomic</code>, it takes an extra
+   <a href="#ordering">ordering</a> and optional <code>singlethread</code>
+   argument.  The <code>release</code> and <code>acq_rel</code> orderings are
+   not valid on <code>load</code> instructions.  Atomic loads produce <a
+   href="#memorymodel">defined</a> results when they may see multiple atomic
+   stores.  The type of the pointee must be an integer type whose bit width
+   is a power of two greater than or equal to eight and less than or equal
+   to a target-specific size limit. <code>align</code> must be explicitly 
+   specified on atomic loads, and the load has undefined behavior if the
+   alignment is not set to a value which is at least the size in bytes of
+   the pointee. <code>!nontemporal</code> does not have any defined semantics
+   for atomic loads.</p>
+
  <p>The optional constant <tt>align</tt> argument specifies the alignment of the
     operation (that is, the alignment of the memory address). A value of 0 or an
     omitted <tt>align</tt> argument means that the operation has the preferential
@@ -4618,8 +4680,8 @@ that the invoke/unwind semantics are likely to change in future versions.</p>
  
  <h5>Syntax:</h5>
  <pre>
-  store &lt;ty&gt; &lt;value&gt;, &lt;ty&gt;* &lt;pointer&gt;[, align &lt;alignment&gt;][, !nontemporal !&lt;index&gt;]                   <i>; yields {void}</i>
-  volatile store &lt;ty&gt; &lt;value&gt;, &lt;ty&gt;* &lt;pointer&gt;[, align &lt;alignment&gt;][, !nontemporal !&lt;index&gt;]          <i>; yields {void}</i>
+  store [volatile] &lt;ty&gt; &lt;value&gt;, &lt;ty&gt;* &lt;pointer&gt;[, align &lt;alignment&gt;][, !nontemporal !&lt;index&gt;]                   <i>; yields {void}</i>
+  store atomic [volatile] &lt;ty&gt; &lt;value&gt;, &lt;ty&gt;* &lt;pointer&gt; [singlethread] &lt;ordering&gt;, align &lt;alignment&gt;             <i>; yields {void}</i>
  </pre>
  
  <h5>Overview:</h5>
@@ -4635,6 +4697,19 @@ that the invoke/unwind semantics are likely to change in future versions.</p>
     order of execution of this <tt>store</tt> with other <a
     href="#volatile">volatile operations</a>.</p>
  
+<p>If the <code>store</code> is marked as <code>atomic</code>, it takes an extra
+   <a href="#ordering">ordering</a> and optional <code>singlethread</code>
+   argument.  The <code>acquire</code> and <code>acq_rel</code> orderings aren't
+   valid on <code>store</code> instructions.  Atomic loads produce <a
+   href="#memorymodel">defined</a> results when they may see multiple atomic
+   stores. The type of the pointee must be an integer type whose bit width
+   is a power of two greater than or equal to eight and less than or equal
+   to a target-specific size limit. <code>align</code> must be explicitly 
+   specified on atomic stores, and the store has undefined behavior if the
+   alignment is not set to a value which is at least the size in bytes of
+   the pointee. <code>!nontemporal</code> does not have any defined semantics
+   for atomic stores.</p>
+
  <p>The optional constant "align" argument specifies the alignment of the
     operation (that is, the alignment of the memory address). A value of 0 or an
     omitted "align" argument means that the operation has the preferential
@@ -4672,10 +4747,11 @@ that the invoke/unwind semantics are likely to change in future versions.</p>
  </div>
  
  <!-- _______________________________________________________________________ -->
-<div class="doc_subsubsection"> <a name="i_fence">'<tt>fence</tt>'
-Instruction</a> </div>
+<h4>
+<a name="i_fence">'<tt>fence</tt>' Instruction</a>
+</h4>
  
-<div class="doc_text">
+<div>
  
  <h5>Syntax:</h5>
  <pre>
@@ -4717,9 +4793,6 @@ operations and/or fences.</p>
  specifies that the fence only synchronizes with other fences in the same
  thread.  (This is useful for interacting with signal handlers.)</p>
  
-<p>FIXME: This instruction is a work in progress; until it is finished, use
-   llvm.memory.barrier.
-
  <h5>Example:</h5>
  <pre>
    fence acquire                          <i>; yields {void}</i>
@@ -4729,14 +4802,15 @@ thread.  (This is useful for interacting with signal handlers.)</p>
  </div>
  
  <!-- _______________________________________________________________________ -->
-<div class="doc_subsubsection"> <a name="i_cmpxchg">'<tt>cmpxchg</tt>'
-Instruction</a> </div>
+<h4>
+<a name="i_cmpxchg">'<tt>cmpxchg</tt>' Instruction</a>
+</h4>
  
-<div class="doc_text">
+<div>
  
  <h5>Syntax:</h5>
  <pre>
-  [volatile] cmpxchg &lt;ty&gt;* &lt;pointer&gt;, &lt;ty&gt; &lt;cmp&gt;, &lt;ty&gt; &lt;new&gt; [singlethread] &lt;ordering&gt;                   <i>; yields {ty}</i>
+  cmpxchg [volatile] &lt;ty&gt;* &lt;pointer&gt;, &lt;ty&gt; &lt;cmp&gt;, &lt;ty&gt; &lt;new&gt; [singlethread] &lt;ordering&gt;                   <i>; yields {ty}</i>
  </pre>
  
  <h5>Overview:</h5>
@@ -4811,14 +4885,15 @@ done:
  </div>
  
  <!-- _______________________________________________________________________ -->
-<div class="doc_subsubsection"> <a name="i_atomicrmw">'<tt>atomicrmw</tt>'
-Instruction</a> </div>
+<h4>
+<a name="i_atomicrmw">'<tt>atomicrmw</tt>' Instruction</a>
+</h4>
  
-<div class="doc_text">
+<div>
  
  <h5>Syntax:</h5>
  <pre>
-  [volatile] atomicrmw &lt;operation&gt; &lt;ty&gt;* &lt;pointer&gt;, &lt;ty&gt; &lt;value&gt; [singlethread] &lt;ordering&gt;                   <i>; yields {ty}</i>
+  atomicrmw [volatile] &lt;operation&gt; &lt;ty&gt;* &lt;pointer&gt;, &lt;ty&gt; &lt;value&gt; [singlethread] &lt;ordering&gt;                   <i>; yields {ty}</i>
  </pre>
  
  <h5>Overview:</h5>
@@ -4915,7 +4990,7 @@ specified by the <var>operation</var> argument:</p>
     When indexing into a (optionally packed) structure, only <tt>i32</tt>
     integer <b>constants</b> are allowed.  When indexing into an array, pointer
     or vector, integers of any width are allowed, and they are not required to be
-   constant.</p>
+   constant.  These integers are treated as signed values where relevant.</p>
  
  <p>For example, let's consider a C code fragment and how it gets compiled to
     LLVM:</p>
@@ -4981,18 +5056,20 @@ entry:
     base pointer is not an <i>in bounds</i> address of an allocated object,
     or if any of the addresses that would be formed by successive addition of
     the offsets implied by the indices to the base address with infinitely
-   precise arithmetic are not an <i>in bounds</i> address of that allocated
-   object. The <i>in bounds</i> addresses for an allocated object are all
-   the addresses that point into the object, plus the address one byte past
-   the end.</p>
+   precise signed arithmetic are not an <i>in bounds</i> address of that
+   allocated object. The <i>in bounds</i> addresses for an allocated object
+   are all the addresses that point into the object, plus the address one
+   byte past the end.</p>
  
  <p>If the <tt>inbounds</tt> keyword is not present, the offsets are added to
-   the base address with silently-wrapping two's complement arithmetic, and
-   the result value of the <tt>getelementptr</tt> may be outside the object
-   pointed to by the base pointer. The result value may not necessarily be
-   used to access memory though, even if it happens to point into allocated
-   storage. See the <a href="#pointeraliasing">Pointer Aliasing Rules</a>
-   section for more information.</p>
+   the base address with silently-wrapping two's complement arithmetic. If the
+   offsets have a different width from the pointer, they are sign-extended or
+   truncated to the width of the pointer. The result value of the
+   <tt>getelementptr</tt> may be outside the object pointed to by the base
+   pointer. The result value may not necessarily be used to access memory
+   though, even if it happens to point into allocated storage. See the
+   <a href="#pointeraliasing">Pointer Aliasing Rules</a> section for more
+   information.</p>
  
  <p>The getelementptr instruction is often confusing.  For some more insight into
     how it works, see <a href="GetElementPtr.html">the getelementptr FAQ</a>.</p>
@@ -5970,6 +6047,87 @@ freestanding environments and non-C-based languages.</p>
  
  </div>
  
+<!-- _______________________________________________________________________ -->
+<h4>
+  <a name="i_landingpad">'<tt>landingpad</tt>' Instruction</a>
+</h4>
+
+<div>
+
+<h5>Syntax:</h5>
+<pre>
+  &lt;resultval&gt; = landingpad &lt;somety&gt; personality &lt;type&gt; &lt;pers_fn&gt; &lt;clause&gt;+
+  &lt;resultval&gt; = landingpad &lt;somety&gt; personality &lt;type&gt; &lt;pers_fn&gt; cleanup &lt;clause&gt;*
+
+  &lt;clause&gt; := catch &lt;type&gt; &lt;value&gt;
+  &lt;clause&gt; := filter &lt;array constant type&gt; &lt;array constant&gt;
+</pre>
+
+<h5>Overview:</h5>
+<p>The '<tt>landingpad</tt>' instruction is used by
+   <a href="ExceptionHandling.html#overview">LLVM's exception handling
+   system</a> to specify that a basic block is a landing pad &mdash; one where
+   the exception lands, and corresponds to the code found in the
+   <i><tt>catch</tt></i> portion of a <i><tt>try/catch</tt></i> sequence. It
+   defines values supplied by the personality function (<tt>pers_fn</tt>) upon
+   re-entry to the function. The <tt>resultval</tt> has the
+   type <tt>somety</tt>.</p>
+
+<h5>Arguments:</h5>
+<p>This instruction takes a <tt>pers_fn</tt> value. This is the personality
+   function associated with the unwinding mechanism. The optional
+   <tt>cleanup</tt> flag indicates that the landing pad block is a cleanup.</p>
+
+<p>A <tt>clause</tt> begins with the clause type &mdash; <tt>catch</tt>
+   or <tt>filter</tt> &mdash; and contains the global variable representing the
+   "type" that may be caught or filtered respectively. Unlike the
+   <tt>catch</tt> clause, the <tt>filter</tt> clause takes an array constant as
+   its argument. Use "<tt>[0 x i8**] undef</tt>" for a filter which cannot
+   throw. The '<tt>landingpad</tt>' instruction must contain <em>at least</em>
+   one <tt>clause</tt> or the <tt>cleanup</tt> flag.</p>
+
+<h5>Semantics:</h5>
+<p>The '<tt>landingpad</tt>' instruction defines the values which are set by the
+   personality function (<tt>pers_fn</tt>) upon re-entry to the function, and
+   therefore the "result type" of the <tt>landingpad</tt> instruction. As with
+   calling conventions, how the personality function results are represented in
+   LLVM IR is target specific.</p>
+
+<p>The clauses are applied in order from top to bottom. If two
+   <tt>landingpad</tt> instructions are merged together through inlining, the
+   clauses from the calling function are appended to the list of clauses.</p>
+
+<p>The <tt>landingpad</tt> instruction has several restrictions:</p>
+
+<ul>
+  <li>A landing pad block is a basic block which is the unwind destination of an
+      '<tt>invoke</tt>' instruction.</li>
+  <li>A landing pad block must have a '<tt>landingpad</tt>' instruction as its
+      first non-PHI instruction.</li>
+  <li>There can be only one '<tt>landingpad</tt>' instruction within the landing
+      pad block.</li>
+  <li>A basic block that is not a landing pad block may not include a
+      '<tt>landingpad</tt>' instruction.</li>
+  <li>All '<tt>landingpad</tt>' instructions in a function must have the same
+      personality function.</li>
+</ul>
+
+<h5>Example:</h5>
+<pre>
+  ;; A landing pad which can catch an integer.
+  %res = landingpad { i8*, i32 } personality i32 (...)* @__gxx_personality_v0
+           catch i8** @_ZTIi
+  ;; A landing pad that is a cleanup.
+  %res = landingpad { i8*, i32 } personality i32 (...)* @__gxx_personality_v0
+           cleanup
+  ;; A landing pad which can catch an integer and can only throw a double.
+  %res = landingpad { i8*, i32 } personality i32 (...)* @__gxx_personality_v0
+           catch i8** @_ZTIi
+           filter [1 x i8**] [@_ZTId]
+</pre>
+
+</div>
+
  </div>
  
  </div>
@@ -7543,12 +7701,12 @@ LLVM</a>.</p>
  
  <!-- ======================================================================= -->
  <h3>
-  <a name="int_trampoline">Trampoline Intrinsic</a>
+  <a name="int_trampoline">Trampoline Intrinsics</a>
  </h3>
  
  <div>
  
-<p>This intrinsic makes it possible to excise one parameter, marked with
+<p>These intrinsics make it possible to excise one parameter, marked with
     the <a href="#nest"><tt>nest</tt></a> attribute, from a function.
     The result is a callable
     function pointer lacking the nest parameter - the caller does not need to
@@ -7565,7 +7723,8 @@ LLVM</a>.</p>
  <pre class="doc_code">
    %tramp = alloca [10 x i8], align 4 ; size and alignment only correct for X86
    %tramp1 = getelementptr [10 x i8]* %tramp, i32 0, i32 0
-  %p = call i8* @llvm.init.trampoline(i8* %tramp1, i8* bitcast (i32 (i8* nest , i32, i32)* @f to i8*), i8* %nval)
+  call i8* @llvm.init.trampoline(i8* %tramp1, i8* bitcast (i32 (i8*, i32, i32)* @f to i8*), i8* %nval)
+  %p = call i8* @llvm.adjust.trampoline(i8* %tramp1)
    %fp = bitcast i8* %p to i32 (i32, i32)*
  </pre>
  
@@ -7583,12 +7742,12 @@ LLVM</a>.</p>
  
  <h5>Syntax:</h5>
  <pre>
-  declare i8* @llvm.init.trampoline(i8* &lt;tramp&gt;, i8* &lt;func&gt;, i8* &lt;nval&gt;)
+  declare void @llvm.init.trampoline(i8* &lt;tramp&gt;, i8* &lt;func&gt;, i8* &lt;nval&gt;)
  </pre>
  
  <h5>Overview:</h5>
-<p>This fills the memory pointed to by <tt>tramp</tt> with code and returns a
-   function pointer suitable for executing it.</p>
+<p>This fills the memory pointed to by <tt>tramp</tt> with executable code,
+   turning it into a trampoline.</p>
  
  <h5>Arguments:</h5>
  <p>The <tt>llvm.init.trampoline</tt> intrinsic takes three arguments, all
@@ -7602,17 +7761,50 @@ LLVM</a>.</p>
  
  <h5>Semantics:</h5>
  <p>The block of memory pointed to by <tt>tramp</tt> is filled with target
-   dependent code, turning it into a function.  A pointer to this function is
-   returned, but needs to be bitcast to an <a href="#int_trampoline">appropriate
-   function pointer type</a> before being called.  The new function's signature
-   is the same as that of <tt>func</tt> with any arguments marked with
-   the <tt>nest</tt> attribute removed.  At most one such <tt>nest</tt> argument
-   is allowed, and it must be of pointer type.  Calling the new function is
-   equivalent to calling <tt>func</tt> with the same argument list, but
-   with <tt>nval</tt> used for the missing <tt>nest</tt> argument.  If, after
-   calling <tt>llvm.init.trampoline</tt>, the memory pointed to
-   by <tt>tramp</tt> is modified, then the effect of any later call to the
-   returned function pointer is undefined.</p>
+   dependent code, turning it into a function.  Then <tt>tramp</tt> needs to be
+   passed to <a href="#int_at">llvm.adjust.trampoline</a> to get a pointer
+   which can be <a href="#int_trampoline">bitcast (to a new function) and
+   called</a>.  The new function's signature is the same as that of
+   <tt>func</tt> with any arguments marked with the <tt>nest</tt> attribute
+   removed.  At most one such <tt>nest</tt> argument is allowed, and it must be of
+   pointer type.  Calling the new function is equivalent to calling <tt>func</tt>
+   with the same argument list, but with <tt>nval</tt> used for the missing
+   <tt>nest</tt> argument.  If, after calling <tt>llvm.init.trampoline</tt>, the
+   memory pointed to by <tt>tramp</tt> is modified, then the effect of any later call
+   to the returned function pointer is undefined.</p>
+</div>
+
+<!-- _______________________________________________________________________ -->
+<h4>
+  <a name="int_at">
+    '<tt>llvm.adjust.trampoline</tt>' Intrinsic
+  </a>
+</h4>
+
+<div>
+
+<h5>Syntax:</h5>
+<pre>
+  declare i8* @llvm.adjust.trampoline(i8* &lt;tramp&gt;)
+</pre>
+
+<h5>Overview:</h5>
+<p>This performs any required machine-specific adjustment to the address of a
+   trampoline (passed as <tt>tramp</tt>).</p>
+
+<h5>Arguments:</h5>
+<p><tt>tramp</tt> must point to a block of memory which already has trampoline code
+   filled in by a previous call to <a href="#int_it"><tt>llvm.init.trampoline</tt>
+   </a>.</p>
+
+<h5>Semantics:</h5>
+<p>On some architectures the address of the code to be executed needs to be
+   different to the address where the trampoline is actually stored.  This
+   intrinsic returns the executable address corresponding to <tt>tramp</tt>
+   after performing the required machine specific adjustments.
+   The pointer returned can then be <a href="#int_trampoline"> bitcast and
+   executed</a>.
+</p>
  
  </div>
  
@@ -8274,7 +8466,7 @@ LLVM</a>.</p>
  <h5>Semantics:</h5>
  <p>This intrinsic allows annotation of local variables with arbitrary strings.
     This can be useful for special purpose optimizations that want to look for
-   these annotations.  These have no other defined use, they are ignored by code
+   these annotations.  These have no other defined use; they are ignored by code
     generation and optimization.</p>
  
  </div>
@@ -8310,7 +8502,7 @@ LLVM</a>.</p>
  <h5>Semantics:</h5>
  <p>This intrinsic allows annotations to be put on arbitrary expressions with
     arbitrary strings.  This can be useful for special purpose optimizations that
-   want to look for these annotations.  These have no other defined use, they
+   want to look for these annotations.  These have no other defined use; they
     are ignored by code generation and optimization.</p>
  
  </div>