Whamcloud - gitweb
53399f66aa7dff993b4aa171c39e4f0f9463639e
[doc/manual.git] / ConfiguringFailover.xml
1 <?xml version="1.0" encoding="UTF-8"?>
2 <article version="5.0" xml:lang="en-US" xmlns="http://docbook.org/ns/docbook" xmlns:xl="http://www.w3.org/1999/xlink">
3   <info>
4     <title>Configuring Lustre Failover</title>
5   </info>
6   <informaltable frame="none">
7     <tgroup cols="2">
8       <colspec colname="c1" colwidth="50*"/>
9       <colspec colname="c2" colwidth="50*"/>
10       
11       
12       <tbody>
13         <row>
14           <entry align="left"><para>Lustre 2.0 Operations Manual</para></entry>
15           <entry align="right" valign="top"><para><link xl:href="index.html"><inlinemediaobject><imageobject role="html">
16                     <imagedata contentdepth="26" contentwidth="30" fileref="./shared/toc01.gif" scalefit="1"/>
17                   </imageobject>
18 <imageobject role="fo">
19                     <imagedata contentdepth="100%" contentwidth="" depth="" fileref="./shared/toc01.gif" scalefit="1" width="100%"/>
20                   </imageobject>
21 </inlinemediaobject></link><link xl:href="ConfiguringLustre.html"><inlinemediaobject><imageobject role="html">
22                     <imagedata contentdepth="26" contentwidth="30" fileref="./shared/prev01.gif" scalefit="1"/>
23                   </imageobject>
24 <imageobject role="fo">
25                     <imagedata contentdepth="100%" contentwidth="" depth="" fileref="./shared/prev01.gif" scalefit="1" width="100%"/>
26                   </imageobject>
27 </inlinemediaobject></link><link xl:href="III_LustreAdministration.html"><inlinemediaobject><imageobject role="html">
28                     <imagedata contentdepth="26" contentwidth="30" fileref="./shared/next01.gif" scalefit="1"/>
29                   </imageobject>
30 <imageobject role="fo">
31                     <imagedata contentdepth="100%" contentwidth="" depth="" fileref="./shared/next01.gif" scalefit="1" width="100%"/>
32                   </imageobject>
33 </inlinemediaobject></link><link xl:href="ix.html"><inlinemediaobject><imageobject role="html">
34                     <imagedata contentdepth="26" contentwidth="30" fileref="./shared/index01.gif" scalefit="1"/>
35                   </imageobject>
36 <imageobject role="fo">
37                     <imagedata contentdepth="100%" contentwidth="" depth="" fileref="./shared/index01.gif" scalefit="1" width="100%"/>
38                   </imageobject>
39 </inlinemediaobject></link></para></entry>
40         </row>
41       </tbody>
42     </tgroup>
43   </informaltable>
44   <para><link xl:href=""/></para>
45   <informaltable frame="none">
46     <tgroup cols="1">
47       <colspec colname="c1" colwidth="100*"/>
48       
49       <tbody>
50         <row>
51           <entry align="right"><para><anchor xml:id="dbdoclet.50438188_pgfId-874" xreflabel=""/>C H A P T E R  11<anchor xml:id="dbdoclet.50438188_30183" xreflabel=""/></para></entry>
52         </row>
53       </tbody>
54     </tgroup>
55   </informaltable>
56   <informaltable frame="none">
57     <tgroup cols="1">
58       <colspec colname="c1" colwidth="100*"/>
59       
60       <tbody>
61         <row>
62           <entry align="right"><para><anchor xml:id="dbdoclet.50438188_pgfId-1292188" xreflabel=""/><anchor xml:id="dbdoclet.50438188_50628" xreflabel=""/>Configuring Lustre Failover</para></entry>
63         </row>
64       </tbody>
65     </tgroup>
66   </informaltable>
67   <para><anchor xml:id="dbdoclet.50438188_pgfId-1292189" xreflabel=""/>This chapter describes how to configure Lustre failover using the Heartbeat cluster infrastructure daemon. It includes:</para>
68   <itemizedlist><listitem>
69       <para><anchor xml:id="dbdoclet.50438188_pgfId-1292193" xreflabel=""/><link xl:href="ConfiguringFailover.html#50438188_82389">Creating a Failover Environment</link></para>
70     </listitem>
71 <listitem>
72       <para> </para>
73     </listitem>
74 <listitem>
75       <para><anchor xml:id="dbdoclet.50438188_pgfId-1293185" xreflabel=""/><link xl:href="ConfiguringFailover.html#50438188_92688">Setting up High-Availability (HA) Software with Lustre</link></para>
76     </listitem>
77 <listitem>
78       <para> </para>
79     </listitem>
80 </itemizedlist>
81    <informaltable frame="none">
82     <tgroup cols="1">
83       <colspec colname="c1" colwidth="100*"/>
84       <tbody>
85         <row>
86           <entry><para><emphasis role="bold">Note -</emphasis><anchor xml:id="dbdoclet.50438188_pgfId-1292610" xreflabel=""/><emphasis>Using Lustre Failover is optional.</emphasis></para></entry>
87         </row>
88       </tbody>
89     </tgroup>
90   </informaltable>
91    <section remap="h2">
92     <title><anchor xml:id="dbdoclet.50438188_pgfId-1292208" xreflabel=""/></title>
93     <section remap="h2">
94       <title>11.1 <anchor xml:id="dbdoclet.50438188_82389" xreflabel=""/><anchor xml:id="dbdoclet.50438188_60346" xreflabel=""/>Creating a Failover Environment</title>
95       <para><anchor xml:id="dbdoclet.50438188_pgfId-1292209" xreflabel=""/>Lustre provides failover mechanisms only at the file system level. No failover functionality is provided for system-level components, such as node failure detection or power control, as would typically be provided in a complete failover solution. Additional tools are also needed to provide resource fencing, control and monitoring.</para>
96       <section remap="h3">
97         <title><anchor xml:id="dbdoclet.50438188_pgfId-1292210" xreflabel=""/>11.1.1 Power Management Software</title>
98         <para><anchor xml:id="dbdoclet.50438188_pgfId-1292211" xreflabel=""/>Lustre failover requires power control and management capability to verify that a failed node is shut down before I/O is directed to the failover node. This prevents the two nodes from double-mounting the same storage, which carries the risk of unrecoverable data corruption. A variety of power management tools will work, but two packages that are commonly used with Lustre are STONITH and PowerMan.</para>
99         <para><anchor xml:id="dbdoclet.50438188_pgfId-1292212" xreflabel=""/>Shoot The Other Node In The Head (STONITH) is a set of power management tools provided with the Linux-HA package. STONITH has native support for many power control devices and is extensible. It uses expect scripts to automate control.</para>
100         <para><anchor xml:id="dbdoclet.50438188_pgfId-1292213" xreflabel=""/>PowerMan, available from the Lawrence Livermore National Laboratory (LLNL), is used to control remote power control (RPC) devices from a central location. PowerMan provides native support for several RPC varieties, and its expect-like configuration simplifies the addition of new devices.</para>
101         <para><anchor xml:id="dbdoclet.50438188_pgfId-1292214" xreflabel=""/>The latest versions of PowerMan are available at:</para>
102         <para><anchor xml:id="dbdoclet.50438188_pgfId-1292216" xreflabel=""/><link xl:href="http://sourceforge.net/projects/powerman">http://sourceforge.net/projects/powerman</link></para>
103         <para><anchor xml:id="dbdoclet.50438188_pgfId-1292217" xreflabel=""/>For more information about PowerMan, go to:</para>
104         <para><anchor xml:id="dbdoclet.50438188_pgfId-1292219" xreflabel=""/><link xl:href="https://computing.llnl.gov/linux/powerman.html">https://computing.llnl.gov/linux/powerman.html</link></para>
105       </section>
106       <section remap="h3">
107         <title><anchor xml:id="dbdoclet.50438188_pgfId-1292220" xreflabel=""/>11.1.2 Power Equipment</title>
108         <para><anchor xml:id="dbdoclet.50438188_pgfId-1292221" xreflabel=""/>Lustre failover also requires the use of RPC devices, which come in different configurations. Lustre server nodes may be equipped with some kind of service processor that allows remote power control. If a Lustre server node is not equipped with a service processor, then a multi-port, Ethernet-addressable RPC may be used as an alternative. For recommended products, refer to the list of supported RPC devices on the PowerMan website.</para>
109         <para><anchor xml:id="dbdoclet.50438188_pgfId-1292223" xreflabel=""/><link xl:href="https://computing.llnl.gov/linux/powerman.html">https://computing.llnl.gov/linux/powerman.html</link></para>
110       </section>
111     </section>
112     <section remap="h2">
113       <title>11.2 <anchor xml:id="dbdoclet.50438188_92688" xreflabel=""/>Setting up High-Availability (HA) Software with Lustre</title>
114       <para><anchor xml:id="dbdoclet.50438188_pgfId-1292225" xreflabel=""/>Lustre must be combined with high-availability (HA) software to enable a complete Lustre failover solution. Lustre can be used with several HA packages, including:</para>
115       <itemizedlist><listitem>
116           <para><anchor xml:id="dbdoclet.50438188_pgfId-1293083" xreflabel=""/><emphasis>Red Hat Cluster Manager</emphasis>  - For more information about setting up Lustre failover with Red Hat Cluster Manager, see the Lustre wiki topic <link xl:href="http://wiki.lustre.org/index.php/Using_Red_Hat_Cluster_Manager_with_Lustre">Using Red Hat Cluster Manager with Lustre</link>.</para>
117         </listitem>
118 <listitem>
119           <para> </para>
120         </listitem>
121 <listitem>
122           <para><anchor xml:id="dbdoclet.50438188_pgfId-1293110" xreflabel=""/><emphasis>Pacemaker</emphasis>  - For more information about setting up Lustre failover with Pacemaker, see the Lustre wiki topic <link xl:href="http://wiki.lustre.org/index.php/Using_Pacemaker_with_Lustre">Using Pacemaker with Lustre</link>.<anchor xml:id="dbdoclet.50438188_61775" xreflabel=""/></para>
123         </listitem>
124 <listitem>
125           <para> </para>
126         </listitem>
127 </itemizedlist>
128       <!--
129 Begin SiteCatalyst code version: G.5.
130 -->
131       <!--
132 End SiteCatalyst code version: G.5.
133 -->
134         <informaltable frame="none">
135         <tgroup cols="3">
136           <colspec colname="c1" colwidth="33*"/>
137           <colspec colname="c2" colwidth="33*"/>
138           <colspec colname="c3" colwidth="33*"/>
139           
140           
141           
142           <tbody>
143             <row>
144               <entry align="left"><para>Lustre 2.0 Operations Manual</para></entry>
145               <entry align="right"><para>821-2076-10</para></entry>
146               <entry align="right" valign="top"><para><link xl:href="index.html"><inlinemediaobject><imageobject role="html">
147                         <imagedata contentdepth="26" contentwidth="30" fileref="./shared/toc01.gif" scalefit="1"/>
148                       </imageobject>
149 <imageobject role="fo">
150                         <imagedata contentdepth="100%" contentwidth="" depth="" fileref="./shared/toc01.gif" scalefit="1" width="100%"/>
151                       </imageobject>
152 </inlinemediaobject></link><link xl:href="ConfiguringLustre.html"><inlinemediaobject><imageobject role="html">
153                         <imagedata contentdepth="26" contentwidth="30" fileref="./shared/prev01.gif" scalefit="1"/>
154                       </imageobject>
155 <imageobject role="fo">
156                         <imagedata contentdepth="100%" contentwidth="" depth="" fileref="./shared/prev01.gif" scalefit="1" width="100%"/>
157                       </imageobject>
158 </inlinemediaobject></link><link xl:href="III_LustreAdministration.html"><inlinemediaobject><imageobject role="html">
159                         <imagedata contentdepth="26" contentwidth="30" fileref="./shared/next01.gif" scalefit="1"/>
160                       </imageobject>
161 <imageobject role="fo">
162                         <imagedata contentdepth="100%" contentwidth="" depth="" fileref="./shared/next01.gif" scalefit="1" width="100%"/>
163                       </imageobject>
164 </inlinemediaobject></link><link xl:href="ix.html"><inlinemediaobject><imageobject role="html">
165                         <imagedata contentdepth="26" contentwidth="30" fileref="./shared/index01.gif" scalefit="1"/>
166                       </imageobject>
167 <imageobject role="fo">
168                         <imagedata contentdepth="100%" contentwidth="" depth="" fileref="./shared/index01.gif" scalefit="1" width="100%"/>
169                       </imageobject>
170 </inlinemediaobject></link></para></entry>
171             </row>
172           </tbody>
173         </tgroup>
174       </informaltable>
175       <para><link xl:href=""/></para>
176       <para><link xl:href="copyright.html">Copyright</link> © 2011, Oracle and/or its affiliates. All rights reserved.</para>
177     </section>
178   </section>
179 </article>