zookeeperStarted.html 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499
  1. <!DOCTYPE html PUBLIC "-//W3C//DTD HTML 4.01 Transitional//EN" "http://www.w3.org/TR/html4/loose.dtd">
  2. <html>
  3. <head>
  4. <META http-equiv="Content-Type" content="text/html; charset=UTF-8">
  5. <meta content="Apache Forrest" name="Generator">
  6. <meta name="Forrest-version" content="0.8">
  7. <meta name="Forrest-skin-name" content="pelt">
  8. <title>ZooKeeper Getting Started Guide</title>
  9. <link type="text/css" href="skin/basic.css" rel="stylesheet">
  10. <link media="screen" type="text/css" href="skin/screen.css" rel="stylesheet">
  11. <link media="print" type="text/css" href="skin/print.css" rel="stylesheet">
  12. <link type="text/css" href="skin/profile.css" rel="stylesheet">
  13. <script src="skin/getBlank.js" language="javascript" type="text/javascript"></script><script src="skin/getMenu.js" language="javascript" type="text/javascript"></script><script src="skin/fontsize.js" language="javascript" type="text/javascript"></script>
  14. <link rel="shortcut icon" href="images/favicon.ico">
  15. </head>
  16. <body onload="init()">
  17. <script type="text/javascript">ndeSetTextSize();</script>
  18. <div id="top">
  19. <!--+
  20. |breadtrail
  21. +-->
  22. <div class="breadtrail">
  23. <a href="http://www.apache.org/">Apache</a> &gt; <a href="http://hadoop.apache.org/">Hadoop</a> &gt; <a href="http://hadoop.apache.org/zookeeper/">ZooKeeper</a><script src="skin/breadcrumbs.js" language="JavaScript" type="text/javascript"></script>
  24. </div>
  25. <!--+
  26. |header
  27. +-->
  28. <div class="header">
  29. <!--+
  30. |start group logo
  31. +-->
  32. <div class="grouplogo">
  33. <a href="http://hadoop.apache.org/"><img class="logoImage" alt="Hadoop" src="images/hadoop-logo.jpg" title="Apache Hadoop"></a>
  34. </div>
  35. <!--+
  36. |end group logo
  37. +-->
  38. <!--+
  39. |start Project Logo
  40. +-->
  41. <div class="projectlogo">
  42. <a href="http://hadoop.apache.org/zookeeper/"><img class="logoImage" alt="ZooKeeper" src="images/zookeeper_small.gif" title="Apache ZooKeeper"></a>
  43. </div>
  44. <!--+
  45. |end Project Logo
  46. +-->
  47. <!--+
  48. |start Search
  49. +-->
  50. <div class="searchbox">
  51. <form action="http://www.google.com/search" method="get" class="roundtopsmall">
  52. <input value="hadoop.apache.org" name="sitesearch" type="hidden"><input onFocus="getBlank (this, 'Search the site with google');" size="25" name="q" id="query" type="text" value="Search the site with google">&nbsp;
  53. <input name="Search" value="Search" type="submit">
  54. </form>
  55. </div>
  56. <!--+
  57. |end search
  58. +-->
  59. <!--+
  60. |start Tabs
  61. +-->
  62. <ul id="tabs">
  63. <li>
  64. <a class="unselected" href="http://hadoop.apache.org/zookeeper/">Project</a>
  65. </li>
  66. <li>
  67. <a class="unselected" href="http://wiki.apache.org/hadoop/ZooKeeper">Wiki</a>
  68. </li>
  69. <li class="current">
  70. <a class="selected" href="index.html">ZooKeeper 3.1 Documentation</a>
  71. </li>
  72. </ul>
  73. <!--+
  74. |end Tabs
  75. +-->
  76. </div>
  77. </div>
  78. <div id="main">
  79. <div id="publishedStrip">
  80. <!--+
  81. |start Subtabs
  82. +-->
  83. <div id="level2tabs"></div>
  84. <!--+
  85. |end Subtabs
  86. +-->
  87. <script type="text/javascript"><!--
  88. document.write("Last Published: " + document.lastModified);
  89. // --></script>
  90. </div>
  91. <!--+
  92. |breadtrail
  93. +-->
  94. <div class="breadtrail">
  95. &nbsp;
  96. </div>
  97. <!--+
  98. |start Menu, mainarea
  99. +-->
  100. <!--+
  101. |start Menu
  102. +-->
  103. <div id="menu">
  104. <div onclick="SwitchMenu('menu_selected_1.1', 'skin/')" id="menu_selected_1.1Title" class="menutitle" style="background-image: url('skin/images/chapter_open.gif');">Overview</div>
  105. <div id="menu_selected_1.1" class="selectedmenuitemgroup" style="display: block;">
  106. <div class="menuitem">
  107. <a href="index.html">Welcome</a>
  108. </div>
  109. <div class="menuitem">
  110. <a href="zookeeperOver.html">Overview</a>
  111. </div>
  112. <div class="menupage">
  113. <div class="menupagetitle">Getting Started</div>
  114. </div>
  115. <div class="menuitem">
  116. <a href="releasenotes.html">Release Notes</a>
  117. </div>
  118. </div>
  119. <div onclick="SwitchMenu('menu_1.2', 'skin/')" id="menu_1.2Title" class="menutitle">Developer</div>
  120. <div id="menu_1.2" class="menuitemgroup">
  121. <div class="menuitem">
  122. <a href="api/index.html">API Docs</a>
  123. </div>
  124. <div class="menuitem">
  125. <a href="zookeeperProgrammers.html">Programmer's Guide</a>
  126. </div>
  127. <div class="menuitem">
  128. <a href="javaExample.html">Java Example</a>
  129. </div>
  130. <div class="menuitem">
  131. <a href="zookeeperTutorial.html">Barrier and Queue Tutorial</a>
  132. </div>
  133. <div class="menuitem">
  134. <a href="recipes.html">Recipes</a>
  135. </div>
  136. </div>
  137. <div onclick="SwitchMenu('menu_1.3', 'skin/')" id="menu_1.3Title" class="menutitle">Admin &amp; Ops</div>
  138. <div id="menu_1.3" class="menuitemgroup">
  139. <div class="menuitem">
  140. <a href="zookeeperAdmin.html">Administrator's Guide</a>
  141. </div>
  142. <div class="menuitem">
  143. <a href="zookeeperJMX.html">JMX</a>
  144. </div>
  145. </div>
  146. <div onclick="SwitchMenu('menu_1.4', 'skin/')" id="menu_1.4Title" class="menutitle">Contributor</div>
  147. <div id="menu_1.4" class="menuitemgroup">
  148. <div class="menuitem">
  149. <a href="zookeeperInternals.html">ZooKeeper Internals</a>
  150. </div>
  151. </div>
  152. <div onclick="SwitchMenu('menu_1.5', 'skin/')" id="menu_1.5Title" class="menutitle">Miscellaneous</div>
  153. <div id="menu_1.5" class="menuitemgroup">
  154. <div class="menuitem">
  155. <a href="http://wiki.apache.org/hadoop/ZooKeeper">Wiki</a>
  156. </div>
  157. <div class="menuitem">
  158. <a href="http://wiki.apache.org/hadoop/ZooKeeper/FAQ">FAQ</a>
  159. </div>
  160. <div class="menuitem">
  161. <a href="http://hadoop.apache.org/zookeeper/mailing_lists.html">Mailing Lists</a>
  162. </div>
  163. </div>
  164. <div id="credit"></div>
  165. <div id="roundbottom">
  166. <img style="display: none" class="corner" height="15" width="15" alt="" src="skin/images/rc-b-l-15-1body-2menu-3menu.png"></div>
  167. <!--+
  168. |alternative credits
  169. +-->
  170. <div id="credit2"></div>
  171. </div>
  172. <!--+
  173. |end Menu
  174. +-->
  175. <!--+
  176. |start content
  177. +-->
  178. <div id="content">
  179. <div title="Portable Document Format" class="pdflink">
  180. <a class="dida" href="zookeeperStarted.pdf"><img alt="PDF -icon" src="skin/images/pdfdoc.gif" class="skin"><br>
  181. PDF</a>
  182. </div>
  183. <h1>ZooKeeper Getting Started Guide</h1>
  184. <div id="minitoc-area">
  185. <ul class="minitoc">
  186. <li>
  187. <a href="#ch_GettingStarted">Getting Started: Coordinating Distributed Applications with
  188. ZooKeeper</a>
  189. <ul class="minitoc">
  190. <li>
  191. <a href="#sc_Prerequisites">Pre-requisites</a>
  192. </li>
  193. <li>
  194. <a href="#sc_Download">Download</a>
  195. </li>
  196. <li>
  197. <a href="#sc_InstallingSingleMode">Standalone Operation</a>
  198. </li>
  199. <li>
  200. <a href="#sc_FileManagement">Managing ZooKeeper Storage</a>
  201. </li>
  202. <li>
  203. <a href="#sc_ConnectingToZooKeeper">Connecting to ZooKeeper</a>
  204. </li>
  205. <li>
  206. <a href="#sc_ProgrammingToZooKeeper">Programming to ZooKeeper</a>
  207. </li>
  208. <li>
  209. <a href="#sc_RunningReplicatedZooKeeper">Running Replicated ZooKeeper</a>
  210. </li>
  211. <li>
  212. <a href="#Other+Optimizations">Other Optimizations</a>
  213. </li>
  214. </ul>
  215. </li>
  216. </ul>
  217. </div>
  218. <a name="N10009"></a><a name="ch_GettingStarted"></a>
  219. <h2 class="h3">Getting Started: Coordinating Distributed Applications with
  220. ZooKeeper</h2>
  221. <div class="section">
  222. <p>This document contains information to get you started quickly with
  223. ZooKeeper. It is aimed primarily at developers hoping to try it out, and
  224. contains simple installation instructions for a single ZooKeeper server, a
  225. few commands to verify that it is running, and a simple programming
  226. example. Finally, as a convenience, there are a few sections regarding
  227. more complicated installations, for example running replicated
  228. deployments, and optimizing the transaction log. However, for the complete
  229. instructions for commercial deployments, please refer to the <a href="zookeeperAdmin.html">ZooKeeper
  230. Administrator's Guide</a>.</p>
  231. <a name="N10016"></a><a name="sc_Prerequisites"></a>
  232. <h3 class="h4">Pre-requisites</h3>
  233. <p>See <a href="zookeeperAdmin.html#sc_systemReq">
  234. System Requirements</a> in the Admin guide.</p>
  235. <a name="N10024"></a><a name="sc_Download"></a>
  236. <h3 class="h4">Download</h3>
  237. <p>To get a ZooKeeper distribution, download a recent
  238. <a href="http://hadoop.apache.org/zookeeper/releases.html">
  239. stable</a> release from one of the Apache Download
  240. Mirrors.</p>
  241. <a name="N10032"></a><a name="sc_InstallingSingleMode"></a>
  242. <h3 class="h4">Standalone Operation</h3>
  243. <p>Setting up a ZooKeeper server in standalone mode is
  244. straightforward. The server is contained in a single JAR file,
  245. so installation consists of creating a configuration.</p>
  246. <p>Once you've downloaded a stable ZooKeeper release, unpack
  247. it and cd to the root directory.</p>
  248. <p>To start ZooKeeper you need a configuration file. Here is a sample,
  249. create it in <strong>conf/zoo.cfg</strong>:</p>
  250. <pre class="code">
  251. tickTime=2000
  252. dataDir=/var/zookeeper
  253. clientPort=2181
  254. </pre>
  255. <p>This file can be called anything, but for the sake of this
  256. discussion call
  257. it <strong>conf/zoo.cfg</strong>. Change the
  258. value of <strong>dataDir</strong> to specify an
  259. existing (empty to start with) directory. Here are the meanings
  260. for each of the fields:</p>
  261. <dl>
  262. <dt>
  263. <term>
  264. <strong>tickTime</strong>
  265. </term>
  266. </dt>
  267. <dd>
  268. <p>the basic time unit in milliseconds used by ZooKeeper. It is
  269. used to do heartbeats and the minimum session timeout will be
  270. twice the tickTime.</p>
  271. </dd>
  272. </dl>
  273. <dl>
  274. <dt>
  275. <term>
  276. <strong>dataDir</strong>
  277. </term>
  278. </dt>
  279. <dd>
  280. <p>the location to store the in-memory database snapshots and,
  281. unless specified otherwise, the transaction log of updates to the
  282. database.</p>
  283. </dd>
  284. <dt>
  285. <term>
  286. <strong>clientPort</strong>
  287. </term>
  288. </dt>
  289. <dd>
  290. <p>the port to listen on for client connections</p>
  291. </dd>
  292. </dl>
  293. <p>Now that you have created the configuration file, you can start
  294. ZooKeeper:</p>
  295. <pre class="code">bin/zkServer.sh start</pre>
  296. <p>ZooKeeper logs messages using log4j -- more detail
  297. available in the
  298. <a href="zookeeperProgrammers.html#Logging">Logging</a>
  299. section of the Programmer's Guide. You will see log messages
  300. coming to the console (default) and/or a log file depending on
  301. the log4j configuration.</p>
  302. <p>The steps outlined here run ZooKeeper in standalone mode. There is
  303. no replication, so if the ZooKeeper process fails, the service will go down.
  304. This is fine for most development situations, but to run ZooKeeper in
  305. replicated mode, please see <a href="#sc_RunningReplicatedZooKeeper">Running Replicated
  306. ZooKeeper</a>.</p>
  307. <a name="N10083"></a><a name="sc_FileManagement"></a>
  308. <h3 class="h4">Managing ZooKeeper Storage</h3>
  309. <p>For long-running production systems, ZooKeeper storage must
  310. be managed externally (dataDir and logs). See the section on
  311. <a href="zookeeperAdmin.html#sc_maintenance">maintenance</a> for
  312. more details.</p>
  313. <a name="N10091"></a><a name="sc_ConnectingToZooKeeper"></a>
  314. <h3 class="h4">Connecting to ZooKeeper</h3>
  315. <p>Once ZooKeeper is running, you have several options for connecting
  316. to it:</p>
  317. <ul>
  318. <li>
  319. <p>
  320. <strong>Java</strong>: Use</p>
  321. <pre class="code">bin/zkCli.sh 127.0.0.1:2181</pre>
  322. <p>This lets you perform simple, file-like operations.</p>
  323. </li>
  324. <li>
  325. <p>
  326. <strong>C</strong>: compile cli_mt
  327. (multi-threaded) or cli_st (single-threaded) by running
  328. <span class="codefrag command">make cli_mt</span> or <span class="codefrag command">make
  329. cli_st</span> in
  330. the <strong>src/c</strong> subdirectory in
  331. the ZooKeeper sources. See the README contained within
  332. <strong>src/c</strong> for full details.</p>
  333. <p>You can run the program
  334. from <strong>src/c</strong> using:</p>
  335. <pre class="code">LD_LIBRARY_PATH=. cli_mt 127.0.0.1:2181</pre>
  336. <p>or</p>
  337. <pre class="code">LD_LIBRARY_PATH=. cli_st 127.0.0.1:2181</pre>
  338. <p>This will give you a simple shell to execute
  339. file-system-like operations on ZooKeeper.</p>
  340. </li>
  341. </ul>
  342. <a name="N100D4"></a><a name="sc_ProgrammingToZooKeeper"></a>
  343. <h3 class="h4">Programming to ZooKeeper</h3>
  344. <p>ZooKeeper has Java bindings and C bindings. They are
  345. functionally equivalent. The C bindings exist in two variants:
  346. single-threaded and multi-threaded. These differ only in how the messaging loop
  347. is done. For more information, see the <a href="zookeeperProgrammers.html#ch_programStructureWithExample">Programming
  348. Examples in the ZooKeeper Programmer's Guide</a> for
  349. sample code using the different APIs.</p>
  350. <a name="N100E2"></a><a name="sc_RunningReplicatedZooKeeper"></a>
  351. <h3 class="h4">Running Replicated ZooKeeper</h3>
  352. <p>Running ZooKeeper in standalone mode is convenient for evaluation,
  353. some development, and testing. But in production, you should run
  354. ZooKeeper in replicated mode. A replicated group of servers in the same
  355. application is called a <em>quorum</em>, and in replicated
  356. mode, all servers in the quorum have copies of the same configuration
  357. file. The file is similar to the one used in standalone mode, but with a
  358. few differences. Here is an example:</p>
  359. <pre class="code">
  360. tickTime=2000
  361. dataDir=/var/zookeeper
  362. clientPort=2181
  363. initLimit=5
  364. syncLimit=2
  365. server.1=zoo1:2888:3888
  366. server.2=zoo2:2888:3888
  367. server.3=zoo3:2888:3888
  368. </pre>
  369. <p>The new entry, <strong>initLimit</strong>, is a
  370. timeout ZooKeeper uses to limit the length of time the ZooKeeper
  371. servers in quorum have to connect to a leader. The entry <strong>syncLimit</strong> limits how far out of date a server can
  372. be from a leader.</p>
  373. <p>With both of these timeouts, you specify the unit of time using
  374. <strong>tickTime</strong>. In this example, the timeout
  375. for initLimit is 5 ticks at 2000 milliseconds a tick, or 10
  376. seconds.</p>
  377. <p>The entries of the form <em>server.X</em> list the
  378. servers that make up the ZooKeeper service. When the server starts up,
  379. it knows which server it is by looking for the file
  380. <em>myid</em> in the data directory. That file
  381. contains the server number, in ASCII.</p>
  382. <p>Finally, note the two port numbers after each server
  383. name: "2888" and "3888". Peers use the former port to connect
  384. to other peers. Such a connection is necessary so that peers
  385. can communicate, for example, to agree upon the order of
  386. updates. More specifically, a ZooKeeper server uses this port
  387. to connect followers to the leader. When a new leader arises, a
  388. follower opens a TCP connection to the leader using this
  389. port. Because the default leader election also uses TCP, we
  390. currently require another port for leader election. This is the
  391. second port in the server entry.
  392. </p>
  393. <div class="note">
  394. <div class="label">Note</div>
  395. <div class="content">
  396. <p>If you want to test multiple servers on a single
  397. machine, specify the servername
  398. as <em>localhost</em> with unique quorum &amp;
  399. leader election ports (i.e. 2888:3888, 2889:3889, 2890:3890 in
  400. the example above) for each server.X in that server's config
  401. file. Of course separate <em>dataDir</em>s and
  402. distinct <em>clientPort</em>s are also necessary
  403. (in the above replicated example, running on a
  404. single <em>localhost</em>, you would still have
  405. three config files).</p>
  406. </div>
  407. </div>
  408. <a name="N1011F"></a><a name="Other+Optimizations"></a>
  409. <h3 class="h4">Other Optimizations</h3>
  410. <p>There are a couple of other configuration parameters that can
  411. greatly increase performance:</p>
  412. <ul>
  413. <li>
  414. <p>To get low latencies on updates it is important to
  415. have a dedicated transaction log directory. By default
  416. transaction logs are put in the same directory as the data
  417. snapshots and <em>myid</em> file. The dataLogDir
  418. parameter indicates a different directory to use for the
  419. transaction logs.</p>
  420. </li>
  421. <li>
  422. <p>
  423. <em>[tbd: what is the other config param?]</em>
  424. </p>
  425. </li>
  426. </ul>
  427. </div>
  428. <p align="right">
  429. <font size="-2"></font>
  430. </p>
  431. </div>
  432. <!--+
  433. |end content
  434. +-->
  435. <div class="clearboth">&nbsp;</div>
  436. </div>
  437. <div id="footer">
  438. <!--+
  439. |start bottomstrip
  440. +-->
  441. <div class="lastmodified">
  442. <script type="text/javascript"><!--
  443. document.write("Last Published: " + document.lastModified);
  444. // --></script>
  445. </div>
  446. <div class="copyright">
  447. Copyright &copy;
  448. 2008 <a href="http://www.apache.org/licenses/">The Apache Software Foundation.</a>
  449. </div>
  450. <!--+
  451. |end bottomstrip
  452. +-->
  453. </div>
  454. </body>
  455. </html>