<!doctype html>
<!--
  Document shell for a pdf2htmlEX export (see the "generator" meta tag).
  The doctype keeps browsers in standards mode instead of quirks mode,
  and lang marks the page text as Simplified Chinese for assistive
  technology and font selection.
-->
<html xmlns="http://www.w3.org/1999/xhtml" lang="zh-Hans">
<head>
<meta charset="utf-8">
<meta name="generator" content="pdf2htmlEX">
<meta http-equiv="X-UA-Compatible" content="IE=edge,chrome=1">
<link rel="stylesheet" href="https://static.pudn.com/base/css/base.min.css">
<link rel="stylesheet" href="https://static.pudn.com/base/css/fancy.min.css">
<link rel="stylesheet" href="https://static.pudn.com/prod/directory_preview_static/628020919b6e2b6d5576e3d6/raw.css">
<script src="https://static.pudn.com/base/js/compatibility.min.js"></script>
<script src="https://static.pudn.com/base/js/pdf2htmlEX.min.js"></script>
<script>
// Create the default viewer with an empty options object. Start-up stays
// best effort (the page must still display if the viewer script is missing
// or throws), but the failure is reported instead of being discarded.
try{
pdf2htmlEX.defaultViewer = new pdf2htmlEX.Viewer({});
}catch(e){
if (typeof console !== "undefined" && console.warn) {
console.warn("pdf2htmlEX viewer could not be initialised:", e);
}
}
</script>
<!-- Title taken from the issue name and date printed on the pages below. -->
<title>《Hadoop 开发者》创刊号 · 2010 年 1 月</title>
</head>
<body>
<!-- Outline sidebar: empty in this export and kept hidden via its inline style. -->
<div id="sidebar" style="display: none">
<div id="outline">
</div>
</div>
<div id="pf1" class="pf w0 h0" data-page-no="1"><div class="pc pc1 w0 h0"><img class="bi x0 y0 w1 h1" alt="" src="https://static.pudn.com/prod/directory_preview_static/628020919b6e2b6d5576e3d6/bg1.jpg"><div class="c x0 y1 w0 h2"><div class="t m0 x1 h3 y2 ff1 fs0 fc0 sc0 ls0 ws0"><span class="fc2 sc0">b</span><span class="fc2 sc0">b</span><span class="fc2 sc0">s</span><span class="fc2 sc0">.</span><span class="fc2 sc0">h</span><span class="fc2 sc0">a</span><span class="fc2 sc0">d</span><span class="fc2 sc0">o</span><span class="fc2 sc0">o</span><span class="fc2 sc0">p</span><span class="fc2 sc0">o</span><span class="fc2 sc0">r</span><span class="fc2 sc0">.</span><span class="fc2 sc0">c</span><span class="fc2 sc0">o</span><span class="fc2 sc0">m</span><span class="_ _0"> </span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">h</span><span class="fc2 sc0">a</span><span class="fc2 sc0">d</span><span class="fc2 sc0">o</span><span class="fc2 sc0">o</span><span class="fc2 sc0">p</span><span class="_ _1"> </span><span class="fc2 sc0">技术论坛</span></div></div><div class="t m1 x1 h4 y3 ff1 fs1 fc0 sc0 ls0 ws0"><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span 
class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 
sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span><span class="fc2 sc0">-</span></div><div class="t m1 x1 h4 y4 ff1 fs1 fc0 sc0 ls0 ws0"><span class="fc2 sc0">创刊号</span><span class="_ _2"> </span><span class="fc2 sc0">2</span><span class="fc2 sc0">0</span><span class="fc2 sc0">1</span><span class="fc2 sc0">0</span><span class="_ _3"> </span><span class="fc2 sc0">年</span><span class="_ _4"> </span><span class="fc2 sc0">1</span><span class="_ _5"> </span><span class="fc2 sc0">月</span><span class="_ _6"> </span><span class="ff2"><span class="fc2 sc0">-</span><span class="_ _7"> </span><span class="fc2 sc0">1</span><span class="_ _5"> </span><span class="fc2 sc0">-</span></span></div><div class="c x2 y5 w2 h5"><div class="t m1 x3 h6 y6 ff3 fs2 fc1 sc0 ls0 ws0">www<span class="_ _8"></span>.had<span class="_ _9"></span>oopor<span class="_ _a"></span>.com</div></div><div class="c x4 y7 w3 h7"><div class="t m1 x3 h8 y8 ff4 fs2 fc1 sc0 ls0 ws0">2010<span class="_ _b"> </span>入门专刊</div></div></div><div class="pi" data-data='{"ctm":[1.612022,0.000000,0.000000,1.612022,0.000000,0.000000]}'></div></div>
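<!-- The body and html end tags that used to sit here were dropped: more page containers follow, and both end tags are optional in HTML syntax. -->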
<div id="pf2" class="pf w0 h0" data-page-no="2"><div class="pc pc2 w0 h0"><img class="bi x0 y0 w1 h1" alt="" src="https://static.pudn.com/prod/directory_preview_static/628020919b6e2b6d5576e3d6/bg2.jpg"><div class="c x5 y9 w4 h9"><div class="t m1 x3 ha ya ff1 fs2 fc0 sc1 ls0 ws0">出品</div><div class="t m1 x3 hb yb ff1 fs3 fc0 sc0 ls0 ws0">Hadoop<span class="_ _c"> </span>技术论坛</div><div class="t m1 x3 ha yc ff1 fs2 fc0 sc1 ls0 ws0">总编辑</div><div class="t m1 x3 hb yd ff1 fs3 fc0 sc0 ls0 ws0">易剑<span class="_ _d"> </span>(<span class="_ _e"> </span>一见<span class="_ _d"> </span>)</div><div class="t m1 x3 ha ye ff1 fs2 fc0 sc1 ls0 ws0">副总编辑</div><div class="t m1 x3 hb yf ff1 fs3 fc0 sc0 ls0 ws0">代志远<span class="_ _f"> </span>(<span class="_ _e"> </span>国宝<span class="_ _d"> </span>)<span class="_ _10"> </span>王磊<span class="_ _d"> </span>(<span class="_ _e"> </span>beyi<span class="_ _d"> </span>)</div><div class="t m1 x3 ha y10 ff1 fs2 fc0 sc1 ls0 ws0">本期主<span class="_ _11"> </span>编</div><div class="t m1 x3 hb y11 ff1 fs3 fc0 sc0 ls0 ws0">皮冰锋<span class="_ _f"> </span>(<span class="_ _e"> </span>若冰<span class="_ _d"> </span>)</div><div class="t m1 x3 ha y12 ff1 fs2 fc0 sc1 ls0 ws0">编辑</div><div class="t m1 x3 hb y13 ff1 fs3 fc0 sc0 ls0 ws0">皮冰锋<span class="_ _f"> </span>(<span class="_ _e"> </span>若冰<span class="_ _d"> </span>)<span class="_ _12"> </span>易剑<span class="_ _d"> </span>(<span class="_ _e"> </span>一见<span class="_ _d"> </span>)</div><div class="t m1 x3 hb y14 ff1 fs4 fc0 sc0 ls0 ws0">贺湘辉<span class="_ _13"> </span>(<span class="_ _14"> </span><span class="fs3">小米<span class="_ _d"> </span>)<span class="_ _15"> </span>王磊<span class="_ _d"> </span>(<span class="_ _e"> </span>beyi<span class="_ _d"> </span>)</span></div><div class="t m1 x3 hb y15 ff1 fs3 fc0 sc0 ls0 ws0">代志远<span class="_ _f"> </span>(<span class="_ _e"> </span>国宝<span class="_ _d"> </span>)<span class="_ _12"> </span>柏传杰<span class="_ _f"> </span>(<span class="_ _e"> </span>飞鸿雪泥<span 
class="_ _16"> </span>)</div><div class="t m1 x3 hb y16 ff1 fs3 fc0 sc0 ls0 ws0">何忠育<span class="_ _f"> </span>(<span class="_ _e"> </span>Spork<span class="_ _17"> </span>)<span class="_ _18"> </span>秘中凯</div><div class="t m1 x3 hb y17 ff1 fs3 fc0 sc0 ls0 ws0">陈炬</div><div class="t m1 x3 ha y18 ff1 fs2 fc0 sc1 ls0 ws0">美工<span class="_ _19"> </span>/<span class="_ _1a"> </span>封面设计</div><div class="t m1 x3 hb y19 ff1 fs3 fc0 sc0 ls0 ws0">易剑<span class="_ _d"> </span>(<span class="_ _e"> </span>一见<span class="_ _d"> </span>)</div><div class="t m1 x3 ha y1a ff1 fs2 fc0 sc1 ls0 ws0">网址</div><div class="t m1 x3 hc y1b ff3 fs3 fc0 sc0 ls0 ws0">http://w<span class="_ _9"></span>ww<span class="_ _8"></span>.hadoo<span class="_ _1b"></span>por<span class="_ _a"></span>.com</div><div class="t m1 x3 ha y1c ff1 fs2 fc0 sc1 ls0 ws0">投稿信箱</div><div class="t m1 x3 hc y1d ff3 fs3 fc0 sc0 ls0 ws0">hadoopor@fox<span class="_ _9"></span>mail.com</div></div><a class="l" rel='nofollow' onclick='return false;'><div class="d m2"></div></a></div><div class="pi" data-data='{"ctm":[1.612022,0.000000,0.000000,1.612022,0.000000,0.000000]}'></div></div>
<div id="pf3" class="pf w0 h0" data-page-no="3"><div class="pc pc3 w0 h0"><img class="bi x0 y0 w1 h1" alt="" src="https://static.pudn.com/prod/directory_preview_static/628020919b6e2b6d5576e3d6/bg3.jpg"><div class="t m1 x6 hd y1e ff1 fs5 fc0 sc1 ls0 ws0">刊首语</div><div class="t m1 x7 he y1f ff4 fs3 fc0 sc0 ls0 ws0">2010<span class="_ _1c"> </span>年<span class="_ _1d"> </span>1</div><div class="t m3 x8 he y1f ff4 fs3 fc0 sc0 ls0 ws0">月<span class="_ _1e"></span>,<span class="_ _1f"> </span>《</div><div class="t m1 x9 he y1f ff4 fs3 fc0 sc0 ls0 ws0">Hadoop<span class="_ _16"> </span>开发者》沐着<span class="_ _20"> </span>2010<span class="_ _1c"> </span>年的第一缕春光诞生了。</div><div class="t m1 x7 he y20 ff4 fs3 fc0 sc0 ls0 ws0">正是有了<span class="_ _21"> </span>Doug<span class="_ _22"> </span>Cutting<span class="_ _23"> </span>这样的大师级开源者,<span class="_"> </span>正是有了无数个为<span class="_ _24"> </span>Hadoo<span class="_ _25"> </span>p</div><div class="t m1 x1 he y21 ff4 fs3 fc0 sc0 ls0 ws0">贡献力量的开源者们<span class="_ _1b"></span>的共同努<span class="_ _1b"></span>力,才有<span class="_ _1b"></span>了<span class="_ _26"> </span>Hadoop<span class="_ _16"> </span>自诞生时的倍受<span class="_ _1b"></span>关注到现在</div><div class="t m1 x1 he y22 ff4 fs3 fc0 sc0 ls0 ws0">的倍受瞩目。<span class="_ _27"> </span>Hadoop<span class="_ _16"> </span>从单一应用发展到目前的<span class="_ _28"> </span>Hadoop<span class="_ _29"> </span>Ecosystem<span class="_ _2a"> </span>,自成一</div><div class="t m1 x1 he y23 ff4 fs3 fc0 sc0 ls0 ws0">格的技术体系,<span class="_ _2b"> </span>叩开了信息爆炸时代的海量数据处理的大门,<span class="_ _2b"> </span>开辟了海量数据<span class="_ _2c"> </span>存</div><div class="t m4 x1 he y24 ff4 fs3 fc0 sc0 ls0 ws0">储<span class="_ _2d"></span>与<span class="_ _2d"></span>计<span class="_ _2d"></span>算<span class="_ _2d"></span>及<span class="_ _2d"></span>其<span class="_ _2d"></span>应<span class="_ _2d"></span>用<span class="_ _2d"></span>的<span class="_ _2d"></span>新<span class="_ _2d"></span>领<span class="_ _2d"></span>地<span class="_ _2d"></span>,<span 
class="_ _2e"> </span>《</div><div class="t m1 xa he y24 ff4 fs3 fc0 sc0 ls0 ws0">Hadoop<span class="_ _16"> </span>开发者》<span class="_"> </span>正是在这样的背景下应运而</div><div class="t m5 xb he y24 ff4 fs3 fc0 sc0 ls0 ws0">生<span class="_ _2f"></span>。</div><div class="t m1 x7 he y25 ff4 fs3 fc0 sc0 ls0 ws0">Hadoop<span class="_ _30"> </span>技术交流群自创建起,<span class="_ _31"> </span>短短的几个月时间里就形成了<span class="_ _32"> </span>2<span class="_ _33"> </span>个超级大</div><div class="t m5 xb he y25 ff4 fs3 fc0 sc0 ls0 ws0">群<span class="_ _2f"></span>,</div><div class="t m1 x1 he y26 ff4 fs3 fc0 sc0 ls0 ws0">Hadoop<span class="_ _34"> </span>技术体系深蒙面向各行各业应用的开发者们的厚爱,<span class="_ _31"> </span>可以预见<span class="_ _35"> </span>Hado<span class="_ _36"> </span>op</div><div class="t m1 x1 he y27 ff4 fs3 fc0 sc0 ls0 ws0">应用前景广阔。<span class="_ _8"></span>但<span class="_ _9"></span>时下稍显稚嫩,<span class="_ _a"></span>需要广大的爱好者共同尝试、<span class="_ _a"></span>探索,<span class="_ _8"></span>发掘应<span class="_ _2c"> </span>用</div><div class="t m6 x1 he y28 ff4 fs3 fc0 sc0 ls0 ws0">的<span class="_ _37"></span>同<span class="_ _37"></span>时<span class="_ _37"></span>帮<span class="_ _37"></span>助<span class="_ _37"></span>改<span class="_ _37"></span>进<span class="_ _37"></span>。<span class="_ _38"> </span>《</div><div class="t m1 xc he y28 ff4 fs3 fc0 sc0 ls0 ws0">Hadoop<span class="_ _16"> </span>开发者》<span class="_ _2b"> </span>是<span class="_ _39"> </span>Hadoop<span class="_ _16"> </span>交流群的几位志愿者们自发<span class="_ _3a"> </span>创</div><div class="t m1 x1 he y29 ff4 fs3 fc0 sc0 ls0 ws0">建的,<span class="_"> </span>希望它的出现能为您的学习和探索铺路,<span class="_"> </span>同<span class="_ _9"></span>时也期盼能分享您的<span class="_ _3b"> </span>Hadoo<span class="_ _25"> </span>p</div><div class="t m4 x1 he y2a ff4 fs3 fc0 sc0 ls0 ws0">之<span class="_ _2d"></span>旅<span class="_ _2d"></span>。<span class="_ _2d"></span>在<span class="_ _2d"></span>分<span class="_ _2d"></span>享<span class="_ _2d"></span>中<span class="_ _2d"></span>,<span class="_ 
_3c"> </span>《</div><div class="t m1 xd he y2a ff4 fs3 fc0 sc0 ls0 ws0">hadoop<span class="_ _3d"> </span>开发者》将与您一路同行,共同进步。</div><div class="t m7 x7 he y2b ff4 fs3 fc0 sc0 ls0 ws0">分<span class="_ _37"></span>享<span class="_ _37"></span>、自<span class="_ _37"></span>由<span class="_ _2d"></span>、开<span class="_ _37"></span>放<span class="_ _2d"></span>,<span class="_ _3e"> </span>《</div><div class="t m1 xe he y2b ff4 fs3 fc0 sc0 ls0 ws0">Hadoop<span class="_ _16"> </span>开发者》<span class="_ _8"></span>将秉承这一开源社区的血脉和传统</div><div class="t m8 xf he y2b ff4 fs3 fc0 sc0 ls0 ws0">,</div><div class="t m1 x1 he y2c ff4 fs3 fc0 sc0 ls0 ws0">传承<span class="_ _3f"> </span>“<span class="_ _12"> </span>百家争鸣</div><div class="t m8 x10 he y2c ff4 fs3 fc0 sc0 ls0 ws0">”</div><div class="t m1 x11 he y2c ff4 fs3 fc0 sc0 ls0 ws0">,<span class="_ _9"></span>在思想交流和技术的切磋中促进<span class="_ _40"> </span>hadoop<span class="_ _3d"> </span>社区的发展,期<span class="_ _41"> </span>待</div><div class="t m1 x1 he y2d ff4 fs3 fc0 sc0 ls0 ws0">Hadoop<span class="_ _16"> </span>这一尚待开垦的田野里<span class="_ _42"> </span>“<span class="_ _12"> </span>百花齐放</div><div class="t m8 x12 he y2d ff4 fs3 fc0 sc0 ls0 ws0">”</div><div class="t m1 x13 he y2d ff4 fs3 fc0 sc0 ls0 ws0">。</div><div class="t m1 x7 he y2e ff4 fs3 fc0 sc0 ls0 ws0">最后,<span class="_ _8"></span>感谢<span class="_ _8"></span>《<span class="_ _43"> </span>Hadoop<span class="_ _16"> </span>开发者》<span class="_ _8"></span>编辑组所有同仁们,<span class="_ _44"></span>彼此素未蒙面的爱好<span class="_ _45"> </span>者</div><div class="t m1 x1 he y2f ff4 fs3 fc0 sc0 ls0 ws0">能聚到一起,为了一<span class="_ _1b"></span>个共同的<span class="_ _1b"></span>爱好策划<span class="_ _1b"></span>这本杂志,这<span class="_ _1b"></span>本身就<span class="_ _1b"></span>是<span class="_ _46"> </span>Hadoop<span class="_ _16"> </span>魅力的</div><div class="t m1 x1 he y30 ff4 fs3 fc0 sc0 ls0 ws0">体现。当<span class="_ _1b"></span>然,<span class="_ _1b"></span>也要<span class="_ _1b"></span>感谢大<span class="_ _1b"></span>师<span class="_ 
_47"> </span>Doug<span class="_ _22"> </span>Cutting<span class="_ _23"> </span>和<span class="_ _48"> </span>Hadoop<span class="_ _16"> </span>社区的开<span class="_ _1b"></span>源者们<span class="_ _1b"></span>,因为</div><div class="t m1 x1 he y31 ff4 fs3 fc0 sc0 ls0 ws0">有了您,这里才变得如此精彩!</div><div class="t m1 x14 he y32 ff4 fs3 fc0 sc0 ls0 ws0">《<span class="_ _12"> </span>Hadoop<span class="_ _16"> </span>开发者》编辑组<span class="_ _49"> </span>2010-1-27</div></div><div class="pi" data-data='{"ctm":[1.612022,0.000000,0.000000,1.612022,0.000000,0.000000]}'></div></div>
<div id="pf4" class="pf w0 h0" data-page-no="4"><div class="pc pc4 w0 h0"><img class="bi x0 y0 w1 h1" alt="" src="https://static.pudn.com/prod/directory_preview_static/628020919b6e2b6d5576e3d6/bg4.jpg"><div class="t m1 x15 hf y33 ff5 fs6 fc0 sc0 ls0 ws0">目<span class="_ _4a"></span>录</div><div class="c x16 y34 w5 h10"><div class="t m1 x3 h11 y35 ff4 fs4 fc0 sc0 ls0 ws0">1<span class="_ _d"> </span><span class="fc3">Had<span class="_ _9"></span>oop<span class="_ _11"> </span>介绍</span></div><div class="t m1 x3 h11 y36 ff4 fs4 fc0 sc0 ls0 ws0">2<span class="_ _d"> </span><span class="fc3">Had<span class="_ _9"></span>oop<span class="_ _11"> </span>在国内应用情<span class="_ _9"></span>况</span></div><div class="t m1 x3 h11 y37 ff4 fs4 fc0 sc0 ls0 ws0">3<span class="_ _d"> </span><span class="fc3">Had<span class="_ _9"></span>oop<span class="_ _11"> </span>源代码<span class="_ _4b"> </span>eclipse<span class="_ _4c"> </span>编译教程</span></div><div class="t m1 x3 h11 y38 ff4 fs4 fc0 sc0 ls0 ws0">7<span class="_ _d"> </span><span class="fc3">在<span class="_ _12"> </span>Windows<span class="_ _16"> </span>上安装<span class="_ _4b"> </span>Ha<span class="_ _1b"></span>doop<span class="_ _11"> </span>教程</span></div><div class="t m1 x3 h11 y39 ff4 fs4 fc0 sc0 ls0 ws0">1<span class="_ _4d"> </span>3<span class="_ _4e"> </span><span class="fc3">在<span class="_ _12"> </span>Linux<span class="_ _4f"> </span>上安装<span class="_ _4b"> </span>Hadoop<span class="_ _11"> </span>教程</span></div><div class="t m1 x3 h11 y3a ff4 fs4 fc0 sc0 ls0 ws0">19<span class="_ _50"> </span><span class="fc3">在<span class="_ _12"> </span>Windows<span class="_ _51"> </span>上使用<span class="_ _4b"> </span>eclipse<span class="_ _4c"> </span>编写<span class="_ _52"> </span>Hadoop<span class="_ _11"> </span>应用程序</span></div><div class="t m1 x3 h11 y3b ff4 fs4 fc0 sc0 ls0 ws0">24<span class="_ _50"> </span><span class="fc3">在<span class="_ _12"> </span>Windows<span class="_ _51"> </span>中使用<span class="_ _4b"> 
</span>Cygwin<span class="_ _53"> </span>安装<span class="_ _52"> </span>HBase</span></div><div class="t m1 x3 h11 y3c ff4 fs4 fc0 sc0 ls0 ws0">28<span class="_ _50"> </span><span class="fc3">Nutch<span class="_ _54"> </span>与<span class="_ _12"> </span>Ha<span class="_ _1b"></span>doop<span class="_ _11"> </span>的整合与<span class="_ _9"></span>部署</span></div><div class="t m1 x3 h11 y3d ff4 fs4 fc0 sc0 ls0 ws0">31<span class="_ _50"> </span><span class="fc3">在<span class="_ _12"> </span>Windows<span class="_ _16"> </span>eclipse<span class="_ _4c"> </span>上单步调试<span class="_ _55"> </span>Hive<span class="_ _3f"> </span>教程</span></div><div class="t m1 x3 h11 y3e ff4 fs4 fc0 sc0 ls0 ws0">38<span class="_ _50"> </span><span class="fc3">Hive<span class="_ _3f"> </span>应用介绍</span></div><div class="t m1 x3 h11 y3f ff4 fs4 fc0 sc0 ls0 ws0">42<span class="_ _50"> </span><span class="fc3">Hive<span class="_ _3f"> </span>执行计划解析</span></div><div class="t m1 x3 h11 y40 ff4 fs4 fc0 sc0 ls0 ws0">50<span class="_ _50"> </span><span class="fc3">MapR<span class="_ _9"></span>ed<span class="_ _9"></span>uce<span class="_ _56"> </span>中的<span class="_ _52"> </span>Shuf<span class="_ _9"></span>fle<span class="_ _b"> </span>和<span class="_ _12"> </span>Sort<span class="_ _57"> </span>分析</span></div><div class="t m1 x3 h11 y41 ff4 fs4 fc0 sc0 ls0 ws0">53<span class="_ _50"> </span><span class="fc3">海量数据存储<span class="_ _9"></span>和计算平<span class="_ _9"></span>台的调试<span class="_ _9"></span>器研究</span></div><div class="t m1 x3 h11 y42 ff4 fs4 fc0 sc0 ls0 ws0">56<span class="_ _50"> </span><span class="fc3">探讨<span class="_ _52"> </span>Map<span class="_ _9"></span>Re<span class="_ _9"></span>duce<span class="_ _56"> </span>模型的改<span class="_ _9"></span>进</span></div><div class="t m1 x3 h11 y43 ff4 fs4 fc0 sc0 ls0 ws0">58<span class="_ _50"> </span><span class="fc3">运行<span class="_ _52"> </span>eclipse<span class="_ _4c"> </span>编译出的<span class="_ _58"> </span>Hadoop<span class="_ _11"> 
</span>框架</span></div><div class="t m1 x3 h11 y44 ff4 fs4 fc0 sc0 ls0 ws0">59<span class="_ _50"> </span><span class="fc3">表关联在<span class="_ _58"> </span>MapR<span class="_ _9"></span>ed<span class="_ _9"></span>uce<span class="_ _56"> </span>上的实现</span></div><div class="t m1 x3 h11 y45 ff4 fs4 fc0 sc0 ls0 ws0">63<span class="_ _50"> </span><span class="fc3">Hadoop<span class="_ _11"> </span>计算平台和<span class="_ _55"> </span>Hadoop<span class="_ _11"> </span>数据仓库<span class="_ _9"></span>的区别</span></div></div><a class="l" rel='nofollow' onclick='return false;'><div class="d m2"></div></a><a class="l" rel='nofollow' onclick='return false;'><div class="d m2"></div></a><a class="l" rel='nofollow' onclick='return false;'><div class="d m2"></div></a><a class="l" rel='nofollow' onclick='return false;'><div class="d m2"></div></a><a class="l" rel='nofollow' onclick='return false;'><div class="d m2"></div></a><a class="l" rel='nofollow' onclick='return false;'><div class="d m2"></div></a><a class="l" rel='nofollow' onclick='return false;'><div class="d m2"></div></a><a class="l" rel='nofollow' onclick='return false;'><div class="d m2"></div></a><a class="l" rel='nofollow' onclick='return false;'><div class="d m2"></div></a><a class="l" rel='nofollow' onclick='return false;'><div class="d m2"></div></a><a class="l" rel='nofollow' onclick='return false;'><div class="d m2"></div></a><a class="l" rel='nofollow' onclick='return false;'><div class="d m2"></div></a><a class="l" rel='nofollow' onclick='return false;'><div class="d m2"></div></a><a class="l" rel='nofollow' onclick='return false;'><div class="d m2"></div></a><a class="l" rel='nofollow' onclick='return false;'><div class="d m2"></div></a><a class="l" rel='nofollow' onclick='return false;'><div class="d m2"></div></a><a class="l" rel='nofollow' onclick='return false;'><div class="d m2"></div></a></div><div class="pi" data-data='{"ctm":[1.612022,0.000000,0.000000,1.612022,0.000000,0.000000]}'></div></div>
<div id="pf5" class="pf w0 h0" data-page-no="5"><div class="pc pc5 w0 h0"><img class="bi x0 y0 w1 h1" alt="" src="https://static.pudn.com/prod/directory_preview_static/628020919b6e2b6d5576e3d6/bg5.jpg"><div class="c x0 y1 w0 h2"><div class="t m0 x1 h3 y2 ff1 fs0 fc0 sc0 ls0 ws0">bbs.hadoopor.com<span class="_ _0"> </span>--------had<span class="_ _1b"></span>oop<span class="_ _59"> </span>技术论坛</div></div><div class="t m1 x1 h4 y3 ff1 fs1 fc0 sc0 ls0 ws0">--------------------------------------------------------------------------------------------</div><div class="t m1 x1 h4 y4 ff1 fs1 fc0 sc0 ls0 ws0">创刊号<span class="_ _2"> </span>2010<span class="_ _3"> </span>年<span class="_ _4"> </span>1<span class="_ _5"> </span>月<span class="_ _6"> </span><span class="ff2">-<span class="_ _38"> </span>1<span class="_ _5a"> </span>-</span></div><div class="t m1 x17 h12 y46 ff6 fs7 fc0 sc0 ls0 ws0">Hadoop</div><div class="t m1 x17 h12 y47 ff6 fs7 fc0 sc0 ls0 ws0">Hadoop</div><div class="t m1 x17 h12 y48 ff6 fs7 fc0 sc0 ls0 ws0">Hadoop</div><div class="t m1 x17 h13 y46 ff6 fs7 fc0 sc0 ls0 ws0">Hadoop<span class="_ _5b"> </span><span class="ff7">介绍</span></div><div class="t m1 x18 h13 y47 ff7 fs7 fc0 sc0 ls0 ws0">介绍</div><div class="t m1 x18 h13 y48 ff7 fs7 fc0 sc0 ls0 ws0">介绍</div><div class="t m1 x18 h13 y46 ff7 fs7 fc0 sc0 ls0 ws0">介绍</div><div class="t m1 x7 h14 y49 ff2 fs4 fc0 sc0 ls0 ws0">Hadoop<span class="_ _5c"> </span><span class="ff1">是<span class="_ _12"> </span></span>A<span class="_ _1b"></span>pache<span class="_ _22"> </span><span class="ff1">下的一<span class="_ _1b"></span>个项目<span class="_ _1b"></span>,由<span class="_ _5d"> </span><span class="ff2">HDFS<span class="_ _5e"> </span></span>、<span class="_ _5f"> </span><span class="ff2">MapReduce<span class="_ _60"> </span></span>、<span class="_ _5f"> </span><span class="ff2">HBase<span class="_ _19"> </span></span>、<span class="_ _5f"> </span><span class="ff2">Hiv<span class="_ _9"></span>e<span class="_ _61"> 
</span></span>和<span class="_ _12"> </span><span class="ff2">ZooK<span class="_ _9"></span>eeper</span></span></div><div class="t m1 x1 h14 y4a ff1 fs4 fc0 sc0 ls0 ws0">等成员组成。<span class="_ _9"></span>其中,<span class="_ _62"> </span><span class="ff2">HDFS<span class="_ _63"> </span></span>和<span class="_ _64"> </span><span class="ff2">MapReduce<span class="_ _65"> </span></span>是两个最基础<span class="_ _9"></span>最重要的<span class="_ _9"></span>成员。</div><div class="t m1 x7 h14 y4b ff2 fs4 fc0 sc0 ls0 ws0">HDFS<span class="_ _63"> </span><span class="ff1">是<span class="_ _64"> </span></span>Google<span class="_ _66"> </span>GFS<span class="_ _67"> </span><span class="ff1">的开源版本,一个高度容错的分布式文件系统,它能够提供高吞</span></div><div class="t m1 x1 h14 y4c ff1 fs4 fc0 sc0 ls0 ws0">吐量的数据访<span class="_ _9"></span>问,适<span class="_ _9"></span>合存储海<span class="_ _9"></span>量(<span class="_ _68"> </span><span class="ff2">PB<span class="_ _69"> </span></span>级)的大文<span class="_ _9"></span>件(通常<span class="_ _9"></span>超过<span class="_ _6a"> </span><span class="ff2">64M</span></div><div class="t m4 x19 h14 y4c ff1 fs4 fc0 sc0 ls0 ws0">)<span class="_ _1f"> </span>,<span class="_ _2d"></span>其<span class="_ _1b"></span>原<span class="_ _2d"></span>理<span class="_ _2d"></span>如<span class="_ _2d"></span>下<span class="_ _2d"></span>图<span class="_ _2d"></span>所<span class="_ _1b"></span>示</div><div class="t m8 x1a h14 y4c ff1 fs4 fc0 sc0 ls0 ws0">:</div><div class="t m1 x7 h14 y4d ff1 fs4 fc0 sc0 ls0 ws0">采用<span class="_ _52"> </span><span class="ff2">Master/<span class="_ _9"></span>Slave<span class="_ _6b"> </span></span>结构。<span class="_ _13"> </span><span class="ff2">NameNode<span class="_ _6c"> </span></span>维护集群内的<span class="_ _9"></span>元数据,<span class="_ _9"></span>对外提供<span class="_ _9"></span>创建、打开、<span class="_ _9"></span>删除</div><div class="t m1 x1 h14 y4e ff1 fs4 fc0 sc0 ls0 ws0">和重命名文件<span class="_ _9"></span>或目录的<span class="_ _9"></span>功能。<span class="_ _6d"> </span><span 
class="ff2">DataNode<span class="_ _6e"> </span></span>存储数据,<span class="_ _6f"> </span>并提负责<span class="_ _9"></span>处理数据<span class="_ _9"></span>的读写请<span class="_ _9"></span>求。<span class="_ _70"> </span><span class="ff2">DataNo<span class="_ _71"> </span>de</span></div><div class="t m1 x1 h14 y4f ff1 fs4 fc0 sc0 ls0 ws0">定期向<span class="_ _4b"> </span><span class="ff2">NameNode<span class="_ _6c"> </span></span>上报心跳,<span class="_ _72"> </span><span class="ff2">NameNode<span class="_ _6c"> </span></span>通过响应心跳来控制<span class="_ _73"> </span><span class="ff2">DataNode<span class="_ _74"> </span></span>。</div><div class="t m1 x7 h14 y50 ff2 fs4 fc0 sc0 ls0 ws0">InfoW<span class="_ _44"></span>or<span class="_ _9"></span>d<span class="_ _11"> </span><span class="ff1">将<span class="_ _12"> </span></span>MapReduce<span class="_ _65"> </span><span class="ff1">评为<span class="_ _75"> </span></span>2009<span class="_ _10"> </span><span class="ff1">年十大新<span class="_ _2d"></span>兴技术的<span class="_ _2d"></span>冠军。<span class="_ _76"> </span><span class="ff2">MapReduce<span class="_ _65"> </span></span>是大规模<span class="_ _1b"></span>数据</span></div><div class="t m1 x1 h14 y51 ff1 fs4 fc0 sc0 ls0 ws0">(<span class="_ _5f"> </span><span class="ff2">TB<span class="_ _77"> </span></span>级)计算的利器,<span class="_ _78"> </span><span class="ff2">Map<span class="_ _67"> </span></span>和<span class="_ _64"> </span><span class="ff2">Reduce<span class="_ _79"> </span></span>是它的主要思想,来源于函数式编程语言,它的原</div><div class="t m1 x1 h14 y52 ff1 fs4 fc0 sc0 ls0 ws0">理如下图所示<span class="_ _9"></span>:</div><div class="t m1 x7 h14 y53 ff2 fs4 fc0 sc0 ls0 ws0">Map<span class="_ _67"> </span><span class="ff1">负责将数据打散,<span class="_ _7a"> </span></span>Reduce</div><div class="t m1 x1 h14 y54 ff1 fs4 fc0 sc0 ls0 ws0">负责对数据进<span class="_ _9"></span>行聚集,<span class="_ _9"></span>用户只需<span class="_ _9"></span>要实</div><div class="t m1 x1 h14 y55 ff1 fs4 fc0 sc0 ls0 ws0">现<span class="_ _64"> </span><span 
class="ff2">map<span class="_ _7b"> </span></span>和<span class="_ _64"> </span><span class="ff2">reduce<span class="_ _2"> </span></span>两个<span class="_ _9"></span>接口,即<span class="_ _9"></span>可完成</div><div class="t m1 x1 h14 y56 ff2 fs4 fc0 sc0 ls0 ws0">TB<span class="_ _77"> </span><span class="ff1">级数据的计算<span class="_ _9"></span>,常见的<span class="_ _9"></span>应用包括<span class="_ _9"></span>:</span></div><div class="t m1 x1 h14 y57 ff1 fs4 fc0 sc0 ls0 ws0">日志分析和数<span class="_ _9"></span>据挖掘等<span class="_ _9"></span>数据分析<span class="_ _9"></span>应用。</div><div class="t m1 x1 h14 y58 ff1 fs4 fc0 sc0 ls0 ws0">另外,还可用<span class="_ _9"></span>于科学数<span class="_ _9"></span>据计算,<span class="_ _9"></span>如圆周</div><div class="t m1 x1 h14 y59 ff1 fs4 fc0 sc0 ls0 ws0">率<span class="_ _64"> </span><span class="ff2">PI<span class="_ _5f"> </span></span>的计<span class="_ _9"></span>算等。</div><div class="t m1 x7 h14 y5a ff2 fs4 fc0 sc0 ls0 ws0">Hadoop<span class="_ _5c"> </span>MapReduce<span class="_ _65"> </span><span class="ff1">的实现也采用</span></div><div class="t m1 x1 h14 y5b ff1 fs4 fc0 sc0 ls0 ws0">了<span class="_ _64"> </span><span class="ff2">Master/Sl<span class="_ _9"></span>ave<span class="_ _6b"> </span></span>结构。<span class="_ _13"> </span><span class="ff2">Master<span class="_ _7c"> </span></span>叫做</div><div class="t m1 x1 h14 y5c ff2 fs4 fc0 sc0 ls0 ws0">JobT<span class="_ _9"></span>racker<span class="_ _7d"> </span><span class="ff1">,而<span class="_ _52"> </span></span>Slave<span class="_ _7e"> </span><span class="ff1">叫做<span class="_ _52"> </span></span>T<span class="_ _44"></span>askT<span class="_ _44"></span>racker<span class="_ _7f"> </span><span class="ff1">。</span></div><div class="t m1 x7 h14 y5d ff1 fs4 fc0 sc0 ls0 ws0">用户提交的计<span class="_ _9"></span>算叫做<span class="_ _80"> </span><span class="ff2">Job<span class="_ _15"> </span></span>,每一个</div><div class="t m1 x1 h14 y5e ff2 fs4 fc0 sc0 ls0 ws0">Job<span class="_ _81"> </span><span 
class="ff1">会被划分成若<span class="_ _9"></span>干个<span class="_ _82"> </span></span>T<span class="_ _44"></span>asks<span class="_ _d"> </span><span class="ff1">。<span class="_ _83"> </span></span>JobT<span class="_ _9"></span>racker</div><div class="t m1 x1 h14 y5f ff1 fs4 fc0 sc0 ls0 ws0">负责<span class="_ _52"> </span><span class="ff2">Job<span class="_ _81"> </span></span>和<span class="_ _64"> </span><span class="ff2">T<span class="_ _44"></span>asks<span class="_ _84"> </span></span>的调度,而<span class="_ _55"> </span><span class="ff2">T<span class="_ _44"></span>askT<span class="_ _9"></span>r<span class="_ _9"></span>acker</span></div><div class="t m1 x1 h14 y60 ff1 fs4 fc0 sc0 ls0 ws0">负责执行<span class="_ _58"> </span><span class="ff2">T<span class="_ _9"></span>a<span class="_ _9"></span>sks<span class="_ _d"> </span></span>。</div></div><div class="pi" data-data='{"ctm":[1.612022,0.000000,0.000000,1.612022,0.000000,0.000000]}'></div></div>