<!doctype html>
<!-- Markup generated by pdf2htmlEX (see the generator meta tag below). -->
<html lang="zh-Hans" xmlns="http://www.w3.org/1999/xhtml">
<head>
<meta charset="utf-8">
<meta name="generator" content="pdf2htmlEX">
<meta http-equiv="X-UA-Compatible" content="IE=edge,chrome=1">
<!-- Two shared stylesheets, then raw.css from the same directory as the page background images. -->
<link rel="stylesheet" href="https://static.pudn.com/base/css/base.min.css">
<link rel="stylesheet" href="https://static.pudn.com/base/css/fancy.min.css">
<link rel="stylesheet" href="https://static.pudn.com/prod/directory_preview_static/6268177f4f8811599ef4a3dd/raw.css">
<!-- Loaded without defer/async: the inline script below uses the pdf2htmlEX global immediately (presumably defined by pdf2htmlEX.min.js). -->
<script src="https://static.pudn.com/base/js/compatibility.min.js"></script>
<script src="https://static.pudn.com/base/js/pdf2htmlEX.min.js"></script>
<script>
// Best effort: a failure here must not stop the rest of the document from loading,
// but it is reported (when a console is available) instead of being discarded.
try{
pdf2htmlEX.defaultViewer = new pdf2htmlEX.Viewer({});
}catch(e){
if(window.console && console.warn){
console.warn("pdf2htmlEX viewer initialisation failed:", e);
}
}
</script>
<title>第 3 章 Hadoop 基础</title>
</head>
<body>
<!-- Sidebar with an empty outline container; hidden via inline style. -->
<div id="sidebar" style="display: none">
<div id="outline">
</div>
</div>
<!-- Page 1: title slide (book title, series line, chapter heading "第 3 章 Hadoop 基础", publisher). -->
<div id="pf1" class="pf w0 h0" data-page-no="1"><div class="pc pc1 w0 h0"><img class="bi x0 y0 w1 h1" alt="" src="https://static.pudn.com/prod/directory_preview_static/6268177f4f8811599ef4a3dd/bg1.jpg"><div class="c x0 y1 w2 h2"><div class="t m0 x1 h3 y2 ff1 fs0 fc0 sc0 ls0 ws0"><span class="fc2 sc0">P</span><span class="fc2 sc0">1</span><span class="fc2 sc0">9</span><span class="fc2 sc0"> </span></div><div class="t m0 x2 h4 y3 ff2 fs1 fc0 sc0 ls0 ws0"><span class="fc2 sc0">第</span><span class="_ _0"> </span><span class="ff1"><span class="fc2 sc0">3</span><span class="_ _0"> </span></span><span class="fc2 sc0">章 </span><span class="fc2 sc0"> </span><span class="_ _0"> </span><span class="ff1"><span class="fc2 sc0">H</span><span class="fc2 sc0">a</span><span class="fc2 sc0">d</span><span class="fc2 sc0">oo</span><span class="fc2 sc0">p</span><span class="_ _0"> </span></span><span class="fc2 sc0">基础</span></div></div><div class="c x0 y4 w3 h5"><div class="t m0 x3 h6 y5 ff2 fs2 fc0 sc0 ls0 ws0">《大数据技术与应用基础》</div><div class="t m0 x4 h6 y6 ff3 fs2 fc0 sc0 ls0 ws0">21<span class="_ _1"> </span><span class="ff2">世纪高<span class="fc2 sc0">等院校“</span><span class="fc2 sc0">云计</span>算和大数据”人才培养规划教材</span></div><div class="t m0 x5 h7 y7 ff2 fs3 fc0 sc0 ls0 ws0">第<span class="_ _2"> </span><span class="ff3">3</span></div><div class="t m0 x5 h7 y8 ff2 fs3 fc0 sc0 ls0 ws0">章 </div><div class="t m0 x6 h8 y9 ff4 fs4 fc0 sc0 ls0 ws0">Hadoop<span class="_ _3"> </span><span class="ff2 sc1">基础</span></div><div class="t m0 x7 h6 ya ff2 fs2 fc1 sc0 ls0 ws0">人民邮电出版社</div></div></div><div class="pi" data-data='{"ctm":[0.999488,0.000000,0.000000,0.999488,0.000000,0.000000]}'></div></div>
<!-- The body and html end tags are deliberately omitted here: further page divs follow and belong inside body. Both end tags are optional in HTML. -->
<!-- Page 2: learning objectives slide (能力 / CAPACITY / 要求) with four objectives about Hadoop. -->
<div id="pf2" class="pf w0 h0" data-page-no="2"><div class="pc pc2 w0 h0"><img class="bi x0 y0 w1 h1" alt="" src="https://static.pudn.com/prod/directory_preview_static/6268177f4f8811599ef4a3dd/bg2.jpg"><div class="c x0 y1 w2 h2"><div class="t m0 x1 h3 y2 ff1 fs0 fc0 sc0 ls0 ws0"><span class="fc2 sc0">P</span><span class="fc2 sc0">1</span><span class="fc2 sc0">9</span><span class="fc2 sc0"> </span></div><div class="t m0 x2 h4 y3 ff2 fs1 fc0 sc0 ls0 ws0"><span class="fc2 sc0">第</span><span class="_ _0"> </span><span class="ff1"><span class="fc2 sc0">3</span><span class="_ _0"> </span></span><span class="fc2 sc0">章 </span><span class="fc2 sc0"> </span><span class="_ _0"> </span><span class="ff1"><span class="fc2 sc0">H</span><span class="fc2 sc0">a</span><span class="fc2 sc0">d</span><span class="fc2 sc0">oo</span><span class="fc2 sc0">p</span><span class="_ _0"> </span></span><span class="fc2 sc0">基础</span></div></div><div class="c x0 y4 w3 h5"><div class="t m0 x8 h9 yb ff2 fs5 fc3 sc0 ls0 ws0">能力</div><div class="t m0 x9 ha yc ff5 fs6 fc3 sc0 ls0 ws0">CAP<span class="_ _4"></span>ACITY</div><div class="t m0 xa hb yd ff2 fs7 fc3 sc0 ls0 ws0">要求</div><div class="t m0 xb hc ye ff2 fs8 fc4 sc0 ls0 ws0">了解什么是<span class="_ _5"> </span><span class="ff1">Hadoop<span class="_ _5"> </span></span>。</div><div class="t m0 xb hc yf ff2 fs8 fc4 sc0 ls0 ws0">理解<span class="_ _5"> </span><span class="ff1">Hadoop<span class="_ _5"> </span></span>的基本原理。</div><div class="t m0 xc hc y10 ff2 fs8 fc4 sc0 ls0 ws0">了解<span class="_ _5"> </span><span class="ff1">Hadoop<span class="_ _5"> </span></span>社区各工具的作用。</div><div class="t m0 xb hc y11 ff2 fs8 fc4 sc0 ls0 ws0">掌握<span class="_ _5"> </span><span class="ff1">Hadoop<span class="_ _5"> </span></span>单机和集群的安装配置<span class="_ _6"></span>。</div></div></div><div class="pi" data-data='{"ctm":[0.999488,0.000000,0.000000,0.999488,0.000000,0.000000]}'></div></div>
<!-- Page 3: contents slide (内容 / CONTENTS / 导航) listing four section titles. "Hadoop 概述" is the only entry with colour class fc0 (the others use fc5), presumably marking the current section. -->
<div id="pf3" class="pf w0 h0" data-page-no="3"><div class="pc pc3 w0 h0"><img class="bi x0 y0 w1 h1" alt="" src="https://static.pudn.com/prod/directory_preview_static/6268177f4f8811599ef4a3dd/bg3.jpg"><div class="c x0 y4 w4 h5"><div class="t m0 x1 h3 y12 ff1 fs0 fc0 sc0 ls0 ws0"><span class="fc2 sc0">P</span><span class="fc2 sc0">1</span><span class="fc2 sc0">9</span><span class="fc2 sc0"> </span></div><div class="t m0 x2 h4 y13 ff2 fs1 fc0 sc0 ls0 ws0"><span class="fc2 sc0">第</span><span class="_ _0"> </span><span class="ff1"><span class="fc2 sc0">3</span><span class="_ _0"> </span></span><span class="fc2 sc0">章 </span><span class="fc2 sc0"> </span><span class="_ _0"> </span><span class="ff1"><span class="fc2 sc0">H</span><span class="fc2 sc0">a</span><span class="fc2 sc0">d</span><span class="fc2 sc0">oo</span><span class="fc2 sc0">p</span><span class="_ _0"> </span></span><span class="fc2 sc0">基础</span></div><div class="t m0 x8 h9 yb ff2 fs5 fc3 sc0 ls0 ws0">内容</div><div class="t m0 x9 ha yc ff5 fs6 fc3 sc0 ls0 ws0">CONTENTS</div><div class="t m0 xa hb yd ff2 fs7 fc3 sc0 ls0 ws0">导航</div></div><div class="c x0 y4 w3 h5"><div class="t m0 xd hd y14 ff1 fs6 fc5 sc0 ls0 ws0">Hadoop<span class="_ _0"> </span><span class="ff2">原理</span></div><div class="t m0 xd hd y15 ff1 fs6 fc0 sc0 ls0 ws0">Hadoop<span class="_ _0"> </span><span class="ff2">概述</span></div><div class="t m0 xd hd y16 ff1 fs6 fc5 sc0 ls0 ws0">Hadoop<span class="_ _0"> </span><span class="ff2">安装与配置</span></div><div class="t m0 xd hd y17 ff1 fs6 fc5 sc0 ls0 ws0">Hadoop<span class="_ _0"> </span><span class="ff2">生态系统简介</span></div></div></div><div class="pi" data-data='{"ctm":[0.999488,0.000000,0.000000,0.999488,0.000000,0.000000]}'></div></div>
<!-- Page 4: section "一、Hadoop 概述": a short definition of Hadoop followed by a list of mainstream distributions (Cloudera, Hortonworks, MapR, Amazon EMR). -->
<div id="pf4" class="pf w0 h0" data-page-no="4"><div class="pc pc4 w0 h0"><img class="bi x0 y0 w1 h1" alt="" src="https://static.pudn.com/prod/directory_preview_static/6268177f4f8811599ef4a3dd/bg4.jpg"><div class="c x0 y1 w2 h2"><div class="t m0 x1 h3 y2 ff1 fs0 fc0 sc0 ls0 ws0">P19 </div><div class="t m0 x2 h4 y3 ff2 fs1 fc0 sc0 ls0 ws0">第<span class="_ _0"> </span><span class="ff1">3<span class="_ _0"> </span></span>章 <span class="_ _0"> </span><span class="ff1">Hadoop<span class="_ _0"> </span></span>基础</div></div><div class="c x0 y4 w3 h5"><div class="t m0 xe h6 y18 ff2 fs9 fc0 sc0 ls0 ws0">一、<span class="_ _7"> </span><span class="ff1 fs2">Hadoop<span class="_ _1"> </span><span class="ff2">概述</span></span></div><div class="t m0 xf he y19 ff3 fsa fc6 sc0 ls0 ws0"> Hadoo<span class="_ _6"></span>p<span class="_ _8"> </span><span class="ff2">是一个由<span class="_ _0"> </span></span>Apache<span class="_ _8"> </span><span class="ff2">基金<span class="_ _6"></span>会所开发的分<span class="_ _6"></span>布式系统<span class="_ _6"></span>基础架构<span class="_ _6"></span>。用户可<span class="_ _6"></span>以在不了解<span class="_ _6"></span>分布式底<span class="_ _6"></span>层细节的</span></div><div class="t m0 xf he y1a ff2 fsa fc6 sc0 ls0 ws0">情况下<span class="_ _6"></span>,开发分布<span class="_ _6"></span>式程序,<span class="_ _6"></span>充分利用集<span class="_ _6"></span>群的威力<span class="_ _6"></span>进行高速运<span class="_ _6"></span>算和存储</div><div class="t m0 x10 hf y1b ff3 fsb fc6 sc0 ls0 ws0">[2]</div><div class="t m0 x11 he y1a ff2 fsa fc6 sc0 ls0 ws0">。</div><div class="t m0 xf he y1c ff2 fsa fc6 sc0 ls0 ws0">现将各<span class="_ _6"></span>个主流的发<span class="_ _6"></span>行版本介<span class="_ _6"></span>绍如下<span class="_ _8"> </span><span class="ff3">;</span></div><div class="t m0 x12 h6 y1d ff3 fs2 fc7 sc0 ls0 ws0">Cloudera<span class="_ _1"> </span><span class="ff2">:最成型的<span class="_ _9"></span>发行版本,拥有最多的部署案例</span></div><div class="t m0 x12 h6 y1e ff3 fs2 fc7 sc0 ls0 ws0">Hortonworks<span class="_ _1"> </span><span class="ff2">:<span class="_ _1"> </span></span>100%<span class="_ _1"> </span><span class="ff2">开源的<span class="_ _1"> </span></span>Apache Had<span class="_ _9"></span>oop<span class="_ _1"> </span><span class="ff2">唯一提供商。</span></div><div class="t m0 x12 h6 y1f ff3 fs2 fc7 sc0 ls0 ws0">MapR<span class="_ _1"> </span><span class="ff2">:与竞争者相比,它使用了一些不同的概念,特别是为了获取更</span></div><div class="t m0 x12 h6 y20 ff2 fs2 fc7 sc0 ls0 ws0">好的性能和易用性而支持本地<span class="_ _1"> </span><span class="ff3">UNIX<span class="_ _1"> </span></span>文件系统而不是<span class="_ _1"> </span><span class="ff3">HDFS<span class="_ _1"> </span></span>(使用非开源的</div><div class="t m0 x12 h6 y21 ff2 fs2 fc7 sc0 ls0 ws0">组件)。</div><div class="t m0 x12 h6 y22 ff3 fs2 fc7 sc0 ls0 ws0">Amazon Elastic Map Redu<span class="_ _9"></span>ce<span class="_ _1"> </span><span class="ff2">(<span class="_ _1"> </span></span>EMR<span class="_ _a"> </span><span class="ff2">):区别于其他提供商的是,这是一</span></div><div class="t m0 x12 h6 y23 ff2 fs2 fc7 sc0 ls0 ws0">个托管的解决方案,其运行在由<span class="_ _1"> </span><span class="ff3">Amazon El<span class="_ _9"></span>astic Compute Cloud<span class="_ _1"> </span><span class="ff2">(<span class="_ _1"> </span></span>Amazon </span></div><div class="t m0 x12 h6 y24 ff3 fs2 fc7 sc0 ls0 ws0">EC2<span class="_ _1"> </span><span class="ff2">)和<span class="_ _1"> </span></span>Amazon Simple Storage Se<span class="_ _9"></span>rvice<span class="_ _1"> </span><span class="ff2">(<span class="_ _1"> </span></span>Amazon S3<span class="_ _1"> </span><span class="ff2">)组成的网络规模的</span></div><div class="t m0 x12 h6 y25 ff2 fs2 fc7 sc0 ls0 ws0">基础设施之上。</div></div></div><div class="pi" data-data='{"ctm":[0.999488,0.000000,0.000000,0.999488,0.000000,0.000000]}'></div></div>
<!-- Page 5: contents slide (内容 / CONTENTS / 导航) listing the same four section titles. Here "Hadoop 原理" is the only entry with colour class fc0 (the others use fc5), presumably marking the current section. -->
<div id="pf5" class="pf w0 h0" data-page-no="5"><div class="pc pc5 w0 h0"><img class="bi x0 y0 w1 h1" alt="" src="https://static.pudn.com/prod/directory_preview_static/6268177f4f8811599ef4a3dd/bg5.jpg"><div class="c x0 y4 w4 h5"><div class="t m0 x1 h3 y12 ff1 fs0 fc0 sc0 ls0 ws0"><span class="fc2 sc0">P</span><span class="fc2 sc0">1</span><span class="fc2 sc0">9</span><span class="fc2 sc0"> </span></div><div class="t m0 x2 h4 y13 ff2 fs1 fc0 sc0 ls0 ws0"><span class="fc2 sc0">第</span><span class="_ _0"> </span><span class="ff1"><span class="fc2 sc0">3</span><span class="_ _0"> </span></span><span class="fc2 sc0">章 </span><span class="fc2 sc0"> </span><span class="_ _0"> </span><span class="ff1"><span class="fc2 sc0">H</span><span class="fc2 sc0">a</span><span class="fc2 sc0">d</span><span class="fc2 sc0">oo</span><span class="fc2 sc0">p</span><span class="_ _0"> </span></span><span class="fc2 sc0">基础</span></div><div class="t m0 x8 h9 yb ff2 fs5 fc3 sc0 ls0 ws0">内容</div><div class="t m0 x9 ha yc ff5 fs6 fc3 sc0 ls0 ws0">CONTENTS</div><div class="t m0 xa hb yd ff2 fs7 fc3 sc0 ls0 ws0">导航</div></div><div class="c x0 y4 w3 h5"><div class="t m0 xd hd y26 ff1 fs6 fc5 sc0 ls0 ws0">Hadoop<span class="_ _0"> </span><span class="ff2">概述</span></div><div class="t m0 xd hd y27 ff1 fs6 fc0 sc0 ls0 ws0">Hadoop<span class="_ _0"> </span><span class="ff2">原理</span></div><div class="t m0 xd hd y16 ff1 fs6 fc5 sc0 ls0 ws0">Hadoop<span class="_ _0"> </span><span class="ff2">安装与配置</span></div><div class="t m0 xd hd y17 ff1 fs6 fc5 sc0 ls0 ws0">Hadoop<span class="_ _0"> </span><span class="ff2">生态系统简介</span></div></div></div><div class="pi" data-data='{"ctm":[0.999488,0.000000,0.000000,0.999488,0.000000,0.000000]}'></div></div>