source: proiecte/HadoopJUnit/hadoop-0.20.1/docs/cn/hadoop_archives.html @ 120

Last change on this file since 120 was 120, checked in by (none), 14 years ago

Added the mail files for the Hadoop JUNit Project

  • Property svn:executable set to *
File size: 9.5 KB
Line 
1<!DOCTYPE html PUBLIC "-//W3C//DTD HTML 4.01 Transitional//EN" "http://www.w3.org/TR/html4/loose.dtd">
2<html>
3<head>
4<META http-equiv="Content-Type" content="text/html; charset=UTF-8">
5<meta content="Apache Forrest" name="Generator">
6<meta name="Forrest-version" content="0.8">
7<meta name="Forrest-skin-name" content="pelt">
8<title>Hadoop Archives</title>
9<link type="text/css" href="skin/basic.css" rel="stylesheet">
10<link media="screen" type="text/css" href="skin/screen.css" rel="stylesheet">
11<link media="print" type="text/css" href="skin/print.css" rel="stylesheet">
12<link type="text/css" href="skin/profile.css" rel="stylesheet">
13<script src="skin/getBlank.js" language="javascript" type="text/javascript"></script><script src="skin/getMenu.js" language="javascript" type="text/javascript"></script><script src="skin/fontsize.js" language="javascript" type="text/javascript"></script>
14<link rel="shortcut icon" href="images/favicon.ico">
15</head>
16<body onload="init()">
17<script type="text/javascript">ndeSetTextSize();</script>
18<div id="top">
19<!--+
20    |breadtrail
21    +-->
22<div class="breadtrail">
23<a href="http://www.apache.org/">Apache</a> &gt; <a href="http://hadoop.apache.org/">Hadoop</a> &gt; <a href="http://hadoop.apache.org/core/">Core</a><script src="skin/breadcrumbs.js" language="JavaScript" type="text/javascript"></script>
24</div>
25<!--+
26    |header
27    +-->
28<div class="header">
29<!--+
30    |start group logo
31    +-->
32<div class="grouplogo">
33<a href="http://hadoop.apache.org/"><img class="logoImage" alt="Hadoop" src="images/hadoop-logo.jpg" title="Apache Hadoop"></a>
34</div>
35<!--+
36    |end group logo
37    +-->
38<!--+
39    |start Project Logo
40    +-->
41<div class="projectlogo">
42<a href="http://hadoop.apache.org/core/"><img class="logoImage" alt="Hadoop" src="images/core-logo.gif" title="Scalable Computing Platform"></a>
43</div>
44<!--+
45    |end Project Logo
46    +-->
47<!--+
48    |start Search
49    +-->
50<div class="searchbox">
51<form action="http://www.google.com/search" method="get" class="roundtopsmall">
52<input value="hadoop.apache.org" name="sitesearch" type="hidden"><input onFocus="getBlank (this, 'Search the site with google');" size="25" name="q" id="query" type="text" value="Search the site with google">&nbsp; 
53                    <input name="Search" value="Search" type="submit">
54</form>
55</div>
56<!--+
57    |end search
58    +-->
59<!--+
60    |start Tabs
61    +-->
62<ul id="tabs">
63<li>
64<a class="unselected" href="http://hadoop.apache.org/core/">项目</a>
65</li>
66<li>
67<a class="unselected" href="http://wiki.apache.org/hadoop">维基</a>
68</li>
69<li class="current">
70<a class="selected" href="index.html">Hadoop 0.18文档</a>
71</li>
72</ul>
73<!--+
74    |end Tabs
75    +-->
76</div>
77</div>
78<div id="main">
79<div id="publishedStrip">
80<!--+
81    |start Subtabs
82    +-->
83<div id="level2tabs"></div>
84<!--+
85    |end Endtabs
86    +-->
87<script type="text/javascript"><!--
88document.write("Last Published: " + document.lastModified);
89//  --></script>
90</div>
91<!--+
92    |breadtrail
93    +-->
94<div class="breadtrail">
95
96             &nbsp;
97           </div>
98<!--+
99    |start Menu, mainarea
100    +-->
101<!--+
102    |start Menu
103    +-->
104<div id="menu">
105<div onclick="SwitchMenu('menu_selected_1.1', 'skin/')" id="menu_selected_1.1Title" class="menutitle" style="background-image: url('skin/images/chapter_open.gif');">文档</div>
106<div id="menu_selected_1.1" class="selectedmenuitemgroup" style="display: block;">
107<div class="menuitem">
108<a href="index.html">概述</a>
109</div>
110<div class="menuitem">
111<a href="quickstart.html">快速入门</a>
112</div>
113<div class="menuitem">
114<a href="cluster_setup.html">集群搭建</a>
115</div>
116<div class="menuitem">
117<a href="hdfs_design.html">HDFS构架设计</a>
118</div>
119<div class="menuitem">
120<a href="hdfs_user_guide.html">HDFS使用指南</a>
121</div>
122<div class="menuitem">
123<a href="hdfs_permissions_guide.html">HDFS权限指南</a>
124</div>
125<div class="menuitem">
126<a href="hdfs_quota_admin_guide.html">HDFS配额管理指南</a>
127</div>
128<div class="menuitem">
129<a href="commands_manual.html">命令手册</a>
130</div>
131<div class="menuitem">
132<a href="hdfs_shell.html">FS Shell使用指南</a>
133</div>
134<div class="menuitem">
135<a href="distcp.html">DistCp使用指南</a>
136</div>
137<div class="menuitem">
138<a href="mapred_tutorial.html">Map-Reduce教程</a>
139</div>
140<div class="menuitem">
141<a href="native_libraries.html">Hadoop本地库</a>
142</div>
143<div class="menuitem">
144<a href="streaming.html">Streaming</a>
145</div>
146<div class="menupage">
147<div class="menupagetitle">Hadoop Archives</div>
148</div>
149<div class="menuitem">
150<a href="hod.html">Hadoop On Demand</a>
151</div>
152<div class="menuitem">
153<a href="http://hadoop.apache.org/core/docs/r0.18.2/api/index.html">API参考</a>
154</div>
155<div class="menuitem">
156<a href="http://hadoop.apache.org/core/docs/r0.18.2/jdiff/changes.html">API Changes</a>
157</div>
158<div class="menuitem">
159<a href="http://wiki.apache.org/hadoop/">维基</a>
160</div>
161<div class="menuitem">
162<a href="http://wiki.apache.org/hadoop/FAQ">常见问题</a>
163</div>
164<div class="menuitem">
165<a href="http://hadoop.apache.org/core/mailing_lists.html">邮件列表</a>
166</div>
167<div class="menuitem">
168<a href="http://hadoop.apache.org/core/docs/r0.18.2/releasenotes.html">发行说明</a>
169</div>
170<div class="menuitem">
171<a href="http://hadoop.apache.org/core/docs/r0.18.2/changes.html">变更日志</a>
172</div>
173</div>
174<div id="credit"></div>
175<div id="roundbottom">
176<img style="display: none" class="corner" height="15" width="15" alt="" src="skin/images/rc-b-l-15-1body-2menu-3menu.png"></div>
177<!--+
178  |alternative credits
179  +-->
180<div id="credit2"></div>
181</div>
182<!--+
183    |end Menu
184    +-->
185<!--+
186    |start content
187    +-->
188<div id="content">
189<div title="Portable Document Format" class="pdflink">
190<a class="dida" href="hadoop_archives.pdf"><img alt="PDF -icon" src="skin/images/pdfdoc.gif" class="skin"><br>
191        PDF</a>
192</div>
193<h1>Hadoop Archives</h1>
194<div id="minitoc-area">
195<ul class="minitoc">
196<li>
197<a href="#%E4%BB%80%E4%B9%88%E6%98%AFHadoop+archives%3F"> 什么是Hadoop archives? </a>
198</li>
199<li>
200<a href="#%E5%A6%82%E4%BD%95%E5%88%9B%E5%BB%BAarchive%3F"> 如何创建archive? </a>
201</li>
202<li>
203<a href="#%E5%A6%82%E4%BD%95%E6%9F%A5%E7%9C%8Barchives%E4%B8%AD%E7%9A%84%E6%96%87%E4%BB%B6%3F"> 如何查看archives中的文件? </a>
204</li>
205</ul>
206</div>
207       
208<a name="N1000D"></a><a name="%E4%BB%80%E4%B9%88%E6%98%AFHadoop+archives%3F"></a>
209<h2 class="h3"> 什么是Hadoop archives? </h2>
210<div class="section">
211<p>
212        Hadoop archives是特殊的档案格式。一个Hadoop archive对应一个文件系统目录。
213        Hadoop archive的扩展名是*.har。Hadoop archive包含元数据（形式是_index和_masterindex）和数据（part-*）文件。_index文件包含了档案中的文件的文件名和位置信息。
214        </p>
215</div>
216       
217<a name="N10017"></a><a name="%E5%A6%82%E4%BD%95%E5%88%9B%E5%BB%BAarchive%3F"></a>
218<h2 class="h3"> 如何创建archive? </h2>
219<div class="section">
220<p>
221       
222<span class="codefrag">用法: hadoop archive -archiveName name &lt;src&gt;* &lt;dest&gt;</span>
223       
224</p>
225<p>
226        由-archiveName选项指定你要创建的archive的名字。比如foo.har。archive的名字的扩展名应该是*.har。输入是文件系统的路径名，路径名的格式和平时的表达方式一样。创建的archive会保存到目标目录下。注意创建archives是一个Map/Reduce job。你应该在map reduce集群上运行这个命令。下面是一个例子：
227        </p>
228<p>
229       
230<span class="codefrag">hadoop archive -archiveName foo.har /user/hadoop/dir1 /user/hadoop/dir2 /user/zoo/</span>
231       
232</p>
233<p>
234        在上面的例子中，
235        /user/hadoop/dir1 和 /user/hadoop/dir2 会被归档到这个文件系统目录下
236        -- /user/zoo/foo.har。当创建archive时，源文件不会被更改或删除。
237        </p>
238</div>
239       
240<a name="N1002F"></a><a name="%E5%A6%82%E4%BD%95%E6%9F%A5%E7%9C%8Barchives%E4%B8%AD%E7%9A%84%E6%96%87%E4%BB%B6%3F"></a>
241<h2 class="h3"> 如何查看archives中的文件? </h2>
242<div class="section">
243<p>
244        archive作为文件系统层暴露给外界。所以所有的fs shell命令都能在archive上运行，但是要使用不同的URI。
245        另外，archive是不可改变的。所以重命名，删除和创建都会返回错误。Hadoop Archives 的URI是
246        </p>
247<p>
248<span class="codefrag">har://scheme-hostname:port/archivepath/fileinarchive</span>
249</p>
250<p>
251        如果没提供scheme-hostname，它会使用默认的文件系统。这种情况下URI是这种形式
252        </p>
253<p>
254<span class="codefrag">
255        har:///archivepath/fileinarchive</span>
256</p>
257<p>
258        这是一个archive的例子。archive的输入是/dir。这个dir目录包含文件filea，fileb。
259        把/dir归档到/user/hadoop/foo.har的命令是
260        </p>
261<p>
262<span class="codefrag">hadoop archive -archiveName foo.har /dir /user/hadoop</span>
263       
264</p>
265<p>
266        获得创建的archive中的文件列表，使用命令
267        </p>
268<p>
269<span class="codefrag">hadoop dfs -lsr har:///user/hadoop/foo.har</span>
270</p>
271<p>查看archive中的filea文件的命令-
272        </p>
273<p>
274<span class="codefrag">hadoop dfs -cat har:///user/hadoop/foo.har/dir/filea</span>
275</p>
276</div>
277       
278</div>
279<!--+
280    |end content
281    +-->
282<div class="clearboth">&nbsp;</div>
283</div>
284<div id="footer">
285<!--+
286    |start bottomstrip
287    +-->
288<div class="lastmodified">
289<script type="text/javascript"><!--
290document.write("Last Published: " + document.lastModified);
291//  --></script>
292</div>
293<div class="copyright">
294        Copyright &copy;
295         2007 <a href="http://www.apache.org/licenses/">The Apache Software Foundation.</a>
296</div>
297<!--+
298    |end bottomstrip
299    +-->
300</div>
301</body>
302</html>
Note: See TracBrowser for help on using the repository browser.