mirror of
https://github.com/xroche/httrack.git
synced 2026-05-17 08:26:14 +03:00
Fixed manual (lintian)
This commit is contained in:
@@ -51,99 +51,98 @@ offline browser : copy websites to a local directory</p>
|
||||
|
||||
|
||||
<p style="margin-left:11%; margin-top: 1em"><b>httrack [
|
||||
url ]... [ −filter ]... [ +filter ]... [ −O,
|
||||
−−path</b> ] [ <b>−w,
|
||||
−−mirror</b> ] [ <b>−W,
|
||||
−−mirror−wizard</b> ] [ <b>−g,
|
||||
−−get−files</b> ] [ <b>−i,
|
||||
−−continue</b> ] [ <b>−Y,
|
||||
−−mirrorlinks</b> ] [ <b>−P,
|
||||
−−proxy</b> ] [ <b>−%f,
|
||||
−−httpproxy−ftp[=N]</b> ] [ <b>−%b,
|
||||
−−bind</b> ] [ <b>−rN,
|
||||
−−depth[=N]</b> ] [ <b>−%eN,
|
||||
−−ext−depth[=N]</b> ] [ <b>−mN,
|
||||
−−max−files[=N]</b> ] [ <b>−MN,
|
||||
−−max−size[=N]</b> ] [ <b>−EN,
|
||||
−−max−time[=N]</b> ] [ <b>−AN,
|
||||
−−max−rate[=N]</b> ] [ <b>−%cN,
|
||||
url ]... [ −filter ]... [ +filter ]... [ −O
|
||||
−−path</b> ] [ <b>−w
|
||||
−−mirror</b> ] [ <b>−W
|
||||
−−mirror−wizard</b> ] [ <b>−g
|
||||
−−get−files</b> ] [ <b>−i
|
||||
−−continue</b> ] [ <b>−Y
|
||||
−−mirrorlinks</b> ] [ <b>−P
|
||||
−−proxy</b> ] [ <b>−%f
|
||||
−−httpproxy−ftp[=N]</b> ] [ <b>−%b
|
||||
−−bind</b> ] [ <b>−rN
|
||||
−−depth[=N]</b> ] [ <b>−%eN
|
||||
−−ext−depth[=N]</b> ] [ <b>−mN
|
||||
−−max−files[=N]</b> ] [ <b>−MN
|
||||
−−max−size[=N]</b> ] [ <b>−EN
|
||||
−−max−time[=N]</b> ] [ <b>−AN
|
||||
−−max−rate[=N]</b> ] [ <b>−%cN
|
||||
−−connection−per−second[=N]</b> ] [
|
||||
<b>−GN, −−max−pause[=N]</b> ] [
|
||||
<b>−cN, −−sockets[=N]</b> ] [
|
||||
<b>−TN, −−timeout[=N]</b> ] [
|
||||
<b>−RN, −−retries[=N]</b> ] [
|
||||
<b>−JN, −−min−rate[=N]</b> ] [
|
||||
<b>−HN, −−host−control[=N]</b> ] [
|
||||
<b>−%P, −−extended−parsing[=N]</b> ]
|
||||
[ <b>−n, −−near</b> ] [ <b>−t,
|
||||
−−test</b> ] [ <b>−%L,
|
||||
−−list</b> ] [ <b>−%S,
|
||||
−−urllist</b> ] [ <b>−NN,
|
||||
−−structure[=N]</b> ] [ <b>−%D,
|
||||
<b>−GN −−max−pause[=N]</b> ] [
|
||||
<b>−cN −−sockets[=N]</b> ] [ <b>−TN
|
||||
−−timeout[=N]</b> ] [ <b>−RN
|
||||
−−retries[=N]</b> ] [ <b>−JN
|
||||
−−min−rate[=N]</b> ] [ <b>−HN
|
||||
−−host−control[=N]</b> ] [ <b>−%P
|
||||
−−extended−parsing[=N]</b> ] [ <b>−n
|
||||
−−near</b> ] [ <b>−t
|
||||
−−test</b> ] [ <b>−%L
|
||||
−−list</b> ] [ <b>−%S
|
||||
−−urllist</b> ] [ <b>−NN
|
||||
−−structure[=N]</b> ] [ <b>−%D
|
||||
−−cached−delayed−type−check</b>
|
||||
] [ <b>−%M, −−mime−html</b> ] [
|
||||
<b>−LN, −−long−names[=N]</b> ] [
|
||||
<b>−KN, −−keep−links[=N]</b> ] [
|
||||
<b>−x, −−replace−external</b> ] [
|
||||
<b>−%x, −−disable−passwords</b> ] [
|
||||
<b>−%q,
|
||||
] [ <b>−%M −−mime−html</b> ] [
|
||||
<b>−LN −−long−names[=N]</b> ] [
|
||||
<b>−KN −−keep−links[=N]</b> ] [
|
||||
<b>−x −−replace−external</b> ] [
|
||||
<b>−%x −−disable−passwords</b> ] [
|
||||
<b>−%q
|
||||
−−include−query−string</b> ] [
|
||||
<b>−o, −−generate−errors</b> ] [
|
||||
<b>−X, −−purge−old[=N]</b> ] [
|
||||
<b>−%p, −−preserve</b> ] [ <b>−%T,
|
||||
−−utf8−conversion</b> ] [ <b>−bN,
|
||||
−−cookies[=N]</b> ] [ <b>−u,
|
||||
−−check−type[=N]</b> ] [ <b>−j,
|
||||
−−parse−java[=N]</b> ] [ <b>−sN,
|
||||
−−robots[=N]</b> ] [ <b>−%h,
|
||||
−−http−10</b> ] [ <b>−%k,
|
||||
−−keep−alive</b> ] [ <b>−%B,
|
||||
−−tolerant</b> ] [ <b>−%s,
|
||||
−−updatehack</b> ] [ <b>−%u,
|
||||
−−urlhack</b> ] [ <b>−%A,
|
||||
−−assume</b> ] [ <b>−@iN,
|
||||
−−protocol[=N]</b> ] [ <b>−%w,
|
||||
−−disable−module</b> ] [ <b>−F,
|
||||
−−user−agent</b> ] [ <b>−%R,
|
||||
−−referer</b> ] [ <b>−%E,
|
||||
−−from</b> ] [ <b>−%F,
|
||||
−−footer</b> ] [ <b>−%l,
|
||||
−−language</b> ] [ <b>−%a,
|
||||
−−accept</b> ] [ <b>−%X,
|
||||
−−headers</b> ] [ <b>−C,
|
||||
−−cache[=N]</b> ] [ <b>−k,
|
||||
<b>−o −−generate−errors</b> ] [
|
||||
<b>−X −−purge−old[=N]</b> ] [
|
||||
<b>−%p −−preserve</b> ] [ <b>−%T
|
||||
−−utf8−conversion</b> ] [ <b>−bN
|
||||
−−cookies[=N]</b> ] [ <b>−u
|
||||
−−check−type[=N]</b> ] [ <b>−j
|
||||
−−parse−java[=N]</b> ] [ <b>−sN
|
||||
−−robots[=N]</b> ] [ <b>−%h
|
||||
−−http−10</b> ] [ <b>−%k
|
||||
−−keep−alive</b> ] [ <b>−%B
|
||||
−−tolerant</b> ] [ <b>−%s
|
||||
−−updatehack</b> ] [ <b>−%u
|
||||
−−urlhack</b> ] [ <b>−%A
|
||||
−−assume</b> ] [ <b>−@iN
|
||||
−−protocol[=N]</b> ] [ <b>−%w
|
||||
−−disable−module</b> ] [ <b>−F
|
||||
−−user−agent</b> ] [ <b>−%R
|
||||
−−referer</b> ] [ <b>−%E
|
||||
−−from</b> ] [ <b>−%F
|
||||
−−footer</b> ] [ <b>−%l
|
||||
−−language</b> ] [ <b>−%a
|
||||
−−accept</b> ] [ <b>−%X
|
||||
−−headers</b> ] [ <b>−C
|
||||
−−cache[=N]</b> ] [ <b>−k
|
||||
−−store−all−in−cache</b> ] [
|
||||
<b>−%n, −−do−not−recatch</b> ]
|
||||
[ <b>−%v, −−display</b> ] [ <b>−Q,
|
||||
−−do−not−log</b> ] [ <b>−q,
|
||||
−−quiet</b> ] [ <b>−z,
|
||||
−−extra−log</b> ] [ <b>−Z,
|
||||
−−debug−log</b> ] [ <b>−v,
|
||||
−−verbose</b> ] [ <b>−f,
|
||||
−−file−log</b> ] [ <b>−f2,
|
||||
−−single−log</b> ] [ <b>−I,
|
||||
−−index</b> ] [ <b>−%i,
|
||||
<b>−%n −−do−not−recatch</b> ]
|
||||
[ <b>−%v −−display</b> ] [ <b>−Q
|
||||
−−do−not−log</b> ] [ <b>−q
|
||||
−−quiet</b> ] [ <b>−z
|
||||
−−extra−log</b> ] [ <b>−Z
|
||||
−−debug−log</b> ] [ <b>−v
|
||||
−−verbose</b> ] [ <b>−f
|
||||
−−file−log</b> ] [ <b>−f2
|
||||
−−single−log</b> ] [ <b>−I
|
||||
−−index</b> ] [ <b>−%i
|
||||
−−build−top−index</b> ] [
|
||||
<b>−%I, −−search−index</b> ] [
|
||||
<b>−pN, −−priority[=N]</b> ] [
|
||||
<b>−S,
|
||||
<b>−%I −−search−index</b> ] [
|
||||
<b>−pN −−priority[=N]</b> ] [ <b>−S
|
||||
−−stay−on−same−dir</b> ] [
|
||||
<b>−D, −−can−go−down</b> ] [
|
||||
<b>−U, −−can−go−up</b> ] [
|
||||
<b>−B,
|
||||
<b>−D −−can−go−down</b> ] [
|
||||
<b>−U −−can−go−up</b> ] [
|
||||
<b>−B
|
||||
−−can−go−up−and−down</b>
|
||||
] [ <b>−a,
|
||||
] [ <b>−a
|
||||
−−stay−on−same−address</b> ] [
|
||||
<b>−d,
|
||||
<b>−d
|
||||
−−stay−on−same−domain</b> ] [
|
||||
<b>−l,
|
||||
<b>−l
|
||||
−−stay−on−same−tld</b> ] [
|
||||
<b>−e, −−go−everywhere</b> ] [
|
||||
<b>−%H, −−debug−headers</b> ] [
|
||||
<b>−%!,
|
||||
<b>−e −−go−everywhere</b> ] [
|
||||
<b>−%H −−debug−headers</b> ] [
|
||||
<b>−%!
|
||||
−−disable−security−limits</b> ] [
|
||||
<b>−V, −−userdef−cmd</b> ] [
|
||||
<b>−%W, −−callback</b> ] [ <b>−K,
|
||||
<b>−V −−userdef−cmd</b> ] [
|
||||
<b>−%W −−callback</b> ] [ <b>−K
|
||||
−−keep−links[=N]</b> ] [</p>
|
||||
|
||||
<h2>DESCRIPTION
|
||||
@@ -185,7 +184,7 @@ sites</p>
|
||||
www.someweb.com/bob/bobby.html +* −r6</b></p>
|
||||
|
||||
<p style="margin-left:22%;">means get all files starting
|
||||
from bobby.html, with 6 link−depth, and possibility of
|
||||
from bobby.html with 6 link−depth and possibility of
|
||||
going everywhere on the web</p>
|
||||
|
||||
<p style="margin-left:11%;"><b>httrack
|
||||
@@ -234,7 +233,7 @@ options:</b></p>
|
||||
|
||||
|
||||
<p>path for mirror/logfiles+cache (−O path
|
||||
mirror[,path cache and logfiles]) (−−path
|
||||
mirror[,path cache and logfiles]) (−−path
|
||||
<param>)</p> </td></tr>
|
||||
</table>
|
||||
|
||||
@@ -265,7 +264,7 @@ options:</b></p>
|
||||
<td width="78%">
|
||||
|
||||
|
||||
<p>mirror web sites, semi−automatic (asks questions)
|
||||
<p>mirror web sites semi−automatic (asks questions)
|
||||
(−−mirror−wizard)</p> </td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
@@ -356,11 +355,11 @@ options:</b></p>
|
||||
cellspacing="0" cellpadding="0">
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
<td width="9%">
|
||||
<td width="7%">
|
||||
|
||||
|
||||
<p style="margin-top: 1em">−rN</p></td>
|
||||
<td width="2%"></td>
|
||||
<td width="4%"></td>
|
||||
<td width="78%">
|
||||
|
||||
|
||||
@@ -368,11 +367,11 @@ options:</b></p>
|
||||
r9999) (−−depth[=N])</p></td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
<td width="9%">
|
||||
<td width="7%">
|
||||
|
||||
|
||||
<p>−%eN</p></td>
|
||||
<td width="2%"></td>
|
||||
<td width="4%"></td>
|
||||
<td width="78%">
|
||||
|
||||
|
||||
@@ -380,11 +379,11 @@ r9999) (−−depth[=N])</p></td></tr>
|
||||
(−−ext−depth[=N])</p> </td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
<td width="9%">
|
||||
<td width="7%">
|
||||
|
||||
|
||||
<p>−mN</p></td>
|
||||
<td width="2%"></td>
|
||||
<td width="4%"></td>
|
||||
<td width="78%">
|
||||
|
||||
|
||||
@@ -392,22 +391,22 @@ r9999) (−−depth[=N])</p></td></tr>
|
||||
(−−max−files[=N])</p> </td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
<td width="9%">
|
||||
<td width="7%">
|
||||
|
||||
|
||||
<p>−mN,N2</p></td>
|
||||
<td width="2%"></td>
|
||||
<p>−mN,N2</p></td>
|
||||
<td width="4%"></td>
|
||||
<td width="78%">
|
||||
|
||||
|
||||
<p>maximum file length for non html (N) and html (N2)</p></td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
<td width="9%">
|
||||
<td width="7%">
|
||||
|
||||
|
||||
<p>−MN</p></td>
|
||||
<td width="2%"></td>
|
||||
<td width="4%"></td>
|
||||
<td width="78%">
|
||||
|
||||
|
||||
@@ -415,23 +414,23 @@ r9999) (−−depth[=N])</p></td></tr>
|
||||
(−−max−size[=N])</p> </td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
<td width="9%">
|
||||
<td width="7%">
|
||||
|
||||
|
||||
<p>−EN</p></td>
|
||||
<td width="2%"></td>
|
||||
<td width="4%"></td>
|
||||
<td width="78%">
|
||||
|
||||
|
||||
<p>maximum mirror time in seconds (60=1 minute, 3600=1
|
||||
hour) (−−max−time[=N])</p></td></tr>
|
||||
<p>maximum mirror time in seconds (60=1 minute 3600=1 hour)
|
||||
(−−max−time[=N])</p> </td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
<td width="9%">
|
||||
<td width="7%">
|
||||
|
||||
|
||||
<p>−AN</p></td>
|
||||
<td width="2%"></td>
|
||||
<td width="4%"></td>
|
||||
<td width="78%">
|
||||
|
||||
|
||||
@@ -439,11 +438,11 @@ hour) (−−max−time[=N])</p></td></tr>
|
||||
(−−max−rate[=N])</p> </td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
<td width="9%">
|
||||
<td width="7%">
|
||||
|
||||
|
||||
<p>−%cN</p></td>
|
||||
<td width="2%"></td>
|
||||
<td width="4%"></td>
|
||||
<td width="78%">
|
||||
|
||||
|
||||
@@ -451,15 +450,15 @@ hour) (−−max−time[=N])</p></td></tr>
|
||||
(−−connection−per−second[=N])</p> </td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
<td width="9%">
|
||||
<td width="7%">
|
||||
|
||||
|
||||
<p>−GN</p></td>
|
||||
<td width="2%"></td>
|
||||
<td width="4%"></td>
|
||||
<td width="78%">
|
||||
|
||||
|
||||
<p>pause transfer if N bytes reached, and wait until lock
|
||||
<p>pause transfer if N bytes reached and wait until lock
|
||||
file is deleted (−−max−pause[=N])</p></td></tr>
|
||||
</table>
|
||||
|
||||
@@ -490,7 +489,7 @@ control:</b></p>
|
||||
<td width="78%">
|
||||
|
||||
|
||||
<p>timeout, number of seconds after a non−responding
|
||||
<p>timeout number of seconds after a non−responding
|
||||
link is shutdown (−−timeout[=N])</p></td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
@@ -502,7 +501,7 @@ link is shutdown (−−timeout[=N])</p></td></tr>
|
||||
<td width="78%">
|
||||
|
||||
|
||||
<p>number of retries, in case of timeout or non−fatal
|
||||
<p>number of retries in case of timeout or non−fatal
|
||||
errors (*R1) (−−retries[=N])</p></td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
@@ -514,7 +513,7 @@ errors (*R1) (−−retries[=N])</p></td></tr>
|
||||
<td width="78%">
|
||||
|
||||
|
||||
<p>traffic jam control, minimum transfer rate
|
||||
<p>traffic jam control, minimum transfer rate
|
||||
(bytes/seconds) tolerated for a link
|
||||
(−−min−rate[=N])</p> </td></tr>
|
||||
<tr valign="top" align="left">
|
||||
@@ -527,7 +526,7 @@ errors (*R1) (−−retries[=N])</p></td></tr>
|
||||
<td width="78%">
|
||||
|
||||
|
||||
<p>host is abandoned if: 0=never, 1=timeout, 2=slow,
|
||||
<p>host is abandoned if: 0=never, 1=timeout, 2=slow,
|
||||
3=timeout or slow (−−host−control[=N])</p></td></tr>
|
||||
</table>
|
||||
|
||||
@@ -546,8 +545,8 @@ options:</b></p>
|
||||
<td width="78%">
|
||||
|
||||
|
||||
<p style="margin-top: 1em">*extended parsing, attempt to
|
||||
parse all links, even in unknown tags or Javascript (%P0 don
|
||||
<p style="margin-top: 1em">*extended parsing attempt to
|
||||
parse all links even in unknown tags or Javascript (%P0 don
|
||||
t use) (−−extended−parsing[=N])</p></td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
@@ -616,7 +615,7 @@ options:</b></p>
|
||||
|
||||
|
||||
<p style="margin-top: 1em">structure type (0 *original
|
||||
structure, 1+: see below) (−−structure[=N])</p></td></tr>
|
||||
structure 1+: see below) (−−structure[=N])</p></td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
<td width="4%">
|
||||
@@ -639,9 +638,9 @@ structure, 1+: see below) (−−structure[=N])</p></td></tr>
|
||||
<td width="78%">
|
||||
|
||||
|
||||
<p>delayed type check, don t make any link test but wait
|
||||
for files download to start instead (experimental) (%N0 don
|
||||
t use, %N1 use for unknown extensions, * %N2 always use)</p></td></tr>
|
||||
<p>delayed type check don t make any link test but wait for
|
||||
files download to start instead (experimental) (%N0 don t
|
||||
use %N1 use for unknown extensions * %N2 always use)</p></td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
<td width="4%">
|
||||
@@ -652,8 +651,8 @@ t use, %N1 use for unknown extensions, * %N2 always use)</p></td></tr>
|
||||
<td width="78%">
|
||||
|
||||
|
||||
<p>cached delayed type check, don t wait for remote type
|
||||
during updates, to speedup them (%D0 wait, * %D1 don t wait)
|
||||
<p>cached delayed type check don t wait for remote type
|
||||
during updates to speedup them (%D0 wait * %D1 don t wait)
|
||||
(−−cached−delayed−type−check)</p> </td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
@@ -692,8 +691,8 @@ L2 ISO9660 compatible)
|
||||
|
||||
|
||||
<p>keep original links (e.g. http://www.adr/link) (K0
|
||||
*relative link, K absolute links, K4 original links, K3
|
||||
absolute URI links, K5 transparent proxy link)
|
||||
*relative link K absolute links K4 original links K3
|
||||
absolute URI links K5 transparent proxy link)
|
||||
(−−keep−links[=N])</p> </td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
@@ -730,7 +729,7 @@ protected websites (%x0 include)
|
||||
<td width="78%">
|
||||
|
||||
|
||||
<p>*include query string for local files (useless, for
|
||||
<p>*include query string for local files (useless for
|
||||
information purpose only) (%q0 don't include)
|
||||
(−−include−query−string)</p> </td></tr>
|
||||
<tr valign="top" align="left">
|
||||
@@ -799,7 +798,7 @@ options:</b></p>
|
||||
|
||||
|
||||
<p style="margin-top: 1em">accept cookies in cookies.txt
|
||||
(0=do not accept,* 1=accept) (−−cookies[=N])</p></td></tr>
|
||||
(0=do not accept,* 1=accept) (−−cookies[=N])</p></td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
<td width="6%">
|
||||
@@ -810,8 +809,8 @@ options:</b></p>
|
||||
<td width="78%">
|
||||
|
||||
|
||||
<p>check document type if unknown (cgi,asp..) (u0 don t
|
||||
check, * u1 check but /, u2 check always)
|
||||
<p>check document type if unknown (cgi,asp..) (u0 don't
|
||||
check, * u1 check but /, u2 check always)
|
||||
(−−check−type[=N])</p> </td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
@@ -823,9 +822,9 @@ check, * u1 check but /, u2 check always)
|
||||
<td width="78%">
|
||||
|
||||
|
||||
<p>*parse Java Classes (j0 don t parse, bitmask: |1 parse
|
||||
default, |2 don t parse .class |4 don t parse .js |8 don t
|
||||
be aggressive) (−−parse−java[=N])</p></td></tr>
|
||||
<p>*parse Java Classes (j0 don t parse bitmask: |1 parse
|
||||
default |2 don t parse .class |4 don t parse .js |8 don t be
|
||||
aggressive) (−−parse−java[=N])</p></td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
<td width="6%">
|
||||
@@ -837,8 +836,8 @@ be aggressive) (−−parse−java[=N])</p></td></tr>
|
||||
|
||||
|
||||
<p>follow robots.txt and meta robots tags
|
||||
(0=never,1=sometimes,* 2=always, 3=always (even strict
|
||||
rules)) (−−robots[=N])</p></td></tr>
|
||||
(0=never,1=sometimes,* 2=always, 3=always (even strict rules))
|
||||
(−−robots[=N])</p> </td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
<td width="6%">
|
||||
@@ -849,9 +848,8 @@ rules)) (−−robots[=N])</p></td></tr>
|
||||
<td width="78%">
|
||||
|
||||
|
||||
<p>force HTTP/1.0 requests (reduce update features, only
|
||||
for old servers or proxies)
|
||||
(−−http−10)</p> </td></tr>
|
||||
<p>force HTTP/1.0 requests (reduce update features only for
|
||||
old servers or proxies) (−−http−10)</p></td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
<td width="6%">
|
||||
@@ -862,7 +860,7 @@ for old servers or proxies)
|
||||
<td width="78%">
|
||||
|
||||
|
||||
<p>use keep−alive if possible, greatly reducing
|
||||
<p>use keep−alive if possible, greatly reducing
|
||||
latency for small files and test requests (%k0 don't use)
|
||||
(−−keep−alive)</p> </td></tr>
|
||||
<tr valign="top" align="left">
|
||||
@@ -876,7 +874,7 @@ latency for small files and test requests (%k0 don t use)
|
||||
|
||||
|
||||
<p>tolerant requests (accept bogus responses on some
|
||||
servers, but not standard!) (−−tolerant)</p></td></tr>
|
||||
servers but not standard!) (−−tolerant)</p></td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
<td width="6%">
|
||||
@@ -888,7 +886,7 @@ servers, but not standard!) (−−tolerant)</p></td></tr>
|
||||
|
||||
|
||||
<p>update hacks: various hacks to limit re−transfers
|
||||
when updating (identical size, bogus response..)
|
||||
when updating (identical size bogus response..)
|
||||
(−−updatehack)</p> </td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
@@ -901,7 +899,7 @@ when updating (identical size, bogus response..)
|
||||
|
||||
|
||||
<p>url hacks: various hacks to limit duplicate URLs (strip
|
||||
//, www.foo.com==foo.com..) (−−urlhack)</p></td></tr>
|
||||
// www.foo.com==foo.com..) (−−urlhack)</p></td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
<td width="6%">
|
||||
@@ -912,9 +910,9 @@ when updating (identical size, bogus response..)
|
||||
<td width="78%">
|
||||
|
||||
|
||||
<p>assume that a type (cgi,asp..) is always linked with a
|
||||
<p>assume that a type (cgi,asp..) is always linked with a
|
||||
mime type (−%A
|
||||
php3,cgi=text/html;dat,bin=application/x−zip)
|
||||
php3,cgi=text/html;dat,bin=application/x−zip)
|
||||
(−−assume <param>)</p></td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
@@ -938,7 +936,7 @@ php3,cgi=text/html;dat,bin=application/x−zip)
|
||||
<td width="78%">
|
||||
|
||||
|
||||
<p>internet protocol (0=both ipv6+ipv4, 4=ipv4 only, 6=ipv6
|
||||
<p>internet protocol (0=both ipv6+ipv4 4=ipv4 only 6=ipv6
|
||||
only) (−−protocol[=N])</p></td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
@@ -1020,7 +1018,7 @@ HTTP headers (−F "user−agent name")
|
||||
<td width="78%">
|
||||
|
||||
|
||||
<p>preferred language (−%l "fr, en, jp, *"
|
||||
<p>preferred language (−%l "fr, en, jp, *"
|
||||
(−−language <param>)</p></td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
@@ -1033,7 +1031,7 @@ HTTP headers (−F "user−agent name")
|
||||
|
||||
|
||||
<p>accepted formats (−%a
|
||||
"text/html,image/png,image/jpeg,image/gif;q=0.9,*/*;q=0.1"
|
||||
"text/html,image/png,image/jpeg,image/gif;q=0.9,*/*;q=0.1"
|
||||
(−−accept <param>)</p></td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
@@ -1050,7 +1048,7 @@ HTTP headers (−F "user−agent name")
|
||||
<param>)</p> </td></tr>
|
||||
</table>
|
||||
|
||||
<p style="margin-left:11%; margin-top: 1em"><b>Log, index,
|
||||
<p style="margin-left:11%; margin-top: 1em"><b>Log index
|
||||
cache</b></p>
|
||||
|
||||
<table width="100%" border="0" rules="none" frame="void"
|
||||
@@ -1066,7 +1064,7 @@ cache</b></p>
|
||||
|
||||
|
||||
<p style="margin-top: 1em">create/use a cache for updates
|
||||
and retries (C0 no cache,C1 cache is prioritary,* C2 test
|
||||
and retries (C0 no cache,C1 cache is prioritary,* C2 test
|
||||
update before) (−−cache[=N])</p></td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
@@ -1249,7 +1247,7 @@ options:</b></p>
|
||||
<td width="78%">
|
||||
|
||||
|
||||
<p>just scan, don t save anything (for checking links)</p></td></tr>
|
||||
<p>just scan, don't save anything (for checking links)</p></td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
<td width="6%">
|
||||
@@ -1293,7 +1291,7 @@ options:</b></p>
|
||||
<td width="78%">
|
||||
|
||||
|
||||
<p>get html files before, then treat other files</p></td></tr>
|
||||
<p>get html files before then treat other files</p></td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
<td width="6%">
|
||||
@@ -1650,14 +1648,14 @@ doing)</b></p>
|
||||
|
||||
|
||||
<p style="margin-top: 1em">bypass built−in security
|
||||
limits aimed to avoid bandwidth abuses (bandwidth,
|
||||
limits aimed to avoid bandwidth abuses (bandwidth
|
||||
simultaneous connections)
|
||||
(−−disable−security−limits)</p> </td></tr>
|
||||
</table>
|
||||
|
||||
<p style="margin-left:11%;">−IMPORTANT</p>
|
||||
|
||||
<p style="margin-left:22%;">NOTE: DANGEROUS OPTION, ONLY
|
||||
<p style="margin-left:22%;">NOTE: DANGEROUS OPTION ONLY
|
||||
SUITABLE FOR EXPERTS</p>
|
||||
|
||||
<table width="100%" border="0" rules="none" frame="void"
|
||||
@@ -1707,7 +1705,7 @@ each files ($0 is the filename: −V "rm ")
|
||||
|
||||
|
||||
<p>use an external library function as a wrapper (−%W
|
||||
myfoo.so[,myparameters]) (−−callback
|
||||
myfoo.so[,myparameters]) (−−callback
|
||||
<param>)</p> </td></tr>
|
||||
</table>
|
||||
|
||||
@@ -1738,7 +1736,7 @@ Option N</b></p>
|
||||
<td width="78%">
|
||||
|
||||
|
||||
<p>HTML in web/, images/other files in web/images/</p></td></tr>
|
||||
<p>HTML in web/ images/other files in web/images/</p></td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
<td width="9%">
|
||||
@@ -1749,7 +1747,7 @@ Option N</b></p>
|
||||
<td width="78%">
|
||||
|
||||
|
||||
<p>HTML in web/HTML, images/other in web/images</p></td></tr>
|
||||
<p>HTML in web/HTML images/other in web/images</p></td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
<td width="9%">
|
||||
@@ -1760,7 +1758,7 @@ Option N</b></p>
|
||||
<td width="78%">
|
||||
|
||||
|
||||
<p>HTML in web/, images/other in web/</p></td></tr>
|
||||
<p>HTML in web/ images/other in web/</p></td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
<td width="9%">
|
||||
@@ -1771,8 +1769,8 @@ Option N</b></p>
|
||||
<td width="78%">
|
||||
|
||||
|
||||
<p>HTML in web/, images/other in web/xxx, where xxx is the
|
||||
file extension (all gif will be placed onto web/gif, for
|
||||
<p>HTML in web/ images/other in web/xxx where xxx is the
|
||||
file extension (all gif will be placed onto web/gif for
|
||||
example)</p> </td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
@@ -1795,7 +1793,7 @@ example)</p> </td></tr>
|
||||
<td width="78%">
|
||||
|
||||
|
||||
<p>All files in web/, with random names (gadget !)</p></td></tr>
|
||||
<p>All files in web/ with random names (gadget !)</p></td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
<td width="9%">
|
||||
@@ -1806,7 +1804,7 @@ example)</p> </td></tr>
|
||||
<td width="78%">
|
||||
|
||||
|
||||
<p>Site−structure, without www.domain.xxx/</p></td></tr>
|
||||
<p>Site−structure without www.domain.xxx/</p></td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
<td width="9%">
|
||||
@@ -1956,15 +1954,15 @@ directory</p> </td></tr>
|
||||
<p style="margin-left:11%; margin-top: 1em"><b>Details:
|
||||
User−defined option N</b> <br>
|
||||
%n Name of file without file type (ex: image) <br>
|
||||
%N Name of file, including file type (ex: image.gif) <br>
|
||||
%N Name of file including file type (ex: image.gif) <br>
|
||||
%t File type (ex: gif) <br>
|
||||
%p Path [without ending /] (ex: /someimages) <br>
|
||||
%h Host name (ex: www.someweb.com) <br>
|
||||
%M URL MD5 (128 bits, 32 ascii bytes) <br>
|
||||
%Q query string MD5 (128 bits, 32 ascii bytes) <br>
|
||||
%M URL MD5 (128 bits 32 ascii bytes) <br>
|
||||
%Q query string MD5 (128 bits 32 ascii bytes) <br>
|
||||
%k full query string <br>
|
||||
%r protocol name (ex: http) <br>
|
||||
%q small query string MD5 (16 bits, 4 ascii bytes) <br>
|
||||
%q small query string MD5 (16 bits 4 ascii bytes) <br>
|
||||
%s? Short name version (ex: %sN) <br>
|
||||
%[param] param variable in query string <br>
|
||||
%[param:before:after:empty:notfound] advanced variable
|
||||
@@ -2042,8 +2040,8 @@ parameter could not be found</p>
|
||||
<td width="78%">
|
||||
|
||||
|
||||
<p>fields, except the first one (the parameter name), can
|
||||
be empty</p></td></tr>
|
||||
<p>fields except the first one (the parameter name) can be
|
||||
empty</p> </td></tr>
|
||||
</table>
|
||||
|
||||
<p style="margin-left:11%; margin-top: 1em"><b>Details:
|
||||
@@ -2062,7 +2060,7 @@ Option K</b></p>
|
||||
|
||||
|
||||
<p style="margin-top: 1em">foo.cgi?q=45 −>
|
||||
foo4B54.html?q=45 (relative URI, default)</p></td></tr>
|
||||
foo4B54.html?q=45 (relative URI default)</p></td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
<td width="4%">
|
||||
@@ -2132,7 +2130,7 @@ site(s) (default)</p>
|
||||
<td width="78%">
|
||||
|
||||
|
||||
<p><URLs> get the files indicated, do not seek other
|
||||
<p><URLs> get the files indicated do not seek other
|
||||
URLs (−qg)</p></td></tr>
|
||||
<tr valign="top" align="left">
|
||||
<td width="11%"></td>
|
||||
@@ -2160,7 +2158,7 @@ pages (−r1p0C0I0t)</p>
|
||||
|
||||
<p style="margin-left:11%;">−−spider</p>
|
||||
|
||||
<p style="margin-left:22%;"><URLs> spider site(s), to
|
||||
<p style="margin-left:22%;"><URLs> spider site(s) to
|
||||
test links: reports Errors & Warnings
|
||||
(−p0C0I0t)</p>
|
||||
|
||||
@@ -2171,17 +2169,17 @@ test links: reports Errors & Warnings
|
||||
|
||||
<p style="margin-left:11%;">−−skeleton</p>
|
||||
|
||||
<p style="margin-left:22%;"><URLs> make a mirror, but
|
||||
<p style="margin-left:22%;"><URLs> make a mirror but
|
||||
gets only html files (−p1)</p>
|
||||
|
||||
<p style="margin-left:11%;">−−update</p>
|
||||
|
||||
<p style="margin-left:22%;">update a mirror, without
|
||||
<p style="margin-left:22%;">update a mirror without
|
||||
confirmation (−iC2)</p>
|
||||
|
||||
<p style="margin-left:11%;">−−continue</p>
|
||||
|
||||
<p style="margin-left:22%;">continue a mirror, without
|
||||
<p style="margin-left:22%;">continue a mirror without
|
||||
confirmation (−iC1)</p>
|
||||
|
||||
<p style="margin-left:11%;">−−catchurl</p>
|
||||
|
||||
280
man/httrack.1
280
man/httrack.1
@@ -1,182 +1,182 @@
|
||||
.\" Process this file with
|
||||
.\" groff -man -Tascii httrack.1
|
||||
.\"
|
||||
.TH httrack 1 "Apr 2014" "httrack website copier"
|
||||
.TH httrack 1 "29 April 2014" "httrack website copier"
|
||||
.SH NAME
|
||||
httrack \- offline browser : copy websites to a local directory
|
||||
.SH SYNOPSIS
|
||||
.B httrack [ url ]... [ \-filter ]... [ +filter ]... [
|
||||
.B \-O, \-\-path
|
||||
.B \-O\, \-\-path
|
||||
] [
|
||||
.B \-w, \-\-mirror
|
||||
.B \-w\, \-\-mirror
|
||||
] [
|
||||
.B \-W, \-\-mirror\-wizard
|
||||
.B \-W\, \-\-mirror\-wizard
|
||||
] [
|
||||
.B \-g, \-\-get\-files
|
||||
.B \-g\, \-\-get\-files
|
||||
] [
|
||||
.B \-i, \-\-continue
|
||||
.B \-i\, \-\-continue
|
||||
] [
|
||||
.B \-Y, \-\-mirrorlinks
|
||||
.B \-Y\, \-\-mirrorlinks
|
||||
] [
|
||||
.B \-P, \-\-proxy
|
||||
.B \-P\, \-\-proxy
|
||||
] [
|
||||
.B \-%f, \-\-httpproxy\-ftp[=N]
|
||||
.B \-%f\, \-\-httpproxy\-ftp[=N]
|
||||
] [
|
||||
.B \-%b, \-\-bind
|
||||
.B \-%b\, \-\-bind
|
||||
] [
|
||||
.B \-rN, \-\-depth[=N]
|
||||
.B \-rN\, \-\-depth[=N]
|
||||
] [
|
||||
.B \-%eN, \-\-ext\-depth[=N]
|
||||
.B \-%eN\, \-\-ext\-depth[=N]
|
||||
] [
|
||||
.B \-mN, \-\-max\-files[=N]
|
||||
.B \-mN\, \-\-max\-files[=N]
|
||||
] [
|
||||
.B \-MN, \-\-max\-size[=N]
|
||||
.B \-MN\, \-\-max\-size[=N]
|
||||
] [
|
||||
.B \-EN, \-\-max\-time[=N]
|
||||
.B \-EN\, \-\-max\-time[=N]
|
||||
] [
|
||||
.B \-AN, \-\-max\-rate[=N]
|
||||
.B \-AN\, \-\-max\-rate[=N]
|
||||
] [
|
||||
.B \-%cN, \-\-connection\-per\-second[=N]
|
||||
.B \-%cN\, \-\-connection\-per\-second[=N]
|
||||
] [
|
||||
.B \-GN, \-\-max\-pause[=N]
|
||||
.B \-GN\, \-\-max\-pause[=N]
|
||||
] [
|
||||
.B \-cN, \-\-sockets[=N]
|
||||
.B \-cN\, \-\-sockets[=N]
|
||||
] [
|
||||
.B \-TN, \-\-timeout[=N]
|
||||
.B \-TN\, \-\-timeout[=N]
|
||||
] [
|
||||
.B \-RN, \-\-retries[=N]
|
||||
.B \-RN\, \-\-retries[=N]
|
||||
] [
|
||||
.B \-JN, \-\-min\-rate[=N]
|
||||
.B \-JN\, \-\-min\-rate[=N]
|
||||
] [
|
||||
.B \-HN, \-\-host\-control[=N]
|
||||
.B \-HN\, \-\-host\-control[=N]
|
||||
] [
|
||||
.B \-%P, \-\-extended\-parsing[=N]
|
||||
.B \-%P\, \-\-extended\-parsing[=N]
|
||||
] [
|
||||
.B \-n, \-\-near
|
||||
.B \-n\, \-\-near
|
||||
] [
|
||||
.B \-t, \-\-test
|
||||
.B \-t\, \-\-test
|
||||
] [
|
||||
.B \-%L, \-\-list
|
||||
.B \-%L\, \-\-list
|
||||
] [
|
||||
.B \-%S, \-\-urllist
|
||||
.B \-%S\, \-\-urllist
|
||||
] [
|
||||
.B \-NN, \-\-structure[=N]
|
||||
.B \-NN\, \-\-structure[=N]
|
||||
] [
|
||||
.B \-%D, \-\-cached\-delayed\-type\-check
|
||||
.B \-%D\, \-\-cached\-delayed\-type\-check
|
||||
] [
|
||||
.B \-%M, \-\-mime\-html
|
||||
.B \-%M\, \-\-mime\-html
|
||||
] [
|
||||
.B \-LN, \-\-long\-names[=N]
|
||||
.B \-LN\, \-\-long\-names[=N]
|
||||
] [
|
||||
.B \-KN, \-\-keep\-links[=N]
|
||||
.B \-KN\, \-\-keep\-links[=N]
|
||||
] [
|
||||
.B \-x, \-\-replace\-external
|
||||
.B \-x\, \-\-replace\-external
|
||||
] [
|
||||
.B \-%x, \-\-disable\-passwords
|
||||
.B \-%x\, \-\-disable\-passwords
|
||||
] [
|
||||
.B \-%q, \-\-include\-query\-string
|
||||
.B \-%q\, \-\-include\-query\-string
|
||||
] [
|
||||
.B \-o, \-\-generate\-errors
|
||||
.B \-o\, \-\-generate\-errors
|
||||
] [
|
||||
.B \-X, \-\-purge\-old[=N]
|
||||
.B \-X\, \-\-purge\-old[=N]
|
||||
] [
|
||||
.B \-%p, \-\-preserve
|
||||
.B \-%p\, \-\-preserve
|
||||
] [
|
||||
.B \-%T, \-\-utf8\-conversion
|
||||
.B \-%T\, \-\-utf8\-conversion
|
||||
] [
|
||||
.B \-bN, \-\-cookies[=N]
|
||||
.B \-bN\, \-\-cookies[=N]
|
||||
] [
|
||||
.B \-u, \-\-check\-type[=N]
|
||||
.B \-u\, \-\-check\-type[=N]
|
||||
] [
|
||||
.B \-j, \-\-parse\-java[=N]
|
||||
.B \-j\, \-\-parse\-java[=N]
|
||||
] [
|
||||
.B \-sN, \-\-robots[=N]
|
||||
.B \-sN\, \-\-robots[=N]
|
||||
] [
|
||||
.B \-%h, \-\-http\-10
|
||||
.B \-%h\, \-\-http\-10
|
||||
] [
|
||||
.B \-%k, \-\-keep\-alive
|
||||
.B \-%k\, \-\-keep\-alive
|
||||
] [
|
||||
.B \-%B, \-\-tolerant
|
||||
.B \-%B\, \-\-tolerant
|
||||
] [
|
||||
.B \-%s, \-\-updatehack
|
||||
.B \-%s\, \-\-updatehack
|
||||
] [
|
||||
.B \-%u, \-\-urlhack
|
||||
.B \-%u\, \-\-urlhack
|
||||
] [
|
||||
.B \-%A, \-\-assume
|
||||
.B \-%A\, \-\-assume
|
||||
] [
|
||||
.B \-@iN, \-\-protocol[=N]
|
||||
.B \-@iN\, \-\-protocol[=N]
|
||||
] [
|
||||
.B \-%w, \-\-disable\-module
|
||||
.B \-%w\, \-\-disable\-module
|
||||
] [
|
||||
.B \-F, \-\-user\-agent
|
||||
.B \-F\, \-\-user\-agent
|
||||
] [
|
||||
.B \-%R, \-\-referer
|
||||
.B \-%R\, \-\-referer
|
||||
] [
|
||||
.B \-%E, \-\-from
|
||||
.B \-%E\, \-\-from
|
||||
] [
|
||||
.B \-%F, \-\-footer
|
||||
.B \-%F\, \-\-footer
|
||||
] [
|
||||
.B \-%l, \-\-language
|
||||
.B \-%l\, \-\-language
|
||||
] [
|
||||
.B \-%a, \-\-accept
|
||||
.B \-%a\, \-\-accept
|
||||
] [
|
||||
.B \-%X, \-\-headers
|
||||
.B \-%X\, \-\-headers
|
||||
] [
|
||||
.B \-C, \-\-cache[=N]
|
||||
.B \-C\, \-\-cache[=N]
|
||||
] [
|
||||
.B \-k, \-\-store\-all\-in\-cache
|
||||
.B \-k\, \-\-store\-all\-in\-cache
|
||||
] [
|
||||
.B \-%n, \-\-do\-not\-recatch
|
||||
.B \-%n\, \-\-do\-not\-recatch
|
||||
] [
|
||||
.B \-%v, \-\-display
|
||||
.B \-%v\, \-\-display
|
||||
] [
|
||||
.B \-Q, \-\-do\-not\-log
|
||||
.B \-Q\, \-\-do\-not\-log
|
||||
] [
|
||||
.B \-q, \-\-quiet
|
||||
.B \-q\, \-\-quiet
|
||||
] [
|
||||
.B \-z, \-\-extra\-log
|
||||
.B \-z\, \-\-extra\-log
|
||||
] [
|
||||
.B \-Z, \-\-debug\-log
|
||||
.B \-Z\, \-\-debug\-log
|
||||
] [
|
||||
.B \-v, \-\-verbose
|
||||
.B \-v\, \-\-verbose
|
||||
] [
|
||||
.B \-f, \-\-file\-log
|
||||
.B \-f\, \-\-file\-log
|
||||
] [
|
||||
.B \-f2, \-\-single\-log
|
||||
.B \-f2\, \-\-single\-log
|
||||
] [
|
||||
.B \-I, \-\-index
|
||||
.B \-I\, \-\-index
|
||||
] [
|
||||
.B \-%i, \-\-build\-top\-index
|
||||
.B \-%i\, \-\-build\-top\-index
|
||||
] [
|
||||
.B \-%I, \-\-search\-index
|
||||
.B \-%I\, \-\-search\-index
|
||||
] [
|
||||
.B \-pN, \-\-priority[=N]
|
||||
.B \-pN\, \-\-priority[=N]
|
||||
] [
|
||||
.B \-S, \-\-stay\-on\-same\-dir
|
||||
.B \-S\, \-\-stay\-on\-same\-dir
|
||||
] [
|
||||
.B \-D, \-\-can\-go\-down
|
||||
.B \-D\, \-\-can\-go\-down
|
||||
] [
|
||||
.B \-U, \-\-can\-go\-up
|
||||
.B \-U\, \-\-can\-go\-up
|
||||
] [
|
||||
.B \-B, \-\-can\-go\-up\-and\-down
|
||||
.B \-B\, \-\-can\-go\-up\-and\-down
|
||||
] [
|
||||
.B \-a, \-\-stay\-on\-same\-address
|
||||
.B \-a\, \-\-stay\-on\-same\-address
|
||||
] [
|
||||
.B \-d, \-\-stay\-on\-same\-domain
|
||||
.B \-d\, \-\-stay\-on\-same\-domain
|
||||
] [
|
||||
.B \-l, \-\-stay\-on\-same\-tld
|
||||
.B \-l\, \-\-stay\-on\-same\-tld
|
||||
] [
|
||||
.B \-e, \-\-go\-everywhere
|
||||
.B \-e\, \-\-go\-everywhere
|
||||
] [
|
||||
.B \-%H, \-\-debug\-headers
|
||||
.B \-%H\, \-\-debug\-headers
|
||||
] [
|
||||
.B \-%!, \-\-disable\-security\-limits
|
||||
.B \-%!\, \-\-disable\-security\-limits
|
||||
] [
|
||||
.B \-V, \-\-userdef\-cmd
|
||||
.B \-V\, \-\-userdef\-cmd
|
||||
] [
|
||||
.B \-%W, \-\-callback
|
||||
.B \-%W\, \-\-callback
|
||||
] [
|
||||
.B \-K, \-\-keep\-links[=N]
|
||||
.B \-K\, \-\-keep\-links[=N]
|
||||
] [
|
||||
.B
|
||||
.SH DESCRIPTION
|
||||
@@ -191,7 +191,7 @@ allows you to download a World Wide Web site from the Internet to a local direct
|
||||
mirror the two sites together (with shared links) and accept any .jpg files on .com sites
|
||||
.TP
|
||||
.B httrack www.someweb.com/bob/bobby.html +* \-r6
|
||||
means get all files starting from bobby.html, with 6 link\-depth, and possibility of going everywhere on the web
|
||||
means get all files starting from bobby.html\, with 6 link\-depth\, and possibility of going everywhere on the web
|
||||
.TP
|
||||
.B httrack www.someweb.com/bob/bobby.html \-\-spider \-P proxy.myhost.com:8080
|
||||
runs the spider on www.someweb.com/bob/bobby.html using a proxy
|
||||
@@ -208,7 +208,7 @@ continues a mirror in the current folder
|
||||
.SS General options:
|
||||
.IP \-O
|
||||
path for mirror/logfiles+cache (\-O path
|
||||
mirror[,path
|
||||
mirror[\,path
|
||||
cache
|
||||
and
|
||||
logfiles]) (\-\-path <param>)
|
||||
@@ -217,7 +217,7 @@ logfiles]) (\-\-path <param>)
|
||||
.IP \-w
|
||||
*mirror web sites (\-\-mirror)
|
||||
.IP \-W
|
||||
mirror web sites, semi\-automatic (asks questions) (\-\-mirror\-wizard)
|
||||
mirror web sites\, semi\-automatic (asks questions) (\-\-mirror\-wizard)
|
||||
.IP \-g
|
||||
just get files (saved in the current directory) (\-\-get\-files)
|
||||
.IP \-i
|
||||
@@ -240,34 +240,34 @@ set the mirror depth to N (* r9999) (\-\-depth[=N])
|
||||
set the external links depth to N (* %e0) (\-\-ext\-depth[=N])
|
||||
.IP \-mN
|
||||
maximum file length for a non\-html file (\-\-max\-files[=N])
|
||||
.IP \-mN,N2
|
||||
.IP \-mN\,N2
|
||||
maximum file length for non html (N) and html (N2)
|
||||
.IP \-MN
|
||||
maximum overall size that can be uploaded/scanned (\-\-max\-size[=N])
|
||||
.IP \-EN
|
||||
maximum mirror time in seconds (60=1 minute, 3600=1 hour) (\-\-max\-time[=N])
|
||||
maximum mirror time in seconds (60=1 minute\, 3600=1 hour) (\-\-max\-time[=N])
|
||||
.IP \-AN
|
||||
maximum transfer rate in bytes/seconds (1000=1KB/s max) (\-\-max\-rate[=N])
|
||||
.IP \-%cN
|
||||
maximum number of connections/seconds (*%c10) (\-\-connection\-per\-second[=N])
|
||||
.IP \-GN
|
||||
pause transfer if N bytes reached, and wait until lock file is deleted (\-\-max\-pause[=N])
|
||||
pause transfer if N bytes reached\, and wait until lock file is deleted (\-\-max\-pause[=N])
|
||||
|
||||
.SS Flow control:
|
||||
.IP \-cN
|
||||
number of multiple connections (*c8) (\-\-sockets[=N])
|
||||
.IP \-TN
|
||||
timeout, number of seconds after a non\-responding link is shutdown (\-\-timeout[=N])
|
||||
timeout\, number of seconds after a non\-responding link is shutdown (\-\-timeout[=N])
|
||||
.IP \-RN
|
||||
number of retries, in case of timeout or non\-fatal errors (*R1) (\-\-retries[=N])
|
||||
number of retries\, in case of timeout or non\-fatal errors (*R1) (\-\-retries[=N])
|
||||
.IP \-JN
|
||||
traffic jam control, minimum transfer rate (bytes/seconds) tolerated for a link (\-\-min\-rate[=N])
|
||||
traffic jam control\, minimum transfer rate (bytes/seconds) tolerated for a link (\-\-min\-rate[=N])
|
||||
.IP \-HN
|
||||
host is abandoned if: 0=never, 1=timeout, 2=slow, 3=timeout or slow (\-\-host\-control[=N])
|
||||
host is abandoned if: 0=never\, 1=timeout\, 2=slow\, 3=timeout or slow (\-\-host\-control[=N])
|
||||
|
||||
.SS Links options:
|
||||
.IP \-%P
|
||||
*extended parsing, attempt to parse all links, even in unknown tags or Javascript (%P0 don t use) (\-\-extended\-parsing[=N])
|
||||
*extended parsing\, attempt to parse all links\, even in unknown tags or Javascript (%P0 don t use) (\-\-extended\-parsing[=N])
|
||||
.IP \-n
|
||||
get non\-html files near an html file (ex: an image located outside) (\-\-near)
|
||||
.IP \-t
|
||||
@@ -279,25 +279,25 @@ test all URLs (even forbidden ones) (\-\-test)
|
||||
|
||||
.SS Build options:
|
||||
.IP \-NN
|
||||
structure type (0 *original structure, 1+: see below) (\-\-structure[=N])
|
||||
structure type (0 *original structure\, 1+: see below) (\-\-structure[=N])
|
||||
.IP \-or
|
||||
user defined structure (\-N "%h%p/%n%q.%t")
|
||||
.IP \-%N
|
||||
delayed type check, don t make any link test but wait for files download to start instead (experimental) (%N0 don t use, %N1 use for unknown extensions, * %N2 always use)
|
||||
delayed type check\, don t make any link test but wait for files download to start instead (experimental) (%N0 don t use\, %N1 use for unknown extensions\, * %N2 always use)
|
||||
.IP \-%D
|
||||
cached delayed type check, don t wait for remote type during updates, to speedup them (%D0 wait, * %D1 don t wait) (\-\-cached\-delayed\-type\-check)
|
||||
cached delayed type check\, don t wait for remote type during updates\, to speedup them (%D0 wait\, * %D1 don t wait) (\-\-cached\-delayed\-type\-check)
|
||||
.IP \-%M
|
||||
generate a RFC MIME\-encapsulated full\-archive (.mht) (\-\-mime\-html)
|
||||
.IP \-LN
|
||||
long names (L1 *long names / L0 8\-3 conversion / L2 ISO9660 compatible) (\-\-long\-names[=N])
|
||||
.IP \-KN
|
||||
keep original links (e.g. http://www.adr/link) (K0 *relative link, K absolute links, K4 original links, K3 absolute URI links, K5 transparent proxy link) (\-\-keep\-links[=N])
|
||||
keep original links (e.g. http://www.adr/link) (K0 *relative link\, K absolute links\, K4 original links\, K3 absolute URI links\, K5 transparent proxy link) (\-\-keep\-links[=N])
|
||||
.IP \-x
|
||||
replace external html links by error pages (\-\-replace\-external)
|
||||
.IP \-%x
|
||||
do not include any password for external password protected websites (%x0 include) (\-\-disable\-passwords)
|
||||
.IP \-%q
|
||||
*include query string for local files (useless, for information purpose only) (%q0 don t include) (\-\-include\-query\-string)
|
||||
*include query string for local files (useless\, for information purpose only) (%q0 don t include) (\-\-include\-query\-string)
|
||||
.IP \-o
|
||||
*generate output html file in case of error (404..) (o0 don t generate) (\-\-generate\-errors)
|
||||
.IP \-X
|
||||
@@ -309,29 +309,29 @@ links conversion to UTF\-8 (\-\-utf8\-conversion)
|
||||
|
||||
.SS Spider options:
|
||||
.IP \-bN
|
||||
accept cookies in cookies.txt (0=do not accept,* 1=accept) (\-\-cookies[=N])
|
||||
accept cookies in cookies.txt (0=do not accept\,* 1=accept) (\-\-cookies[=N])
|
||||
.IP \-u
|
||||
check document type if unknown (cgi,asp..) (u0 don t check, * u1 check but /, u2 check always) (\-\-check\-type[=N])
|
||||
check document type if unknown (cgi\,asp..) (u0 don t check\, * u1 check but /\, u2 check always) (\-\-check\-type[=N])
|
||||
.IP \-j
|
||||
*parse Java Classes (j0 don t parse, bitmask: |1 parse default, |2 don t parse .class |4 don t parse .js |8 don t be aggressive) (\-\-parse\-java[=N])
|
||||
*parse Java Classes (j0 don t parse\, bitmask: |1 parse default\, |2 don t parse .class |4 don t parse .js |8 don t be aggressive) (\-\-parse\-java[=N])
|
||||
.IP \-sN
|
||||
follow robots.txt and meta robots tags (0=never,1=sometimes,* 2=always, 3=always (even strict rules)) (\-\-robots[=N])
|
||||
follow robots.txt and meta robots tags (0=never\,1=sometimes\,* 2=always\, 3=always (even strict rules)) (\-\-robots[=N])
|
||||
.IP \-%h
|
||||
force HTTP/1.0 requests (reduce update features, only for old servers or proxies) (\-\-http\-10)
|
||||
force HTTP/1.0 requests (reduce update features\, only for old servers or proxies) (\-\-http\-10)
|
||||
.IP \-%k
|
||||
use keep\-alive if possible, greatly reducing latency for small files and test requests (%k0 don't use) (\-\-keep\-alive)
|
||||
use keep\-alive if possible\, greatly reducing latency for small files and test requests (%k0 don't use) (\-\-keep\-alive)
|
||||
.IP \-%B
|
||||
tolerant requests (accept bogus responses on some servers, but not standard!) (\-\-tolerant)
|
||||
tolerant requests (accept bogus responses on some servers\, but not standard!) (\-\-tolerant)
|
||||
.IP \-%s
|
||||
update hacks: various hacks to limit re\-transfers when updating (identical size, bogus response..) (\-\-updatehack)
|
||||
update hacks: various hacks to limit re\-transfers when updating (identical size\, bogus response..) (\-\-updatehack)
|
||||
.IP \-%u
|
||||
url hacks: various hacks to limit duplicate URLs (strip //, www.foo.com==foo.com..) (\-\-urlhack)
|
||||
url hacks: various hacks to limit duplicate URLs (strip //\, www.foo.com==foo.com..) (\-\-urlhack)
|
||||
.IP \-%A
|
||||
assume that a type (cgi,asp..) is always linked with a mime type (\-%A php3,cgi=text/html;dat,bin=application/x\-zip) (\-\-assume <param>)
|
||||
assume that a type (cgi\,asp..) is always linked with a mime type (\-%A php3\,cgi=text/html;dat\,bin=application/x\-zip) (\-\-assume <param>)
|
||||
.br
|
||||
can also be used to force a specific file type: \-\-assume foo.cgi=text/html
|
||||
.IP \-@iN
|
||||
internet protocol (0=both ipv6+ipv4, 4=ipv4 only, 6=ipv6 only) (\-\-protocol[=N])
|
||||
internet protocol (0=both ipv6+ipv4\, 4=ipv4 only\, 6=ipv6 only) (\-\-protocol[=N])
|
||||
.IP \-%w
|
||||
disable a specific external mime module (\-%w htsswf \-%w htsjava) (\-\-disable\-module <param>)
|
||||
|
||||
@@ -345,15 +345,15 @@ from email address sent in HTTP headers (\-\-from <param>)
|
||||
.IP \-%F
|
||||
footer string in Html code (\-%F "Mirrored [from host %s [file %s [at %s]]]") (\-\-footer <param>)
|
||||
.IP \-%l
|
||||
preferred language (\-%l "fr, en, jp, *") (\-\-language <param>)
|
||||
preferred language (\-%l "fr\, en\, jp\, *") (\-\-language <param>)
|
||||
.IP \-%a
|
||||
accepted formats (\-%a "text/html,image/png,image/jpeg,image/gif;q=0.9,*/*;q=0.1") (\-\-accept <param>)
|
||||
accepted formats (\-%a "text/html\,image/png\,image/jpeg\,image/gif;q=0.9\,*/*;q=0.1") (\-\-accept <param>)
|
||||
.IP \-%X
|
||||
additional HTTP header line (\-%X "X\-Magic: 42") (\-\-headers <param>)
|
||||
|
||||
.SS Log, index, cache
|
||||
.SS Log\, index\, cache
|
||||
.IP \-C
|
||||
create/use a cache for updates and retries (C0 no cache,C1 cache has priority,* C2 test update before) (\-\-cache[=N])
|
||||
create/use a cache for updates and retries (C0 no cache\,C1 cache has priority\,* C2 test update before) (\-\-cache[=N])
|
||||
.IP \-k
|
||||
store all files in cache (not useful if files on disk) (\-\-store\-all\-in\-cache)
|
||||
.IP \-%n
|
||||
@@ -385,7 +385,7 @@ make an searchable index for this mirror (* %I0 don t make) (\-\-search\-index)
|
||||
.IP \-pN
|
||||
priority mode: (* p3) (\-\-priority[=N])
|
||||
.IP \-p0
|
||||
just scan, don t save anything (for checking links)
|
||||
just scan\, don t save anything (for checking links)
|
||||
.IP \-p1
|
||||
save only html files
|
||||
.IP \-p2
|
||||
@@ -393,7 +393,7 @@ save only non html files
|
||||
.IP \-*p3
|
||||
save all files
|
||||
.IP \-p7
|
||||
get html files before, then treat other files
|
||||
get html files before\, then treat other files
|
||||
.IP \-S
|
||||
stay on the same directory (\-\-stay\-on\-same\-dir)
|
||||
.IP \-D
|
||||
@@ -455,9 +455,9 @@ generate transfer rate statictics every minutes (\-\-debug\-ratestats)
|
||||
|
||||
.SS Dangerous options: (do NOT use unless you exactly know what you are doing)
|
||||
.IP \-%!
|
||||
bypass built\-in security limits aimed to avoid bandwidth abuses (bandwidth, simultaneous connections) (\-\-disable\-security\-limits)
|
||||
bypass built\-in security limits aimed to avoid bandwidth abuses (bandwidth\, simultaneous connections) (\-\-disable\-security\-limits)
|
||||
.br
|
||||
IMPORTANT NOTE: DANGEROUS OPTION, ONLY SUITABLE FOR EXPERTS
|
||||
IMPORTANT NOTE: DANGEROUS OPTION\, ONLY SUITABLE FOR EXPERTS
|
||||
.br
|
||||
USE IT WITH EXTREME CARE
|
||||
|
||||
@@ -465,25 +465,25 @@ IT WITH EXTREME CARE
|
||||
.IP \-V
|
||||
execute system command after each files ($0 is the filename: \-V "rm \$0") (\-\-userdef\-cmd <param>)
|
||||
.IP \-%W
|
||||
use an external library function as a wrapper (\-%W myfoo.so[,myparameters]) (\-\-callback <param>)
|
||||
use an external library function as a wrapper (\-%W myfoo.so[\,myparameters]) (\-\-callback <param>)
|
||||
|
||||
.SS Details: Option N
|
||||
.IP \-N0
|
||||
Site\-structure (default)
|
||||
.IP \-N1
|
||||
HTML in web/, images/other files in web/images/
|
||||
HTML in web/\, images/other files in web/images/
|
||||
.IP \-N2
|
||||
HTML in web/HTML, images/other in web/images
|
||||
HTML in web/HTML\, images/other in web/images
|
||||
.IP \-N3
|
||||
HTML in web/, images/other in web/
|
||||
HTML in web/\, images/other in web/
|
||||
.IP \-N4
|
||||
HTML in web/, images/other in web/xxx, where xxx is the file extension (all gif will be placed onto web/gif, for example)
|
||||
HTML in web/\, images/other in web/xxx\, where xxx is the file extension (all gif will be placed onto web/gif\, for example)
|
||||
.IP \-N5
|
||||
Images/other in web/xxx and HTML in web/HTML
|
||||
.IP \-N99
|
||||
All files in web/, with random names (gadget !)
|
||||
All files in web/\, with random names (gadget !)
|
||||
.IP \-N100
|
||||
Site\-structure, without www.domain.xxx/
|
||||
Site\-structure\, without www.domain.xxx/
|
||||
.IP \-N101
|
||||
Identical to N1 except that "web" is replaced by the site's name
|
||||
.IP \-N102
|
||||
@@ -510,15 +510,15 @@ Identical to N5 exept that there is no "web" directory
|
||||
Identical to N99 except that there is no "web" directory
|
||||
.SS Details: User\-defined option N
|
||||
%n Name of file without file type (ex: image)
|
||||
%N Name of file, including file type (ex: image.gif)
|
||||
%N Name of file\, including file type (ex: image.gif)
|
||||
%t File type (ex: gif)
|
||||
%p Path [without ending /] (ex: /someimages)
|
||||
%h Host name (ex: www.someweb.com)
|
||||
%M URL MD5 (128 bits, 32 ascii bytes)
|
||||
%Q query string MD5 (128 bits, 32 ascii bytes)
|
||||
%M URL MD5 (128 bits\, 32 ascii bytes)
|
||||
%Q query string MD5 (128 bits\, 32 ascii bytes)
|
||||
%k full query string
|
||||
%r protocol name (ex: http)
|
||||
%q small query string MD5 (16 bits, 4 ascii bytes)
|
||||
%q small query string MD5 (16 bits\, 4 ascii bytes)
|
||||
%s? Short name version (ex: %sN)
|
||||
%[param] param variable in query string
|
||||
%[param:before:after:empty:notfound] advanced variable extraction
|
||||
@@ -535,11 +535,11 @@ Identical to N99 exept that there is no "web" directory
|
||||
.IP \-empty
|
||||
: string replacement if the parameter was empty
|
||||
.IP \-all
|
||||
fields, except the first one (the parameter name), can be empty
|
||||
fields\, except the first one (the parameter name)\, can be empty
|
||||
|
||||
.SS Details: Option K
|
||||
.IP \-K0
|
||||
foo.cgi?q=45 \-> foo4B54.html?q=45 (relative URI, default)
|
||||
foo.cgi?q=45 \-> foo4B54.html?q=45 (relative URI\, default)
|
||||
.IP \-K
|
||||
\-> http://www.foobar.com/folder/foo.cgi?q=45 (absolute URL) (\-\-keep\-links[=N])
|
||||
.IP \-K3
|
||||
@@ -553,7 +553,7 @@ foo.cgi?q=45 \-> foo4B54.html?q=45 (relative URI, default)
|
||||
.IP \-\-mirror
|
||||
<URLs> *make a mirror of site(s) (default)
|
||||
.IP \-\-get
|
||||
<URLs> get the files indicated, do not seek other URLs (\-qg)
|
||||
<URLs> get the files indicated\, do not seek other URLs (\-qg)
|
||||
.IP \-\-list
|
||||
<text file> add all URL located in this text file (\-%L)
|
||||
.IP \-\-mirrorlinks
|
||||
@@ -561,15 +561,15 @@ foo.cgi?q=45 \-> foo4B54.html?q=45 (relative URI, default)
|
||||
.IP \-\-testlinks
|
||||
<URLs> test links in pages (\-r1p0C0I0t)
|
||||
.IP \-\-spider
|
||||
<URLs> spider site(s), to test links: reports Errors & Warnings (\-p0C0I0t)
|
||||
<URLs> spider site(s)\, to test links: reports Errors & Warnings (\-p0C0I0t)
|
||||
.IP \-\-testsite
|
||||
<URLs> identical to \-\-spider
|
||||
.IP \-\-skeleton
|
||||
<URLs> make a mirror, but gets only html files (\-p1)
|
||||
<URLs> make a mirror\, but gets only html files (\-p1)
|
||||
.IP \-\-update
|
||||
update a mirror, without confirmation (\-iC2)
|
||||
update a mirror\, without confirmation (\-iC2)
|
||||
.IP \-\-continue
|
||||
continue a mirror, without confirmation (\-iC1)
|
||||
continue a mirror\, without confirmation (\-iC1)
|
||||
|
||||
.IP \-\-catchurl
|
||||
create a temporary proxy to capture an URL or a form post URL
|
||||
|
||||
Reference in New Issue
Block a user