mirror of
https://github.com/xroche/httrack.git
synced 2026-05-17 08:26:14 +03:00
2622 lines
58 KiB
HTML
2622 lines
58 KiB
HTML
<!-- Creator : groff version 1.18.1 -->
|
|
<!-- CreationDate: Mon Jul 28 23:17:44 2008 -->
|
|
<html>
|
|
<head>
|
|
<meta name="generator" content="groff -Thtml, see www.gnu.org">
|
|
<meta name="Content-Style" content="text/css">
|
|
<title>httrack</title>
|
|
</head>
|
|
<body>
|
|
|
|
<h1 align=center>httrack</h1>
|
|
<a href="#NAME">NAME</a><br>
|
|
<a href="#SYNOPSIS">SYNOPSIS</a><br>
|
|
<a href="#DESCRIPTION">DESCRIPTION</a><br>
|
|
<a href="#EXAMPLES">EXAMPLES</a><br>
|
|
<a href="#OPTIONS">OPTIONS</a><br>
|
|
<a href="#FILES">FILES</a><br>
|
|
<a href="#ENVIRONMENT">ENVIRONMENT</a><br>
|
|
<a href="#DIAGNOSTICS">DIAGNOSTICS</a><br>
|
|
<a href="#LIMITS">LIMITS</a><br>
|
|
<a href="#BUGS">BUGS</a><br>
|
|
<a href="#COPYRIGHT">COPYRIGHT</a><br>
|
|
<a href="#AVAILABILITY">AVAILABILITY</a><br>
|
|
<a href="#AUTHOR">AUTHOR</a><br>
|
|
<a href="#SEE ALSO">SEE ALSO</a><br>
|
|
|
|
<hr>
|
|
<a name="NAME"></a>
|
|
<h2>NAME</h2>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p>httrack − offline browser : copy websites to a
|
|
local directory</p>
|
|
</td>
|
|
</table>
|
|
<a name="SYNOPSIS"></a>
|
|
<h2>SYNOPSIS</h2>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p><b>httrack [ url ]... [ -filter ]... [ +filter ]...</b> [
|
|
<b>-O, --path</b> ] [ <b>-%O, --chroot</b> ] [ <b>-w, --mirror</b> ] [ <b>-W,
|
|
--mirror-wizard</b> ] [ <b>-g, --get-files</b> ] [ <b>-i,
|
|
--continue</b> ] [ <b>-Y, --mirrorlinks</b> ] [ <b>-P,
|
|
--proxy</b> ] [ <b>-%f, --httpproxy-ftp[=N]</b> ] [ <b>-%b,
|
|
--bind</b> ] [ <b>-rN, --depth[=N]</b> ] [ <b>-%eN,
|
|
--ext-depth[=N]</b> ] [ <b>-mN, --max-files[=N]</b> ] [
|
|
<b>-MN, --max-size[=N]</b> ] [ <b>-EN, --max-time[=N]</b> ]
|
|
[ <b>-AN, --max-rate[=N]</b> ] [ <b>-%cN,
|
|
--connection-per-second[=N]</b> ] [ <b>-GN,
|
|
--max-pause[=N]</b> ] [ <b>-%mN, --max-mms-time[=N]</b> ] [
|
|
<b>-cN, --sockets[=N]</b> ] [ <b>-TN, --timeout</b> ] [
|
|
<b>-RN, --retries[=N]</b> ] [ <b>-JN, --min-rate[=N]</b> ] [
|
|
<b>-HN, --host-control[=N]</b> ] [ <b>-%P,
|
|
--extended-parsing[=N]</b> ] [ <b>-n, --near</b> ] [ <b>-t,
|
|
--test</b> ] [ <b>-%L, --list</b> ] [ <b>-%S, --urllist</b>
|
|
] [ <b>-NN, --structure[=N]</b> ] [ <b>-%D,
|
|
--cached-delayed-type-check</b> ] [ <b>-%M, --mime-html</b>
|
|
] [ <b>-LN, --long-names[=N]</b> ] [ <b>-KN,
|
|
--keep-links[=N]</b> ] [ <b>-x, --replace-external</b> ] [
|
|
<b>-%x, --disable-passwords</b> ] [ <b>-%q,
|
|
--include-query-string</b> ] [ <b>-o, --generate-errors</b>
|
|
] [ <b>-X, --purge-old[=N]</b> ] [ <b>-%p, --preserve</b> ]
|
|
[ <b>-bN, --cookies[=N]</b> ] [ <b>-u, --check-type[=N]</b>
|
|
] [ <b>-j, --parse-java[=N]</b> ] [ <b>-sN, --robots[=N]</b>
|
|
] [ <b>-%h, --http-10</b> ] [ <b>-%k, --keep-alive</b> ] [
|
|
<b>-%B, --tolerant</b> ] [ <b>-%s, --updatehack</b> ] [
|
|
<b>-%u, --urlhack</b> ] [ <b>-%A, --assume</b> ] [ <b>-@iN,
|
|
--protocol[=N]</b> ] [ <b>-%w, --disable-module</b> ] [
|
|
<b>-F, --user-agent</b> ] [ <b>-%R, --referer</b> ] [
|
|
<b>-%E, --from</b> ] [ <b>-%F, --footer</b> ] [ <b>-%l,
|
|
--language</b> ] [ <b>-C, --cache[=N]</b> ] [ <b>-k,
|
|
--store-all-in-cache</b> ] [ <b>-%n, --do-not-recatch</b> ]
|
|
[ <b>-%v, --display</b> ] [ <b>-Q, --do-not-log</b> ] [
|
|
<b>-q, --quiet</b> ] [ <b>-z, --extra-log</b> ] [ <b>-Z,
|
|
--debug-log</b> ] [ <b>-v, --verbose</b> ] [ <b>-f,
|
|
--file-log</b> ] [ <b>-f2, --single-log</b> ] [ <b>-I,
|
|
--index</b> ] [ <b>-%i, --build-top-index</b> ] [ <b>-%I,
|
|
--search-index</b> ] [ <b>-pN, --priority[=N]</b> ] [ <b>-S,
|
|
--stay-on-same-dir</b> ] [ <b>-D, --can-go-down</b> ] [
|
|
<b>-U, --can-go-up</b> ] [ <b>-B, --can-go-up-and-down</b> ]
|
|
[ <b>-a, --stay-on-same-address</b> ] [ <b>-d,
|
|
--stay-on-same-domain</b> ] [ <b>-l, --stay-on-same-tld</b>
|
|
] [ <b>-e, --go-everywhere</b> ] [ <b>-%H,
|
|
--debug-headers</b> ] [ <b>-%!,
|
|
--disable-security-limits</b> ] [ <b>-V, --userdef-cmd</b> ]
|
|
[ <b>-%U, --user</b> ] [ <b>-%W, --callback</b> ] [ <b>-K,
|
|
--keep-links[=N]</b> ]</p>
|
|
</td>
|
|
</table>
|
|
<a name="DESCRIPTION"></a>
|
|
<h2>DESCRIPTION</h2>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p><b>httrack</b> allows you to download a World Wide Web
|
|
site from the Internet to a local directory, building
|
|
recursively all directories, getting HTML, images, and other
|
|
files from the server to your computer. HTTrack arranges the
|
|
original site’s relative link-structure. Simply open a
|
|
page of the "mirrored" website in your browser,
|
|
and you can browse the site from link to link, as if you
|
|
were viewing it online. HTTrack can also update an existing
|
|
mirrored site, and resume interrupted downloads.</p>
|
|
</td>
|
|
</table>
|
|
<a name="EXAMPLES"></a>
|
|
<h2>EXAMPLES</h2>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p><b>httrack www.someweb.com/bob/</b></p></td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="21%"></td>
|
|
<td width="77%">
|
|
<p>mirror site www.someweb.com/bob/ and only this site</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p><b>httrack www.someweb.com/bob/ www.anothertest.com/mike/
|
|
+*.com/*.jpg -mime:application/*</b></p></td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="21%"></td>
|
|
<td width="77%">
|
|
<p>mirror the two sites together (with shared links) and
|
|
accept any .jpg files on .com sites</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p><b>httrack www.someweb.com/bob/bobby.html +*
|
|
-r6</b></p></td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="21%"></td>
|
|
<td width="77%">
|
|
<p>means get all files starting from bobby.html, with 6
|
|
link-depth, and possibility of going everywhere on the
|
|
web</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p><b>httrack www.someweb.com/bob/bobby.html --spider -P
|
|
proxy.myhost.com:8080</b></p></td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="21%"></td>
|
|
<td width="77%">
|
|
<p>runs the spider on www.someweb.com/bob/bobby.html using a
|
|
proxy</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p><b>httrack --update</b></p></td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="21%"></td>
|
|
<td width="77%">
|
|
<p>updates a mirror in the current folder</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p><b>httrack</b></p></td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="21%"></td>
|
|
<td width="77%">
|
|
<p>will bring you to the interactive mode</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p><b>httrack --continue</b></p></td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="21%"></td>
|
|
<td width="77%">
|
|
<p>continues a mirror in the current folder</p>
|
|
</td>
|
|
</table>
|
|
<a name="OPTIONS"></a>
|
|
<h2>OPTIONS</h2>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="4%"></td>
|
|
<td width="95%">
|
|
<p><b>General options:</b></p></td>
|
|
</table>
|
|
<!-- TABS -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="4" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="4%">
|
|
|
|
<p>-O</p>
|
|
</td>
|
|
<td width="5%"></td>
|
|
<td width="77%">
|
|
|
|
<p>path for mirror/logfiles+cache (-O path mirror[,path
|
|
cache and logfiles]) (--path &lt;param&gt;)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="4%">
|
|
|
|
<p>-%O</p>
|
|
</td>
|
|
<td width="5%"></td>
|
|
<td width="77%">
|
|
|
|
<p>chroot path to, must be r00t (-%O root path) (--chroot
|
|
&lt;param&gt;)</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="4%"></td>
|
|
<td width="95%">
|
|
<p><b>Action options:</b></p></td>
|
|
</table>
|
|
<!-- TABS -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="4" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-w</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>*mirror web sites (--mirror)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-W</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>mirror web sites, semi-automatic (asks questions)
|
|
(--mirror-wizard)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-g</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>just get files (saved in the current directory)
|
|
(--get-files)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-i</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>continue an interrupted mirror using the cache
|
|
(--continue)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-Y</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>mirror ALL links located in the first level pages
|
|
(mirror links) (--mirrorlinks)</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="4%"></td>
|
|
<td width="95%">
|
|
<p><b>Proxy options:</b></p></td>
|
|
</table>
|
|
<!-- TABS -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="4" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="4%">
|
|
|
|
<p>-P</p>
|
|
</td>
|
|
<td width="5%"></td>
|
|
<td width="77%">
|
|
|
|
<p>proxy use (-P proxy:port or -P user:pass@proxy:port)
|
|
(--proxy &lt;param&gt;)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="4%">
|
|
|
|
<p>-%f</p>
|
|
</td>
|
|
<td width="5%"></td>
|
|
<td width="77%">
|
|
|
|
<p>*use proxy for ftp (f0 don't use)
|
|
(--httpproxy-ftp[=N])</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="4%">
|
|
|
|
<p>-%b</p>
|
|
</td>
|
|
<td width="5%"></td>
|
|
<td width="77%">
|
|
|
|
<p>use this local hostname to make/send requests (-%b
|
|
hostname) (--bind &lt;param&gt;)</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="4%"></td>
|
|
<td width="95%">
|
|
<p><b>Limits options:</b></p></td>
|
|
</table>
|
|
<!-- TABS -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="4" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-rN</p>
|
|
</td>
|
|
<td width="1%"></td>
|
|
<td width="77%">
|
|
|
|
<p>set the mirror depth to N (* r9999) (--depth[=N])</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-%eN</p>
|
|
</td>
|
|
<td width="1%"></td>
|
|
<td width="77%">
|
|
|
|
<p>set the external links depth to N (* %e0)
|
|
(--ext-depth[=N])</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-mN</p>
|
|
</td>
|
|
<td width="1%"></td>
|
|
<td width="77%">
|
|
|
|
<p>maximum file length for a non-html file
|
|
(--max-files[=N])</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-mN,N2</p>
|
|
</td>
|
|
<td width="1%"></td>
|
|
<td width="77%">
|
|
|
|
<p>maximum file length for non html (N) and html (N2)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-MN</p>
|
|
</td>
|
|
<td width="1%"></td>
|
|
<td width="77%">
|
|
|
|
<p>maximum overall size that can be uploaded/scanned
|
|
(--max-size[=N])</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-EN</p>
|
|
</td>
|
|
<td width="1%"></td>
|
|
<td width="77%">
|
|
|
|
<p>maximum mirror time in seconds (60=1 minute, 3600=1
|
|
hour) (--max-time[=N])</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-AN</p>
|
|
</td>
|
|
<td width="1%"></td>
|
|
<td width="77%">
|
|
|
|
<p>maximum transfer rate in bytes/seconds (1000=1KB/s max)
|
|
(--max-rate[=N])</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-%cN</p>
|
|
</td>
|
|
<td width="1%"></td>
|
|
<td width="77%">
|
|
|
|
<p>maximum number of connections/seconds (*%c10)
|
|
(--connection-per-second[=N])</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-GN</p>
|
|
</td>
|
|
<td width="1%"></td>
|
|
<td width="77%">
|
|
|
|
<p>pause transfer if N bytes reached, and wait until lock
|
|
file is deleted (--max-pause[=N])</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-%mN</p>
|
|
</td>
|
|
<td width="1%"></td>
|
|
<td width="77%">
|
|
|
|
<p>maximum mms stream download time in seconds (60=1
|
|
minute, 3600=1 hour) (--max-mms-time[=N])</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="4%"></td>
|
|
<td width="95%">
|
|
<p><b>Flow control:</b></p></td>
|
|
</table>
|
|
<!-- TABS -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="4" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="7%">
|
|
|
|
<p>-cN</p>
|
|
</td>
|
|
<td width="2%"></td>
|
|
<td width="77%">
|
|
|
|
<p>number of multiple connections (*c8) (--sockets[=N])</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="7%">
|
|
|
|
<p>-TN</p>
|
|
</td>
|
|
<td width="2%"></td>
|
|
<td width="77%">
|
|
|
|
<p>timeout, number of seconds after a non-responding link
|
|
is shutdown (--timeout)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="7%">
|
|
|
|
<p>-RN</p>
|
|
</td>
|
|
<td width="2%"></td>
|
|
<td width="77%">
|
|
|
|
<p>number of retries, in case of timeout or non-fatal
|
|
errors (*R1) (--retries[=N])</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="7%">
|
|
|
|
<p>-JN</p>
|
|
</td>
|
|
<td width="2%"></td>
|
|
<td width="77%">
|
|
|
|
<p>traffic jam control, minimum transfer rate
|
|
(bytes/seconds) tolerated for a link (--min-rate[=N])</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="7%">
|
|
|
|
<p>-HN</p>
|
|
</td>
|
|
<td width="2%"></td>
|
|
<td width="77%">
|
|
|
|
<p>host is abandoned if: 0=never, 1=timeout, 2=slow,
|
|
3=timeout or slow (--host-control[=N])</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="4%"></td>
|
|
<td width="95%">
|
|
<p><b>Links options:</b></p></td>
|
|
</table>
|
|
<!-- TABS -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="4" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-%P</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>*extended parsing, attempt to parse all links, even in
|
|
unknown tags or Javascript (%P0 don't use)
|
|
(--extended-parsing[=N])</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-n</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>get non-html files near an html file (ex: an image
|
|
located outside) (--near)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-t</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>test all URLs (even forbidden ones) (--test)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-%L</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>&lt;file&gt; add all URLs located in this text file (one
|
|
URL per line) (--list &lt;param&gt;)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-%S</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>&lt;file&gt; add all scan rules located in this text
|
|
file (one scan rule per line) (--urllist &lt;param&gt;)</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="4%"></td>
|
|
<td width="95%">
|
|
<p><b>Build options:</b></p></td>
|
|
</table>
|
|
<!-- TABS -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="4" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-NN</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>structure type (0 *original structure, 1+: see below)
|
|
(--structure[=N])</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-or</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>user defined structure (-N "%h%p/%n%q.%t")</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-%N</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>delayed type check, don't make any link test but wait
|
|
for files download to start instead (experimental) (%N0
|
|
don't use, %N1 use for unknown extensions, * %N2 always use)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-%D</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>cached delayed type check, don't wait for remote type
|
|
during updates, to speed them up (%D0 wait, * %D1 don't wait)
|
|
(--cached-delayed-type-check)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-%M</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>generate an RFC MIME-encapsulated full-archive (.mht)
|
|
(--mime-html)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-LN</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>long names (L1 *long names / L0 8-3 conversion / L2
|
|
ISO9660 compatible) (--long-names[=N])</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-KN</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>keep original links (e.g. http://www.adr/link) (K0
|
|
*relative link, K absolute links, K4 original links, K3
|
|
absolute URI links) (--keep-links[=N])</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-x</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>replace external html links by error pages
|
|
(--replace-external)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-%x</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>do not include any password for external password
|
|
protected websites (%x0 include) (--disable-passwords)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-%q</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>*include query string for local files (useless, for
|
|
information purpose only) (%q0 don't include)
|
|
(--include-query-string)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-o</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>*generate output html file in case of error (404..) (o0
|
|
don't generate) (--generate-errors)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-X</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>*purge old files after update (X0 keep delete)
|
|
(--purge-old[=N])</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-%p</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>preserve html files as is (identical to -K4 -%F
|
|
"" ) (--preserve)</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="4%"></td>
|
|
<td width="95%">
|
|
<p><b>Spider options:</b></p></td>
|
|
</table>
|
|
<!-- TABS -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="4" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-bN</p>
|
|
</td>
|
|
<td width="1%"></td>
|
|
<td width="77%">
|
|
|
|
<p>accept cookies in cookies.txt (0=do not accept,*
|
|
1=accept) (--cookies[=N])</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-u</p>
|
|
</td>
|
|
<td width="1%"></td>
|
|
<td width="77%">
|
|
|
|
<p>check document type if unknown (cgi,asp..) (u0 don't
|
|
check, * u1 check but /, u2 check always)
|
|
(--check-type[=N])</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-j</p>
|
|
</td>
|
|
<td width="1%"></td>
|
|
<td width="77%">
|
|
|
|
<p>*parse Java Classes (j0 don't parse, bitmask: |1 parse
|
|
default, |2 don't parse .class |4 don't parse .js |8 don't
|
|
be aggressive) (--parse-java[=N])</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-sN</p>
|
|
</td>
|
|
<td width="1%"></td>
|
|
<td width="77%">
|
|
|
|
<p>follow robots.txt and meta robots tags
|
|
(0=never,1=sometimes,* 2=always, 3=always (even strict
|
|
rules)) (--robots[=N])</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-%h</p>
|
|
</td>
|
|
<td width="1%"></td>
|
|
<td width="77%">
|
|
|
|
<p>force HTTP/1.0 requests (reduce update features, only
|
|
for old servers or proxies) (--http-10)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-%k</p>
|
|
</td>
|
|
<td width="1%"></td>
|
|
<td width="77%">
|
|
|
|
<p>use keep-alive if possible, greatly reducing latency
|
|
for small files and test requests (%k0 don't use)
|
|
(--keep-alive)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-%B</p>
|
|
</td>
|
|
<td width="1%"></td>
|
|
<td width="77%">
|
|
|
|
<p>tolerant requests (accept bogus responses on some
|
|
servers, but not standard!) (--tolerant)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-%s</p>
|
|
</td>
|
|
<td width="1%"></td>
|
|
<td width="77%">
|
|
|
|
<p>update hacks: various hacks to limit re-transfers when
|
|
updating (identical size, bogus response..)
|
|
(--updatehack)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-%u</p>
|
|
</td>
|
|
<td width="1%"></td>
|
|
<td width="77%">
|
|
|
|
<p>url hacks: various hacks to limit duplicate URLs (strip
|
|
//, www.foo.com==foo.com..) (--urlhack)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-%A</p>
|
|
</td>
|
|
<td width="1%"></td>
|
|
<td width="77%">
|
|
|
|
<p>assume that a type (cgi,asp..) is always linked with a
|
|
mime type (-%A php3,cgi=text/html;dat,bin=application/x-zip)
|
|
(--assume &lt;param&gt;)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-can</p>
|
|
</td>
|
|
<td width="1%"></td>
|
|
<td width="77%">
|
|
|
|
<p>also be used to force a specific file type: --assume
|
|
foo.cgi=text/html</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-@iN</p>
|
|
</td>
|
|
<td width="1%"></td>
|
|
<td width="77%">
|
|
|
|
<p>internet protocol (0=both ipv6+ipv4, 4=ipv4 only, 6=ipv6
|
|
only) (--protocol[=N])</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-%w</p>
|
|
</td>
|
|
<td width="1%"></td>
|
|
<td width="77%">
|
|
|
|
<p>disable a specific external mime module (-%w htsswf -%w
|
|
htsjava) (--disable-module &lt;param&gt;)</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="4%"></td>
|
|
<td width="95%">
|
|
<p><b>Browser ID:</b></p></td>
|
|
</table>
|
|
<!-- TABS -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="4" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-F</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>user-agent field sent in HTTP headers (-F
|
|
"user-agent name") (--user-agent
|
|
&lt;param&gt;)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-%R</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>default referer field sent in HTTP headers (--referer
|
|
&lt;param&gt;)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-%E</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>from email address sent in HTTP headers (--from
|
|
&lt;param&gt;)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-%F</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>footer string in Html code (-%F "Mirrored [from
|
|
host %s [file %s [at %s]]]") (--footer
|
|
&lt;param&gt;)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-%l</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>preferred language (-%l "fr, en, jp, *")
|
|
(--language &lt;param&gt;)</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="4%"></td>
|
|
<td width="95%">
|
|
<p><b>Log, index, cache</b></p></td>
|
|
</table>
|
|
<!-- TABS -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="4" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-C</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>create/use a cache for updates and retries (C0 no
|
|
cache,C1 cache has priority,* C2 test update before)
|
|
(--cache[=N])</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-k</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>store all files in cache (not useful if files on disk)
|
|
(--store-all-in-cache)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-%n</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>do not re-download locally erased files
|
|
(--do-not-recatch)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-%v</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>display on screen filenames downloaded (in realtime) - *
|
|
%v1 short version - %v2 full animation (--display)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-Q</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>no log - quiet mode (--do-not-log)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-q</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>no questions - quiet mode (--quiet)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-z</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>log - extra info (--extra-log)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-Z</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>log - debug (--debug-log)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-v</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>log on screen (--verbose)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-f</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>*log in files (--file-log)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-f2</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>one single log file (--single-log)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-I</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>*make an index (I0 don't make) (--index)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-%i</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>make a top index for a project folder (* %i0 don't make)
|
|
(--build-top-index)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-%I</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>make a searchable index for this mirror (* %I0 don't
|
|
make) (--search-index)</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="4%"></td>
|
|
<td width="95%">
|
|
<p><b>Expert options:</b></p></td>
|
|
</table>
|
|
<!-- TABS -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="4" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-pN</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>priority mode: (* p3) (--priority[=N])</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-p0</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>just scan, don't save anything (for checking links)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-p1</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>save only html files</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-p2</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>save only non html files</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-*p3</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>save all files</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-p7</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>get html files before, then treat other files</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-S</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>stay on the same directory (--stay-on-same-dir)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-D</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>*can only go down into subdirs (--can-go-down)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-U</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>can only go to upper directories (--can-go-up)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-B</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>can both go up&amp;down into the directory structure
|
|
(--can-go-up-and-down)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-a</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>*stay on the same address (--stay-on-same-address)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-d</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>stay on the same principal domain
|
|
(--stay-on-same-domain)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-l</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>stay on the same TLD (eg: .com) (--stay-on-same-tld)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-e</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>go everywhere on the web (--go-everywhere)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-%H</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>debug HTTP headers in logfile (--debug-headers)</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="4%"></td>
|
|
<td width="95%">
|
|
<p><b>Guru options: (do NOT use if possible)</b></p></td>
|
|
</table>
|
|
<!-- TABS -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="4" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="7%">
|
|
|
|
<p>-#X</p>
|
|
</td>
|
|
<td width="2%"></td>
|
|
<td width="77%">
|
|
|
|
<p>*use optimized engine (limited memory boundary checks)
|
|
(--fast-engine)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="7%">
|
|
|
|
<p>-#0</p>
|
|
</td>
|
|
<td width="2%"></td>
|
|
<td width="77%">
|
|
|
|
<p>filter test (-#0 *.gif www.bar.com/foo.gif )
|
|
(--debug-testfilters &lt;param&gt;)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="7%">
|
|
|
|
<p>-#1</p>
|
|
</td>
|
|
<td width="2%"></td>
|
|
<td width="77%">
|
|
|
|
<p>simplify test (-#1 ./foo/bar/../foobar)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="7%">
|
|
|
|
<p>-#2</p>
|
|
</td>
|
|
<td width="2%"></td>
|
|
<td width="77%">
|
|
|
|
<p>type test (-#2 /foo/bar.php)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="7%">
|
|
|
|
<p>-#C</p>
|
|
</td>
|
|
<td width="2%"></td>
|
|
<td width="77%">
|
|
|
|
<p>cache list (-#C *.com/spider*.gif) (--debug-cache
|
|
&lt;param&gt;)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="7%">
|
|
|
|
<p>-#R</p>
|
|
</td>
|
|
<td width="2%"></td>
|
|
<td width="77%">
|
|
|
|
<p>cache repair (damaged cache) (--repair-cache)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="7%">
|
|
|
|
<p>-#d</p>
|
|
</td>
|
|
<td width="2%"></td>
|
|
<td width="77%">
|
|
|
|
<p>debug parser (--debug-parsing)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="7%">
|
|
|
|
<p>-#E</p>
|
|
</td>
|
|
<td width="2%"></td>
|
|
<td width="77%">
|
|
|
|
<p>extract new.zip cache meta-data in meta.zip</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="7%">
|
|
|
|
<p>-#f</p>
|
|
</td>
|
|
<td width="2%"></td>
|
|
<td width="77%">
|
|
|
|
<p>always flush log files (--advanced-flushlogs)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="7%">
|
|
|
|
<p>-#FN</p>
|
|
</td>
|
|
<td width="2%"></td>
|
|
<td width="77%">
|
|
|
|
<p>maximum number of filters
|
|
(--advanced-maxfilters[=N])</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="7%">
|
|
|
|
<p>-#h</p>
|
|
</td>
|
|
<td width="2%"></td>
|
|
<td width="77%">
|
|
|
|
<p>version info (--version)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="7%">
|
|
|
|
<p>-#K</p>
|
|
</td>
|
|
<td width="2%"></td>
|
|
<td width="77%">
|
|
|
|
<p>scan stdin (debug) (--debug-scanstdin)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="7%">
|
|
|
|
<p>-#L</p>
|
|
</td>
|
|
<td width="2%"></td>
|
|
<td width="77%">
|
|
|
|
<p>maximum number of links (-#L1000000)
|
|
(--advanced-maxlinks)</p>
|
|
</td>
|
|
</table>
|
|
<!-- TABS -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="4" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-#p</p>
|
|
</td>
|
|
<td width="1%"></td>
|
|
<td width="77%">
|
|
|
|
<p>display ugly progress information
|
|
(--advanced-progressinfo)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-#P</p>
|
|
</td>
|
|
<td width="1%"></td>
|
|
<td width="77%">
|
|
|
|
<p>catch URL (--catch-url)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-#R</p>
|
|
</td>
|
|
<td width="1%"></td>
|
|
<td width="77%">
|
|
|
|
<p>old FTP routines (debug) (--repair-cache)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-#T</p>
|
|
</td>
|
|
<td width="1%"></td>
|
|
<td width="77%">
|
|
|
|
<p>generate transfer ops. log every minute
|
|
(--debug-xfrstats)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-#u</p>
|
|
</td>
|
|
<td width="1%"></td>
|
|
<td width="77%">
|
|
|
|
<p>wait time (--advanced-wait)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-#Z</p>
|
|
</td>
|
|
<td width="1%"></td>
|
|
<td width="77%">
|
|
|
|
<p>generate transfer rate statistics every minute
|
|
(--debug-ratestats)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-#!</p>
|
|
</td>
|
|
<td width="1%"></td>
|
|
<td width="77%">
|
|
|
|
<p>execute a shell command (-#! "echo hello")
|
|
(--exec &lt;param&gt;)</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="4%"></td>
|
|
<td width="95%">
|
|
<p><b>Dangerous options: (do NOT use unless you exactly know
|
|
what you are doing)</b></p></td>
|
|
</table>
|
|
<!-- TABS -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="4" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="4%">
|
|
|
|
<p>-%!</p>
|
|
</td>
|
|
<td width="5%"></td>
|
|
<td width="77%">
|
|
|
|
<p>bypass built-in security limits aimed to avoid bandwidth
|
|
abuses (bandwidth, simultaneous connections)
|
|
(--disable-security-limits)</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p>-IMPORTANT</p></td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="21%"></td>
|
|
<td width="77%">
|
|
<p>NOTE: DANGEROUS OPTION, ONLY SUITABLE FOR EXPERTS</p>
|
|
</td>
|
|
</table>
|
|
<!-- TABS -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="5" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-USE</p>
|
|
</td>
|
|
<td width="13%"></td>
|
|
<td width="29%">
|
|
|
|
<p>IT WITH EXTREME CARE</p>
|
|
</td>
|
|
<td width="39%">
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="4%"></td>
|
|
<td width="95%">
|
|
<p><b>Command-line specific options:</b></p></td>
|
|
</table>
|
|
<!-- TABS -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="4" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-V</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>execute system command after each file ($0 is the
|
|
filename: -V "rm \$0") (--userdef-cmd
|
|
&lt;param&gt;)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-%U</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>run the engine with another id when called as root (-%U
|
|
smith) (--user &lt;param&gt;)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-%W</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>use an external library function as a wrapper (-%W
|
|
myfoo.so[,myparameters]) (--callback &lt;param&gt;)</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="4%"></td>
|
|
<td width="95%">
|
|
<p><b>Details: Option N</b></p></td>
|
|
</table>
|
|
<!-- TABS -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="3" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="10%">
|
|
|
|
<p>-N0</p>
|
|
</td>
|
|
<td width="77%">
|
|
|
|
<p>Site-structure (default)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="10%">
|
|
|
|
<p>-N1</p>
|
|
</td>
|
|
<td width="77%">
|
|
|
|
<p>HTML in web/, images/other files in web/images/</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="10%">
|
|
|
|
<p>-N2</p>
|
|
</td>
|
|
<td width="77%">
|
|
|
|
<p>HTML in web/HTML, images/other in web/images</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="10%">
|
|
|
|
<p>-N3</p>
|
|
</td>
|
|
<td width="77%">
|
|
|
|
<p>HTML in web/, images/other in web/</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="10%">
|
|
|
|
<p>-N4</p>
|
|
</td>
|
|
<td width="77%">
|
|
|
|
<p>HTML in web/, images/other in web/xxx, where xxx is the
|
|
file extension (all gif will be placed onto web/gif, for
|
|
example)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="10%">
|
|
|
|
<p>-N5</p>
|
|
</td>
|
|
<td width="77%">
|
|
|
|
<p>Images/other in web/xxx and HTML in web/HTML</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="10%">
|
|
|
|
<p>-N99</p>
|
|
</td>
|
|
<td width="77%">
|
|
|
|
<p>All files in web/, with random names (gadget !)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="10%">
|
|
|
|
<p>-N100</p>
|
|
</td>
|
|
<td width="77%">
|
|
|
|
<p>Site-structure, without www.domain.xxx/</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="10%">
|
|
|
|
<p>-N101</p>
|
|
</td>
|
|
<td width="77%">
|
|
|
|
<p>Identical to N1 except that "web" is replaced
|
|
by the site's name</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="10%">
|
|
|
|
<p>-N102</p>
|
|
</td>
|
|
<td width="77%">
|
|
|
|
<p>Identical to N2 except that "web" is replaced
|
|
by the site's name</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="10%">
|
|
|
|
<p>-N103</p>
|
|
</td>
|
|
<td width="77%">
|
|
|
|
<p>Identical to N3 except that "web" is replaced
|
|
by the site's name</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="10%">
|
|
|
|
<p>-N104</p>
|
|
</td>
|
|
<td width="77%">
|
|
|
|
<p>Identical to N4 except that "web" is replaced
|
|
by the site's name</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="10%">
|
|
|
|
<p>-N105</p>
|
|
</td>
|
|
<td width="77%">
|
|
|
|
<p>Identical to N5 except that "web" is replaced
|
|
by the site's name</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="10%">
|
|
|
|
<p>-N199</p>
|
|
</td>
|
|
<td width="77%">
|
|
|
|
<p>Identical to N99 except that "web" is replaced
|
|
by the site's name</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="10%">
|
|
|
|
<p>-N1001</p>
|
|
</td>
|
|
<td width="77%">
|
|
|
|
<p>Identical to N1 except that there is no "web"
|
|
directory</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="10%">
|
|
|
|
<p>-N1002</p>
|
|
</td>
|
|
<td width="77%">
|
|
|
|
<p>Identical to N2 except that there is no "web"
|
|
directory</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="10%">
|
|
|
|
<p>-N1003</p>
|
|
</td>
|
|
<td width="77%">
|
|
|
|
<p>Identical to N3 except that there is no "web"
|
|
directory (option set for g option)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="10%">
|
|
|
|
<p>-N1004</p>
|
|
</td>
|
|
<td width="77%">
|
|
|
|
<p>Identical to N4 except that there is no "web"
|
|
directory</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="10%">
|
|
|
|
<p>-N1005</p>
|
|
</td>
|
|
<td width="77%">
|
|
|
|
<p>Identical to N5 except that there is no "web"
|
|
directory</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="10%">
|
|
|
|
<p>-N1099</p>
|
|
</td>
|
|
<td width="77%">
|
|
|
|
<p>Identical to N99 except that there is no "web"
|
|
directory</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="4%"></td>
|
|
<td width="95%">
|
|
<p><b>Details: User-defined option N</b></p></td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p>%n Name of file without file type (ex: image) %N Name of
|
|
file, including file type (ex: image.gif) %t File type (ex:
|
|
gif) %p Path [without ending /] (ex: /someimages) %h Host
|
|
name (ex: www.someweb.com) %M URL MD5 (128 bits, 32 ascii
|
|
bytes) %Q query string MD5 (128 bits, 32 ascii bytes) %r
|
|
protocol name (ex: http) %q small query string MD5 (16 bits,
|
|
4 ascii bytes) %s? Short name version (ex: %sN) %[param]
|
|
param variable in query string
|
|
%[param:before:after:empty:notfound] advanced variable
|
|
extraction</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="4%"></td>
|
|
<td width="95%">
|
|
<p><b>Details: User-defined option N and advanced variable
|
|
extraction</b></p></td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p>%[param:before:after:empty:notfound]</p>
|
|
</td>
|
|
</table>
|
|
<!-- TABS -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="5" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-param</p>
|
|
</td>
|
|
<td width="13%"></td>
|
|
<td width="23%">
|
|
|
|
<p>: parameter name</p>
|
|
</td>
|
|
<td width="42%">
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p>-before</p></td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="21%"></td>
|
|
<td width="77%">
|
|
<p>: string to prepend if the parameter was found</p>
|
|
</td>
|
|
</table>
|
|
<!-- TABS -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="5" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-after</p>
|
|
</td>
|
|
<td width="13%"></td>
|
|
<td width="66%">
|
|
|
|
<p>: string to append if the parameter was found</p>
|
|
</td>
|
|
<td width="0%">
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p>-notfound</p></td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="21%"></td>
|
|
<td width="77%">
|
|
<p>: string replacement if the parameter could not be
|
|
found</p>
|
|
</td>
|
|
</table>
|
|
<!-- TABS -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="4" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-empty</p>
|
|
</td>
|
|
<td width="1%"></td>
|
|
<td width="77%">
|
|
|
|
<p>: string replacement if the parameter was empty</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="8%">
|
|
|
|
<p>-all</p>
|
|
</td>
|
|
<td width="1%"></td>
|
|
<td width="77%">
|
|
|
|
<p>fields, except the first one (the parameter name), can
|
|
be empty</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="4%"></td>
|
|
<td width="95%">
|
|
<p><b>Details: Option K</b></p></td>
|
|
</table>
|
|
<!-- TABS -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="4" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-K0</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>foo.cgi?q=45 -> foo4B54.html?q=45 (relative URI,
|
|
default)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-K</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>-> http://www.foobar.com/folder/foo.cgi?q=45
|
|
(absolute URL) (--keep-links[=N])</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-K4</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>-> foo.cgi?q=45 (original URL)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>-K3</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>-> /folder/foo.cgi?q=45 (absolute URI)</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="4%"></td>
|
|
<td width="95%">
|
|
<p><b>Shortcuts:</b></p></td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p>--mirror</p></td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="21%"></td>
|
|
<td width="77%">
|
|
<p>&lt;URLs&gt; *make a mirror of site(s) (default)</p>
|
|
</td>
|
|
</table>
|
|
<!-- TABS -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="3" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="10%">
|
|
|
|
<p>--get</p>
|
|
</td>
|
|
<td width="77%">
|
|
|
|
<p>&lt;URLs&gt; get the files indicated, do not seek other
|
|
URLs (-qg)</p>
|
|
</td>
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="10%">
|
|
|
|
<p>--list</p>
|
|
</td>
|
|
<td width="77%">
|
|
|
|
<p>&lt;text file&gt; add all URLs located in this text file
|
|
(-%L)</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p>--mirrorlinks</p></td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="21%"></td>
|
|
<td width="77%">
|
|
<p>&lt;URLs&gt; mirror all links in 1st level pages (-Y)</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p>--testlinks</p></td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="21%"></td>
|
|
<td width="77%">
|
|
<p>&lt;URLs&gt; test links in pages (-r1p0C0I0t)</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p>--spider</p></td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="21%"></td>
|
|
<td width="77%">
|
|
<p>&lt;URLs&gt; spider site(s), to test links: reports
|
|
Errors &amp; Warnings (-p0C0I0t)</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p>--testsite</p></td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="21%"></td>
|
|
<td width="77%">
|
|
<p>&lt;URLs&gt; identical to --spider</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p>--skeleton</p></td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="21%"></td>
|
|
<td width="77%">
|
|
<p>&lt;URLs&gt; make a mirror, but get only html files
|
|
(-p1)</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p>--update</p></td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="21%"></td>
|
|
<td width="77%">
|
|
<p>update a mirror, without confirmation (-iC2)</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p>--continue</p></td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="21%"></td>
|
|
<td width="77%">
|
|
<p>continue a mirror, without confirmation (-iC1)</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p>--catchurl</p></td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="21%"></td>
|
|
<td width="77%">
|
|
<p>create a temporary proxy to capture a URL or a form post
|
|
URL</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p>--clean</p></td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="21%"></td>
|
|
<td width="77%">
|
|
<p>erase cache &amp; log files</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p>--http10</p></td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="21%"></td>
|
|
<td width="77%">
|
|
<p>force http/1.0 requests (-%h)</p>
|
|
</td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="4%"></td>
|
|
<td width="95%">
|
|
<p><b>Details: Option %W: External callback
|
|
prototypes</b></p></td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="4%"></td>
|
|
<td width="95%">
|
|
<p><b>see htsdefines.h</b></p></td>
|
|
</table>
|
|
<a name="FILES"></a>
|
|
<h2>FILES</h2>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p><i>/etc/httrack.conf</i></p></td>
|
|
</table>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="20%"></td>
|
|
<td width="79%">
|
|
<p>The system wide configuration file.</p>
|
|
</td>
|
|
</table>
|
|
<a name="ENVIRONMENT"></a>
|
|
<h2>ENVIRONMENT</h2>
|
|
<!-- TABS -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="4" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="11%"></td>
|
|
<td width="5%">
|
|
|
|
<p>HOME</p>
|
|
</td>
|
|
<td width="4%"></td>
|
|
<td width="77%">
|
|
|
|
<p>Is used if /etc/httrack.conf defines the
|
|
line <i>path ~/websites/#</i></p>
|
|
</td>
|
|
</table>
|
|
<a name="DIAGNOSTICS"></a>
|
|
<h2>DIAGNOSTICS</h2>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p>Errors/Warnings are reported to <i>hts-log.txt</i> by
|
|
default, or to stderr if the <i>-v</i> option was
|
|
specified.</p>
|
|
</td>
|
|
</table>
|
|
<a name="LIMITS"></a>
|
|
<h2>LIMITS</h2>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p>These are the principal limits of HTTrack at the
|
|
moment. Note that we have not heard of any other utility
|
|
that would have solved them.</p>
|
|
<!-- INDENTATION -->
|
|
<p><small>- Several scripts generating complex filenames may
|
|
not find them (ex:
|
|
img.src='image'+a+Mobj.dst+'.gif')</small></p>
|
|
<!-- INDENTATION -->
|
|
<p><small>- Some java classes may not find some files on
|
|
them (class included)</small></p>
|
|
<!-- INDENTATION -->
|
|
<p><small>- Cgi-bin links may not work properly in some
|
|
cases (parameters needed). To avoid them: use filters like
|
|
-*cgi-bin*</small></p>
|
|
</td>
|
|
</table>
|
|
<a name="BUGS"></a>
|
|
<h2>BUGS</h2>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p>Please report bugs to <b>&lt;bugs@httrack.com&gt;.</b>
|
|
Include a complete, self-contained example that will allow
|
|
the bug to be reproduced, and say which version of httrack
|
|
you are using. Do not forget to detail options used, OS
|
|
version, and any other information you deem necessary.</p>
|
|
</td>
|
|
</table>
|
|
<a name="COPYRIGHT"></a>
|
|
<h2>COPYRIGHT</h2>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p>Copyright (C) Xavier Roche and other contributors</p>
|
|
<!-- INDENTATION -->
|
|
<p>This program is free software; you can redistribute it
|
|
and/or modify it under the terms of the GNU General Public
|
|
License as published by the Free Software Foundation; either
|
|
version 2 of the License, or any later version.</p>
|
|
<!-- INDENTATION -->
|
|
<p>This program is distributed in the hope that it will be
|
|
useful, but WITHOUT ANY WARRANTY; without even the implied
|
|
warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR
|
|
PURPOSE. See the GNU General Public License for more
|
|
details.</p>
|
|
<!-- INDENTATION -->
|
|
<p>You should have received a copy of the GNU General Public
|
|
License along with this program; if not, write to the Free
|
|
Software Foundation, Inc., 59 Temple Place - Suite 330,
|
|
Boston, MA 02111-1307, USA.</p>
|
|
</td>
|
|
</table>
|
|
<a name="AVAILABILITY"></a>
|
|
<h2>AVAILABILITY</h2>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p>The most recent released version of httrack can be found
|
|
at: <b>http://www.httrack.com</b></p>
|
|
</td>
|
|
</table>
|
|
<a name="AUTHOR"></a>
|
|
<h2>AUTHOR</h2>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p>Xavier Roche &lt;roche@httrack.com&gt;</p>
|
|
</td>
|
|
</table>
|
|
<a name="SEE ALSO"></a>
|
|
<h2>SEE ALSO</h2>
|
|
<!-- INDENTATION -->
|
|
<table width="100%" border=0 rules="none" frame="void"
|
|
cols="2" cellspacing="0" cellpadding="0">
|
|
<tr valign="top" align="left">
|
|
<td width="10%"></td>
|
|
<td width="89%">
|
|
<p>The <b>HTML</b> documentation (available online at
|
|
<b>http://www.httrack.com/html/</b> ) contains more detailed
|
|
information. Please also refer to the <b>httrack FAQ</b>
|
|
(available online at
|
|
<b>http://www.httrack.com/html/faq.html</b> )</p>
|
|
</td>
|
|
</table>
|
|
<hr>
|
|
</body>
|
|
</html>
|