summary refs log tree commit diff
path: root/html/httrack.man.html
diff options
context:
space:
mode:
Diffstat (limited to 'html/httrack.man.html')
-rw-r--r-- html/httrack.man.html 293
1 files changed, 254 insertions, 39 deletions
diff --git a/html/httrack.man.html b/html/httrack.man.html
index 986954b..33701d1 100644
--- a/html/httrack.man.html
+++ b/html/httrack.man.html
@@ -24,7 +24,7 @@
<hr>
<!-- Creator : groff version 1.17.2 -->
-<!-- CreationDate: Sat Oct 11 09:14:41 2003 -->
+<!-- CreationDate: Sat Jun 4 14:17:19 2005 -->
<a name="NAME"></a>
<h2>NAME</h2>
<table width="100%" border=0 rules="none" frame="void"
@@ -54,34 +54,36 @@ httrack - offline browser : copy websites to a local directory</td></table>
--host-control[=N]</b> ] [ <b>-%P,
--extended-parsing[=N]</b> ] [ <b>-n, --near</b> ] [ <b>-t,
--test</b> ] [ <b>-%L, --list</b> ] [ <b>-%S, --urllist</b>
-] [ <b>-NN, --structure[=N]</b> ] [ <b>-%M,
---mime-html[=N]</b> ] [ <b>-LN, --long-names[=N]</b> ] [
-<b>-KN, --keep-links[=N]</b> ] [ <b>-x,
---replace-external</b> ] [ <b>-%x, --disable-passwords</b> ]
-[ <b>-%q, --include-query-string</b> ] [ <b>-o,
---generate-errors</b> ] [ <b>-X, --purge-old[=N]</b> ] [
-<b>-%p, --preserve</b> ] [ <b>-bN, --cookies[=N]</b> ] [
-<b>-u, --check-type[=N]</b> ] [ <b>-j, --parse-java[=N]</b>
-] [ <b>-sN, --robots[=N]</b> ] [ <b>-%h, --http-10</b> ] [
-<b>-%k, --keep-alive</b> ] [ <b>-%B, --tolerant</b> ] [
-<b>-%s, --updatehack</b> ] [ <b>-%u, --urlhack</b> ] [
-<b>-%A, --assume</b> ] [ <b>-@iN, --protocol[=N]</b> ] [
-<b>-F, --user-agent</b> ] [ <b>-%F, --footer</b> ] [ <b>-%l,
---language</b> ] [ <b>-C, --cache[=N]</b> ] [ <b>-k,
---store-all-in-cache</b> ] [ <b>-%n, --do-not-recatch</b> ]
-[ <b>-%v, --display</b> ] [ <b>-Q, --do-not-log</b> ] [
-<b>-q, --quiet</b> ] [ <b>-z, --extra-log</b> ] [ <b>-Z,
---debug-log</b> ] [ <b>-v, --verbose</b> ] [ <b>-f,
---file-log</b> ] [ <b>-f2, --single-log</b> ] [ <b>-I,
---index</b> ] [ <b>-%i, --build-top-index</b> ] [ <b>-%I,
---search-index</b> ] [ <b>-pN, --priority[=N]</b> ] [ <b>-S,
---stay-on-same-dir</b> ] [ <b>-D, --can-go-down</b> ] [
-<b>-U, --can-go-up</b> ] [ <b>-B, --can-go-up-and-down</b> ]
-[ <b>-a, --stay-on-same-address</b> ] [ <b>-d,
+] [ <b>-NN, --structure[=N]</b> ] [ <b>-%M, --mime-html</b>
+] [ <b>-LN, --long-names[=N]</b> ] [ <b>-KN,
+--keep-links[=N]</b> ] [ <b>-x, --replace-external</b> ] [
+<b>-%x, --disable-passwords</b> ] [ <b>-%q,
+--include-query-string</b> ] [ <b>-o, --generate-errors</b>
+] [ <b>-X, --purge-old[=N]</b> ] [ <b>-%p, --preserve</b> ]
+[ <b>-bN, --cookies[=N]</b> ] [ <b>-u, --check-type[=N]</b>
+] [ <b>-j, --parse-java[=N]</b> ] [ <b>-sN, --robots[=N]</b>
+] [ <b>-%h, --http-10</b> ] [ <b>-%k, --keep-alive</b> ] [
+<b>-%B, --tolerant</b> ] [ <b>-%s, --updatehack</b> ] [
+<b>-%u, --urlhack</b> ] [ <b>-%A, --assume</b> ] [ <b>-@iN,
+--protocol[=N]</b> ] [ <b>-F, --user-agent</b> ] [ <b>-%R,
+--referer</b> ] [ <b>-%E, --from</b> ] [ <b>-%F,
+--footer</b> ] [ <b>-%l, --language</b> ] [ <b>-C,
+--cache[=N]</b> ] [ <b>-k, --store-all-in-cache</b> ] [
+<b>-%n, --do-not-recatch</b> ] [ <b>-%v, --display</b> ] [
+<b>-Q, --do-not-log</b> ] [ <b>-q, --quiet</b> ] [ <b>-z,
+--extra-log</b> ] [ <b>-Z, --debug-log</b> ] [ <b>-v,
+--verbose</b> ] [ <b>-f, --file-log</b> ] [ <b>-f2,
+--single-log</b> ] [ <b>-I, --index</b> ] [ <b>-%i,
+--build-top-index</b> ] [ <b>-%I, --search-index</b> ] [
+<b>-pN, --priority[=N]</b> ] [ <b>-S, --stay-on-same-dir</b>
+] [ <b>-D, --can-go-down</b> ] [ <b>-U, --can-go-up</b> ] [
+<b>-B, --can-go-up-and-down</b> ] [ <b>-a,
+--stay-on-same-address</b> ] [ <b>-d,
--stay-on-same-domain</b> ] [ <b>-l, --stay-on-same-tld</b>
] [ <b>-e, --go-everywhere</b> ] [ <b>-%H,
---debug-headers</b> ] [ <b>-V, --userdef-cmd</b> ] [ <b>-%U,
---user</b> ] [ <b>-%W, --callback</b> ] [ <b>-K,
+--debug-headers</b> ] [ <b>-%!,
+--disable-security-limits</b> ] [ <b>-V, --userdef-cmd</b> ]
+[ <b>-%U, --user</b> ] [ <b>-%W, --callback</b> ] [ <b>-K,
--keep-links[=N]</b> ] [</td></table>
<a name="DESCRIPTION"></a>
<h2>DESCRIPTION</h2>
@@ -120,7 +122,7 @@ site</td></table>
<tr valign="top" align="left">
<td width="10%"></td><td width="90%">
<b>httrack www.someweb.com/bob/ www.anothertest.com/mike/
-+*.com/*.jpg</b></td></table>
++*.com/*.jpg -mime:application/*</b></td></table>
<table width="100%" border=0 rules="none" frame="void"
cols="2" cellspacing="0" cellpadding="0">
@@ -632,6 +634,21 @@ user defined structure (-N
cols="2" cellspacing="0" cellpadding="0">
<tr valign="top" align="left">
<td width="10%"></td><td width="90%">
+-%N</td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="21%"></td><td width="79%">
+delayed type check, don't make any link test but wait for
+files download to start instead (experimental) (%N0 don't
+use, %N1 use for unknown extensions, * %N2 always
+use)</td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="10%"></td><td width="90%">
-%M</td></table>
<table width="100%" border=0 rules="none" frame="void"
@@ -639,7 +656,7 @@ user defined structure (-N
<tr valign="top" align="left">
<td width="21%"></td><td width="79%">
generate a RFC MIME-encapsulated full-archive (.mht)
-(--mime-html[=N])</td></table>
+(--mime-html)</td></table>
<table width="100%" border=0 rules="none" frame="void"
cols="2" cellspacing="0" cellpadding="0">
@@ -804,7 +821,8 @@ check document type if unknown (cgi,asp..) (u0 don t check,
<tr valign="top" align="left">
<td width="21%"></td><td width="79%">
follow robots.txt and meta robots tags
-(0=never,1=sometimes,* 2=always) (--robots[=N])</td></table>
+(0=never,1=sometimes,* 2=always, 3=always (even strict
+rules)) (--robots[=N])</td></table>
<table width="100%" border=0 rules="none" frame="void"
cols="2" cellspacing="0" cellpadding="0">
@@ -891,6 +909,19 @@ type (-%A php3,cgi=text/html;dat,bin=application/x-zip)
cols="2" cellspacing="0" cellpadding="0">
<tr valign="top" align="left">
<td width="10%"></td><td width="90%">
+-can</td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="21%"></td><td width="79%">
+also be used to force a specific file type: --assume
+foo.cgi=text/html</td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="10%"></td><td width="90%">
-@iN</td></table>
<table width="100%" border=0 rules="none" frame="void"
@@ -916,8 +947,34 @@ only) (--protocol[=N])</td></table>
cols="2" cellspacing="0" cellpadding="0">
<tr valign="top" align="left">
<td width="21%"></td><td width="79%">
-user-agent field (-F &quot;user-agent name&quot;)
-(--user-agent &lt;param&gt;)</td></table>
+user-agent field sent in HTTP headers (-F &quot;user-agent
+name&quot;) (--user-agent &lt;param&gt;)</td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="10%"></td><td width="90%">
+-%R</td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="21%"></td><td width="79%">
+default referer field sent in HTTP headers (--referer
+&lt;param&gt;)</td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="10%"></td><td width="90%">
+-%E</td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="21%"></td><td width="79%">
+from email address sent in HTTP headers (--from
+&lt;param&gt;)</td></table>
<table width="100%" border=0 rules="none" frame="void"
cols="2" cellspacing="0" cellpadding="0">
@@ -1003,7 +1060,7 @@ do not re-download locally erased files
<tr valign="top" align="left">
<td width="21%"></td><td width="79%">
display on screen filenames downloaded (in realtime) - * %v1
-short version (--display)</td></table>
+short version - %v2 full animation (--display)</td></table>
<table width="100%" border=0 rules="none" frame="void"
cols="2" cellspacing="0" cellpadding="0">
@@ -1354,6 +1411,30 @@ filter test (-#0 *.gif www.bar.com/foo.gif )
cols="2" cellspacing="0" cellpadding="0">
<tr valign="top" align="left">
<td width="10%"></td><td width="90%">
+-#1</td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="21%"></td><td width="79%">
+simplify test (-#1 ./foo/bar/../foobar)</td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="10%"></td><td width="90%">
+-#2</td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="21%"></td><td width="79%">
+type test (-#2 /foo/bar.php)</td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="10%"></td><td width="90%">
-#C</td></table>
<table width="100%" border=0 rules="none" frame="void"
@@ -1367,6 +1448,42 @@ cache list (-#C *.com/spider*.gif (--debug-cache
cols="2" cellspacing="0" cellpadding="0">
<tr valign="top" align="left">
<td width="10%"></td><td width="90%">
+-#R</td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="21%"></td><td width="79%">
+cache repair (damaged cache) (--debug-oldftp)</td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="10%"></td><td width="90%">
+-#d</td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="21%"></td><td width="79%">
+debug parser (--debug-parsing)</td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="10%"></td><td width="90%">
+-#E</td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="21%"></td><td width="79%">
+extract new.zip cache meta-data in meta.zip</td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="10%"></td><td width="90%">
-#f</td></table>
<table width="100%" border=0 rules="none" frame="void"
@@ -1517,6 +1634,52 @@ execute a shell command (-#! &quot;echo hello&quot;) (--exec
cols="2" cellspacing="0" cellpadding="0">
<tr valign="top" align="left">
<td width="4%"></td><td width="96%">
+<b>Dangerous options: (do NOT use unless you know exactly
+what you are doing)</b></td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="10%"></td><td width="90%">
+-%!</td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="21%"></td><td width="79%">
+bypass built-in security limits aimed to avoid bandwidth
+abuses (bandwidth, simultaneous connections)
+(--disable-security-limits)</td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="10%"></td><td width="90%">
+-IMPORTANT</td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="21%"></td><td width="79%">
+NOTE: DANGEROUS OPTION, ONLY SUITABLE FOR
+EXPERTS</td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="10%"></td><td width="90%">
+-USE</td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="21%"></td><td width="79%">
+IT WITH EXTREME CARE</td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="4%"></td><td width="96%">
<b>Command-line specific options:</b></td></table>
<table width="100%" border=0 rules="none" frame="void"
@@ -1557,7 +1720,7 @@ smith) (--user &lt;param&gt;)</td></table>
<tr valign="top" align="left">
<td width="21%"></td><td width="79%">
use an external library function as a wrapper (-%W
-link-detected=foo.so:myfunction) (--callback
+link-detected=foo.so:myfunction[,myparameters]) (--callback
&lt;param&gt;)</td></table>
<table width="100%" border=0 rules="none" frame="void"
@@ -1834,11 +1997,12 @@ directory</td></table>
file, including file type (ex: image.gif) %t File type (ex:
gif) %p Path [without ending /] (ex: /someimages) %h Host
name (ex: www.someweb.com) %M URL MD5 (128 bits, 32 ascii
-bytes) %Q query string MD5 (128 bits, 32 ascii bytes) %q
-small query string MD5 (16 bits, 4 ascii bytes) %s? Short
-name version (ex: %sN) %[param] param variable in query
-string %[param:before:after:notfound:empty] advanced
-variable extraction</td></table>
+bytes) %Q query string MD5 (128 bits, 32 ascii bytes) %r
+protocol name (ex: http) %q small query string MD5 (16 bits,
+4 ascii bytes) %s? Short name version (ex: %sN) %[param]
+param variable in query string
+%[param:before:after:notfound:empty] advanced variable
+extraction</td></table>
<table width="100%" border=0 rules="none" frame="void"
cols="2" cellspacing="0" cellpadding="0">
@@ -2195,6 +2359,32 @@ opt);</b></td></table>
cols="2" cellspacing="0" cellpadding="0">
<tr valign="top" align="left">
<td width="4%"></td><td width="96%">
+<b>preprocess-html : int (* myfunction)(char** html,int*
+len,char* url</b></td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="10%"></td><td width="90%">
+adresse,char* url fichier);</td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="4%"></td><td width="96%">
+<b>postprocess-html : int (* myfunction)(char** html,int*
+len,char* url</b></td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="10%"></td><td width="90%">
+adresse,char* url fichier);</td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="4%"></td><td width="96%">
<b>check-html : int (* myfunction)(char* html,int len,char*
url</b></td></table>
@@ -2270,6 +2460,19 @@ link);</b></td></table>
cols="2" cellspacing="0" cellpadding="0">
<tr valign="top" align="left">
<td width="4%"></td><td width="96%">
+<b>link-detected2 : int (* myfunction)(char* link, char*
+start</b></td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="10%"></td><td width="90%">
+tag);</td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="4%"></td><td width="96%">
<b>transfer-status : int (*
myfunction)(lien</b></td></table>
@@ -2291,6 +2494,18 @@ back* back);</td></table>
<td width="10%"></td><td width="90%">
complete,char* fil complete,char* referer adr,char* referer
fil,char* save);</td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="4%"></td><td width="96%">
+<b>And &lt;wrappername&gt;</b></td></table>
+
+<table width="100%" border=0 rules="none" frame="void"
+ cols="2" cellspacing="0" cellpadding="0">
+<tr valign="top" align="left">
+<td width="10%"></td><td width="90%">
+init() functions if defined, called upon plug</td></table>
<a name="FILES"></a>
<h2>FILES</h2>