diff options
Diffstat (limited to 'html/httrack.man.html')
-rw-r--r-- | html/httrack.man.html | 293 |
1 files changed, 254 insertions, 39 deletions
diff --git a/html/httrack.man.html b/html/httrack.man.html index 986954b..33701d1 100644 --- a/html/httrack.man.html +++ b/html/httrack.man.html @@ -24,7 +24,7 @@ <hr> <!-- Creator : groff version 1.17.2 --> -<!-- CreationDate: Sat Oct 11 09:14:41 2003 --> +<!-- CreationDate: Sat Jun 4 14:17:19 2005 --> <a name="NAME"></a> <h2>NAME</h2> <table width="100%" border=0 rules="none" frame="void" @@ -54,34 +54,36 @@ httrack - offline browser : copy websites to a local directory</td></table> --host-control[=N]</b> ] [ <b>-%P, --extended-parsing[=N]</b> ] [ <b>-n, --near</b> ] [ <b>-t, --test</b> ] [ <b>-%L, --list</b> ] [ <b>-%S, --urllist</b> -] [ <b>-NN, --structure[=N]</b> ] [ <b>-%M, ---mime-html[=N]</b> ] [ <b>-LN, --long-names[=N]</b> ] [ -<b>-KN, --keep-links[=N]</b> ] [ <b>-x, ---replace-external</b> ] [ <b>-%x, --disable-passwords</b> ] -[ <b>-%q, --include-query-string</b> ] [ <b>-o, ---generate-errors</b> ] [ <b>-X, --purge-old[=N]</b> ] [ -<b>-%p, --preserve</b> ] [ <b>-bN, --cookies[=N]</b> ] [ -<b>-u, --check-type[=N]</b> ] [ <b>-j, --parse-java[=N]</b> -] [ <b>-sN, --robots[=N]</b> ] [ <b>-%h, --http-10</b> ] [ -<b>-%k, --keep-alive</b> ] [ <b>-%B, --tolerant</b> ] [ -<b>-%s, --updatehack</b> ] [ <b>-%u, --urlhack</b> ] [ -<b>-%A, --assume</b> ] [ <b>-@iN, --protocol[=N]</b> ] [ -<b>-F, --user-agent</b> ] [ <b>-%F, --footer</b> ] [ <b>-%l, ---language</b> ] [ <b>-C, --cache[=N]</b> ] [ <b>-k, ---store-all-in-cache</b> ] [ <b>-%n, --do-not-recatch</b> ] -[ <b>-%v, --display</b> ] [ <b>-Q, --do-not-log</b> ] [ -<b>-q, --quiet</b> ] [ <b>-z, --extra-log</b> ] [ <b>-Z, ---debug-log</b> ] [ <b>-v, --verbose</b> ] [ <b>-f, ---file-log</b> ] [ <b>-f2, --single-log</b> ] [ <b>-I, ---index</b> ] [ <b>-%i, --build-top-index</b> ] [ <b>-%I, ---search-index</b> ] [ <b>-pN, --priority[=N]</b> ] [ <b>-S, ---stay-on-same-dir</b> ] [ <b>-D, --can-go-down</b> ] [ -<b>-U, --can-go-up</b> ] [ <b>-B, --can-go-up-and-down</b> ] -[ <b>-a, --stay-on-same-address</b> ] [ <b>-d, +] 
[ <b>-NN, --structure[=N]</b> ] [ <b>-%M, --mime-html</b> +] [ <b>-LN, --long-names[=N]</b> ] [ <b>-KN, +--keep-links[=N]</b> ] [ <b>-x, --replace-external</b> ] [ +<b>-%x, --disable-passwords</b> ] [ <b>-%q, +--include-query-string</b> ] [ <b>-o, --generate-errors</b> +] [ <b>-X, --purge-old[=N]</b> ] [ <b>-%p, --preserve</b> ] +[ <b>-bN, --cookies[=N]</b> ] [ <b>-u, --check-type[=N]</b> +] [ <b>-j, --parse-java[=N]</b> ] [ <b>-sN, --robots[=N]</b> +] [ <b>-%h, --http-10</b> ] [ <b>-%k, --keep-alive</b> ] [ +<b>-%B, --tolerant</b> ] [ <b>-%s, --updatehack</b> ] [ +<b>-%u, --urlhack</b> ] [ <b>-%A, --assume</b> ] [ <b>-@iN, +--protocol[=N]</b> ] [ <b>-F, --user-agent</b> ] [ <b>-%R, +--referer</b> ] [ <b>-%E, --from</b> ] [ <b>-%F, +--footer</b> ] [ <b>-%l, --language</b> ] [ <b>-C, +--cache[=N]</b> ] [ <b>-k, --store-all-in-cache</b> ] [ +<b>-%n, --do-not-recatch</b> ] [ <b>-%v, --display</b> ] [ +<b>-Q, --do-not-log</b> ] [ <b>-q, --quiet</b> ] [ <b>-z, +--extra-log</b> ] [ <b>-Z, --debug-log</b> ] [ <b>-v, +--verbose</b> ] [ <b>-f, --file-log</b> ] [ <b>-f2, +--single-log</b> ] [ <b>-I, --index</b> ] [ <b>-%i, +--build-top-index</b> ] [ <b>-%I, --search-index</b> ] [ +<b>-pN, --priority[=N]</b> ] [ <b>-S, --stay-on-same-dir</b> +] [ <b>-D, --can-go-down</b> ] [ <b>-U, --can-go-up</b> ] [ +<b>-B, --can-go-up-and-down</b> ] [ <b>-a, +--stay-on-same-address</b> ] [ <b>-d, --stay-on-same-domain</b> ] [ <b>-l, --stay-on-same-tld</b> ] [ <b>-e, --go-everywhere</b> ] [ <b>-%H, ---debug-headers</b> ] [ <b>-V, --userdef-cmd</b> ] [ <b>-%U, ---user</b> ] [ <b>-%W, --callback</b> ] [ <b>-K, +--debug-headers</b> ] [ <b>-%!, +--disable-security-limits</b> ] [ <b>-V, --userdef-cmd</b> ] +[ <b>-%U, --user</b> ] [ <b>-%W, --callback</b> ] [ <b>-K, --keep-links[=N]</b> ] [</td></table> <a name="DESCRIPTION"></a> <h2>DESCRIPTION</h2> @@ -120,7 +122,7 @@ site</td></table> <tr valign="top" align="left"> <td width="10%"></td><td width="90%"> <b>httrack www.someweb.com/bob/ 
www.anothertest.com/mike/ -+*.com/*.jpg</b></td></table> ++*.com/*.jpg -mime:application/*</b></td></table> <table width="100%" border=0 rules="none" frame="void" cols="2" cellspacing="0" cellpadding="0"> @@ -632,6 +634,21 @@ user defined structure (-N cols="2" cellspacing="0" cellpadding="0"> <tr valign="top" align="left"> <td width="10%"></td><td width="90%"> +-%N</td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" align="left"> +<td width="21%"></td><td width="79%"> +delayed type check, don't make any link test but wait for +files download to start instead (experimental) (%N0 don't +use, %N1 use for unknown extensions, * %N2 always +use)</td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" align="left"> +<td width="10%"></td><td width="90%"> -%M</td></table> <table width="100%" border=0 rules="none" frame="void" @@ -639,7 +656,7 @@ user defined structure (-N <tr valign="top" align="left"> <td width="21%"></td><td width="79%"> generate a RFC MIME-encapsulated full-archive (.mht) -(--mime-html[=N])</td></table> +(--mime-html)</td></table> <table width="100%" border=0 rules="none" frame="void" cols="2" cellspacing="0" cellpadding="0"> @@ -804,7 +821,8 @@ check document type if unknown (cgi,asp..) 
(u0 don t check, <tr valign="top" align="left"> <td width="21%"></td><td width="79%"> follow robots.txt and meta robots tags -(0=never,1=sometimes,* 2=always) (--robots[=N])</td></table> +(0=never,1=sometimes,* 2=always, 3=always (even strict +rules)) (--robots[=N])</td></table> <table width="100%" border=0 rules="none" frame="void" cols="2" cellspacing="0" cellpadding="0"> @@ -891,6 +909,19 @@ type (-%A php3,cgi=text/html;dat,bin=application/x-zip) cols="2" cellspacing="0" cellpadding="0"> <tr valign="top" align="left"> <td width="10%"></td><td width="90%"> +-can</td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" align="left"> +<td width="21%"></td><td width="79%"> +also be used to force a specific file type: --assume +foo.cgi=text/html</td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" align="left"> +<td width="10%"></td><td width="90%"> -@iN</td></table> <table width="100%" border=0 rules="none" frame="void" @@ -916,8 +947,34 @@ only) (--protocol[=N])</td></table> cols="2" cellspacing="0" cellpadding="0"> <tr valign="top" align="left"> <td width="21%"></td><td width="79%"> -user-agent field (-F "user-agent name") -(--user-agent <param>)</td></table> +user-agent field sent in HTTP headers (-F "user-agent +name") (--user-agent <param>)</td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" align="left"> +<td width="10%"></td><td width="90%"> +-%R</td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" align="left"> +<td width="21%"></td><td width="79%"> +default referer field sent in HTTP headers (--referer +<param>)</td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" 
align="left"> +<td width="10%"></td><td width="90%"> +-%E</td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" align="left"> +<td width="21%"></td><td width="79%"> +from email address sent in HTTP headers (--from +<param>)</td></table> <table width="100%" border=0 rules="none" frame="void" cols="2" cellspacing="0" cellpadding="0"> @@ -1003,7 +1060,7 @@ do not re-download locally erased files <tr valign="top" align="left"> <td width="21%"></td><td width="79%"> display on screen filenames downloaded (in realtime) - * %v1 -short version (--display)</td></table> +short version - %v2 full animation (--display)</td></table> <table width="100%" border=0 rules="none" frame="void" cols="2" cellspacing="0" cellpadding="0"> @@ -1354,6 +1411,30 @@ filter test (-#0 *.gif www.bar.com/foo.gif ) cols="2" cellspacing="0" cellpadding="0"> <tr valign="top" align="left"> <td width="10%"></td><td width="90%"> +-#1</td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" align="left"> +<td width="21%"></td><td width="79%"> +simplify test (-#1 ./foo/bar/../foobar)</td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" align="left"> +<td width="10%"></td><td width="90%"> +-#2</td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" align="left"> +<td width="21%"></td><td width="79%"> +type test (-#2 /foo/bar.php)</td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" align="left"> +<td width="10%"></td><td width="90%"> -#C</td></table> <table width="100%" border=0 rules="none" frame="void" @@ -1367,6 +1448,42 @@ cache list (-#C *.com/spider*.gif (--debug-cache cols="2" cellspacing="0" cellpadding="0"> <tr 
valign="top" align="left"> <td width="10%"></td><td width="90%"> +-#R</td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" align="left"> +<td width="21%"></td><td width="79%"> +cache repair (damaged cache) (--debug-oldftp)</td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" align="left"> +<td width="10%"></td><td width="90%"> +-#d</td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" align="left"> +<td width="21%"></td><td width="79%"> +debug parser (--debug-parsing)</td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" align="left"> +<td width="10%"></td><td width="90%"> +-#E</td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" align="left"> +<td width="21%"></td><td width="79%"> +extract new.zip cache meta-data in meta.zip</td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" align="left"> +<td width="10%"></td><td width="90%"> -#f</td></table> <table width="100%" border=0 rules="none" frame="void" @@ -1517,6 +1634,52 @@ execute a shell command (-#! 
"echo hello") (--exec cols="2" cellspacing="0" cellpadding="0"> <tr valign="top" align="left"> <td width="4%"></td><td width="96%"> +<b>Dangerous options: (do NOT use unless you exactly know +what you are doing)</b></td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" align="left"> +<td width="10%"></td><td width="90%"> +-%!</td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" align="left"> +<td width="21%"></td><td width="79%"> +bypass built-in security limits aimed to avoid bandwidth +abuses (bandwidth, simultaneous connections) +(--disable-security-limits)</td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" align="left"> +<td width="10%"></td><td width="90%"> +-IMPORTANT</td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" align="left"> +<td width="21%"></td><td width="79%"> +NOTE: DANGEROUS OPTION, ONLY SUITABLE FOR +EXPERTS</td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" align="left"> +<td width="10%"></td><td width="90%"> +-USE</td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" align="left"> +<td width="21%"></td><td width="79%"> +IT WITH EXTREME CARE</td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" align="left"> +<td width="4%"></td><td width="96%"> <b>Command-line specific options:</b></td></table> <table width="100%" border=0 rules="none" frame="void" @@ -1557,7 +1720,7 @@ smith) (--user <param>)</td></table> <tr valign="top" align="left"> <td width="21%"></td><td width="79%"> use an external 
library function as a wrapper (-%W -link-detected=foo.so:myfunction) (--callback +link-detected=foo.so:myfunction[,myparameters]) (--callback <param>)</td></table> <table width="100%" border=0 rules="none" frame="void" @@ -1834,11 +1997,12 @@ directory</td></table> file, including file type (ex: image.gif) %t File type (ex: gif) %p Path [without ending /] (ex: /someimages) %h Host name (ex: www.someweb.com) %M URL MD5 (128 bits, 32 ascii -bytes) %Q query string MD5 (128 bits, 32 ascii bytes) %q -small query string MD5 (16 bits, 4 ascii bytes) %s? Short -name version (ex: %sN) %[param] param variable in query -string %[param:before:after:notfound:empty] advanced -variable extraction</td></table> +bytes) %Q query string MD5 (128 bits, 32 ascii bytes) %r +protocol name (ex: http) %q small query string MD5 (16 bits, +4 ascii bytes) %s? Short name version (ex: %sN) %[param] +param variable in query string +%[param:before:after:notfound:empty] advanced variable +extraction</td></table> <table width="100%" border=0 rules="none" frame="void" cols="2" cellspacing="0" cellpadding="0"> @@ -2195,6 +2359,32 @@ opt);</b></td></table> cols="2" cellspacing="0" cellpadding="0"> <tr valign="top" align="left"> <td width="4%"></td><td width="96%"> +<b>preprocess-html : int (* myfunction)(char** html,int* +len,char* url</b></td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" align="left"> +<td width="10%"></td><td width="90%"> +adresse,char* url fichier);</td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" align="left"> +<td width="4%"></td><td width="96%"> +<b>postprocess-html : int (* myfunction)(char** html,int* +len,char* url</b></td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" align="left"> +<td width="10%"></td><td width="90%"> 
+adresse,char* url fichier);</td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" align="left"> +<td width="4%"></td><td width="96%"> <b>check-html : int (* myfunction)(char* html,int len,char* url</b></td></table> @@ -2270,6 +2460,19 @@ link);</b></td></table> cols="2" cellspacing="0" cellpadding="0"> <tr valign="top" align="left"> <td width="4%"></td><td width="96%"> +<b>link-detected2 : int (* myfunction)(char* link, char* +start</b></td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" align="left"> +<td width="10%"></td><td width="90%"> +tag);</td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" align="left"> +<td width="4%"></td><td width="96%"> <b>transfer-status : int (* myfunction)(lien</b></td></table> @@ -2291,6 +2494,18 @@ back* back);</td></table> <td width="10%"></td><td width="90%"> complete,char* fil complete,char* referer adr,char* referer fil,char* save);</td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" align="left"> +<td width="4%"></td><td width="96%"> +<b>And <wrappername></b></td></table> + +<table width="100%" border=0 rules="none" frame="void" + cols="2" cellspacing="0" cellpadding="0"> +<tr valign="top" align="left"> +<td width="10%"></td><td width="90%"> +init() functions if defined, called upon plug</td></table> <a name="FILES"></a> <h2>FILES</h2> |