urlHref.php
https://www.wlkl.ch/index.php from 0
- 12533 chars [HTTP/1.1 200 OK, Server: nginx, Date: Fri, 04 Apr 2025 12:12:15 GMT, Content-Type: text/html; charset=UTF-8, Connection: close, Expires: Tue, 01 Jan 2002 00:00:00 GMT, Cache-Control: no-store, no-cache, must-revalidate, X-Frame-Options: SAMEORIGIN, Content-Security-Policy: frame-ancestors 'self'; base-uri 'self'; object-src 'none';, X-XSS-Protection: 1; mode=block, Vary: Accept-Encoding, Strict-Transport-Security: max-age=63072000]
- 70
- already https://www.wlkl.ch/index.php
- queued https://www.wlkl.ch/index.php/Main/HomePage
- skipping https://www.wlkl.ch/index.php/Main/HomePage?action=edit
- skipping https://www.wlkl.ch/index.php/Main/HomePage?action=diff
- skipping https://www.wlkl.ch/index.php/Main/HomePage?action=print
- skipping https://www.wlkl.ch/index.php/Main/HomePage?action=search&q=link=Main.HomePage
- skipping https://www.wlkl.ch/index.php/Site/AllRecentChanges
- skipping https://www.wlkl.ch/index.php/Main/RecentChanges
- skipping #wikititle
- skipping #sideBarTrail
- skipping #sideBarGroup
- skipping #sideBarWalter
- skipping #wikifoot
- empty href #
- already https://www.wlkl.ch/index.php/Main/HomePage
- empty href #
- skipping https://www.wlkl.ch/index.php/Main/Menu?action=edit
- skipping #wikititle
- skipping #sideBarTrail
- skipping #sideBarGroup
- skipping #sideBarWalter
- skipping #wikifoot
- already https://www.wlkl.ch/index.php/Main/HomePage
- empty href #
- queued https://www.wlkl.ch/index.php/J/J
- queued https://www.wlkl.ch/index.php/J/All
- queued https://www.wlkl.ch/index.php/J/Jour
- queued https://www.wlkl.ch/index.php/CS/CS
- queued https://www.wlkl.ch/index.php/Climb/Climb
- queued https://www.wlkl.ch/index.php/Div/Div
- queued https://www.wlkl.ch/index.php/Inf/Inf
- queued https://www.wlkl.ch/index.php/Lit/Lit
- queued https://www.wlkl.ch/index.php/Math/Math
- queued https://www.wlkl.ch/index.php/My/My
- queued https://www.wlkl.ch/index.php/Main/Petri
- queued https://www.wlkl.ch/index.php/Pub/Pub
- queued https://www.wlkl.ch/index.php/Wk13/Wk13
- queued https://www.wlkl.ch/index.php/PmWiki/PmWiki
- queued https://www.wlkl.ch/index.php/Main/WikiSandbox
- queued https://www.wlkl.ch/index.php/PmWiki/BasicEditing
- queued https://www.wlkl.ch/index.php/PmWiki/DocumentationIndex
- skipping https://www.wlkl.ch/index.php/Site/SideBar?action=edit
- skipping #wikititle
- skipping #sideBarTrail
- skipping #sideBarGroup
- skipping #sideBarWalter
- skipping #wikifoot
- queued https://www.wlkl.ch/index.php/Main
- already https://www.wlkl.ch/index.php/Main/HomePage
- skipping mailto:wa@wlkl.ch
- queued https://www.wlkl.ch/index.php/Climb/Kletterprogramm25
- queued https://www.wlkl.ch/index.php/Climb/Bergsee25
- already https://www.wlkl.ch/index.php/Climb/Climb
- queued https://www.wlkl.ch/index.php/Climb/13Burghuette
- queued https://www.wlkl.ch/index.php/Climb/13Schmalstoeckli
- queued https://www.wlkl.ch/petri/index.html
- queued https://www.wlkl.ch/petri/petriNetsForRE.pdf
- queued https://www.wlkl.ch/petri/cdSlidesOverview/index.html
- queued https://www.wlkl.ch/petri/cdSlidesOverview.pdf
- queued https://www.wlkl.ch//petri/smalltalk/instruction.html
- queued https://www.wlkl.ch/myPdfs/fastCharacteristicPolynomial.pdf
- queued https://www.wlkl.ch/index.php/Inf/Wsh
- queued https://www.wlkl.ch/index.php/FF/Ecua13
- already https://www.wlkl.ch/index.php/Pub/Pub
- skipping https://www.spwallisellen.ch/positionen/2021/klimaschonend-heizen-ist-unsere-zukunft
- skipping https://www.spwallisellen.ch/positionen/2021/klimafreundlich-heizen-und-solarstrom-produzieren-lohnen-sich
- queued https://www.wlkl.ch/index.php/Pub/Pub#gnd
- skipping https://www.spwallisellen.ch/positionen/2020/noch-nicht-gruen-mit-der-gasversorgung
- already https://www.wlkl.ch/index.php/Main
- already https://www.wlkl.ch/index.php/Main/HomePage
https://www.wlkl.ch/index.php/Main/HomePage from [https://www.wlkl.ch/index.php]
- 12533 chars [HTTP/1.1 200 OK, Server: nginx, Date: Fri, 04 Apr 2025 12:12:15 GMT, Content-Type: text/html; charset=UTF-8, Connection: close, Expires: Tue, 01 Jan 2002 00:00:00 GMT, Cache-Control: no-store, no-cache, must-revalidate, X-Frame-Options: SAMEORIGIN, Content-Security-Policy: frame-ancestors 'self'; base-uri 'self'; object-src 'none';, X-XSS-Protection: 1; mode=block, Vary: Accept-Encoding, Strict-Transport-Security: max-age=63072000]
- 70
- already https://www.wlkl.ch/index.php
- already https://www.wlkl.ch/index.php/Main/HomePage
- skipping https://www.wlkl.ch/index.php/Main/HomePage?action=edit
- skipping https://www.wlkl.ch/index.php/Main/HomePage?action=diff
- skipping https://www.wlkl.ch/index.php/Main/HomePage?action=print
- skipping https://www.wlkl.ch/index.php/Main/HomePage?action=search&q=link=Main.HomePage
- skipping https://www.wlkl.ch/index.php/Site/AllRecentChanges
- skipping https://www.wlkl.ch/index.php/Main/RecentChanges
- skipping #wikititle
- skipping #sideBarTrail
- skipping #sideBarGroup
- skipping #sideBarWalter
- skipping #wikifoot
- empty href #
- already https://www.wlkl.ch/index.php/Main/HomePage
- empty href #
- skipping https://www.wlkl.ch/index.php/Main/Menu?action=edit
- skipping #wikititle
- skipping #sideBarTrail
- skipping #sideBarGroup
- skipping #sideBarWalter
- skipping #wikifoot
- already https://www.wlkl.ch/index.php/Main/HomePage
- empty href #
- already https://www.wlkl.ch/index.php/J/J
- already https://www.wlkl.ch/index.php/J/All
- already https://www.wlkl.ch/index.php/J/Jour
- already https://www.wlkl.ch/index.php/CS/CS
- already https://www.wlkl.ch/index.php/Climb/Climb
- already https://www.wlkl.ch/index.php/Div/Div
- already https://www.wlkl.ch/index.php/Inf/Inf
- already https://www.wlkl.ch/index.php/Lit/Lit
- already https://www.wlkl.ch/index.php/Math/Math
- already https://www.wlkl.ch/index.php/My/My
- already https://www.wlkl.ch/index.php/Main/Petri
- already https://www.wlkl.ch/index.php/Pub/Pub
- already https://www.wlkl.ch/index.php/Wk13/Wk13
- already https://www.wlkl.ch/index.php/PmWiki/PmWiki
- already https://www.wlkl.ch/index.php/Main/WikiSandbox
- already https://www.wlkl.ch/index.php/PmWiki/BasicEditing
- already https://www.wlkl.ch/index.php/PmWiki/DocumentationIndex
- skipping https://www.wlkl.ch/index.php/Site/SideBar?action=edit
- skipping #wikititle
- skipping #sideBarTrail
- skipping #sideBarGroup
- skipping #sideBarWalter
- skipping #wikifoot
- already https://www.wlkl.ch/index.php/Main
- already https://www.wlkl.ch/index.php/Main/HomePage
- skipping mailto:wa@wlkl.ch
- already https://www.wlkl.ch/index.php/Climb/Kletterprogramm25
- already https://www.wlkl.ch/index.php/Climb/Bergsee25
- already https://www.wlkl.ch/index.php/Climb/Climb
- already https://www.wlkl.ch/index.php/Climb/13Burghuette
- already https://www.wlkl.ch/index.php/Climb/13Schmalstoeckli
- already https://www.wlkl.ch/petri/index.html
- already https://www.wlkl.ch/petri/petriNetsForRE.pdf
- already https://www.wlkl.ch/petri/cdSlidesOverview/index.html
- already https://www.wlkl.ch/petri/cdSlidesOverview.pdf
- already https://www.wlkl.ch//petri/smalltalk/instruction.html
- already https://www.wlkl.ch/myPdfs/fastCharacteristicPolynomial.pdf
- already https://www.wlkl.ch/index.php/Inf/Wsh
- already https://www.wlkl.ch/index.php/FF/Ecua13
- already https://www.wlkl.ch/index.php/Pub/Pub
- skipping https://www.spwallisellen.ch/positionen/2021/klimaschonend-heizen-ist-unsere-zukunft
- skipping https://www.spwallisellen.ch/positionen/2021/klimafreundlich-heizen-und-solarstrom-produzieren-lohnen-sich
- already https://www.wlkl.ch/index.php/Pub/Pub#gnd
- skipping https://www.spwallisellen.ch/positionen/2020/noch-nicht-gruen-mit-der-gasversorgung
- already https://www.wlkl.ch/index.php/Main
- already https://www.wlkl.ch/index.php/Main/HomePage
https://www.wlkl.ch/index.php/J/J from [https://www.wlkl.ch/index.php]
- 8786 chars [HTTP/1.1 200 OK, Server: nginx, Date: Fri, 04 Apr 2025 12:12:16 GMT, Content-Type: text/html; charset=UTF-8, Connection: close, Expires: Tue, 01 Jan 2002 00:00:00 GMT, Cache-Control: no-store, no-cache, must-revalidate, X-Frame-Options: SAMEORIGIN, Content-Security-Policy: frame-ancestors 'self'; base-uri 'self'; object-src 'none';, X-XSS-Protection: 1; mode=block, Vary: Accept-Encoding, Strict-Transport-Security: max-age=63072000]
- 51
- already https://www.wlkl.ch/index.php
- already https://www.wlkl.ch/index.php/J/J
- skipping https://www.wlkl.ch/index.php/J/J?action=edit
- skipping https://www.wlkl.ch/index.php/J/J?action=diff
- skipping https://www.wlkl.ch/index.php/J/J?action=print
- skipping https://www.wlkl.ch/index.php/J/J?action=search&q=link=J.J
- skipping https://www.wlkl.ch/index.php/Site/AllRecentChanges
- skipping https://www.wlkl.ch/index.php/J/RecentChanges
- skipping #wikititle
- skipping #sideBarTrail
- skipping #sideBarGroup
- skipping #sideBarWalter
- skipping #wikifoot
- empty href #
- already https://www.wlkl.ch/index.php/J/J
- empty href #
- skipping https://www.wlkl.ch/index.php/J/Menu?action=edit
- skipping #wikititle
- skipping #sideBarTrail
- skipping #sideBarGroup
- skipping #sideBarWalter
- skipping #wikifoot
- already https://www.wlkl.ch/index.php/Main/HomePage
- empty href #
- already https://www.wlkl.ch/index.php/J/J
- already https://www.wlkl.ch/index.php/J/All
- already https://www.wlkl.ch/index.php/J/Jour
- already https://www.wlkl.ch/index.php/CS/CS
- already https://www.wlkl.ch/index.php/Climb/Climb
- already https://www.wlkl.ch/index.php/Div/Div
- already https://www.wlkl.ch/index.php/Inf/Inf
- already https://www.wlkl.ch/index.php/Lit/Lit
- already https://www.wlkl.ch/index.php/Math/Math
- already https://www.wlkl.ch/index.php/My/My
- already https://www.wlkl.ch/index.php/Main/Petri
- already https://www.wlkl.ch/index.php/Pub/Pub
- already https://www.wlkl.ch/index.php/Wk13/Wk13
- already https://www.wlkl.ch/index.php/PmWiki/PmWiki
- already https://www.wlkl.ch/index.php/Main/WikiSandbox
- already https://www.wlkl.ch/index.php/PmWiki/BasicEditing
- already https://www.wlkl.ch/index.php/PmWiki/DocumentationIndex
- skipping https://www.wlkl.ch/index.php/Site/SideBar?action=edit
- skipping #wikititle
- skipping #sideBarTrail
- skipping #sideBarGroup
- skipping #sideBarWalter
- skipping #wikifoot
- queued https://www.wlkl.ch/index.php/J
- already https://www.wlkl.ch/index.php/J/J
- already https://www.wlkl.ch/index.php/J
- already https://www.wlkl.ch/index.php/J/J
https://www.wlkl.ch/index.php/J/All from [https://www.wlkl.ch/index.php]
- 8811 chars [HTTP/1.1 200 OK, Server: nginx, Date: Fri, 04 Apr 2025 12:12:16 GMT, Content-Type: text/html; charset=UTF-8, Connection: close, Expires: Tue, 01 Jan 2002 00:00:00 GMT, Cache-Control: no-store, no-cache, must-revalidate, X-Frame-Options: SAMEORIGIN, Content-Security-Policy: frame-ancestors 'self'; base-uri 'self'; object-src 'none';, X-XSS-Protection: 1; mode=block, Vary: Accept-Encoding, Strict-Transport-Security: max-age=63072000]
- 51
- already https://www.wlkl.ch/index.php
- already https://www.wlkl.ch/index.php/J/All
- skipping https://www.wlkl.ch/index.php/J/All?action=edit
- skipping https://www.wlkl.ch/index.php/J/All?action=diff
- skipping https://www.wlkl.ch/index.php/J/All?action=print
- skipping https://www.wlkl.ch/index.php/J/All?action=search&q=link=J.All
- skipping https://www.wlkl.ch/index.php/Site/AllRecentChanges
- skipping https://www.wlkl.ch/index.php/J/RecentChanges
- skipping #wikititle
- skipping #sideBarTrail
- skipping #sideBarGroup
- skipping #sideBarWalter
- skipping #wikifoot
- empty href #
- already https://www.wlkl.ch/index.php/J/J
- empty href #
- skipping https://www.wlkl.ch/index.php/J/Menu?action=edit
- skipping #wikititle
- skipping #sideBarTrail
- skipping #sideBarGroup
- skipping #sideBarWalter
- skipping #wikifoot
- already https://www.wlkl.ch/index.php/Main/HomePage
- empty href #
- already https://www.wlkl.ch/index.php/J/J
- already https://www.wlkl.ch/index.php/J/All
- already https://www.wlkl.ch/index.php/J/Jour
- already https://www.wlkl.ch/index.php/CS/CS
- already https://www.wlkl.ch/index.php/Climb/Climb
- already https://www.wlkl.ch/index.php/Div/Div
- already https://www.wlkl.ch/index.php/Inf/Inf
- already https://www.wlkl.ch/index.php/Lit/Lit
- already https://www.wlkl.ch/index.php/Math/Math
- already https://www.wlkl.ch/index.php/My/My
- already https://www.wlkl.ch/index.php/Main/Petri
- already https://www.wlkl.ch/index.php/Pub/Pub
- already https://www.wlkl.ch/index.php/Wk13/Wk13
- already https://www.wlkl.ch/index.php/PmWiki/PmWiki
- already https://www.wlkl.ch/index.php/Main/WikiSandbox
- already https://www.wlkl.ch/index.php/PmWiki/BasicEditing
- already https://www.wlkl.ch/index.php/PmWiki/DocumentationIndex
- skipping https://www.wlkl.ch/index.php/Site/SideBar?action=edit
- skipping #wikititle
- skipping #sideBarTrail
- skipping #sideBarGroup
- skipping #sideBarWalter
- skipping #wikifoot
- already https://www.wlkl.ch/index.php/J
- already https://www.wlkl.ch/index.php/J/All
- already https://www.wlkl.ch/index.php/J
- already https://www.wlkl.ch/index.php/J/All
https://www.wlkl.ch/index.php/J/Jour from [https://www.wlkl.ch/index.php]
- 8837 chars [HTTP/1.1 200 OK, Server: nginx, Date: Fri, 04 Apr 2025 12:12:17 GMT, Content-Type: text/html; charset=UTF-8, Connection: close, Expires: Tue, 01 Jan 2002 00:00:00 GMT, Cache-Control: no-store, no-cache, must-revalidate, X-Frame-Options: SAMEORIGIN, Content-Security-Policy: frame-ancestors 'self'; base-uri 'self'; object-src 'none';, X-XSS-Protection: 1; mode=block, Vary: Accept-Encoding, Strict-Transport-Security: max-age=63072000]
- 51
- already https://www.wlkl.ch/index.php
- already https://www.wlkl.ch/index.php/J/Jour
- skipping https://www.wlkl.ch/index.php/J/Jour?action=edit
- skipping https://www.wlkl.ch/index.php/J/Jour?action=diff
- skipping https://www.wlkl.ch/index.php/J/Jour?action=print
- skipping https://www.wlkl.ch/index.php/J/Jour?action=search&q=link=J.Jour
- skipping https://www.wlkl.ch/index.php/Site/AllRecentChanges
- skipping https://www.wlkl.ch/index.php/J/RecentChanges
- skipping #wikititle
- skipping #sideBarTrail
- skipping #sideBarGroup
- skipping #sideBarWalter
- skipping #wikifoot
- empty href #
- already https://www.wlkl.ch/index.php/J/J
- empty href #
- skipping https://www.wlkl.ch/index.php/J/Menu?action=edit
- skipping #wikititle
- skipping #sideBarTrail
- skipping #sideBarGroup
- skipping #sideBarWalter
- skipping #wikifoot
- already https://www.wlkl.ch/index.php/Main/HomePage
- empty href #
- already https://www.wlkl.ch/index.php/J/J
- already https://www.wlkl.ch/index.php/J/All
- already https://www.wlkl.ch/index.php/J/Jour
- already https://www.wlkl.ch/index.php/CS/CS
- already https://www.wlkl.ch/index.php/Climb/Climb
- already https://www.wlkl.ch/index.php/Div/Div
- already https://www.wlkl.ch/index.php/Inf/Inf
- already https://www.wlkl.ch/index.php/Lit/Lit
- already https://www.wlkl.ch/index.php/Math/Math
- already https://www.wlkl.ch/index.php/My/My
- already https://www.wlkl.ch/index.php/Main/Petri
- already https://www.wlkl.ch/index.php/Pub/Pub
- already https://www.wlkl.ch/index.php/Wk13/Wk13
- already https://www.wlkl.ch/index.php/PmWiki/PmWiki
- already https://www.wlkl.ch/index.php/Main/WikiSandbox
- already https://www.wlkl.ch/index.php/PmWiki/BasicEditing
- already https://www.wlkl.ch/index.php/PmWiki/DocumentationIndex
- skipping https://www.wlkl.ch/index.php/Site/SideBar?action=edit
- skipping #wikititle
- skipping #sideBarTrail
- skipping #sideBarGroup
- skipping #sideBarWalter
- skipping #wikifoot
- already https://www.wlkl.ch/index.php/J
- already https://www.wlkl.ch/index.php/J/Jour
- already https://www.wlkl.ch/index.php/J
- already https://www.wlkl.ch/index.php/J/Jour
5 pages, 2.682e+0 ela, 2.679e+0 get, 2.374e-3 parse , queue 34
End urlHref.php
args
urlHref.php
/home/ch45859/web/wlkl.ch/public_html/inf/php/urlHref.php
*** code does not have a span berfore first <br>***<?php
/*******************************************************************************
urlHref.php: read url, analyze HTML for <a href
loop
read an url (i.e. stream) from queue
parse it as HTML: DOMDocument::loadHTML
find all <a href=
queue these href-url,
if they conform (e.g. same host, no query ....) and not already queued
report stats and times used
problems:
could not get Connection: keep-alive (not a stream option?)
we get HTTP/1.1 404 Not Found, and not create page as in firefox
*******************************************************************************/
require_once('env.php');    // presumably supplies the out*() reporting helpers used below -- confirm
outBegin(basename(__file__));

$mtS = microtime(1);        // start of the whole run, for the elapsed-time stat
$mtG = $mtP = 0;            // accumulated seconds spent in GET resp. in HTML parsing

# $u0 = 'https://localhost';    // alternative root for local testing
$u0 = 'https://www.wlkl.ch';

// Only URLs below $u0 are followed: no query string, nothing containing "RecentChan".
// $u0 is quoted so that the dots of the host name match literally and a
// look-alike host cannot slip through the same-host filter.
$uMsk = '%^' . preg_quote($u0, '%') . '/(?!.*RecentChan)[^?]+$%';

$maxPages = 5;              // upper bound on the number of pages fetched per run
$que = ["$u0/index.php"];   // work queue, processed in insertion order
$u2f = [$que[0] => 0];      // url => where it was found (0 for the start url); doubles as "seen" set

# $ctx = stream_context_set_default(['https' => ['method'=>'GET', 'header' => ['Connection: keep-alive']]]);
# $a2strLevel=4;
# out('context', stream_context_get_params($ctx));

for ($wx = 0; $wx < count($que) and $wx < $maxPages; $wx++) {
    $url = $que[$wx];
    out($url, 'from', $u2f[$url] ?? '-');
    outOL();

    // --- fetch -------------------------------------------------------------
    error_clear_last();
    $mtG -= microtime(1);
    $h = @file_get_contents($url);
    $mtG += microtime(1);
    if (false === $h) {
        outOLEnd("bad get in $url from", $u2f[$url], error_get_last());
        continue;
    }
    outLi(strlen($h), "chars", $http_response_header);

    // --- parse -------------------------------------------------------------
    $mtP -= microtime(1);
    $d = new DOMDocument();
    error_clear_last();
    // Check the result of loadHTML(): $d itself is an object and never false.
    // An empty body is rejected up front because loadHTML('') throws a
    // ValueError on PHP 8 instead of returning false.
    $loaded = '' !== $h && @$d->loadHTML($h);
    $mtP += microtime(1);
    if (! $loaded) {
        outOLEnd("bad html in $url from", $u2f[$url], ", html $h", error_get_last());
        continue;
    }

    // --- collect links -----------------------------------------------------
    $aL = $d->getElementsByTagName('a');
    outLi(count($aL), '<a...>');
    foreach ($aL as $a) {
        $href = $a->getAttribute('href');
        if ('' === $href) {
            // getAttribute() yields '' for a missing attribute; a strict test
            // keeps a literal href="0" from being reported as empty
            outLi("empty href # " . $d->saveHTML($a));
            continue;
        }
        if (! preg_match($uMsk, $href)) {
            outLi("skipping $href");
            continue;
        }
        // A fragment addresses a position inside the same document, so drop it
        // before de-duplicating; otherwise page and page#anchor are both crawled.
        $page = explode('#', $href, 2)[0];
        if (isset($u2f[$page])) {
            outLi("already $href");
            continue;
        }
        outLi("queued $page");
        $u2f[$page] = [$url];
        $que[] = $page;
    }
    outOLEnd();
}

out("$wx pages,", sprintf('%9.3e ela, %9.3e get, %9.3e parse', microtime(1) - $mtS, $mtG, $mtP), ", queue", count($que));
outEnd(__FILE__);
?>