...

View Full Version : here is free link checker code! tested



kab_184
11-28-2003, 12:07 PM
HI

Here is PHP code to check whatever links you want, online or offline, internal or external. Try it on a site such as www.yahoo.com and it will validate the links it finds. It is free and fast.





<div class="mainblockcent">
<h1>Link Checker</h1>
<?
// Human-readable descriptions for every status value shown in the result
// tables: the checker's own pseudo-codes plus the numeric HTTP status codes.
// The table is assigned in a single statement with quoted keys, so it does not
// depend on bare-word constants and cannot inherit a pre-existing $text value.
$text = array(
    // Pseudo-codes produced by check() for links that get no HTTP status.
    'N/A'   => "Ikke HTTP",        // neither an http:// nor a mailto: link
    'OK'    => "Valid hostname",   // mailto: host has an MX record
    'FEJL'  => "Invalid hostname", // legacy key, kept for backward compatibility
    'ERROR' => "Invalid hostname", // value check() returns when the MX lookup fails
    'Død'   => "No response",      // socket could not be opened

    // 1xx
    100 => "Continue",
    101 => "Switching Protocols",

    // 2xx
    200 => "OK",
    201 => "Created",
    202 => "Accepted",
    203 => "Non-Authoritative Information",
    204 => "No Content",
    205 => "Reset Content",
    206 => "Partial Content",

    // 3xx
    300 => "Multiple Choices",
    301 => "Moved Permanently",
    302 => "Found",
    303 => "See Other",
    304 => "Not Modified",
    305 => "Use Proxy",
    307 => "Temporary Redirect",

    // 4xx
    400 => "Bad Request",
    401 => "Unauthorized",
    402 => "Payment Required",
    403 => "Forbidden",
    404 => "Not Found",
    405 => "Method Not Allowed",
    406 => "Not Acceptable",
    407 => "Proxy Authentication Required",
    408 => "Request Timeout",
    409 => "Conflict",
    410 => "Gone",
    411 => "Length Required",
    412 => "Precondition Failed",
    413 => "Request Entity Too Large",
    414 => "Request-URI Too Long",
    415 => "Unsupported Media Type",
    416 => "Requested Range Not Satisfiable",
    417 => "Expectation Failed",

    // 5xx
    500 => "Internal Server Error",
    501 => "Not Implemented",
    502 => "Bad Gateway",
    503 => "Service Unavailable",
    504 => "Gateway Timeout",
    505 => "HTTP Version Not Supported",
);

/**
 * Build an absolute URL from the URL of a page and a link found on that page.
 *
 * - A leading "./" on $path is dropped.
 * - A $path starting with "/" is appended to the scheme and authority of $base.
 * - Any other $path is appended to the directory part of $base (everything up
 *   to and including the last "/" of its path; query and fragment are ignored).
 *
 * A $base without any path ("http://example.com") is treated as having the
 * directory "/", so the host name is never discarded. "../" segments are left
 * in place, not resolved.
 *
 * @param string $base URL of the document containing the link
 * @param string $path relative or root-relative link
 * @return string the combined URL
 */
function specialconcat($base, $path) {
    // "./x" is the same as "x" relative to the base directory.
    $path = preg_replace('~^\./~', '', $path);

    if (preg_match('~^([a-z][a-z0-9+.\-]*://[^/?#]*)([^?#]*)~i', $base, $parts)) {
        // $parts[1] = "scheme://authority", $parts[2] = path without query/fragment.
        $root = $parts[1];
        $lastSlash = strrpos($parts[2], '/');
        $dir = ($lastSlash === false) ? '/' : substr($parts[2], 0, $lastSlash + 1);
    } else {
        // Not an absolute URL: just cut off whatever follows the last slash.
        $lastSlash = strrpos($base, '/');
        $root = ($lastSlash === false) ? $base : substr($base, 0, $lastSlash + 1);
        $dir = '';
    }

    if (strncmp($path, '/', 1) === 0) {
        return $root . $path;
    }
    return $root . $dir . $path;
}

/**
 * Remove duplicate values from a list, keeping the first occurrence of each
 * value in its original position.
 *
 * Despite its name this function has never sorted anything; the order of the
 * result is the order of first appearance. The result is re-indexed from 0.
 *
 * @param array|null $arr list of scalar values (URLs in this script)
 * @return array|null de-duplicated list; an empty or non-array argument is
 *                    returned unchanged
 */
function sortarray($arr) {
    // Callers may pass an unset variable when no links were found.
    if (!is_array($arr) || count($arr) == 0) return $arr;

    return array_values(array_unique($arr));
}

/**
 * Perform one HTTP GET on $url and report where it leads.
 *
 * Only the response headers are inspected:
 * - a "200" status line yields $url itself,
 * - a "Location:" header yields its value (a root-relative value is completed
 *   with the scheme, host and port of $url),
 * - anything else, or a failed connection, yields "".
 *
 * @param string $url absolute http:// URL
 * @return string the URL to continue with, or "" when there is none
 */
function firstArd($url) {
    $urlArray = parse_url($url);
    if (!is_array($urlArray) || empty($urlArray['host'])) return "";

    $host = $urlArray['host'];
    $port = empty($urlArray['port']) ? 80 : (int) $urlArray['port'];
    $path = empty($urlArray['path']) ? "/" : $urlArray['path'];
    if (isset($urlArray['query']) && $urlArray['query'] !== "") $path .= "?" . $urlArray['query'];

    // The Host header carries the port only when it is not the default one.
    $hostHeader = ($port == 80) ? $host : "$host:$port";

    $location = "";
    $sock = fsockopen($host, $port, $errnum, $errstr, 10);
    if ($sock) {
        $dump  = "GET $path HTTP/1.1\r\n";
        $dump .= "User-Agent: Z-Add Link Checker (http://w3.z-add.co.uk/linkcheck/)\r\n";
        $dump .= "Host: $hostHeader\r\n";
        $dump .= "Connection: close\r\n\r\n";
        fputs($sock, $dump);

        while (($str = fgets($sock, 1024)) !== false) {
            // An empty line ends the header section; the body is of no interest
            // and must not be mistaken for headers.
            if (rtrim($str, "\r\n") === "") break;
            if (preg_match('#^HTTP/[0-9]+\.[0-9]+ 200#i', $str)) $location = $url;
            if (preg_match('#^Location:\s*#i', $str)) $location = preg_replace('#^Location:\s*#i', "", $str);
        }
        fclose($sock);
        flush();
    }

    $location = trim($location);
    // Servers may send "Location: /path"; complete it so it can be fetched.
    if ($location !== "" && $location[0] === "/" && strncmp($location, "//", 2) !== 0) {
        $location = "http://" . $hostHeader . $location;
    }
    return $location;
}

/**
 * Determine the status of a single link.
 *
 * - mailto: links: the host part of the address is looked up for an MX record;
 *   the result code is "OK" or "ERROR".
 * - other non-http:// links: code "N/A".
 * - http:// links: a HEAD request is sent; the code is the three-digit HTTP
 *   status, or "Død" when no connection or no status line could be obtained.
 *
 * @param string $url link to check
 * @return array array('code' => string) plus, for HTTP responses that carry
 *               one, 'contentType' => string (raw Content-Type header value)
 */
function check($url) {
    if (!preg_match('#^http://#i', $url)) {
        if (!preg_match('#^mailto:#i', $url)) return array('code' => "N/A");

        // Keep only the host part: drop the scheme, any "?subject=..." suffix
        // and everything up to the last "@".
        $address = trim(preg_replace('#^mailto:#i', "", $url));
        $address = preg_replace('/\?.*$/s', "", $address);
        $at = strrpos($address, "@");
        $host = ($at === false) ? "" : substr($address, $at + 1);

        // An address without a host can never be valid; skip the DNS lookup.
        $valid = ($host !== "") && checkdnsrr($host, "MX");
        return array('code' => $valid ? "OK" : "ERROR");
    }

    $urlArray = parse_url($url);
    if (!is_array($urlArray) || empty($urlArray['host'])) return array('code' => "Død");

    $host = $urlArray['host'];
    $port = empty($urlArray['port']) ? 80 : (int) $urlArray['port'];
    $path = empty($urlArray['path']) ? "/" : $urlArray['path'];
    // The query string is part of the resource being checked.
    if (isset($urlArray['query']) && $urlArray['query'] !== "") $path .= "?" . $urlArray['query'];
    $hostHeader = ($port == 80) ? $host : "$host:$port";

    $sock = fsockopen($host, $port, $errnum, $errstr, 10);
    if (!$sock) return array('code' => "Død");

    $dump  = "HEAD $path HTTP/1.1\r\n";
    $dump .= "User-Agent: Z-Add Link Checker (http://w3.z-add.co.uk/linkcheck/)\r\n";
    $dump .= "Host: $hostHeader\r\n";
    $dump .= "Connection: close\r\n\r\n";
    fputs($sock, $dump);

    $return = array();
    while (($str = fgets($sock, 1024)) !== false) {
        if (rtrim($str, "\r\n") === "") break; // end of headers
        if (preg_match('#^HTTP/[0-9]+\.[0-9]+ ([0-9]{3})#i', $str, $m)) {
            // Take the status digits only; the reason phrase may contain any text.
            $return['code'] = $m[1];
        } elseif (preg_match('#^Content-Type:\s*(.*)$#is', $str, $m)) {
            $return['contentType'] = trim($m[1]);
        }
    }
    fclose($sock);
    flush();

    // Connected, but nothing that looks like an HTTP status line came back.
    if (!isset($return['code'])) $return = array('code' => "Død") + $return;
    return $return;
}

/**
 * Fetch a document and return the distinct links (href/src attribute values)
 * it contains, converted to absolute URLs.
 *
 * HTML comments are ignored. Fragments ("#...") are always removed; query
 * strings are removed as well when the global $removeq is set. Links with a
 * scheme other than http: (mailto:, ftp:, https:, javascript:, ...) are only
 * returned when the global $otherLinks is set. Links pointing back to $url
 * itself are left out.
 *
 * @param string $url absolute URL of the document to scan
 * @return array|false list of links, or false when the document could not be
 *                     read or contains no links
 */
function liste($url) {
    global $otherLinks;
    global $removeq;

    $text = file_get_contents($url);
    if ($text === false || $text === "") return false;

    // Links inside HTML comments are not part of the page.
    $stripped = preg_replace('/<!--.*?-->/s', "", $text);
    if ($stripped !== null) $text = $stripped;

    // The value may be double-quoted, single-quoted or bare; the branch-reset
    // group (?|...) puts it in capture group 1 in all three cases.
    $pattern = '/\b(?:href|src)\s*=\s*(?|"([^"]*)"|\'([^\']*)\'|([^\s>]+))/i';
    $mylist = array();
    if (preg_match_all($pattern, $text, $found, PREG_SET_ORDER)) {
        foreach ($found as $hit) {
            // Attribute values are HTML-encoded ("&amp;" etc.).
            $link = html_entity_decode($hit[1], ENT_QUOTES);
            $link = trim(str_replace(array('"', "'"), "", $link));
            $link = preg_replace('/#.*$/s', "", $link);
            if ($removeq) $link = preg_replace('/\?.*$/s', "", $link);
            // An empty value (e.g. href="#top") refers to the page itself.
            if ($link !== "") $mylist[] = $link;
        }
    }
    if (count($mylist) == 0) return false;

    $mylist = sortarray($mylist); // drops duplicates, keeps document order

    $return = array();
    foreach ($mylist as $link) {
        $temp = "";
        if (preg_match('#^http://#i', $link)) {
            $temp = $link;
        } elseif (strncmp($link, "//", 2) === 0) {
            // Protocol-relative link: same scheme as the page, i.e. http.
            $temp = "http:" . $link;
        } elseif (preg_match('#^[a-z][a-z0-9+.\-]*:#i', $link)) {
            // Any other scheme cannot be combined with the base URL.
            if ($otherLinks) $temp = $link;
        } else {
            $temp = specialconcat($url, $link);
        }
        if ($temp && $temp !== $url) $return[] = $temp;
    }

    if (count($return) != 0) return $return;
    return false;
}

// ---------------------------------------------------------------------------
// Request handling: read the form parameters, normalise the submitted URL and
// follow it (at most five hops) until firstArd() returns the same address.
// On success $uri holds the final address; otherwise it stays empty.
// ---------------------------------------------------------------------------

// Read the parameters explicitly instead of relying on register_globals.
$url = (isset($_GET['url']) && is_string($_GET['url'])) ? trim($_GET['url']) : "";
$removeq = !empty($_GET['removeq']);
$otherLinks = !empty($_GET['otherLinks']);
$uri = "";
$steps = array();

if ($url !== "" && !preg_match('#^http://#i', $url)) $url = "http://$url";

// Accept only addresses that start with a plausible host and contain none of
// the characters | > <.
if ($url !== "" && preg_match('#^http://[0-9a-z.\-@:]+#i', $url) && !preg_match('#[|><]#', $url)) {
    if ($removeq) $url = preg_replace('/\?.*$/s', "", $url);
    $urlArray = parse_url($url);
    if (is_array($urlArray) && !empty($urlArray['host'])) {
        $path = empty($urlArray['path']) ? "/" : $urlArray['path'];
        if (isset($urlArray['query']) && $urlArray['query'] !== "") $path .= "?" . $urlArray['query'];
        // Keep a non-default port; dropping it would check a different server.
        $portPart = (!empty($urlArray['port']) && (int) $urlArray['port'] != 80) ? ":" . (int) $urlArray['port'] : "";
        $uri = "http://" . $urlArray['host'] . $portPart . $path;

        // Follow redirects, fetching each hop exactly once.
        $trin = 0;
        while ($trin++ < 5) {
            $next = firstArd($uri);
            if ($next == $uri) break;   // stable: this is the final address
            $uri = $next;
            $steps[] = $uri;
            if ($uri === "") break;     // dead end: nothing left to follow
        }
    }
}

?>
<?php
// Query form. It submits back to this script via GET; the URL field is
// pre-filled with the resolved address ($uri) or, failing that, with what the
// user entered ($url). All dynamic values are HTML-escaped because they
// originate from the request.
?>
<form action="<?php print htmlspecialchars(basename(isset($_SERVER['PHP_SELF']) ? $_SERVER['PHP_SELF'] : "")); ?>" name="submitform">
<label for="url">Enter URL:</label><br />
<input name="url" id="url" size="40" value="<?php print htmlspecialchars(!empty($uri) ? $uri : (isset($url) ? $url : "")); ?>" /><br />
<label for="removeq">Remove querystring</label> &nbsp; <input type="checkbox" name="removeq" id="removeq" value="1" <?php if (!empty($removeq)) print "checked"; ?> /><br />
<input type="submit" value=" Check " /> &nbsp; <input type="reset" value=" Reset " /><br />
</form>
<p>free from kab_184.</p>
<?
// ---------------------------------------------------------------------------
// Result output: check every link found on $uri, print one table row per link
// and then two summary tables (by status code and by content type).
// Link texts, content types and unknown status values come from remote servers
// and are HTML-escaped before printing.
// ---------------------------------------------------------------------------
if (!empty($uri)) {
    $self = htmlspecialchars(basename(isset($_SERVER['PHP_SELF']) ? $_SERVER['PHP_SELF'] : ""));
    $statCode = array();        // status code  => number of links
    $statContentType = array(); // content type => number of links

    $liste = liste($uri);
    $total = is_array($liste) ? count($liste) : 0;

    if ($total > 0) {
        print "<table summary=\"Results\" class=\"thin\">\n";
        print "<tr><th>Status</th><th>Description</th><th>URL</th></tr>";
        foreach ($liste as $link) {
            $check = check($link);
            $code = isset($check['code']) ? (string) $check['code'] : "";
            // Drop parameters such as "; charset=..." from the content type.
            $contentType = !empty($check['contentType']) ? preg_replace('/;.*$/s', "", $check['contentType']) : "Unknown";

            $statCode[$code] = isset($statCode[$code]) ? $statCode[$code] + 1 : 1;
            $statContentType[$contentType] = isset($statContentType[$contentType]) ? $statContentType[$contentType] + 1 : 1;

            // Codes listed in $text are fixed literals; anything else is
            // remote data and gets escaped.
            $known = isset($text[$code]);
            $shownCode = $known ? $code : htmlspecialchars($code);
            $description = $known ? $text[$code] : "";
            $shownLink = htmlspecialchars(rawurldecode($link));

            print "<tr>\n<td>$shownCode</td>\n<td>$description</td>\n<td>";
            // Reachable HTML pages can be checked themselves with one click.
            if (preg_match('#^text/html#i', $contentType) && preg_match('/^[23][0-9]{2}/', $code)) {
                print "<a href=\"./" . $self . "?url=" . rawurlencode($link) . "\">" . $shownLink . "</a>";
            }
            else print $shownLink;
            print "</td></tr>\n";
        }
        print "</table>\n";
    }
    else print "<p><b>I didn't find any links.</b></p>";

    if (count($statCode) >= 1) {
        $print_statsCode = "";
        foreach ($statCode as $key => $value) {
            // Two decimals, with trailing zeros (and a then-dangling dot) removed.
            $procent = rtrim(rtrim(number_format($value * 100 / $total, 2, ".", ""), "0"), ".");
            $label = isset($text[$key]) ? $text[$key] : htmlspecialchars((string) $key);
            $print_statsCode .= "<tr><td>$label</td><td>$value</td><td>&nbsp;$procent%&nbsp;</td></tr>\n";
        }
        print "<p><b>Response Codes:</b></p>";
        print "<table summary=\"Response Codes\" class=\"thin\">";
        print "<tr><th>Status&nbsp;</th><th>Number&nbsp;</th><th>Percent&nbsp;</th></tr>";
        print $print_statsCode;
        print "</table>";
    }

    if (count($statContentType) >= 1) {
        $print_statsContent = "";
        foreach ($statContentType as $key => $value) {
            $procent = rtrim(rtrim(number_format($value * 100 / $total, 2, ".", ""), "0"), ".");
            $label = htmlspecialchars((string) $key);
            $print_statsContent .= "<tr><td>$label</td><td>$value</td><td>&nbsp;$procent%&nbsp;</td></tr>\n";
        }
        print "<p><b>Content-Type:</b></p>";
        print "<table summary=\"Content-Type\" class=\"thin\">";
        print "<tr><th>Content-Type&nbsp;</th><th>Number&nbsp;</th><th>Percent</th></tr>";
        print $print_statsContent;
        print "</table>";
    }
}
if (!empty($url) && empty($uri)) print "<p><b>Invalid adress.</b></p>";
?>
</div>



EZ Archive Ads Plugin for vBulletin Copyright 2006 Computer Help Forum