<?xml version="1.0" encoding="UTF-8"?>
<!-- generator="FeedCreator 1.8" -->
<?xml-stylesheet href="https://wiki.glasgow.social/lib/exe/css.php?s=feed" type="text/css"?>
<rdf:RDF
    xmlns="http://purl.org/rss/1.0/"
    xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
    xmlns:slash="http://purl.org/rss/1.0/modules/slash/"
    xmlns:dc="http://purl.org/dc/elements/1.1/">
    <!-- Channel metadata: feed title, site link, icon reference, last-build date,
         and the ordered list of item URIs carried by this feed. -->
    <channel rdf:about="https://wiki.glasgow.social/feed.php">
        <title>The Open Guide to Glasgow scraping</title>
        <description></description>
        <link>https://wiki.glasgow.social/</link>
        <image rdf:resource="https://wiki.glasgow.social/lib/tpl/dokuwiki/images/favicon.ico" />
        <!-- W3CDTF requires a colon in the UTC offset (+01:00, not +0100). -->
        <dc:date>2026-04-29T09:00:08+01:00</dc:date>
        <items>
            <rdf:Seq>
                <rdf:li rdf:resource="https://wiki.glasgow.social/scraping/dns_filter?rev=1605895819&amp;do=diff"/>
            </rdf:Seq>
        </items>
    </channel>
    <!-- Feed icon resource; its rdf:about URI matches the rdf:resource of the
         image reference inside the channel element. -->
    <image rdf:about="https://wiki.glasgow.social/lib/tpl/dokuwiki/images/favicon.ico">
        <title>The Open Guide to Glasgow</title>
        <link>https://wiki.glasgow.social/</link>
        <url>https://wiki.glasgow.social/lib/tpl/dokuwiki/images/favicon.ico</url>
    </image>
    <!-- One changed wiki page: Dublin Core metadata, title, diff link, and a
         plain-text excerpt of the page body (the excerpt ends with an ellipsis).
         Whitespace inside the description element is data; do not re-indent it. -->
    <item rdf:about="https://wiki.glasgow.social/scraping/dns_filter?rev=1605895819&amp;do=diff">
        <dc:format>text/html</dc:format>
        <!-- W3CDTF requires a colon in the UTC offset (+01:00, not +0100).
             NOTE(review): rev=1605895819 is 2020-11-20T18:10:19 UTC, so this
             wall-clock value may be UTC mislabelled as +01:00; confirm in the generator. -->
        <dc:date>2020-11-20T18:10:19+01:00</dc:date>
        <dc:creator>Anonymous (anonymous@undisclosed.example.com)</dc:creator>
        <title>scraping:dns_filter</title>
        <link>https://wiki.glasgow.social/scraping/dns_filter?rev=1605895819&amp;do=diff</link>
        <description>Scraping: DNS Filter

This code takes the unique URLs (see Hidden Glasgow for an example) and checks which ones are pointing to domains that no longer exist (then drops them from the to-be-checked list).


&lt;?php
$file_list = &quot;non-image-links.txt&quot;;

$data = file_get_contents($file_list);
$lines = explode(&quot;\n&quot;, $data);
$host_list = array();

foreach($lines as $url) {
        $url_parts = parse_url($url);
        if(!empty($url_parts['host'])) {
                $host = $url_parts['host'];
         …</description>
    </item>
</rdf:RDF>
