
Do HTML sa extrahuje prvých 10 dostupných obrázkov zo stránky en.wikipedia.org (http://www.wikipedia.org). Výstup sa obnovuje každých 15 minút.
Výstupy:
Source URL;Image URL;Name
"http://en.wikipedia.org/wiki/Main_Page";"http://upload.wikimedia.org/wikipedia/commons/thumb/0/02/Rimsky-Korsakov_Serow_crop.png/100px-Rimsky-Korsakov_Serow_crop.png";"100px-Rimsky-Korsakov_Serow_crop.png"
"http://en.wikipedia.org/wiki/Main_Page";"http://upload.wikimedia.org/wikipedia/en/thumb/2/2d/HMAS_Vengeance_%28AWM_044574%29.jpg/80px-HMAS_Vengeance_%28AWM_044574%29.jpg";"80px-HMAS_Vengeance_%28AWM_044574%29.jpg"
"http://en.wikipedia.org/wiki/Main_Page";"http://upload.wikimedia.org/wikipedia/en/thumb/7/76/Kampala_Kasubi_Tombs.jpg/100px-Kampala_Kasubi_Tombs.jpg";"100px-Kampala_Kasubi_Tombs.jpg"
"http://en.wikipedia.org/wiki/Main_Page";"http://upload.wikimedia.org/wikipedia/commons/thumb/5/59/Premiere_Coupe_Stanley_1893.jpg/100px-Premiere_Coupe_Stanley_1893.jpg";"100px-Premiere_Coupe_Stanley_1893.jpg"
"http://en.wikipedia.org/wiki/Main_Page";"http://upload.wikimedia.org/wikipedia/commons/thumb/1/17/Phallus_hadriani.jpg/160px-Phallus_hadriani.jpg";"160px-Phallus_hadriani.jpg"
"http://en.wikipedia.org/wiki/Main_Page";"http://upload.wikimedia.org/wikipedia/en/9/9d/Commons-logo-31px.png";"Commons-logo-31px.png"
"http://en.wikipedia.org/wiki/Main_Page";"http://upload.wikimedia.org/wikipedia/en/6/60/Wikinews-logo-51px.png";"Wikinews-logo-51px.png"
"http://en.wikipedia.org/wiki/Main_Page";"http://upload.wikimedia.org/wikipedia/en/f/f2/Wiktionary-logo-51px.png";"Wiktionary-logo-51px.png"
"http://en.wikipedia.org/wiki/Main_Page";"http://upload.wikimedia.org/wikipedia/en/4/46/Wikiquote-logo-51px.png";"Wikiquote-logo-51px.png"
"http://en.wikipedia.org/wiki/Main_Page";"http://upload.wikimedia.org/wikipedia/en/7/7f/Wikibooks-logo-35px.png";"Wikibooks-logo-35px.png"










Zdrojový kód skriptu:
# File: imgdownloader_main.w
# Name: Image Downloader
# Description: Script opens defined URL, finds first 10 available images,
# downloads them into folder 'images', saves basic information into CSV file
# and makes html with downloaded images.
# Input: URL
# Output format: CSV file, images, HTML
# Output CSV fields: Source URL, Image URL, Name
#<Logger File>
# Global
# FileName imgdownloader_log.log
# Level debug
#</Logger>
# Main section of the script: resets the previous outputs, downloads the page
# at $url and, for each <img> tag matched (at most 10), saves the image into
# ./images/, appends a row to the CSV file and an <img> tag to the HTML file.
<Section>
Name imgdownloader_main
# $output_file  - CSV report (Source URL; Image URL; Name)
# $output_file2 - HTML page listing the downloaded images
# $path         - URL prefix put in front of the image name in the HTML <img src>
Define $output_file imgdownloader_output.csv
Define $output_file2 imgdownloader_output.html
Define $path http://www.qualityunit.com/fileadmin/scripts/imgdownloader/images/
# clean output files and download dir
# (Print in Write mode without Text is used to reset each output file;
#  the shell glob *.* only removes files whose name contains a dot)
<Action Print>
FileName {$output_file}
FileMode Write
</Action>
<Action Print>
FileName {$output_file2}
FileMode Write
</Action>
<Action Exec>
cmd rm ./images/*.*
</Action>
# page whose images are collected
Define $url http://en.wikipedia.org/wiki/Main_Page
# downloading the content of URL
# NOTE(review): RemoveNewLine presumably strips line breaks from the fetched
# content so that a tag split over several lines can still match - confirm.
<Action ContentURL>
URL {$url}
RemoveNewLine
</Action>
# one pass per matched <img> tag; MaxIterations limits the run to 10 images
<Section While>
MaxIterations 10
# two types of patterns:
#   1) src value enclosed in double quotes
#   2) unquoted src value (captured up to the next space)
# both store the captured address in $url_img
<Section Or>
NoContext
<Pattern>
RegExp <img{:re(.*?)}src="{$url_img:re([^"]*)}"
Trim
Compact
MultiLine
</Pattern>
<Pattern>
RegExp <img{:re(.*?)}src={$url_img:re([^ ]*)}
Trim
Compact
MultiLine
</Pattern>
</Section>
# relative address -> absolute address
# When $url_img does not start with "http" (case-insensitive), it is prefixed
# with scheme://host + path of $url and a "/".
# preg_match() is used for the prefix test because eregi() was deprecated in
# PHP 5.3 and removed in PHP 7.0, where calling it is a fatal error.
# NOTE(review): root-relative ("/x.png") and protocol-relative ("//host/x.png")
# addresses also go through this plain concatenation - verify the result
# against the pages you scrape.
<Action Php>
Code if (!preg_match('/^http/i',$context->getVariable('$url_img')))\
$context->setVariable('$url_img',parse_url($context->getVariable('$url'), PHP_URL_SCHEME)\
."://".parse_url($context->getVariable('$url'),PHP_URL_HOST)\
.parse_url($context->getVariable('$url'),PHP_URL_PATH)."/".$context->getVariable('$url_img'));
</Action>
# image name: file name and extension of $url_img joined with a dot,
# stored in $name_img
<Action Php>
Code $context->setVariable('$name_img',pathinfo($context->getVariable('$url_img'), PATHINFO_FILENAME)\
.".".pathinfo($context->getVariable('$url_img'), PATHINFO_EXTENSION));
</Action>
# downloading image into the local images/ directory
<Action URLToFile>
URL {$url_img}
FileName images/{$name_img}
</Action>
# saving basic information into CSV file (semicolon-separated)
<Action SaveCSV>
FileName {$output_file}
Separator ;
Column $url, Source URL
Column $url_img, Image URL
Column $name_img, Name
</Action>
# add img to HTML; $_ITERATION is used to number the alt/title texts
<Action Print>
FileName {$output_file2}
Text <img src="{$path}{$name_img}" alt="img-{$_ITERATION}" title="image - {$_ITERATION}" />
</Action>
</Section>
</Section>
# NOTE(review): Main presumably names the section the script starts with - confirm.
Main imgdownloader_main