camera01.pl to HTML.

index -|- end

Generated: Tue Feb 2 17:54:23 2010 from camera01.pl 2008/07/18 2.6 KB.

#!/perl -w
# NAME: camera01.pl
# AIM: Obtain digital camera information from web
# 18/07/2008 geoff mclane http://geoffair.net/mperl
use strict;
use warnings;
use LWP::Simple;
use LWP::UserAgent;
require 'logfile.pl' or die "Unable to load logfile.pl ...\n";
require 'htmltools.pl' or die "Unable to load 'htmltools.pl' ...\n";
# Log file setup: the log file is named after this script.
# NOTE(review): $LF is not referenced anywhere else in this script.
my ($LF);
my $pgmname = $0;
# Keep only the file-name part of $0.  Both '\' and '/' are accepted as
# directory separators, so 'X:\dir\name.pl', 'dir\name.pl', './name.pl' and
# '/dir/name.pl' all reduce to 'name.pl' and $outfile never contains a
# directory component.
$pgmname =~ s{\A.*[\\/]}{}s;
my $outfile = "temp.$pgmname.txt";
# open_log() is not defined in this file (presumably provided by logfile.pl).
open_log($outfile);
###prt( "$0 ... Hello, World ...\n" );
# Page to fetch and the scratch files that receive the intermediate results.
my $domain = 'http://www.pixmania.com';
my $in_url = $domain.'/fr/fr/1658/xx/150-330/1/1/criteresn_BA00000027.html';
my $out_htm = 'tempcont.htm';
my $out_htm2 = 'tempcont2.htm';
my $rawcnt = 0;     # length of the page as fetched
my $trimcnt = 0;    # length of the page after the current clean-up step
my @lines = ();
my @nlines = ();
prt( "Doing get [$in_url] ...\n" );
# LWP::Simple::get() returns undef on failure and does not report the reason
# through $!, so the failure message names the URL instead of printing errno.
my $content = get( $in_url );
mydie( "get FAILED for [$in_url] ...\n" )
    unless (defined $content && length $content);
$rawcnt = length($content);
@lines = split(/\n/,$content);
for my $line (@lines) {
    # split on "\n" has already removed the line terminators, so no chomp.
    # trim_all() is defined outside this file (presumably htmltools.pl).
    $line = trim_all($line);
    # Keep only lines that still have content after trimming.
    push(@nlines, $line) if length($line);
}
###$content = trim_all($content);
# First snapshot: the trimmed, non-empty lines.
$content = join("\n",@nlines);
$trimcnt = length($content);
write2file($content, $out_htm);
prt( "Written $trimcnt chars to $out_htm ($rawcnt) ...\n" );
# Second snapshot: the same lines after array_tags2newline(), an external
# helper (presumably re-splits the lines at HTML tags -- TODO confirm).
@nlines = array_tags2newline(@nlines);
$content = join("\n",@nlines);
$trimcnt = length($content);
write2file($content, $out_htm2);
prt( "Written $trimcnt chars to $out_htm2 ($rawcnt) ...\n" );
# Flatten the page into one space-separated string and look for the result
# counter, which has the form "<first>-<last> sur <total>".
$content = join(' ',@nlines);
my $surtxt = '';
my $subtxt = '';
if ($content =~ /\s+(\d+-\d+\s+sur\s+\d+)\s+/) {
    $surtxt = $1;
    # Offset of the capture itself.  index($content,$surtxt) would return the
    # FIRST occurrence of the same text, which is not necessarily the one the
    # pattern matched (the pattern also requires surrounding whitespace).
    my $ind = $-[1];
    $subtxt = substr($content,$ind);
    my $subcnt = 0;
    # $ind2 is relative to $ind (it is an offset into $subtxt, not $content);
    # index() returns -1 when the marker image is absent.
    my $ind2 = index($subtxt,'http://pan.fotovista.com/dev/gui_web/grafx/fleche-violetteD.gif');
    if ($ind2 > 0) {
        # Keep the text from the counter up to 10 characters before the
        # marker URL (presumably backing up over a leading '<img src="' --
        # TODO confirm).
        $subtxt = substr($content,$ind,$ind2-10);
        # removetag() is defined outside this file (presumably htmltools.pl).
        $subtxt = removetag($subtxt,'div');
        $subtxt = removetag($subtxt,'span');
        # NOTE(review): the listing showed a space-for-space substitution
        # here, which does nothing; this assumes the pattern was the
        # '&nbsp;' entity, decoded when the listing was rendered -- confirm.
        $subtxt =~ s/&nbsp;/ /g;
        # Collapse every run of two or more whitespace characters to one space.
        $subtxt =~ s/\s{2,}/ /g;
        $subcnt = length($subtxt);
        prt( "Got sur = [$surtxt] ... in $trimcnt characters at offset $ind to $ind2 ... ($subcnt)\n" );
        # Dump the section one whitespace-separated token per line.
        @lines = split(/\s/,$subtxt);
        write2file(join("\n",@lines), 'tempcont3.txt');
        ##my @hrefs = ret_hrefs_array( $subtxt );
        # collect_hrefs() is defined outside this file.
        my @hrefs = collect_hrefs( $subtxt );
        # Terminate the list with a newline, like every other prt() call here.
        prt( join("\n",@hrefs)."\n" );
    }
}
#system( $out_htm );
close_log($outfile,1);
exit(0);
#####################
# eof

index -|- top

checked by tidy  Valid HTML 4.01 Transitional