LinuxQuestions.org - retrieve web site data automatically

I've had to rearrange this a little because the page layout has changed since I used this a few years ago.
Obtaining the timestamp and the share prices gets you on the way to plotting a graph, if you want one.
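This expects a file called INPUT in which each line holds a share symbol and a quantity separated by whitespace (for example "HSBA.L 1018"); blank lines and lines starting with # are ignored.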
Code:
#!/usr/bin/perl  -Tw                                                                                                                                                          

# read share prices                                                                                                                    



use Socket;

use IO::Handle;                                                                                                                                              

use POSIX ":sys_wait_h";

use Carp;                                                                                                                                                                  

# Network line terminator: carriage return (octal 015) followed by line feed
# (octal 012), the line ending used by HTTP and other Internet text protocols.
my $EOL = "\015\012";

                                                                                                                                                                            

# Load the holdings: how many shares of each ticker are owned.
#
# Reads the file INPUT in the current directory.  Each data line holds a
# Yahoo share ticker and a quantity separated by whitespace, e.g.
#     HSBA.L    1018
# Blank lines and lines whose first non-blank character is '#' are skipped.
# A ticker that appears on several lines has its quantities added together.
#
# Result: the package hash %shares (ticker => total quantity), which the
# code further down the script reads.
# Dies if INPUT cannot be opened.

# A dedicated lexical handle with three-argument open is used on purpose:
# reopening STDIN and then reading with <> would read the files named on the
# command line, instead of INPUT, whenever the script is given arguments.
open(my $input, '<', 'INPUT') or die("open $!");

while (defined(my $entry = <$input>)) {
    chomp($entry);

    next if ($entry =~ /^\s*#/);    # comment line
    next if ($entry =~ /^\s*$/);    # blank line

    # Leading and trailing whitespace is tolerated (this includes the CR
    # left over from DOS-format files) so such lines are not lost.
    if ($entry =~ /^\s*(\S+)\s+(\S+)\s*$/) {
        # "+=" treats a not-yet-seen ticker as 0, so first and repeated
        # occurrences are handled by the same statement.
        $shares{$1} += $2;
    }
    else {
        # Anything else used to vanish silently; say so instead.
        warn("INPUT line $.: ignoring unrecognised entry '$entry'\n");
    }
}

close($input);

# Fetch the current price of every held ticker from Yahoo Finance UK.
#
# For each key of %shares (in sorted order) an HTTP/1.0 GET request is sent
# through the Squid proxy at 192.168.0.8:3128 and the response is scanned
# line by line for the quoted price and for the currency symbol.
#
# Results:
#   $price{$symbol}  unit price with thousands separators removed; once the
#                    currency is known it is converted as described below.
# Output (STDOUT):
#   "For <symbol> found price <raw price>" each time a price is matched, and,
#   as soon as both price and currency are known, one line
#   "<script start time> <symbol> <unit price> <holding value> <currency>".
# Dies when the proxy address cannot be converted or when socket(), connect()
# or close() fails.

my $crlf = "\015\012";    # HTTP line terminator (CR LF)

# Connection parameters do not depend on the symbol, so build them once.
my $proxy_ip = inet_aton("192.168.0.8")    # address of squid proxy
    || die "inet_aton: cannot resolve proxy address";
my $proxy_port = 3128;
my $tcp        = getprotobyname('tcp');
my $proxy_addr = sockaddr_in($proxy_port, $proxy_ip);

foreach my $symbol (sort keys %shares) {
    my ($price, $curr);

    socket(my $sock, PF_INET, SOCK_STREAM, $tcp) || die "socket: $!";
    connect($sock, $proxy_addr)                  || die "connect: $!";
    $sock->autoflush(1);

    # Percent-encode everything outside the URI "unreserved" set so that
    # tickers containing characters such as '^', '=', '&' or '#' cannot
    # corrupt the query string.
    (my $query = $symbol) =~ s/([^A-Za-z0-9._~-])/sprintf("%%%02X", ord($1))/ge;

    print $sock "GET http://uk.finance.yahoo.com/q?s=$query HTTP/1.0$crlf",
                "Host: uk.finance.yahoo.com$crlf",
                $crlf;

    shutdown($sock, 1);    # close outbound stream now

    # Single pass over the response.  The header lines can never match the
    # two patterns below, so they need no special treatment.
    while (defined(my $line = <$sock>)) {
        if ($line =~ /class="time_rtq_ticker"><span id="[\w.]+">([\d,.]+)<\/span><\/span> /) {
            printf("For %s found price %s\n", $symbol, $1);
            ($price = $1) =~ tr/,//d;    # drop thousands separators
            $price{$symbol} = $price;
        }

        if ($line =~ /"ticker_currency_sym" : "([^"]+)" /) {
            # Also need to find the currency in this page
            $curr = $1;
        }

        next unless (defined($price) && defined($curr));

        if ("\$" eq $curr) {
            # XXX placeholder conversion: a real exchange rate is needed
            # here; dividing by 2 is only a rough stand-in.
            $curr = "GBP";
            $price{$symbol} /= 2;
        }
        elsif ("GBp" eq $curr) {
            # Quoted in pence; convert to pounds.
            $curr = "GBP";
            $price{$symbol} /= 100;
        }

        printf("%d %s %9.2f  %9.2f %s\n",
               $^T, $symbol, $price{$symbol},
               ($shares{$symbol} * $price{$symbol}), $curr);

        last;    # both values found; the rest of the page is not needed
    }

    # A price without a currency stays in %price as read from the page,
    # with no pence or dollar conversion applied; make that visible.
    if (defined($price) && !defined($curr)) {
        warn("No currency found for $symbol; price left unconverted\n");
    }

    close($sock) || die "close: $!";
}

# Final report.
#
# Prints the script start time ($^T), then one "<ticker>=<value>" line for
# every ticker in %shares whose price is present in %price (value = quantity
# held * unit price), a notice for every ticker without a price, and finally
# the sum of all reported values.  Exits with status 0.
printf("\nT=%d\n", $^T);

my $total = 0;

for my $ticker (sort keys %shares) {
    unless (defined $price{$ticker}) {
        printf("        No price known for %s\n", $ticker);
        next;
    }

    # Value of the whole holding in this ticker.
    my $holding_value = $shares{$ticker} * $price{$ticker};

    printf("%s=%9.2f\n", $ticker, $holding_value);
    $total += $holding_value;
}

printf("\nSUM=%9.2f\n", $total);

exit(0);