#!/usr/bin/perl
# This is fairly silly: find out what, apart from "base", people claim
# "are belong to us", using Google search results as the corpus.
#
# Fetches ten result pages of 100 hits each, strips the markup, and prints
# the distinct phrases found between "all your" and "are belong to us" as a
# single sorted, comma-separated line.
use strict;
use warnings;

use LWP::Simple;

# Decoded query: +"all your" +"are belong to us" -base -bases
# The result offset is appended to the trailing "start=" parameter.
# The URL must not contain literal whitespace.
my $url = 'http://www.google.com/search'
        . '?q=%2B%22all+your%22+%2B%22are+belong+to+us%22+-base+-bases'
        . '&num=100&hl=en&lr=&safe=off&start=';

# Accumulate the raw HTML of every result page into one string.
my $page = '';
for my $offset ( map { $_ * 100 } 0 .. 9 ) {
    my $html = get( $url . $offset );

    # get() returns undef on any failure; skip that page instead of
    # appending undef, and carry on with whatever else can be fetched.
    unless ( defined $html ) {
        warn "Could not fetch results starting at $offset; skipping\n";
        next;
    }
    $page .= $html;
}

# Crude HTML-to-text conversion: drop tags, then drop character entities.
# Only well-formed entities (&name; or &#NNN;) are removed, so a bare "&"
# in running text cannot swallow everything up to the next semicolon.
$page =~ s/<[^>]*?>//gs;
$page =~ s/&#?\w+;//g;

# Capture the 3-20 characters sitting between the two fixed halves of the
# catchphrase, case-insensitively and across line breaks.
my @nouns = ( $page =~ /all your(.{3,20}?)are belong to us/gsi );

my %unique;
for my $noun (@nouns) {
    $noun =~ s/^\s+//;
    $noun =~ s/\s+$//;

    # Collapse internal whitespace (including line breaks) to one space so
    # that words wrapped across lines stay separate words.
    $noun =~ s/\s+/ /g;

    # A capture consisting only of whitespace is not a phrase.
    next if $noun eq '';

    $unique{$noun}++;
}

print join( ', ', sort keys %unique ), "\n";
(I was going to sort them by frequency but Google doesn't give a big enough sample)
andy.
|
|---|
| Replies are listed 'Best First'. | |
|---|---|
|
Re: All your what, exactly, are belong to us? (apart from 'base')
by tomhukins (Curate) on Mar 02, 2001 at 18:16 UTC | |
|
Re: All your what, exactly, are belong to us? (apart from 'base')
by EvanK (Chaplain) on Mar 02, 2001 at 23:30 UTC |