in reply to Re^2: Storing UTF-8 data into database from scraped web page
in thread SOLVED: Storing UTF-8 data into database from scraped web page
Hello nysus,
Did you see the updated code sample? Did it not work for you?
I just ran one last test with the HTML::Entities module, and both cases worked: the one containing the HTML entity and the one containing the code point escape.
See sample of code:
#!/usr/bin/perl
use DBI;
use utf8;
use strict;
use warnings;
use Data::Dumper;
use Config::Simple;
use HTML::Entities;

$| = 1;    # Flush STDOUT after every write.

my $path   = 'conf.ini';
my %config = ();

# mysql()
#
# Reads the connection settings from $path (keys MySQL.host, MySQL.port,
# MySQL.user, MySQL.pass, MySQL.db and MySQL.table), connects to the MySQL
# server, creates the database and the table when they are missing, inserts
# one row built from two entity-decoded sample strings and returns every row
# of the table.
#
# Returns: a hash reference as produced by selectall_hashref(), keyed on the
#          `data` column.
# Dies:    when the configuration cannot be read or any database step fails.
#
# NOTE(review): the connection does not set any mysql_enable_utf8* attribute;
# confirm that the connection character set matches what your data needs.
sub mysql {
    Config::Simple->import_from( $path, \%config )
        or die Config::Simple->error();

    my $db    = $config{'MySQL.db'};
    my $table = $config{'MySQL.table'};

    my $dbh = DBI->connect(
        "dbi:mysql::" . $config{'MySQL.host'} . ":" . $config{'MySQL.port'},
        $config{'MySQL.user'},
        $config{'MySQL.pass'},
        { PrintError => 1, RaiseError => 1, AutoInactiveDestroy => 1 },
    ) or die "Could not connect to " . $config{'MySQL.host'} . ": "
        . $DBI::errstr . "\n";

    # Quote identifiers and literals once instead of splicing raw
    # configuration values into every SQL statement.
    my $db_ident    = $dbh->quote_identifier($db);
    my $table_ident = $dbh->quote_identifier($table);

    # The value returned by do() is used as the number of matching rows.
    my $databases = $dbh->do( "SHOW DATABASES LIKE " . $dbh->quote($db) )
        or die "Error: " . $dbh->errstr . "\n";

    if ( $databases == 1 ) {
        print "Database: " . $db . " exists not creating: " . $db . "\n";
    }
    else {
        print "Database: " . $db . " does not exist creating: " . $db . "\n";
        $dbh->do("CREATE DATABASE IF NOT EXISTS $db_ident")
            or die "Could not create the: " . $db . " error: "
            . $dbh->errstr . "\n";
    }

    $dbh->do("USE $db_ident")
        or die "Error: " . $dbh->errstr . "\n";

    my $tables = $dbh->do(
        "SHOW TABLES FROM $db_ident WHERE "
            . $dbh->quote_identifier("Tables_in_$db")
            . " LIKE "
            . $dbh->quote($table)
    ) or die "Error: " . $dbh->errstr . "\n";

    if ( $tables == 1 ) {
        print "Table: " . $table . " exists not creating: " . $table . "\n";
    }
    else {
        print "Table: " . $table . " does not exist creating: " . $table . "\n";
        my $create_sth = $dbh->prepare(
            "CREATE TABLE $table_ident (
                `ID` INT NOT NULL AUTO_INCREMENT,
                `data` VARCHAR(150) CHARACTER SET utf8 NOT NULL UNIQUE,
                PRIMARY KEY(`ID`)
            );"
        );
        if ( !$create_sth->execute() ) {
            die "Error: " . $create_sth->errstr . "\n";
        }
    }

    # Both sample strings end up in ONE row. The original statement read
    # "VALUES (? ?)", which only worked because the two substituted string
    # literals were adjacent and MySQL concatenates adjacent literals.
    # CONCAT() states that intent explicitly.
    my $insert_sth = $dbh->prepare(
        "INSERT IGNORE INTO $table_ident (`data`) VALUES (CONCAT(?, ?))"
    );

    my $encode1 = decode_entities("<p>What\x{2019}s up with the water ?? Encode1</p>");
    my $encode2 = decode_entities("<p>What’s up with the water ?? Encode2</p>");

    if ( !$insert_sth->execute( $encode1, $encode2 ) ) {
        die "Error: " . $insert_sth->errstr . "\n";
    }

    my $statement = "SELECT * FROM $table_ident WHERE 1";
    my $hash_ref  = $dbh->selectall_hashref( $statement, 'data' );

    $insert_sth->finish();
    $dbh->disconnect()
        or warn "Error disconnecting: $DBI::errstr\n";

    return $hash_ref;
}    # End of mysql sub

my $output_ref = mysql();
my @data       = keys %$output_ref;

print Dumper $output_ref, \@data;

__DATA__
$ perl mysql.pl
Database: PerlMonks does not exist creating: PerlMonks
Table: Data does not exist creating: Data
$VAR1 = {
          '<p>What’s up with the water ?? Encode1</p><p>What’s up with the water ?? Encode2</p>' => {
              'data' => '<p>What’s up with the water ?? Encode1</p><p>What’s up with the water ?? Encode2</p>',
              'ID' => 1
          }
        };
$VAR2 = [
          '<p>What’s up with the water ?? Encode1</p><p>What’s up with the water ?? Encode2</p>'
        ];
BR / Thanos
|
|---|