#!/usr/local/bin/perl use strict; use warnings; undef $/; chomp($input=$ARGV[0]); open (A, "< $input") || die "Couldn't open the input"; open(B, ">A.xml") or die("Sorry!"); while (){ $_=~s/\s\s//gi; $_=~s/\t//gi; $_=~s/^\n$//gi; $_=~s/\n//gi; $_=~s/’/'/gi; $_=~s/—/—/gi; $_=~s/“/“/gi; $_=~s/”/”/gi; print B $_; } close (A); close (B); open(C, "< A.xml") || die "$!"; open (Z, "> $input.sgm") || die "Can't write the output"; $file = ; #Body matter begins if ($file =~ m/(]*>(.*?)<\/Body>)/){ $xmlBody = $1; #. #. #. #Processing BlockAmendments while ($xmlBody =~ m/(]*>(.+?)<\/BlockAmendment>)/sgi){ $CbBlkTx = $1; $bBlkTx = $CbBlkTx; if ($bBlkTx =~ m/(]+>(.*?)<\/P2><\/BlockAmendment>)/){ $bBlkTx =~ s/]+>(.*?)<\/P2><\/BlockAmendment>/\n$1<\/P2>\n<\/lq>/gi; $bBlkTx =~ s/([^<]+)<\/Pnumber>(.+?)<\/Text>(.*?)<\/P2para><\/P2>/\n($1)<\/no>\n$2<\/pt>$3\n<\/s1>/mgi; $bBlkTx =~ s/([^<]+)<\/Pnumber>(.+?)<\/Text>(.*?)<\/P3para><\/P3>/\n($1)<\/no>\n$2<\/pt>$3\n<\/s2>/mgi; $bBlkTx =~ s/([^<]+)<\/Pnumber>(.+?)<\/Text>(.*?)<\/P4para><\/P4>/\n($1)<\/no>\n$2<\/pt>$3\n<\/s3>/mgi; $bBlkTx =~ s/([^<]+)<\/Pnumber>(.+?)<\/Text>(.*?)<\/P5para><\/P5>/\n($1)<\/no>\n$2<\/pt>$3\n<\/s4>/mgi; } $bBlkTx =~ s/<\/pt>\n<\/s([0-9])>(.+?)<\/Text>/ $2<\/pt><\/s$1>/mgi; print "$CbBlkTx\n\n============\n"; print "$bBlkTx\n\n"; $xmlBody =~ s/$CbBlkTx/$bBlkTx/gi; } } print Z $xmlBody;