Guys,
I tried both suggestions. Here's a minimal version that shows the problem:
#!/usr/bin/perl -w
# Minimal reproduction: convert test.txt to test.html with HTML::TextToHTML,
# then print $! if it holds a non-empty value.
use HTML::TextToHTML;
use strict;
use diagnostics;
use Data::Dumper;
use warnings;

my $converter = HTML::TextToHTML->new();

# Debugging aid: uncomment the next two lines to dump the two file names and
# the freshly constructed converter object, then stop before converting.
# print STDERR Dumper( \"test.txt", \"test.html", \$converter );
# exit;

# Arguments for txt2html(), held in a list so they are passed in this order.
my @conversion_args = (
    infile                  => ['test.txt'],
    outfile                 => 'test.html',
    explicit_headings       => 1,
    hrule_min               => 20,
    preformat_trigger_lines => 0,
);
$converter->txt2html(@conversion_args);

# NOTE(review): per perlvar, $! is only meaningful immediately after a
# failed system or library call; a successful call does not reset it. A
# non-empty value here therefore does not by itself show that txt2html()
# failed.
if ($!) {
    print "$! \n";
}
This still produces the same msg, even though the conversion works.
If I turn on the Dumper and exit lines, I get the following output:
$VAR1 = \'test.txt';
$VAR2 = \'test.html';
$VAR3 = \bless( {
'escape_HTML_chars' => 1,
'__links_table' => {},
'use_preformat_marker' => 0,
'style_url' => '',
'make_anchors' => 1,
'preformat_end_marker' => '^(:?(:?<)|<)/PRE(:?(:
+?>)|>)$',
'par_indent' => 2,
'doctype' => '-//W3C//DTD HTML 3.2 Final//EN',
'links_dictionaries' => [],
'inhandle' => [],
'append_file' => '',
'short_line_length' => 40,
'preformat_trigger_lines' => 2,
'lower_case_tags' => 0,
'bold_delimiter' => '#',
'title' => '',
'tab_width' => 8,
'__call_init_done' => 0,
'indent_par_break' => 0,
'__non_header_anchor' => 0,
'__mode' => 0,
'bullets' => '-=o*\\267',
'custom_heading_regexp' => [],
'make_tables' => 0,
'underline_offset_tolerance' => 1,
'preformat_start_marker' => '^(:?(:?<)|<)PRE(:?(
+:?>)|>)$',
'__links_table_order' => [],
'preserve_indent' => 0,
'__num_heading_styles' => 0,
'unhyphenation' => 1,
'__prev_para_action' => 0,
'hrule_min' => 4,
'use_mosaic_header' => 0,
'extract' => 0,
'endpreformat_trigger_lines' => 2,
'demoronize' => 1,
'__search_patterns' => [],
'__heading_styles' => {},
'infile' => [],
'prepend_file' => '',
'outfile' => '-',
'xhtml' => 0,
'preformat_whitespace_min' => 5,
'debug' => 0,
'explicit_headings' => 0,
'italic_delimiter' => '*',
'dict_debug' => 0,
'__repl_code' => [],
'__list_nice_indent' => '',
'eight_bit_clean' => 0,
'__listnum' => 0,
'bullets_ordered' => '',
'link_only' => 0,
'default_link_dict' => '/root/.txt2html.dict',
'table_type' => {
'DELIM' => 1,
'ALIGN' => 1,
'PGSQL' => 1,
'BORDER' => 1
},
'underline_length_tolerance' => 1,
'__global_links_data' => '
/<URL:([-\\w\\.\\/:~_\\@]+):([a-zA-Z0-9\'() ]+)>/ -h-> <A HREF="
+$1">$2</A>
/<URL:\\s*(\\S+?)\\s*>/ -h-> <A HREF="$1">$1</A>
/<(http:\\S+?)\\s*>/ -h-> <<A HREF="$1">$1</A>>
|snews:[\\w\\.]+| -> $&
|news:[\\w\\.]+| -> $&
|nntp:[\\w/\\.:+\\-]+| -> $&
|http:[\\w/\\.:\\@+\\-~\\%#?=&;,]+[\\w/]| -> $&
|shttp:[\\w/\\.:+\\-~\\%#?=&;,]+| -> $&
|https:[\\w/\\.:+\\-~\\%#?=&;,]+| -> $&
|file:[\\w/\\.:+\\-]+| -> $&
|ftp:[\\w/\\.:+\\-]+| -> $&
|wais:[\\w/\\.:+\\-]+| -> $&
|gopher:[\\w/\\.:+\\-]+| -> $&
|telnet:[\\w/\\@\\.:+\\-]+| -> $&
|([^\\w\\-/\\.:\\@>])(alt\\.[\\w\\.+\\-]+[\\w+\\-]+)| -h-> $1<A HRE
+F="news:$2">$2</A>
|([^\\w\\-/\\.:\\@>])(bionet\\.[\\w\\.+\\-]+[\\w+\\-]+)| -h-> $1<A HRE
+F="news:$2">$2</A>
|([^\\w\\-/\\.:\\@>])(bit\\.[\\w\\.+\\-]+[\\w+\\-]+)| -h-> $1<A HRE
+F="news:$2">$2</A>
|([^\\w\\-/\\.:\\@>])(biz\\.[\\w\\.+\\-]+[\\w+\\-]+)| -h-> $1<A HRE
+F="news:$2">$2</A>
|([^\\w\\-/\\.:\\@>])(clari\\.[\\w\\.+\\-]+[\\w+\\-]+)| -h-> $1<A HRE
+F="news:$2">$2</A>
|([^\\w\\-/\\.:\\@>])(comp\\.[\\w\\.+\\-]+[\\w+\\-]+)| -h-> $1<A HRE
+F="news:$2">$2</A>
|([^\\w\\-/\\.:\\@>])(gnu\\.[\\w\\.+\\-]+[\\w+\\-]+)| -h-> $1<A HRE
+F="news:$2">$2</A>
|([^\\w\\-/\\.:\\@>])(humanities\\.[\\w\\.+\\-]+[\\w+\\-]+)|
-h-> $1<A HREF="news:$2">$2</A>
|([^\\w\\-/\\.:\\@>])(k12\\.[\\w\\.+\\-]+[\\w+\\-]+)| -h-> $1<A HRE
+F="news:$2">$2</A>
|([^\\w\\-/\\.:\\@>])(misc\\.[\\w\\.+\\-]+[\\w+\\-]+)| -h-> $1<A HRE
+F="news:$2">$2</A>
|([^\\w\\-/\\.:\\@>])(news\\.[\\w\\.+\\-]+[\\w+\\-]+)| -h-> $1<A HRE
+F="news:$2">$2</A>
|([^\\w\\-/\\.:\\@>])(rec\\.[\\w\\.+\\-]+[\\w+\\-]+)| -h-> $1<A HRE
+F="news:$2">$2</A>
|([^\\w\\-/\\.:\\@>])(soc\\.[\\w\\.+\\-]+[\\w+\\-]+)| -h-> $1<A HRE
+F="news:$2">$2</A>
|([^\\w\\-/\\.:\\@>])(talk\\.[\\w\\.+\\-]+[\\w+\\-]+)| -h-> $1<A HRE
+F="news:$2">$2</A>
|([^\\w\\-/\\.:\\@>])(us\\.[\\w\\.+\\-]+[\\w+\\-]+)| -h-> $1<A HRE
+F="news:$2">$2</A>
|([^\\w\\-/\\.:\\@>])(ch\\.[\\w\\.+\\-]+[\\w+\\-]+)| -h-> $1<A HRE
+F="news:$2">$2</A>
|([^\\w\\-/\\.:\\@>])(de\\.[\\w\\.+\\-]+[\\w+\\-]+)| -h-> $1<A HRE
+F="news:$2">$2</A>
|(anonymous\\@)([a-zA-Z][\\w\\.+\\-]+\\.[a-zA-Z]{2,}):(\\s*)([\\w\\d+\
+\-/\\.]+)| -h-> $1<A HREF="ftp://$2/$4">$2:$4</A>$3
|(ftp\\@)([a-zA-Z][\\w\\.+\\-]+\\.[a-zA-Z]{2,}):(\\s*)([\\w\\d+\\-/\\.
+]+)|
-h-> $1<A HREF="ftp://$2/$4">$2:$4</A>$3
|[a-zA-Z0-9_\\+\\-\\.]+\\@([a-zA-Z0-9][\\w\\.+\\-]+\\.[a-zA-Z]{2,})|
-> mailto:$&
|([^\\w\\-/\\.:\\@>])([a-zA-Z][\\w\\.+\\-]+\\.[a-zA-Z]{2,}):(\\s*)([\\
+w\\d+\\-/\\.]+)|
-h-> $1<A HREF="ftp://$2/$4">$2:$4</A>$3
|([^\\w\\-/\\.:\\@])(\\d{2,}\\.\\d{2,}\\.\\d+\\.\\d+):([\\w\\d+\\-/\\.
+]+)|
-h-> $1<A HREF="ftp://$2/$3">$2:$3</A>
|telnet ([a-zA-Z][\\w+\\-]+(\\.[\\w\\.+\\-]+)+\\.[a-zA-Z]{2,})\\s+(\\d
+{2,4})|
-h-> telnet <A HREF="telnet://$1:$3/">$1 $3</A>
|ftp ([a-zA-Z][\\w+\\-]+(\\.[\\w\\.+\\-]+)+\\.[a-zA-Z]{2,})|
-h-> ftp <A HREF="ftp://$1/">$1</A>
|\\b([a-zA-Z][\\w])*ftp[\\w]*(\\.[\\w+\\-]+){2,}| -h-> ftp <A HREF="ft
+p://$&/">$&</A>
|ftp(\\.[a-zA-Z0-9_\\@:-]+)+/\\S+| -> ftp://$&
|www(\\.[a-zA-Z0-9_\\@:-]+)+/\\S+| -> http://$&
|\\b([a-zA-Z][\\w])*www[\\w]*(\\.[\\w+\\-]+){2,}| -> http://$&/
|([a-zA-Z][\\w+\\-]+\\.[\\w+\\-]+\\.[a-zA-Z]{2,})\\s+(\\d{2,4})|
-h-> <A HREF="telnet://$1:$2/">$1 $2</A>
|([^\\w\\-/\\.:\\@])(\\d{1,3}\\.\\d{1,3}\\.\\d{1,3}\\.\\d{1,3})\\s+(\\
+d{1,4})|
-h-> $1<A HREF="telnet://$2:$3">$2 $3</A>
|([^\\w\\-/\\.:\\@])(\\d{1,3}\\.\\d{1,3}\\.\\d{1,3}\\.\\d{1,3})|
-h-> $1<A HREF="telnet://$2">$2</A>
/RFC ?(\\d+)/ -i-> http://www.cis.ohio-state.edu/rfc/rfc$1.txt
/([ \\t\\n])_([a-z][a-z0-9 -]*[a-z])_([ \\t\\n\\.;:,\\!\\?])/ -hi-> $1
+<U>$2</U>$3
"Seth Golub" -io-> http://www.aigeek.com/
"txt2html" -io-> http://txt2html.sourceforge.net/
"Kathryn Andersen" -io-> http://www.katspace.com/
"HTML::TextToHTML" -io-> http://www.katspace.com/tools/text_to_html/
"hypertoc" -io-> http://www.katspace.com/tools/hypertoc/
"HTML::GenToc" -io-> http://www.katspace.com/tools/hypertoc/
',
'indent_width' => 2,
'mailmode' => 0,
'instring' => [],
'append_head' => '',
'caps_tag' => 'STRONG',
'min_caps_length' => 3,
'__file' => '',
'make_links' => 1,
'__list_indent' => [],
'titlefirst' => 0,
'body_deco' => ''
}, 'HTML::TextToHTML' );
I hope this means something to somebody, because it's just line noise to me... ;-)
Cheers
Chris
PS, I'll take a look at the module's debug option...
|