$title

' example.bib >example.html undef $nopages; undef $nosize; undef $nodoi; undef $notype; undef $nocompression; undef $nobrackets; if (defined($opt_e)) { my(@opts) = split(/,/, $opt_e); for $opt (@opts) { if ($opt =~ m/(PostScript|PDF|DVI|DOI):(.*)/) { $typeicon{$1} = $2; } elsif ($opt =~ m/(notype|nosize|nopages|nocompression|nodoi|nobrackets)/) { eval "\$$1 = 1"; } else { print STDERR qq{Invalid extended information specification: $opt This can be a comma-separated list of the following specifications: PostScript|PDF|DVI|DOI:new-text (e.g. PDF file icon) notype|nosize|nopages|nocompression|nodoi|nobrackets }; exit 1; } } } # PostScript and PDF files are assumed to be in same directory # as the target HTML file. if (defined($htmlfile) && ($htmlfile =~ m+(^.*)/+)) { push @filedir, $1; } else { push @filedir, "." } if (defined $opt_D) { local($dir, $url); foreach $dir (split(/\,/, $opt_D)) { $url = $dir; if ($dir =~ s/\@(.*)$//) { $url = $1; } push @filedir, $dir; $dirmap{$dir} = $url; } } umask(077); open(HTMLFILE, (defined($htmlfile) ? ">$htmlfile$$" : ">&STDOUT")); if (defined($htmlfile) && open(OHTMLFILE, "$htmlfile")) { $mode = (stat OHTMLFILE)[2] & 0xfff; $updating = 1; } else { $mode = 0644; $updating = 0; # An existing HTML file does not exist, so output some boilerplate. if ($opt_u) { $enc = 'UTF-8'; } else { $enc = 'US-ASCII'; } print HTMLFILE qq{ $title } . q{ } } $beginstring = ""; $endstring = ""; @citations = (); if ($opt_i && $updating) { loop: while () { print HTMLFILE; last loop if m/^$beginstring$/; } loop: while () { print HTMLFILE; last loop if m/^$endstring$/; push(@citations, $2) if m/^([^\\]*)?(.+\})(.*)?$/; } push(@citations, "\\bibdata{$macrofile$bibfile}"); } # Create an .aux file for bibtex to read. $auxfile = "bib$$"; push(@tmpfiles, "$auxfile.aux"); open(AUXFILE, ">$auxfile" . ".aux"); print AUXFILE "\\relax\n\\bibstyle{$bstfile}\n"; if (defined($citefile)) { $citefile .= ".aux"; open(CITEFILE, "<$citefile") || die "error opening $citefile: $!\n"; while () { print AUXFILE $_ if (m/^\\(citation|bibdata){/); } close(CITEFILE); } elsif (@citations) { foreach $citation (@citations) { print AUXFILE "$citation\n"; } } else { print AUXFILE "\\citation{*}\n\\bibdata{$macrofile$bibfile}\n"; } close(AUXFILE); # run bibtex, redirecting bibtex's output from STDOUT to STDERR. push(@tmpfiles, "$auxfile.blg"); push(@tmpfiles, "$auxfile.bbl"); #Flush HTMLFILE to avoid duplicate buffer writes after the fork select(HTMLFILE); $| = 1; $| = 0; select(STDOUT); # We attempt to fork in order to redirect bibtex's stdout to stderr. # This is needed when bib2xhtml is generating its output on the # standard output. # The shell redirection syntax used in the system() alternative # is by no means portable. eval { fork || (open(STDOUT, ">&STDERR"), # Handle leakage in Win32 prevents the final rename() close(HTMLFILE), close(OHTMLFILE), exec('bibtex', (split(/\s+/, ($opt_b ? $opt_b : "")), $auxfile))); wait; }; # fork is not implemented on some non-Unix platforms. if ($@) { # The fork failed (perhaps not implemented on this system). system("bibtex $opt_b $auxfile 1>&2"); } $beginstring = ""; $endstring = ""; if ($updating) { loop: while () { last loop if m/^$beginstring$/; print HTMLFILE; } loop: while () { last loop if m/^$endstring$/; } } print HTMLFILE "$beginstring\n"; print HTMLFILE < EOF # Now we make two passes over the .bbl file. In the first pass, we # just collect the {cite, label} pairs, which we will use later for # crossrefs. $t = $auxfile . ".bbl"; $/ = ""; # Make a first pass through the .bbl file, collecting citation/label pairs. open(BBLFILE, "<$t") || die "error opening $t: $!\n"; $nentry = 0; loop: while () { # Check for definitions at start of .bbl file. if (($nentry == 0) && (m/^#/)) { if ((m/#\s*label-style:\s*(\S+)/) && (! defined $label_style)) { $label_style = $label_styles{$1}; if (! defined $label_style) { print STDERR "label style unknown: \n"; next loop; } } next loop; } $nentry++; ($bcite, $blabel) = m+

\[([^\]]*)\]

+; $blabel = "$nentry" if ($label_style == $LABEL_NUMBERED); $bibcite{$bcite} = $blabel; } close(BBLFILE); $label_style = $LABEL_DEFAULT if (! defined $label_style); $list_start = $list_start[$label_style]; $list_end = $list_end[$label_style]; if (defined($opt_t)) { print HTMLFILE "$nentry references, last updated " . &ctime(time) . "

\n"; } print HTMLFILE "<$list_start>\n\n"; #foreach $key (sort (keys(%bibcite))) { # print "$key : $bibcite{$key}\n"; #} open(BBLFILE, "<$t") || die "error opening $t: $!\n"; $nentry = 0; loop: while () { # Skip definitions at start of .bbl file. next loop if (($nentry == 0) && (m/^#/)); $nentry++; # Protect \{, \}, and \$, and then assign matching {} pairs a unique ID. s/\\\{/\002/g; s/\\\}/\003/g; s/\\\$/\004/g; { local ($c, $l, $z) = (0, 0, ()); s/([\{\}])/join("","\001",($1 eq "\{" ? $z[$l++]=$c++ : $z[--$l]),$1)/ge; } # bibtex sometimes breaks long lines by inserting "%\n". We remove # that because it might accidently break the line in the middle # of a URL. We don't need to deal with TeX comments in general # because bibtex seems to munge them up anyway, so there shouldn't # be any in the bibliography file. s/\%\n//g; # bibtex's add.period$ knows how to avoid adding extra periods # when a block already ends in a period. bib2xhtml's modifications # of bibtex's style files break that. We fix it here. s/(\.(<\/cite>|<\/a>|\')+)\./$1/g; # Adjust beginning of entry based on bibliography style. if ($label_style == $LABEL_PLAIN) { s:

()\[[^\]]*\]()

$1$2:; s:

::; # Attempt to fix up empty tag, which some browsers # don't handle properly (even though it *is* legal HTML). # First try to combine a with a following )([\w]+):$1$2<\/a>:; } elsif ($label_style == $LABEL_PARAGRAPH) { s:

()\[[^\]]*\]()

$1$2:; s:

:; # Attempt to fix up empty tag, which some browsers # don't handle properly (even though it *is* legal HTML). # First try to combine a with a following )([\w]+):$1$2<\/a>:; } elsif ($label_style == $LABEL_NUMBERED) { s:(

\[)[^\]]*(\]

):$1$nentry$2:; } # Append the key name, if asked so if ($opt_k && ($label_style == $LABEL_NUMBERED || $label_style == $LABEL_DEFAULT)) { # $1 $2 $3 $4 $5 s:(

\[)([^\]]*)(\]

):$1$2$3$4 --- $2$5:; } # Attempt to fix up crossrefs. while (m/(\\(cite(label)?)(\001\d+)\{([^\001]+)\4\})/) { $old = $1; $cmd = $2; $doxref = defined($3); $bcite = $5; if (! defined $bibcite{$bcite}) { $blabel = " [" . $bcite . "]"; } elsif ($doxref) { $blabel = " [" . $bibcite{$bcite} . "]<\/a>"; } else { $blabel = " [" . $bibcite{$bcite} . "]"; } $old =~ s/(\W)/\\$1/g; s/\s*$old/$blabel/g; } # In some styles crossrefs become something like # "In Doe and Roe [Doe and Roe, 1995]." Change this to # "In [Doe and Roe, 1995]." to remove the redundancy. s/In ()([^\[]+) \[(\2)/In $1\[$2/; # Handle the latex2html commands \htmladdnormallink{text}{url} # and \htmladdnormallinkfoot{text}{url}. s/\\htmladdnormallink(foot)?(\001\d+)\{([^\001]+)\2\}(\001\d+)\{([^\001]+)\4\}/$3<\/a>/gs; s/\&/\005/g; # Protect original & sequences s/\\?&/&/g; # \& -> & and & -> & s/\005/&/g; # Restore original & sequences if ($opt_u) { utf_ent(); } else { html_ent(); } # Handle \char123 -> &123;. while (m/\\char([\'\"]?[0-9a-fA-F]+)/) { $o = $r = $1; if ($r =~ s/^\'//) { $r = oct($r); } elsif ($r =~ s/^\"//) { $r = hex($r); } s/\\char$o\s*/&#$r;/g; } s/{\\etalchar\001(\d+)\{(.)}\001\1\}/$2/g; # {\etalchar{x}} -> x s/\\par\b/

/g; s/\\url(\001\d+)\{(.*)\1\}/$2<\/a>/gs; #\url{text} -> text s/\\href(\001\d+)\{(.*)\1\}(\001\d+)\{([^\001]*)\3\}/$4<\/a>/gs; #\href{text} -> text s/\\href(\001\d+)\{(.*)\1\}/$2<\/a>/gs; #\href{text} -> text # There's no way to easily handle \rm and \textrm because # HTML has no tag to convert back to plain text. Since it's very # difficult to do the right thing, we do the wrong thing, and just # remove them. s/(\001\d+)\{\\rm\s+(.*)\1\}/$2/gs; # {\rm text} -> text s/\\textrm(\001\d+)\{(.*)\1\}/$2/gs; # \textrm{text} -> text # This doesn't create correct HTML, because HTML doesn't allow nested # character style tags. Oh well. s/(\001\d+)\{\\em\s+(.*)\1\}/$2<\/em>/gs; # {\em text} -> text s/(\001\d+)\{\\it\s+(.*)\1\}/$2<\/i>/gs; # {\it text} -> text s/(\001\d+)\{\\bf\s+(.*)\1\}/$2<\/b>/gs; # {\bf text} -> text s/(\001\d+)\{\\tt\s+(.*)\1\}/$2<\/tt>/gs; # {\tt text} -> text s/\\emph(\001\d+)\{(.*)\1\}/$2<\/em>/gs; # \emph{text} -> text s/\\textit(\001\d+)\{(.*)\1\}/$2<\/i>/gs; # \textit{text} -> text s/\\textbf(\001\d+)\{(.*)\1\}/$2<\/b>/gs; # \textbf{text} -> text s/\\texttt(\001\d+)\{(.*)\1\}/$2<\/tt>/gs;# \textit{text} -> text s/\\mathrm(\001\d+)\{(.*)\1\}/$2/gs; # \mathrm{text} -> text s/\\mathnormal(\001\d+)\{(.*)\1\}/$2/gs; # \mathnormal{text} -> text s/\\mathsf(\001\d+)\{(.*)\1\}/$2/gs; # \mathsf{text} -> text s/\\mathbf(\001\d+)\{(.*)\1\}/$2<\/b>/gs; # \mathbf{text} -> text s/\\mathcal(\001\d+)\{(.*)\1\}/$2<\/i>/gs;# \mathcal{text} -> text s/\\mathit(\001\d+)\{(.*)\1\}/$2<\/i>/gs; # \mathit{text} -> text s/\\mathtt(\001\d+)\{(.*)\1\}/$2<\/tt>/gs;# \mathtt{text} -> text # Custom highlighting for the -n option. s/\\bibxhtmlname(\001\d+)\{(.*)\1\}/&highlight_name($2)/ges; # {\boldmath $mathstuff$} -> mathstuff # s/(\001\d+)\{\s*\\boldmath ?([^A-Za-z\{\}][^\{\}]*)\}/$1<\/b>/gs; sub domath { local($t) = @_; $t =~ s/\^(\001\d+)\{\\circ\1\}/\&\#176;/gs; # ^{\circ}->degree $t =~ s/\^\\circ/\&\#176;/g; # ^\circ->degree # $t =~ s/\^(\001\d+)\{(.*)\1\}/^{$2<\/sup>/gs; # ^{x} $t =~ s/\^(\001\d+)\{(.*)\1\}/^{$2<\/sup>/gs; # ^{x} $t =~ s/\^(\w)/^{$1<\/sup>/g; # ^x # $t =~ s/\_(\001\d+)\{(.*)\1\}/_{$2<\/sub>/gs; # _{x} $t =~ s/\_(\001\d+)\{(.*)\1\}/_{$2<\/sub>/gs; # _{x} $t =~ s/\_(\w)/_{$1<\/sub>/g; # _x $t; } # Handle superscripts and subscripts in inline math mode. s/(\$([^\$]+)\$)/&domath($2)/ge; # $ ... $ s/(\\$(([^\\]|\\[^\($])+)\\\))/&domath($2)/ge; # $ ... $ # Remove \mbox. s/\\mbox(\001\d+)\{(.*)\1\}/$2/gs; # \mbox{x} # Escape and protect tildes in URLs # For some reason /g doesn't work while (s/(\ ~ # Non-alphabetic macros that we keep. s/\\([\#\&\%\~\_\^\|])/$1/g; # Non-alphabetic macros that we remove. # (discretionary hyphen) # (italic correction) s/\\\W//g; # Clean up things we don't handle. # s/\\//g; # The format {\Xyz{Abc}} is interpreted by BibTeX as a single letter # whose text is given by "Abc". If we see this pattern, it is # likely that discarding the \Xyz will do the right thing. s/\001(\d+)\{\\[A-Za-z]+\001(\d+)\{([^\001]*)\001\2\}\001\1\}/$3/g; # Macro names may be meaningful, so keep them and don't run them together. s/\\([A-Za-z]+)/ $1 /g; # Remove an empty tag that bad cross-referencing # in the BibTeX file may have left us with. s+In ++; &doPaperLinks; # Get rid of { } ids, and put protected { } back. s/\001\d+[\{\}]//gs; tr/\002\003\004/{}$/; print HTMLFILE $_; } close(BBLFILE); print HTMLFILE "<$list_end>\n\n$endstring\n"; if ($updating) { while () { print HTMLFILE; } close (OHTMLFILE); } else { print HTMLFILE "\n"; } close(HTMLFILE); if (defined ($htmlfile)) { #$mode &= 0777; #print "setting $htmlfile$$ to $mode\n"; #printf("mode = %lo\n", $mode); chmod($mode, "$htmlfile$$"); rename("$htmlfile$$", $htmlfile); } unlink(@tmpfiles); exit(0);}}}}}}