#!/usr/bin/env perl -X

=pod

=head1 NAME

bibmradd.pl - add MR numbers to papers in a given bib file

=head1 SYNOPSIS

bibmradd  [-d] [B<-f>] [B<-e> 1|0] [B<-o> I<output>] I<bib_file>

=head1 OPTIONS

=over 4

=item B<-d>

Debug mode

=item B<-e>

If 1 (default), add an empty mrnumber if a mr cannot be found.  This
prevents repeated searches for the same entries if you add new entries
to the file.  Calling C<-e 0> suppresses this behavior.


=item B<-f>

Force searching for MR numbers even if the entry already has one.

=item B<-o> I<output>

Output file.  If this option is not used, the name for the 
output file is formed by adding C<_mr> to the input file

=back

=head1 DESCRIPTION

The script reads a BibTeX file. It checks whether the entries have
mrnumbers. If not, it tries to find the numbers from Internet sites. The
result is a BibTeX file with C<mrnumber=...> fields added.

The name of the output file is either set by the B<-o> option or 
is derived by adding the suffix C<_mr> to the output file.

See the C<bibdoiadd> script for more details on the processing.

=head1 AUTHOR

Boris Veytsman

=head1 COPYRIGHT AND LICENSE

Copyright (C) 2014-2026 Boris Veytsman

This is free software.  You may redistribute copies of it under the
terms of the GNU General Public License
L<http://www.gnu.org/licenses/gpl.html>.  There is NO WARRANTY, to the
extent permitted by law.

=cut

use strict; use warnings;
use Cwd;
use File::Basename;
use File::Spec;

BEGIN {
    # find files relative to our installed location within TeX Live
    chomp(my $TLMaster = `kpsewhich -var-value=TEXMFROOT`); # TL root
    if (length($TLMaster)) {
	unshift @INC, "$TLMaster/texmf-dist/scripts/bibtexperllibs";
    }
     # find development bibtexperllibs in sibling checkout to this script,
     # even if $0 is a symlink. All irrelevant when using from an installation.
     my $real0 = Cwd::abs_path($0);
     my $scriptdir = File::Basename::dirname($real0);
     my $dev_btxperllibs = Cwd::abs_path("$scriptdir/../bibtexperllibs");
     # we need the lib/ subdirectories inside ...
     unshift (@INC, glob ("$dev_btxperllibs/*/lib")) if -d $dev_btxperllibs;
}
use IO::File;
use BibTeX::Parser;
use Getopt::Std;
use URI::Escape;
use LWP::Simple;
$ENV{PERL_LWP_SSL_VERIFY_HOSTNAME}=0;
# Sometimes AMS forgets to update certificates
$ENV{PERL_LWP_SSL_VERIFY_HOSTNAME}=0;

my $USAGE="USAGE: $0  [-d] [-e 1|0] [-f] [-o output] file\n";
my $VERSION = <<END;
bibmradd v3.0
This is free software.  You may redistribute copies of it under the
terms of the GNU General Public License
http://www.gnu.org/licenses/gpl.html.  There is NO WARRANTY, to the
extent permitted by law.
$USAGE
END
my %opts;
getopts('de:fo:hV',\%opts) or die $USAGE;

if ($opts{h} || $opts{V}){
    print $VERSION;
    exit 0;
}

################################################################
# Defaults and parameters
################################################################

my $inputfile = shift;

my $outputfile = $inputfile;

$outputfile =~ s/\.([^\.]*)$/_mr.$1/;

if ($opts{o}) {
    $outputfile = $opts{o};
}

my $forceSearch=$opts{f};

my $forceEmpty = 1;
if (exists $opts{e}) {
    $forceEmpty = $opts{e};
}		

my $debug = $opts{d};

my $input= IO::File->new($inputfile) or 
    die "Cannot find BibTeX file $inputfile\n$USAGE\n";
my $output = IO::File->new("> $outputfile") or 
    die "Cannot write to $outputfile\n$USAGE\n";

my $parser=new BibTeX::Parser($input);



# Creating the HTTP parameters
my $mirror =
    "https://mathscinet.ams.org/batchmrlookup";

while (my $entry = $parser->next ) {
    if (!$entry->parse_ok()) {
	print STDERR "Cannot understand entry: ";
	$entry->print(*STDERR);
	print STDERR "Skipping this entry\n";
	next;
    }
    if ($entry->has('mrnumber') && !$forceSearch) {
	print $output $entry->raw_bibtex(), "\n\n";
	if ($debug) {
	    print STDERR "DEBUG:  entry ", $entry->key(), 
	    " has mrnumber ", $entry->field('mrnumber'), 
	    " and no forced search is requested\n";
	}
	next;
    }
    

     # Now we have an entry with no MR.  Let us get to work.
    if ($debug) {
	print STDERR "DEBUG:  Searching for mr number for entry ",
	$entry->key, "\n";
    }
     my $mr = GetMr($entry, $mirror);
     if (length($mr) || $forceEmpty) {
 	$entry->field('mrnumber', $mr);
     }
    print $output $entry->to_string(), "\n\n";

}

$input->close();
$output->close();
exit 0;

###############################################################
#  Getting one MR
###############################################################

sub GetMr {
    my $entry=shift;
    my $mirror=shift;

    my @data;
    if ($entry->has('issn')) {
	push @data, $entry->field('issn');
    } else {
	push @data, "";
    }
    if ($entry->has('journal')) {
	push @data, $entry->cleaned_field('journal');
    } else {
	push @data, "";
    }
    if ($entry->has('author')) {
	my @authors = $entry->cleaned_author();
	my @lastnames;
	foreach my $author (@authors) {
	    push @lastnames, $author->last();
	}
	if (scalar @lastnames) {
	    push @data, join(";", @lastnames);
	} else {
	    push @data, "";
	}
    } else {
	push @data, "";
    }
    if ($entry->has('volume')) {
	push @data, $entry->cleaned_field('volume');
    } else {
	push @data, "";
    }
    if ($entry->has('number')) {
	push @data, $entry->cleaned_field('number');
    } else {
	push @data, "";
    }
    if ($entry->has('pages')) {
	my $page = $entry->cleaned_field('pages');
	$page =~ s/-.*//;
	$page =~ s/\+.*//;
	push @data, $page;
    } else {
	push @data, "";
    }
    if ($entry->has('year')) {
	push @data, $entry->cleaned_field('year');
    } else {
	push @data, "";
    }
    push @data, $entry->type();
    push @data, $entry->key();
    push @data, "";
    if ($entry->has('title')) {
	my $title = $entry->cleaned_field('title');
	$title =~ s/|/ /g;
	push @data, $entry->cleaned_field('title');
    } else {
	push @data, "";
    }
    
    
    my $qrdata = join("|", @data);
    my $url = "$mirror?api=xref&qdata=".uri_escape_utf8($qrdata);
    if ($debug) {
	print STDERR "DEBUG: query $url\n";
    }

    my $response = get($url);
    chomp $response;
    if ($debug) {
	print "DEBUG: response $response\n";
    }
    
    my @vals = split /\|/, $response;
    my $mr = $vals[9];
    if (length($mr) == 0) {
	if ($debug) {
	    print STDERR "Did not get MR\n";
	}
	return("");
    }

    # Somehow mref deletes leading zeros.  They are needed!
    while (length($mr)<7) {
	$mr = "0$mr";
    }
    if ($debug) {
	print STDERR "DEBUG:  got MR: $mr\n",
    }
    return $mr;

}
