/*
* adsout.c
*
* Copyright (c) Richard Mathar 2007-2018
* Copyright (c) Chris Putnam 2007-2018
*
* Program and source code released under the GPL version 2
*
*/
#include <stdio.h>
#include <stdlib.h>
#include <stdint.h>
#include <string.h>
#include <ctype.h>
#include "utf8.h"
#include "str.h"
#include "strsearch.h"
#include "fields.h"
#include "name.h"
#include "title.h"
#include "url.h"
#include "bibformats.h"
static int adsout_write( fields *in, FILE *fp, param *p, unsigned long refnum );
static void adsout_writeheader( FILE *outptr, param *p );
void
adsout_initparams( param *p, const char *progname )
{
p->writeformat = BIBL_ADSABSOUT;
p->format_opts = 0;
p->charsetout = BIBL_CHARSET_DEFAULT;
p->charsetout_src = BIBL_SRC_DEFAULT;
p->latexout = 0;
p->utf8out = BIBL_CHARSET_UTF8_DEFAULT;
p->utf8bom = BIBL_CHARSET_BOM_DEFAULT;
p->xmlout = BIBL_XMLOUT_FALSE;
p->nosplittitle = 0;
p->verbose = 0;
p->addcount = 0;
p->singlerefperfile = 0;
if ( p->charsetout == BIBL_CHARSET_UNICODE ) {
p->utf8out = p->utf8bom = 1;
}
p->headerf = adsout_writeheader;
p->footerf = NULL;
p->writef = adsout_write;
}
enum {
TYPE_UNKNOWN = 0,
TYPE_GENERIC,
TYPE_ARTICLE,
TYPE_MAGARTICLE,
TYPE_BOOK,
TYPE_INBOOK,
TYPE_INPROCEEDINGS,
TYPE_HEARING,
TYPE_BILL,
TYPE_CASE,
TYPE_NEWSPAPER,
TYPE_COMMUNICATION,
TYPE_BROADCAST,
TYPE_MANUSCRIPT,
TYPE_REPORT,
TYPE_THESIS,
TYPE_MASTERSTHESIS,
TYPE_PHDTHESIS,
TYPE_DIPLOMATHESIS,
TYPE_DOCTORALTHESIS,
TYPE_HABILITATIONTHESIS,
TYPE_LICENTIATETHESIS,
TYPE_PATENT,
TYPE_PROGRAM
};
typedef struct match_type {
char *name;
int type;
} match_type;
static int
get_type( fields *in )
{
match_type match_genres[] = {
{ "academic journal", TYPE_ARTICLE },
{ "magazine", TYPE_MAGARTICLE },
{ "conference publication", TYPE_INPROCEEDINGS },
{ "hearing", TYPE_HEARING },
{ "Ph.D. thesis", TYPE_PHDTHESIS },
{ "Masters thesis", TYPE_MASTERSTHESIS },
{ "Diploma thesis", TYPE_DIPLOMATHESIS },
{ "Doctoral thesis", TYPE_DOCTORALTHESIS },
{ "Habilitation thesis", TYPE_HABILITATIONTHESIS },
{ "Licentiate thesis", TYPE_LICENTIATETHESIS },
{ "legislation", TYPE_BILL },
{ "newspaper", TYPE_NEWSPAPER },
{ "communication", TYPE_COMMUNICATION },
{ "manuscript", TYPE_MANUSCRIPT },
{ "unpublished", TYPE_MANUSCRIPT },
{ "report", TYPE_REPORT },
{ "technical report", TYPE_REPORT },
{ "legal case and case notes", TYPE_CASE },
{ "patent", TYPE_PATENT },
};
int nmatch_genres = sizeof( match_genres ) / sizeof( match_genres[0] );
char *tag, *data;
int i, j, type = TYPE_UNKNOWN;
for ( i=0; i<in->n; ++i ) {
tag = in->tag[i].data;
if ( strcasecmp( tag, "GENRE:MARC" ) &&
strcasecmp( tag, "GENRE:BIBUTILS" ) &&
strcasecmp( tag, "GENRE:UNKNOWN" ) ) continue;
data = in->data[i].data;
for ( j=0; j<nmatch_genres; ++j ) {
if ( !strcasecmp( data, match_genres[j].name ) ) {
type = match_genres[j].type;
fields_setused( in, i );
}
}
if ( type==TYPE_UNKNOWN ) {
if ( !strcasecmp( data, "periodical" ) )
type = TYPE_ARTICLE;
else if ( !strcasecmp( data, "thesis" ) )
type = TYPE_THESIS;
else if ( !strcasecmp( data, "book" ) ) {
if ( in->level[i]==0 ) type = TYPE_BOOK;
else type = TYPE_INBOOK;
}
else if ( !strcasecmp( data, "collection" ) ) {
if ( in->level[i]==0 ) type = TYPE_BOOK;
else type = TYPE_INBOOK;
}
if ( type!=TYPE_UNKNOWN ) fields_setused( in, i );
}
}
if ( type==TYPE_UNKNOWN ) {
for ( i=0; i<in->n; ++i ) {
if ( strcasecmp( in->tag[i].data, "RESOURCE" ) )
continue;
data = in->data[i].data;
if ( !strcasecmp( data, "moving image" ) )
type = TYPE_BROADCAST;
else if ( !strcasecmp( data, "software, multimedia" ) )
type = TYPE_PROGRAM;
if ( type!=TYPE_UNKNOWN ) fields_setused( in, i );
}
}
/* default to generic */
if ( type==TYPE_UNKNOWN ) type = TYPE_GENERIC;
return type;
}
static int
append_title( fields *in, char *ttl, char *sub, char *adstag, int level, fields *out, int *status )
{
str fulltitle, *title, *subtitle, *vol, *iss, *sn, *en, *ar;
int fstatus, output = 0;
str_init( &fulltitle );
title = fields_findv( in, level, FIELDS_STRP, ttl );
subtitle = fields_findv( in, level, FIELDS_STRP, sub );
if ( str_has_value( title ) ) {
output = 1;
title_combine( &fulltitle, title, subtitle );
vol = fields_findv( in, LEVEL_ANY, FIELDS_STRP, "VOLUME" );
if ( str_has_value( vol ) ) {
str_strcatc( &fulltitle, ", vol. " );
str_strcat( &fulltitle, vol );
}
iss = fields_findv_firstof( in, LEVEL_ANY, FIELDS_STRP, "ISSUE",
"NUMBER", NULL );
if ( str_has_value( iss ) ) {
str_strcatc( &fulltitle, ", no. " );
str_strcat( &fulltitle, iss );
}
sn = fields_findv( in, LEVEL_ANY, FIELDS_STRP, "PAGES:START" );
en = fields_findv( in, LEVEL_ANY, FIELDS_STRP, "PAGES:STOP" );
ar = fields_findv( in, LEVEL_ANY, FIELDS_STRP, "ARTICLENUMBER" );
if ( str_has_value( sn ) ) {
if ( str_has_value( en ) ) {
str_strcatc( &fulltitle, ", pp. " );
} else {
str_strcatc( &fulltitle, ", p. " );
}
str_strcat( &fulltitle, sn );
} else if ( str_has_value( ar ) ) {
str_strcatc( &fulltitle, ", p. " );
str_strcat( &fulltitle, ar );
}
if ( str_has_value( en ) ) {
str_addchar( &fulltitle, '-' );
str_strcat( &fulltitle, en );
}
if ( str_memerr( &fulltitle ) ) {
*status = BIBL_ERR_MEMERR;
goto out;
}
fstatus = fields_add( out, adstag, str_cstr( &fulltitle ), LEVEL_MAIN );
if ( fstatus!=FIELDS_OK ) *status = BIBL_ERR_MEMERR;
}
out:
str_free( &fulltitle );
return output;
}
static void
append_titles( fields *in, int type, fields *out, int *status )
{
int added;
if ( type==TYPE_ARTICLE || type==TYPE_MAGARTICLE ) {
added = append_title( in, "TITLE", "SUBTITLE", "%J", LEVEL_HOST, out, status );
if ( added==0 )
(void) append_title( in, "SHORTTITLE", "SHORTSUBTITLE", "%J", LEVEL_HOST, out, status );
}
}
static void
append_people( fields *in, char *tag1, char *tag2, char *tag3, char *adstag, int level, fields *out, int *status )
{
str oneperson, allpeople;
vplist_index i;
int fstatus;
vplist a;
str_init( &oneperson );
str_init( &allpeople );
vplist_init( &a );
fields_findv_eachof( in, level, FIELDS_CHRP, &a, tag1, tag2, tag3, NULL );
if ( a.n ) {
for ( i=0; i<a.n; ++i ) {
if ( i!=0 ) str_strcatc( &allpeople, "; " );
name_build_withcomma( &oneperson, (char *) vplist_get( &a, i) );
str_strcat( &allpeople, &oneperson );
}
fstatus = fields_add( out, adstag, str_cstr( &allpeople ), LEVEL_MAIN );
if ( fstatus!=FIELDS_OK ) *status = BIBL_ERR_MEMERR;
}
vplist_free( &a );
str_free( &oneperson );
str_free( &allpeople );
}
static void
append_pages( fields *in, fields *out, int *status )
{
str *sn, *en, *ar;
int fstatus;
sn = fields_findv( in, LEVEL_ANY, FIELDS_STRP, "PAGES:START" );
en = fields_findv( in, LEVEL_ANY, FIELDS_STRP, "PAGES:STOP" );
ar = fields_findv( in, LEVEL_ANY, FIELDS_STRP, "ARTICLENUMBER" );
if ( str_has_value( sn ) ) {
fstatus = fields_add( out, "%P", str_cstr( sn ), LEVEL_MAIN );
if ( fstatus!=FIELDS_OK ) {
*status = BIBL_ERR_MEMERR;
return;
}
}
else if ( str_has_value( ar ) ) {
fstatus = fields_add( out, "%P", str_cstr( ar ), LEVEL_MAIN );
if ( fstatus!=FIELDS_OK ) {
*status = BIBL_ERR_MEMERR;
return;
}
}
if ( str_has_value( en ) ) {
fstatus = fields_add( out, "%L", str_cstr( en ), LEVEL_MAIN );
if ( fstatus!=FIELDS_OK ) {
*status = BIBL_ERR_MEMERR;
return;
}
}
}
static int
mont2mont( const char *m )
{
static char *monNames[]= { "jan", "feb", "mar", "apr", "may",
"jun", "jul", "aug", "sep", "oct", "nov", "dec" };
int i;
if ( isdigit( (unsigned char)m[0] ) ) return atoi( m );
else {
for ( i=0; i<12; i++ ) {
if ( !strncasecmp( m, monNames[i], 3 ) ) return i+1;
}
}
return 0;
}
static int
get_month( fields *in, int level )
{
str *month;
month = fields_findv_firstof( in, level, FIELDS_STRP, "DATE:MONTH", "PARTDATE:MONTH", NULL );
if ( str_has_value( month ) ) return mont2mont( month->data );
else return 0;
}
static void
append_date( fields *in, char *adstag, int level, fields *out, int *status )
{
int month, fstatus;
char outstr[1000];
str *year;
year = fields_findv_firstof( in, level, FIELDS_STRP, "DATE:YEAR", "PARTDATE:YEAR", NULL );
if ( str_has_value( year ) ) {
month = get_month( in, level );
sprintf( outstr, "%02d/%s", month, str_cstr( year ) );
fstatus = fields_add( out, adstag, outstr, LEVEL_MAIN );
if ( fstatus!=FIELDS_OK ) *status = BIBL_ERR_MEMERR;
}
}
#include "adsout_journals.c"
static void
output_4digit_value( char *pos, long long n )
{
char buf[6];
n = n % 10000; /* truncate to 0->9999, will fit in buf[6] */
#ifdef WIN32
sprintf( buf, "%I64d", n );
#else
sprintf( buf, "%lld", n );
#endif
if ( n < 10 ) strncpy( pos+3, buf, 1 );
else if ( n < 100 ) strncpy( pos+2, buf, 2 );
else if ( n < 1000 ) strncpy( pos+1, buf, 3 );
else strncpy( pos, buf, 4 );
}
static char
get_firstinitial( fields *in )
{
char *name;
int n;
n = fields_find( in, "AUTHOR", LEVEL_MAIN );
if ( n==FIELDS_NOTFOUND ) n = fields_find( in, "AUTHOR", LEVEL_ANY );
if ( n!=FIELDS_NOTFOUND ) {
name = fields_value( in, n, FIELDS_CHRP );
return name[0];
} else return '\0';
}
static int
get_journalabbr( fields *in )
{
char *jrnl;
int n, j;
n = fields_find( in, "TITLE", LEVEL_HOST );
if ( n!=FIELDS_NOTFOUND ) {
jrnl = fields_value( in, n, FIELDS_CHRP );
for ( j=0; j<njournals; j++ ) {
if ( !strcasecmp( jrnl, journals[j]+6 ) )
return j;
}
}
return -1;
}
static void
append_Rtag( fields *in, char *adstag, int type, fields *out, int *status )
{
char outstr[20], ch;
int n, i, fstatus;
long long page;
strcpy( outstr, "..................." );
/** YYYY */
n = fields_find( in, "DATE:YEAR", LEVEL_ANY );
if ( n==FIELDS_NOTFOUND ) n = fields_find( in, "PARTDATE:YEAR", LEVEL_ANY );
if ( n!=FIELDS_NOTFOUND ) output_4digit_value( outstr, atoi( fields_value( in, n, FIELDS_CHRP ) ) );
/** JJJJ */
n = get_journalabbr( in );
if ( n!=-1 ) {
i = 0;
while ( i<5 && journals[n][i]!=' ' && journals[n][i]!='\t' ) {
outstr[4+i] = journals[n][i];
i++;
}
}
/** VVVV */
n = fields_find( in, "VOLUME", LEVEL_ANY );
if ( n!=FIELDS_NOTFOUND ) output_4digit_value( outstr+9, atoi( fields_value( in, n, FIELDS_CHRP ) ) );
/** MPPPP */
n = fields_find( in, "PAGES:START", LEVEL_ANY );
if ( n==FIELDS_NOTFOUND ) n = fields_find( in, "ARTICLENUMBER", LEVEL_ANY );
if ( n!=FIELDS_NOTFOUND ) {
page = atoll( fields_value( in, n, FIELDS_CHRP ) );
output_4digit_value( outstr+14, page );
if ( page>=10000 ) {
ch = 'a' + (page/10000);
outstr[13] = ch;
}
}
/** A */
ch = toupper( (unsigned char) get_firstinitial( in ) );
if ( ch!='\0' ) outstr[18] = ch;
fstatus = fields_add( out, adstag, outstr, LEVEL_MAIN );
if ( fstatus!=FIELDS_OK ) *status = BIBL_ERR_MEMERR;
}
static void
append_easyall( fields *in, char *tag, char *adstag, int level, fields *out, int *status )
{
vplist_index i;
int fstatus;
vplist a;
vplist_init( &a );
fields_findv_each( in, level, FIELDS_CHRP, &a, tag );
for ( i=0; i<a.n; ++i ) {
fstatus = fields_add( out, adstag, (char*) vplist_get( &a, i ), LEVEL_MAIN );
if ( fstatus!=FIELDS_OK ) {
*status = BIBL_ERR_MEMERR;
goto out;
}
}
out:
vplist_free( &a );
}
static void
append_easy( fields *in, char *tag, char *adstag, int level, fields *out, int *status )
{
char *value;
int fstatus;
value = fields_findv( in, level, FIELDS_CHRP, tag );
if ( value && value[0]!='\0' ) {
fstatus = fields_add( out, adstag, value, LEVEL_MAIN );
if ( fstatus!=FIELDS_OK ) *status = BIBL_ERR_MEMERR;
}
}
static void
append_keys( fields *in, char *tag, char *adstag, int level, fields *out, int *status )
{
vplist_index i;
str allkeys;
int fstatus;
vplist a;
str_init( &allkeys );
vplist_init( &a );
fields_findv_each( in, level, FIELDS_CHRP, &a, tag );
if ( a.n ) {
for ( i=0; i<a.n; ++i ) {
if ( i>0 ) str_strcatc( &allkeys, ", " );
str_strcatc( &allkeys, (char *) vplist_get( &a, i ) );
}
fstatus = fields_add( out, adstag, str_cstr( &allkeys ), LEVEL_MAIN );
if ( fstatus!=FIELDS_OK ) *status = BIBL_ERR_MEMERR;
}
str_free( &allkeys );
vplist_free( &a );
}
static void
append_urls( fields *in, fields *out, int *status )
{
int lstatus;
slist types;
lstatus = slist_init_valuesc( &types, "URL", "DOI", "PMID", "PMC", "ARXIV", "JSTOR", "MRNUMBER", "FILEATTACH", "FIGATTACH", NULL );
if ( lstatus!=SLIST_OK ) {
*status = BIBL_ERR_MEMERR;
return;
}
*status = urls_merge_and_add( in, LEVEL_ANY, out, "%U", LEVEL_MAIN, &types );
slist_free( &types );
}
static void
append_trailer( fields *out, int *status )
{
int fstatus;
fstatus = fields_add( out, "%W", "PHY", LEVEL_MAIN );
if ( fstatus!=FIELDS_OK ) {
*status = BIBL_ERR_MEMERR;
return;
}
fstatus = fields_add( out, "%G", "AUTHOR", LEVEL_MAIN );
if ( fstatus!=FIELDS_OK ) {
*status = BIBL_ERR_MEMERR;
return;
}
}
static void
output( FILE *fp, fields *out )
{
char *tag, *value;
int i;
for ( i=0; i<out->n; ++i ) {
tag = fields_tag( out, i, FIELDS_CHRP );
value = fields_value( out, i, FIELDS_CHRP );
fprintf( fp, "%s %s\n", tag, value );
}
fprintf( fp, "\n" );
fflush( fp );
}
static int
append_data( fields *in, fields *out )
{
int type, status = BIBL_OK;
fields_clearused( in );
type = get_type( in );
append_people ( in, "AUTHOR", "AUTHOR:ASIS", "AUTHOR:CORP", "%A", LEVEL_MAIN, out, &status );
append_people ( in, "EDITOR", "EDITOR:ASIS", "EDITOR:CORP", "%E", LEVEL_ANY, out, &status );
append_easy ( in, "TITLE", "%T", LEVEL_ANY, out, &status );
append_titles ( in, type, out, &status );
append_date ( in, "%D", LEVEL_ANY, out, &status );
append_easy ( in, "VOLUME", "%V", LEVEL_ANY, out, &status );
append_easy ( in, "ISSUE", "%N", LEVEL_ANY, out, &status );
append_easy ( in, "NUMBER", "%N", LEVEL_ANY, out, &status );
append_easy ( in, "LANGUAGE", "%M", LEVEL_ANY, out, &status );
append_easyall( in, "NOTES", "%X", LEVEL_ANY, out, &status );
append_easy ( in, "ABSTRACT", "%B", LEVEL_ANY, out, &status );
append_keys ( in, "KEYWORD", "%K", LEVEL_ANY, out, &status );
append_urls ( in, out, &status );
append_pages ( in, out, &status );
append_easyall( in, "DOI", "%Y", LEVEL_ANY, out, &status );
append_trailer( out, &status );
append_Rtag ( in, "%R", type, out, &status );
return status;
}
static int
adsout_write( fields *in, FILE *fp, param *p, unsigned long refnum )
{
int status;
fields out;
fields_init( &out );
status = append_data( in, &out );
if ( status==BIBL_OK ) output( fp, &out );
fields_free( &out );
return status;
}
static void
adsout_writeheader( FILE *outptr, param *p )
{
if ( p->utf8bom ) utf8_writebom( outptr );
}