|
Packit |
89ede9 |
/*
|
|
Packit |
89ede9 |
* endin.c
|
|
Packit |
89ede9 |
*
|
|
Packit |
89ede9 |
* Copyright (c) Chris Putnam 2003-2018
|
|
Packit |
89ede9 |
*
|
|
Packit |
89ede9 |
* Program and source code released under the GPL version 2
|
|
Packit |
89ede9 |
*
|
|
Packit |
89ede9 |
*/
|
|
Packit |
89ede9 |
#include <stdio.h>
|
|
Packit |
89ede9 |
#include <stdlib.h>
|
|
Packit |
89ede9 |
#include <string.h>
|
|
Packit |
89ede9 |
#include <ctype.h>
|
|
Packit |
89ede9 |
#include "is_ws.h"
|
|
Packit |
89ede9 |
#include "str.h"
|
|
Packit |
89ede9 |
#include "str_conv.h"
|
|
Packit |
89ede9 |
#include "fields.h"
|
|
Packit |
89ede9 |
#include "url.h"
|
|
Packit |
89ede9 |
#include "reftypes.h"
|
|
Packit |
89ede9 |
#include "bibformats.h"
|
|
Packit |
89ede9 |
#include "generic.h"
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
extern variants end_all[];
|
|
Packit |
89ede9 |
extern int end_nall;
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
/*****************************************************
|
|
Packit |
89ede9 |
PUBLIC: void endin_initparams()
|
|
Packit |
89ede9 |
*****************************************************/
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
static int endin_readf( FILE *fp, char *buf, int bufsize, int *bufpos, str *line, str *reference, int *fcharset );
|
|
Packit |
89ede9 |
static int endin_processf( fields *endin, char *p, char *filename, long nref, param *pm );
|
|
Packit |
89ede9 |
int endin_typef( fields *endin, char *filename, int nrefs, param *p );
|
|
Packit |
89ede9 |
int endin_convertf( fields *endin, fields *info, int reftype, param *p );
|
|
Packit |
89ede9 |
int endin_cleanf( bibl *bin, param *p );
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
void
|
|
Packit |
89ede9 |
endin_initparams( param *p, const char *progname )
|
|
Packit |
89ede9 |
{
|
|
Packit |
89ede9 |
p->readformat = BIBL_ENDNOTEIN;
|
|
Packit |
89ede9 |
p->charsetin = BIBL_CHARSET_DEFAULT;
|
|
Packit |
89ede9 |
p->charsetin_src = BIBL_SRC_DEFAULT;
|
|
Packit |
89ede9 |
p->latexin = 0;
|
|
Packit |
89ede9 |
p->xmlin = 0;
|
|
Packit |
89ede9 |
p->utf8in = 0;
|
|
Packit |
89ede9 |
p->nosplittitle = 0;
|
|
Packit |
89ede9 |
p->verbose = 0;
|
|
Packit |
89ede9 |
p->addcount = 0;
|
|
Packit |
89ede9 |
p->output_raw = 0;
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
p->readf = endin_readf;
|
|
Packit |
89ede9 |
p->processf = endin_processf;
|
|
Packit |
89ede9 |
p->cleanf = endin_cleanf;
|
|
Packit |
89ede9 |
p->typef = endin_typef;
|
|
Packit |
89ede9 |
p->convertf = endin_convertf;
|
|
Packit |
89ede9 |
p->all = end_all;
|
|
Packit |
89ede9 |
p->nall = end_nall;
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
slist_init( &(p->asis) );
|
|
Packit |
89ede9 |
slist_init( &(p->corps) );
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
if ( !progname ) p->progname = NULL;
|
|
Packit |
89ede9 |
else p->progname = strdup( progname );
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
/*****************************************************
|
|
Packit |
89ede9 |
PUBLIC: int endin_readf()
|
|
Packit |
89ede9 |
*****************************************************/
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
/* Endnote tag definition:
|
|
Packit |
89ede9 |
character 1 = '%'
|
|
Packit |
89ede9 |
character 2 = alphabetic character or digit (or other characters)
|
|
Packit |
89ede9 |
character 3 = space (ansi 32)
|
|
Packit |
89ede9 |
*/
|
|
Packit |
89ede9 |
static int
|
|
Packit |
89ede9 |
endin_istag( char *buf )
|
|
Packit |
89ede9 |
{
|
|
Packit |
89ede9 |
const char others[]="!@#$^&*()+=?[~>";
|
|
Packit |
89ede9 |
if ( buf[0]!='%' ) return 0;
|
|
Packit |
89ede9 |
if ( buf[2]!=' ' ) return 0;
|
|
Packit |
89ede9 |
if ( isalpha( (unsigned char)buf[1] ) ) return 1;
|
|
Packit |
89ede9 |
if ( isdigit( (unsigned char)buf[1] ) ) return 1;
|
|
Packit |
89ede9 |
if ( strchr( others, buf[1] ) ) return 1;
|
|
Packit |
89ede9 |
return 0;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
static int
|
|
Packit |
89ede9 |
readmore( FILE *fp, char *buf, int bufsize, int *bufpos, str *line )
|
|
Packit |
89ede9 |
{
|
|
Packit |
89ede9 |
if ( line->len ) return 1;
|
|
Packit |
89ede9 |
else return str_fget( fp, buf, bufsize, bufpos, line );
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
static int
|
|
Packit |
89ede9 |
endin_readf( FILE *fp, char *buf, int bufsize, int *bufpos, str *line, str *reference, int *fcharset )
|
|
Packit |
89ede9 |
{
|
|
Packit |
89ede9 |
int haveref = 0, inref = 0;
|
|
Packit |
89ede9 |
unsigned char *up;
|
|
Packit |
89ede9 |
char *p;
|
|
Packit |
89ede9 |
*fcharset = CHARSET_UNKNOWN;
|
|
Packit |
89ede9 |
while ( !haveref && readmore( fp, buf, bufsize, bufpos, line ) ) {
|
|
Packit |
89ede9 |
if ( !line->data ) continue;
|
|
Packit |
89ede9 |
p = &(line->data[0]);
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
/* Skip <feff> Unicode header information */
|
|
Packit |
89ede9 |
/* <feff> = ef bb bf */
|
|
Packit |
89ede9 |
up = (unsigned char* ) p;
|
|
Packit |
89ede9 |
if ( line->len > 2 && up[0]==0xEF && up[1]==0xBB &&
|
|
Packit |
89ede9 |
up[2]==0xBF ) {
|
|
Packit |
89ede9 |
*fcharset = CHARSET_UNICODE;
|
|
Packit |
89ede9 |
p += 3;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
if ( !*p ) {
|
|
Packit |
89ede9 |
if ( inref ) haveref = 1; /* blank line separates */
|
|
Packit |
89ede9 |
else continue; /* blank line to ignore */
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
/* Each reference starts with a tag && ends with a blank line */
|
|
Packit |
89ede9 |
if ( endin_istag( p ) ) {
|
|
Packit |
89ede9 |
if ( reference->len ) str_addchar( reference, '\n' );
|
|
Packit |
89ede9 |
str_strcatc( reference, p );
|
|
Packit |
89ede9 |
inref = 1;
|
|
Packit |
89ede9 |
} else if ( inref && p ) {
|
|
Packit |
89ede9 |
str_addchar( reference, '\n' );
|
|
Packit |
89ede9 |
str_strcatc( reference, p );
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
str_empty( line );
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
if ( reference->len ) haveref = 1;
|
|
Packit |
89ede9 |
return haveref;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
/*****************************************************
|
|
Packit |
89ede9 |
PUBLIC: int endin_processf()
|
|
Packit |
89ede9 |
*****************************************************/
|
|
Packit |
89ede9 |
static char*
|
|
Packit |
89ede9 |
process_endline( str *tag, str *data, char *p )
|
|
Packit |
89ede9 |
{
|
|
Packit |
89ede9 |
int i;
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
i = 0;
|
|
Packit |
89ede9 |
while ( i<2 && *p ) {
|
|
Packit |
89ede9 |
str_addchar( tag, *p++);
|
|
Packit |
89ede9 |
i++;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
while ( *p==' ' || *p=='\t' ) p++;
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
while ( *p && *p!='\r' && *p!='\n' )
|
|
Packit |
89ede9 |
str_addchar( data, *p++ );
|
|
Packit |
89ede9 |
str_trimendingws( data );
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
while ( *p=='\r' || *p=='\n' ) p++;
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
return p;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
static char *
|
|
Packit |
89ede9 |
process_endline2( str *tag, str *data, char *p )
|
|
Packit |
89ede9 |
{
|
|
Packit |
89ede9 |
while ( *p==' ' || *p=='\t' ) p++;
|
|
Packit |
89ede9 |
while ( *p && *p!='\r' && *p!='\n' )
|
|
Packit |
89ede9 |
str_addchar( data, *p++ );
|
|
Packit |
89ede9 |
str_trimendingws( data );
|
|
Packit |
89ede9 |
while ( *p=='\r' || *p=='\n' ) p++;
|
|
Packit |
89ede9 |
return p;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
static int
|
|
Packit |
89ede9 |
endin_processf( fields *endin, char *p, char *filename, long nref, param *pm )
|
|
Packit |
89ede9 |
{
|
|
Packit |
89ede9 |
str tag, data;
|
|
Packit |
89ede9 |
int status, n;
|
|
Packit |
89ede9 |
strs_init( &tag, &data, NULL );
|
|
Packit |
89ede9 |
while ( *p ) {
|
|
Packit |
89ede9 |
strs_empty( &tag, &data, NULL );
|
|
Packit |
89ede9 |
if ( endin_istag( p ) ) {
|
|
Packit |
89ede9 |
p = process_endline( &tag, &data, p );
|
|
Packit |
89ede9 |
if ( str_is_empty( &data ) ) continue;
|
|
Packit |
89ede9 |
status = fields_add( endin, str_cstr( &tag ), str_cstr( &data ), 0 );
|
|
Packit |
89ede9 |
if ( status!=FIELDS_OK ) return 0;
|
|
Packit |
89ede9 |
} else {
|
|
Packit |
89ede9 |
p = process_endline2( &tag, &data, p );
|
|
Packit |
89ede9 |
/* endnote puts %K only on 1st line of keywords */
|
|
Packit |
89ede9 |
n = fields_num( endin );
|
|
Packit |
89ede9 |
if ( n>0 && str_has_value( &data ) ) {
|
|
Packit |
89ede9 |
if ( !strncmp( endin->tag[n-1].data, "%K", 2 ) ) {
|
|
Packit |
89ede9 |
status = fields_add( endin, "%K", str_cstr( &data ), 0 );
|
|
Packit |
89ede9 |
if ( status!=FIELDS_OK ) return 0;
|
|
Packit |
89ede9 |
} else {
|
|
Packit |
89ede9 |
str_addchar( &(endin->data[n-1]), ' ' );
|
|
Packit |
89ede9 |
str_strcat( &(endin->data[n-1]), &data );
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
strs_free( &tag, &data, NULL );
|
|
Packit |
89ede9 |
return 1;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
/*****************************************************
|
|
Packit |
89ede9 |
PUBLIC: int endin_typef()
|
|
Packit |
89ede9 |
*****************************************************/
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
/* Endnote defaults if no %0 tag
|
|
Packit |
89ede9 |
*
|
|
Packit |
89ede9 |
* if %J & %V - journal article
|
|
Packit |
89ede9 |
* if %B - book section
|
|
Packit |
89ede9 |
* if %R & !%T - report
|
|
Packit |
89ede9 |
* if %I & !%B & !%J & !%R - book
|
|
Packit |
89ede9 |
* if !%B & !%J & !%R & !%I - journal article
|
|
Packit |
89ede9 |
*/
|
|
Packit |
89ede9 |
int
|
|
Packit |
89ede9 |
endin_typef( fields *endin, char *filename, int nrefs, param *p )
|
|
Packit |
89ede9 |
{
|
|
Packit |
89ede9 |
int ntypename, nrefname, is_default, nj, nv, nb, nr, nt, ni;
|
|
Packit |
89ede9 |
char *refname = "", *typename="";
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
ntypename = fields_find( endin, "%0", LEVEL_MAIN );
|
|
Packit |
89ede9 |
nrefname = fields_find( endin, "%F", LEVEL_MAIN );
|
|
Packit |
89ede9 |
if ( nrefname!=-1 ) refname = fields_value( endin, nrefname, FIELDS_CHRP_NOUSE );
|
|
Packit |
89ede9 |
if ( ntypename!=-1 ) typename = fields_value( endin, ntypename, FIELDS_CHRP_NOUSE );
|
|
Packit |
89ede9 |
else {
|
|
Packit |
89ede9 |
nj = fields_find( endin, "%J", 0 );
|
|
Packit |
89ede9 |
nv = fields_find( endin, "%V", 0 );
|
|
Packit |
89ede9 |
nb = fields_find( endin, "%B", 0 );
|
|
Packit |
89ede9 |
nr = fields_find( endin, "%R", 0 );
|
|
Packit |
89ede9 |
nt = fields_find( endin, "%T", 0 );
|
|
Packit |
89ede9 |
ni = fields_find( endin, "%I", 0 );
|
|
Packit |
89ede9 |
if ( nj!=-1 && nv!=-1 ) {
|
|
Packit |
89ede9 |
typename = "Journal Article";
|
|
Packit |
89ede9 |
} else if ( nb!=-1 ) {
|
|
Packit |
89ede9 |
typename = "Book Section";
|
|
Packit |
89ede9 |
} else if ( nr!=-1 && nt==-1 ) {
|
|
Packit |
89ede9 |
typename = "Report";
|
|
Packit |
89ede9 |
} else if ( ni!=-1 && nb==-1 && nj==-1 && nr==-1 ) {
|
|
Packit |
89ede9 |
typename = "Book";
|
|
Packit |
89ede9 |
} else if ( nb==-1 && nj==-1 && nr==-1 && ni==-1 ) {
|
|
Packit |
89ede9 |
typename = "Journal Article";
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
return get_reftype( typename, nrefs, p->progname, p->all, p->nall, refname, &is_default, REFTYPE_CHATTY );
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
/*****************************************************
|
|
Packit |
89ede9 |
PUBLIC: void endin_cleanf()
|
|
Packit |
89ede9 |
*****************************************************/
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
/* Wiley puts multiple authors separated by commas on the %A lines.
|
|
Packit |
89ede9 |
* We can detect this by finding the terminal comma in the value
|
|
Packit |
89ede9 |
* from the tag/value pair.
|
|
Packit |
89ede9 |
*
|
|
Packit |
89ede9 |
* "%A" "Author A. X. Last, Author N. B. Next,"
|
|
Packit |
89ede9 |
*/
|
|
Packit |
89ede9 |
static int
|
|
Packit |
89ede9 |
is_wiley_author( fields *endin, int n )
|
|
Packit |
89ede9 |
{
|
|
Packit |
89ede9 |
str *t, *v;
|
|
Packit |
89ede9 |
t = fields_tag( endin, n, FIELDS_STRP_NOUSE );
|
|
Packit |
89ede9 |
if ( str_is_empty( t ) || strcmp( str_cstr( t ), "%A" ) ) return 0;
|
|
Packit |
89ede9 |
v = fields_value( endin, n, FIELDS_STRP_NOUSE );
|
|
Packit |
89ede9 |
if ( str_is_empty( v ) ) return 0;
|
|
Packit |
89ede9 |
if ( v->data[v->len-1]!=',' ) return 0;
|
|
Packit |
89ede9 |
return 1;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
static int
|
|
Packit |
89ede9 |
add_wiley_author( fields *endin, char *intag, str *instring, int inlevel, str *name, int authornum )
|
|
Packit |
89ede9 |
{
|
|
Packit |
89ede9 |
int fstatus;
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
/* if first author, just replace the data string in the field */
|
|
Packit |
89ede9 |
if ( authornum==0 ) {
|
|
Packit |
89ede9 |
str_strcpy( instring, name );
|
|
Packit |
89ede9 |
if ( str_memerr( instring ) ) return BIBL_ERR_MEMERR;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
/* otherwise, append the author */
|
|
Packit |
89ede9 |
else {
|
|
Packit |
89ede9 |
fstatus = fields_add( endin, intag, str_cstr( name ), inlevel );
|
|
Packit |
89ede9 |
if ( fstatus!=FIELDS_OK ) return BIBL_ERR_MEMERR;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
return BIBL_OK;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
static int
|
|
Packit |
89ede9 |
cleanup_wiley_author( fields *endin, int n )
|
|
Packit |
89ede9 |
{
|
|
Packit |
89ede9 |
int status=BIBL_OK, inlevel, authornum = 0;
|
|
Packit |
89ede9 |
str *instring, copy, name;
|
|
Packit |
89ede9 |
char *p, *intag;
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
strs_init( ©, &name, NULL );
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
intag = fields_tag ( endin, n, FIELDS_CHRP_NOUSE );
|
|
Packit |
89ede9 |
instring = fields_value( endin, n, FIELDS_STRP_NOUSE );
|
|
Packit |
89ede9 |
inlevel = fields_level( endin, n );
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
str_strcpy( ©, instring );
|
|
Packit |
89ede9 |
p = str_cstr( © );
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
while ( *p ) {
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
if ( *p==',' ) {
|
|
Packit |
89ede9 |
if ( str_memerr( &name ) ) {
|
|
Packit |
89ede9 |
status = BIBL_ERR_MEMERR;
|
|
Packit |
89ede9 |
goto out;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
status = add_wiley_author( endin, intag, instring, inlevel, &name, authornum );
|
|
Packit |
89ede9 |
if ( status!=BIBL_OK ) goto out;
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
str_empty( &name );
|
|
Packit |
89ede9 |
authornum++;
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
p++;
|
|
Packit |
89ede9 |
while ( is_ws( *p ) ) p++;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
else {
|
|
Packit |
89ede9 |
str_addchar( &name, *p );
|
|
Packit |
89ede9 |
p++;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
if ( str_has_value( &name ) )
|
|
Packit |
89ede9 |
status = add_wiley_author( endin, intag, instring, inlevel, &name, authornum );
|
|
Packit |
89ede9 |
out:
|
|
Packit |
89ede9 |
strs_free( ©, &name, NULL );
|
|
Packit |
89ede9 |
return status;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
static int
|
|
Packit |
89ede9 |
endin_cleanref( fields *endin )
|
|
Packit |
89ede9 |
{
|
|
Packit |
89ede9 |
int i, n, status;
|
|
Packit |
89ede9 |
n = fields_num( endin );
|
|
Packit |
89ede9 |
for ( i=0; i
|
|
Packit |
89ede9 |
if ( is_wiley_author( endin, i ) ) {
|
|
Packit |
89ede9 |
status = cleanup_wiley_author( endin, i );
|
|
Packit |
89ede9 |
if ( status!=BIBL_OK ) return status;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
return BIBL_OK;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
int
|
|
Packit |
89ede9 |
endin_cleanf( bibl *bin, param *p )
|
|
Packit |
89ede9 |
{
|
|
Packit |
89ede9 |
long i;
|
|
Packit |
89ede9 |
for ( i=0; i<bin->nrefs; ++i )
|
|
Packit |
89ede9 |
endin_cleanref( bin->ref[i] );
|
|
Packit |
89ede9 |
return BIBL_OK;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
/*****************************************************
|
|
Packit |
89ede9 |
PUBLIC: int endin_convertf(), returns BIBL_OK or BIBL_ERR_MEMERR
|
|
Packit |
89ede9 |
*****************************************************/
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
/* month_convert()
|
|
Packit |
89ede9 |
* convert month name to number in format MM, e.g. "January" -> "01"
|
|
Packit |
89ede9 |
* if converted, return 1
|
|
Packit |
89ede9 |
* otherwise return 0
|
|
Packit |
89ede9 |
*/
|
|
Packit |
89ede9 |
static int
|
|
Packit |
89ede9 |
month_convert( char *in, char *out )
|
|
Packit |
89ede9 |
{
|
|
Packit |
89ede9 |
char *month1[12]={
|
|
Packit |
89ede9 |
"January", "February",
|
|
Packit |
89ede9 |
"March", "April",
|
|
Packit |
89ede9 |
"May", "June",
|
|
Packit |
89ede9 |
"July", "August",
|
|
Packit |
89ede9 |
"September", "October",
|
|
Packit |
89ede9 |
"November", "December"
|
|
Packit |
89ede9 |
};
|
|
Packit |
89ede9 |
char *month2[12]={
|
|
Packit |
89ede9 |
"Jan", "Feb",
|
|
Packit |
89ede9 |
"Mar", "Apr",
|
|
Packit |
89ede9 |
"May", "Jun",
|
|
Packit |
89ede9 |
"Jul", "Aug",
|
|
Packit |
89ede9 |
"Sep", "Oct",
|
|
Packit |
89ede9 |
"Nov", "Dec"
|
|
Packit |
89ede9 |
};
|
|
Packit |
89ede9 |
int i, found = -1;
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
for ( i=0; i<12 && found==-1; ++i ) {
|
|
Packit |
89ede9 |
if ( !strcasecmp( in, month1[i] ) ) found = i;
|
|
Packit |
89ede9 |
if ( !strcasecmp( in, month2[i] ) ) found = i;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
if ( found==-1 ) return 0;
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
if ( found > 8 )
|
|
Packit |
89ede9 |
sprintf( out, "%d", found+1 );
|
|
Packit |
89ede9 |
else
|
|
Packit |
89ede9 |
sprintf( out, "0%d", found+1 );
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
return 1;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
static int
|
|
Packit |
89ede9 |
endin_date( fields *bibin, int n, str *intag, str *invalue, int level, param *pm, char *outtag, fields *bibout )
|
|
Packit |
89ede9 |
{
|
|
Packit |
89ede9 |
char *tags[3][2] = {
|
|
Packit |
89ede9 |
{ "DATE:YEAR", "PARTDATE:YEAR" },
|
|
Packit |
89ede9 |
{ "DATE:MONTH", "PARTDATE:MONTH" },
|
|
Packit |
89ede9 |
{ "DATE:DAY", "PARTDATE:DAY" }
|
|
Packit |
89ede9 |
};
|
|
Packit |
89ede9 |
char *p = invalue->data;
|
|
Packit |
89ede9 |
char month[10], *m;
|
|
Packit |
89ede9 |
int part, status;
|
|
Packit |
89ede9 |
str date;
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
str_init( &date );
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
if ( !strncasecmp( outtag, "PART", 4 ) ) part = 1;
|
|
Packit |
89ede9 |
else part = 0;
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
/* %D YEAR */
|
|
Packit |
89ede9 |
if ( !strcasecmp( intag->data, "%D" ) ) {
|
|
Packit |
89ede9 |
str_cpytodelim( &date, skip_ws( p ), "", 0 );
|
|
Packit |
89ede9 |
if ( str_memerr( &date ) ) return BIBL_ERR_MEMERR;
|
|
Packit |
89ede9 |
if ( str_has_value( &date ) ) {
|
|
Packit |
89ede9 |
status = fields_add( bibout, tags[0][part], date.data, level );
|
|
Packit |
89ede9 |
if ( status!=FIELDS_OK ) return BIBL_ERR_MEMERR;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
/* %8 MONTH DAY, YEAR */
|
|
Packit |
89ede9 |
/* %8 MONTH, YEAR */
|
|
Packit |
89ede9 |
/* %8 MONTH YEAR */
|
|
Packit |
89ede9 |
else if ( !strcasecmp( intag->data, "%8" ) ) {
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
/* ...get month */
|
|
Packit |
89ede9 |
p = str_cpytodelim( &date, skip_ws( p ), " ,\n", 0 );
|
|
Packit |
89ede9 |
if ( str_memerr( &date ) ) return BIBL_ERR_MEMERR;
|
|
Packit |
89ede9 |
if ( str_has_value( &date ) ) {
|
|
Packit |
89ede9 |
if ( month_convert( date.data, month ) ) m = month;
|
|
Packit |
89ede9 |
else m = str_cstr( &date );
|
|
Packit |
89ede9 |
status = fields_add( bibout, tags[1][part], m, level );
|
|
Packit |
89ede9 |
if ( status!=FIELDS_OK ) return BIBL_ERR_MEMERR;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
p = skip_ws( p );
|
|
Packit |
89ede9 |
if ( *p==',' ) p++;
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
/* ...get days */
|
|
Packit |
89ede9 |
p = str_cpytodelim( &date, skip_ws( p ), ",\n", 0 );
|
|
Packit |
89ede9 |
if ( str_memerr( &date ) ) return BIBL_ERR_MEMERR;
|
|
Packit |
89ede9 |
if ( date.len>0 && date.len<3 ) {
|
|
Packit |
89ede9 |
status = fields_add( bibout, tags[2][part], date.data, level );
|
|
Packit |
89ede9 |
if ( status!=FIELDS_OK ) return BIBL_ERR_MEMERR;
|
|
Packit |
89ede9 |
} else if ( date.len==4 ) {
|
|
Packit |
89ede9 |
status = fields_add( bibout, tags[0][part], date.data, level );
|
|
Packit |
89ede9 |
if ( status!=FIELDS_OK ) return BIBL_ERR_MEMERR;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
p = skip_ws( p );
|
|
Packit |
89ede9 |
if ( *p==',' ) p++;
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
/* ...get year */
|
|
Packit |
89ede9 |
(void) str_cpytodelim( &date, skip_ws( p ), " \t\n\r", 0 );
|
|
Packit |
89ede9 |
if ( str_memerr( &date ) ) return BIBL_ERR_MEMERR;
|
|
Packit |
89ede9 |
if ( str_has_value( &date ) ) {
|
|
Packit |
89ede9 |
status = fields_add( bibout, tags[0][part], date.data, level );
|
|
Packit |
89ede9 |
if ( status!=FIELDS_OK ) return BIBL_ERR_MEMERR;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
str_free( &date );
|
|
Packit |
89ede9 |
return BIBL_OK;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
static int
|
|
Packit |
89ede9 |
endin_type( fields *bibin, int n, str *intag, str *invalue, int level, param *pm, char *outtag, fields *bibout )
|
|
Packit |
89ede9 |
{
|
|
Packit |
89ede9 |
lookups types[] = {
|
|
Packit |
89ede9 |
{ "GENERIC", "ARTICLE" },
|
|
Packit |
89ede9 |
{ "BOOK", "BOOK" },
|
|
Packit |
89ede9 |
{ "MANUSCRIPT", "MANUSCRIPT" },
|
|
Packit |
89ede9 |
{ "CONFERENCE PROCEEDINGS", "INPROCEEDINGS"},
|
|
Packit |
89ede9 |
{ "REPORT", "REPORT" },
|
|
Packit |
89ede9 |
{ "COMPUTER PROGRAM", "BOOK" },
|
|
Packit |
89ede9 |
{ "AUDIOVISUAL MATERIAL", "AUDIOVISUAL" },
|
|
Packit |
89ede9 |
{ "ARTWORK", "BOOK" },
|
|
Packit |
89ede9 |
{ "PATENT", "BOOK" },
|
|
Packit |
89ede9 |
{ "BILL", "BILL" },
|
|
Packit |
89ede9 |
{ "CASE", "CASE" },
|
|
Packit |
89ede9 |
{ "JOURNAL ARTICLE", "ARTICLE" },
|
|
Packit |
89ede9 |
{ "MAGAZINE ARTICLE", "ARTICLE" },
|
|
Packit |
89ede9 |
{ "BOOK SECTION", "INBOOK" },
|
|
Packit |
89ede9 |
{ "EDITED BOOK", "BOOK" },
|
|
Packit |
89ede9 |
{ "NEWSPAPER ARTICLE", "NEWSARTICLE" },
|
|
Packit |
89ede9 |
{ "THESIS", "PHDTHESIS" },
|
|
Packit |
89ede9 |
{ "PERSONAL COMMUNICATION", "COMMUNICATION" },
|
|
Packit |
89ede9 |
{ "ELECTRONIC SOURCE", "TEXT" },
|
|
Packit |
89ede9 |
{ "FILM OR BROADCAST", "AUDIOVISUAL" },
|
|
Packit |
89ede9 |
{ "MAP", "MAP" },
|
|
Packit |
89ede9 |
{ "HEARING", "HEARING" },
|
|
Packit |
89ede9 |
{ "STATUTE", "STATUTE" },
|
|
Packit |
89ede9 |
{ "CHART OR TABLE", "CHART" },
|
|
Packit |
89ede9 |
{ "WEB PAGE", "WEBPAGE" },
|
|
Packit |
89ede9 |
};
|
|
Packit |
89ede9 |
int ntypes = sizeof( types ) / sizeof( lookups );
|
|
Packit |
89ede9 |
int i, status, found=0;
|
|
Packit |
89ede9 |
for ( i=0; i
|
|
Packit |
89ede9 |
if ( !strcasecmp( types[i].oldstr, invalue->data ) ) {
|
|
Packit |
89ede9 |
found = 1;
|
|
Packit |
89ede9 |
status = fields_add( bibout, "INTERNAL_TYPE", types[i].newstr, level );
|
|
Packit |
89ede9 |
if ( status!=FIELDS_OK ) return BIBL_ERR_MEMERR;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
if ( !found ) {
|
|
Packit |
89ede9 |
fprintf( stderr, "Did not identify reference type '%s'\n", invalue->data );
|
|
Packit |
89ede9 |
fprintf( stderr, "Defaulting to journal article type\n");
|
|
Packit |
89ede9 |
status = fields_add( bibout, "INTERNAL_TYPE", types[0].newstr, level );
|
|
Packit |
89ede9 |
if ( status!=FIELDS_OK ) return BIBL_ERR_MEMERR;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
return BIBL_OK;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
static void
|
|
Packit |
89ede9 |
endin_notag( param *p, char *tag, char *data )
|
|
Packit |
89ede9 |
{
|
|
Packit |
89ede9 |
if ( p->verbose ) {
|
|
Packit |
89ede9 |
if ( p->progname ) fprintf( stderr, "%s: ", p->progname );
|
|
Packit |
89ede9 |
fprintf( stderr, "Cannot find tag '%s'='%s'\n", tag, data );
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
int
|
|
Packit |
89ede9 |
endin_convertf( fields *bibin, fields *bibout, int reftype, param *p )
|
|
Packit |
89ede9 |
{
|
|
Packit |
89ede9 |
static int (*convertfns[NUM_REFTYPES])(fields *, int, str *, str *, int, param *, char *, fields *) = {
|
|
Packit |
89ede9 |
[ 0 ... NUM_REFTYPES-1 ] = generic_null,
|
|
Packit |
89ede9 |
[ SIMPLE ] = generic_simple,
|
|
Packit |
89ede9 |
[ TITLE ] = generic_title,
|
|
Packit |
89ede9 |
[ PERSON ] = generic_person,
|
|
Packit |
89ede9 |
[ SERIALNO ] = generic_serialno,
|
|
Packit |
89ede9 |
[ PAGES ] = generic_pages,
|
|
Packit |
89ede9 |
[ NOTES ] = generic_notes,
|
|
Packit |
89ede9 |
[ URL ] = generic_url,
|
|
Packit |
89ede9 |
[ GENRE ] = generic_genre,
|
|
Packit |
89ede9 |
[ TYPE ] = endin_type,
|
|
Packit |
89ede9 |
[ DATE ] = endin_date,
|
|
Packit |
89ede9 |
};
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
int i, level, process, nfields, fstatus, status = BIBL_OK;
|
|
Packit |
89ede9 |
char *outtag;
|
|
Packit |
89ede9 |
str *intag, *invalue;
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
nfields = fields_num( bibin );
|
|
Packit |
89ede9 |
for ( i=0; i
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
/* Ensure we have data */
|
|
Packit |
89ede9 |
if ( fields_nodata( bibin, i ) ) {
|
|
Packit |
89ede9 |
fields_setused( bibin, i );
|
|
Packit |
89ede9 |
continue;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
intag = fields_tag( bibin, i, FIELDS_STRP );
|
|
Packit |
89ede9 |
invalue = fields_value( bibin, i, FIELDS_STRP );
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
/*
|
|
Packit |
89ede9 |
* Refer format tags start with '%'. If we have one
|
|
Packit |
89ede9 |
* that doesn't, assume that it comes from endx2xml
|
|
Packit |
89ede9 |
* and just copy and paste to output
|
|
Packit |
89ede9 |
*/
|
|
Packit |
89ede9 |
if ( str_has_value( intag ) && intag->data[0]!='%' ) {
|
|
Packit |
89ede9 |
fstatus = fields_add( bibout, str_cstr( intag ), str_cstr( invalue ), bibin->level[i] );
|
|
Packit |
89ede9 |
if ( fstatus!=FIELDS_OK ) return BIBL_ERR_MEMERR;
|
|
Packit |
89ede9 |
continue;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
if ( !translate_oldtag( str_cstr( intag ), reftype, p->all, p->nall, &process, &level, &outtag ) ) {
|
|
Packit |
89ede9 |
endin_notag( p, str_cstr( intag ), str_cstr( invalue ) );
|
|
Packit |
89ede9 |
continue;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
fields_setused( bibin, i );
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
status = convertfns[ process ]( bibin, i, intag, invalue, level, p, outtag, bibout );
|
|
Packit |
89ede9 |
if ( status!=BIBL_OK ) return status;
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
return status;
|
|
Packit |
89ede9 |
}
|