|
Packit |
89ede9 |
/*
|
|
Packit |
89ede9 |
* copacin.c
|
|
Packit |
89ede9 |
*
|
|
Packit |
89ede9 |
* Copyright (c) Chris Putnam 2004-2018
|
|
Packit |
89ede9 |
*
|
|
Packit |
89ede9 |
* Program and source code released under the GPL version 2
|
|
Packit |
89ede9 |
*
|
|
Packit |
89ede9 |
*/
|
|
Packit |
89ede9 |
#include <stdio.h>
|
|
Packit |
89ede9 |
#include <stdlib.h>
|
|
Packit |
89ede9 |
#include <string.h>
|
|
Packit |
89ede9 |
#include "is_ws.h"
|
|
Packit |
89ede9 |
#include "str.h"
|
|
Packit |
89ede9 |
#include "str_conv.h"
|
|
Packit |
89ede9 |
#include "slist.h"
|
|
Packit |
89ede9 |
#include "name.h"
|
|
Packit |
89ede9 |
#include "fields.h"
|
|
Packit |
89ede9 |
#include "reftypes.h"
|
|
Packit |
89ede9 |
#include "bibformats.h"
|
|
Packit |
89ede9 |
#include "generic.h"
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
extern variants copac_all[];
|
|
Packit |
89ede9 |
extern int copac_nall;
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
/*****************************************************
|
|
Packit |
89ede9 |
PUBLIC: void copacin_initparams()
|
|
Packit |
89ede9 |
*****************************************************/
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
static int copacin_readf( FILE *fp, char *buf, int bufsize, int *bufpos, str *line, str *reference, int *fcharset );
|
|
Packit |
89ede9 |
static int copacin_processf( fields *bibin, char *p, char *filename, long nref, param *pm );
|
|
Packit |
89ede9 |
static int copacin_convertf( fields *bibin, fields *info, int reftype, param *pm );
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
void
|
|
Packit |
89ede9 |
copacin_initparams( param *p, const char *progname )
|
|
Packit |
89ede9 |
{
|
|
Packit |
89ede9 |
p->readformat = BIBL_COPACIN;
|
|
Packit |
89ede9 |
p->charsetin = BIBL_CHARSET_DEFAULT;
|
|
Packit |
89ede9 |
p->charsetin_src = BIBL_SRC_DEFAULT;
|
|
Packit |
89ede9 |
p->latexin = 0;
|
|
Packit |
89ede9 |
p->xmlin = 0;
|
|
Packit |
89ede9 |
p->utf8in = 0;
|
|
Packit |
89ede9 |
p->nosplittitle = 0;
|
|
Packit |
89ede9 |
p->verbose = 0;
|
|
Packit |
89ede9 |
p->addcount = 0;
|
|
Packit |
89ede9 |
p->output_raw = 0;
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
p->readf = copacin_readf;
|
|
Packit |
89ede9 |
p->processf = copacin_processf;
|
|
Packit |
89ede9 |
p->cleanf = NULL;
|
|
Packit |
89ede9 |
p->typef = NULL;
|
|
Packit |
89ede9 |
p->convertf = copacin_convertf;
|
|
Packit |
89ede9 |
p->all = copac_all;
|
|
Packit |
89ede9 |
p->nall = copac_nall;
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
slist_init( &(p->asis) );
|
|
Packit |
89ede9 |
slist_init( &(p->corps) );
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
if ( !progname ) p->progname = NULL;
|
|
Packit |
89ede9 |
else p->progname = strdup( progname );
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
/*****************************************************
|
|
Packit |
89ede9 |
PUBLIC: int copacin_readf()
|
|
Packit |
89ede9 |
*****************************************************/
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
/* Endnote-Refer/Copac tag definition:
|
|
Packit |
89ede9 |
character 1 = alphabetic character
|
|
Packit |
89ede9 |
character 2 = alphabetic character
|
|
Packit |
89ede9 |
character 3 = dash
|
|
Packit |
89ede9 |
character 4 = space
|
|
Packit |
89ede9 |
*/
|
|
Packit |
89ede9 |
static int
|
|
Packit |
89ede9 |
copacin_istag( char *buf )
|
|
Packit |
89ede9 |
{
|
|
Packit |
89ede9 |
if (! ((buf[0]>='A' && buf[0]<='Z')) || (buf[0]>='a' && buf[0]<='z') )
|
|
Packit |
89ede9 |
return 0;
|
|
Packit |
89ede9 |
if (! ((buf[1]>='A' && buf[1]<='Z')) || (buf[1]>='a' && buf[1]<='z') )
|
|
Packit |
89ede9 |
return 0;
|
|
Packit |
89ede9 |
if (buf[2]!='-' ) return 0;
|
|
Packit |
89ede9 |
if (buf[3]!=' ' ) return 0;
|
|
Packit |
89ede9 |
return 1;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
static int
|
|
Packit |
89ede9 |
readmore( FILE *fp, char *buf, int bufsize, int *bufpos, str *line )
|
|
Packit |
89ede9 |
{
|
|
Packit |
89ede9 |
if ( line->len ) return 1;
|
|
Packit |
89ede9 |
else return str_fget( fp, buf, bufsize, bufpos, line );
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
static int
|
|
Packit |
89ede9 |
copacin_readf( FILE *fp, char *buf, int bufsize, int *bufpos, str *line, str *reference, int *fcharset )
|
|
Packit |
89ede9 |
{
|
|
Packit |
89ede9 |
int haveref = 0, inref=0;
|
|
Packit |
89ede9 |
char *p;
|
|
Packit |
89ede9 |
*fcharset = CHARSET_UNKNOWN;
|
|
Packit |
89ede9 |
while ( !haveref && readmore( fp, buf, bufsize, bufpos, line ) ) {
|
|
Packit |
89ede9 |
/* blank line separates */
|
|
Packit |
89ede9 |
if ( line->data==NULL ) continue;
|
|
Packit |
89ede9 |
if ( inref && line->len==0 ) haveref=1;
|
|
Packit |
89ede9 |
p = &(line->data[0]);
|
|
Packit |
89ede9 |
/* Recognize UTF8 BOM */
|
|
Packit |
89ede9 |
if ( line->len > 2 &&
|
|
Packit |
89ede9 |
(unsigned char)(p[0])==0xEF &&
|
|
Packit |
89ede9 |
(unsigned char)(p[1])==0xBB &&
|
|
Packit |
89ede9 |
(unsigned char)(p[2])==0xBF ) {
|
|
Packit |
89ede9 |
*fcharset = CHARSET_UNICODE;
|
|
Packit |
89ede9 |
p += 3;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
if ( copacin_istag( p ) ) {
|
|
Packit |
89ede9 |
if ( inref ) str_addchar( reference, '\n' );
|
|
Packit |
89ede9 |
str_strcatc( reference, p );
|
|
Packit |
89ede9 |
str_empty( line );
|
|
Packit |
89ede9 |
inref = 1;
|
|
Packit |
89ede9 |
} else if ( inref ) {
|
|
Packit |
89ede9 |
if ( p ) {
|
|
Packit |
89ede9 |
/* copac puts tag only on 1st line */
|
|
Packit |
89ede9 |
str_addchar( reference, ' ' );
|
|
Packit |
89ede9 |
if ( *p ) p++;
|
|
Packit |
89ede9 |
if ( *p ) p++;
|
|
Packit |
89ede9 |
if ( *p ) p++;
|
|
Packit |
89ede9 |
str_strcatc( reference, p );
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
str_empty( line );
|
|
Packit |
89ede9 |
} else {
|
|
Packit |
89ede9 |
str_empty( line );
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
return haveref;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
/*****************************************************
|
|
Packit |
89ede9 |
PUBLIC: int copacin_processf()
|
|
Packit |
89ede9 |
*****************************************************/
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
static char*
|
|
Packit |
89ede9 |
copacin_addtag2( char *p, str *tag, str *data )
|
|
Packit |
89ede9 |
{
|
|
Packit |
89ede9 |
int i;
|
|
Packit |
89ede9 |
i =0;
|
|
Packit |
89ede9 |
while ( i<3 && *p ) {
|
|
Packit |
89ede9 |
str_addchar( tag, *p++ );
|
|
Packit |
89ede9 |
i++;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
while ( *p==' ' || *p=='\t' ) p++;
|
|
Packit |
89ede9 |
while ( *p && *p!='\r' && *p!='\n' ) {
|
|
Packit |
89ede9 |
str_addchar( data, *p );
|
|
Packit |
89ede9 |
p++;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
str_trimendingws( data );
|
|
Packit |
89ede9 |
while ( *p=='\n' || *p=='\r' ) p++;
|
|
Packit |
89ede9 |
return p;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
static char *
|
|
Packit |
89ede9 |
copacin_nextline( char *p )
|
|
Packit |
89ede9 |
{
|
|
Packit |
89ede9 |
while ( *p && *p!='\n' && *p!='\r') p++;
|
|
Packit |
89ede9 |
while ( *p=='\n' || *p=='\r' ) p++;
|
|
Packit |
89ede9 |
return p;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
static int
|
|
Packit |
89ede9 |
copacin_processf( fields *copacin, char *p, char *filename, long nref, param *pm )
|
|
Packit |
89ede9 |
{
|
|
Packit |
89ede9 |
str tag, data;
|
|
Packit |
89ede9 |
int status;
|
|
Packit |
89ede9 |
str_init( &tag );
|
|
Packit |
89ede9 |
str_init( &data );
|
|
Packit |
89ede9 |
while ( *p ) {
|
|
Packit |
89ede9 |
p = skip_ws( p );
|
|
Packit |
89ede9 |
if ( copacin_istag( p ) ) {
|
|
Packit |
89ede9 |
p = copacin_addtag2( p, &tag, &data );
|
|
Packit |
89ede9 |
/* don't add empty strings */
|
|
Packit |
89ede9 |
if ( str_has_value( &tag ) && str_has_value( &data ) ) {
|
|
Packit |
89ede9 |
status = fields_add( copacin, tag.data, data.data, 0 );
|
|
Packit |
89ede9 |
if ( status!=FIELDS_OK ) return 0;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
str_empty( &tag );
|
|
Packit |
89ede9 |
str_empty( &data );
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
else p = copacin_nextline( p );
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
str_free( &tag );
|
|
Packit |
89ede9 |
str_free( &data );
|
|
Packit |
89ede9 |
return 1;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
/*****************************************************
|
|
Packit |
89ede9 |
PUBLIC: int copacin_convertf(), returns BIBL_OK or BIBL_ERR_MEMERR
|
|
Packit |
89ede9 |
*****************************************************/
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
/* copac names appear to always start with last name first, but don't
|
|
Packit |
89ede9 |
* always seem to have a comma after the name
|
|
Packit |
89ede9 |
*
|
|
Packit |
89ede9 |
* editors seem to be stuck in as authors with the tag "[Editor]" in it
|
|
Packit |
89ede9 |
*/
|
|
Packit |
89ede9 |
static int
|
|
Packit |
89ede9 |
copacin_person( fields *bibin, int n, str *intag, str *invalue, int level, param *pm, char *outtag, fields *bibout )
|
|
Packit |
89ede9 |
{
|
|
Packit |
89ede9 |
char *usetag = outtag, editor[]="EDITOR";
|
|
Packit |
89ede9 |
int comma = 0, i, ok, status;
|
|
Packit |
89ede9 |
str usename, *s;
|
|
Packit |
89ede9 |
slist tokens;
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
if ( slist_find( &(pm->asis), invalue ) !=-1 ||
|
|
Packit |
89ede9 |
slist_find( &(pm->corps), invalue ) !=-1 ) {
|
|
Packit |
89ede9 |
ok = name_add( bibout, outtag, invalue->data, level, &(pm->asis), &(pm->corps) );
|
|
Packit |
89ede9 |
if ( ok ) return BIBL_OK;
|
|
Packit |
89ede9 |
else return BIBL_ERR_MEMERR;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
slist_init( &tokens );
|
|
Packit |
89ede9 |
str_init( &usename );
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
status = slist_tokenize( &tokens, invalue, " ", 1 );
|
|
Packit |
89ede9 |
if ( status!=SLIST_OK ) return BIBL_ERR_MEMERR;
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
for ( i=0; i
|
|
Packit |
89ede9 |
s = slist_str( &tokens, i );
|
|
Packit |
89ede9 |
if ( !strcmp( str_cstr( s ), "[Editor]" ) ) {
|
|
Packit |
89ede9 |
usetag = editor;
|
|
Packit |
89ede9 |
str_empty( s );
|
|
Packit |
89ede9 |
} else if ( s->len && s->data[s->len-1]==',' ) {
|
|
Packit |
89ede9 |
comma++;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
if ( comma==0 && tokens.n ) {
|
|
Packit |
89ede9 |
s = slist_str( &tokens, 0 );
|
|
Packit |
89ede9 |
str_addchar( s, ',' );
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
for ( i=0; i
|
|
Packit |
89ede9 |
s = slist_str( &tokens, i );
|
|
Packit |
89ede9 |
if ( str_is_empty( s ) ) continue;
|
|
Packit |
89ede9 |
if ( i ) str_addchar( &usename, ' ' );
|
|
Packit |
89ede9 |
str_strcat( &usename, s );
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
slist_free( &tokens );
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
ok = name_add( bibout, usetag, str_cstr( &usename ), level, &(pm->asis), &(pm->corps) );
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
str_free( &usename );
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
if ( ok ) return BIBL_OK;
|
|
Packit |
89ede9 |
else return BIBL_ERR_MEMERR;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
static void
|
|
Packit |
89ede9 |
copacin_report_notag( param *p, char *tag )
|
|
Packit |
89ede9 |
{
|
|
Packit |
89ede9 |
if ( p->verbose ) {
|
|
Packit |
89ede9 |
if ( p->progname ) fprintf( stderr, "%s: ", p->progname );
|
|
Packit |
89ede9 |
fprintf( stderr, "Cannot find tag '%s'\n", tag );
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
static int
|
|
Packit |
89ede9 |
copacin_convertf( fields *bibin, fields *bibout, int reftype, param *p )
|
|
Packit |
89ede9 |
{
|
|
Packit |
89ede9 |
static int (*convertfns[NUM_REFTYPES])(fields *, int, str *, str *, int, param *, char *, fields *) = {
|
|
Packit |
89ede9 |
[ 0 ... NUM_REFTYPES-1 ] = generic_null,
|
|
Packit |
89ede9 |
[ SIMPLE ] = generic_simple,
|
|
Packit |
89ede9 |
[ TITLE ] = generic_title,
|
|
Packit |
89ede9 |
[ NOTES ] = generic_notes,
|
|
Packit |
89ede9 |
[ SERIALNO ] = generic_serialno,
|
|
Packit |
89ede9 |
[ PERSON ] = copacin_person
|
|
Packit |
89ede9 |
};
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
int process, level, i, nfields, status = BIBL_OK;
|
|
Packit |
89ede9 |
str *intag, *invalue;
|
|
Packit |
89ede9 |
char *outtag;
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
nfields = fields_num( bibin );
|
|
Packit |
89ede9 |
for ( i=0; i
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
intag = fields_tag( bibin, i, FIELDS_STRP );
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
if ( !translate_oldtag( intag->data, reftype, p->all, p->nall, &process, &level, &outtag ) ) {
|
|
Packit |
89ede9 |
copacin_report_notag( p, intag->data );
|
|
Packit |
89ede9 |
continue;
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
invalue = fields_value( bibin, i, FIELDS_STRP );
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
status = convertfns[ process ] ( bibin, i, intag, invalue, level, p, outtag, bibout );
|
|
Packit |
89ede9 |
if ( status!=BIBL_OK ) return status;
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
}
|
|
Packit |
89ede9 |
|
|
Packit |
89ede9 |
return status;
|
|
Packit |
89ede9 |
}
|