Page Menu
Home
c4science
Search
Configure Global Search
Log In
Files
F91090211
refextract_config.py
No One
Temporary
Actions
Download File
Edit File
Delete File
View Transforms
Subscribe
Mute Notifications
Award Token
Subscribers
None
File Metadata
Details
File Info
Storage
Attached
Created
Thu, Nov 7, 19:21
Size
3 KB
Mime Type
text/x-python
Expires
Sat, Nov 9, 19:21 (1 d, 21 h)
Engine
blob
Format
Raw Data
Handle
22194622
Attached To
R3600 invenio-infoscience
refextract_config.py
View Options
# -*- coding: utf-8 -*-
##
## This file is part of CDS Invenio.
## Copyright (C) 2002, 2003, 2004, 2005, 2006, 2007, 2008 CERN.
##
## CDS Invenio is free software; you can redistribute it and/or
## modify it under the terms of the GNU General Public License as
## published by the Free Software Foundation; either version 2 of the
## License, or (at your option) any later version.
##
## CDS Invenio is distributed in the hope that it will be useful, but
## WITHOUT ANY WARRANTY; without even the implied warranty of
## MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
## General Public License for more details.
##
## You should have received a copy of the GNU General Public License
## along with CDS Invenio; if not, write to the Free Software Foundation, Inc.,
## 59 Temple Place, Suite 330, Boston, MA 02111-1307, USA.
"""RefExtract configuration."""
## Revision placeholder string ("$Id$" keyword form).
__revision__ = "$Id$"

## Site-wide settings pulled from the main Invenio configuration.
## CFG_SITE_NAME is not referenced by the settings visible in this module;
## the import is kept so the module's namespace stays unchanged.
from invenio.config import CFG_VERSION, CFG_ETCDIR, CFG_SITE_NAME

# pylint: disable-msg=C0301
# version number:
# CFG_VERSION is interpolated into both the "CDS Invenio/" and the
# "refextract/" component of the version string.
# NOTE(review): the single space between the two components is assumed;
# confirm against the upstream Invenio source.
CFG_REFEXTRACT_VERSION = "CDS Invenio/%s refextract/%s" % (CFG_VERSION, CFG_VERSION)

# periodicals knowledge base (path built under CFG_ETCDIR):
CFG_REFEXTRACT_KB_JOURNAL_TITLES = "%s/bibedit/refextract-journal-titles.kb" % CFG_ETCDIR

# report numbers knowledge base (path built under CFG_ETCDIR):
CFG_REFEXTRACT_KB_REPORT_NUMBERS = "%s/bibedit/refextract-report-numbers.kb" % CFG_ETCDIR
## MARC Fields and subfields used by refextract:

## reference fields:
CFG_REFEXTRACT_CTRL_FIELD_RECID = "001"        ## control-field recid
CFG_REFEXTRACT_TAG_ID_REFERENCE = "999"        ## ref field tag
CFG_REFEXTRACT_IND1_REFERENCE = "C"            ## ref field ind1
CFG_REFEXTRACT_IND2_REFERENCE = "5"            ## ref field ind2
CFG_REFEXTRACT_SUBFIELD_MARKER = "o"           ## ref marker subfield
CFG_REFEXTRACT_SUBFIELD_MISC = "m"             ## ref misc subfield
CFG_REFEXTRACT_SUBFIELD_REPORT_NUM = "r"       ## ref reportnum subfield
CFG_REFEXTRACT_SUBFIELD_TITLE = "s"            ## ref title subfield
CFG_REFEXTRACT_SUBFIELD_URL = "u"              ## ref url subfield
CFG_REFEXTRACT_SUBFIELD_URL_DESCR = "z"        ## ref url-text subfield
## refextract statistics fields:
## (same tag and ind1 values as the reference field, but ind2 is "6")
CFG_REFEXTRACT_TAG_ID_EXTRACTION_STATS = "999"     ## ref-stats tag
CFG_REFEXTRACT_IND1_EXTRACTION_STATS = "C"         ## ref-stats ind1
CFG_REFEXTRACT_IND2_EXTRACTION_STATS = "6"         ## ref-stats ind2
CFG_REFEXTRACT_SUBFIELD_EXTRACTION_STATS = "a"     ## ref-stats subfield
## Internal tags are used by refextract to mark-up recognised citation
## information. These are the "closing" tags:
CFG_REFEXTRACT_MARKER_CLOSING_REPORT_NUM = r"</cds.REPORTNUMBER>"
CFG_REFEXTRACT_MARKER_CLOSING_TITLE = r"</cds.TITLE>"
CFG_REFEXTRACT_MARKER_CLOSING_SERIES = r"</cds.SER>"
CFG_REFEXTRACT_MARKER_CLOSING_VOLUME = r"</cds.VOL>"
CFG_REFEXTRACT_MARKER_CLOSING_YEAR = r"</cds.YR>"
CFG_REFEXTRACT_MARKER_CLOSING_PAGE = r"</cds.PG>"
## XML Record and collection opening/closing tags:
CFG_REFEXTRACT_XML_VERSION = u"""<?xml version="1.0" encoding="UTF-8"?>"""
CFG_REFEXTRACT_XML_COLLECTION_OPEN = u"""<collection xmlns="http://www.loc.gov/MARC21/slim">"""
## The collection closing tag carries a trailing newline (the "\n" escape
## inside the literal); the other tags in this group do not.
CFG_REFEXTRACT_XML_COLLECTION_CLOSE = u"""</collection>\n"""
CFG_REFEXTRACT_XML_RECORD_OPEN = u"<record>"
CFG_REFEXTRACT_XML_RECORD_CLOSE = u"</record>"
Event Timeline
Log In to Comment