Page Menu
Home
c4science
Search
Configure Global Search
Log In
Files
F69849207
bibindex_engine_stopwords.py
No One
Temporary
Actions
Download File
Edit File
Delete File
View Transforms
Subscribe
Mute Notifications
Award Token
Subscribers
None
File Metadata
Details
File Info
Storage
Attached
Created
Wed, Jul 3, 20:40
Size
1 KB
Mime Type
text/x-c
Expires
Fri, Jul 5, 20:40 (2 d)
Engine
blob
Format
Raw Data
Handle
18762344
Attached To
R3600 invenio-infoscience
bibindex_engine_stopwords.py
View Options
# $Id$
## Bibindex stopword class
## This file is part of the CERN Document Server Software (CDSware).
## Copyright (C) 2002 CERN.
##
## The CDSware is free software; you can redistribute it and/or
## modify it under the terms of the GNU General Public License as
## published by the Free Software Foundation; either version 2 of the
## License, or (at your option) any later version.
##
## The CDSware is distributed in the hope that it will be useful, but
## WITHOUT ANY WARRANTY; without even the implied warranty of
## MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
## General Public License for more details.
##
## You should have received a copy of the GNU General Public License
## along with CDSware; if not, write to the Free Software Foundation, Inc.,
## 59 Temple Place, Suite 330, Boston, MA 02111-1307, USA.
## read config variables:
#include "config.wml"
#include "configbis.wml"
#include "cdswmllib.wml"
try
:
import
sre
import
string
import
os
import
sys
except
ImportError
,
e
:
import
sys
from
bibindex_engine_config
import
*
stopwords
=
{}
def
get_stopwords
(
file
=
cfg_path_stopwordlist
):
"""Get stopword list"""
try
:
file
=
open
(
file
,
'r'
)
except
:
return
{}
lines
=
file
.
readlines
()
file
.
close
()
stopdict
=
{}
for
line
in
lines
:
stopdict
[
string
.
rstrip
(
line
)]
=
1
return
stopdict
def
is_stopword
(
word
):
"""returns False if not stopword, True if stopword"""
#inputword must be lowercase
if
cfg_path_stopwordlist
and
stopwords
.
has_key
(
word
):
return
True
return
False
def
is_stopword_force
(
word
):
"""returns False if not stopword, True if stopword"""
#inputword must be lowercase
if
stopwords
.
has_key
(
word
):
return
True
return
False
stopwords
=
get_stopwords
()
Event Timeline
Log In to Comment