## This file is part of CDS Invenio.
## Copyright (C) 2002, 2003, 2004, 2005, 2006, 2007 CERN.
##
## CDS Invenio is free software; you can redistribute it and/or
## modify it under the terms of the GNU General Public License as
## published by the Free Software Foundation; either version 2 of the
## License, or (at your option) any later version.
##
## CDS Invenio is distributed in the hope that it will be useful, but
## WITHOUT ANY WARRANTY; without even the implied warranty of
## MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
## General Public License for more details.
##
## You should have received a copy of the GNU General Public License
## along with CDS Invenio; if not, write to the Free Software Foundation, Inc.,
## 59 Temple Place, Suite 330, Boston, MA 02111-1307, USA.

#name of the ranking function; a section with the same name follows below
[rank_method]
function = word_similarity

[word_similarity]
#stemming setting; use None for no stemming
stemming = en
table = rnkWORD01F
#the stopword list is taken from /bibindex/bibindex_engine_config
stopword = True
#NOTE(review): presumably the text emitted before and after a relevance
#number in the output -- confirm against the code that reads these keys
relevance_number_output_prologue = (
relevance_number_output_epilogue = )
#format of every tagN entry below: MARC tag, tag points, tag language
#keyword
tag1 = 6531_a, 1, en
#keyword
tag2 = 695__a, 1, en
#keyword
tag3 = 6532_a, 1, en
#title
tag4 = 245__%, 10, en
#title
#NOTE(review): this tag has a single underscore before the % while the other
#tags have two positions there (e.g. 245__%) -- confirm this is intentional
tag5 = 246_%, 1, fr
#title
tag6 = 250__a, 1, en
#title
tag7 = 711__a, 1, en
#abbreviated title
tag8 = 210__a, 1, en
#key title
tag9 = 222__a, 1, en
#abstract
tag10 = 520__%, 1, en
#abstract
tag11 = 590__%, 1, fr
#conference
tag12 = 111__a, 1, en
#author
tag13 = 100__%, 1, fr
#author
tag14 = 700__%, 1, fr
#author
tag15 = 721__a, 1, none

#settings used for "find similar"
[find_similar]
#a term should exist in at most X/100% of documents
max_word_occurence = 0.05
#a term should exist in at least X/100% of documents
min_word_occurence = 0.00
#a term should be at least 3 characters long
min_word_length = 3
#a term should be in at least 3 documents
min_nr_words_docs = 3
#do not use more than 20 terms for "find similar"
max_nr_words_upper = 20
#if a document contains fewer than 10 terms, use frequently used terms too;
#otherwise ignore them
max_nr_words_lower = 10
#default minimum relevance value to use for find similar
default_min_relevance = 75