websearch_regression_tests.py
No OneTemporary
Actions

Subscribers

None

File Metadata

Created: Fri, Jun 28, 13:23

websearch_regression_tests.py
View Options

	## $Id$
	##
	## This file is part of CDS Invenio.
	## Copyright (C) 2002, 2003, 2004, 2005, 2006 CERN.
	##
	## CDS Invenio is free software; you can redistribute it and/or
	## modify it under the terms of the GNU General Public License as
	## published by the Free Software Foundation; either version 2 of the
	## License, or (at your option) any later version.
	##
	## CDS Invenio is distributed in the hope that it will be useful, but
	## WITHOUT ANY WARRANTY; without even the implied warranty of
	## MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
	## General Public License for more details.
	##
	## You should have received a copy of the GNU General Public License
	## along with CDS Invenio; if not, write to the Free Software Foundation, Inc.,
	## 59 Temple Place, Suite 330, Boston, MA 02111-1307, USA.

	import unittest
	import re
	import urlparse, cgi
	from sets import Set

	from mechanize import Browser, LinkNotFoundError

	from invenio.testutils import make_suite, make_url, warn_user_about_tests_and_run
	from invenio.config import weburl, cdsname, cdslang
	from invenio.urlutils import same_urls_p

	def parse_url(url):
	parts = urlparse.urlparse(url)
	query = cgi.parse_qs(parts[4], True)

	return parts[2].split('/')[1:], query

	class WebsearchTestLegacyURLs(unittest.TestCase):

	""" Check that the application still responds to legacy URLs for
	navigating, searching and browsing."""

	def test_legacy_collections(self):
	""" websearch - collections handle legacy urls """

	b = Browser()

	def check(legacy, new):
	b.open(legacy)
	got = b.geturl()

	self.failUnless(same_urls_p(got, new), got)

	# Use the root URL unless we need more
	check(make_url('/', c=cdsname),
	make_url('/'))

	# Other collections are redirected in the /collection area
	check(make_url('/', c='Poetry'),
	make_url('/collection/Poetry'))

	# Drop unnecessary arguments, like ln and as (when they are
	# the default value)
	check(make_url('/', c='Poetry', as=0, ln=cdslang),
	make_url('/collection/Poetry'))

	# Otherwise, keep them
	check(make_url('/', c='Poetry', as=1, ln=cdslang),
	make_url('/collection/Poetry', as=1))

	# Support the /index.py addressing too
	check(make_url('/index.py', c='Poetry'),
	make_url('/collection/Poetry'))


	def test_legacy_search(self):
	""" websearch - search queries handle legacy urls """

	b = Browser()

	def check(legacy, new):
	b.open(legacy)
	got = b.geturl()

	self.failUnless(same_urls_p(got, new), got)

	# /search.py is redirected on /search
	check(make_url('/search.py', p='nuclear', as=1),
	make_url('/search', p='nuclear', as=1))

	# direct recid searches are redirected to /record
	check(make_url('/search.py', recid=1, ln='es'),
	make_url('/record/1', ln='es'))



	class WebsearchTestRecord(unittest.TestCase):
	""" Check the interface of the /record results """

	def test_format_links(self):
	""" websearch - check format links for records """

	b = Browser()

	# We open the record in all known HTML formats
	for hformat in ('hd', 'hx', 'hm'):
	b.open(make_url('/record/1', of=hformat))

	# all except the selected links should be present in the
	# page.
	for oformat in ('hd', 'hx', 'hm', 'xm', 'xd'):
	target = make_url('/record/1', of=oformat)

	if oformat == hformat:
	try:
	b.find_link(url=target)
	except LinkNotFoundError:
	continue

	self.fail('link %r should not be in page' % target)
	else:
	try:
	b.find_link(url=target)
	except LinkNotFoundError:
	self.fail('link %r should be in page' % target)

	return


	class WebsearchTestCollections(unittest.TestCase):

	def test_traversal_links(self):
	""" websearch - traverse all the publications of a collection """

	# Ensure that it is possible to traverse a collection as
	# /collection/My_Collection?jrec=...

	b = Browser()

	try:
	for as in (0, 1):
	b.open(make_url('/collection/Preprints', as=as))

	for jrec in (11, 21, 11, 23):
	args = {'jrec': jrec, 'cc': 'Preprints'}
	if as:
	args['as'] = as

	url = make_url('/search', **args)
	b.follow_link(url=url)

	except LinkNotFoundError:
	self.fail('no link %r in %r' % (url, b.geturl()))

	def test_collections_links(self):
	""" websearch - enter in collections and subcollections """

	b = Browser()

	def tryfollow(url):
	cur = b.geturl()
	body = b.response().read()
	try:
	b.follow_link(url=url)
	except LinkNotFoundError:
	print body
	self.fail("in %r: could not find %r" % (
	cur, url))
	return

	for as in (0, 1):
	if as: kargs = {'as': 1}
	else: kargs = {}

	# We navigate from immediate son to immediate son...
	b.open(make_url('/', **kargs))
	tryfollow(make_url('/collection/Articles%20%26%20Preprints', **kargs))
	tryfollow(make_url('/collection/Articles', **kargs))

	# But we can also jump to a grandson immediately
	b.back()
	b.back()
	tryfollow(make_url('/collection/ALEPH', **kargs))

	return

	def test_records_links(self):
	""" websearch - check the links toward records in leaf collections """

	b = Browser()
	b.open(make_url('/collection/Preprints'))

	def harvest():

	""" Parse all the links in the page, and check that for
	each link to a detailed record, we also have the
	corresponding link to the similar records."""

	records = Set()
	similar = Set()

	for link in b.links():
	path, q = parse_url(link.url)

	if not path:
	continue

	if path[0] == 'record':
	records.add(int(path[1]))
	continue

	if path[0] == 'search':
	if not q.get('rm') == ['wrd']:
	continue

	recid = q['p'][0].split(':')[1]
	similar.add(int(recid))

	self.failUnlessEqual(records, similar)

	return records

	# We must have 10 links to the corresponding /records
	found = harvest()
	self.failUnlessEqual(len(found), 10)

	# When clicking on the "Search" button, we must also have
	# these 10 links on the records.
	b.select_form(name="search")
	b.submit()

	found = harvest()
	self.failUnlessEqual(len(found), 10)
	return


	class WebsearchTestBrowse(unittest.TestCase):

	def test_browse_field(self):
	""" websearch - check that browsing works """

	b = Browser()
	b.open(make_url('/'))

	b.select_form(name='search')
	b['f'] = ['title']
	b.submit(name='action_browse')

	def collect():
	# We'll get a few links to search for the actual hits, plus a
	# link to the following results.
	res = []
	for link in b.links(url_regex=re.compile(weburl + r'/search\?')):
	if link.text == 'Advanced Search':
	continue

	path, q = parse_url(link.url)
	res.append((link, q))

	return res

	# if we follow the last link, we should get another
	# batch. There is an overlap of one item.
	batch_1 = collect()

	b.follow_link(link=batch_1[-1][0])

	batch_2 = collect()

	# FIXME: we cannot compare the whole query, as the collection
	# set is not equal
	self.failUnlessEqual(batch_1[-2][1]['p'], batch_2[0][1]['p'])


	class WebsearchTestSearch(unittest.TestCase):

	def test_hits_in_other_collection(self):
	""" websearch - check extension of a query to the home collection """

	b = Browser()

	# We do a precise search in an isolated collection
	b.open(make_url('/collection/ISOLDE', ln='en'))

	b.select_form(name='search')
	b['f'] = ['author']
	b['p'] = 'matsubara'
	b.submit()

	path, current_q = parse_url(b.geturl())

	link = b.find_link(text_regex=re.compile('.*hit', re.I))
	path, target_q = parse_url(link.url)

	# the target query should be the current query without any c
	# or cc specified.
	for f in ('cc', 'c', 'action_search', 'ln'):
	if f in current_q:
	del current_q[f]

	self.failUnlessEqual(current_q, target_q)

	def test_nearest_terms(self):
	""" websearch - provide a list of nearest terms """

	b = Browser()
	b.open(make_url(''))

	# Search something weird
	b.select_form(name='search')
	b['p'] = 'gronf'
	b.submit()

	path, original = parse_url(b.geturl())

	for to_drop in ('cc', 'action_search', 'f'):
	if to_drop in original:
	del original[to_drop]

	# we should get a few searches back, which are identical
	# except for the p field being substituted (and the cc field
	# being dropped).
	if 'cc' in original:
	del original['cc']

	for link in b.links(url_regex=re.compile(weburl + r'/search\?')):
	if link.text == 'Advanced Search':
	continue

	path, target = parse_url(link.url)

	original['p'] = [link.text]
	self.failUnlessEqual(original, target)

	return

	def test_switch_to_simple_search(self):
	""" websearch - switch to simple search """

	b = Browser()
	b.open(make_url('/collection/ISOLDE', as=1))

	b.select_form(name='search')
	b['p1'] = 'tandem'
	b['f1'] = ['title']
	b.submit()

	b.follow_link(text='Simple Search')

	path, q = parse_url(b.geturl())

	self.failUnlessEqual(q, {'cc': ['ISOLDE'], 'p': ['tandem'], 'f': ['title']})


	def test_switch_to_advanced_search(self):
	""" websearch - switch to advanced search """

	b = Browser()
	b.open(make_url('/collection/ISOLDE'))

	b.select_form(name='search')
	b['p'] = 'tandem'
	b['f'] = ['title']
	b.submit()

	b.follow_link(text='Advanced Search')

	path, q = parse_url(b.geturl())

	self.failUnlessEqual(q, {'cc': ['ISOLDE'], 'p1': ['tandem'], 'f1': ['title'], 'as': ['1']})

	def test_no_boolean_hits(self):
	""" websearch - check the 'no boolean hits' proposed links """

	b = Browser()
	b.open(make_url(''))

	b.select_form(name='search')
	b['p'] = 'quasinormal muon'
	b.submit()

	path, q = parse_url(b.geturl())

	for to_drop in ('cc', 'action_search', 'f'):
	if to_drop in q:
	del q[to_drop]

	for bsu in ('quasinormal', 'muon'):
	l = b.find_link(text=bsu)
	q['p'] = bsu

	if not same_urls_p(l.url, make_url('/search', **q)):
	self.fail(repr((l.url, make_url('/search', **q))))

	def test_similar_authors(self):
	""" websearch - test similar authors box """

	b = Browser()
	b.open(make_url(''))

	b.select_form(name='search')
	b['p'] = 'Ellis, R K'
	b['f'] = ['author']
	b.submit()

	l = b.find_link(text="Ellis, R S")
	self.failUnless(same_urls_p(l.url, make_url('/search', p="Ellis, R S", f='author')))

	test_suite = make_suite(WebsearchTestSearch,
	WebsearchTestBrowse,
	WebsearchTestCollections,
	WebsearchTestRecord,
	WebsearchTestLegacyURLs)

	if __name__ == "__main__":
	warn_user_about_tests_and_run(test_suite)

websearch_regression_tests.pyNo OneTemporaryActions

File Metadata

websearch_regression_tests.pyView Options

Event Timeline

websearch_regression_tests.py
No OneTemporary
Actions

websearch_regression_tests.py
View Options