xapian-haystack/tests/xapian_tests/tests/test_backend.py

793 lines
31 KiB
Python

from decimal import Decimal
import datetime
import inspect
import sys
import xapian
import subprocess
import os
from django.apps import apps
from django.contrib.contenttypes.models import ContentType
from django.test import TestCase
from haystack import connections
from haystack.backends.xapian_backend import InvalidIndexError, _term_to_xapian_value
from haystack.models import SearchResult
from haystack.utils.loading import UnifiedIndex
from ..search_indexes import XapianNGramIndex, XapianEdgeNGramIndex, \
CompleteBlogEntryIndex, BlogSearchIndex, DjangoContentTypeIndex
from ..models import BlogEntry, AnotherMockModel, MockTag, DjangoContentType
XAPIAN_VERSION = [int(x) for x in xapian.__version__.split('.')]
class XapianSearchResult(SearchResult):
def __init__(self, app_label, model_name, pk, score, **kwargs):
super().__init__(app_label, model_name, pk, score, **kwargs)
self._model = apps.get_model('xapian_tests', model_name)
def get_terms(backend, *args):
executable = 'xapian-delve'
# dev versions (odd minor) use a suffix
if XAPIAN_VERSION[1] % 2 != 0:
executable = executable+'-%d.%d' % tuple(XAPIAN_VERSION[0:2])
# look for a xapian-delve built by `xapian_wheel_builder`
wheel_delve = os.path.join(os.path.dirname(inspect.getfile(xapian)), executable)
if os.path.exists(wheel_delve):
executable = wheel_delve
result = subprocess.check_output([executable] + list(args) + [backend.path],
env=os.environ.copy()).decode('utf-8')
result = result.split(": ")
if len(result) > 1:
return result[1].strip().split(" ")
return []
def pks(results):
return [result.pk for result in results]
class HaystackBackendTestCase:
"""
Abstract TestCase that implements an hack to ensure `connections`
has the right index
It has a method get_index() that returns a SearchIndex
that must be overwritten.
"""
def get_index(self):
raise NotImplementedError
def setUp(self):
self.old_ui = connections['default'].get_unified_index()
self.ui = UnifiedIndex()
self.index = self.get_index()
self.ui.build(indexes=[self.index])
self.backend = connections['default'].get_backend()
connections['default']._index = self.ui
def tearDown(self):
self.backend.clear()
connections['default']._index = self.old_ui
def assertExpectedQuery(self, query, string_or_list):
if isinstance(string_or_list, list):
strings = string_or_list
else:
strings = [string_or_list]
expected = ['Query(%s)' % string for string in strings]
self.assertIn(str(query), expected)
class BackendIndexationTestCase(HaystackBackendTestCase, TestCase):
"""
Tests indexation behavior.
Tests related to how the backend indexes terms,
values, and others go here.
"""
def get_index(self):
return CompleteBlogEntryIndex()
def setUp(self):
super().setUp()
tag1 = MockTag.objects.create(name='tag')
tag2 = MockTag.objects.create(name='tag-tag')
tag3 = MockTag.objects.create(name='tag-tag-tag')
entry = BlogEntry()
entry.id = 1
entry.text = 'this_is_a_word inside a big text'
entry.author = 'david'
entry.url = 'http://example.com/1/'
entry.boolean = True
entry.number = 123456789
entry.float_number = 123.123456789
entry.decimal_number = Decimal('22.34')
entry.funny_text = 'this-text das das'
entry.non_ascii = 'thsi sdas das corrup\xe7\xe3o das'
entry.datetime = datetime.datetime(2009, 2, 25, 1, 1, 1)
entry.date = datetime.date(2008, 8, 8)
entry.save()
entry.tags.add(tag1, tag2, tag3)
self.backend.update(self.index, [entry])
self.entry = entry
def test_app_is_not_split(self):
"""
Tests that the app path is not split
and added as independent terms.
"""
terms = get_terms(self.backend, '-a')
self.assertFalse('tests' in terms)
self.assertFalse('Ztest' in terms)
def test_app_is_not_indexed(self):
"""
Tests that the app path is not indexed.
"""
terms = get_terms(self.backend, '-a')
self.assertFalse('tests.xapianmockmodel.1' in terms)
self.assertFalse('xapianmockmodel' in terms)
self.assertFalse('tests' in terms)
def test_fields_exist(self):
"""
Tests that all fields are in the database
"""
terms = get_terms(self.backend, '-a')
for field in ['author', 'datetime', 'text', 'url']:
is_inside = False
for term in terms:
if term.startswith("X%s" % field.upper()):
is_inside = True
break
self.assertTrue(is_inside, field)
def test_text_field(self):
terms = get_terms(self.backend, '-a')
self.assertTrue('this_is_a_word' in terms)
self.assertTrue('Zthis_is_a_word' in terms)
self.assertTrue('ZXTEXTthis_is_a_word' in terms)
self.assertTrue('XTEXTthis_is_a_word' in terms)
self.assertFalse('^this_is_a_word inside a big text$' in terms)
def test_text_posting(self):
"""
Tests that text is correctly positioned in the document
"""
expected_order = ['^', 'this_is_a_word', 'inside', 'a', 'big', 'text', '$']
def get_positions(term):
"""
Uses delve to get
the positions of the term in the first document.
"""
return sorted([int(pos) for pos in get_terms(self.backend, '-r1', '-tXTEXT%s' % term)])
# confirms expected_order
previous_position = get_positions(expected_order[0])
for term in expected_order[1:]:
pos = get_positions(term)
# only two positions per term
# (one from term_generator, one from literal text)
self.assertEqual(len(pos), 2)
self.assertEqual(pos[0] - 1, previous_position[0])
self.assertEqual(pos[1] - 1, previous_position[1])
previous_position[0] += 1
previous_position[1] += 1
def test_author_field(self):
terms = get_terms(self.backend, '-a')
self.assertTrue('XAUTHORdavid' in terms)
self.assertTrue('ZXAUTHORdavid' in terms)
self.assertTrue('Zdavid' in terms)
self.assertTrue('david' in terms)
def test_funny_text_field(self):
terms = get_terms(self.backend, '-r1')
self.assertTrue('this-text' in terms)
def test_datetime_field(self):
terms = get_terms(self.backend, '-a')
self.assertFalse('XDATETIME20090225000000' in terms)
self.assertFalse('ZXDATETIME20090225000000' in terms)
self.assertFalse('20090225000000' in terms)
self.assertTrue('XDATETIME2009-02-25' in terms)
self.assertTrue('2009-02-25' in terms)
self.assertTrue('01:01:01' in terms)
self.assertTrue('XDATETIME01:01:01' in terms)
def test_date_field(self):
terms = get_terms(self.backend, '-a')
self.assertTrue('XDATE2008-08-08' in terms)
self.assertTrue('2008-08-08' in terms)
self.assertFalse('XDATE00:00:00' in terms)
self.assertFalse('00:00:00' in terms)
def test_url_field(self):
terms = get_terms(self.backend, '-a')
self.assertTrue('http://example.com/1/' in terms)
def test_bool_field(self):
terms = get_terms(self.backend, '-a')
self.assertTrue('XBOOLEANtrue' in terms)
self.assertFalse('ZXBOOLEANtrue' in terms)
def test_integer_field(self):
terms = get_terms(self.backend, '-a')
self.assertTrue('123456789' in terms)
self.assertTrue('XNUMBER123456789' in terms)
self.assertFalse('ZXNUMBER123456789' in terms)
def test_float_field(self):
terms = get_terms(self.backend, '-a')
self.assertTrue('123.123456789' in terms)
self.assertTrue('XFLOAT_NUMBER123.123456789' in terms)
self.assertFalse('ZXFLOAT_NUMBER123.123456789' in terms)
def test_decimal_field(self):
terms = get_terms(self.backend, '-a')
self.assertTrue('22.34' in terms)
self.assertTrue('XDECIMAL_NUMBER22.34' in terms)
self.assertFalse('ZXDECIMAL_NUMBER22.34' in terms)
def test_multivalue_field(self):
"""
Regression test for #103
"""
terms = get_terms(self.backend, '-a')
self.assertTrue('tag' in terms)
self.assertTrue('tag-tag' in terms)
self.assertTrue('tag-tag-tag' in terms)
self.assertTrue('XMULTI_VALUEtag' in terms)
self.assertTrue('XMULTI_VALUEtag-tag' in terms)
self.assertTrue('XMULTI_VALUEtag-tag-tag' in terms)
def test_non_ascii_chars(self):
terms = get_terms(self.backend, '-a')
self.assertIn('corrup\xe7\xe3o', terms)
class BackendFeaturesTestCase(HaystackBackendTestCase, TestCase):
"""
Tests supported features on the backend side.
Tests to features implemented on the backend
go here.
"""
def get_index(self):
return BlogSearchIndex()
@staticmethod
def get_entry(i):
entry = BlogEntry()
entry.id = i
entry.author = 'david%s' % i
entry.url = 'http://example.com/%d/' % i
entry.boolean = bool(i % 2)
entry.number = i*5
entry.float_number = i*5.0
entry.decimal_number = Decimal('22.34')
entry.datetime = datetime.datetime(2009, 2, 25, 1, 1, 1) - datetime.timedelta(seconds=i)
entry.date = datetime.date(2009, 2, 23) + datetime.timedelta(days=i)
return entry
def setUp(self):
super().setUp()
self.sample_objs = []
for i in range(1, 4):
entry = self.get_entry(i)
self.sample_objs.append(entry)
self.sample_objs[0].float_number = 834.0
self.sample_objs[1].float_number = 35.5
self.sample_objs[2].float_number = 972.0
for obj in self.sample_objs:
obj.save()
self.backend.update(self.index, BlogEntry.objects.all())
def test_update(self):
self.assertEqual(pks(self.backend.search(xapian.Query(''))['results']),
[1, 2, 3])
def test_duplicate_update(self):
"""
Regression test for #6.
"""
self.backend.update(self.index, self.sample_objs)
self.assertEqual(self.backend.document_count(), 3)
def test_remove(self):
self.backend.remove(self.sample_objs[0])
self.assertEqual(pks(self.backend.search(xapian.Query(''))['results']),
[2, 3])
def test_clear(self):
self.backend.clear()
self.assertEqual(self.backend.document_count(), 0)
self.backend.update(self.index, self.sample_objs)
self.assertEqual(self.backend.document_count(), 3)
self.backend.clear([AnotherMockModel])
self.assertEqual(self.backend.document_count(), 3)
self.backend.clear([BlogEntry])
self.assertEqual(self.backend.document_count(), 0)
self.backend.update(self.index, self.sample_objs)
self.assertEqual(self.backend.document_count(), 3)
self.backend.clear([AnotherMockModel, BlogEntry])
self.assertEqual(self.backend.document_count(), 0)
def test_search(self):
# no match query
self.assertEqual(self.backend.search(xapian.Query()), {'hits': 0, 'results': []})
# all match query
self.assertEqual(pks(self.backend.search(xapian.Query(''))['results']),
[1, 2, 3])
# Other `result_class`
self.assertTrue(
isinstance(self.backend.search(xapian.Query('indexed'), result_class=XapianSearchResult)['results'][0],
XapianSearchResult))
def test_search_field_with_punctuation(self):
self.assertEqual(pks(self.backend.search(xapian.Query('http://example.com/1/'))['results']),
[1])
def test_search_by_mvf(self):
self.assertEqual(self.backend.search(xapian.Query('ab'))['hits'], 1)
self.assertEqual(self.backend.search(xapian.Query('b'))['hits'], 1)
self.assertEqual(self.backend.search(xapian.Query('to'))['hits'], 1)
self.assertEqual(self.backend.search(xapian.Query('one'))['hits'], 3)
def test_field_facets(self):
self.assertEqual(self.backend.search(xapian.Query(), facets=['name']),
{'hits': 0, 'results': []})
results = self.backend.search(xapian.Query('indexed'), facets=['name'])
self.assertEqual(results['hits'], 3)
self.assertEqual(results['facets']['fields']['name'],
[('david1', 1), ('david2', 1), ('david3', 1)])
results = self.backend.search(xapian.Query('indexed'), facets=['boolean'])
self.assertEqual(results['hits'], 3)
self.assertEqual(results['facets']['fields']['boolean'],
[(False, 1), (True, 2)])
results = self.backend.search(xapian.Query('indexed'), facets=['sites'])
self.assertEqual(results['hits'], 3)
self.assertEqual(set(results['facets']['fields']['sites']),
set([('1', 1), ('3', 2), ('2', 2), ('4', 1), ('6', 2), ('9', 1)]))
results = self.backend.search(xapian.Query('indexed'),
facets=['number'])
self.assertEqual(results['hits'], 3)
self.assertEqual(results['facets']['fields']['number'],
[(5, 1), (10, 1), (15, 1)])
results = self.backend.search(xapian.Query('indexed'),
facets=['float_number'])
self.assertEqual(results['hits'], 3)
self.assertEqual(results['facets']['fields']['float_number'],
[(35.5, 1), (834.0, 1), (972.0, 1)])
def test_raise_index_error_on_wrong_field(self):
"""
Regression test for #109.
"""
self.assertRaises(InvalidIndexError, self.backend.search, xapian.Query(''), facets=['dsdas'])
def test_date_facets_month(self):
facets = {'datetime': {'start_date': datetime.datetime(2008, 10, 26),
'end_date': datetime.datetime(2009, 3, 26),
'gap_by': 'month'}}
self.assertEqual(self.backend.search(xapian.Query(), date_facets=facets),
{'hits': 0, 'results': []})
results = self.backend.search(xapian.Query('indexed'), date_facets=facets)
self.assertEqual(results['hits'], 3)
self.assertEqual(results['facets']['dates']['datetime'], [
(datetime.datetime(2009, 2, 26, 0, 0), 0),
(datetime.datetime(2009, 1, 26, 0, 0), 3),
(datetime.datetime(2008, 12, 26, 0, 0), 0),
(datetime.datetime(2008, 11, 26, 0, 0), 0),
(datetime.datetime(2008, 10, 26, 0, 0), 0),
])
def test_date_facets_seconds(self):
facets = {'datetime': {'start_date': datetime.datetime(2009, 2, 25, 1, 0, 57),
'end_date': datetime.datetime(2009, 2, 25, 1, 1, 1),
'gap_by': 'second'}}
self.assertEqual(self.backend.search(xapian.Query(), date_facets=facets),
{'hits': 0, 'results': []})
results = self.backend.search(xapian.Query('indexed'), date_facets=facets)
self.assertEqual(results['hits'], 3)
self.assertEqual(results['facets']['dates']['datetime'], [
(datetime.datetime(2009, 2, 25, 1, 1, 0), 0),
(datetime.datetime(2009, 2, 25, 1, 0, 59), 1),
(datetime.datetime(2009, 2, 25, 1, 0, 58), 1),
(datetime.datetime(2009, 2, 25, 1, 0, 57), 1),
])
def test_date_facets_days(self):
facets = {'date': {'start_date': datetime.datetime(2009, 2, 1),
'end_date': datetime.datetime(2009, 3, 15),
'gap_by': 'day',
'gap_amount': 15}}
results = self.backend.search(xapian.Query('indexed'), date_facets=facets)
self.assertEqual(results['hits'], 3)
self.assertEqual(results['facets']['dates']['date'], [
(datetime.datetime(2009, 3, 3, 0, 0), 0),
(datetime.datetime(2009, 2, 16, 0, 0), 3),
(datetime.datetime(2009, 2, 1, 0, 0), 0)
])
def test_query_facets(self):
self.assertEqual(self.backend.search(xapian.Query(), query_facets={'name': 'da*'}),
{'hits': 0, 'results': []})
results = self.backend.search(xapian.Query('indexed'), query_facets={'name': 'da*'})
self.assertEqual(results['hits'], 3)
self.assertEqual(results['facets']['queries']['name'], ('da*', 3))
def test_narrow_queries(self):
self.assertEqual(self.backend.search(xapian.Query(), narrow_queries={'name:david1'}),
{'hits': 0, 'results': []})
results = self.backend.search(xapian.Query('indexed'), narrow_queries={'name:david1'})
self.assertEqual(results['hits'], 1)
def test_highlight(self):
self.assertEqual(self.backend.search(xapian.Query(), highlight=True),
{'hits': 0, 'results': []})
self.assertEqual(self.backend.search(xapian.Query('indexed'), highlight=True)['hits'], 3)
results = self.backend.search(xapian.Query('indexed'), highlight=True)['results']
self.assertEqual([result.highlighted['text'] for result in results],
['<em>indexed</em>!\n1\n', '<em>indexed</em>!\n2\n', '<em>indexed</em>!\n3\n'])
def test_spelling_suggestion(self):
self.assertEqual(self.backend.search(xapian.Query('indxe'))['hits'], 0)
self.assertEqual(self.backend.search(xapian.Query('indxe'))['spelling_suggestion'],
'indexed')
self.assertEqual(self.backend.search(xapian.Query('indxed'))['hits'], 0)
self.assertEqual(self.backend.search(xapian.Query('indxed'))['spelling_suggestion'],
'indexed')
self.assertEqual(self.backend.search(xapian.Query('foo'))['hits'], 0)
self.assertEqual(self.backend.search(xapian.Query('foo'), spelling_query='indexy')['spelling_suggestion'],
'indexed')
self.assertEqual(self.backend.search(xapian.Query('XNAMEdavid'))['hits'], 0)
self.assertEqual(self.backend.search(xapian.Query('XNAMEdavid'))['spelling_suggestion'],
'david1')
def test_more_like_this(self):
results = self.backend.more_like_this(self.sample_objs[0])
self.assertEqual(pks(results['results']), [3, 2])
results = self.backend.more_like_this(self.sample_objs[0],
additional_query=xapian.Query('david3'))
self.assertEqual(pks(results['results']), [3])
results = self.backend.more_like_this(self.sample_objs[0],
limit_to_registered_models=True)
self.assertEqual(pks(results['results']), [3, 2])
# Other `result_class`
result = self.backend.more_like_this(self.sample_objs[0],
result_class=XapianSearchResult)
self.assertTrue(isinstance(result['results'][0], XapianSearchResult))
def test_order_by(self):
#results = self.backend.search(xapian.Query(''), sort_by=['datetime'])
#print([d.datetime for d in results['results']])
#self.assertEqual(pks(results['results']), [3, 2, 1])
#results = self.backend.search(xapian.Query(''), sort_by=['-datetime'])
#self.assertEqual(pks(results['results']), [1, 2, 3])
#results = self.backend.search(xapian.Query(''), sort_by=['date'])
#self.assertEqual(pks(results['results']), [1, 2, 3])
#results = self.backend.search(xapian.Query(''), sort_by=['-date'])
#self.assertEqual(pks(results['results']), [3, 2, 1])
results = self.backend.search(xapian.Query(''), sort_by=['id'])
self.assertEqual(pks(results['results']), [1, 2, 3])
results = self.backend.search(xapian.Query(''), sort_by=['-id'])
self.assertEqual(pks(results['results']), [3, 2, 1])
results = self.backend.search(xapian.Query(''), sort_by=['number'])
self.assertEqual(pks(results['results']), [1, 2, 3])
results = self.backend.search(xapian.Query(''), sort_by=['-number'])
self.assertEqual(pks(results['results']), [3, 2, 1])
results = self.backend.search(xapian.Query(''), sort_by=['float_number'])
self.assertEqual(pks(results['results']), [2, 1, 3])
results = self.backend.search(xapian.Query(''), sort_by=['-float_number'])
self.assertEqual(pks(results['results']), [3, 1, 2])
results = self.backend.search(xapian.Query(''), sort_by=['boolean', 'id'])
self.assertEqual(pks(results['results']), [2, 1, 3])
results = self.backend.search(xapian.Query(''), sort_by=['boolean', '-id'])
self.assertEqual(pks(results['results']), [2, 3, 1])
def test_verify_type(self):
self.assertEqual([result.month for result in self.backend.search(xapian.Query(''))['results']],
['02', '02', '02'])
def test_term_to_xapian_value(self):
self.assertEqual(_term_to_xapian_value('abc', 'text'), 'abc')
self.assertEqual(_term_to_xapian_value(1, 'integer'), '000000000001')
self.assertEqual(_term_to_xapian_value(2653, 'integer'), '000000002653')
self.assertEqual(_term_to_xapian_value(25.5, 'float'), b'\xb2`')
self.assertEqual(_term_to_xapian_value([1, 2, 3], 'text'), '[1, 2, 3]')
self.assertEqual(_term_to_xapian_value((1, 2, 3), 'text'), '(1, 2, 3)')
self.assertEqual(_term_to_xapian_value({'a': 1, 'c': 3, 'b': 2}, 'text'),
str({'a': 1, 'c': 3, 'b': 2}))
self.assertEqual(_term_to_xapian_value(datetime.datetime(2009, 5, 9, 16, 14), 'datetime'),
'20090509161400')
self.assertEqual(_term_to_xapian_value(datetime.datetime(2009, 5, 9, 0, 0), 'date'),
'20090509000000')
self.assertEqual(_term_to_xapian_value(datetime.datetime(1899, 5, 18, 0, 0), 'date'),
'18990518000000')
def test_build_schema(self):
search_fields = connections['default'].get_unified_index().all_searchfields()
(content_field_name, fields) = self.backend.build_schema(search_fields)
self.assertEqual(content_field_name, 'text')
self.assertEqual(len(fields), 14 + 3)
self.assertEqual(fields, [
{'column': 0, 'type': 'text', 'field_name': 'id', 'multi_valued': 'false'},
{'column': 1, 'type': 'integer', 'field_name': 'django_id', 'multi_valued': 'false'},
{'column': 2, 'type': 'text', 'field_name': 'django_ct', 'multi_valued': 'false'},
{'column': 3, 'type': 'boolean', 'field_name': 'boolean', 'multi_valued': 'false'},
{'column': 4, 'type': 'date', 'field_name': 'date', 'multi_valued': 'false'},
{'column': 5, 'type': 'date', 'field_name': 'datetime', 'multi_valued': 'false'},
{'column': 6, 'type': 'text', 'field_name': 'empty', 'multi_valued': 'false'},
{'column': 7, 'type': 'float', 'field_name': 'float_number', 'multi_valued': 'false'},
{'column': 8, 'type': 'text', 'field_name': 'keys', 'multi_valued': 'true'},
{'column': 9, 'type': 'text', 'field_name': 'name', 'multi_valued': 'false'},
{'column': 10, 'type': 'text', 'field_name': 'name_exact', 'multi_valued': 'false'},
{'column': 11, 'type': 'integer', 'field_name': 'number', 'multi_valued': 'false'},
{'column': 12, 'type': 'text', 'field_name': 'sites', 'multi_valued': 'true'},
{'column': 13, 'type': 'text', 'field_name': 'tags', 'multi_valued': 'true'},
{'column': 14, 'type': 'text', 'field_name': 'text', 'multi_valued': 'false'},
{'column': 15, 'type': 'text', 'field_name': 'titles', 'multi_valued': 'true'},
{'column': 16, 'type': 'text', 'field_name': 'url', 'multi_valued': 'false'},
])
def test_parse_query(self):
self.assertExpectedQuery(self.backend.parse_query('indexed'), 'Zindex@1')
self.assertExpectedQuery(self.backend.parse_query('name:david'), 'ZXNAMEdavid@1')
if xapian.minor_version() >= 2:
# todo: why `SYNONYM WILDCARD OR XNAMEda`?
self.assertExpectedQuery(
self.backend.parse_query('name:da*'),
[
'(SYNONYM WILDCARD OR XNAMEda)',
'WILDCARD SYNONYM XNAMEda',
])
else:
self.assertEqual(str(self.backend.parse_query('name:da*')),
'Xapian::Query(('
'XNAMEdavid1:(pos=1) OR '
'XNAMEdavid2:(pos=1) OR '
'XNAMEdavid3:(pos=1)))')
def test_parse_query_range(self):
self.assertExpectedQuery(self.backend.parse_query('name:david1..david2'),
[
'0 * VALUE_RANGE 9 david1 david2',
'VALUE_RANGE 9 david1 david2',
])
self.assertExpectedQuery(self.backend.parse_query('number:0..10'),
[
'0 * VALUE_RANGE 11 000000000000 000000000010',
'VALUE_RANGE 11 000000000000 000000000010',
])
self.assertExpectedQuery(self.backend.parse_query('number:..10'),
[
'0 * VALUE_RANGE 11 %012d 000000000010' % (-sys.maxsize - 1),
'VALUE_RANGE 11 %012d 000000000010' % (-sys.maxsize - 1),
])
self.assertExpectedQuery(self.backend.parse_query('number:10..*'),
[
'0 * VALUE_RANGE 11 000000000010 %012d' % sys.maxsize,
'VALUE_RANGE 11 000000000010 %012d' % sys.maxsize,
])
def test_order_by_django_id(self):
"""
We need this test because ordering on more than
10 entries was not correct at some point.
"""
self.sample_objs = []
number_list = list(range(1, 101))
for i in number_list:
entry = self.get_entry(i)
self.sample_objs.append(entry)
for obj in self.sample_objs:
obj.save()
self.backend.clear()
self.backend.update(self.index, self.sample_objs)
results = self.backend.search(xapian.Query(''), sort_by=['-django_id'])
self.assertEqual(pks(results['results']), list(reversed(number_list)))
def test_more_like_this_with_unindexed_model(self):
"""
Tests that more_like_this raises an error when it is called
with an unindexed model and if silently_fail is True.
Also tests the other way around.
"""
mock = BlogEntry()
mock.id = 10
mock.author = 'david10'
try:
self.assertEqual(self.backend.more_like_this(mock)['results'], [])
except InvalidIndexError:
self.fail("InvalidIndexError raised when silently_fail is True")
self.backend.silently_fail = False
self.assertRaises(InvalidIndexError, self.backend.more_like_this, mock)
class IndexationNGramTestCase(HaystackBackendTestCase, TestCase):
def get_index(self):
return XapianNGramIndex()
def setUp(self):
super().setUp()
mock = BlogEntry()
mock.id = 1
mock.author = 'david'
mock1 = BlogEntry()
mock1.id = 2
mock1.author = 'da1id'
self.backend.update(self.index, [mock, mock1])
def test_field(self):
terms = get_terms(self.backend, '-a')
self.assertTrue('da' in terms)
self.assertTrue('XNGRAMda' in terms)
self.assertTrue('dav' in terms)
self.assertTrue('XNGRAMdav' in terms)
self.assertTrue('davi' in terms)
self.assertTrue('XNGRAMdavi' in terms)
self.assertTrue('david' in terms)
self.assertTrue('XNGRAMdavid' in terms)
self.assertTrue('vid' in terms)
self.assertTrue('XNGRAMvid' in terms)
self.assertTrue('id' in terms)
self.assertTrue('XNGRAMid' in terms)
self.assertTrue('av' in terms)
self.assertTrue('XNGRAMav' in terms)
def test_search(self):
"""Tests edge ngram search with different parts of words"""
# Minimun length of query string must be equal to EDGE_NGRAM_MIN_LENGTH.
self.assertEqual(pks(self.backend.search(xapian.Query('da'))['results']),
[1, 2])
self.assertEqual(pks(self.backend.search(xapian.Query('dav'))['results']),
[1])
self.assertEqual(pks(self.backend.search(xapian.Query('da1'))['results']),
[2])
class IndexationEdgeNGramTestCase(HaystackBackendTestCase, TestCase):
def get_index(self):
return XapianEdgeNGramIndex()
def setUp(self):
super().setUp()
mock = BlogEntry()
mock.id = 1
mock.author = 'david'
mock1 = BlogEntry()
mock1.id = 2
mock1.author = 'da1id'
self.backend.update(self.index, [mock, mock1])
def test_field(self):
terms = get_terms(self.backend, '-a')
self.assertTrue('da' in terms)
self.assertTrue('XEDGE_NGRAMda' in terms)
self.assertTrue('dav' in terms)
self.assertTrue('XEDGE_NGRAMdav' in terms)
self.assertTrue('davi' in terms)
self.assertTrue('XEDGE_NGRAMdavi' in terms)
self.assertTrue('david' in terms)
self.assertTrue('XEDGE_NGRAMdavid' in terms)
self.assertTrue('vid' not in terms)
self.assertTrue('XEDGE_NGRAMvid' not in terms)
self.assertTrue('id' not in terms)
self.assertTrue('XEDGE_NGRAMid' not in terms)
self.assertTrue('av' not in terms)
self.assertTrue('XEDGE_NGRAMav' not in terms)
def test_search(self):
"""Tests edge ngram search with different parts of words"""
# Minimun length of query string must be equal to NGRAM_MIN_LENGTH.
self.assertEqual(pks(self.backend.search(xapian.Query('da'))['results']),
[1, 2])
self.assertEqual(pks(self.backend.search(xapian.Query('dav'))['results']),
[1])
self.assertEqual(pks(self.backend.search(xapian.Query('da1'))['results']),
[2])
class IndexationDjangoContentTypeTestCase(HaystackBackendTestCase, TestCase):
def get_index(self):
return DjangoContentTypeIndex()
def setUp(self):
super().setUp()
entry1 = ContentType(model='DjangoContentType')
entry1.save()
entry2 = DjangoContentType(content_type=entry1)
entry2.save()
self.backend.update(self.index, [entry2])
def test_basic(self):
terms = get_terms(self.backend, '-a')
self.assertTrue('CONTENTTYPExapian_tests.djangocontenttype' in terms)