2015-05-31 21:45:03 +00:00
|
|
|
"""
|
|
|
|
Test PostgreSQL full text search.
|
|
|
|
|
|
|
|
These tests use dialogue from the 1975 film Monty Python and the Holy Grail.
|
|
|
|
All text copyright Python (Monty) Pictures. Thanks to sacred-texts.com for the
|
|
|
|
transcript.
|
|
|
|
"""
|
2020-03-20 21:01:26 +00:00
|
|
|
from django.db.models import F, Value
|
2015-05-31 21:45:03 +00:00
|
|
|
|
2020-02-25 04:48:07 +00:00
|
|
|
from . import PostgreSQLSimpleTestCase, PostgreSQLTestCase
|
2020-03-04 12:33:12 +00:00
|
|
|
from .models import Character, Line, LineSavedSearch, Scene
|
2015-05-31 21:45:03 +00:00
|
|
|
|
2019-11-19 13:59:06 +00:00
|
|
|
try:
|
|
|
|
from django.contrib.postgres.search import (
|
|
|
|
SearchConfig,
|
|
|
|
SearchHeadline,
|
|
|
|
SearchQuery,
|
|
|
|
SearchRank,
|
|
|
|
SearchVector,
|
|
|
|
)
|
|
|
|
except ImportError:
|
|
|
|
pass
|
|
|
|
|
2015-05-31 21:45:03 +00:00
|
|
|
|
2017-01-19 07:39:46 +00:00
|
|
|
class GrailTestData:
    """
    Mixin providing the Holy Grail fixture rows used by the search tests.

    ``setUpTestData()`` stores the created rows on the class: ``robin`` and
    ``witch_scene`` (scenes), ``minstrel`` (character), ``verses`` together
    with ``verse0``..``verse2``, ``bedemir0``, ``bedemir1``, ``duck``,
    ``crowd``, ``witch`` and ``french`` (lines).
    """

    @classmethod
    def setUpTestData(cls):
        # Scene 10: three verses, all sung by the minstrel.
        cls.robin = Scene.objects.create(
            scene="Scene 10",
            setting="The dark forest of Ewing",
        )
        cls.minstrel = Character.objects.create(name="Minstrel")
        first_verse = (
            "Bravely bold Sir Robin, rode forth from Camelot. "
            "He was not afraid to die, o Brave Sir Robin. "
            "He was not at all afraid to be killed in nasty ways. "
            "Brave, brave, brave, brave Sir Robin"
        )
        second_verse = (
            "He was not in the least bit scared to be mashed into a pulp, "
            "Or to have his eyes gouged out, and his elbows broken. "
            "To have his kneecaps split, and his body burned away, "
            "And his limbs all hacked and mangled, brave Sir Robin!"
        )
        third_verse = (
            "His head smashed in and his heart cut out, "
            "And his liver removed and his bowels unplugged, "
            "And his nostrils ripped and his bottom burned off,"
            "And his --"
        )
        cls.verses = [
            Line.objects.create(scene=cls.robin, character=cls.minstrel, dialogue=text)
            for text in (first_verse, second_verse, third_verse)
        ]
        cls.verse0, cls.verse1, cls.verse2 = cls.verses

        # Scene 5: the witch trial. Characters are created in the listed order.
        cls.witch_scene = Scene.objects.create(
            scene="Scene 5",
            setting="Sir Bedemir's Castle",
        )
        bedemir, crowd, witch, duck = (
            Character.objects.create(name=name)
            for name in ("Bedemir", "Crowd", "Witch", "Duck")
        )

        # Both of Bedemir's lines carry an explicit "english" config.
        bedemir_kwargs = {
            "scene": cls.witch_scene,
            "character": bedemir,
            "dialogue_config": "english",
        }
        cls.bedemir0 = Line.objects.create(
            dialogue="We shall use my larger scales!", **bedemir_kwargs
        )
        cls.bedemir1 = Line.objects.create(
            dialogue="Right, remove the supports!", **bedemir_kwargs
        )
        # The duck's line has a NULL dialogue.
        cls.duck = Line.objects.create(
            scene=cls.witch_scene,
            character=duck,
            dialogue=None,
        )
        cls.crowd = Line.objects.create(
            scene=cls.witch_scene,
            character=crowd,
            dialogue="A witch! A witch!",
        )
        cls.witch = Line.objects.create(
            scene=cls.witch_scene,
            character=witch,
            dialogue="It's a fair cop.",
        )

        # Scene 8: a single line stored with the "french" config.
        trojan_rabbit = Scene.objects.create(
            scene="Scene 8",
            setting="The castle of Our Master Ruiz' de lu la Ramper",
        )
        guards = Character.objects.create(name="French Guards")
        cls.french = Line.objects.create(
            scene=trojan_rabbit,
            character=guards,
            dialogue="Oh. Un beau cadeau. Oui oui.",
            dialogue_config="french",
        )
|
|
|
|
|
|
|
|
|
|
|
|
class SimpleSearchTest(GrailTestData, PostgreSQLTestCase):
    """Tests for the ``__search`` lookup applied directly to ``dialogue``."""

    def test_simple(self):
        matches = Line.objects.filter(dialogue__search="elbows")
        self.assertSequenceEqual(matches, [self.verse1])

    def test_non_exact_match(self):
        self.check_default_text_search_config()
        # The stored text contains "heart"; the search term is "hearts".
        matches = Line.objects.filter(dialogue__search="hearts")
        self.assertSequenceEqual(matches, [self.verse2])

    def test_search_two_terms(self):
        self.check_default_text_search_config()
        matches = Line.objects.filter(dialogue__search="heart bowel")
        self.assertSequenceEqual(matches, [self.verse2])

    def test_search_two_terms_with_partial_match(self):
        # "Robin" appears in several verses, "killed" only in the first one.
        matches = Line.objects.filter(dialogue__search="Robin killed")
        self.assertSequenceEqual(matches, [self.verse0])

    def test_search_query_config(self):
        query = SearchQuery("nostrils", config="simple")
        matches = Line.objects.filter(dialogue__search=query)
        self.assertSequenceEqual(matches, [self.verse2])

    def test_search_with_F_expression(self):
        # Non-matching query.
        LineSavedSearch.objects.create(line=self.verse1, query="hearts")
        # Matching query.
        expected = LineSavedSearch.objects.create(line=self.verse1, query="elbows")
        # The column reference is tried both bare and wrapped in SearchQuery.
        candidates = (F("query"), SearchQuery(F("query")))
        for expression in candidates:
            with self.subTest(expression):
                matches = LineSavedSearch.objects.filter(
                    line__dialogue__search=expression,
                )
                self.assertSequenceEqual(matches, [expected])
|
|
|
|
|
2015-05-31 21:45:03 +00:00
|
|
|
|
|
|
|
class SearchVectorFieldTest(GrailTestData, PostgreSQLTestCase):
    """Tests that filter on the ``dialogue_search_vector`` column or a vector."""

    def test_existing_vector(self):
        # Populate the stored vector column from the dialogue text first.
        Line.objects.update(dialogue_search_vector=SearchVector("dialogue"))
        query = SearchQuery("Robin killed")
        matches = Line.objects.filter(dialogue_search_vector=query)
        self.assertSequenceEqual(matches, [self.verse0])

    def test_existing_vector_config_explicit(self):
        Line.objects.update(dialogue_search_vector=SearchVector("dialogue"))
        query = SearchQuery("cadeaux", config="french")
        matches = Line.objects.filter(dialogue_search_vector=query)
        self.assertSequenceEqual(matches, [self.french])

    def test_single_coalesce_expression(self):
        annotated = Line.objects.annotate(search=SearchVector("dialogue"))
        matches = annotated.filter(search="cadeaux")
        # Only the generated SQL is inspected; the query is never executed.
        self.assertNotIn("COALESCE(COALESCE", str(matches.query))

    def test_values_with_percent(self):
        vector = SearchVector(Value("This week everything is 10% off"))
        matches = Line.objects.annotate(search=vector).filter(search="10 % off")
        # The vector is a constant, so every fixture line is expected back.
        self.assertEqual(len(matches), 9)
|
|
|
|
|
2015-05-31 21:45:03 +00:00
|
|
|
|
2020-02-25 04:48:07 +00:00
|
|
|
class SearchConfigTests(PostgreSQLSimpleTestCase):
    """Tests for ``SearchConfig.from_parameter()``."""

    def test_from_parameter(self):
        # None is passed through unchanged.
        self.assertIsNone(SearchConfig.from_parameter(None))
        # A plain string compares equal to a SearchConfig built from it.
        from_string = SearchConfig.from_parameter("foo")
        self.assertEqual(from_string, SearchConfig("foo"))
        # An existing SearchConfig compares equal to an equivalent instance.
        from_config = SearchConfig.from_parameter(SearchConfig("bar"))
        self.assertEqual(from_config, SearchConfig("bar"))
|
2020-02-25 04:48:07 +00:00
|
|
|
|
|
|
|
|
2015-05-31 21:45:03 +00:00
|
|
|
class MultipleFieldsTest(GrailTestData, PostgreSQLTestCase):
    """Search against SearchVector annotations built from one or more columns."""

    def test_simple_on_dialogue(self):
        searched = Line.objects.annotate(
            search=SearchVector("scene__setting", "dialogue"),
        ).filter(search="elbows")
        self.assertSequenceEqual(searched, [self.verse1])

    def test_simple_on_scene(self):
        # "Forest" only occurs in the scene setting, not in any dialogue.
        searched = Line.objects.annotate(
            search=SearchVector("scene__setting", "dialogue"),
        ).filter(search="Forest")
        self.assertCountEqual(searched, self.verses)

    def test_non_exact_match(self):
        searched = Line.objects.annotate(
            search=SearchVector("scene__setting", "dialogue"),
        ).filter(search="heart")
        self.assertSequenceEqual(searched, [self.verse2])

    def test_search_two_terms(self):
        # One term comes from the dialogue, the other from the scene setting.
        searched = Line.objects.annotate(
            search=SearchVector("scene__setting", "dialogue"),
        ).filter(search="heart forest")
        self.assertSequenceEqual(searched, [self.verse2])

    def test_terms_adjacent(self):
        searched = Line.objects.annotate(
            search=SearchVector("character__name", "dialogue"),
        ).filter(search="minstrel")
        self.assertCountEqual(searched, self.verses)
        # A term glued together from two adjacent words must not match.
        searched = Line.objects.annotate(
            search=SearchVector("scene__setting", "dialogue"),
        ).filter(search="minstrelbravely")
        self.assertSequenceEqual(searched, [])

    def test_search_with_null(self):
        # self.duck has a NULL dialogue and is still expected in the results.
        searched = Line.objects.annotate(
            search=SearchVector("scene__setting", "dialogue"),
        ).filter(search="bedemir")
        self.assertCountEqual(
            searched, [self.bedemir0, self.bedemir1, self.crowd, self.witch, self.duck]
        )

    def test_search_with_non_text(self):
        searched = Line.objects.annotate(
            search=SearchVector("id"),
        ).filter(search=str(self.crowd.id))
        self.assertSequenceEqual(searched, [self.crowd])

    def test_phrase_search(self):
        line_qs = Line.objects.annotate(search=SearchVector("dialogue"))
        # Same words in a different order: no match expected.
        searched = line_qs.filter(
            search=SearchQuery("burned body his away", search_type="phrase")
        )
        self.assertSequenceEqual(searched, [])
        searched = line_qs.filter(
            search=SearchQuery("his body burned away", search_type="phrase")
        )
        self.assertSequenceEqual(searched, [self.verse1])

    def test_phrase_search_with_config(self):
        line_qs = Line.objects.annotate(
            search=SearchVector("scene__setting", "dialogue", config="french"),
        )
        searched = line_qs.filter(
            search=SearchQuery("cadeau beau un", search_type="phrase", config="french"),
        )
        self.assertSequenceEqual(searched, [])
        searched = line_qs.filter(
            search=SearchQuery("un beau cadeau", search_type="phrase", config="french"),
        )
        self.assertSequenceEqual(searched, [self.french])

    def test_raw_search(self):
        line_qs = Line.objects.annotate(search=SearchVector("dialogue"))
        searched = line_qs.filter(search=SearchQuery("Robin", search_type="raw"))
        self.assertCountEqual(searched, [self.verse0, self.verse1])
        searched = line_qs.filter(
            search=SearchQuery("Robin & !'Camelot'", search_type="raw")
        )
        self.assertSequenceEqual(searched, [self.verse1])

    def test_raw_search_with_config(self):
        line_qs = Line.objects.annotate(
            search=SearchVector("dialogue", config="french")
        )
        searched = line_qs.filter(
            search=SearchQuery(
                "'cadeaux' & 'beaux'", search_type="raw", config="french"
            ),
        )
        self.assertSequenceEqual(searched, [self.french])

    def test_web_search(self):
        line_qs = Line.objects.annotate(search=SearchVector("dialogue"))
        # Quoted phrases with the words in the wrong order: no match expected.
        searched = line_qs.filter(
            search=SearchQuery(
                '"burned body" "split kneecaps"',
                search_type="websearch",
            ),
        )
        self.assertSequenceEqual(searched, [])
        searched = line_qs.filter(
            search=SearchQuery(
                '"body burned" "kneecaps split" -"nostrils"',
                search_type="websearch",
            ),
        )
        self.assertSequenceEqual(searched, [self.verse1])
        searched = line_qs.filter(
            search=SearchQuery(
                '"Sir Robin" ("kneecaps" OR "Camelot")',
                search_type="websearch",
            ),
        )
        # Two rows are expected and the queryset has no explicit order_by(),
        # so compare without relying on row order (as test_raw_search does).
        self.assertCountEqual(searched, [self.verse0, self.verse1])

    def test_web_search_with_config(self):
        line_qs = Line.objects.annotate(
            search=SearchVector("scene__setting", "dialogue", config="french"),
        )
        searched = line_qs.filter(
            search=SearchQuery(
                "cadeau -beau", search_type="websearch", config="french"
            ),
        )
        self.assertSequenceEqual(searched, [])
        searched = line_qs.filter(
            search=SearchQuery("beau cadeau", search_type="websearch", config="french"),
        )
        self.assertSequenceEqual(searched, [self.french])

    def test_bad_search_type(self):
        # The error is expected at construction time; no query is run.
        with self.assertRaisesMessage(
            ValueError, "Unknown search_type argument 'foo'."
        ):
            SearchQuery("kneecaps", search_type="foo")

    def test_config_query_explicit(self):
        searched = Line.objects.annotate(
            search=SearchVector("scene__setting", "dialogue", config="french"),
        ).filter(search=SearchQuery("cadeaux", config="french"))
        self.assertSequenceEqual(searched, [self.french])

    def test_config_query_implicit(self):
        # The right-hand side is a plain string; only the vector names a config.
        searched = Line.objects.annotate(
            search=SearchVector("scene__setting", "dialogue", config="french"),
        ).filter(search="cadeaux")
        self.assertSequenceEqual(searched, [self.french])

    def test_config_from_field_explicit(self):
        # The config is read per row from the dialogue_config column.
        searched = Line.objects.annotate(
            search=SearchVector(
                "scene__setting", "dialogue", config=F("dialogue_config")
            ),
        ).filter(search=SearchQuery("cadeaux", config=F("dialogue_config")))
        self.assertSequenceEqual(searched, [self.french])

    def test_config_from_field_implicit(self):
        searched = Line.objects.annotate(
            search=SearchVector(
                "scene__setting", "dialogue", config=F("dialogue_config")
            ),
        ).filter(search="cadeaux")
        self.assertSequenceEqual(searched, [self.french])
|
|
|
|
|
|
|
|
|
|
|
|
class TestCombinations(GrailTestData, PostgreSQLTestCase):
    """Tests for combining SearchVector and SearchQuery with operators."""

    def test_vector_add(self):
        combined = SearchVector("scene__setting") + SearchVector("character__name")
        matches = Line.objects.annotate(search=combined).filter(search="bedemir")
        self.assertCountEqual(
            matches,
            [self.bedemir0, self.bedemir1, self.crowd, self.witch, self.duck],
        )

    def test_vector_add_multi(self):
        combined = (
            SearchVector("scene__setting")
            + SearchVector("character__name")
            + SearchVector("dialogue")
        )
        matches = Line.objects.annotate(search=combined).filter(search="bedemir")
        self.assertCountEqual(
            matches,
            [self.bedemir0, self.bedemir1, self.crowd, self.witch, self.duck],
        )

    def test_vector_combined_mismatch(self):
        expected_message = (
            "SearchVector can only be combined with other SearchVector "
            "instances, got NoneType."
        )
        # The addition stays inside the context manager so that an error
        # raised while building the expression is the one being checked.
        with self.assertRaisesMessage(TypeError, expected_message):
            Line.objects.filter(dialogue__search=None + SearchVector("character__name"))

    def test_combine_different_vector_configs(self):
        self.check_default_text_search_config()
        vector = SearchVector("dialogue", config="english") + SearchVector(
            "dialogue", config="french"
        )
        query = SearchQuery("cadeaux", config="french") | SearchQuery("nostrils")
        matches = Line.objects.annotate(search=vector).filter(search=query)
        self.assertCountEqual(matches, [self.french, self.verse2])

    def test_query_and(self):
        vector = SearchVector("scene__setting", "dialogue")
        query = SearchQuery("bedemir") & SearchQuery("scales")
        matches = Line.objects.annotate(search=vector).filter(search=query)
        self.assertSequenceEqual(matches, [self.bedemir0])

    def test_query_multiple_and(self):
        # The three terms are split across different lines: no row expected.
        no_match_query = (
            SearchQuery("bedemir") & SearchQuery("scales") & SearchQuery("nostrils")
        )
        matches = Line.objects.annotate(
            search=SearchVector("scene__setting", "dialogue"),
        ).filter(search=no_match_query)
        self.assertSequenceEqual(matches, [])

        # All three terms occur in Bedemir's first line.
        match_query = SearchQuery("shall") & SearchQuery("use") & SearchQuery("larger")
        matches = Line.objects.annotate(
            search=SearchVector("scene__setting", "dialogue"),
        ).filter(search=match_query)
        self.assertSequenceEqual(matches, [self.bedemir0])

    def test_query_or(self):
        query = SearchQuery("kneecaps") | SearchQuery("nostrils")
        matches = Line.objects.filter(dialogue__search=query)
        self.assertCountEqual(matches, [self.verse1, self.verse2])

    def test_query_multiple_or(self):
        query = (
            SearchQuery("kneecaps") | SearchQuery("nostrils") | SearchQuery("Sir Robin")
        )
        matches = Line.objects.filter(dialogue__search=query)
        self.assertCountEqual(matches, [self.verse1, self.verse2, self.verse0])

    def test_query_invert(self):
        # Restricted to the minstrel's lines so only the verses are candidates.
        negated = ~SearchQuery("kneecaps")
        matches = Line.objects.filter(
            character=self.minstrel,
            dialogue__search=negated,
        )
        self.assertCountEqual(matches, [self.verse0, self.verse2])

    def test_combine_different_configs(self):
        french_query = SearchQuery("cadeau", config="french")
        english_query = SearchQuery("nostrils", config="english")
        matches = Line.objects.filter(dialogue__search=french_query | english_query)
        self.assertCountEqual(matches, [self.french, self.verse2])

    def test_combined_configs(self):
        nostrils = SearchQuery("nostrils", config="simple")
        bowels = SearchQuery("bowels", config="simple")
        matches = Line.objects.filter(dialogue__search=nostrils & bowels)
        self.assertSequenceEqual(matches, [self.verse2])

    def test_combine_raw_phrase(self):
        self.check_default_text_search_config()
        prefix_query = SearchQuery("burn:*", search_type="raw", config="simple")
        phrase_query = SearchQuery("rode forth from Camelot", search_type="phrase")
        matches = Line.objects.filter(dialogue__search=prefix_query | phrase_query)
        self.assertCountEqual(matches, [self.verse0, self.verse1, self.verse2])

    def test_query_combined_mismatch(self):
        expected_message = (
            "SearchQuery can only be combined with other SearchQuery "
            "instances, got NoneType."
        )
        # Both operators are checked with None on the left-hand side.
        with self.assertRaisesMessage(TypeError, expected_message):
            Line.objects.filter(dialogue__search=None | SearchQuery("kneecaps"))

        with self.assertRaisesMessage(TypeError, expected_message):
            Line.objects.filter(dialogue__search=None & SearchQuery("kneecaps"))
|
|
|
|
|
2015-05-31 21:45:03 +00:00
|
|
|
|
|
|
|
class TestRankingAndWeights(GrailTestData, PostgreSQLTestCase):
    """Tests for SearchRank annotations, vector weights and rank options."""

    def test_ranking(self):
        rank = SearchRank(SearchVector("dialogue"), SearchQuery("brave sir robin"))
        ranked = (
            Line.objects.filter(character=self.minstrel)
            .annotate(rank=rank)
            .order_by("rank")
        )
        # Ascending rank: the first verse is expected last.
        self.assertSequenceEqual(ranked, [self.verse2, self.verse1, self.verse0])

    def test_rank_passing_untyped_args(self):
        # Plain strings are passed instead of SearchVector/SearchQuery objects.
        rank = SearchRank("dialogue", "brave sir robin")
        ranked = (
            Line.objects.filter(character=self.minstrel)
            .annotate(rank=rank)
            .order_by("rank")
        )
        self.assertSequenceEqual(ranked, [self.verse2, self.verse1, self.verse0])

    def test_weights_in_vector(self):
        # Dialogue weighted "A", character name weighted "D".
        dialogue_first = SearchVector("dialogue", weight="A") + SearchVector(
            "character__name", weight="D"
        )
        top_two = (
            Line.objects.filter(scene=self.witch_scene)
            .annotate(rank=SearchRank(dialogue_first, SearchQuery("witch")))
            .order_by("-rank")[:2]
        )
        self.assertSequenceEqual(top_two, [self.crowd, self.witch])

        # Weights swapped: the expected order of the top two rows flips.
        name_first = SearchVector("dialogue", weight="D") + SearchVector(
            "character__name", weight="A"
        )
        top_two = (
            Line.objects.filter(scene=self.witch_scene)
            .annotate(rank=SearchRank(name_first, SearchQuery("witch")))
            .order_by("-rank")[:2]
        )
        self.assertSequenceEqual(top_two, [self.witch, self.crowd])

    def test_ranked_custom_weights(self):
        vector = SearchVector("dialogue", weight="D") + SearchVector(
            "character__name", weight="A"
        )
        weights = [1.0, 0.0, 0.0, 0.5]
        rank = SearchRank(vector, SearchQuery("witch"), weights=weights)
        top_two = (
            Line.objects.filter(scene=self.witch_scene)
            .annotate(rank=rank)
            .order_by("-rank")[:2]
        )
        self.assertSequenceEqual(top_two, [self.crowd, self.witch])

    def test_ranking_chaining(self):
        rank = SearchRank(SearchVector("dialogue"), SearchQuery("brave sir robin"))
        # The rank annotation is used as a filter rather than for ordering.
        high_ranked = (
            Line.objects.filter(character=self.minstrel)
            .annotate(rank=rank)
            .filter(rank__gt=0.3)
        )
        self.assertSequenceEqual(high_ranked, [self.verse0])

    def test_cover_density_ranking(self):
        # Extra row created before querying, so it has the highest pk.
        not_dense_verse = Line.objects.create(
            scene=self.robin,
            character=self.minstrel,
            dialogue=(
                "Bravely taking to his feet, he beat a very brave retreat. "
                "A brave retreat brave Sir Robin."
            ),
        )
        rank = SearchRank(
            SearchVector("dialogue"),
            SearchQuery("brave robin"),
            cover_density=True,
        )
        ranked = (
            Line.objects.filter(character=self.minstrel)
            .annotate(rank=rank)
            .order_by("rank", "-pk")
        )
        expected_order = [self.verse2, not_dense_verse, self.verse1, self.verse0]
        self.assertSequenceEqual(ranked, expected_order)

    def test_ranking_with_normalization(self):
        short_verse = Line.objects.create(
            scene=self.robin,
            character=self.minstrel,
            dialogue="A brave retreat brave Sir Robin.",
        )
        rank = SearchRank(
            SearchVector("dialogue"),
            SearchQuery("brave sir robin"),
            # Divide the rank by the document length.
            normalization=2,
        )
        ranked = (
            Line.objects.filter(character=self.minstrel)
            .annotate(rank=rank)
            .order_by("rank")
        )
        expected_order = [self.verse2, self.verse1, self.verse0, short_verse]
        self.assertSequenceEqual(ranked, expected_order)

    def test_ranking_with_masked_normalization(self):
        short_verse = Line.objects.create(
            scene=self.robin,
            character=self.minstrel,
            dialogue="A brave retreat brave Sir Robin.",
        )
        rank = SearchRank(
            SearchVector("dialogue"),
            SearchQuery("brave sir robin"),
            # Divide the rank by the document length and by the number of
            # unique words in document.
            normalization=Value(2).bitor(Value(8)),
        )
        ranked = (
            Line.objects.filter(character=self.minstrel)
            .annotate(rank=rank)
            .order_by("rank")
        )
        expected_order = [self.verse2, self.verse1, self.verse0, short_verse]
        self.assertSequenceEqual(ranked, expected_order)
|
|
|
|
|
2018-08-07 21:32:29 +00:00
|
|
|
|
2019-11-19 13:59:06 +00:00
|
|
|
class SearchQueryTests(PostgreSQLSimpleTestCase):
    """Tests for the string representation of SearchQuery expressions."""

    def test_str(self):
        # Each case pairs an expression with the exact str() expected for it.
        cases = [
            (~SearchQuery("a"), "~SearchQuery(Value('a'))"),
            (
                (SearchQuery("a") | SearchQuery("b"))
                & (SearchQuery("c") | SearchQuery("d")),
                "((SearchQuery(Value('a')) || SearchQuery(Value('b'))) && "
                "(SearchQuery(Value('c')) || SearchQuery(Value('d'))))",
            ),
            (
                SearchQuery("a") & (SearchQuery("b") | SearchQuery("c")),
                "(SearchQuery(Value('a')) && (SearchQuery(Value('b')) || "
                "SearchQuery(Value('c'))))",
            ),
            (
                (SearchQuery("a") | SearchQuery("b")) & SearchQuery("c"),
                "((SearchQuery(Value('a')) || SearchQuery(Value('b'))) && "
                "SearchQuery(Value('c')))",
            ),
            (
                SearchQuery("a")
                & (SearchQuery("b") & (SearchQuery("c") | SearchQuery("d"))),
                "(SearchQuery(Value('a')) && (SearchQuery(Value('b')) && "
                "(SearchQuery(Value('c')) || SearchQuery(Value('d')))))",
            ),
        ]
        for expression, expected in cases:
            with self.subTest(query=expression):
                self.assertEqual(str(expression), expected)
|
2019-11-19 13:59:06 +00:00
|
|
|
|
|
|
|
|
|
|
|
class SearchHeadlineTests(GrailTestData, PostgreSQLTestCase):
    """Tests for the SearchHeadline annotation and its options."""

    def test_headline(self):
        self.check_default_text_search_config()
        headline = SearchHeadline(
            F("dialogue"),
            SearchQuery("brave sir robin"),
            config=SearchConfig("english"),
        )
        line = Line.objects.annotate(headline=headline).get(pk=self.verse0.pk)
        expected = (
            "<b>Robin</b>. He was not at all afraid to be killed in nasty "
            "ways. <b>Brave</b>, <b>brave</b>, <b>brave</b>, <b>brave</b> "
            "<b>Sir</b> <b>Robin</b>"
        )
        self.assertEqual(line.headline, expected)

    def test_headline_untyped_args(self):
        self.check_default_text_search_config()
        # Column, query and config are all given as plain strings.
        headline = SearchHeadline("dialogue", "killed", config="english")
        line = Line.objects.annotate(headline=headline).get(pk=self.verse0.pk)
        expected = (
            "Robin. He was not at all afraid to be <b>killed</b> in nasty "
            "ways. Brave, brave, brave, brave Sir Robin"
        )
        self.assertEqual(line.headline, expected)

    def test_headline_with_config(self):
        headline = SearchHeadline(
            "dialogue",
            SearchQuery("cadeaux", config="french"),
            config="french",
        )
        line = Line.objects.annotate(headline=headline).get(pk=self.french.pk)
        self.assertEqual(line.headline, "Oh. Un beau <b>cadeau</b>. Oui oui.")

    def test_headline_with_config_from_field(self):
        # The config comes from the row's dialogue_config column.
        headline = SearchHeadline(
            "dialogue",
            SearchQuery("cadeaux", config=F("dialogue_config")),
            config=F("dialogue_config"),
        )
        line = Line.objects.annotate(headline=headline).get(pk=self.french.pk)
        self.assertEqual(line.headline, "Oh. Un beau <b>cadeau</b>. Oui oui.")

    def test_headline_separator_options(self):
        headline = SearchHeadline(
            "dialogue",
            "brave sir robin",
            start_sel="<span>",
            stop_sel="</span>",
        )
        line = Line.objects.annotate(headline=headline).get(pk=self.verse0.pk)
        expected = (
            "<span>Robin</span>. He was not at all afraid to be killed in "
            "nasty ways. <span>Brave</span>, <span>brave</span>, <span>brave"
            "</span>, <span>brave</span> <span>Sir</span> <span>Robin</span>"
        )
        self.assertEqual(line.headline, expected)

    def test_headline_highlight_all_option(self):
        self.check_default_text_search_config()
        headline = SearchHeadline(
            "dialogue",
            SearchQuery("brave sir robin", config="english"),
            highlight_all=True,
        )
        line = Line.objects.annotate(headline=headline).get(pk=self.verse0.pk)
        # Only the opening part of the headline is checked.
        expected_fragment = (
            "<b>Bravely</b> bold <b>Sir</b> <b>Robin</b>, rode forth from "
            "Camelot. He was not afraid to die, o "
        )
        self.assertIn(expected_fragment, line.headline)

    def test_headline_short_word_option(self):
        self.check_default_text_search_config()
        headline = SearchHeadline(
            "dialogue",
            SearchQuery("Camelot", config="english"),
            short_word=5,
            min_words=8,
        )
        line = Line.objects.annotate(headline=headline).get(pk=self.verse0.pk)
        expected = (
            "<b>Camelot</b>. He was not afraid to die, o Brave Sir Robin. He "
            "was not at all afraid"
        )
        self.assertEqual(line.headline, expected)

    def test_headline_fragments_words_options(self):
        self.check_default_text_search_config()
        headline = SearchHeadline(
            "dialogue",
            SearchQuery("brave sir robin", config="english"),
            fragment_delimiter="...<br>",
            max_fragments=4,
            max_words=3,
            min_words=1,
        )
        line = Line.objects.annotate(headline=headline).get(pk=self.verse0.pk)
        # Four fragments are expected, joined by the custom delimiter.
        expected = (
            "<b>Sir</b> <b>Robin</b>, rode...<br>"
            "<b>Brave</b> <b>Sir</b> <b>Robin</b>...<br>"
            "<b>Brave</b>, <b>brave</b>, <b>brave</b>...<br>"
            "<b>brave</b> <b>Sir</b> <b>Robin</b>"
        )
        self.assertEqual(line.headline, expected)
|