-
-
Notifications
You must be signed in to change notification settings - Fork 1k
Support of including blog in the website search #2136
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
base: main
Are you sure you want to change the base?
Changes from 14 commits
03c5801
12c377e
837e808
5e22aee
edea21c
e9d3d3b
f3c5a83
4fa01d6
021a57d
e5a9452
bcffdee
a7b3bbe
c1a61a9
8e01cca
629bc6d
c89240a
606d381
396050c
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,18 @@ | ||
# Generated by Django 5.2 on 2025-09-03 20:02 | ||
|
||
from django.db import migrations, models | ||
|
||
|
||
class Migration(migrations.Migration):
    """Add the ``is_searchable`` boolean field to the blog ``entry`` model."""

    dependencies = [
        ("blog", "0005_entry_social_media_card"),
    ]

    operations = [
        migrations.AddField(
            model_name="entry",
            name="is_searchable",
            field=models.BooleanField(
                default=False,
                help_text="Tick to make this entry appear in the Django documentation search.",
            ),
        ),
    ]
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,18 @@ | ||
# Generated by Django 5.2 on 2025-07-23 16:31 | ||
|
||
from django.db import migrations, models | ||
|
||
|
||
class Migration(migrations.Migration):
    """Add the nullable ``support_end`` date field to ``documentrelease``."""

    dependencies = [
        ("docs", "0006_alter_document_metadata_noop"),
    ]

    operations = [
        migrations.AddField(
            model_name="documentrelease",
            name="support_end",
            field=models.DateField(
                blank=True,
                help_text="The end of support for this release of Django.",
                null=True,
            ),
        ),
    ]
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -18,22 +18,31 @@ | |
from django.db import models, transaction | ||
from django.db.models import Q | ||
from django.db.models.fields.json import KeyTextTransform | ||
from django.template.loader import get_template | ||
from django.utils.functional import cached_property | ||
from django.utils.html import strip_tags | ||
from django_hosts.resolvers import reverse | ||
|
||
from blog.models import Entry | ||
from releases.models import Release | ||
|
||
from . import utils | ||
from .search import ( | ||
DEFAULT_TEXT_SEARCH_CONFIG, | ||
DOCUMENT_SEARCH_VECTOR, | ||
SEARCHABLE_VIEWS, | ||
START_SEL, | ||
STOP_SEL, | ||
TSEARCH_CONFIG_LANGUAGES, | ||
DocumentationCategory, | ||
) | ||
|
||
|
||
def get_search_config(lang):
    """
    Return the PostgreSQL text search configuration for ``lang``.

    Only the first two characters of ``lang`` are used for the lookup in
    ``TSEARCH_CONFIG_LANGUAGES``; codes without an entry fall back to
    ``DEFAULT_TEXT_SEARCH_CONFIG``.
    """
    language_code = lang[:2]
    return TSEARCH_CONFIG_LANGUAGES.get(language_code, DEFAULT_TEXT_SEARCH_CONFIG)
|
||
|
||
class DocumentReleaseQuerySet(models.QuerySet): | ||
def current(self, lang="en"): | ||
current = self.get(is_default=True) | ||
|
@@ -95,6 +104,11 @@ class DocumentRelease(models.Model): | |
on_delete=models.CASCADE, | ||
) | ||
is_default = models.BooleanField(default=False) | ||
support_end = models.DateField( | ||
null=True, | ||
blank=True, | ||
help_text="The end of support for this release of Django.", | ||
) | ||
|
||
objects = DocumentReleaseQuerySet.as_manager() | ||
|
||
|
@@ -202,16 +216,81 @@ def sync_to_db(self, decoded_documents): | |
path=document_path, | ||
title=html.unescape(strip_tags(document["title"])), | ||
metadata=document, | ||
config=TSEARCH_CONFIG_LANGUAGES.get( | ||
self.lang[:2], DEFAULT_TEXT_SEARCH_CONFIG | ||
), | ||
config=get_search_config(self.lang), | ||
) | ||
for document in self.documents.all(): | ||
document.metadata["breadcrumbs"] = list( | ||
Document.objects.breadcrumbs(document).values("title", "path") | ||
) | ||
document.save(update_fields=("metadata",)) | ||
|
||
self._sync_blog_to_db() | ||
self._sync_views_to_db() | ||
|
||
def _sync_blog_to_db(self):
    """
    Index searchable blog entries as documents of this release.

    Entries are selected with ``Entry.objects.published(self.support_end)``
    and stored under the ``DocumentationCategory.WEBSITE`` parent with a
    single "News" breadcrumb.
    """
    # The blog is only written in English, and without the release's
    # support end there is no cut-off for deciding which posts are still
    # relevant.
    if not (self.lang == "en" and self.support_end):
        return

    search_config = get_search_config(self.lang)
    searchable_entries = Entry.objects.published(self.support_end).searchable()
    for blog_entry in searchable_entries:
        headline = blog_entry.headline
        metadata = {
            "body": blog_entry.body_html,
            "breadcrumbs": [
                {"path": DocumentationCategory.WEBSITE, "title": "News"},
            ],
            "parents": DocumentationCategory.WEBSITE,
            "slug": blog_entry.slug,
            "title": headline,
            "toc": "",
        }
        Document.objects.create(
            release=self,
            path=blog_entry.get_absolute_url(),
            title=headline,
            metadata=metadata,
            config=search_config,
        )
|
||
def _sync_views_to_db(self):
    """
    Index the website views listed in ``SEARCHABLE_VIEWS`` as documents
    of this release.

    Only English releases are synced. Each view is stored under the
    ``DocumentationCategory.WEBSITE`` parent, using its URL on the ``www``
    host as the document path and its ``page_title`` as the title.
    """
    if self.lang != "en":
        return  # The searchable views are only written in English currently

    for searchable_view in SEARCHABLE_VIEWS:
        absolute_url = reverse(searchable_view.url_name, host="www")
        # This must match the template used for the url `community-ecosystem`.
        # NOTE(review): the template is hard-coded, so every entry in
        # SEARCHABLE_VIEWS is indexed with this same markup -- confirm
        # whether each view should supply its own template.
        # The result is named ``body_html`` so it does not shadow the
        # ``html`` module used elsewhere in this file.
        body_html = get_template("aggregator/ecosystem.html").render()
        # TODO: need to parse the body element (the full rendered template
        # is stored for now).

        Document.objects.create(
            release=self,
            path=absolute_url,
            title=searchable_view.page_title,
            metadata={
                "body": body_html,
                "breadcrumbs": [
                    {
                        "path": DocumentationCategory.WEBSITE,
                        "title": "Website",
                    },
                ],
                "parents": DocumentationCategory.WEBSITE,
                "slug": searchable_view.url_name,
                "title": searchable_view.page_title,
                "toc": "",
            },
            config=get_search_config(self.lang),
        )
|
||
|
||
def _clean_document_path(path): | ||
# We have to be a bit careful to reverse-engineer the correct | ||
|
@@ -224,7 +303,9 @@ def _clean_document_path(path): | |
|
||
|
||
def document_url(doc): | ||
if doc.path: | ||
if doc.metadata.get("parents") == DocumentationCategory.WEBSITE: | ||
return doc.path | ||
elif doc.path: | ||
kwargs = { | ||
"lang": doc.release.lang, | ||
"version": doc.release.version, | ||
|
Original file line number | Diff line number | Diff line change | ||||
---|---|---|---|---|---|---|
@@ -1,3 +1,5 @@ | ||||||
from dataclasses import dataclass | ||||||
|
||||||
from django.contrib.postgres.search import SearchVector | ||||||
from django.db.models import F, TextChoices | ||||||
from django.db.models.fields.json import KeyTextTransform | ||||||
|
@@ -65,10 +67,22 @@ class DocumentationCategory(TextChoices): | |||||
TOPICS = "topics", _("Using Django") | ||||||
HOWTO = "howto", _("How-to guides") | ||||||
RELEASE_NOTES = "releases", _("Release notes") | ||||||
WEBSITE = "weblog", _("Django Website") | ||||||
|
WEBSITE = "weblog", _("Django Website") | |
WEBSITE = "website", _("Django Website") |
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
So this is a bigger question. We need the value to be "weblog"
to make the breadcrumbs work properly in the search area without adding another hack on the search results side to adjust things. I suppose we could just have "www.djangoproject.com/website/" redirect to "www.djangoproject.com/weblog/". However, I have no idea what to call that category of results on the actual page. I think right now I have it as "Django Website" which doesn't seem right.
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Do the breadcrumbs work for you in the first place? I don't think I've ever used that feature and it doesn't seem to work correctly for me locally: even for documents with two or more parents, the links for all the parents are all the same and go to the document's own page.
Not sure I'd want to start adding redirects, that seems like solving the problem at the wrong level to me.
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
I have no idea what I ran into originally. Looks like we can rename this to be whatever we want.
The breadcrumb links in the search results just point directly to the search result, not to the actual parents. That may be a bug, to be honest 🫣
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Do we need a dedicated field for this? Why couldn't we get the information from
`release.eol_date` instead?
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
This is why we do code reviews. Let me get this switched over.