@@ -21,6 +21,7 @@ class AlgoliaRecord(TypedDict):
    abs_url: str
    title: str
    objectID: str
+   rank: int


records: list[AlgoliaRecord] = []
@@ -42,6 +43,13 @@ def on_page_content(html: str, page: Page, config: Config, files: Files) -> str:

    soup = BeautifulSoup(html, 'html.parser')

+   # If the page does not start with a heading, prepend an h1 built from the page title.
+   # Some example pages don't have a heading at all, or start with an h2.
+   first_element = soup.find()
+
+   if not first_element or not first_element.name or first_element.name not in ['h1', 'h2', 'h3']:
+       soup.insert(0, BeautifulSoup(f'<h1 id="{title}">{title}</h1>', 'html.parser'))
+
    # Clean up presentational and UI elements
    for element in soup.find_all(['autoref']):
        element.decompose()
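As an aside (not part of the diff), a minimal sketch of when this fallback fires, with an invented page title and HTML: soup.find() with no arguments returns the first tag in the document, so a page that opens with a paragraph instead of a heading gets an h1 built from the page title prepended:

from bs4 import BeautifulSoup

# Hypothetical page that starts with a paragraph instead of a heading.
title = 'Flight Booking Example'
soup = BeautifulSoup('<p>This example books a flight.</p>', 'html.parser')

first_element = soup.find()
print(first_element.name)  # 'p' -> not in ['h1', 'h2', 'h3'], so the fallback fires

if not first_element or not first_element.name or first_element.name not in ['h1', 'h2', 'h3']:
    # Same move as the plugin: prepend an <h1> built from the page title.
    soup.insert(0, BeautifulSoup(f'<h1 id="{title}">{title}</h1>', 'html.parser'))

print(soup.find('h1').get_text())  # Flight Booking Example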
@@ -62,8 +70,10 @@ def on_page_content(html: str, page: Page, config: Config, files: Files) -> str:
    for extra in soup.find_all('table', attrs={'class': 'highlighttable'}):
        extra.replace_with(BeautifulSoup(f'<pre>{extra.find("code").get_text()}</pre>', 'html.parser'))

-   # Find all h1 and h2 headings
-   headings = soup.find_all(['h1', 'h2'])
+   headings = soup.find_all(['h1', 'h2', 'h3'])
+
+   # Use rank so sections near the top of the page score higher in search results
+   rank = 100

    # Process each section
    for current_heading in headings:
@@ -73,26 +83,41 @@ def on_page_content(html: str, page: Page, config: Config, files: Files) -> str:
        # Get content until next heading
        content: list[str] = []
        sibling = current_heading.find_next_sibling()
-       while sibling and sibling.name not in {'h1', 'h2'}:
+       while sibling and sibling.name not in {'h1', 'h2', 'h3'}:
            content.append(str(sibling))
            sibling = sibling.find_next_sibling()

        section_html = ''.join(content)

+       section_soup = BeautifulSoup(section_html, 'html.parser')
+       section_plain_text = section_soup.get_text(' ', strip=True)
+
        # Create anchor URL
        anchor_url: str = f'{page.abs_url}#{heading_id}' if heading_id else page.abs_url or ''

+       record_title = title
+
+       if current_heading.name == 'h2':
+           record_title = f'{title} - {section_title}'
+       elif current_heading.name == 'h3':
+           previous_heading = current_heading.find_previous(['h1', 'h2'])
+           record_title = f'{title} - {previous_heading.get_text()} - {section_title}'
+
+       # print(f'Adding record {record_title}, {rank}, {current_heading.name}')
        # Create record for this section
        records.append(
            AlgoliaRecord(
-               content=section_html,
+               content=section_plain_text,
                pageID=title,
                abs_url=anchor_url,
-               title=f'{title} - {section_title}',
+               title=record_title,
                objectID=anchor_url,
+               rank=rank,
            )
        )

+       rank -= 5
+
    return html

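Not part of the diff, just an illustration of the new record_title and rank logic: for a made-up page titled 'Agents' with an h1 'Agents', an h2 'Running Agents', and an h3 'Streaming' under it, the loop would produce the titles and ranks below, each section ranked 5 lower than the one before it:

# Standalone sketch of the title/rank bookkeeping; the page and headings are invented.
title = 'Agents'
headings = [
    ('h1', 'Agents', None),
    ('h2', 'Running Agents', None),
    ('h3', 'Streaming', 'Running Agents'),  # (tag, section_title, nearest h1/h2 above)
]

rank = 100
for name, section_title, parent_title in headings:
    record_title = title
    if name == 'h2':
        record_title = f'{title} - {section_title}'
    elif name == 'h3':
        record_title = f'{title} - {parent_title} - {section_title}'
    print(record_title, rank)
    rank -= 5

# Agents 100
# Agents - Running Agents 95
# Agents - Running Agents - Streaming 90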
@@ -132,6 +157,16 @@ def algolia_upload() -> None:
    print(f'Uploading {len(filtered_records)} out of {len(all_records)} records to Algolia...')

    client.clear_objects(index_name=ALGOLIA_INDEX_NAME)
+   client.set_settings(
+       index_name=ALGOLIA_INDEX_NAME,
+       index_settings={
+           'searchableAttributes': ['title', 'content'],
+           'attributesToSnippet': ['content:40'],
+           'customRanking': [
+               'desc(rank)',
+           ],
+       },
+   )

    client.batch(
        index_name=ALGOLIA_INDEX_NAME,
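Not part of the diff: a rough local illustration of what 'customRanking': ['desc(rank)'] buys — when hits score the same on Algolia's built-in text relevance criteria, the record with the higher rank (a section nearer the top of its page) comes back first. The sample hits are made up:

# Mimic the desc(rank) tie-break locally: higher rank sorts first.
hits = [
    {'title': 'Agents - Running Agents - Streaming', 'rank': 90},
    {'title': 'Agents', 'rank': 100},
    {'title': 'Agents - Running Agents', 'rank': 95},
]

for hit in sorted(hits, key=lambda h: -h['rank']):
    print(hit['title'])

# Agents
# Agents - Running Agents
# Agents - Running Agents - Streaming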