Skip to content

Commit

Permalink
improve search index for incremental builds
Browse files Browse the repository at this point in the history
add test
  • Loading branch information
2bndy5 committed Oct 4, 2024
1 parent da38810 commit 3661557
Show file tree
Hide file tree
Showing 2 changed files with 65 additions and 13 deletions.
40 changes: 27 additions & 13 deletions sphinx_immaterial/search.py
Original file line number Diff line number Diff line change
@@ -1,8 +1,9 @@
"""Generates a search index for use by the lunr.js-based mkdocs-material search."""

import multiprocessing
import multiprocessing.managers
import pathlib
from typing import Dict, Any, cast
from typing import Dict, Any, cast, List, Optional

import docutils.nodes
import jinja2.sandbox
Expand All @@ -16,6 +17,24 @@

_SEARCH_QUEUE_KEY = "_sphinx_immaterial_search_entry_queue"
_SEARCH_CONFIG = "_sphinx_immaterial_search_config"
_SEARCH_QUEUE_MGR_KEY = "_sphinx_immaterial_search_multiprocessing_manager"


def _init_search_index_queue(app: sphinx.application.Sphinx):
    """Store a manager-backed dict of search entries on the build environment.

    The shared dict is created by the multiprocessing manager found on
    ``app`` under ``_SEARCH_QUEUE_MGR_KEY`` and saved on ``app.env`` under
    ``_SEARCH_QUEUE_KEY``.  If ``app.env`` already carries a mapping under
    that key (presumably left over from an earlier build -- confirm against
    how the environment is persisted), its items seed the new dict;
    otherwise the new dict starts empty.

    :param app: The Sphinx application whose environment receives the dict.
    """
    manager: multiprocessing.managers.SyncManager = getattr(app, _SEARCH_QUEUE_MGR_KEY)
    prev_queue = cast(
        Optional[multiprocessing.managers.DictProxy],
        getattr(app.env, _SEARCH_QUEUE_KEY, None),
    )
    # Snapshot the previous entries into a plain dict and hand it over as a
    # positional mapping.  Unpacking with ``**`` would turn every key into a
    # keyword argument, which only works for ``str`` keys and can clash with
    # a callee's own parameter names.
    initial_entries = {} if prev_queue is None else dict(prev_queue)
    setattr(app.env, _SEARCH_QUEUE_KEY, manager.dict(initial_entries))


def _get_search_config(app: sphinx.application.Sphinx):
Expand Down Expand Up @@ -91,8 +110,9 @@ def _html_page_context(
toc=page_ctx["toc"],
)
)
queue = getattr(app, _SEARCH_QUEUE_KEY)
queue.append(indexer.entries)

queue: Dict[str, List[_Page]] = getattr(app.env, _SEARCH_QUEUE_KEY)
queue[pagename] = indexer.entries


def _build_finished(app: sphinx.application.Sphinx, exc) -> None:
Expand All @@ -104,16 +124,11 @@ def _build_finished(app: sphinx.application.Sphinx, exc) -> None:
if not isinstance(app.builder, sphinx.builders.html.StandaloneHTMLBuilder):
return

queue = getattr(app, _SEARCH_QUEUE_KEY)
queue: Dict[str, List[_Page]] = getattr(app.env, _SEARCH_QUEUE_KEY)
indexer = _make_indexer(app)
for entries in queue[:]:
for entries in queue.values():
indexer.entries.extend(entries)
output_path = pathlib.Path(app.outdir) / "search" / "search_index.json"
# try:
# existing_data = output_path.read_text(encoding='utf-8')

# except FileNotFoundError:
# pass
json_data = indexer.generate_search_index(prev=None)

output_path.parent.mkdir(exist_ok=True)
Expand All @@ -124,9 +139,8 @@ def _build_finished(app: sphinx.application.Sphinx, exc) -> None:
def setup(app: sphinx.application.Sphinx):
app.connect("html-page-context", _html_page_context)
app.connect("build-finished", _build_finished)
manager = multiprocessing.Manager()
setattr(app, "_sphinx_immaterial_search_multiprocessing_manager", manager)
setattr(app, _SEARCH_QUEUE_KEY, manager.list())
app.connect("builder-inited", _init_search_index_queue)
setattr(app, _SEARCH_QUEUE_MGR_KEY, multiprocessing.Manager())
return {
"parallel_read_safe": True,
"parallel_write_safe": True,
Expand Down
38 changes: 38 additions & 0 deletions tests/search_indexer_test.py
Original file line number Diff line number Diff line change
Expand Up @@ -38,3 +38,41 @@ def test_search_metadata(tmp_path: Path, immaterial_make_app):
assert "docs" in index_json
assert len(index_json["docs"]) == 1
assert index_json["docs"][0]["boost"] == "2"


def test_search_incremental_builds(tmp_path: Path, immaterial_make_app):
    """Check that the search index is refreshed by an incremental rebuild.

    Builds the project once, appends text to ``and_more.rst``, builds again
    with the same app, and asserts that the regenerated index still lists
    both pages and that the entry for the edited page contains the new text.
    """
    index_path = tmp_path / "_build" / "html" / "search" / "search_index.json"

    def load_checked_index(path: Path):
        """Parse the index at *path* and assert that both pages are present."""
        parsed = json.loads(path.read_bytes())
        assert "docs" in parsed
        assert len(parsed["docs"]) == 2
        seen_locations = [doc["location"] for doc in parsed["docs"]]
        assert "index.html" in seen_locations
        assert "and_more.html" in seen_locations
        return parsed

    # first (full) build
    app: SphinxTestApp = immaterial_make_app(files=FILES)
    app.build()
    assert index_path.exists()
    baseline = load_checked_index(index_path)

    # append to and_more.rst so that only this document becomes outdated
    source_file = tmp_path / "and_more.rst"
    assert source_file.exists()
    original_bytes = source_file.read_bytes()
    source_file.write_bytes(original_bytes + b"\nSome new content\n")
    assert "and_more" in list(app.builder.get_outdated_docs())

    # second (incremental) build
    app.build()
    rebuilt = load_checked_index(index_path)
    assert rebuilt != baseline

    # locate the first index entry belonging to the edited page
    candidates = (doc for doc in rebuilt["docs"] if doc["location"] == "and_more.html")
    try:
        edited_entry = next(candidates)
    except StopIteration:  # pragma: no cover
        # should be unreachable; guards against future changes to the test
        raise RuntimeError("search index entry for changed file not found") from None
    assert "Some new content" in edited_entry["text"]

0 comments on commit 3661557

Please sign in to comment.