Use suggestion as a search query if the initial one produced no results

marko-bekhta · marko-bekhta · commit ffa26a9e1bee · 2025-03-21T09:33:53.000+01:00
diff --git a/src/main/java/io/quarkus/search/app/SearchService.java b/src/main/java/io/quarkus/search/app/SearchService.java
@@ -21,18 +21,23 @@
 import io.quarkus.search.app.quarkiverseio.QuarkiverseIO;
 import io.quarkus.search.app.quarkusio.QuarkusIO;
 
+import io.quarkus.logging.Log;
+
 import org.hibernate.search.backend.elasticsearch.ElasticsearchExtension;
+import org.hibernate.search.backend.elasticsearch.search.query.ElasticsearchSearchResult;
 import org.hibernate.search.engine.search.common.BooleanOperator;
 import org.hibernate.search.engine.search.common.ValueModel;
 import org.hibernate.search.engine.search.predicate.dsl.MatchPredicateOptionsStep;
 import org.hibernate.search.engine.search.predicate.dsl.PredicateFinalStep;
 import org.hibernate.search.engine.search.predicate.dsl.SearchPredicateFactory;
 import org.hibernate.search.engine.search.predicate.dsl.SimpleQueryFlag;
 import org.hibernate.search.mapper.pojo.standalone.mapping.SearchMapping;
+import org.hibernate.search.mapper.pojo.standalone.session.SearchSession;
 
 import org.eclipse.microprofile.openapi.annotations.Operation;
 import org.jboss.resteasy.reactive.RestQuery;
 
+import com.google.gson.JsonArray;
 import com.google.gson.JsonObject;
 
 @ApplicationScoped
@@ -62,79 +67,97 @@ public SearchResult<GuideSearchHit> search(@RestQuery @DefaultValue(QuarkusVersi
             @RestQuery @DefaultValue("1") @Min(0) @Max(value = 10, message = MAX_FOR_PERF_MESSAGE) int contentSnippets,
             @RestQuery @DefaultValue("100") @Min(0) @Max(value = 200, message = MAX_FOR_PERF_MESSAGE) int contentSnippetsLength) {
         try (var session = searchMapping.createSession()) {
-            var result = session.search(Guide.class)
-                    .extension(ElasticsearchExtension.get())
-                    .select(f -> f.composite().from(
-                            f.id(),
-                            f.field("type"),
-                            f.field("origin"),
-                            f.highlight(language.addSuffix("title")).highlighter("highlighter_title_or_summary").single(),
-                            f.highlight(language.addSuffix("summary")).highlighter("highlighter_title_or_summary").single(),
-                            f.highlight(language.addSuffix("fullContent")).highlighter("highlighter_content"))
-                            .asList(GuideSearchHit::new))
-                    .where((f, root) -> {
-                        // Match all documents by default
-                        root.add(f.matchAll());
-
-                        if (categories != null && !categories.isEmpty()) {
-                            root.add(f.terms().field("categories").matchingAny(categories));
-                        }
-
-                        if (origin != null && !origin.isEmpty()) {
-                            root.add(f.match().field("origin").matching(origin));
-                        }
-
-                        if (q != null && !q.isBlank()) {
-                            root.add(f.or(
-                                    // Duplicate the query so that we apply a multiplicative boost to quarkus.io guides.
-                                    // The end result is that a low-relevance match on quarkus.io _can_ be scored
-                                    // lower than a high-relevance match on quarkiverse.io,
-                                    // if it's significantly more relevant.
-                                    // Note that we could, alternatively,
-                                    // do something like bool().must(textMatch()).should(origin(quarkusio).boost(2f))),
-                                    // but then the boost would be additive, so we would ignore relative relevance
-                                    // of quarkus.io/quarkiverse.io results.
-                                    f.bool().must(textMatch(f, q, language))
-                                            .filter(originMatch(f, QuarkusIO.QUARKUS_ORIGIN))
-                                            // Always score lower for compatibility (legacy) guides.
-                                            // TODO: Maybe we should use a duplicate query with multiplicative boost for this too?
-                                            .should(f.not(f.match().field(language.addSuffix("topics"))
-                                                    .matching("compatibility", ValueModel.INDEX))
-                                                    .boost(50.0f))
-                                            .boost(2.0f),
-                                    f.bool().must(textMatch(f, q, language))
-                                            .filter(originMatch(f, QuarkiverseIO.QUARKIVERSE_ORIGIN))));
-                        }
-                    })
-                    .highlighter(f -> f.fastVector()
-                            // Highlighters are going to use spans-with-classes so that we will have more control over styling the visual on the search results screen.
-                            .tag("<span class=\"" + highlightCssClass + "\">", "</span>"))
-                    .highlighter("highlighter_title_or_summary", f -> f.fastVector()
-                            // We want the whole text of the field, regardless of whether it has a match or not.
-                            .noMatchSize(TITLE_OR_SUMMARY_MAX_SIZE)
-                            .fragmentSize(TITLE_OR_SUMMARY_MAX_SIZE)
-                            // We want the whole text as a single fragment
-                            .numberOfFragments(1))
-                    .highlighter("highlighter_content", f -> f.fastVector()
-                            // If there's no match in the full content we don't want to return anything.
-                            .noMatchSize(0)
-                            // Content is really huge, so we want to only get small parts of the sentences.
-                            // We give control to the caller on the content snippet length and the number of these fragments
-                            .numberOfFragments(contentSnippets)
-                            .fragmentSize(contentSnippetsLength)
-                            // The rest of fragment configuration is static
-                            .orderByScore(true)
-                            // We don't use sentence boundaries because those can result in huge fragments
-                            .boundaryScanner().chars().boundaryMaxScan(10).end())
-                    .sort(f -> f.score().then().field(language.addSuffix("title_sort")))
-                    .routing(QuarkusVersionAndLanguageRoutingBinder.searchKeys(version, language))
-                    .totalHitCountThreshold(TOTAL_HIT_COUNT_THRESHOLD + (page + 1) * PAGE_SIZE)
-                    .requestTransformer(context -> requestSuggestion(context.body(), q, language, highlightCssClass))
-                    .fetch(page * PAGE_SIZE, PAGE_SIZE);
-            return new SearchResult<>(result);
+            var result = performSearch(version, categories, q, origin, language, highlightCssClass, page, contentSnippets,
+                    contentSnippetsLength, session);
+            // hitCount() throws when the total is only a lower bound; hitCountLowerBound() is always available.
+            if (result.total().hitCountLowerBound() > 0) {
+                return new SearchResult<>(result);
+            }
+            SearchResult.Suggestion suggestion = extractSuggestion(result);
+            if (suggestion != null) { // no hits: retry once, using the suggested text as the query
+                result = performSearch(version, categories, suggestion.query(), origin, language, highlightCssClass, page,
+                        contentSnippets, contentSnippetsLength, session);
+            }
+            return new SearchResult<>(result, suggestion);
         }
     }
 
+    private ElasticsearchSearchResult<GuideSearchHit> performSearch(String version, List<String> categories, String q,
+            String origin, Language language, String highlightCssClass, int page, int contentSnippets,
+            int contentSnippetsLength, SearchSession session) {
+        return session.search(Guide.class)
+                .extension(ElasticsearchExtension.get())
+                .select(f -> f.composite().from(
+                        f.id(),
+                        f.field("type"),
+                        f.field("origin"),
+                        f.highlight(language.addSuffix("title")).highlighter("highlighter_title_or_summary").single(),
+                        f.highlight(language.addSuffix("summary")).highlighter("highlighter_title_or_summary").single(),
+                        f.highlight(language.addSuffix("fullContent")).highlighter("highlighter_content"))
+                        .asList(GuideSearchHit::new))
+                .where((f, root) -> {
+                    // Match all documents by default
+                    root.add(f.matchAll());
+
+                    if (categories != null && !categories.isEmpty()) {
+                        root.add(f.terms().field("categories").matchingAny(categories));
+                    }
+
+                    if (origin != null && !origin.isEmpty()) {
+                        root.add(f.match().field("origin").matching(origin));
+                    }
+
+                    if (q != null && !q.isBlank()) {
+                        root.add(f.or(
+                                // Duplicate the query so that we apply a multiplicative boost to quarkus.io guides.
+                                // The end result is that a low-relevance match on quarkus.io _can_ be scored
+                                // lower than a high-relevance match on quarkiverse.io,
+                                // if it's significantly more relevant.
+                                // Note that we could, alternatively,
+                                // do something like bool().must(textMatch()).should(origin(quarkusio).boost(2f))),
+                                // but then the boost would be additive, so we would ignore relative relevance
+                                // of quarkus.io/quarkiverse.io results.
+                                f.bool().must(textMatch(f, q, language))
+                                        .filter(originMatch(f, QuarkusIO.QUARKUS_ORIGIN))
+                                        // Always score lower for compatibility (legacy) guides.
+                                        // TODO: Maybe we should use a duplicate query with multiplicative boost for this too?
+                                        .should(f.not(f.match().field(language.addSuffix("topics"))
+                                                .matching("compatibility", ValueModel.INDEX))
+                                                .boost(50.0f))
+                                        .boost(2.0f),
+                                f.bool().must(textMatch(f, q, language))
+                                        .filter(originMatch(f, QuarkiverseIO.QUARKIVERSE_ORIGIN))));
+                    }
+                })
+                .highlighter(f -> f.fastVector()
+                        // Highlighters are going to use spans-with-classes so that we will have more control over styling the visual on the search results screen.
+                        .tag("<span class=\"" + highlightCssClass + "\">", "</span>"))
+                .highlighter(
+                        "highlighter_title_or_summary", f -> f.fastVector()
+                                // We want the whole text of the field, regardless of whether it has a match or not.
+                                .noMatchSize(TITLE_OR_SUMMARY_MAX_SIZE)
+                                .fragmentSize(TITLE_OR_SUMMARY_MAX_SIZE)
+                                // We want the whole text as a single fragment
+                                .numberOfFragments(1))
+                .highlighter(
+                        "highlighter_content", f -> f.fastVector()
+                                // If there's no match in the full content we don't want to return anything.
+                                .noMatchSize(0)
+                                // Content is really huge, so we want to only get small parts of the sentences.
+                                // We give control to the caller on the content snippet length and the number of these fragments
+                                .numberOfFragments(contentSnippets)
+                                .fragmentSize(contentSnippetsLength)
+                                // The rest of fragment configuration is static
+                                .orderByScore(true)
+                                // We don't use sentence boundaries because those can result in huge fragments
+                                .boundaryScanner().chars().boundaryMaxScan(10).end())
+                .sort(f -> f.score().then().field(language.addSuffix("title_sort")))
+                .routing(QuarkusVersionAndLanguageRoutingBinder.searchKeys(version, language))
+                .totalHitCountThreshold(TOTAL_HIT_COUNT_THRESHOLD + (page + 1) * PAGE_SIZE)
+                .requestTransformer(context -> requestSuggestion(context.body(), q, language, highlightCssClass))
+                .fetch(page * PAGE_SIZE, PAGE_SIZE);
+    }
+
     private PredicateFinalStep textMatch(SearchPredicateFactory f, String q, Language language) {
         return f.simpleQueryString()
                 .field(language.addSuffix("title")).boost(10.0f)
@@ -178,4 +201,25 @@ private void requestSuggestion(JsonObject payload, String q, Language language,
         highlight.addProperty("post_tag", "</span>");
     }
 
+    /** Returns the top "didYouMean" suggestion of the response, or {@code null} if there is none or parsing fails. */
+    private static SearchResult.Suggestion extractSuggestion(ElasticsearchSearchResult<?> result) {
+        try {
+            JsonObject suggest = result.responseBody().getAsJsonObject("suggest");
+            if (suggest != null) {
+                JsonArray options = suggest
+                        .getAsJsonArray("didYouMean").get(0).getAsJsonObject()
+                        .getAsJsonArray("options");
+                if (options != null && !options.isEmpty()) {
+                    JsonObject suggestion = options.get(0).getAsJsonObject();
+                    return new SearchResult.Suggestion(suggestion.get("text").getAsString(),
+                            suggestion.get("highlighted").getAsString());
+                }
+            }
+        } catch (RuntimeException e) {
+            // Best effort: an unexpected suggest payload must not fail the search, so log it and return no suggestion.
+            Log.warnf(e, "Failed to extract suggestion: %s", e.getMessage());
+        }
+        return null;
+    }
+
 }
diff --git a/src/main/java/io/quarkus/search/app/dto/SearchResult.java b/src/main/java/io/quarkus/search/app/dto/SearchResult.java
@@ -2,19 +2,20 @@
 
 import java.util.List;
 
-import io.quarkus.logging.Log;
-
 import org.hibernate.search.backend.elasticsearch.search.query.ElasticsearchSearchResult;
 
-import com.google.gson.JsonArray;
-import com.google.gson.JsonObject;
-
 public record SearchResult<T>(Total total, List<T> hits, Suggestion suggestion) {
 
     public SearchResult(ElasticsearchSearchResult<T> result) {
         this(new Total(result.total().isHitCountExact() ? result.total().hitCount() : null,
                 result.total().hitCountLowerBound()),
-                result.hits(), extractSuggestion(result));
+                result.hits(), null);
+    }
+
+    public SearchResult(ElasticsearchSearchResult<T> result, Suggestion suggestion) {
+        this(new Total(result.total().isHitCountExact() ? result.total().hitCount() : null,
+                result.total().hitCountLowerBound()),
+                result.hits(), suggestion);
     }
 
     public record Total(Long exact, Long lowerBound) {
@@ -23,23 +24,4 @@ public record Total(Long exact, Long lowerBound) {
     public record Suggestion(String query, String highlighted) {
     }
 
-    private static Suggestion extractSuggestion(ElasticsearchSearchResult<?> result) {
-        try {
-            JsonObject suggest = result.responseBody().getAsJsonObject("suggest");
-            if (suggest != null) {
-                JsonArray options = suggest
-                        .getAsJsonArray("didYouMean")
-                        .get(0).getAsJsonObject()
-                        .getAsJsonArray("options");
-                if (options != null && !options.isEmpty()) {
-                    JsonObject suggestion = options.get(0).getAsJsonObject();
-                    return new Suggestion(suggestion.get("text").getAsString(), suggestion.get("highlighted").getAsString());
-                }
-            }
-        } catch (RuntimeException e) {
-            // Though it shouldn't happen, just in case we will catch any exceptions and return no suggestions:
-            Log.warnf(e, "Failed to extract suggestion: %s" + e.getMessage());
-        }
-        return null;
-    }
 }
diff --git a/src/main/resources/web/app/qs-target.ts b/src/main/resources/web/app/qs-target.ts
@@ -42,6 +42,15 @@ export class QsTarget extends LitElement {
       font-style: italic;
       text-align: center;
       background: var(--empty-background-color, #F0CA4D);
+    }
+
+    .search-result-title {
+      margin-top: 2.5rem;
+      font-weight: var(--heading-font-weight);
+    }
+
+    .result-message {
+      margin-bottom: 0px;
       
       .suggestion {
         text-decoration: underline;
@@ -52,11 +61,6 @@ export class QsTarget extends LitElement {
       }
     }
 
-    .search-result-title {
-      margin-top: 2.5rem;
-      font-weight: var(--heading-font-weight);
-    }
-
     qs-guide {
       grid-column: span 4;
       margin: 1rem 0rem 1rem 0rem;
@@ -104,29 +108,32 @@ export class QsTarget extends LitElement {
   render() {
     if (this._result?.hits) {
       if (this._result.hits.length === 0) {
-        if (this._result.suggestion) {
-          return html`
-            <div id="qs-target" class="no-hits">
-              <p>Sorry, no ${this.type}s matched your search.
-                Did you mean <span class="suggestion" @click=${this._querySuggestion}>${unsafeHTML(this._result.suggestion.highlighted)}</span>?</p>
-            </div>
-          `;
-        } else {
-          return html`
+        return html`
           <div id="qs-target" class="no-hits">
             <p>Sorry, no ${this.type}s matched your search. Please try again.</p>
           </div>
         `;
-        }
       }
       const result = this._result.hits.map(i => this._renderHit(i));
-      return html`
-        ${this.searchResultsTitle === '' ? '' : html`<h1 class="search-result-title">${this.searchResultsTitle}</h1>`}
-        <div id="qs-target" class="qs-hits" aria-label="Search Hits">
-          ${result}
-        </div>
-        ${this._loading ? this._renderLoading() : ''}
-      `;
+      if (this._result.suggestion) {
+        return html`
+          ${this.searchResultsTitle === '' ? '' : html`<h1 class="search-result-title">${this.searchResultsTitle}</h1>`}
+            <p class="result-message">Sorry, no ${this.type}s matched your original search query.
+                Showing results for <span class="suggestion" @click=${this._querySuggestion}>${unsafeHTML(this._result.suggestion.highlighted)}</span> instead.</p>
+            <div id="qs-target" class="qs-hits" aria-label="Search Hits">
+              ${result}
+            </div>
+            ${this._loading ? this._renderLoading() : ''}
+          `;
+      } else {
+        return html`
+          ${this.searchResultsTitle === '' ? '' : html`<h1 class="search-result-title">${this.searchResultsTitle}</h1>`}
+          <div id="qs-target" class="qs-hits" aria-label="Search Hits">
+            ${result}
+          </div>
+          ${this._loading ? this._renderLoading() : ''}
+        `;
+      }
     }
     if (this._loading) {
       return html`
diff --git a/src/test/java/io/quarkus/search/app/SearchServiceTest.java b/src/test/java/io/quarkus/search/app/SearchServiceTest.java
@@ -518,7 +518,7 @@ void suggestion() {
                 .isEqualTo("configuring your application");
 
         result = given()
-                .queryParam("q", "vertex")
+                .queryParam("q", "vert.ex")
                 .when().get(GUIDES_SEARCH)
                 .then()
                 .statusCode(200)