weaviate · g-despot · May 28, 2026 · May 28, 2026 · May 31, 2026
diff --git a/_includes/code/howto/search.boost.py b/_includes/code/howto/search.boost.py
@@ -0,0 +1,229 @@
+# How-to: Search > Boost results — Python examples.
+#
+# Requires Weaviate v1.38+ and the Python client release that adds Boost
+# support (PR weaviate/weaviate-python-client#2030). Boost is gRPC-only —
+# REST/curl is not supported.
+#
+# Uses the text2vec-transformers vectorizer. Run against the local stack
+# in tests/docker-compose-anon.yml (Weaviate + transformers inference).
+
+import time
+from datetime import datetime, timedelta, timezone
+
+import weaviate
+from weaviate.classes.config import Configure, DataType, Property, Tokenization
+from weaviate.classes.query import Boost, Filter
+
+client = weaviate.connect_to_local()
+
+# ---- Fixture: an Articles collection with date + numeric properties ----
+client.collections.delete("Articles")
+client.collections.create(
+    name="Articles",
+    vector_config=Configure.Vectors.text2vec_transformers(),
+    properties=[
+        Property(name="title", data_type=DataType.TEXT),
+        Property(name="category", data_type=DataType.TEXT, tokenization=Tokenization.FIELD),
+        Property(name="published", data_type=DataType.DATE),
+        Property(name="likes", data_type=DataType.INT),
+        Property(name="price", data_type=DataType.NUMBER),
+        Property(name="draft", data_type=DataType.BOOL),
+    ],
+)
+
+now = datetime.now(timezone.utc)
+articles = client.collections.use("Articles")
+articles.data.insert_many([
+    {"title": "Transformers explained",        "category": "research", "published": now - timedelta(days=2),   "likes": 100,     "price": 49.99, "draft": False},
+    {"title": "Old transformer survey",        "category": "research", "published": now - timedelta(days=400), "likes": 5000,    "price": 49.99, "draft": False},
+    {"title": "How to fine-tune a model",      "category": "tutorial", "published": now - timedelta(days=1),   "likes": 30,      "price": 9.99,  "draft": False},
+    {"title": "Pricing transformers",          "category": "tutorial", "published": now - timedelta(days=10),  "likes": 5000000, "price": 199.0, "draft": False},
+    {"title": "Draft: transformer architecture","category": "research", "published": now - timedelta(days=3),   "likes": 200,     "price": 9.99,  "draft": True},
+])
+
+# Wait briefly for the vectorizer to finish indexing the new objects.
+time.sleep(3)
+
+
+# ==========================================
+# ===== Filter boost (soft WHERE) =====
+# ==========================================
+
+# START BoostFilter
+# Promote articles in the "research" category without filtering others out.
+response = articles.query.near_text(
+    query="transformer architectures",
+    limit=5,
+    # highlight-start
+    boost=Boost.filter(
+        Filter.by_property("category").equal("research"),
+        weight=0.5,
+    ),
+    # highlight-end
+    return_properties=["title", "category"],
+)
+
+for o in response.objects:
+    print(o.properties["category"], "-", o.properties["title"])
+# END BoostFilter
+
+assert response.objects[0].properties["category"] == "research"
+
+
+# ==========================================
+# ===== Property boost (numeric value) =====
+# ==========================================
+
+# START BoostProperty
+# Bias toward articles with more `likes`. LOG1P dampens the long tail so a
+# single 5-million-likes outlier doesn't dominate.
+response = articles.query.near_text(
+    query="transformer architectures",
+    limit=5,
+    # highlight-start
+    boost=Boost.property(
+        "likes",
+        modifier=Boost.Modifier.LOG1P,
+        weight=0.7,
+    ),
+    # highlight-end
+    return_properties=["title", "likes"],
+)
+
+for o in response.objects:
+    print(o.properties["likes"], "-", o.properties["title"])
+# END BoostProperty
+
+
+# ==========================================
+# ===== Time decay (boost recent docs) =====
+# ==========================================
+
+# START BoostTimeDecay
+# Score decays exponentially with age. A 30-day `scale` with `decay=0.5` means
+# an article that's 30 days old gets half the score of one published "now".
+response = articles.query.near_text(
+    query="transformer architectures",
+    limit=5,
+    # highlight-start
+    boost=Boost.time_decay(
+        "published",
+        origin="now",
+        scale=timedelta(days=30),
+        curve=Boost.Curve.EXPONENTIAL,
+        decay=0.5,
+        weight=0.6,
+    ),
+    # highlight-end
+    return_properties=["title", "published"],
+)
+# END BoostTimeDecay
+
+# The 400-day-old "Old transformer survey" should be demoted vs the 2-day-old article.
+top_titles = [o.properties["title"] for o in response.objects[:2]]
+assert "Old transformer survey" not in top_titles
+
+
+# ==========================================
+# ===== Numeric decay (closest to a value) =====
+# ==========================================
+
+# START BoostNumericDecay
+# Score peaks at a target price and falls off symmetrically. Gauss gives a
+# bell-shaped falloff: items within `offset` of $49.99 score 1.0 (no offset
+# is set here), and items one `scale` away ($39.99 or $59.99) score `decay`.
+response = articles.query.near_text(
+    query="transformer architectures",
+    limit=5,
+    # highlight-start
+    boost=Boost.numeric_decay(
+        "price",
+        origin=49.99,
+        scale=10.0,
+        curve=Boost.Curve.GAUSSIAN,
+        decay=0.5,
+        weight=0.5,
+    ),
+    # highlight-end
+    return_properties=["title", "price"],
+)
+# END BoostNumericDecay
+
+
+# ==========================================
+# ===== Blend multiple conditions =====
+# ==========================================
+
+# START BoostBlend
+# Combine two soft signals: recency (weight 2) + popularity (weight 1).
+# The outer weight=0.4 controls how much the blended rank affects the
+# final score; the inner weights are *per-condition* and balance each
+# other.
+response = articles.query.near_text(
+    query="transformer architectures",
+    limit=5,
+    # highlight-start
+    boost=Boost.blend(
+        Boost.time_decay("published", origin="now", scale=timedelta(days=30), weight=2.0),
+        Boost.property("likes", modifier=Boost.Modifier.LOG1P, weight=1.0),
+        weight=0.4,
+        depth=200,  # rescore the top 200 vector matches
+    ),
+    # highlight-end
+    return_properties=["title", "likes", "published"],
+)
+# END BoostBlend
+
+
+# ==========================================
+# ===== Negative weights demote =====
+# ==========================================
+
+# START BoostNegativeWeight
+# A negative per-condition weight pushes matching documents DOWN — they
+# stay in the result set but lose ground against everything else. Use
+# this to deprioritize drafts without filtering them out entirely.
+response = articles.query.bm25(
+    query="transformer",
+    limit=5,
+    # highlight-start
+    boost=Boost.blend(
+        Boost.filter(Filter.by_property("draft").equal(True), weight=-2.0),
+        weight=0.5,
+    ),
+    # highlight-end
+    return_properties=["title", "draft"],
+)
+
+# The draft article is still in results, just no longer first.
+all_titles = [o.properties["title"] for o in response.objects]
+assert any("Draft" in t for t in all_titles)
+assert response.objects[0].properties["draft"] is False
+# END BoostNegativeWeight
+
+
+# ==========================================
+# ===== Boost on hybrid search =====
+# ==========================================
+
+# START BoostOnHybrid
+# Hybrid keeps its own alpha-blend of BM25 + vector. The boost runs once
+# over the fused hybrid result — the sub-search legs don't see it.
+response = articles.query.hybrid(
+    query="transformer architectures",
+    alpha=0.75,
+    limit=5,
+    # highlight-start
+    boost=Boost.blend(
+        Boost.filter(Filter.by_property("category").equal("research"), weight=1.0),
+        Boost.filter(Filter.by_property("draft").equal(True), weight=-2.0),
+        weight=0.3,
+    ),
+    # highlight-end
+    return_properties=["title", "category", "draft"],
+)
+# END BoostOnHybrid
+
+
+client.collections.delete("Articles")
+client.close()
diff --git a/_includes/feature-notes/boost.mdx b/_includes/feature-notes/boost.mdx
@@ -0,0 +1,5 @@
+:::caution Preview — added in `v1.38`
+
+Boost is a preview feature. The API may change in future releases.
+
+:::
diff --git a/docs/deploy/configuration/env-vars/index.md b/docs/deploy/configuration/env-vars/index.md
@@ -90,6 +90,7 @@ import APITable from '@site/src/components/APITable';
 | `PERSISTENCE_LSM_MAX_SEGMENT_SIZE` | Maximum size of a segment in the [LSM store](/weaviate/concepts/storage.md#object-and-inverted-index-store). Set this to limit disk usage spikes during compaction to ~2x the segment size. Default: no limit | `string` | `4GiB` (IEC units), `4GB` (SI units), `4000000000` (bytes) |
 | `PROMETHEUS_MONITORING_ENABLED`  | If set, Weaviate collects [metrics in a Prometheus-compatible format](/deploy/configuration/monitoring.md) | `boolean` | `false` |
 | `PROMETHEUS_MONITORING_GROUP` | If set, Weaviate groups metrics for the same class across all shards. | `boolean` | `true` |
+| `QUERY_BOOST_DEFAULT_DEPTH` | Default candidate-pool size used when a [Boost](/weaviate/search/boost.md) query does not set its own `depth`. The primary search retrieves this many candidates before the boost rescorer runs. Must be a positive integer; hard-capped by `QUERY_MAXIMUM_RESULTS`. Default: `100`<br/>Added in `v1.38` | `string - number` | `200` |
 | `QUERY_CROSS_REFERENCE_DEPTH_LIMIT` | Sets the maximum depth of cross-references to be resolved in a query. Defaults to 5. | `string - number` | `3` |
 | `QUERY_DEFAULTS_LIMIT` | Sets the default number of objects to be returned in a query. | `string - number` | `25` <br/> Defaults to `10`|
 | `QUERY_MAXIMUM_RESULTS` | Sets the maximum total number of objects that can be retrieved. | `string - number` | `10000` |

diff --git a/docs/weaviate/search/bm25.md b/docs/weaviate/search/bm25.md
@@ -16,6 +16,7 @@ import GoCode from '!!raw-loader!/\_includes/code/howto/go/docs/mainpkg/search-b
 import JavaV6Code from "!!raw-loader!/\_includes/code/java-v6/src/test/java/SearchKeywordTest.java";
 import CSharpCode from "!!raw-loader!/\_includes/code/csharp/SearchKeywordTest.cs";
 import GQLCode from '!!raw-loader!/\_includes/code/howto/search.bm25.gql.py';
+import BoostPreview from '/_includes/feature-notes/boost.mdx';
 
 `Keyword` search, also called "BM25 (Best match 25)" or "sparse vector" search, returns objects that have the highest BM25F scores.
 
@@ -764,6 +765,14 @@ Set the tokenization method to `trigram` at the property level when creating you
 
 :::
 
+## Soft-rank with Boost
+
+<BoostPreview/>
+
+Keyword (BM25) queries accept an optional `boost` argument that promotes or demotes matching documents without removing them — useful for biasing results by recency, popularity, a soft filter, or another property. With a positive weight, matching documents move up; with a negative weight, they move down. Non-matching documents stay in the results; only their relative rank changes.
+
+See [Boost](./boost.md) for the supported condition types (filter, property value, time decay, numeric decay), curve choices, blending semantics, and depth tuning.
+
 ## Further resources
 
 - [Connect to Weaviate](../connections/index.mdx)