diff --git a/effectful/handlers/llm/sampling.py b/effectful/handlers/llm/sampling.py
index effc197d..1778d3b2 100644
--- a/effectful/handlers/llm/sampling.py
+++ b/effectful/handlers/llm/sampling.py
@@ -1,4 +1,5 @@
-from collections import Counter
+from collections import Counter, defaultdict
+from collections.abc import Callable
 from concurrent import futures
 from concurrent.futures.thread import ThreadPoolExecutor
 
@@ -45,3 +46,60 @@ def n_votes_ahead():
                 tasks.append(executor.submit(interpreter(intp)(fwd), *args, **kwargs))
         executor.shutdown()
         return self.votes.most_common(1)[0][0]
+
+
+class ReducedKAheadSampler[**P, T, K](ObjectInterpretation):
+    """KAheadSampler for LLM calls, where votes are generated from LLM outputs."""
+
+    no_voters: int
+    k: int
+    """Number of votes ahead before an answer is accepted"""
+
+    votes: Counter[K] = Counter()
+    results: dict[K, list[T]] = defaultdict(list)
+    reducer: Callable[[T], K]
+    select_best: Callable[[list[T]], T]
+
+    def __init__(
+        self,
+        reducer: Callable[[T], K],
+        select_best: Callable[[list[T]], T] = lambda s: next(iter(s)),
+        no_voters: int = 6,
+        k: int = 3,
+    ):
+        self.no_voters = no_voters
+        self.k = k
+        self.reducer = reducer
+        self.select_best = select_best
+
+    @implements(Template.__call__)
+    def __call__(self, *args: P.args, **kwargs: P.kwargs) -> T:
+        executor = ThreadPoolExecutor()
+        intp = get_interpretation()
+        tasks = [
+            executor.submit(interpreter(intp)(fwd), *args, **kwargs)
+            for _ in range(self.no_voters)
+        ]
+
+        def n_votes_ahead():
+            match self.votes.most_common(2):
+                case [[_, v1], [_, v2]]:
+                    return v1 >= v2 + self.k
+                case [[_, v1]]:
+                    return v1 >= self.k
+                case _:
+                    return False
+
+        while not n_votes_ahead():
+            done, remain = futures.wait(tasks, return_when=futures.FIRST_COMPLETED)
+            tasks = list(remain)
+            for fut in done:
+                res = fut.result()
+                vote = self.reducer(res)
+                self.votes[vote] += 1
+                self.results[vote].append(res)
+                tasks.append(executor.submit(interpreter(intp)(fwd), *args, **kwargs))
+        executor.shutdown()
+        vote = self.votes.most_common(1)[0][0]
+        res = self.select_best(self.results[vote])
+        return res