We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent cbe1077 commit ef1a519 · Copy full SHA for ef1a519
engine/base_client/search.py
@@ -174,7 +174,9 @@ def cycling_query_generator(queries, total_count):
174
interval_pbar = None
175
176
# Initialize global doc_id offset to ensure uniqueness across intervals
177
- global_doc_id_offset = 0
+ # Start from a high offset to avoid conflicts with uploaded dataset doc_ids
178
+ # Most datasets have < 100M records, so starting from 100M should be safe
179
+ global_doc_id_offset = 100000000
180
181
# Overall accumulators
182
overall_results = []
0 commit comments