From 0341b6f7bed04e9348ba6350c95e3432f2ae8059 Mon Sep 17 00:00:00 2001 From: Kyuyeun Kim Date: Mon, 10 Nov 2025 01:40:15 +0000 Subject: [PATCH 01/17] [DO NOT SUBMIT] sliding window optimization Signed-off-by: Kyuyeun Kim --- oss_log_bias.txt | 2513 ++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 2513 insertions(+) create mode 100644 oss_log_bias.txt diff --git a/oss_log_bias.txt b/oss_log_bias.txt new file mode 100644 index 000000000..73c89094c --- /dev/null +++ b/oss_log_bias.txt @@ -0,0 +1,2513 @@ +INFO 11-14 19:00:55 [__init__.py:26] TPU info: node_name=cuiq-infer-v7-2 | tpu_type=tpu7x-8 | worker_id=0 | num_chips=8 | num_cores_per_chip=2 +INFO 11-14 19:00:55 [importing.py:44] Triton is installed but 0 active driver(s) found (expected 1). Disabling Triton to prevent runtime errors. +INFO 11-14 19:00:55 [importing.py:68] Triton not installed or not compatible; certain GPU-related functions will not be available. +WARNING 11-14 19:00:55 [interface.py:197] Failed to import from vllm._C: ModuleNotFoundError("No module named 'vllm._C'") +(APIServer pid=756940) INFO 11-14 19:00:56 [api_server.py:1897] vLLM API server version 0.11.1rc7.dev48+gdf4d3a44a +(APIServer pid=756940) INFO 11-14 19:00:56 [utils.py:253] non-default args: {'model_tag': 'unsloth/gpt-oss-120b-BF16', 'model': 'unsloth/gpt-oss-120b-BF16', 'max_model_len': 8192, 'download_dir': '/mnt/disks/persist', 'tensor_parallel_size': 4, 'data_parallel_size': 2, 'gpu_memory_utilization': 0.98, 'enable_prefix_caching': False, 'max_num_batched_tokens': 8192, 'max_num_seqs': 256, 'async_scheduling': True} +(APIServer pid=756940) INFO 11-14 19:00:56 [model.py:630] Resolved architecture: GptOssForCausalLM +(APIServer pid=756940) INFO 11-14 19:00:56 [model.py:1728] Using max model len 8192 +(APIServer pid=756940) INFO 11-14 19:00:56 [scheduler.py:254] Chunked prefill is enabled with max_num_batched_tokens=8192. +(APIServer pid=756940) INFO 11-14 19:00:56 [config.py:272] Overriding max cuda graph capture size to 1024 for performance. +(APIServer pid=756940) INFO 11-14 19:00:56 [tpu_jax.py:118] Initialized sharding configuration: ShardingConfigManager(total_devices=8, sharding_strategy=ShardingStrategy(tensor_parallelism=4, expert_parallelism=1, sequence_parallelism=1, data_parallelism=2, attention_data_parallelism=1), device_indexes=None) +(APIServer pid=756940) WARNING 11-14 19:00:56 [tpu_jax.py:156] The model dtype is not properly set for JAX backend. Overwriting it to jnp.bfloat16 +(APIServer pid=756940) INFO 11-14 19:00:56 [tpu_jax.py:192] Force using UniProcExecutor for JAX on single host. +INFO 11-14 19:01:00 [__init__.py:26] TPU info: node_name=cuiq-infer-v7-2 | tpu_type=tpu7x-8 | worker_id=0 | num_chips=8 | num_cores_per_chip=2 +INFO 11-14 19:01:00 [importing.py:44] Triton is installed but 0 active driver(s) found (expected 1). Disabling Triton to prevent runtime errors. +INFO 11-14 19:01:00 [importing.py:68] Triton not installed or not compatible; certain GPU-related functions will not be available. +WARNING 11-14 19:01:01 [interface.py:197] Failed to import from vllm._C: ModuleNotFoundError("No module named 'vllm._C'") +(EngineCore_DP0 pid=757112) INFO 11-14 19:01:01 [core.py:94] Initializing a V1 LLM engine (v0.11.1rc7.dev48+gdf4d3a44a) with config: model='unsloth/gpt-oss-120b-BF16', speculative_config=None, tokenizer='unsloth/gpt-oss-120b-BF16', skip_tokenizer_init=False, tokenizer_mode=auto, revision=None, tokenizer_revision=None, trust_remote_code=False, dtype=torch.bfloat16, max_seq_len=8192, download_dir='/mnt/disks/persist', load_format=auto, tensor_parallel_size=4, pipeline_parallel_size=1, data_parallel_size=1, disable_custom_all_reduce=True, quantization=None, enforce_eager=False, kv_cache_dtype=auto, device_config=None, structured_outputs_config=StructuredOutputsConfig(backend='auto', disable_fallback=False, disable_any_whitespace=False, disable_additional_properties=False, reasoning_parser='openai_gptoss', reasoning_parser_plugin='', enable_in_reasoning=False), observability_config=ObservabilityConfig(show_hidden_metrics_for_version=None, otlp_traces_endpoint=None, collect_detailed_traces=None), seed=0, served_model_name=unsloth/gpt-oss-120b-BF16, enable_prefix_caching=False, chunked_prefill_enabled=True, pooler_config=None, compilation_config={'level': None, 'mode': 2, 'debug_dump_path': None, 'cache_dir': '', 'compile_cache_save_format': 'binary', 'backend': 'openxla', 'custom_ops': ['all'], 'splitting_ops': None, 'compile_mm_encoder': True, 'use_inductor': None, 'compile_sizes': None, 'inductor_compile_config': {'enable_auto_functionalized_v2': False}, 'inductor_passes': {}, 'cudagraph_mode': , 'use_cudagraph': True, 'cudagraph_num_of_warmups': 0, 'cudagraph_capture_sizes': None, 'cudagraph_copy_inputs': False, 'full_cuda_graph': False, 'cudagraph_specialize_lora': True, 'use_inductor_graph_partition': False, 'pass_config': {}, 'max_cudagraph_capture_size': 1024, 'local_cache_dir': None} +(EngineCore_DP0 pid=757112) WARNING 11-14 19:01:02 [tpu_jax.py:228] Pin memory is not supported on TPU. +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +(EngineCore_DP0 pid=757112) INFO 11-14 19:01:07 [parallel_state.py:1325] rank 0 in world size 1 is assigned as DP rank 0, PP rank 0, TP rank 0, EP rank 0 +(EngineCore_DP0 pid=757112) INFO 11-14 19:01:07 [tpu_jax_runner.py:273] Init mesh | mesh=Mesh('data': 2, 'model': 4, axis_types=(Auto, Auto)) +(EngineCore_DP0 pid=757112) INFO 11-14 19:01:07 [utils.py:314] Phased-based profiler enabled. Traces will be saved to: gs://wenxindong-vm/trace/gpt_oss/dp2/bias +(EngineCore_DP0 pid=757112) INFO 11-14 19:01:07 [utils.py:93] Prepared token paddings: [16, 32, 64, 128, 256, 512, 1024, 2048, 4096, 8192, 16384] +(EngineCore_DP0 pid=757112) INFO 11-14 19:01:07 [utils.py:59] Prepared request paddings: [8, 16, 32, 64, 128, 256, 512] +(EngineCore_DP0 pid=757112) INFO 11-14 19:01:07 [compilation_manager.py:34] Enabling JAX compile cache. +(EngineCore_DP0 pid=757112) INFO 11-14 19:01:07 [tpu_worker_jax.py:152] Init worker | rank=0 | node_id=0 | is_driver_worker=True | hbm=[(0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75)]GiB +(EngineCore_DP0 pid=757112) INFO 11-14 19:01:07 [model_loader.py:318] Loading model with MODEL_IMPL_TYPE=vllm +(EngineCore_DP0 pid=757112) WARNING 11-14 19:01:08 [rocm.py:34] Failed to import from amdsmi with ModuleNotFoundError("No module named 'amdsmi'") +(EngineCore_DP0 pid=757112) WARNING 11-14 19:01:08 [rocm.py:39] Failed to import from vllm._C with ModuleNotFoundError("No module named 'vllm._C'") +(EngineCore_DP0 pid=757112) WARNING 11-14 19:01:08 [rocm.py:45] Failed to import from vllm._rocm_C with ModuleNotFoundError("No module named 'vllm._rocm_C'") +(EngineCore_DP0 pid=757112) WARNING 11-14 19:01:08 [registry.py:171] _Backend has been renamed to AttentionBackendEnum. Please update your code to use AttentionBackendEnum instead. _Backend will be removed in a future release. +(EngineCore_DP0 pid=757112) INFO 11-14 19:01:08 [tpu_jax.py:63] Cannot use None backend on TPU. +(EngineCore_DP0 pid=757112) INFO 11-14 19:01:08 [tpu_jax.py:66] Using Pallas V1 backend. +(EngineCore_DP0 pid=757112) INFO 11-14 19:01:08 [layer.py:331] Disabling MoE shared_experts cuda stream +(EngineCore_DP0 pid=757112) Loading safetensors checkpoint shards: 0% Completed | 0/73 [00:00 {'num_tokens': 16} +(EngineCore_DP0 pid=757112) /mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torchax/tensor.py:154: UserWarning: Explicitly requested dtype int64 requested in astype is not available, and will be truncated to dtype int32. To enable more dtypes, set the jax_enable_x64 configuration option or the JAX_ENABLE_X64 shell environment variable. See https://github.com/jax-ml/jax#current-gotchas for more. +(EngineCore_DP0 pid=757112) res = jax_function(self._elem, *args, **kwargs) +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) INFO 11-14 19:02:53 [compilation_manager.py:67] Compilation finished in 10.46 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:02:54 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 32} +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:02:55] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) INFO 11-14 19:03:05 [compilation_manager.py:67] Compilation finished in 11.34 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:03:05 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 64} +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) INFO 11-14 19:03:16 [compilation_manager.py:67] Compilation finished in 11.41 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:03:17 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 128} +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:17] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:17] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:17] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:17] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:17] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:17] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:17] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:17] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:17] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:17] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:17] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:17] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:17] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:17] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:17] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:17] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:17] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:17] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:17] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:17] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:17] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:17] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:17] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:17] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:17] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:17] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:17] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:17] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:17] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) INFO 11-14 19:03:33 [compilation_manager.py:67] Compilation finished in 16.28 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:03:33 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 256} +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) INFO 11-14 19:03:50 [compilation_manager.py:67] Compilation finished in 16.98 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:03:50 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 512} +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:03:51] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) INFO 11-14 19:04:08 [compilation_manager.py:67] Compilation finished in 18.27 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:04:08 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 1024} +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:08] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) INFO 11-14 19:04:29 [compilation_manager.py:67] Compilation finished in 20.51 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:04:29 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 2048} +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:29] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:29] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:29] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) INFO 11-14 19:04:49 [compilation_manager.py:67] Compilation finished in 20.01 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:04:49 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 4096} +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:04:50] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) INFO 11-14 19:05:13 [compilation_manager.py:67] Compilation finished in 24.11 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:05:13 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 8192} +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:13] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) INFO 11-14 19:05:44 [compilation_manager.py:67] Compilation finished in 30.21 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:05:44 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 16384} +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:44] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) [2025-11-14 19:05:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:19 [compilation_manager.py:67] Compilation finished in 35.76 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 8} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:20 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 16} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:20 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 32} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:20 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 64} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:20 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 128} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:20 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 256} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:20 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 512} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:21 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:21 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 8} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:21 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:21 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 16} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:21 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:21 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 32} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:21 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:21 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 64} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:21 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:21 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 128} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:21 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:21 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 256} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:21 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:21 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 512} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:22 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:22 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 8} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:22 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:22 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 16} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:22 [compilation_manager.py:67] Compilation finished in 0.16 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:22 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 32} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:22 [compilation_manager.py:67] Compilation finished in 0.16 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:22 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 64} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:22 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:22 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 128} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:22 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:22 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 256} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:23 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:23 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 512} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:23 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:23 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 8} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:23 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:23 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 16} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:23 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:23 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 32} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:23 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:23 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 64} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:23 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:23 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 128} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:24 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:24 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 256} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:24 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:24 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 512} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:24 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:24 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 8} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:24 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:24 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 16} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:24 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:24 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 32} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:24 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:24 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 64} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:25 [compilation_manager.py:67] Compilation finished in 0.22 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:25 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 128} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:25 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:25 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 256} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:25 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:25 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 512} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:25 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:25 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 8} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:25 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:25 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 16} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:26 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:26 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 32} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:26 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:26 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 64} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:26 [compilation_manager.py:67] Compilation finished in 0.23 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:26 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 128} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:26 [compilation_manager.py:67] Compilation finished in 0.29 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:26 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 256} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:26 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:26 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 512} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:27 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:27 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 8} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:27 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:27 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 16} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:27 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:27 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 32} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:27 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:27 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 64} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:27 [compilation_manager.py:67] Compilation finished in 0.22 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:27 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 128} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:28 [compilation_manager.py:67] Compilation finished in 0.30 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:28 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 256} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:28 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:28 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 512} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:28 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:28 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 8} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:28 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:28 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 16} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:28 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:28 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 32} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:29 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:29 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 64} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:29 [compilation_manager.py:67] Compilation finished in 0.21 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:29 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 128} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:29 [compilation_manager.py:67] Compilation finished in 0.29 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:29 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 256} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:29 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:29 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 512} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:29 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:29 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 8} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:30 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:30 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 16} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:30 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:30 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 32} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:30 [compilation_manager.py:67] Compilation finished in 0.21 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:30 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 64} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:30 [compilation_manager.py:67] Compilation finished in 0.22 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:30 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 128} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:30 [compilation_manager.py:67] Compilation finished in 0.29 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:30 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 256} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:31 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:31 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 512} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:31 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:31 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 8} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:31 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:31 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 16} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:31 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:31 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 32} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:31 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:31 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 64} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:32 [compilation_manager.py:67] Compilation finished in 0.23 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:32 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 128} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:32 [compilation_manager.py:67] Compilation finished in 0.29 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:32 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 256} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:32 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:32 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 512} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:32 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:32 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 8} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:32 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:32 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 16} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:33 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:33 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 32} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:33 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:33 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 64} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:33 [compilation_manager.py:67] Compilation finished in 0.21 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:33 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 128} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:33 [compilation_manager.py:67] Compilation finished in 0.31 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:33 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 256} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:34 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:34 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 512} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:34 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:34 [compilation_manager.py:325] Compiling select_from_array with different input shapes. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:34 [compilation_manager.py:304] Compiling select_from_array for select all logits. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:34 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16, 'index_size': 8} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:34 [compilation_manager.py:67] Compilation finished in 0.08 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:34 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16, 'index_size': 16} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:34 [compilation_manager.py:67] Compilation finished in 0.09 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:34 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 32, 'index_size': 8} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:34 [compilation_manager.py:67] Compilation finished in 0.08 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:34 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 32, 'index_size': 16} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:34 [compilation_manager.py:67] Compilation finished in 0.09 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:34 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 32, 'index_size': 32} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:34 [compilation_manager.py:67] Compilation finished in 0.10 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:35 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 64, 'index_size': 8} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:35 [compilation_manager.py:67] Compilation finished in 0.09 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:35 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 64, 'index_size': 16} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:35 [compilation_manager.py:67] Compilation finished in 0.09 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:35 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 64, 'index_size': 32} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:35 [compilation_manager.py:67] Compilation finished in 0.10 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:35 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 64, 'index_size': 64} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:35 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:35 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 8} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:35 [compilation_manager.py:67] Compilation finished in 0.09 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:35 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 16} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:35 [compilation_manager.py:67] Compilation finished in 0.10 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:35 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 32} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:35 [compilation_manager.py:67] Compilation finished in 0.11 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:35 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 64} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:36 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:36 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 128} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:36 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:36 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 8} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:36 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:36 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 16} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:36 [compilation_manager.py:67] Compilation finished in 0.11 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:36 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 32} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:36 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:36 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 64} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:36 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:36 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 128} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:37 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:37 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 256} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:37 [compilation_manager.py:67] Compilation finished in 0.35 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:37 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 8} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:37 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:37 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 16} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:37 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:37 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 32} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:38 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:38 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 64} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:38 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:38 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 128} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:38 [compilation_manager.py:67] Compilation finished in 0.23 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:38 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 256} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:38 [compilation_manager.py:67] Compilation finished in 0.33 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:38 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 512} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:39 [compilation_manager.py:67] Compilation finished in 0.56 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:39 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 8} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:39 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:39 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 16} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:40 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:40 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 32} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:40 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:40 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 64} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:40 [compilation_manager.py:67] Compilation finished in 0.23 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:40 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 128} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:40 [compilation_manager.py:67] Compilation finished in 0.28 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:40 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 256} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:41 [compilation_manager.py:67] Compilation finished in 0.44 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:41 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 512} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:41 [compilation_manager.py:67] Compilation finished in 0.70 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:42 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 8} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:42 [compilation_manager.py:67] Compilation finished in 0.28 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:42 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 16} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:42 [compilation_manager.py:67] Compilation finished in 0.32 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:42 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 32} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:43 [compilation_manager.py:67] Compilation finished in 0.30 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:43 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 64} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:43 [compilation_manager.py:67] Compilation finished in 0.34 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:43 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 128} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:43 [compilation_manager.py:67] Compilation finished in 0.38 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:43 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 256} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:44 [compilation_manager.py:67] Compilation finished in 0.52 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:44 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 512} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:45 [compilation_manager.py:67] Compilation finished in 0.77 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:45 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 8} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:45 [compilation_manager.py:67] Compilation finished in 0.46 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:45 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 16} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:46 [compilation_manager.py:67] Compilation finished in 0.45 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:46 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 32} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:46 [compilation_manager.py:67] Compilation finished in 0.46 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:46 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 64} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:47 [compilation_manager.py:67] Compilation finished in 0.60 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:47 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 128} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:47 [compilation_manager.py:67] Compilation finished in 0.56 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:47 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 256} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:48 [compilation_manager.py:67] Compilation finished in 0.68 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:48 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 512} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:49 [compilation_manager.py:67] Compilation finished in 0.85 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:49 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 8} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:49 [compilation_manager.py:67] Compilation finished in 0.16 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:49 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 16} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:49 [compilation_manager.py:67] Compilation finished in 0.16 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:49 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 32} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:50 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:50 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 64} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:50 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:50 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 128} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:50 [compilation_manager.py:67] Compilation finished in 0.21 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:50 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 256} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:50 [compilation_manager.py:67] Compilation finished in 0.32 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:50 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 512} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:51 [compilation_manager.py:67] Compilation finished in 0.60 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:51 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 8} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:51 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:51 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 16} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:51 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:51 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 32} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:51 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:51 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 64} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:52 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:52 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 128} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:52 [compilation_manager.py:67] Compilation finished in 0.21 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:52 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 256} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:52 [compilation_manager.py:67] Compilation finished in 0.53 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:52 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 512} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:53 [compilation_manager.py:67] Compilation finished in 0.73 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:53 [compilation_manager.py:365] Compiling compute_logits with different input shapes. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:53 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 8} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:53 [compilation_manager.py:67] Compilation finished in 0.31 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:53 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 16} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:54 [compilation_manager.py:67] Compilation finished in 0.31 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:54 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 32} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:54 [compilation_manager.py:67] Compilation finished in 0.35 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:54 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 64} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:55 [compilation_manager.py:67] Compilation finished in 0.41 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:55 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 128} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:55 [compilation_manager.py:67] Compilation finished in 0.89 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:55 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 256} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:56 [compilation_manager.py:67] Compilation finished in 0.85 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:56 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 512} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:57 [compilation_manager.py:67] Compilation finished in 1.09 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:57 [compilation_manager.py:387] Compiling sampling with different input shapes. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:58 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 8, 'do_sampling': True} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:58 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:58 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 8, 'do_sampling': False} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:58 [compilation_manager.py:67] Compilation finished in 0.23 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:59 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 16, 'do_sampling': True} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:59 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:59 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 16, 'do_sampling': False} +(EngineCore_DP0 pid=757112) INFO 11-14 19:06:59 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:00 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 32, 'do_sampling': True} +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:00 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:00 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 32, 'do_sampling': False} +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:00 [compilation_manager.py:67] Compilation finished in 0.32 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:01 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 64, 'do_sampling': True} +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:01 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:01 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 64, 'do_sampling': False} +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:01 [compilation_manager.py:67] Compilation finished in 0.55 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:02 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 128, 'do_sampling': True} +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:02 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:02 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 128, 'do_sampling': False} +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:02 [compilation_manager.py:67] Compilation finished in 0.02 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:02 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 256, 'do_sampling': True} +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:02 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:02 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 256, 'do_sampling': False} +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:03 [compilation_manager.py:67] Compilation finished in 0.26 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:03 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 512, 'do_sampling': True} +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:03 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:03 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 512, 'do_sampling': False} +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:03 [compilation_manager.py:67] Compilation finished in 0.42 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:03 [compilation_manager.py:455] Compiling gather_logprobs with different input shapes. +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:03 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 8} +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:04 [compilation_manager.py:67] Compilation finished in 0.74 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:04 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 16} +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:05 [compilation_manager.py:67] Compilation finished in 0.82 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:05 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 32} +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:05 [compilation_manager.py:67] Compilation finished in 0.04 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:05 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 64} +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:05 [compilation_manager.py:67] Compilation finished in 0.04 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:05 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 128} +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:05 [compilation_manager.py:67] Compilation finished in 0.04 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:05 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 256} +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:05 [compilation_manager.py:67] Compilation finished in 0.04 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:05 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 512} +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:05 [compilation_manager.py:67] Compilation finished in 0.05 [secs]. +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:05 [compilation_manager.py:751] Compiling structured_decoding with different input shapes. +(EngineCore_DP0 pid=757112) WARNING 11-14 19:07:05 [compilation_manager.py:754] Structured decoding precompilation skipped since structured decoding is not supported with DP. +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:05 [core.py:247] init engine (profile, create kv cache, warmup model) took 266.20 seconds +(EngineCore_DP0 pid=757112) WARNING 11-14 19:07:06 [scheduler.py:158] Using custom scheduler class . This scheduler interface is not public and compatibility may not be maintained. +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:06 [dp_scheduler.py:93] DPScheduler (Async = True) per-rank limits: max_seqs=256, max_tokens=8192 +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:06 [core.py:181] Batch queue is enabled with size 2 +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:07 [tpu_jax.py:118] Initialized sharding configuration: ShardingConfigManager(total_devices=4, sharding_strategy=ShardingStrategy(tensor_parallelism=4, expert_parallelism=1, sequence_parallelism=1, data_parallelism=1, attention_data_parallelism=1), device_indexes=None) +(EngineCore_DP0 pid=757112) WARNING 11-14 19:07:07 [tpu_jax.py:156] The model dtype is not properly set for JAX backend. Overwriting it to jnp.bfloat16 +(EngineCore_DP0 pid=757112) INFO 11-14 19:07:07 [tpu_jax.py:192] Force using UniProcExecutor for JAX on single host. +(APIServer pid=756940) [INFO] model_hosting_container_standards - decorators.py:76: [PING] Framework handler registered: ping +(APIServer pid=756940) [2025-11-14 19:07:07] INFO decorators.py:76: [PING] Framework handler registered: ping +(APIServer pid=756940) [INFO] model_hosting_container_standards.common.transforms.base_factory - base_factory.py:90: [INJECT_ADAPTER_ID] Transform decorator applied to: invocations +(APIServer pid=756940) [2025-11-14 19:07:07] INFO base_factory.py:90: [INJECT_ADAPTER_ID] Transform decorator applied to: invocations +(APIServer pid=756940) [INFO] model_hosting_container_standards.common.transforms.base_factory - base_factory.py:115: [INJECT_ADAPTER_ID] Registered transform handler for invocations +(APIServer pid=756940) [2025-11-14 19:07:07] INFO base_factory.py:115: [INJECT_ADAPTER_ID] Registered transform handler for invocations +(APIServer pid=756940) [INFO] model_hosting_container_standards.common.transforms.base_factory - base_factory.py:90: [STATEFUL_SESSION_MANAGER] Transform decorator applied to: decorated_func +(APIServer pid=756940) [2025-11-14 19:07:07] INFO base_factory.py:90: [STATEFUL_SESSION_MANAGER] Transform decorator applied to: decorated_func +(APIServer pid=756940) [INFO] model_hosting_container_standards.common.transforms.base_factory - base_factory.py:115: [STATEFUL_SESSION_MANAGER] Registered transform handler for decorated_func +(APIServer pid=756940) [2025-11-14 19:07:07] INFO base_factory.py:115: [STATEFUL_SESSION_MANAGER] Registered transform handler for decorated_func +(APIServer pid=756940) [INFO] model_hosting_container_standards - decorators.py:76: [INVOKE] Framework handler registered: decorated_func +(APIServer pid=756940) [2025-11-14 19:07:07] INFO decorators.py:76: [INVOKE] Framework handler registered: decorated_func +(APIServer pid=756940) [INFO] model_hosting_container_standards - __init__.py:127: Starting SageMaker bootstrap process +(APIServer pid=756940) [2025-11-14 19:07:07] INFO __init__.py:127: Starting SageMaker bootstrap process +(APIServer pid=756940) [INFO] model_hosting_container_standards - registry.py:109: [REGISTRY] Middleware resolution and registration complete +(APIServer pid=756940) [2025-11-14 19:07:07] INFO registry.py:109: [REGISTRY] Middleware resolution and registration complete +(APIServer pid=756940) [INFO] model_hosting_container_standards - core.py:100: [MIDDLEWARE_LOADER] Middleware stack rebuilt successfully +(APIServer pid=756940) [2025-11-14 19:07:07] INFO core.py:100: [MIDDLEWARE_LOADER] Middleware stack rebuilt successfully +(APIServer pid=756940) [INFO] model_hosting_container_standards - core.py:102: [MIDDLEWARE_LOADER] Processed 3 middlewares +(APIServer pid=756940) [2025-11-14 19:07:07] INFO core.py:102: [MIDDLEWARE_LOADER] Processed 3 middlewares +(APIServer pid=756940) [WARNING] model_hosting_container_standards.common.custom_code_ref_resolver.function_loader - function_loader.py:73: Failed to load function from spec 'model:custom_sagemaker_invocation_handler': HandlerFileNotFoundError: File '/opt/ml/model/model.py' not found in search paths: ['/opt/ml/model/'] +(APIServer pid=756940) [2025-11-14 19:07:07] WARNING function_loader.py:73: Failed to load function from spec 'model:custom_sagemaker_invocation_handler': HandlerFileNotFoundError: File '/opt/ml/model/model.py' not found in search paths: ['/opt/ml/model/'] +(APIServer pid=756940) [WARNING] model_hosting_container_standards.common.custom_code_ref_resolver.function_loader - function_loader.py:73: Failed to load function from spec 'model:custom_sagemaker_ping_handler': HandlerFileNotFoundError: File '/opt/ml/model/model.py' not found in search paths: ['/opt/ml/model/'] +(APIServer pid=756940) [2025-11-14 19:07:07] WARNING function_loader.py:73: Failed to load function from spec 'model:custom_sagemaker_ping_handler': HandlerFileNotFoundError: File '/opt/ml/model/model.py' not found in search paths: ['/opt/ml/model/'] +(APIServer pid=756940) [INFO] model_hosting_container_standards.sagemaker.sagemaker_router - sagemaker_router.py:93: Creating SageMaker router with unified route resolver +(APIServer pid=756940) [2025-11-14 19:07:07] INFO sagemaker_router.py:93: Creating SageMaker router with unified route resolver +(APIServer pid=756940) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:172: Creating router with prefix='', tags=['sagemaker'] +(APIServer pid=756940) [2025-11-14 19:07:07] INFO routing.py:172: Creating router with prefix='', tags=['sagemaker'] +(APIServer pid=756940) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:110: Mounting 2 handlers to router +(APIServer pid=756940) [2025-11-14 19:07:07] INFO routing.py:110: Mounting 2 handlers to router +(APIServer pid=756940) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:184: Router created with 0 routes +(APIServer pid=756940) [2025-11-14 19:07:07] INFO routing.py:184: Router created with 0 routes +(APIServer pid=756940) [INFO] model_hosting_container_standards.sagemaker.sagemaker_router - sagemaker_router.py:101: SageMaker router created successfully with 0 routes +(APIServer pid=756940) [2025-11-14 19:07:07] INFO sagemaker_router.py:101: SageMaker router created successfully with 0 routes +(APIServer pid=756940) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:287: Including router with conflict detection +(APIServer pid=756940) [2025-11-14 19:07:07] INFO routing.py:287: Including router with conflict detection +(APIServer pid=756940) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:305: Successfully included router with 0 routes +(APIServer pid=756940) [2025-11-14 19:07:07] INFO routing.py:305: Successfully included router with 0 routes +(APIServer pid=756940) [INFO] model_hosting_container_standards - __init__.py:139: SageMaker bootstrap completed successfully +(APIServer pid=756940) [2025-11-14 19:07:07] INFO __init__.py:139: SageMaker bootstrap completed successfully +(APIServer pid=756940) INFO 11-14 19:07:07 [api_server.py:1662] Supported tasks: ['generate'] +(APIServer pid=756940) WARNING 11-14 19:07:07 [serving_responses.py:189] For gpt-oss, we ignore --enable-auto-tool-choice and always enable tool use. +(APIServer pid=756940) INFO 11-14 19:07:07 [api_server.py:1972] Starting vLLM API server 0 on http://0.0.0.0:8000 +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:38] Available routes are: +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:46] Route: /openapi.json, Methods: HEAD, GET +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:46] Route: /docs, Methods: HEAD, GET +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:46] Route: /docs/oauth2-redirect, Methods: HEAD, GET +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:46] Route: /redoc, Methods: HEAD, GET +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:46] Route: /health, Methods: GET +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:46] Route: /load, Methods: GET +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:46] Route: /tokenize, Methods: POST +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:46] Route: /detokenize, Methods: POST +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:46] Route: /v1/models, Methods: GET +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:46] Route: /version, Methods: GET +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:46] Route: /v1/responses, Methods: POST +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:46] Route: /v1/responses/{response_id}, Methods: GET +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:46] Route: /v1/responses/{response_id}/cancel, Methods: POST +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:46] Route: /v1/messages, Methods: POST +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:46] Route: /v1/chat/completions, Methods: POST +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:46] Route: /v1/completions, Methods: POST +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:46] Route: /v1/embeddings, Methods: POST +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:46] Route: /pooling, Methods: POST +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:46] Route: /classify, Methods: POST +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:46] Route: /score, Methods: POST +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:46] Route: /v1/score, Methods: POST +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:46] Route: /v1/audio/transcriptions, Methods: POST +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:46] Route: /v1/audio/translations, Methods: POST +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:46] Route: /rerank, Methods: POST +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:46] Route: /v1/rerank, Methods: POST +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:46] Route: /v2/rerank, Methods: POST +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:46] Route: /scale_elastic_ep, Methods: POST +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:46] Route: /is_scaling_elastic_ep, Methods: POST +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:46] Route: /ping, Methods: GET +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:46] Route: /ping, Methods: POST +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:46] Route: /invocations, Methods: POST +(APIServer pid=756940) INFO 11-14 19:07:07 [launcher.py:46] Route: /metrics, Methods: GET +(APIServer pid=756940) INFO: Started server process [756940] +(APIServer pid=756940) INFO: Waiting for application startup. +(APIServer pid=756940) INFO: Application startup complete. +(APIServer pid=756940) INFO: 127.0.0.1:52498 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO 11-14 19:08:57 [loggers.py:221] Engine 000: Avg prompt throughput: 204.8 tokens/s, Avg generation throughput: 75.1 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:09:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 100.0 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:09:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 100.0 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:09:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 100.0 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:09:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 100.0 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.2%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:09:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 100.0 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.2%, Prefix cache hit rate: 0.0% +(EngineCore_DP0 pid=757112) WARNING 11-14 19:09:51 [tpu_jax_runner.py:666] Should not schedule a request that does nothing! +(APIServer pid=756940) INFO: 127.0.0.1:52498 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33190 - "POST /v1/completions HTTP/1.1" 200 OK +(EngineCore_DP0 pid=757112) INFO 11-14 19:09:52 [utils.py:358] Starting profiling for prefill_heavy phase +(EngineCore_DP0 pid=757112) INFO 11-14 19:09:52 [utils.py:359] Batch composition stats: {'total_num_scheduled_tokens': 2048, 'num_prefill_tokens': 2048, 'num_decode_tokens': 1, 'padded_total_num_scheduled_tokens': 4096, 'num_reqs': 2} +(APIServer pid=756940) INFO: 127.0.0.1:33202 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33204 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33218 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33230 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33244 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33252 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33264 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33272 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33282 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33292 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33306 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33318 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33320 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33332 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33344 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33346 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33358 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33360 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33364 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33366 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33368 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33384 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33392 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33408 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33422 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33426 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33442 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33448 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33458 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33462 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33468 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33472 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33474 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33480 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33490 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33496 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33508 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33516 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33530 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33544 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33554 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33558 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33574 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33586 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33594 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33604 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33616 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33630 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33636 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33640 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33656 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33662 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33670 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33672 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33676 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33684 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33686 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33692 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33700 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33702 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33712 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33720 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33722 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33738 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33746 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33754 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33762 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33772 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33778 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33792 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33808 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33816 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33824 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33834 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33844 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33858 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33866 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33876 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33880 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33886 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33894 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33904 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33914 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33924 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33940 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33952 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33968 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33984 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:33998 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34014 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34022 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34030 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34044 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34056 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34064 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34076 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34088 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34100 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34114 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34116 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34128 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34132 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34140 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34146 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34152 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34166 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34182 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34190 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34202 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34210 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34220 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34222 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34236 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34248 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34264 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34276 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34290 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34294 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34296 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34306 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34308 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34324 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34340 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34342 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34350 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34356 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34364 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34366 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34370 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34386 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34388 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34404 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34412 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34416 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34428 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34444 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34460 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34462 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34476 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34478 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34494 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34498 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34506 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34518 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34524 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34540 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34552 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34558 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34568 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34578 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34592 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34598 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34606 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34614 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34616 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34618 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34622 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34628 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34638 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34640 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34652 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34664 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34670 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34686 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34690 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34706 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34710 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34726 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34728 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34742 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34744 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34756 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34760 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34766 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34770 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34786 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34790 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34792 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34800 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34804 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34808 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34824 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34836 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34850 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34864 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34866 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34872 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34876 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34878 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34884 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34900 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34906 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34914 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34924 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34930 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34946 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34960 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34966 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34972 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34974 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34988 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34990 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34994 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:34998 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35004 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35006 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35010 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35016 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35024 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35026 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35038 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35040 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35056 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35072 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35078 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35090 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35098 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35102 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35114 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35120 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35132 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35146 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35160 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35162 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35174 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35178 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35184 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35192 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35194 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35208 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35222 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35232 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35246 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35256 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35260 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35266 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35280 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35282 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35298 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35314 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35322 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35332 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35342 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35344 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35352 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35360 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35372 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35380 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35396 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35406 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35416 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35422 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35428 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35434 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35438 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35450 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35456 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35462 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35478 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35492 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35508 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35522 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35526 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35538 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35550 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35566 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35576 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35590 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35602 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35608 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35618 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35626 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35638 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35648 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35662 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35674 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35682 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35698 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35700 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35710 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35724 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35736 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35738 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35748 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35760 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35774 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35788 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35802 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35816 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35826 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35840 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35854 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35858 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35872 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35886 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35898 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35906 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35908 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35924 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35936 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35944 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35956 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35962 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35978 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35986 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:35994 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36002 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36018 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36028 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36032 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36040 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36046 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36052 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36062 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36068 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36078 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36088 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36094 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36100 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36110 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36126 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36136 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36144 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36150 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36156 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36170 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36176 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36188 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36198 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36200 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36206 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36222 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36236 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36238 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36254 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36270 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36284 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36300 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36314 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36316 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36322 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36334 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36342 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36346 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36352 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36356 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36370 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36374 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36376 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36380 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36392 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36400 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36412 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36428 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36440 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36444 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36454 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36456 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36460 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36476 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36484 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36496 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36512 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36516 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36532 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36540 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36542 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36548 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36556 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36566 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36572 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36578 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36588 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36590 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36606 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36622 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36632 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36638 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36646 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36658 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36664 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36678 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36686 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36702 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36714 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36730 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36740 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36744 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36754 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36756 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36766 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36778 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36792 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36804 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36814 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36820 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36832 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36840 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36842 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36850 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36864 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36866 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36876 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36884 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36900 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36904 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36908 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36910 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36914 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36920 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36926 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36938 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36942 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36944 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36952 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36964 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36966 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36978 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36980 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:36992 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37004 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37012 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37020 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37030 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37034 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37048 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37054 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37066 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37074 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37076 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37082 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37086 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37092 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37098 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37112 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37128 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37136 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37142 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37146 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37154 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37166 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37180 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37192 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37206 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37214 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37220 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37234 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37242 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37250 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37252 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37258 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37268 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37280 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37294 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37298 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37300 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37314 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37316 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37328 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37336 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37350 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37360 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37376 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37388 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37400 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37410 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37420 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37424 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37436 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37442 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37456 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37458 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37474 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37490 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37494 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37496 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37504 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37520 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37524 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37536 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37546 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37550 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37562 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37564 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37578 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37586 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37594 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37596 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37606 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37618 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37620 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37632 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37640 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37644 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37646 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37660 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37666 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37674 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37688 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37690 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37704 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37718 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37722 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37734 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37744 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37756 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37758 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37774 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37782 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37796 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37804 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37814 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37816 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37820 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37830 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37832 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37842 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37850 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37862 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37864 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37878 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37894 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37898 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37910 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37922 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37938 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37948 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37962 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37966 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37976 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:37984 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38000 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38004 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38012 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38020 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38024 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38040 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38044 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38054 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38062 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38076 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38082 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38090 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38100 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38104 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38118 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38128 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38144 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38156 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38162 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38170 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38172 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38186 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38202 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38204 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38220 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38228 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38232 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38240 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38250 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38252 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38268 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38280 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38288 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38298 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38306 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38312 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38324 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38334 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38346 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38360 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38366 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38368 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38378 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38380 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38390 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38396 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38410 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38424 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38440 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38448 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38462 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38474 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38484 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38498 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38506 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38514 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38524 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38540 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38548 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38556 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38558 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38562 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38574 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38586 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38596 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38604 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38612 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38624 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38630 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38632 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38634 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38646 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38658 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38660 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38672 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38680 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38690 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38700 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38710 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38722 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38734 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38746 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38762 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38774 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38780 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38796 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38808 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38822 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38824 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38840 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38846 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38852 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38866 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38868 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38880 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38894 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38896 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38906 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38916 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38932 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38946 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38958 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38962 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38974 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38990 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38992 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:38996 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39002 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39016 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39026 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39036 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39048 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39060 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39064 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39076 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39088 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39104 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39108 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39110 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39126 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39140 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39150 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39156 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39172 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39176 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39190 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39202 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39212 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39222 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39224 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39238 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39252 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39260 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39264 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39270 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39278 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39288 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39300 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39306 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39308 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39322 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39330 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39332 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39340 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39352 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39366 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39376 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39390 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39404 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39420 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39432 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39438 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39450 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39454 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39464 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39472 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39474 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39490 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39504 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39508 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39518 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39522 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39538 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39546 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39552 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39556 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39570 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39586 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39598 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39610 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39622 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39638 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39652 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39654 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39668 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39682 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39688 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39692 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39708 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39710 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39726 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39732 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39748 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39762 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39778 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39784 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39794 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39804 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39814 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39822 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39836 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39840 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39848 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39864 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39874 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39880 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39884 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39886 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39898 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39912 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39928 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39932 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39942 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39958 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39970 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39972 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39976 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39990 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:39994 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40002 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40018 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40032 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40036 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40052 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40058 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40060 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40064 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40080 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40084 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40088 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40100 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40116 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40124 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40136 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40142 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40144 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40150 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40158 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40170 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40182 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40188 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40200 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40206 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40214 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40220 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40232 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40244 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40254 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40256 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40268 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40276 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40278 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40286 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40290 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40298 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40314 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40324 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40336 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40348 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40354 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40358 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40374 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40386 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40388 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40400 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40408 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40418 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40428 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40438 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40444 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40452 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40460 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40472 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40478 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40482 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40494 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40508 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40522 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40536 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40542 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40544 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40554 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40568 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40572 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40578 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40594 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40596 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40610 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40620 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40634 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40650 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40660 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40666 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40674 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40688 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40690 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40698 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40702 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40706 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40718 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40728 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40730 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40734 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40746 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40762 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40770 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40782 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40798 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40806 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40808 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40820 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40830 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40834 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40850 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40864 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40872 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40884 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40898 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40914 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40928 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40940 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40950 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40952 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40958 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40972 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40984 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40990 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:40996 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41008 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41018 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41020 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41028 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41040 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41048 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41064 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41068 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41078 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41088 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41104 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41116 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41120 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41122 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41128 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41130 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41146 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41156 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41168 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41182 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41188 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41204 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41218 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41226 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41236 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41240 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41252 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41254 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41264 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41266 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41274 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41276 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41292 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41298 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41312 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41318 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41332 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41342 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41352 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41364 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41380 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41382 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41392 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41400 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41406 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41412 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41414 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41416 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41430 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41434 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41444 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41460 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41466 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41476 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41486 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41500 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41504 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41516 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41524 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41540 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41554 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41570 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41584 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41594 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41600 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41608 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41624 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41630 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41644 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41656 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41668 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41678 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41692 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41700 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41708 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41722 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41730 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41734 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41742 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41756 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41770 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41772 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41774 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41788 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41792 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41800 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41814 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41828 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41840 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41852 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41856 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41866 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41880 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41888 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41890 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41906 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41916 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41930 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41936 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41952 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41958 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41972 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41988 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:41998 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42008 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42016 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42018 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42034 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42050 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42062 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42064 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42070 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42078 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42086 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42100 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42108 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42114 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42122 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42132 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42134 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42144 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42148 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42154 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42158 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42160 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42174 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42188 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42200 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42214 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42230 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42234 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42242 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42244 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42254 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42264 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42274 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42280 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42286 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42296 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42302 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42316 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42324 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42330 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42336 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42348 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42360 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42368 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42380 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42396 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42410 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42420 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42428 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42442 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42448 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42456 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42464 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42466 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42468 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42476 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42482 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42486 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42488 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42498 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42502 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42504 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42506 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42520 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42532 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42536 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42552 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42564 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42576 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO: 127.0.0.1:42586 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=756940) INFO 11-14 19:09:57 [loggers.py:221] Engine 000: Avg prompt throughput: 13106.7 tokens/s, Avg generation throughput: 71.6 tokens/s, Running: 74 reqs, Waiting: 950 reqs, GPU KV cache usage: 4.0%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:10:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 0.0 tokens/s, Running: 74 reqs, Waiting: 950 reqs, GPU KV cache usage: 4.0%, Prefix cache hit rate: 0.0% +(EngineCore_DP0 pid=757112) INFO 11-14 19:10:21 [utils.py:397] Profiling for prefill_heavy phase finished +(APIServer pid=756940) INFO 11-14 19:10:27 [loggers.py:221] Engine 000: Avg prompt throughput: 21298.5 tokens/s, Avg generation throughput: 156.0 tokens/s, Running: 178 reqs, Waiting: 846 reqs, GPU KV cache usage: 9.6%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:10:37 [loggers.py:221] Engine 000: Avg prompt throughput: 33997.7 tokens/s, Avg generation throughput: 535.6 tokens/s, Running: 344 reqs, Waiting: 680 reqs, GPU KV cache usage: 18.6%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:10:47 [loggers.py:221] Engine 000: Avg prompt throughput: 33585.8 tokens/s, Avg generation throughput: 881.2 tokens/s, Running: 508 reqs, Waiting: 516 reqs, GPU KV cache usage: 27.5%, Prefix cache hit rate: 0.0% +(EngineCore_DP0 pid=757112) INFO 11-14 19:10:48 [utils.py:358] Starting profiling for decode_heavy phase +(EngineCore_DP0 pid=757112) INFO 11-14 19:10:48 [utils.py:359] Batch composition stats: {'total_num_scheduled_tokens': 256, 'num_prefill_tokens': 0, 'num_decode_tokens': 512, 'padded_total_num_scheduled_tokens': 512, 'num_reqs': 512} +(APIServer pid=756940) INFO 11-14 19:10:57 [loggers.py:221] Engine 000: Avg prompt throughput: 2867.0 tokens/s, Avg generation throughput: 562.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 27.8%, Prefix cache hit rate: 0.0% +(EngineCore_DP0 pid=757112) INFO 11-14 19:11:07 [utils.py:397] Profiling for decode_heavy phase finished +(APIServer pid=756940) INFO 11-14 19:11:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 716.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 27.8%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:11:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 9109.3 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 28.3%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:11:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 9059.7 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 30.9%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:11:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 9059.2 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 34.0%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:11:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 9111.2 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 35.5%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:11:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 9112.4 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 37.1%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:12:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 9266.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 40.2%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:12:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 9315.2 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 43.0%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:12:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 9214.2 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 43.3%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:12:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 9263.7 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 46.4%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:12:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 9214.1 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 49.5%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:12:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 9109.9 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 49.9%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:13:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6706.8 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 52.6%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:13:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6193.5 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 52.8%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:13:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7729.4 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 55.6%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:13:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7883.8 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 58.3%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:13:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7882.5 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 58.7%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:13:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7933.4 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 61.8%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:14:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7985.2 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 62.2%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:14:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7780.0 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 64.9%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:14:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7882.5 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 67.7%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:14:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7778.1 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 68.0%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:14:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7831.0 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 71.1%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:14:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7780.7 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 71.2%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:15:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7780.9 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 74.2%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:15:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7778.9 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 76.6%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:15:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7679.7 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 77.3%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:15:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7780.4 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 80.4%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:15:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7677.7 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 80.4%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:15:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7728.5 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 83.5%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:16:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7575.5 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 85.1%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:16:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7727.5 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 86.6%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:16:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7677.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 89.7%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:16:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7575.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 89.7%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:16:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7677.3 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 92.7%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:16:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7625.2 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 93.4%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:17:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7576.0 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 95.8%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:17:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7522.3 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 98.4%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:17:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7473.7 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 98.9%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:17:37 [loggers.py:221] Engine 000: Avg prompt throughput: 17204.0 tokens/s, Avg generation throughput: 3521.0 tokens/s, Running: 502 reqs, Waiting: 418 reqs, GPU KV cache usage: 83.9%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:17:47 [loggers.py:221] Engine 000: Avg prompt throughput: 31946.3 tokens/s, Avg generation throughput: 995.9 tokens/s, Running: 500 reqs, Waiting: 262 reqs, GPU KV cache usage: 61.8%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:17:57 [loggers.py:221] Engine 000: Avg prompt throughput: 31948.2 tokens/s, Avg generation throughput: 992.2 tokens/s, Running: 496 reqs, Waiting: 108 reqs, GPU KV cache usage: 39.7%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:18:07 [loggers.py:221] Engine 000: Avg prompt throughput: 23750.2 tokens/s, Avg generation throughput: 3303.9 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 27.8%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:18:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 9057.3 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 29.5%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:18:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 9111.8 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 30.9%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:18:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 9060.2 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 34.0%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:18:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 9110.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 36.7%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:18:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 9110.6 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 37.1%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:19:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 9264.8 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 40.2%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:19:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 9264.4 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 43.3%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:19:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 9216.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 43.7%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:19:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 9266.8 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 46.4%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:19:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 9215.4 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 49.5%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:19:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 9009.5 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 51.1%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:20:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6448.7 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 52.6%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:20:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6397.2 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 54.0%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:20:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7884.0 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 55.6%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:20:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7881.8 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 58.7%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:20:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7934.2 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 58.7%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:20:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7986.9 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 61.8%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:21:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7935.4 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 63.5%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:21:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7831.4 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 64.9%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:21:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7882.3 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 68.0%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:21:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7830.9 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 68.0%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:21:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7831.3 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 71.1%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:21:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7730.4 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 72.6%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:22:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7882.3 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 74.2%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:22:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7729.6 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 77.3%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:22:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7780.5 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 77.3%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:22:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7780.2 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 80.4%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:22:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7780.4 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 81.5%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:22:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7677.7 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 83.5%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:23:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7677.3 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 86.6%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:23:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7729.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 86.6%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:23:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7679.7 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 89.7%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:23:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7679.0 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 90.0%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:23:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7575.5 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 92.7%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:23:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7678.2 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 95.1%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:24:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7576.0 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 95.8%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:24:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7626.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 98.9%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:24:28 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7624.2 tokens/s, Running: 511 reqs, Waiting: 0 reqs, GPU KV cache usage: 98.7%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:24:38 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 2485.7 tokens/s, Running: 0 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.0%, Prefix cache hit rate: 0.0% +(APIServer pid=756940) INFO 11-14 19:24:48 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 0.0 tokens/s, Running: 0 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.0%, Prefix cache hit rate: 0.0% From acd671443c5f668365de8f90fcc46fb7dbd61631 Mon Sep 17 00:00:00 2001 From: wenxindongwork Date: Wed, 12 Nov 2025 21:57:54 +0000 Subject: [PATCH 02/17] wip --- tpu_inference/layers/vllm/fused_moe.py | 106 ++++++++++++------ .../layers/vllm/quantization/common.py | 28 +++-- .../layers/vllm/quantization/unquantized.py | 24 ++-- tpu_inference/layers/vllm/sharding.py | 11 +- 4 files changed, 114 insertions(+), 55 deletions(-) diff --git a/tpu_inference/layers/vllm/fused_moe.py b/tpu_inference/layers/vllm/fused_moe.py index fa9a45288..dfc61224f 100644 --- a/tpu_inference/layers/vllm/fused_moe.py +++ b/tpu_inference/layers/vllm/fused_moe.py @@ -8,7 +8,7 @@ from tpu_inference.layers.vllm.linear_common import \ slice_sharded_tensor_for_concatenation - +from tpu_inference.layers.jax.sharding import ShardingAxisName P = PartitionSpec @@ -110,7 +110,7 @@ def tensor_sharded_gmm_merged_column_parallel( # adapted from https://github.com/pytorch/xla/blob/1d409399474197c484894be90b75d9855393dda5/torch_xla/experimental/custom_kernel.py#L1401 m, k, g = lhs.shape[0], lhs.shape[1], rhs.shape[0] n = rhs.shape[1] if transpose_rhs else rhs.shape[2] - tm, tk, tn = _get_tiling_size_for_gmm_kernel(m, k, n, g) + tm, tk, tn = _get_tiling_size_for_gmm_kernel(m//mesh.shape["data"], k, n, g) _gmm = functools.partial( gmm, @@ -123,8 +123,8 @@ def tensor_sharded_gmm_merged_column_parallel( gmm_result = shard_map( _gmm, mesh=mesh, - in_specs=(P(), P(None, "model", None), P()), - out_specs=(P(None, "model")), + in_specs=(P(ShardingAxisName.MLP_DATA, None), P(None, ShardingAxisName.EXPERT, None), P(ShardingAxisName.MLP_DATA)), + out_specs=(P(ShardingAxisName.MLP_DATA, ShardingAxisName.MLP_TENSOR)), check_rep=False, )(lhs, rhs, group_sizes) @@ -132,7 +132,7 @@ def tensor_sharded_gmm_merged_column_parallel( rhs_bis = jnp.repeat(rhs_bias, group_sizes, 0, total_repeat_length=m) gmm_result = (gmm_result + rhs_bis).astype(gmm_result.dtype) - n_shards = mesh.shape["model"] + n_shards = mesh.shape['model'] * mesh.shape['attn_dp'] output_sizes = [intermediate_size, intermediate_size] return slice_sharded_tensor_for_concatenation(gmm_result, output_sizes, @@ -150,7 +150,7 @@ def tensor_sharded_gmm_row_parallel( # adapted from https://github.com/pytorch/xla/blob/1d409399474197c484894be90b75d9855393dda5/torch_xla/experimental/custom_kernel.py#L1401 m, k, g = lhs.shape[0], lhs.shape[1], rhs.shape[0] n = rhs.shape[1] if transpose_rhs else rhs.shape[2] - tm, tk, tn = _get_tiling_size_for_gmm_kernel(m, k, n, g) + tm, tk, tn = _get_tiling_size_for_gmm_kernel(m//mesh.shape["data"], k, n, g) _gmm = functools.partial( gmm, @@ -162,17 +162,19 @@ def tensor_sharded_gmm_row_parallel( def _gmm_all_reduce(lhs, rhs, group_sizes): r = _gmm(lhs, rhs, group_sizes) - return jax.lax.psum(r, axis_name="model") + return jax.lax.psum(r, axis_name=ShardingAxisName.MLP_TENSOR) gmm_result = shard_map( _gmm_all_reduce, mesh=mesh, - in_specs=(P(None, "model"), P(None, None, "model"), P()), - out_specs=(P()), - check_rep=False, + in_specs=(P(ShardingAxisName.MLP_DATA, ShardingAxisName.MLP_TENSOR), + P(None, None, ShardingAxisName.MLP_TENSOR), P(ShardingAxisName.MLP_DATA)), + out_specs=(P(ShardingAxisName.MLP_DATA)), + check_rep=False, )(lhs, rhs, group_sizes) if rhs_bias is not None: + print("rhs_bias is not None") rhs_bias = jnp.repeat(rhs_bias, group_sizes, 0, total_repeat_length=m) gmm_result = (gmm_result + rhs_bias).astype(gmm_result.dtype) @@ -196,8 +198,7 @@ def expert_sharded_gmm( num_experts_per_shard = num_experts // ep_size group_offset = jnp.arange(0, num_experts, num_experts_per_shard) group_offset = jax.lax.with_sharding_constraint( - group_offset, NamedSharding(mesh, P("model"))) - + group_offset, NamedSharding(mesh, P(ShardingAxisName.EXPERT))) def _gmm(lhs, rhs, group_sizes, group_offset): # Group offset for this shard. `group_offset` is sharded, and in this # sharded function, it has only 1 element and `group_offset.shape` is @@ -236,8 +237,9 @@ def _gmm(lhs, rhs, group_sizes, group_offset): gmm_res = shard_map( _gmm, mesh=mesh, - in_specs=(P(), P("model", None, None), P(), P("model")), - out_specs=(P("model", None)), + in_specs=(P(), P(ShardingAxisName.EXPERT, None, + None), P(), P(ShardingAxisName.EXPERT)), + out_specs=(P(ShardingAxisName.EXPERT, None)), check_rep=False, )(lhs, rhs, group_sizes, group_offset) @@ -256,12 +258,11 @@ def _gmm(lhs, rhs, group_sizes, group_offset): recv_sizes = send_sizes input_offsets = jax.lax.with_sharding_constraint( - input_offsets, NamedSharding(mesh, P("model"))) + input_offsets, NamedSharding(mesh, P(ShardingAxisName.EXPERT))) send_sizes = jax.lax.with_sharding_constraint( - send_sizes, NamedSharding(mesh, P("model"))) + send_sizes, NamedSharding(mesh, P(ShardingAxisName.EXPERT))) output_offsets = jax.lax.with_sharding_constraint( - output_offsets, NamedSharding(mesh, P("model"))) - + output_offsets, NamedSharding(mesh, P(ShardingAxisName.EXPERT))) def _ragged_all_to_all(operand, input_offsets, send_sizes, output_offsets, recv_sizes): output = jnp.zeros_like(operand) @@ -292,8 +293,7 @@ def _ragged_all_to_all(operand, input_offsets, send_sizes, output_offsets, send_sizes_of_shard, output_offsets_of_shard, recv_sizes_of_shard, - axis_name="model") - + axis_name=ShardingAxisName.EXPERT) # Use ragged_all_to_all to send the result from gmm for each expert to all # the shards. In the working example, the result would be: # A, A, A, A A, A, A, A A, A, A, A A, A, A, A @@ -314,7 +314,8 @@ def _ragged_all_to_all(operand, input_offsets, send_sizes, output_offsets, return shard_map( _ragged_all_to_all, mesh=mesh, - in_specs=(P("model", None), P("model"), P("model"), P("model"), P()), + in_specs=(P(ShardingAxisName.EXPERT, None), P(ShardingAxisName.EXPERT), + P(ShardingAxisName.EXPERT), P(ShardingAxisName.EXPERT), P()), out_specs=(P()), check_rep=False, )(gmm_res, input_offsets, send_sizes, output_offsets, recv_sizes) @@ -347,16 +348,24 @@ def fused_moe_func( raise NotImplementedError( "Bias is not supported when using expert parallelism.") orig_shape = hidden_states.shape + print(f"orig_shape: {orig_shape}") hidden_size = hidden_states.shape[-1] num_tokens = hidden_states.size // hidden_size assert global_num_experts == w1.shape[0] - ep_size = mesh.shape["model"] # only used if use_ep is True. + ep_size = mesh.shape['model'] * mesh.shape[ + "attn_dp"] # only used if use_ep is True. intermediate_size = w2.shape[-1] dtype = hidden_states.dtype assert (num_tokens * topk) % 16 == 0, ( "The kernel requires num_tokens * topk to be a multiple of " f"16 but got {num_tokens}*{topk}={num_tokens*topk}") + hidden_states = jax.lax.with_sharding_constraint( + hidden_states, NamedSharding(mesh, P(ShardingAxisName.MLP_DATA, None))) + + gating_output = jax.lax.with_sharding_constraint( + gating_output, NamedSharding(mesh, P(ShardingAxisName.MLP_DATA, None))) + hidden_states = hidden_states.reshape(num_tokens, hidden_size) gating_output = gating_output.reshape(num_tokens, global_num_experts) @@ -366,14 +375,27 @@ def fused_moe_func( topk_weights = topk_weights / topk_weights.sum(axis=-1, keepdims=True) topk_weights = topk_weights.astype(dtype) - topk_indices_flat = topk_indices.flatten() - topk_argsort_indices = jnp.argsort(topk_indices_flat) - topk_argsort_revert_indices = jnp.argsort(topk_argsort_indices) - token_indices = jnp.arange(num_tokens, dtype=jnp.int32).repeat(topk) - token_indices_sorted = token_indices[topk_argsort_indices] - group_sizes = jnp.bincount(topk_indices_flat, length=global_num_experts) - - x = hidden_states[token_indices_sorted] + # Use shard_map for all sorting and gathering operations to enable parallel + # computation on each shard. Each shard processes its local tokens independently. + def _process_tokens_locally(hidden_states_local, topk_indices_local): + num_tokens_local = hidden_states_local.shape[0] + topk_indices_flat = topk_indices_local.flatten() + topk_argsort_indices = jnp.argsort(topk_indices_flat) + topk_argsort_revert_indices = jnp.argsort(topk_argsort_indices) + token_indices = jnp.arange(num_tokens_local, dtype=jnp.int32).repeat(topk) + token_indices_sorted = token_indices[topk_argsort_indices] + group_sizes = jnp.bincount(topk_indices_flat, length=global_num_experts) + + x = hidden_states_local[token_indices_sorted] + return x, group_sizes, topk_argsort_revert_indices + + x, group_sizes, topk_argsort_revert_indices = shard_map( + _process_tokens_locally, + mesh=mesh, + in_specs=(P(ShardingAxisName.MLP_DATA, None), P(ShardingAxisName.MLP_DATA, None)), + out_specs=(P(ShardingAxisName.MLP_DATA, None), P(), P(ShardingAxisName.MLP_DATA)), + check_rep=False, + )(hidden_states, topk_indices) if use_ep: x = expert_sharded_gmm( @@ -411,7 +433,7 @@ def fused_moe_func( ) else: x = jax.lax.with_sharding_constraint( - x, NamedSharding(mesh, P(None, "model"))) + x, NamedSharding(mesh, P(ShardingAxisName.MLP_DATA, "model"))) x = tensor_sharded_gmm_row_parallel( x, w2, @@ -421,13 +443,25 @@ def fused_moe_func( mesh=mesh, ) - x = x[topk_argsort_revert_indices].reshape(-1, topk, hidden_size) - x = x * jnp.expand_dims(topk_weights, axis=-1) - x = x.sum(axis=-2) + # Use shard_map for reordering and final reduction to process each shard locally + def _finalize_output(x_local, topk_argsort_revert_indices_local, topk_weights_local): + x_local = x_local[topk_argsort_revert_indices_local].reshape(-1, topk, hidden_size) + x_local = x_local * jnp.expand_dims(topk_weights_local, axis=-1) + x_local = x_local.sum(axis=-2) + return x_local + + x = shard_map( + _finalize_output, + mesh=mesh, + in_specs=(P(ShardingAxisName.MLP_DATA, None), P(ShardingAxisName.MLP_DATA), P(ShardingAxisName.MLP_DATA, None)), + out_specs=(P(ShardingAxisName.MLP_DATA, None)), + check_rep=False, + )(x, topk_argsort_revert_indices, topk_weights) + x = x.reshape(orig_shape) if reduce_results: - x = jax.lax.with_sharding_constraint(x, NamedSharding(mesh, P())) + x = jax.lax.with_sharding_constraint(x, NamedSharding(mesh, P(ShardingAxisName.MLP_DATA))) return x @@ -462,6 +496,7 @@ def fused_moe_func_padded( hidden_size = hidden_states.shape[-1] num_tokens = hidden_states.size // hidden_size if num_tokens * topk < 16: + print("num_tokens * topk < 16") assert 16 % (num_tokens * topk) == 0, f"Cannot pad to 16: {num_tokens=}, {topk=}" n_repeats = 16 // (num_tokens * topk) @@ -490,6 +525,7 @@ def fused_moe_func_padded( x = expanded_x[:hidden_states.shape[0]] return x else: + print("num_tokens * topk >= 16") return fused_moe_func( hidden_states, w1, diff --git a/tpu_inference/layers/vllm/quantization/common.py b/tpu_inference/layers/vllm/quantization/common.py index 381dce392..f443d6a26 100644 --- a/tpu_inference/layers/vllm/quantization/common.py +++ b/tpu_inference/layers/vllm/quantization/common.py @@ -11,6 +11,7 @@ ReplicatedLinear, RowParallelLinear) +from tpu_inference.layers.jax.sharding import ShardingAxisName from tpu_inference.layers.vllm.linear_common import \ get_model_matmul_fusion_assignment from tpu_inference.utils import TPU_SECOND_LAST_MINOR @@ -34,15 +35,23 @@ def __init__(self, vllm_config: VllmConfig, mesh: Mesh, layer: LinearBase): self.enable_sequence_parallelism = vllm_config.compilation_config.pass_config.enable_sequence_parallelism self.input_sharding = None self.output_sharding = None + self.tp_size = self.mesh.shape['model'] * self.mesh.shape.get( + 'attn_dp', 1) if isinstance(layer, RowParallelLinear): - self.weight_sharding = P(None, "model") + self.weight_sharding = P(None, ShardingAxisName.MLP_TENSOR) if self.enable_sequence_parallelism: - self.output_sharding = P("model", None) + self.output_sharding = P(ShardingAxisName.MLP_TENSOR, None) elif isinstance(layer, ColumnParallelLinear): - self.weight_sharding = P("model", None) + if isinstance(layer, QKVParallelLinear): + self.input_sharding = P(ShardingAxisName.ATTN_DATA, None) + self.weight_sharding = P('model', None) + self.output_sharding = P(ShardingAxisName.ATTN_DATA, "model") + else: + self.weight_sharding = P(ShardingAxisName.MLP_TENSOR, None) + if self.enable_sequence_parallelism: - self.input_sharding = P("model", None) + self.input_sharding = P(ShardingAxisName.MLP_TENSOR, None) if isinstance(layer, MergedColumnParallelLinear) or isinstance( layer, QKVParallelLinear): @@ -61,13 +70,18 @@ def __init__(self, vllm_config: VllmConfig, mesh: Mesh, layer: LinearBase): " bad performance.", type(layer)) self.bias_sharding = P(self.weight_sharding[0]) - self.n_shards = self.mesh.shape.get(self.weight_sharding[0], 1) + if isinstance(self.weight_sharding[0], tuple): + self.n_shards = 1 + for axis in self.weight_sharding[0]: + self.n_shards *= self.mesh.shape.get(axis, 1) + else: + self.n_shards = self.mesh.shape.get(self.weight_sharding[0], 1) def get_input_sharding(self, x: torchax.tensor.Tensor): if self.enable_sequence_parallelism: token_num = x.shape[0] # NOTE(chengjiyao): make sure the sharded token_num is larger than TPU_SECOND_LAST_MINOR - if token_num // self.mesh.shape["model"] >= TPU_SECOND_LAST_MINOR: + if token_num // self.tp_size >= TPU_SECOND_LAST_MINOR: return self.input_sharding else: return None @@ -77,7 +91,7 @@ def get_output_sharding(self, x: torchax.tensor.Tensor): if self.enable_sequence_parallelism: token_num = x.shape[0] # NOTE(chengjiyao): make sure the sharded token_num is larger than TPU_SECOND_LAST_MINOR - if token_num // self.mesh.shape["model"] >= TPU_SECOND_LAST_MINOR: + if token_num // self.tp_size >= TPU_SECOND_LAST_MINOR: return self.output_sharding else: return None diff --git a/tpu_inference/layers/vllm/quantization/unquantized.py b/tpu_inference/layers/vllm/quantization/unquantized.py index 590511ea1..141b192d3 100644 --- a/tpu_inference/layers/vllm/quantization/unquantized.py +++ b/tpu_inference/layers/vllm/quantization/unquantized.py @@ -25,6 +25,8 @@ from tpu_inference.kernels.fused_moe.v1.kernel import fused_ep_moe from tpu_inference.layers.common.quant_methods import (UNQUANTIZED, get_tpu_quant_method) +from tpu_inference.layers.jax.sharding import ShardingAxisName + from tpu_inference.layers.vllm.fused_moe import fused_moe_func_padded from tpu_inference.layers.vllm.linear_common import ( reorder_concatenated_tensor_for_sharding, @@ -261,38 +263,42 @@ def process_weights_after_loading(self, layer: torch.nn.Module) -> None: w13_weight = jax.device_put( w13_weight, Format(Layout((0, 1, 2)), - NamedSharding(self.mesh, P("model", None, None)))) + NamedSharding(self.mesh, P(ShardingAxisName.EXPERT, None, None)))) w2_weight = jax.device_put( w2_weight, Format(Layout((0, 1, 2)), - NamedSharding(self.mesh, P("model", None, None)))) + NamedSharding(self.mesh, P(ShardingAxisName.EXPERT, None, None)))) if self.moe.has_bias: w13_bias = jax.device_put( w13_bias, Format(Layout((0, 1)), - NamedSharding(self.mesh, P("model", None)))) + NamedSharding(self.mesh, P(ShardingAxisName.EXPERT, None)))) w2_bias = jax.device_put( w2_bias, Format(Layout((0, 1)), - NamedSharding(self.mesh, P("model", None)))) + NamedSharding(self.mesh, P(ShardingAxisName.EXPERT, None)))) else: intermediate_size = w13_weight.shape[1] // 2 assert intermediate_size == w2_weight.shape[-1] output_sizes = [intermediate_size, intermediate_size] - n_shards = self.mesh.shape["model"] + n_shards = self.mesh.shape['model'] * self.mesh.shape.get( + "attn_dp", 1) assert intermediate_size % n_shards == 0 w13_weight = reorder_concatenated_tensor_for_sharding( w13_weight, output_sizes, n_shards, dim=1) w13_weight = jax.device_put( w13_weight, - Format(Layout((0, 1, 2)), - NamedSharding(self.mesh, P(None, "model", None)))) + Format( + Layout((0, 1, 2)), + NamedSharding( + self.mesh, + P(None, ShardingAxisName.MLP_TENSOR, None)))) w2_weight = jax.device_put( w2_weight, Format(Layout((0, 1, 2)), - NamedSharding(self.mesh, P(None, None, "model")))) + NamedSharding(self.mesh, P(None, None,ShardingAxisName.MLP_TENSOR)))) if self.moe.has_bias: w13_bias = reorder_concatenated_tensor_for_sharding( @@ -300,7 +306,7 @@ def process_weights_after_loading(self, layer: torch.nn.Module) -> None: w13_bias = jax.device_put( w13_bias, Format(Layout((0, 1)), - NamedSharding(self.mesh, P(None, "model")))) + NamedSharding(self.mesh, P(None, ShardingAxisName.MLP_TENSOR)))) w2_bias = jax.device_put( w2_bias, Format(Layout((0, 1)), diff --git a/tpu_inference/layers/vllm/sharding.py b/tpu_inference/layers/vllm/sharding.py index b06f8b35f..fc1bc983b 100644 --- a/tpu_inference/layers/vllm/sharding.py +++ b/tpu_inference/layers/vllm/sharding.py @@ -19,6 +19,7 @@ from vllm.model_executor.layers.vocab_parallel_embedding import ( ParallelLMHead, VocabParallelEmbedding) +from tpu_inference.layers.jax.sharding import ShardingAxisName from tpu_inference.logger import init_logger P = PartitionSpec @@ -108,7 +109,8 @@ def _shard_tensor_to_tpu_replicated(tensor: torch.Tensor, def _shard_vocab_parallel_embedding(layer: VocabParallelEmbedding, mesh: Mesh) -> None: weight = _convert_to_torchax_and_shard( - layer.weight, NamedSharding(mesh, P('model', None))) + layer.weight, NamedSharding(mesh, P(ShardingAxisName.MLP_TENSOR, + None))) layer.weight = Parameter(weight, requires_grad=False) @@ -117,11 +119,12 @@ def _shard_lm_head(layer: ParallelLMHead, mesh: Mesh): # if that config is set, then we should not create new weights but reuse the # weight from VocabParallelEmbedding weight = _convert_to_torchax_and_shard( - layer.weight, NamedSharding(mesh, P('model', None))) + layer.weight, NamedSharding(mesh, P(ShardingAxisName.MLP_TENSOR, + None))) layer.weight = Parameter(weight, requires_grad=False) if layer.bias is not None: - bias = _convert_to_torchax_and_shard(layer.bias, - NamedSharding(mesh, P('model'))) + bias = _convert_to_torchax_and_shard( + layer.bias, NamedSharding(mesh, P(ShardingAxisName.MLP_TENSOR))) layer.bias = Parameter(bias, requires_grad=False) From 298b9fbea62aec0a5c023c7a7712bac78cd9d679 Mon Sep 17 00:00:00 2001 From: wenxindongwork Date: Wed, 12 Nov 2025 22:17:49 +0000 Subject: [PATCH 03/17] wip --- tpu_inference/layers/vllm/fused_moe.py | 19 +++++++------------ tpu_inference/runner/kv_cache_manager.py | 2 +- 2 files changed, 8 insertions(+), 13 deletions(-) diff --git a/tpu_inference/layers/vllm/fused_moe.py b/tpu_inference/layers/vllm/fused_moe.py index dfc61224f..34db15a64 100644 --- a/tpu_inference/layers/vllm/fused_moe.py +++ b/tpu_inference/layers/vllm/fused_moe.py @@ -123,13 +123,14 @@ def tensor_sharded_gmm_merged_column_parallel( gmm_result = shard_map( _gmm, mesh=mesh, - in_specs=(P(ShardingAxisName.MLP_DATA, None), P(None, ShardingAxisName.EXPERT, None), P(ShardingAxisName.MLP_DATA)), + in_specs=(P(ShardingAxisName.MLP_DATA, None), P(None, ShardingAxisName.MLP_TENSOR, None), P(ShardingAxisName.MLP_DATA)), out_specs=(P(ShardingAxisName.MLP_DATA, ShardingAxisName.MLP_TENSOR)), check_rep=False, )(lhs, rhs, group_sizes) if rhs_bias is not None: rhs_bis = jnp.repeat(rhs_bias, group_sizes, 0, total_repeat_length=m) + # Maybe need to add sharding constraint here gmm_result = (gmm_result + rhs_bis).astype(gmm_result.dtype) n_shards = mesh.shape['model'] * mesh.shape['attn_dp'] @@ -174,8 +175,9 @@ def _gmm_all_reduce(lhs, rhs, group_sizes): )(lhs, rhs, group_sizes) if rhs_bias is not None: - print("rhs_bias is not None") + rhs_bias = jnp.repeat(rhs_bias, group_sizes, 0, total_repeat_length=m) + # wenxindong: Maybe need to add sharding constraint here gmm_result = (gmm_result + rhs_bias).astype(gmm_result.dtype) return gmm_result @@ -193,7 +195,7 @@ def expert_sharded_gmm( # adapted from https://github.com/pytorch/xla/blob/1d409399474197c484894be90b75d9855393dda5/torch_xla/experimental/custom_kernel.py#L1401 m, k, g = lhs.shape[0], lhs.shape[1], rhs.shape[0] n = rhs.shape[1] if transpose_rhs else rhs.shape[2] - tm, tk, tn = _get_tiling_size_for_gmm_kernel(m, k, n, g) + tm, tk, tn = _get_tiling_size_for_gmm_kernel(m//mesh.shape["data"], k, n, g) num_experts_per_shard = num_experts // ep_size group_offset = jnp.arange(0, num_experts, num_experts_per_shard) @@ -237,8 +239,8 @@ def _gmm(lhs, rhs, group_sizes, group_offset): gmm_res = shard_map( _gmm, mesh=mesh, - in_specs=(P(), P(ShardingAxisName.EXPERT, None, - None), P(), P(ShardingAxisName.EXPERT)), + in_specs=(P(ShardingAxisName.MLP_DATA, None), P(ShardingAxisName.EXPERT, None, + None), P(ShardingAxisName.MLP_DATA), P(ShardingAxisName.EXPERT)), out_specs=(P(ShardingAxisName.EXPERT, None)), check_rep=False, )(lhs, rhs, group_sizes, group_offset) @@ -348,7 +350,6 @@ def fused_moe_func( raise NotImplementedError( "Bias is not supported when using expert parallelism.") orig_shape = hidden_states.shape - print(f"orig_shape: {orig_shape}") hidden_size = hidden_states.shape[-1] num_tokens = hidden_states.size // hidden_size assert global_num_experts == w1.shape[0] @@ -359,7 +360,6 @@ def fused_moe_func( assert (num_tokens * topk) % 16 == 0, ( "The kernel requires num_tokens * topk to be a multiple of " f"16 but got {num_tokens}*{topk}={num_tokens*topk}") - hidden_states = jax.lax.with_sharding_constraint( hidden_states, NamedSharding(mesh, P(ShardingAxisName.MLP_DATA, None))) @@ -375,8 +375,6 @@ def fused_moe_func( topk_weights = topk_weights / topk_weights.sum(axis=-1, keepdims=True) topk_weights = topk_weights.astype(dtype) - # Use shard_map for all sorting and gathering operations to enable parallel - # computation on each shard. Each shard processes its local tokens independently. def _process_tokens_locally(hidden_states_local, topk_indices_local): num_tokens_local = hidden_states_local.shape[0] topk_indices_flat = topk_indices_local.flatten() @@ -443,7 +441,6 @@ def _process_tokens_locally(hidden_states_local, topk_indices_local): mesh=mesh, ) - # Use shard_map for reordering and final reduction to process each shard locally def _finalize_output(x_local, topk_argsort_revert_indices_local, topk_weights_local): x_local = x_local[topk_argsort_revert_indices_local].reshape(-1, topk, hidden_size) x_local = x_local * jnp.expand_dims(topk_weights_local, axis=-1) @@ -496,7 +493,6 @@ def fused_moe_func_padded( hidden_size = hidden_states.shape[-1] num_tokens = hidden_states.size // hidden_size if num_tokens * topk < 16: - print("num_tokens * topk < 16") assert 16 % (num_tokens * topk) == 0, f"Cannot pad to 16: {num_tokens=}, {topk=}" n_repeats = 16 // (num_tokens * topk) @@ -525,7 +521,6 @@ def fused_moe_func_padded( x = expanded_x[:hidden_states.shape[0]] return x else: - print("num_tokens * topk >= 16") return fused_moe_func( hidden_states, w1, diff --git a/tpu_inference/runner/kv_cache_manager.py b/tpu_inference/runner/kv_cache_manager.py index bd6932fd8..349cd0212 100644 --- a/tpu_inference/runner/kv_cache_manager.py +++ b/tpu_inference/runner/kv_cache_manager.py @@ -190,7 +190,7 @@ def initialize_kv_cache(self, kv_cache_config: KVCacheConfig) -> None: num_blocks = kv_cache_tensor.size // page_size_bytes dp_size = self.runner.vllm_config.sharding_config.total_dp_size # num_blocks must be a multiple of dp_size - num_blocks = math.ceil(num_blocks / dp_size) * dp_size + num_blocks = (num_blocks // dp_size) * dp_size # NOTE: we'll multiply the num_kv_heads by 2 in the function kv_cache = create_kv_caches( num_blocks=num_blocks, From 90f21adb79c0522e39f251705ae6511d3bab3cae Mon Sep 17 00:00:00 2001 From: wenxindongwork Date: Wed, 12 Nov 2025 23:43:50 +0000 Subject: [PATCH 04/17] wip --- tpu_inference/layers/common/sharding.py | 8 ++++---- tpu_inference/layers/vllm/fused_moe.py | 5 ++--- 2 files changed, 6 insertions(+), 7 deletions(-) diff --git a/tpu_inference/layers/common/sharding.py b/tpu_inference/layers/common/sharding.py index 1a1a8d169..2d8637610 100644 --- a/tpu_inference/layers/common/sharding.py +++ b/tpu_inference/layers/common/sharding.py @@ -166,10 +166,10 @@ def validate(cls, vllm_config, sharding_strategy): f"LoRA is not supported with data parallelism " f"(DP size: {total_dp_size}). Please disable LoRA or " f"set data parallelism to 1.") - if not os.environ.get("NEW_MODEL_DESIGN", False): - raise ValueError( - "Must run DP with NEW_MODEL_DESIGN enabled. Please set the " - "NEW_MODEL_DESIGN=True.") + # if not os.environ.get("NEW_MODEL_DESIGN", False): + # raise ValueError( + # "Must run DP with NEW_MODEL_DESIGN enabled. Please set the " + # "NEW_MODEL_DESIGN=True.") @property def total_dp_size(self) -> int: diff --git a/tpu_inference/layers/vllm/fused_moe.py b/tpu_inference/layers/vllm/fused_moe.py index 34db15a64..3f3e4f6d0 100644 --- a/tpu_inference/layers/vllm/fused_moe.py +++ b/tpu_inference/layers/vllm/fused_moe.py @@ -133,7 +133,7 @@ def tensor_sharded_gmm_merged_column_parallel( # Maybe need to add sharding constraint here gmm_result = (gmm_result + rhs_bis).astype(gmm_result.dtype) - n_shards = mesh.shape['model'] * mesh.shape['attn_dp'] + n_shards = mesh.shape['model'] * mesh.shape.get('attn_dp', 1) output_sizes = [intermediate_size, intermediate_size] return slice_sharded_tensor_for_concatenation(gmm_result, output_sizes, @@ -353,8 +353,7 @@ def fused_moe_func( hidden_size = hidden_states.shape[-1] num_tokens = hidden_states.size // hidden_size assert global_num_experts == w1.shape[0] - ep_size = mesh.shape['model'] * mesh.shape[ - "attn_dp"] # only used if use_ep is True. + ep_size = mesh.shape['model'] * mesh.shape.get("attn_dp", 1) # only used if use_ep is True. intermediate_size = w2.shape[-1] dtype = hidden_states.dtype assert (num_tokens * topk) % 16 == 0, ( From a98a8d6cda8b1e033803a01d94b256946a8d0047 Mon Sep 17 00:00:00 2001 From: wenxindongwork Date: Thu, 13 Nov 2025 21:42:47 +0000 Subject: [PATCH 05/17] wip --- .../batch_composition_stats_2025_11_13_01_11_38_748039.json | 1 + tpu_inference/layers/common/sharding.py | 6 ++++++ 2 files changed, 7 insertions(+) create mode 100644 gs:/wenxindong-vm/trace/gpt_oss/dp2/attn_dp/prefill_heavy/batch_composition_stats_2025_11_13_01_11_38_748039.json diff --git a/gs:/wenxindong-vm/trace/gpt_oss/dp2/attn_dp/prefill_heavy/batch_composition_stats_2025_11_13_01_11_38_748039.json b/gs:/wenxindong-vm/trace/gpt_oss/dp2/attn_dp/prefill_heavy/batch_composition_stats_2025_11_13_01_11_38_748039.json new file mode 100644 index 000000000..f8d0d7b9a --- /dev/null +++ b/gs:/wenxindong-vm/trace/gpt_oss/dp2/attn_dp/prefill_heavy/batch_composition_stats_2025_11_13_01_11_38_748039.json @@ -0,0 +1 @@ +{"total_num_scheduled_tokens": 8192, "num_prefill_tokens": 16349, "num_decode_tokens": 35, "padded_total_num_scheduled_tokens": 16384, "num_reqs": 45} diff --git a/tpu_inference/layers/common/sharding.py b/tpu_inference/layers/common/sharding.py index 2d8637610..930096156 100644 --- a/tpu_inference/layers/common/sharding.py +++ b/tpu_inference/layers/common/sharding.py @@ -121,6 +121,7 @@ def from_vllm_config(cls, if enable_dp_attention: # Replicate attention layer when num_kv_heads < TP num_kv_heads = vllm_config.model_config.get_total_num_kv_heads() + kv_dtype = utils.get_jax_dtype_from_str_dtype( vllm_config.cache_config.cache_dtype) or jnp.bfloat16 packing = 4 // jnp.dtype(kv_dtype).itemsize @@ -128,6 +129,11 @@ def from_vllm_config(cls, # duplicate KV heads across devices, wasting kv cache memory. # Use attention DP instead to reduce per-device num_kv_heads and # eliminate this waste. + + # if head_dim is 64, multiply packing by 2 + if vllm_config.model_config.get_head_size() == 64: + packing *= 2 + num_kv_heads_per_device_in_kv_cache = (num_kv_heads * 2) / packing attn_dp = max( int(tensor_parallelism // num_kv_heads_per_device_in_kv_cache), From 022a9243d1c5ae61f7b867301ae6769f583767a6 Mon Sep 17 00:00:00 2001 From: wenxindongwork Date: Thu, 13 Nov 2025 21:42:53 +0000 Subject: [PATCH 06/17] wip --- tpu_inference/layers/vllm/fused_moe.py | 14 +++++++------- 1 file changed, 7 insertions(+), 7 deletions(-) diff --git a/tpu_inference/layers/vllm/fused_moe.py b/tpu_inference/layers/vllm/fused_moe.py index 3f3e4f6d0..351365997 100644 --- a/tpu_inference/layers/vllm/fused_moe.py +++ b/tpu_inference/layers/vllm/fused_moe.py @@ -360,10 +360,10 @@ def fused_moe_func( "The kernel requires num_tokens * topk to be a multiple of " f"16 but got {num_tokens}*{topk}={num_tokens*topk}") hidden_states = jax.lax.with_sharding_constraint( - hidden_states, NamedSharding(mesh, P(ShardingAxisName.MLP_DATA, None))) + hidden_states, NamedSharding(mesh, P(ShardingAxisName.ATTN_DATA, None))) gating_output = jax.lax.with_sharding_constraint( - gating_output, NamedSharding(mesh, P(ShardingAxisName.MLP_DATA, None))) + gating_output, NamedSharding(mesh, P(ShardingAxisName.ATTN_DATA, None))) hidden_states = hidden_states.reshape(num_tokens, hidden_size) gating_output = gating_output.reshape(num_tokens, global_num_experts) @@ -389,8 +389,8 @@ def _process_tokens_locally(hidden_states_local, topk_indices_local): x, group_sizes, topk_argsort_revert_indices = shard_map( _process_tokens_locally, mesh=mesh, - in_specs=(P(ShardingAxisName.MLP_DATA, None), P(ShardingAxisName.MLP_DATA, None)), - out_specs=(P(ShardingAxisName.MLP_DATA, None), P(), P(ShardingAxisName.MLP_DATA)), + in_specs=(P(ShardingAxisName.ATTN_DATA, None), P(ShardingAxisName.ATTN_DATA, None)), + out_specs=(P(ShardingAxisName.ATTN_DATA, None), P(), P(ShardingAxisName.ATTN_DATA)), check_rep=False, )(hidden_states, topk_indices) @@ -449,15 +449,15 @@ def _finalize_output(x_local, topk_argsort_revert_indices_local, topk_weights_lo x = shard_map( _finalize_output, mesh=mesh, - in_specs=(P(ShardingAxisName.MLP_DATA, None), P(ShardingAxisName.MLP_DATA), P(ShardingAxisName.MLP_DATA, None)), - out_specs=(P(ShardingAxisName.MLP_DATA, None)), + in_specs=(P(ShardingAxisName.ATTN_DATA, None), P(ShardingAxisName.ATTN_DATA), P(ShardingAxisName.ATTN_DATA, None)), + out_specs=(P(ShardingAxisName.ATTN_DATA, None)), check_rep=False, )(x, topk_argsort_revert_indices, topk_weights) x = x.reshape(orig_shape) if reduce_results: - x = jax.lax.with_sharding_constraint(x, NamedSharding(mesh, P(ShardingAxisName.MLP_DATA))) + x = jax.lax.with_sharding_constraint(x, NamedSharding(mesh, P(ShardingAxisName.ATTN_DATA))) return x From 11b96ff22c4f453392bd6e161b01ce1883a8bab6 Mon Sep 17 00:00:00 2001 From: wenxindongwork Date: Fri, 14 Nov 2025 01:09:05 +0000 Subject: [PATCH 07/17] wip --- .../batch_composition_stats_2025_11_13_01_11_38_748039.json | 1 - 1 file changed, 1 deletion(-) delete mode 100644 gs:/wenxindong-vm/trace/gpt_oss/dp2/attn_dp/prefill_heavy/batch_composition_stats_2025_11_13_01_11_38_748039.json diff --git a/gs:/wenxindong-vm/trace/gpt_oss/dp2/attn_dp/prefill_heavy/batch_composition_stats_2025_11_13_01_11_38_748039.json b/gs:/wenxindong-vm/trace/gpt_oss/dp2/attn_dp/prefill_heavy/batch_composition_stats_2025_11_13_01_11_38_748039.json deleted file mode 100644 index f8d0d7b9a..000000000 --- a/gs:/wenxindong-vm/trace/gpt_oss/dp2/attn_dp/prefill_heavy/batch_composition_stats_2025_11_13_01_11_38_748039.json +++ /dev/null @@ -1 +0,0 @@ -{"total_num_scheduled_tokens": 8192, "num_prefill_tokens": 16349, "num_decode_tokens": 35, "padded_total_num_scheduled_tokens": 16384, "num_reqs": 45} From b028301475bdece5f0b84cd176881800b6f300e6 Mon Sep 17 00:00:00 2001 From: wenxindongwork Date: Fri, 14 Nov 2025 01:49:33 +0000 Subject: [PATCH 08/17] wip --- tpu_inference/layers/vllm/fused_moe.py | 39 +++++++++++++++++--------- 1 file changed, 26 insertions(+), 13 deletions(-) diff --git a/tpu_inference/layers/vllm/fused_moe.py b/tpu_inference/layers/vllm/fused_moe.py index 351365997..a1c5e5428 100644 --- a/tpu_inference/layers/vllm/fused_moe.py +++ b/tpu_inference/layers/vllm/fused_moe.py @@ -103,6 +103,7 @@ def tensor_sharded_gmm_merged_column_parallel( rhs: jax.Array, rhs_bias: jax.Array | None, group_sizes: jax.Array, + group_sizes_global: jax.Array, transpose_rhs: bool, mesh: Mesh, intermediate_size: int, @@ -128,9 +129,9 @@ def tensor_sharded_gmm_merged_column_parallel( check_rep=False, )(lhs, rhs, group_sizes) + if rhs_bias is not None: - rhs_bis = jnp.repeat(rhs_bias, group_sizes, 0, total_repeat_length=m) - # Maybe need to add sharding constraint here + rhs_bis = jnp.repeat(rhs_bias, group_sizes_global, 0, total_repeat_length=m) gmm_result = (gmm_result + rhs_bis).astype(gmm_result.dtype) n_shards = mesh.shape['model'] * mesh.shape.get('attn_dp', 1) @@ -145,6 +146,7 @@ def tensor_sharded_gmm_row_parallel( rhs: jax.Array, rhs_bias: jax.Array | None, group_sizes: jax.Array, + group_sizes_global: jax.Array, transpose_rhs: bool, mesh: Mesh, ) -> jax.Array: @@ -173,11 +175,9 @@ def _gmm_all_reduce(lhs, rhs, group_sizes): out_specs=(P(ShardingAxisName.MLP_DATA)), check_rep=False, )(lhs, rhs, group_sizes) - + jax.debug.print("gmm_result before bias {} {}", gmm_result.sum(), gmm_result.ravel()[:10]) if rhs_bias is not None: - - rhs_bias = jnp.repeat(rhs_bias, group_sizes, 0, total_repeat_length=m) - # wenxindong: Maybe need to add sharding constraint here + rhs_bias = jnp.repeat(rhs_bias, group_sizes_global, 0, total_repeat_length=m) gmm_result = (gmm_result + rhs_bias).astype(gmm_result.dtype) return gmm_result @@ -365,6 +365,7 @@ def fused_moe_func( gating_output = jax.lax.with_sharding_constraint( gating_output, NamedSharding(mesh, P(ShardingAxisName.ATTN_DATA, None))) + jax.debug.print("hidden_state before MoE {} {}", hidden_states.sum(), hidden_states.ravel()[:10]) hidden_states = hidden_states.reshape(num_tokens, hidden_size) gating_output = gating_output.reshape(num_tokens, global_num_experts) @@ -381,19 +382,25 @@ def _process_tokens_locally(hidden_states_local, topk_indices_local): topk_argsort_revert_indices = jnp.argsort(topk_argsort_indices) token_indices = jnp.arange(num_tokens_local, dtype=jnp.int32).repeat(topk) token_indices_sorted = token_indices[topk_argsort_indices] - group_sizes = jnp.bincount(topk_indices_flat, length=global_num_experts) + group_sizes_local = jnp.bincount(topk_indices_flat, length=global_num_experts) + + # Reduce group_sizes once across data parallel shards to get global counts + # This is needed for bias addition and should be done only once for efficiency + group_sizes_global = jax.lax.psum(group_sizes_local, axis_name=ShardingAxisName.MLP_DATA) x = hidden_states_local[token_indices_sorted] - return x, group_sizes, topk_argsort_revert_indices + return x, group_sizes_local, group_sizes_global, topk_argsort_revert_indices - x, group_sizes, topk_argsort_revert_indices = shard_map( + x, group_sizes, group_sizes_global, topk_argsort_revert_indices = shard_map( _process_tokens_locally, mesh=mesh, in_specs=(P(ShardingAxisName.ATTN_DATA, None), P(ShardingAxisName.ATTN_DATA, None)), - out_specs=(P(ShardingAxisName.ATTN_DATA, None), P(), P(ShardingAxisName.ATTN_DATA)), + out_specs=(P(ShardingAxisName.ATTN_DATA, None), P(ShardingAxisName.ATTN_DATA), P(), P(ShardingAxisName.ATTN_DATA)), check_rep=False, )(hidden_states, topk_indices) - + + jax.debug.print("hidden_state before gmm {} {}", x.sum(), x.ravel()[:10]) + jax.debug.print("group_sizes {} {}", group_sizes.sum(), group_sizes) if use_ep: x = expert_sharded_gmm( x, @@ -411,13 +418,16 @@ def _process_tokens_locally(hidden_states_local, topk_indices_local): w1, w1_bias, group_sizes, + group_sizes_global, transpose_rhs=True, mesh=mesh, intermediate_size=intermediate_size, ) + jax.debug.print("hidden_state after first gmm x1 {} {}", x1.sum(), x1.ravel()[:10]) + jax.debug.print("hidden_state after first gmm x2 {} {}", x2.sum(), x2.ravel()[:10]) x = activation_fn(activation, x1, x2) - + jax.debug.print("hidden_state after activation {} {}", x.sum(), x.ravel()[:10]) if use_ep: x = expert_sharded_gmm( x, @@ -436,9 +446,11 @@ def _process_tokens_locally(hidden_states_local, topk_indices_local): w2, w2_bias, group_sizes, + group_sizes_global, transpose_rhs=True, mesh=mesh, ) + jax.debug.print("hidden_state after second gmm {} {}", x.sum(), x.ravel()[:10]) def _finalize_output(x_local, topk_argsort_revert_indices_local, topk_weights_local): x_local = x_local[topk_argsort_revert_indices_local].reshape(-1, topk, hidden_size) @@ -453,11 +465,12 @@ def _finalize_output(x_local, topk_argsort_revert_indices_local, topk_weights_lo out_specs=(P(ShardingAxisName.ATTN_DATA, None)), check_rep=False, )(x, topk_argsort_revert_indices, topk_weights) - + jax.debug.print("hidden_state after finalize output {} {}", x.sum(), x.ravel()[:10]) x = x.reshape(orig_shape) if reduce_results: x = jax.lax.with_sharding_constraint(x, NamedSharding(mesh, P(ShardingAxisName.ATTN_DATA))) + jax.debug.print("hidden_state after reducing result {} {}", x.sum(), x.ravel()[:10]) return x From f29cdf9e4983a05f5085eeb1feb0839a810c6836 Mon Sep 17 00:00:00 2001 From: wenxindongwork Date: Fri, 14 Nov 2025 16:41:05 +0000 Subject: [PATCH 09/17] wip --- debug_attn_dp.txt | 233 +++ debugging.txt | 423 ++++ debugging_baseline.txt | 732 +++++++ oss_log_98.txt | 2508 +++++++++++++++++++++++ oss_log_attn_dp.txt | 2564 ++++++++++++++++++++++++ oss_log_baseline.txt | 2410 ++++++++++++++++++++++ oss_log_numerics.txt | 270 +++ tpu_inference/layers/vllm/fused_moe.py | 22 +- 8 files changed, 9151 insertions(+), 11 deletions(-) create mode 100644 debug_attn_dp.txt create mode 100644 debugging.txt create mode 100644 debugging_baseline.txt create mode 100644 oss_log_98.txt create mode 100644 oss_log_attn_dp.txt create mode 100644 oss_log_baseline.txt create mode 100644 oss_log_numerics.txt diff --git a/debug_attn_dp.txt b/debug_attn_dp.txt new file mode 100644 index 000000000..24e8e7f8d --- /dev/null +++ b/debug_attn_dp.txt @@ -0,0 +1,233 @@ +INFO 11-14 05:25:30 [__init__.py:26] TPU info: node_name=cuiq-infer-v7-2 | tpu_type=tpu7x-8 | worker_id=0 | num_chips=8 | num_cores_per_chip=2 +INFO 11-14 05:25:30 [importing.py:44] Triton is installed but 0 active driver(s) found (expected 1). Disabling Triton to prevent runtime errors. +INFO 11-14 05:25:30 [importing.py:68] Triton not installed or not compatible; certain GPU-related functions will not be available. +WARNING 11-14 05:25:30 [interface.py:197] Failed to import from vllm._C: ModuleNotFoundError("No module named 'vllm._C'") +INFO 11-14 05:25:31 [utils.py:253] non-default args: {'download_dir': '/mnt/disks/persist', 'max_model_len': 1024, 'tensor_parallel_size': 8, 'num_redundant_experts': None, 'eplb_window_size': None, 'eplb_step_interval': None, 'eplb_log_balancedness': None, 'gpu_memory_utilization': 0.8, 'enable_lora': None, 'reasoning_parser_plugin': '', 'additional_config': {'sharding': {'sharding_strategy': {'enable_dp_attention': 1}}}, 'async_scheduling': True, 'model': 'unsloth/gpt-oss-120b-BF16'} +INFO 11-14 05:25:32 [model.py:630] Resolved architecture: GptOssForCausalLM +INFO 11-14 05:25:32 [model.py:1728] Using max model len 1024 +WARNING 11-14 05:25:32 [tpu_jax.py:82] Error getting device name: 'NoneType' object has no attribute 'name' +INFO 11-14 05:25:32 [scheduler.py:254] Chunked prefill is enabled with max_num_batched_tokens=8192. +INFO 11-14 05:25:32 [config.py:272] Overriding max cuda graph capture size to 1024 for performance. +INFO 11-14 05:25:32 [tpu_jax.py:118] Initialized sharding configuration: ShardingConfigManager(total_devices=8, sharding_strategy=ShardingStrategy(tensor_parallelism=4, expert_parallelism=1, sequence_parallelism=1, data_parallelism=1, attention_data_parallelism=2), device_indexes=None) +WARNING 11-14 05:25:32 [tpu_jax.py:156] The model dtype is not properly set for JAX backend. Overwriting it to jnp.bfloat16 +INFO 11-14 05:25:32 [tpu_jax.py:192] Force using UniProcExecutor for JAX on single host. +(EngineCore_DP0 pid=4095770) INFO 11-14 05:25:33 [core.py:94] Initializing a V1 LLM engine (v0.11.1rc7.dev48+gdf4d3a44a) with config: model='unsloth/gpt-oss-120b-BF16', speculative_config=None, tokenizer='unsloth/gpt-oss-120b-BF16', skip_tokenizer_init=False, tokenizer_mode=auto, revision=None, tokenizer_revision=None, trust_remote_code=False, dtype=torch.bfloat16, max_seq_len=1024, download_dir='/mnt/disks/persist', load_format=auto, tensor_parallel_size=8, pipeline_parallel_size=1, data_parallel_size=1, disable_custom_all_reduce=True, quantization=None, enforce_eager=False, kv_cache_dtype=auto, device_config=None, structured_outputs_config=StructuredOutputsConfig(backend='auto', disable_fallback=False, disable_any_whitespace=False, disable_additional_properties=False, reasoning_parser='openai_gptoss', reasoning_parser_plugin='', enable_in_reasoning=False), observability_config=ObservabilityConfig(show_hidden_metrics_for_version=None, otlp_traces_endpoint=None, collect_detailed_traces=None), seed=0, served_model_name=unsloth/gpt-oss-120b-BF16, enable_prefix_caching=True, chunked_prefill_enabled=True, pooler_config=None, compilation_config={'level': None, 'mode': 2, 'debug_dump_path': None, 'cache_dir': '', 'compile_cache_save_format': 'binary', 'backend': 'openxla', 'custom_ops': ['all'], 'splitting_ops': None, 'compile_mm_encoder': True, 'use_inductor': None, 'compile_sizes': None, 'inductor_compile_config': {'enable_auto_functionalized_v2': False}, 'inductor_passes': {}, 'cudagraph_mode': , 'use_cudagraph': True, 'cudagraph_num_of_warmups': 0, 'cudagraph_capture_sizes': None, 'cudagraph_copy_inputs': False, 'full_cuda_graph': False, 'cudagraph_specialize_lora': True, 'use_inductor_graph_partition': False, 'pass_config': {}, 'max_cudagraph_capture_size': 1024, 'local_cache_dir': None} +(EngineCore_DP0 pid=4095770) WARNING 11-14 05:25:33 [tpu_jax.py:228] Pin memory is not supported on TPU. +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +(EngineCore_DP0 pid=4095770) INFO 11-14 05:25:38 [parallel_state.py:1325] rank 0 in world size 1 is assigned as DP rank 0, PP rank 0, TP rank 0, EP rank 0 +(EngineCore_DP0 pid=4095770) INFO 11-14 05:25:38 [tpu_jax_runner.py:274] Init mesh | mesh=Mesh('data': 1, 'model': 4, axis_types=(Auto, Auto)) +(EngineCore_DP0 pid=4095770) INFO 11-14 05:25:38 [utils.py:93] Prepared token paddings: [16, 32, 64, 128, 256, 512, 1024, 2048, 4096, 8192, 16384] +(EngineCore_DP0 pid=4095770) INFO 11-14 05:25:38 [utils.py:59] Prepared request paddings: [8, 16, 32, 64, 128, 256, 512] +(EngineCore_DP0 pid=4095770) INFO 11-14 05:25:38 [compilation_manager.py:34] Enabling JAX compile cache. +(EngineCore_DP0 pid=4095770) INFO 11-14 05:25:38 [tpu_worker_jax.py:152] Init worker | rank=0 | node_id=0 | is_driver_worker=True | hbm=[(0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75)]GiB +(EngineCore_DP0 pid=4095770) INFO 11-14 05:25:38 [model_loader.py:318] Loading model with MODEL_IMPL_TYPE=vllm +(EngineCore_DP0 pid=4095770) WARNING 11-14 05:25:39 [rocm.py:34] Failed to import from amdsmi with ModuleNotFoundError("No module named 'amdsmi'") +(EngineCore_DP0 pid=4095770) WARNING 11-14 05:25:39 [rocm.py:39] Failed to import from vllm._C with ModuleNotFoundError("No module named 'vllm._C'") +(EngineCore_DP0 pid=4095770) WARNING 11-14 05:25:39 [rocm.py:45] Failed to import from vllm._rocm_C with ModuleNotFoundError("No module named 'vllm._rocm_C'") +(EngineCore_DP0 pid=4095770) WARNING 11-14 05:25:39 [registry.py:171] _Backend has been renamed to AttentionBackendEnum. Please update your code to use AttentionBackendEnum instead. _Backend will be removed in a future release. +(EngineCore_DP0 pid=4095770) INFO 11-14 05:25:39 [tpu_jax.py:63] Cannot use None backend on TPU. +(EngineCore_DP0 pid=4095770) INFO 11-14 05:25:39 [tpu_jax.py:66] Using Pallas V1 backend. +(EngineCore_DP0 pid=4095770) INFO 11-14 05:25:39 [layer.py:331] Disabling MoE shared_experts cuda stream +(EngineCore_DP0 pid=4095770) Loading safetensors checkpoint shards: 0% Completed | 0/73 [00:00 + main(args) + File "/home/wenxindong_google_com/tpu-inference/examples/offline_inference.py", line 37, in main + llm = LLM(**args) + ^^^^^^^^^^^ + File "/home/wenxindong_google_com/vllm/vllm/entrypoints/llm.py", line 341, in __init__ + self.llm_engine = LLMEngine.from_engine_args( + ^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/home/wenxindong_google_com/vllm/vllm/v1/engine/llm_engine.py", line 174, in from_engine_args + return cls( + ^^^^ + File "/home/wenxindong_google_com/vllm/vllm/v1/engine/llm_engine.py", line 108, in __init__ + self.engine_core = EngineCoreClient.make_client( + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/home/wenxindong_google_com/vllm/vllm/v1/engine/core_client.py", line 93, in make_client + return SyncMPClient(vllm_config, executor_class, log_stats) + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/home/wenxindong_google_com/vllm/vllm/v1/engine/core_client.py", line 640, in __init__ + super().__init__( + File "/home/wenxindong_google_com/vllm/vllm/v1/engine/core_client.py", line 469, in __init__ + with launch_core_engines(vllm_config, executor_class, log_stats) as ( + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/mnt/disks/persist/vllm_conda/lib/python3.12/contextlib.py", line 144, in __exit__ + next(self.gen) + File "/home/wenxindong_google_com/vllm/vllm/v1/engine/utils.py", line 898, in launch_core_engines + wait_for_engine_startup( + File "/home/wenxindong_google_com/vllm/vllm/v1/engine/utils.py", line 955, in wait_for_engine_startup + raise RuntimeError( +RuntimeError: Engine core initialization failed. See root cause above. Failed core proc(s): {} diff --git a/debugging.txt b/debugging.txt new file mode 100644 index 000000000..66da4ea0e --- /dev/null +++ b/debugging.txt @@ -0,0 +1,423 @@ +INFO 11-14 06:43:43 [__init__.py:26] TPU info: node_name=cuiq-infer-v7-2 | tpu_type=tpu7x-8 | worker_id=0 | num_chips=8 | num_cores_per_chip=2 +INFO 11-14 06:43:43 [importing.py:44] Triton is installed but 0 active driver(s) found (expected 1). Disabling Triton to prevent runtime errors. +INFO 11-14 06:43:43 [importing.py:68] Triton not installed or not compatible; certain GPU-related functions will not be available. +WARNING 11-14 06:43:43 [interface.py:197] Failed to import from vllm._C: ModuleNotFoundError("No module named 'vllm._C'") +INFO 11-14 06:43:44 [utils.py:253] non-default args: {'download_dir': '/mnt/disks/persist', 'max_model_len': 1024, 'tensor_parallel_size': 4, 'data_parallel_size': 2, 'num_redundant_experts': None, 'eplb_window_size': None, 'eplb_step_interval': None, 'eplb_log_balancedness': None, 'enable_lora': None, 'reasoning_parser_plugin': '', 'model': 'unsloth/gpt-oss-120b-BF16'} +INFO 11-14 06:43:45 [model.py:630] Resolved architecture: GptOssForCausalLM +INFO 11-14 06:43:45 [model.py:1728] Using max model len 1024 +WARNING 11-14 06:43:45 [tpu_jax.py:82] Error getting device name: 'NoneType' object has no attribute 'name' +INFO 11-14 06:43:45 [scheduler.py:254] Chunked prefill is enabled with max_num_batched_tokens=8192. +INFO 11-14 06:43:45 [config.py:272] Overriding max cuda graph capture size to 1024 for performance. +INFO 11-14 06:43:45 [tpu_jax.py:118] Initialized sharding configuration: ShardingConfigManager(total_devices=8, sharding_strategy=ShardingStrategy(tensor_parallelism=4, expert_parallelism=1, sequence_parallelism=1, data_parallelism=2, attention_data_parallelism=1), device_indexes=None) +WARNING 11-14 06:43:45 [tpu_jax.py:156] The model dtype is not properly set for JAX backend. Overwriting it to jnp.bfloat16 +INFO 11-14 06:43:45 [tpu_jax.py:192] Force using UniProcExecutor for JAX on single host. +(EngineCore_DP0 pid=113991) INFO 11-14 06:43:46 [core.py:94] Initializing a V1 LLM engine (v0.11.1rc7.dev48+gdf4d3a44a) with config: model='unsloth/gpt-oss-120b-BF16', speculative_config=None, tokenizer='unsloth/gpt-oss-120b-BF16', skip_tokenizer_init=False, tokenizer_mode=auto, revision=None, tokenizer_revision=None, trust_remote_code=False, dtype=torch.bfloat16, max_seq_len=1024, download_dir='/mnt/disks/persist', load_format=auto, tensor_parallel_size=4, pipeline_parallel_size=1, data_parallel_size=1, disable_custom_all_reduce=True, quantization=None, enforce_eager=False, kv_cache_dtype=auto, device_config=None, structured_outputs_config=StructuredOutputsConfig(backend='auto', disable_fallback=False, disable_any_whitespace=False, disable_additional_properties=False, reasoning_parser='openai_gptoss', reasoning_parser_plugin='', enable_in_reasoning=False), observability_config=ObservabilityConfig(show_hidden_metrics_for_version=None, otlp_traces_endpoint=None, collect_detailed_traces=None), seed=0, served_model_name=unsloth/gpt-oss-120b-BF16, enable_prefix_caching=True, chunked_prefill_enabled=True, pooler_config=None, compilation_config={'level': None, 'mode': 2, 'debug_dump_path': None, 'cache_dir': '', 'compile_cache_save_format': 'binary', 'backend': 'openxla', 'custom_ops': ['all'], 'splitting_ops': None, 'compile_mm_encoder': True, 'use_inductor': None, 'compile_sizes': None, 'inductor_compile_config': {'enable_auto_functionalized_v2': False}, 'inductor_passes': {}, 'cudagraph_mode': , 'use_cudagraph': True, 'cudagraph_num_of_warmups': 0, 'cudagraph_capture_sizes': None, 'cudagraph_copy_inputs': False, 'full_cuda_graph': False, 'cudagraph_specialize_lora': True, 'use_inductor_graph_partition': False, 'pass_config': {}, 'max_cudagraph_capture_size': 1024, 'local_cache_dir': None} +(EngineCore_DP0 pid=113991) WARNING 11-14 06:43:46 [tpu_jax.py:228] Pin memory is not supported on TPU. +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +(EngineCore_DP0 pid=113991) INFO 11-14 06:43:51 [parallel_state.py:1325] rank 0 in world size 1 is assigned as DP rank 0, PP rank 0, TP rank 0, EP rank 0 +(EngineCore_DP0 pid=113991) INFO 11-14 06:43:51 [tpu_jax_runner.py:274] Init mesh | mesh=Mesh('data': 2, 'model': 4, axis_types=(Auto, Auto)) +(EngineCore_DP0 pid=113991) INFO 11-14 06:43:51 [utils.py:93] Prepared token paddings: [16, 32, 64, 128, 256, 512, 1024, 2048, 4096, 8192, 16384] +(EngineCore_DP0 pid=113991) INFO 11-14 06:43:52 [utils.py:59] Prepared request paddings: [8, 16, 32, 64, 128, 256, 512] +(EngineCore_DP0 pid=113991) INFO 11-14 06:43:52 [compilation_manager.py:34] Enabling JAX compile cache. +(EngineCore_DP0 pid=113991) INFO 11-14 06:43:52 [tpu_worker_jax.py:152] Init worker | rank=0 | node_id=0 | is_driver_worker=True | hbm=[(0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75)]GiB +(EngineCore_DP0 pid=113991) INFO 11-14 06:43:52 [model_loader.py:318] Loading model with MODEL_IMPL_TYPE=vllm +(EngineCore_DP0 pid=113991) WARNING 11-14 06:43:53 [rocm.py:34] Failed to import from amdsmi with ModuleNotFoundError("No module named 'amdsmi'") +(EngineCore_DP0 pid=113991) WARNING 11-14 06:43:53 [rocm.py:39] Failed to import from vllm._C with ModuleNotFoundError("No module named 'vllm._C'") +(EngineCore_DP0 pid=113991) WARNING 11-14 06:43:53 [rocm.py:45] Failed to import from vllm._rocm_C with ModuleNotFoundError("No module named 'vllm._rocm_C'") +(EngineCore_DP0 pid=113991) WARNING 11-14 06:43:53 [registry.py:171] _Backend has been renamed to AttentionBackendEnum. Please update your code to use AttentionBackendEnum instead. _Backend will be removed in a future release. +(EngineCore_DP0 pid=113991) INFO 11-14 06:43:53 [tpu_jax.py:63] Cannot use None backend on TPU. +(EngineCore_DP0 pid=113991) INFO 11-14 06:43:53 [tpu_jax.py:66] Using Pallas V1 backend. +(EngineCore_DP0 pid=113991) INFO 11-14 06:43:53 [layer.py:331] Disabling MoE shared_experts cuda stream +(EngineCore_DP0 pid=113991) Loading safetensors checkpoint shards: 0% Completed | 0/73 [00:00. This scheduler interface is not public and compatibility may not be maintained. +(EngineCore_DP0 pid=113991) INFO 11-14 06:45:29 [dp_scheduler.py:93] DPScheduler (Async = False) per-rank limits: max_seqs=256, max_tokens=8192 +(EngineCore_DP0 pid=113991) INFO 11-14 06:45:29 [tpu_jax.py:118] Initialized sharding configuration: ShardingConfigManager(total_devices=4, sharding_strategy=ShardingStrategy(tensor_parallelism=4, expert_parallelism=1, sequence_parallelism=1, data_parallelism=1, attention_data_parallelism=1), device_indexes=None) +(EngineCore_DP0 pid=113991) WARNING 11-14 06:45:29 [tpu_jax.py:156] The model dtype is not properly set for JAX backend. Overwriting it to jnp.bfloat16 +(EngineCore_DP0 pid=113991) INFO 11-14 06:45:29 [tpu_jax.py:192] Force using UniProcExecutor for JAX on single host. +INFO 11-14 06:45:29 [llm.py:350] Supported tasks: ['generate'] + Adding requests: 0%| | 0/35 [00:00, 'use_cudagraph': True, 'cudagraph_num_of_warmups': 0, 'cudagraph_capture_sizes': None, 'cudagraph_copy_inputs': False, 'full_cuda_graph': False, 'cudagraph_specialize_lora': True, 'use_inductor_graph_partition': False, 'pass_config': {}, 'max_cudagraph_capture_size': 1024, 'local_cache_dir': None}, +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [dump_input.py:79] Dumping scheduler output for model execution: DPSchedulerOutput(scheduled_new_reqs=[NewRequestData(req_id=0,prompt_token_ids_len=5,mm_features=[],sampling_params=SamplingParams(n=1, presence_penalty=0.0, frequency_penalty=0.0, repetition_penalty=1.0, temperature=1.0, top_p=1.0, top_k=0, min_p=0.0, seed=None, stop=[], stop_token_ids=[199999], bad_words=[], include_stop_str_in_output=False, ignore_eos=False, max_tokens=16, min_tokens=0, logprobs=None, prompt_logprobs=None, skip_special_tokens=True, spaces_between_special_tokens=True, truncate_prompt_tokens=None, structured_outputs=None, extra_args=None),block_ids=([1],),num_computed_tokens=0,lora_request=None,prompt_embeds_shape=None)], scheduled_cached_reqs=CachedRequestData(req_ids=[], resumed_req_ids=[], new_token_ids=[], all_token_ids=[], new_block_ids=[], num_computed_tokens=[], num_output_tokens=[]), num_scheduled_tokens={0: 5}, total_num_scheduled_tokens=5, scheduled_spec_decode_tokens={}, scheduled_encoder_inputs={}, num_common_prefix_blocks=[1], finished_req_ids=[], free_encoder_mm_hashes=[], pending_structured_output_tokens=false, kv_connector_metadata=null, assigned_dp_rank={0: 0}) +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [dump_input.py:81] Dumping scheduler stats: SchedulerStats(num_running_reqs=1, num_waiting_reqs=0, step_counter=0, current_wave=0, kv_cache_usage=1.9061415881982402e-05, prefix_cache_stats=PrefixCacheStats(reset=False, requests=3, queries=15, hits=0, preempted_requests=0, preempted_queries=0, preempted_hits=0), connector_prefix_cache_stats=None, spec_decoding_stats=None, kv_connector_stats=None, waiting_lora_adapters={}, running_lora_adapters={}) +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] EngineCore encountered a fatal error. +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] Traceback (most recent call last): +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/vllm/vllm/v1/engine/core.py", line 848, in run_engine_core +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] engine_core.run_busy_loop() +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/vllm/vllm/v1/engine/core.py", line 875, in run_busy_loop +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] self._process_engine_step() +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/vllm/vllm/v1/engine/core.py", line 904, in _process_engine_step +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] outputs, model_executed = self.step_fn() +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/vllm/vllm/v1/engine/core.py", line 332, in step +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] model_output = future.result() +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/mnt/disks/persist/vllm_conda/lib/python3.12/concurrent/futures/_base.py", line 449, in result +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return self.__get_result() +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/mnt/disks/persist/vllm_conda/lib/python3.12/concurrent/futures/_base.py", line 401, in __get_result +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] raise self._exception +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/vllm/vllm/v1/executor/uniproc_executor.py", line 79, in collective_rpc +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] result = run_method(self.driver_worker, method, args, kwargs) +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/vllm/vllm/v1/serial_utils.py", line 459, in run_method +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return func(*args, **kwargs) +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/vllm/vllm/v1/worker/worker_base.py", line 367, in execute_model +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return self.worker.execute_model(scheduler_output, *args, **kwargs) +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/tpu-inference/tpu_inference/worker/tpu_worker_jax.py", line 198, in execute_model +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] output = self.model_runner.execute_model(scheduler_output) +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/tpu-inference/tpu_inference/utils.py", line 313, in wrapper +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] result = func(*args, **kwargs) +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/tpu-inference/tpu_inference/runner/tpu_jax_runner.py", line 526, in execute_model +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] _, output = self._execute_model(scheduler_output) +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/tpu-inference/tpu_inference/runner/tpu_jax_runner.py", line 717, in _execute_model +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] aux_hidden_states) = self.model_fn( +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/tpu-inference/tpu_inference/models/vllm/vllm_model_wrapper.py", line 169, in step_fun +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] hidden_states = torch.func.functional_call( +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/_functorch/functional_call.py", line 148, in functional_call +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return nn.utils.stateless._functional_call( +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/utils/stateless.py", line 282, in _functional_call +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return module(*args, **kwargs) +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1773, in _wrapped_call_impl +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return self._call_impl(*args, **kwargs) +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1784, in _call_impl +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return forward_call(*args, **kwargs) +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/tpu-inference/tpu_inference/models/vllm/vllm_model_wrapper.py", line 46, in forward +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return self.compute_hidden_state( +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/tpu-inference/tpu_inference/models/vllm/vllm_model_wrapper.py", line 60, in compute_hidden_state +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] hidden_state = self.vllm_model(input_ids, positions, +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1773, in _wrapped_call_impl +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return self._call_impl(*args, **kwargs) +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1784, in _call_impl +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return forward_call(*args, **kwargs) +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/vllm/vllm/model_executor/models/gpt_oss.py", line 716, in forward +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return self.model(input_ids, positions, intermediate_tensors, inputs_embeds) +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/vllm/vllm/compilation/decorators.py", line 470, in __call__ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] output = self.compiled_callable(*args, **kwargs) +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/_dynamo/eval_frame.py", line 761, in compile_wrapper +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] _maybe_set_eval_frame(prior) +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/vllm/vllm/model_executor/models/gpt_oss.py", line 299, in forward +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] x, residual = layer(x, positions, residual) +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1773, in _wrapped_call_impl +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return self._call_impl(*args, **kwargs) +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1784, in _call_impl +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return forward_call(*args, **kwargs) +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/vllm/vllm/model_executor/models/gpt_oss.py", line 236, in forward +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] output = self.mlp(hidden_states) +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1773, in _wrapped_call_impl +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return self._call_impl(*args, **kwargs) +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1784, in _call_impl +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return forward_call(*args, **kwargs) +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/vllm/vllm/model_executor/models/gpt_oss.py", line 189, in forward +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] x = self.experts(hidden_states=x, router_logits=g) +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1773, in _wrapped_call_impl +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return self._call_impl(*args, **kwargs) +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1784, in _call_impl +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return forward_call(*args, **kwargs) +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/vllm/vllm/model_executor/custom_op.py", line 46, in forward +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return self._forward_method(*args, **kwargs) +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/vllm/vllm/model_executor/custom_op.py", line 76, in forward_tpu +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return self.forward_native(*args, **kwargs) +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/vllm/vllm/model_executor/layers/fused_moe/layer.py", line 1487, in forward_native +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] fused_output = self.forward_impl(hidden_states, router_logits) +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/vllm/vllm/model_executor/layers/fused_moe/layer.py", line 1745, in forward_impl +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] final_hidden_states = self.quant_method.apply( +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/tpu-inference/tpu_inference/layers/vllm/quantization/unquantized.py", line 363, in apply +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] output = fused_moe_func_padded( +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/tpu-inference/tpu_inference/layers/vllm/fused_moe.py", line 491, in fused_moe_func_padded +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return x +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/tpu-inference/tpu_inference/layers/vllm/fused_moe.py", line 388, in fused_moe_func +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] x1, x2 = tensor_sharded_gmm_merged_column_parallel( +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/tpu-inference/tpu_inference/layers/vllm/fused_moe.py", line 124, in tensor_sharded_gmm_merged_column_parallel +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] gmm_result = shard_map( +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ValueError: The context mesh AbstractMesh('data': 2, 'model': 4, axis_types=(Manual, Manual), device_kind=TPU7x, num_cores=1) should match the mesh passed to shard_map Mesh('data': 2, 'model': 4, axis_types=(Auto, Auto)) +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] -------------------- +(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] For simplicity, JAX has removed its internal frames from the traceback of the following exception. Set JAX_TRACEBACK_FILTERING=off to include these. +(EngineCore_DP0 pid=113991) Process EngineCore_DP0: +Traceback (most recent call last): + File "/home/wenxindong_google_com/tpu-inference/examples/offline_inference.py", line 113, in + main(args) + File "/home/wenxindong_google_com/tpu-inference/examples/offline_inference.py", line 92, in main + outputs = llm.generate(prompts, sampling_params) + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/home/wenxindong_google_com/vllm/vllm/entrypoints/llm.py", line 446, in generate + outputs = self._run_engine(use_tqdm=use_tqdm) + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/home/wenxindong_google_com/vllm/vllm/entrypoints/llm.py", line 1736, in _run_engine + step_outputs = self.llm_engine.step() + ^^^^^^^^^^^^^^^^^^^^^^ + File "/home/wenxindong_google_com/vllm/vllm/v1/engine/llm_engine.py", line 285, in step + outputs = self.engine_core.get_output() +(EngineCore_DP0 pid=113991) Traceback (most recent call last): + ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + File "/home/wenxindong_google_com/vllm/vllm/v1/engine/core_client.py", line 709, in get_output + raise self._format_exception(outputs) from None +vllm.v1.engine.exceptions.EngineDeadError: EngineCore encountered an issue. See stack trace (above) for the root cause. +(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/multiprocessing/process.py", line 314, in _bootstrap +(EngineCore_DP0 pid=113991) self.run() +(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/multiprocessing/process.py", line 108, in run +(EngineCore_DP0 pid=113991) self._target(*self._args, **self._kwargs) +(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/v1/engine/core.py", line 859, in run_engine_core +(EngineCore_DP0 pid=113991) raise e +(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/v1/engine/core.py", line 848, in run_engine_core +(EngineCore_DP0 pid=113991) engine_core.run_busy_loop() +(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/v1/engine/core.py", line 875, in run_busy_loop +(EngineCore_DP0 pid=113991) self._process_engine_step() +(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/v1/engine/core.py", line 904, in _process_engine_step +(EngineCore_DP0 pid=113991) outputs, model_executed = self.step_fn() +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/v1/engine/core.py", line 332, in step +(EngineCore_DP0 pid=113991) model_output = future.result() +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/concurrent/futures/_base.py", line 449, in result +(EngineCore_DP0 pid=113991) return self.__get_result() +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/concurrent/futures/_base.py", line 401, in __get_result +(EngineCore_DP0 pid=113991) raise self._exception +(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/v1/executor/uniproc_executor.py", line 79, in collective_rpc +(EngineCore_DP0 pid=113991) result = run_method(self.driver_worker, method, args, kwargs) +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/v1/serial_utils.py", line 459, in run_method +(EngineCore_DP0 pid=113991) return func(*args, **kwargs) +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/v1/worker/worker_base.py", line 367, in execute_model +(EngineCore_DP0 pid=113991) return self.worker.execute_model(scheduler_output, *args, **kwargs) +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/tpu-inference/tpu_inference/worker/tpu_worker_jax.py", line 198, in execute_model +(EngineCore_DP0 pid=113991) output = self.model_runner.execute_model(scheduler_output) +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/tpu-inference/tpu_inference/utils.py", line 313, in wrapper +(EngineCore_DP0 pid=113991) result = func(*args, **kwargs) +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/tpu-inference/tpu_inference/runner/tpu_jax_runner.py", line 526, in execute_model +(EngineCore_DP0 pid=113991) _, output = self._execute_model(scheduler_output) +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/tpu-inference/tpu_inference/runner/tpu_jax_runner.py", line 717, in _execute_model +(EngineCore_DP0 pid=113991) aux_hidden_states) = self.model_fn( +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/tpu-inference/tpu_inference/models/vllm/vllm_model_wrapper.py", line 169, in step_fun +(EngineCore_DP0 pid=113991) hidden_states = torch.func.functional_call( +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/_functorch/functional_call.py", line 148, in functional_call +(EngineCore_DP0 pid=113991) return nn.utils.stateless._functional_call( +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/utils/stateless.py", line 282, in _functional_call +(EngineCore_DP0 pid=113991) return module(*args, **kwargs) +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1773, in _wrapped_call_impl +(EngineCore_DP0 pid=113991) return self._call_impl(*args, **kwargs) +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1784, in _call_impl +(EngineCore_DP0 pid=113991) return forward_call(*args, **kwargs) +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/tpu-inference/tpu_inference/models/vllm/vllm_model_wrapper.py", line 46, in forward +(EngineCore_DP0 pid=113991) return self.compute_hidden_state( +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/tpu-inference/tpu_inference/models/vllm/vllm_model_wrapper.py", line 60, in compute_hidden_state +(EngineCore_DP0 pid=113991) hidden_state = self.vllm_model(input_ids, positions, +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1773, in _wrapped_call_impl +(EngineCore_DP0 pid=113991) return self._call_impl(*args, **kwargs) +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1784, in _call_impl +(EngineCore_DP0 pid=113991) return forward_call(*args, **kwargs) +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/model_executor/models/gpt_oss.py", line 716, in forward +(EngineCore_DP0 pid=113991) return self.model(input_ids, positions, intermediate_tensors, inputs_embeds) +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/compilation/decorators.py", line 470, in __call__ +(EngineCore_DP0 pid=113991) output = self.compiled_callable(*args, **kwargs) +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/_dynamo/eval_frame.py", line 761, in compile_wrapper +(EngineCore_DP0 pid=113991) _maybe_set_eval_frame(prior) +(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/model_executor/models/gpt_oss.py", line 299, in forward +(EngineCore_DP0 pid=113991) x, residual = layer(x, positions, residual) +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1773, in _wrapped_call_impl +(EngineCore_DP0 pid=113991) return self._call_impl(*args, **kwargs) +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1784, in _call_impl +(EngineCore_DP0 pid=113991) return forward_call(*args, **kwargs) +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/model_executor/models/gpt_oss.py", line 236, in forward +(EngineCore_DP0 pid=113991) output = self.mlp(hidden_states) +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1773, in _wrapped_call_impl +(EngineCore_DP0 pid=113991) return self._call_impl(*args, **kwargs) +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1784, in _call_impl +(EngineCore_DP0 pid=113991) return forward_call(*args, **kwargs) +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/model_executor/models/gpt_oss.py", line 189, in forward +(EngineCore_DP0 pid=113991) x = self.experts(hidden_states=x, router_logits=g) +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1773, in _wrapped_call_impl +(EngineCore_DP0 pid=113991) return self._call_impl(*args, **kwargs) +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1784, in _call_impl +(EngineCore_DP0 pid=113991) return forward_call(*args, **kwargs) +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/model_executor/custom_op.py", line 46, in forward +(EngineCore_DP0 pid=113991) return self._forward_method(*args, **kwargs) +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/model_executor/custom_op.py", line 76, in forward_tpu +(EngineCore_DP0 pid=113991) return self.forward_native(*args, **kwargs) +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/model_executor/layers/fused_moe/layer.py", line 1487, in forward_native +(EngineCore_DP0 pid=113991) fused_output = self.forward_impl(hidden_states, router_logits) +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/model_executor/layers/fused_moe/layer.py", line 1745, in forward_impl +(EngineCore_DP0 pid=113991) final_hidden_states = self.quant_method.apply( +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/tpu-inference/tpu_inference/layers/vllm/quantization/unquantized.py", line 363, in apply +(EngineCore_DP0 pid=113991) output = fused_moe_func_padded( +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/tpu-inference/tpu_inference/layers/vllm/fused_moe.py", line 491, in fused_moe_func_padded +(EngineCore_DP0 pid=113991) return x +(EngineCore_DP0 pid=113991) ^^^^ +(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/tpu-inference/tpu_inference/layers/vllm/fused_moe.py", line 388, in fused_moe_func +(EngineCore_DP0 pid=113991) x1, x2 = tensor_sharded_gmm_merged_column_parallel( +(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/tpu-inference/tpu_inference/layers/vllm/fused_moe.py", line 124, in tensor_sharded_gmm_merged_column_parallel +(EngineCore_DP0 pid=113991) gmm_result = shard_map( +(EngineCore_DP0 pid=113991) ^^^^^^^^^^ +(EngineCore_DP0 pid=113991) ValueError: The context mesh AbstractMesh('data': 2, 'model': 4, axis_types=(Manual, Manual), device_kind=TPU7x, num_cores=1) should match the mesh passed to shard_map Mesh('data': 2, 'model': 4, axis_types=(Auto, Auto)) +(EngineCore_DP0 pid=113991) -------------------- +(EngineCore_DP0 pid=113991) For simplicity, JAX has removed its internal frames from the traceback of the following exception. Set JAX_TRACEBACK_FILTERING=off to include these. + Processed prompts: 0%| | 0/35 [00:04, 'use_cudagraph': True, 'cudagraph_num_of_warmups': 0, 'cudagraph_capture_sizes': None, 'cudagraph_copy_inputs': False, 'full_cuda_graph': False, 'cudagraph_specialize_lora': True, 'use_inductor_graph_partition': False, 'pass_config': {}, 'max_cudagraph_capture_size': 1024, 'local_cache_dir': None} +(EngineCore_DP0 pid=59613) WARNING 11-14 06:25:59 [tpu_jax.py:228] Pin memory is not supported on TPU. +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +(EngineCore_DP0 pid=59613) INFO 11-14 06:26:05 [parallel_state.py:1325] rank 0 in world size 1 is assigned as DP rank 0, PP rank 0, TP rank 0, EP rank 0 +(EngineCore_DP0 pid=59613) INFO 11-14 06:26:05 [tpu_jax_runner.py:274] Init mesh | mesh=Mesh('data': 1, 'model': 4, axis_types=(Auto, Auto)) +(EngineCore_DP0 pid=59613) INFO 11-14 06:26:05 [utils.py:93] Prepared token paddings: [16, 32, 64, 128, 256, 512, 1024, 2048, 4096, 8192] +(EngineCore_DP0 pid=59613) INFO 11-14 06:26:05 [utils.py:59] Prepared request paddings: [8, 16, 32, 64, 128, 256] +(EngineCore_DP0 pid=59613) INFO 11-14 06:26:05 [compilation_manager.py:34] Enabling JAX compile cache. +(EngineCore_DP0 pid=59613) INFO 11-14 06:26:05 [tpu_worker_jax.py:152] Init worker | rank=0 | node_id=0 | is_driver_worker=True | hbm=[(0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75)]GiB +(EngineCore_DP0 pid=59613) INFO 11-14 06:26:05 [model_loader.py:318] Loading model with MODEL_IMPL_TYPE=vllm +(EngineCore_DP0 pid=59613) WARNING 11-14 06:26:06 [rocm.py:34] Failed to import from amdsmi with ModuleNotFoundError("No module named 'amdsmi'") +(EngineCore_DP0 pid=59613) WARNING 11-14 06:26:06 [rocm.py:39] Failed to import from vllm._C with ModuleNotFoundError("No module named 'vllm._C'") +(EngineCore_DP0 pid=59613) WARNING 11-14 06:26:06 [rocm.py:45] Failed to import from vllm._rocm_C with ModuleNotFoundError("No module named 'vllm._rocm_C'") +(EngineCore_DP0 pid=59613) WARNING 11-14 06:26:06 [registry.py:171] _Backend has been renamed to AttentionBackendEnum. Please update your code to use AttentionBackendEnum instead. _Backend will be removed in a future release. +(EngineCore_DP0 pid=59613) INFO 11-14 06:26:06 [tpu_jax.py:63] Cannot use None backend on TPU. +(EngineCore_DP0 pid=59613) INFO 11-14 06:26:06 [tpu_jax.py:66] Using Pallas V1 backend. +(EngineCore_DP0 pid=59613) INFO 11-14 06:26:06 [layer.py:331] Disabling MoE shared_experts cuda stream +(EngineCore_DP0 pid=59613) Loading safetensors checkpoint shards: 0% Completed | 0/73 [00:00, 'use_cudagraph': True, 'cudagraph_num_of_warmups': 0, 'cudagraph_capture_sizes': None, 'cudagraph_copy_inputs': False, 'full_cuda_graph': False, 'cudagraph_specialize_lora': True, 'use_inductor_graph_partition': False, 'pass_config': {}, 'max_cudagraph_capture_size': 1024, 'local_cache_dir': None} +(EngineCore_DP0 pid=2733848) WARNING 11-12 22:33:02 [tpu_jax.py:228] Pin memory is not supported on TPU. +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +(EngineCore_DP0 pid=2733848) INFO 11-12 22:33:07 [parallel_state.py:1325] rank 0 in world size 1 is assigned as DP rank 0, PP rank 0, TP rank 0, EP rank 0 +(EngineCore_DP0 pid=2733848) INFO 11-12 22:33:08 [tpu_jax_runner.py:278] Creating new model mesh | devices=8, num_slices=1 +(EngineCore_DP0 pid=2733848) INFO 11-12 22:33:08 [tpu_jax_runner.py:273] Init mesh | mesh=Mesh('data': 2, 'attn_dp': 1, 'expert': 1, 'model': 4, axis_types=(Auto, Auto, Auto, Auto)) +(EngineCore_DP0 pid=2733848) INFO 11-12 22:33:08 [utils.py:314] Phased-based profiler enabled. Traces will be saved to: gs://wenxindong-vm/trace/gpt_oss/dp2/kv_98 +(EngineCore_DP0 pid=2733848) INFO 11-12 22:33:08 [utils.py:93] Prepared token paddings: [16, 32, 64, 128, 256, 512, 1024, 2048, 4096, 8192, 16384] +(EngineCore_DP0 pid=2733848) INFO 11-12 22:33:08 [utils.py:59] Prepared request paddings: [8, 16, 32, 64, 128, 256, 512] +(EngineCore_DP0 pid=2733848) INFO 11-12 22:33:08 [compilation_manager.py:34] Enabling JAX compile cache. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:33:08 [tpu_worker_jax.py:152] Init worker | rank=0 | node_id=0 | is_driver_worker=True | hbm=[(0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75)]GiB +(EngineCore_DP0 pid=2733848) INFO 11-12 22:33:08 [model_loader.py:318] Loading model with MODEL_IMPL_TYPE=vllm +(EngineCore_DP0 pid=2733848) WARNING 11-12 22:33:09 [rocm.py:34] Failed to import from amdsmi with ModuleNotFoundError("No module named 'amdsmi'") +(EngineCore_DP0 pid=2733848) WARNING 11-12 22:33:09 [rocm.py:39] Failed to import from vllm._C with ModuleNotFoundError("No module named 'vllm._C'") +(EngineCore_DP0 pid=2733848) WARNING 11-12 22:33:09 [rocm.py:45] Failed to import from vllm._rocm_C with ModuleNotFoundError("No module named 'vllm._rocm_C'") +(EngineCore_DP0 pid=2733848) WARNING 11-12 22:33:09 [registry.py:171] _Backend has been renamed to AttentionBackendEnum. Please update your code to use AttentionBackendEnum instead. _Backend will be removed in a future release. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:33:09 [tpu_jax.py:63] Cannot use None backend on TPU. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:33:09 [tpu_jax.py:66] Using Pallas V1 backend. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:33:09 [layer.py:331] Disabling MoE shared_experts cuda stream +(EngineCore_DP0 pid=2733848) Loading safetensors checkpoint shards: 0% Completed | 0/73 [00:00 {'num_tokens': 16} +(EngineCore_DP0 pid=2733848) /mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torchax/tensor.py:154: UserWarning: Explicitly requested dtype int64 requested in astype is not available, and will be truncated to dtype int32. To enable more dtypes, set the jax_enable_x64 configuration option or the JAX_ENABLE_X64 shell environment variable. See https://github.com/jax-ml/jax#current-gotchas for more. +(EngineCore_DP0 pid=2733848) res = jax_function(self._elem, *args, **kwargs) +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) INFO 11-12 22:34:57 [compilation_manager.py:67] Compilation finished in 11.39 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:34:57 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 32} +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:57] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:57] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:57] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) INFO 11-12 22:35:09 [compilation_manager.py:67] Compilation finished in 12.20 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:35:09 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 64} +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) INFO 11-12 22:35:22 [compilation_manager.py:67] Compilation finished in 12.88 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:35:22 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 128} +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:24] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:24] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:24] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:24] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:24] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:24] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:24] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:24] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:24] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:24] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:24] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:24] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:24] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:24] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) INFO 11-12 22:35:40 [compilation_manager.py:67] Compilation finished in 17.50 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:35:40 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 256} +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:40] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:40] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:40] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:40] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:40] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:40] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:40] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:40] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:40] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:40] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:40] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) INFO 11-12 22:35:58 [compilation_manager.py:67] Compilation finished in 18.27 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:35:58 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 512} +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) INFO 11-12 22:36:17 [compilation_manager.py:67] Compilation finished in 19.21 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:36:18 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 1024} +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:19] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:19] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:19] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:19] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:19] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:19] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:19] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:19] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:19] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:19] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) INFO 11-12 22:36:37 [compilation_manager.py:67] Compilation finished in 19.12 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:36:37 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 2048} +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) INFO 11-12 22:36:58 [compilation_manager.py:67] Compilation finished in 21.21 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:36:58 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 4096} +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) INFO 11-12 22:37:21 [compilation_manager.py:67] Compilation finished in 23.27 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:37:22 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 8192} +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) INFO 11-12 22:37:52 [compilation_manager.py:67] Compilation finished in 30.79 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:37:52 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 16384} +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:52] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:53] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:53] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:53] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:53] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:53] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:53] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:53] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:53] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:53] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:53] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:53] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:53] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:53] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:53] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:30 [compilation_manager.py:67] Compilation finished in 37.26 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:30 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 8} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:30 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:30 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 16} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:30 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:30 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 32} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:30 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:30 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 64} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:30 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:30 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 128} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:31 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:31 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 256} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:31 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:31 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 512} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:31 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:31 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 8} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:31 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:31 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 16} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:31 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:31 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 32} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:31 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:31 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 64} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:31 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:31 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 128} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:32 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:32 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 256} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:32 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:32 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 512} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:32 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:32 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 8} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:32 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:32 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 16} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:32 [compilation_manager.py:67] Compilation finished in 0.16 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:32 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 32} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:32 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:32 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 64} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:32 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:32 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 128} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:33 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:33 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 256} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:33 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:33 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 512} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:33 [compilation_manager.py:67] Compilation finished in 0.16 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:33 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 8} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:33 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:33 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 16} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:33 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:33 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 32} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:33 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:34 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 64} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:34 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:34 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 128} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:34 [compilation_manager.py:67] Compilation finished in 0.16 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:34 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 256} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:34 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:34 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 512} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:34 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:34 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 8} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:34 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:34 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 16} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:35 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:35 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 32} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:35 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:35 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 64} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:35 [compilation_manager.py:67] Compilation finished in 0.23 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:35 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 128} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:35 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:35 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 256} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:35 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:35 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 512} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:35 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:35 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 8} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:36 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:36 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 16} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:36 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:36 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 32} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:36 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:36 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 64} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:36 [compilation_manager.py:67] Compilation finished in 0.22 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:36 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 128} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:37 [compilation_manager.py:67] Compilation finished in 0.30 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:37 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 256} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:37 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:37 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 512} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:37 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:37 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 8} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:37 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:37 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 16} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:37 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:37 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 32} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:37 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:37 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 64} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:38 [compilation_manager.py:67] Compilation finished in 0.22 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:38 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 128} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:38 [compilation_manager.py:67] Compilation finished in 0.29 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:38 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 256} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:38 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:38 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 512} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:38 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:38 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 8} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:39 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:39 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 16} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:39 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:39 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 32} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:39 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:39 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 64} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:39 [compilation_manager.py:67] Compilation finished in 0.23 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:39 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 128} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:39 [compilation_manager.py:67] Compilation finished in 0.34 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:39 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 256} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:40 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:40 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 512} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:40 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:40 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 8} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:40 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:40 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 16} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:40 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:40 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 32} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:40 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:40 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 64} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:41 [compilation_manager.py:67] Compilation finished in 0.21 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:41 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 128} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:41 [compilation_manager.py:67] Compilation finished in 0.29 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:41 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 256} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:41 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:41 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 512} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:41 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:41 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 8} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:41 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:41 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 16} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:42 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:42 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 32} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:42 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:42 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 64} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:42 [compilation_manager.py:67] Compilation finished in 0.21 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:42 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 128} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:42 [compilation_manager.py:67] Compilation finished in 0.29 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:42 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 256} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:42 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:42 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 512} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:43 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:43 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 8} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:43 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:43 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 16} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:43 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:43 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 32} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:43 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:43 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 64} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:43 [compilation_manager.py:67] Compilation finished in 0.21 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:43 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 128} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:44 [compilation_manager.py:67] Compilation finished in 0.29 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:44 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 256} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:44 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:44 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 512} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:44 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:44 [compilation_manager.py:325] Compiling select_from_array with different input shapes. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:44 [compilation_manager.py:304] Compiling select_from_array for select all logits. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:44 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16, 'index_size': 8} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:44 [compilation_manager.py:67] Compilation finished in 0.08 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:44 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16, 'index_size': 16} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:44 [compilation_manager.py:67] Compilation finished in 0.09 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:45 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 32, 'index_size': 8} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:45 [compilation_manager.py:67] Compilation finished in 0.09 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:45 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 32, 'index_size': 16} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:45 [compilation_manager.py:67] Compilation finished in 0.09 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:45 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 32, 'index_size': 32} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:45 [compilation_manager.py:67] Compilation finished in 0.10 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:45 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 64, 'index_size': 8} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:45 [compilation_manager.py:67] Compilation finished in 0.09 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:45 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 64, 'index_size': 16} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:45 [compilation_manager.py:67] Compilation finished in 0.09 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:45 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 64, 'index_size': 32} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:45 [compilation_manager.py:67] Compilation finished in 0.10 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:45 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 64, 'index_size': 64} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:45 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:45 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 8} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:46 [compilation_manager.py:67] Compilation finished in 0.09 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:46 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 16} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:46 [compilation_manager.py:67] Compilation finished in 0.10 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:46 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 32} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:46 [compilation_manager.py:67] Compilation finished in 0.11 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:46 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 64} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:46 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:46 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 128} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:46 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:46 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 8} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:46 [compilation_manager.py:67] Compilation finished in 0.11 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:46 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 16} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:46 [compilation_manager.py:67] Compilation finished in 0.11 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:46 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 32} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:47 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:47 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 64} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:47 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:47 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 128} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:47 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:47 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 256} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:47 [compilation_manager.py:67] Compilation finished in 0.31 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:47 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 8} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:48 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:48 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 16} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:48 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:48 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 32} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:48 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:48 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 64} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:48 [compilation_manager.py:67] Compilation finished in 0.16 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:48 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 128} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:48 [compilation_manager.py:67] Compilation finished in 0.21 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:48 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 256} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:49 [compilation_manager.py:67] Compilation finished in 0.33 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:49 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 512} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:49 [compilation_manager.py:67] Compilation finished in 0.55 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:49 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 8} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:49 [compilation_manager.py:67] Compilation finished in 0.16 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:49 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 16} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:50 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:50 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 32} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:50 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:50 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 64} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:50 [compilation_manager.py:67] Compilation finished in 0.21 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:50 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 128} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:50 [compilation_manager.py:67] Compilation finished in 0.26 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:50 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 256} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:51 [compilation_manager.py:67] Compilation finished in 0.36 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:51 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 512} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:51 [compilation_manager.py:67] Compilation finished in 0.59 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:51 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 8} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:52 [compilation_manager.py:67] Compilation finished in 0.25 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:52 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 16} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:52 [compilation_manager.py:67] Compilation finished in 0.25 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:52 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 32} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:52 [compilation_manager.py:67] Compilation finished in 0.27 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:52 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 64} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:52 [compilation_manager.py:67] Compilation finished in 0.30 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:52 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 128} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:53 [compilation_manager.py:67] Compilation finished in 0.35 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:53 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 256} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:53 [compilation_manager.py:67] Compilation finished in 0.52 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:53 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 512} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:54 [compilation_manager.py:67] Compilation finished in 0.76 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:54 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 8} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:55 [compilation_manager.py:67] Compilation finished in 0.46 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:55 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 16} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:55 [compilation_manager.py:67] Compilation finished in 0.44 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:55 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 32} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:56 [compilation_manager.py:67] Compilation finished in 0.45 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:56 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 64} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:56 [compilation_manager.py:67] Compilation finished in 0.47 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:56 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 128} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:57 [compilation_manager.py:67] Compilation finished in 0.54 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:57 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 256} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:57 [compilation_manager.py:67] Compilation finished in 0.64 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:57 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 512} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:57 [compilation_manager.py:67] Compilation finished in 0.02 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:58 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 8} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:58 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:58 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 16} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:58 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:58 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 32} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:58 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:58 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 64} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:58 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:58 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 128} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:58 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:58 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 256} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:59 [compilation_manager.py:67] Compilation finished in 0.32 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:59 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 512} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:59 [compilation_manager.py:67] Compilation finished in 0.58 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:59 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 8} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:00 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:00 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 16} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:00 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:00 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 32} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:00 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:00 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 64} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:00 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:00 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 128} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:00 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:00 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 256} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:00 [compilation_manager.py:67] Compilation finished in 0.31 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:00 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 512} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:01 [compilation_manager.py:67] Compilation finished in 0.60 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:01 [compilation_manager.py:365] Compiling compute_logits with different input shapes. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:01 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 8} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:01 [compilation_manager.py:67] Compilation finished in 0.28 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:01 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 16} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:02 [compilation_manager.py:67] Compilation finished in 0.27 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:02 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 32} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:02 [compilation_manager.py:67] Compilation finished in 0.32 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:02 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 64} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:02 [compilation_manager.py:67] Compilation finished in 0.36 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:02 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 128} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:03 [compilation_manager.py:67] Compilation finished in 0.77 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:03 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 256} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:03 [compilation_manager.py:67] Compilation finished in 0.02 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:03 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 512} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:04 [compilation_manager.py:67] Compilation finished in 0.84 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:04 [compilation_manager.py:387] Compiling sampling with different input shapes. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:05 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 8, 'do_sampling': True} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:05 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:05 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 8, 'do_sampling': False} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:05 [compilation_manager.py:67] Compilation finished in 0.21 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:05 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 16, 'do_sampling': True} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:06 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:06 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 16, 'do_sampling': False} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:06 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:06 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 32, 'do_sampling': True} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:06 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:06 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 32, 'do_sampling': False} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:07 [compilation_manager.py:67] Compilation finished in 0.31 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:07 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 64, 'do_sampling': True} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:07 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:07 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 64, 'do_sampling': False} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:08 [compilation_manager.py:67] Compilation finished in 0.53 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:08 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 128, 'do_sampling': True} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:08 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:08 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 128, 'do_sampling': False} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:08 [compilation_manager.py:67] Compilation finished in 0.02 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:09 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 256, 'do_sampling': True} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:09 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:09 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 256, 'do_sampling': False} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:09 [compilation_manager.py:67] Compilation finished in 0.22 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:09 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 512, 'do_sampling': True} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:09 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:09 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 512, 'do_sampling': False} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:10 [compilation_manager.py:67] Compilation finished in 0.39 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:10 [compilation_manager.py:455] Compiling gather_logprobs with different input shapes. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:10 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 8} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:11 [compilation_manager.py:67] Compilation finished in 0.70 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:11 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 16} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:11 [compilation_manager.py:67] Compilation finished in 0.78 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:11 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 32} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:11 [compilation_manager.py:67] Compilation finished in 0.05 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:11 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 64} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:11 [compilation_manager.py:67] Compilation finished in 0.04 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:11 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 128} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:11 [compilation_manager.py:67] Compilation finished in 0.05 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:11 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 256} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:11 [compilation_manager.py:67] Compilation finished in 0.04 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:11 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 512} +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:12 [compilation_manager.py:67] Compilation finished in 0.04 [secs]. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:12 [compilation_manager.py:751] Compiling structured_decoding with different input shapes. +(EngineCore_DP0 pid=2733848) WARNING 11-12 22:39:12 [compilation_manager.py:754] Structured decoding precompilation skipped since structured decoding is not supported with DP. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:12 [core.py:247] init engine (profile, create kv cache, warmup model) took 270.28 seconds +(EngineCore_DP0 pid=2733848) WARNING 11-12 22:39:12 [scheduler.py:158] Using custom scheduler class . This scheduler interface is not public and compatibility may not be maintained. +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:12 [dp_scheduler.py:93] DPScheduler (Async = True) per-rank limits: max_seqs=256, max_tokens=8192 +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:12 [core.py:181] Batch queue is enabled with size 2 +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:13 [tpu_jax.py:118] Initialized sharding configuration: ShardingConfigManager(total_devices=4, sharding_strategy=ShardingStrategy(tensor_parallelism=4, expert_parallelism=1, sequence_parallelism=1, data_parallelism=1, attention_data_parallelism=1), device_indexes=None) +(EngineCore_DP0 pid=2733848) WARNING 11-12 22:39:13 [tpu_jax.py:156] The model dtype is not properly set for JAX backend. Overwriting it to jnp.bfloat16 +(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:13 [tpu_jax.py:192] Force using UniProcExecutor for JAX on single host. +(APIServer pid=2733675) [INFO] model_hosting_container_standards - decorators.py:76: [PING] Framework handler registered: ping +(APIServer pid=2733675) [2025-11-12 22:39:13] INFO decorators.py:76: [PING] Framework handler registered: ping +(APIServer pid=2733675) [INFO] model_hosting_container_standards.common.transforms.base_factory - base_factory.py:90: [INJECT_ADAPTER_ID] Transform decorator applied to: invocations +(APIServer pid=2733675) [2025-11-12 22:39:13] INFO base_factory.py:90: [INJECT_ADAPTER_ID] Transform decorator applied to: invocations +(APIServer pid=2733675) [INFO] model_hosting_container_standards.common.transforms.base_factory - base_factory.py:115: [INJECT_ADAPTER_ID] Registered transform handler for invocations +(APIServer pid=2733675) [2025-11-12 22:39:13] INFO base_factory.py:115: [INJECT_ADAPTER_ID] Registered transform handler for invocations +(APIServer pid=2733675) [INFO] model_hosting_container_standards.common.transforms.base_factory - base_factory.py:90: [STATEFUL_SESSION_MANAGER] Transform decorator applied to: decorated_func +(APIServer pid=2733675) [2025-11-12 22:39:13] INFO base_factory.py:90: [STATEFUL_SESSION_MANAGER] Transform decorator applied to: decorated_func +(APIServer pid=2733675) [INFO] model_hosting_container_standards.common.transforms.base_factory - base_factory.py:115: [STATEFUL_SESSION_MANAGER] Registered transform handler for decorated_func +(APIServer pid=2733675) [2025-11-12 22:39:13] INFO base_factory.py:115: [STATEFUL_SESSION_MANAGER] Registered transform handler for decorated_func +(APIServer pid=2733675) [INFO] model_hosting_container_standards - decorators.py:76: [INVOKE] Framework handler registered: decorated_func +(APIServer pid=2733675) [2025-11-12 22:39:13] INFO decorators.py:76: [INVOKE] Framework handler registered: decorated_func +(APIServer pid=2733675) [INFO] model_hosting_container_standards - __init__.py:127: Starting SageMaker bootstrap process +(APIServer pid=2733675) [2025-11-12 22:39:13] INFO __init__.py:127: Starting SageMaker bootstrap process +(APIServer pid=2733675) [INFO] model_hosting_container_standards - registry.py:109: [REGISTRY] Middleware resolution and registration complete +(APIServer pid=2733675) [2025-11-12 22:39:13] INFO registry.py:109: [REGISTRY] Middleware resolution and registration complete +(APIServer pid=2733675) [INFO] model_hosting_container_standards - core.py:100: [MIDDLEWARE_LOADER] Middleware stack rebuilt successfully +(APIServer pid=2733675) [2025-11-12 22:39:13] INFO core.py:100: [MIDDLEWARE_LOADER] Middleware stack rebuilt successfully +(APIServer pid=2733675) [INFO] model_hosting_container_standards - core.py:102: [MIDDLEWARE_LOADER] Processed 3 middlewares +(APIServer pid=2733675) [2025-11-12 22:39:13] INFO core.py:102: [MIDDLEWARE_LOADER] Processed 3 middlewares +(APIServer pid=2733675) [WARNING] model_hosting_container_standards.common.custom_code_ref_resolver.function_loader - function_loader.py:73: Failed to load function from spec 'model:custom_sagemaker_invocation_handler': HandlerFileNotFoundError: File '/opt/ml/model/model.py' not found in search paths: ['/opt/ml/model/'] +(APIServer pid=2733675) [2025-11-12 22:39:13] WARNING function_loader.py:73: Failed to load function from spec 'model:custom_sagemaker_invocation_handler': HandlerFileNotFoundError: File '/opt/ml/model/model.py' not found in search paths: ['/opt/ml/model/'] +(APIServer pid=2733675) [WARNING] model_hosting_container_standards.common.custom_code_ref_resolver.function_loader - function_loader.py:73: Failed to load function from spec 'model:custom_sagemaker_ping_handler': HandlerFileNotFoundError: File '/opt/ml/model/model.py' not found in search paths: ['/opt/ml/model/'] +(APIServer pid=2733675) [2025-11-12 22:39:13] WARNING function_loader.py:73: Failed to load function from spec 'model:custom_sagemaker_ping_handler': HandlerFileNotFoundError: File '/opt/ml/model/model.py' not found in search paths: ['/opt/ml/model/'] +(APIServer pid=2733675) [INFO] model_hosting_container_standards.sagemaker.sagemaker_router - sagemaker_router.py:93: Creating SageMaker router with unified route resolver +(APIServer pid=2733675) [2025-11-12 22:39:13] INFO sagemaker_router.py:93: Creating SageMaker router with unified route resolver +(APIServer pid=2733675) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:172: Creating router with prefix='', tags=['sagemaker'] +(APIServer pid=2733675) [2025-11-12 22:39:13] INFO routing.py:172: Creating router with prefix='', tags=['sagemaker'] +(APIServer pid=2733675) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:110: Mounting 2 handlers to router +(APIServer pid=2733675) [2025-11-12 22:39:13] INFO routing.py:110: Mounting 2 handlers to router +(APIServer pid=2733675) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:184: Router created with 0 routes +(APIServer pid=2733675) [2025-11-12 22:39:13] INFO routing.py:184: Router created with 0 routes +(APIServer pid=2733675) [INFO] model_hosting_container_standards.sagemaker.sagemaker_router - sagemaker_router.py:101: SageMaker router created successfully with 0 routes +(APIServer pid=2733675) [2025-11-12 22:39:13] INFO sagemaker_router.py:101: SageMaker router created successfully with 0 routes +(APIServer pid=2733675) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:287: Including router with conflict detection +(APIServer pid=2733675) [2025-11-12 22:39:13] INFO routing.py:287: Including router with conflict detection +(APIServer pid=2733675) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:305: Successfully included router with 0 routes +(APIServer pid=2733675) [2025-11-12 22:39:13] INFO routing.py:305: Successfully included router with 0 routes +(APIServer pid=2733675) [INFO] model_hosting_container_standards - __init__.py:139: SageMaker bootstrap completed successfully +(APIServer pid=2733675) [2025-11-12 22:39:13] INFO __init__.py:139: SageMaker bootstrap completed successfully +(APIServer pid=2733675) INFO 11-12 22:39:13 [api_server.py:1662] Supported tasks: ['generate'] +(APIServer pid=2733675) WARNING 11-12 22:39:13 [serving_responses.py:189] For gpt-oss, we ignore --enable-auto-tool-choice and always enable tool use. +(APIServer pid=2733675) INFO 11-12 22:39:13 [api_server.py:1972] Starting vLLM API server 0 on http://0.0.0.0:8000 +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:38] Available routes are: +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /openapi.json, Methods: GET, HEAD +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /docs, Methods: GET, HEAD +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /docs/oauth2-redirect, Methods: GET, HEAD +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /redoc, Methods: GET, HEAD +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /health, Methods: GET +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /load, Methods: GET +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /tokenize, Methods: POST +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /detokenize, Methods: POST +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /v1/models, Methods: GET +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /version, Methods: GET +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /v1/responses, Methods: POST +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /v1/responses/{response_id}, Methods: GET +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /v1/responses/{response_id}/cancel, Methods: POST +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /v1/messages, Methods: POST +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /v1/chat/completions, Methods: POST +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /v1/completions, Methods: POST +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /v1/embeddings, Methods: POST +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /pooling, Methods: POST +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /classify, Methods: POST +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /score, Methods: POST +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /v1/score, Methods: POST +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /v1/audio/transcriptions, Methods: POST +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /v1/audio/translations, Methods: POST +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /rerank, Methods: POST +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /v1/rerank, Methods: POST +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /v2/rerank, Methods: POST +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /scale_elastic_ep, Methods: POST +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /is_scaling_elastic_ep, Methods: POST +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /ping, Methods: GET +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /ping, Methods: POST +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /invocations, Methods: POST +(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /metrics, Methods: GET +(APIServer pid=2733675) INFO: Started server process [2733675] +(APIServer pid=2733675) INFO: Waiting for application startup. +(APIServer pid=2733675) INFO: Application startup complete. +(APIServer pid=2733675) INFO: 127.0.0.1:46880 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO 11-12 22:39:34 [loggers.py:221] Engine 000: Avg prompt throughput: 204.8 tokens/s, Avg generation throughput: 50.8 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:39:44 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 127.0 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:39:54 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 122.5 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:40:04 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 117.4 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.2%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:40:14 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 118.0 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.2%, Prefix cache hit rate: 0.0% +(EngineCore_DP0 pid=2733848) WARNING 11-12 22:40:20 [tpu_jax_runner.py:666] Should not schedule a request that does nothing! +(APIServer pid=2733675) INFO: 127.0.0.1:46880 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49068 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49078 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49094 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49098 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49112 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49116 - "POST /v1/completions HTTP/1.1" 200 OK +(EngineCore_DP0 pid=2733848) INFO 11-12 22:40:21 [utils.py:358] Starting profiling for prefill_heavy phase +(EngineCore_DP0 pid=2733848) INFO 11-12 22:40:21 [utils.py:359] Batch composition stats: {'total_num_scheduled_tokens': 8192, 'num_prefill_tokens': 12288, 'num_decode_tokens': 1, 'padded_total_num_scheduled_tokens': 16384, 'num_reqs': 7} +(APIServer pid=2733675) INFO: 127.0.0.1:49120 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49124 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49130 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49138 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49146 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49156 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49166 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49178 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49188 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49200 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49204 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49206 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49220 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49228 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49244 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49258 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49274 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49278 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49294 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49304 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49306 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49316 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49324 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49340 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49346 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49358 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49362 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49364 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49366 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49376 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49386 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49392 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49400 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49404 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49416 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49432 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49446 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49456 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49468 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49482 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49484 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49496 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49508 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49510 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49526 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49534 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49548 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49552 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49562 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49568 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49582 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49592 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49594 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49596 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49608 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49622 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49630 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49646 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49662 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49674 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49682 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49696 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49700 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49712 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49720 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49728 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49736 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49738 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49754 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49766 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49768 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49770 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49780 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49788 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49798 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49814 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49830 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49832 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49848 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49854 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49864 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49874 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49876 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49880 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49886 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49896 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49904 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49908 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49914 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49916 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49928 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49932 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49948 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49950 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49960 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49964 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49970 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49976 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49980 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:49996 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50008 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50020 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50026 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50030 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50038 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50054 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50070 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50078 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50090 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50092 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50102 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50106 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50112 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50116 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50120 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50122 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50126 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50142 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50146 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50158 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50174 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50184 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50192 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50196 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50200 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50216 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50218 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50234 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50238 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50242 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50252 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50262 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50268 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50276 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50280 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50288 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50290 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50304 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50314 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50330 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50332 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50336 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50344 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50346 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50350 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50362 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50368 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50384 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50400 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50412 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50428 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50430 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50436 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50438 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50452 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50458 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50466 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50470 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50474 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50484 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50494 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50498 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50506 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50522 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50528 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50530 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50542 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50552 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50558 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50568 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50584 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50590 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50594 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50596 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50612 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50614 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50620 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50628 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50640 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50646 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50662 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50666 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50682 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50690 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50692 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50704 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50714 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50718 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50732 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50740 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50744 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50760 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50768 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50780 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50790 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50798 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50812 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50824 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50834 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50844 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50850 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50862 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50876 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50880 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50886 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50900 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50910 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50924 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50932 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50934 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50936 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50938 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50948 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50950 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50960 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50970 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50982 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50984 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:50986 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51002 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51014 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51030 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51044 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51056 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51058 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51074 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51088 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51090 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51102 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51108 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51124 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51128 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51130 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51132 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51148 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51162 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51174 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51182 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51186 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51198 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51202 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51208 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51216 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51230 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51242 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51252 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51258 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51264 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51280 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51294 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51308 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51310 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51320 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51324 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51326 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51334 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51348 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51364 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51370 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51378 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51390 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51398 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51408 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51420 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51434 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51444 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51454 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51458 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51474 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51482 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51492 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51506 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51512 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51528 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51532 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51538 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51546 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51558 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51566 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51574 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51584 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51594 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51598 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51608 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51622 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51636 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51650 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51658 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51660 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51666 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51672 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51676 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51692 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51694 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51702 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51716 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51724 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51726 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51734 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51748 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51758 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51770 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51776 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51778 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51788 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51794 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51810 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51820 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51826 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51832 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51844 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51846 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51862 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51866 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51882 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51896 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51912 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51926 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51942 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51956 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51958 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51968 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51972 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:51984 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52000 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52012 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52016 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52018 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52032 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52048 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52056 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52062 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52064 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52068 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52078 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52094 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52098 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52106 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52110 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52112 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52126 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52136 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52142 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52156 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52158 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52164 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52176 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52192 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52204 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52212 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52216 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52232 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52234 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52240 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52242 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52258 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52264 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52276 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52278 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52280 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52284 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52292 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52298 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52312 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52324 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52326 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52330 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52344 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52358 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52370 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52378 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52388 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52404 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52408 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52416 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52420 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52436 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52442 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52450 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52456 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52470 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52472 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52488 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52500 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52504 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52520 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52526 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52534 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52540 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52542 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52554 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52566 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52572 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52580 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52586 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52602 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52608 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52614 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52630 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52638 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52642 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52654 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52656 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52664 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52668 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52672 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52680 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52684 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52696 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52706 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52710 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52724 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52732 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52746 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52760 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52774 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52788 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52790 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52800 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52814 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52824 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52840 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52848 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52852 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52856 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52870 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52876 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52878 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52890 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52892 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52906 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52908 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52912 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52926 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52930 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52942 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52948 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52952 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52962 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52972 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52978 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:52992 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53006 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53014 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53030 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53034 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53044 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53060 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53064 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53072 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53082 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53086 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53092 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53096 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53108 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53120 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53132 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53138 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53146 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53158 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53162 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53164 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53174 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53190 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53198 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53210 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53224 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53240 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53248 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53262 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53266 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53270 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53284 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53286 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53300 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53306 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53312 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53320 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53322 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53326 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53340 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53352 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53360 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53376 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53390 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53392 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53406 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53410 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53424 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53432 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53438 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53440 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53450 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53454 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53468 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53474 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53476 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53488 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53500 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53512 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53518 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53532 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53534 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53550 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53562 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53564 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53570 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53586 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53592 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53596 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53602 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53618 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53626 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53628 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53636 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53644 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53658 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53666 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53672 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53674 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53682 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53698 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53714 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53716 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53718 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53730 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53736 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53752 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53758 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53774 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53786 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53790 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53806 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53810 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53822 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53828 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53838 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53850 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53864 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53870 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53876 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53880 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53888 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53904 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53912 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53922 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53936 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53946 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53960 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53970 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53978 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53982 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:53990 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54002 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54008 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54024 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54028 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54034 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54046 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54052 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54056 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54058 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54064 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54080 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54092 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54104 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54114 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54122 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54124 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54132 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54146 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54158 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54164 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54168 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54174 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54180 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54196 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54206 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54216 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54228 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54238 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54254 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54260 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54262 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54264 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54276 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54278 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54288 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54302 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54318 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54320 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54322 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54328 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54330 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54332 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54346 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54350 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54356 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54368 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54380 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54390 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54400 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54402 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54418 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54428 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54436 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54452 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54454 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54456 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54462 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54476 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54480 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54494 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54496 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54498 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54504 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54516 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54518 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54530 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54538 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54540 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54552 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54562 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54576 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54590 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54594 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54598 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54610 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54622 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54638 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54652 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54658 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54660 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54674 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54684 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54692 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54702 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54716 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54722 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54726 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54736 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54738 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54742 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54752 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54754 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54756 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54764 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54776 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54778 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54786 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54788 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54798 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54812 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54824 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54828 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54834 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54850 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54854 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54860 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54862 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54868 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54884 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54896 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54904 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54916 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54930 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54944 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54958 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54966 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54982 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:54996 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55006 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55016 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55020 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55030 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55042 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55058 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55066 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55072 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55082 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55098 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55102 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55118 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55124 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55140 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55146 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55160 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55162 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55176 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55180 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55188 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55204 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55206 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55208 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55224 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55228 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55242 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55254 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55258 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55268 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55284 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55300 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55304 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55308 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55310 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55318 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55334 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55344 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55352 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55354 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55364 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55376 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55390 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55394 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55396 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55406 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55420 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55426 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55432 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55440 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55454 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55470 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55484 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55486 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55500 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55510 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55514 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55522 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55528 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55540 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55556 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55562 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55564 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55574 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55590 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55594 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55598 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55604 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55610 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55620 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55634 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55642 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55648 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55660 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55666 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55674 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55684 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55692 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55698 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55710 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55720 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55726 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55732 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55734 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55740 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55750 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55766 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55780 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55790 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55798 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55804 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55810 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55822 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55828 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55838 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55846 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55862 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55878 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55892 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55894 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55900 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55906 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55910 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55918 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55926 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55938 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55940 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55944 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55954 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55956 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55964 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55970 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55986 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:55992 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56004 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56014 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56016 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56032 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56040 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56056 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56058 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56066 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56080 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56096 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56110 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56120 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56134 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56140 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56150 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56152 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56168 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56172 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56176 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56190 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56206 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56214 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56218 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56228 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56240 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56242 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56248 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56250 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56252 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56256 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56262 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56278 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56282 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56298 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56310 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56318 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56330 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56334 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56336 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56342 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56346 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56354 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56356 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56362 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56370 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56384 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56396 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56412 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56418 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56428 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56444 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56460 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56462 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56472 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56482 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56496 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56506 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56516 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56530 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56536 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56552 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56558 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56568 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56578 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56592 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56602 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56610 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56618 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56626 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56628 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56630 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56632 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56642 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56654 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56660 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56668 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56682 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56690 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56692 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56700 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56714 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56718 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56724 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56734 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56738 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56748 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56752 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56760 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56766 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56782 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56790 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56792 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56798 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56812 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56828 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56844 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56848 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56850 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56862 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56866 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56878 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56880 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56894 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56900 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56912 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56928 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56940 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56942 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56948 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56954 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56968 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56970 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56986 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:56992 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57006 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57012 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57018 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57034 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57044 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57056 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57064 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57070 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57078 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57088 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57104 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57114 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57116 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57128 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57136 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57148 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57150 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57156 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57162 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57174 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57180 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57196 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57198 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57204 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57210 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57218 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57234 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57242 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57244 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57258 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57268 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57274 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57286 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57290 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57300 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57316 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57332 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57338 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57350 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57362 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57374 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57388 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57392 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57400 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57406 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57408 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57422 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57436 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57450 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57458 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57472 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57488 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57496 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57500 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57514 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57516 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57518 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57524 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57540 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57552 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57554 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57556 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57568 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57570 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57582 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57590 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57596 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57612 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57624 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57634 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57648 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57660 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57676 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57686 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57688 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57694 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57698 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57714 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57720 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57728 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57744 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57756 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57772 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57788 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57792 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57804 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57810 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57824 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57836 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57842 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57856 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57866 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57874 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57886 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57888 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57900 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57914 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57930 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57946 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57958 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57972 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57974 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:57990 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:58006 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:58016 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:58024 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:58028 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:58038 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:58050 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:58056 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:58064 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:58066 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:58074 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:58080 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:58088 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:58094 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:58110 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:58124 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO: 127.0.0.1:58136 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2733675) INFO 11-12 22:40:24 [loggers.py:221] Engine 000: Avg prompt throughput: 5938.7 tokens/s, Avg generation throughput: 86.6 tokens/s, Running: 39 reqs, Waiting: 985 reqs, GPU KV cache usage: 2.1%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:40:34 [loggers.py:221] Engine 000: Avg prompt throughput: 8192.1 tokens/s, Avg generation throughput: 26.5 tokens/s, Running: 79 reqs, Waiting: 945 reqs, GPU KV cache usage: 4.2%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:40:44 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 0.0 tokens/s, Running: 79 reqs, Waiting: 945 reqs, GPU KV cache usage: 4.2%, Prefix cache hit rate: 0.0% +(EngineCore_DP0 pid=2733848) INFO 11-12 22:40:45 [utils.py:397] Profiling for prefill_heavy phase finished +(APIServer pid=2733675) INFO 11-12 22:40:54 [loggers.py:221] Engine 000: Avg prompt throughput: 34405.1 tokens/s, Avg generation throughput: 329.7 tokens/s, Running: 247 reqs, Waiting: 777 reqs, GPU KV cache usage: 13.3%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:41:04 [loggers.py:221] Engine 000: Avg prompt throughput: 35225.6 tokens/s, Avg generation throughput: 718.6 tokens/s, Running: 419 reqs, Waiting: 605 reqs, GPU KV cache usage: 22.6%, Prefix cache hit rate: 0.0% +(EngineCore_DP0 pid=2733848) INFO 11-12 22:41:09 [utils.py:358] Starting profiling for decode_heavy phase +(EngineCore_DP0 pid=2733848) INFO 11-12 22:41:09 [utils.py:359] Batch composition stats: {'total_num_scheduled_tokens': 256, 'num_prefill_tokens': 0, 'num_decode_tokens': 512, 'padded_total_num_scheduled_tokens': 512, 'num_reqs': 512} +(APIServer pid=2733675) INFO 11-12 22:41:14 [loggers.py:221] Engine 000: Avg prompt throughput: 21094.6 tokens/s, Avg generation throughput: 1114.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 27.8%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:41:24 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 0.0 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 27.8%, Prefix cache hit rate: 0.0% +(EngineCore_DP0 pid=2733848) INFO 11-12 22:41:28 [utils.py:397] Profiling for decode_heavy phase finished +(APIServer pid=2733675) INFO 11-12 22:41:34 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5579.2 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 27.8%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:41:44 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10390.5 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 30.9%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:41:54 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10338.8 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 34.0%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:42:04 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10285.1 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 35.1%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:42:14 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10291.0 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 37.1%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:42:24 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10238.1 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 40.2%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:42:34 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10185.9 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 43.3%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:42:44 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10135.1 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 45.7%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:42:54 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10134.2 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 46.4%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:43:04 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10084.2 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 49.5%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:43:14 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8445.7 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 52.6%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:43:24 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7679.7 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 52.6%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:43:34 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8448.2 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 55.6%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:43:44 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8394.7 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 58.7%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:43:54 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8394.0 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 58.7%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:44:04 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8345.2 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 61.8%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:44:14 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8259.0 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 63.9%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:44:24 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8343.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 64.9%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:44:34 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8289.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 68.0%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:44:44 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8241.3 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 68.9%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:44:54 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8191.5 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 71.1%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:45:04 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8188.7 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 74.2%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:45:14 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8190.5 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 74.2%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:45:24 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8138.4 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 77.3%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:45:34 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8089.5 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 79.5%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:45:44 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8089.5 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 80.4%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:45:54 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8087.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 83.5%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:46:04 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8036.0 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 83.8%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:46:14 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8036.4 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 86.6%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:46:24 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8034.2 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 89.7%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:46:34 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7983.4 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 89.7%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:46:44 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7933.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 92.7%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:46:54 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7934.3 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 93.7%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:47:04 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7933.4 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 95.8%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:47:14 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7880.3 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 98.9%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:47:24 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7883.3 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 98.9%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:47:34 [loggers.py:221] Engine 000: Avg prompt throughput: 26416.4 tokens/s, Avg generation throughput: 2387.5 tokens/s, Running: 502 reqs, Waiting: 373 reqs, GPU KV cache usage: 77.5%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:47:44 [loggers.py:221] Engine 000: Avg prompt throughput: 33176.0 tokens/s, Avg generation throughput: 1044.4 tokens/s, Running: 498 reqs, Waiting: 211 reqs, GPU KV cache usage: 54.3%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:47:54 [loggers.py:221] Engine 000: Avg prompt throughput: 35224.7 tokens/s, Avg generation throughput: 1090.2 tokens/s, Running: 496 reqs, Waiting: 41 reqs, GPU KV cache usage: 30.4%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:48:04 [loggers.py:221] Engine 000: Avg prompt throughput: 10034.3 tokens/s, Avg generation throughput: 7773.2 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 27.8%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:48:14 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10390.6 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 30.9%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:48:24 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10339.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 34.0%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:48:34 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10391.6 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 36.4%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:48:44 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10288.2 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 37.1%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:48:54 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10289.0 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 40.2%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:49:04 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10188.3 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 43.3%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:49:14 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10186.3 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 46.4%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:49:24 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10183.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 47.6%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:49:34 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10083.9 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 49.5%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:49:44 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7881.9 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 52.6%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:49:54 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8036.2 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 53.6%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:50:04 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8393.8 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 55.6%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:50:14 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8445.8 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 58.7%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:50:24 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8395.7 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 58.9%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:50:34 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8343.2 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 61.8%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:50:44 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8342.6 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 64.9%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:50:54 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8292.0 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 64.9%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:51:04 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8291.7 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 68.0%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:51:14 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8240.3 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 70.2%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:51:24 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8241.2 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 71.1%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:51:34 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8189.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 74.2%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:51:44 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8189.4 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 74.9%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:51:54 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8138.4 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 77.3%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:52:04 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8136.9 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 80.4%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:52:14 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8088.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 80.4%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:52:24 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8087.2 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 83.5%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:52:34 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8038.6 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 85.3%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:52:44 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8038.8 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 86.6%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:52:54 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8035.7 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 89.7%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:53:04 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7986.5 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 89.7%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:53:14 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7982.5 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 92.7%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:53:24 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7935.4 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 95.2%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:53:34 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7935.9 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 95.8%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:53:44 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7885.0 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 98.9%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:53:54 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7925.2 tokens/s, Running: 477 reqs, Waiting: 0 reqs, GPU KV cache usage: 92.2%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:54:04 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 1488.2 tokens/s, Running: 0 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.0%, Prefix cache hit rate: 0.0% +(APIServer pid=2733675) INFO 11-12 22:54:14 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 0.0 tokens/s, Running: 0 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.0%, Prefix cache hit rate: 0.0% diff --git a/oss_log_attn_dp.txt b/oss_log_attn_dp.txt new file mode 100644 index 000000000..7672ef726 --- /dev/null +++ b/oss_log_attn_dp.txt @@ -0,0 +1,2564 @@ +INFO 11-13 00:09:36 [__init__.py:26] TPU info: node_name=cuiq-infer-v7-2 | tpu_type=tpu7x-8 | worker_id=0 | num_chips=8 | num_cores_per_chip=2 +INFO 11-13 00:09:36 [importing.py:44] Triton is installed but 0 active driver(s) found (expected 1). Disabling Triton to prevent runtime errors. +INFO 11-13 00:09:36 [importing.py:68] Triton not installed or not compatible; certain GPU-related functions will not be available. +WARNING 11-13 00:09:36 [interface.py:197] Failed to import from vllm._C: ModuleNotFoundError("No module named 'vllm._C'") +(APIServer pid=2993839) INFO 11-13 00:09:37 [api_server.py:1897] vLLM API server version 0.11.1rc7.dev48+gdf4d3a44a +(APIServer pid=2993839) INFO 11-13 00:09:37 [utils.py:253] non-default args: {'model_tag': 'unsloth/gpt-oss-120b-BF16', 'model': 'unsloth/gpt-oss-120b-BF16', 'max_model_len': 8192, 'download_dir': '/mnt/disks/persist', 'tensor_parallel_size': 8, 'gpu_memory_utilization': 0.95, 'enable_prefix_caching': False, 'max_num_batched_tokens': 8192, 'max_num_seqs': 256, 'async_scheduling': True, 'additional_config': {'sharding': {'sharding_strategy': {'enable_dp_attention': 1}}}} +(APIServer pid=2993839) INFO 11-13 00:09:37 [model.py:630] Resolved architecture: GptOssForCausalLM +(APIServer pid=2993839) INFO 11-13 00:09:37 [model.py:1728] Using max model len 8192 +(APIServer pid=2993839) INFO 11-13 00:09:37 [scheduler.py:254] Chunked prefill is enabled with max_num_batched_tokens=8192. +(APIServer pid=2993839) INFO 11-13 00:09:37 [config.py:272] Overriding max cuda graph capture size to 1024 for performance. +(APIServer pid=2993839) INFO 11-13 00:09:37 [tpu_jax.py:118] Initialized sharding configuration: ShardingConfigManager(total_devices=8, sharding_strategy=ShardingStrategy(tensor_parallelism=4, expert_parallelism=1, sequence_parallelism=1, data_parallelism=1, attention_data_parallelism=2), device_indexes=None) +(APIServer pid=2993839) WARNING 11-13 00:09:37 [tpu_jax.py:156] The model dtype is not properly set for JAX backend. Overwriting it to jnp.bfloat16 +(APIServer pid=2993839) INFO 11-13 00:09:37 [tpu_jax.py:192] Force using UniProcExecutor for JAX on single host. +INFO 11-13 00:09:41 [__init__.py:26] TPU info: node_name=cuiq-infer-v7-2 | tpu_type=tpu7x-8 | worker_id=0 | num_chips=8 | num_cores_per_chip=2 +INFO 11-13 00:09:41 [importing.py:44] Triton is installed but 0 active driver(s) found (expected 1). Disabling Triton to prevent runtime errors. +INFO 11-13 00:09:41 [importing.py:68] Triton not installed or not compatible; certain GPU-related functions will not be available. +WARNING 11-13 00:09:41 [interface.py:197] Failed to import from vllm._C: ModuleNotFoundError("No module named 'vllm._C'") +(EngineCore_DP0 pid=2993997) INFO 11-13 00:09:42 [core.py:94] Initializing a V1 LLM engine (v0.11.1rc7.dev48+gdf4d3a44a) with config: model='unsloth/gpt-oss-120b-BF16', speculative_config=None, tokenizer='unsloth/gpt-oss-120b-BF16', skip_tokenizer_init=False, tokenizer_mode=auto, revision=None, tokenizer_revision=None, trust_remote_code=False, dtype=torch.bfloat16, max_seq_len=8192, download_dir='/mnt/disks/persist', load_format=auto, tensor_parallel_size=8, pipeline_parallel_size=1, data_parallel_size=1, disable_custom_all_reduce=True, quantization=None, enforce_eager=False, kv_cache_dtype=auto, device_config=None, structured_outputs_config=StructuredOutputsConfig(backend='auto', disable_fallback=False, disable_any_whitespace=False, disable_additional_properties=False, reasoning_parser='openai_gptoss', reasoning_parser_plugin='', enable_in_reasoning=False), observability_config=ObservabilityConfig(show_hidden_metrics_for_version=None, otlp_traces_endpoint=None, collect_detailed_traces=None), seed=0, served_model_name=unsloth/gpt-oss-120b-BF16, enable_prefix_caching=False, chunked_prefill_enabled=True, pooler_config=None, compilation_config={'level': None, 'mode': 2, 'debug_dump_path': None, 'cache_dir': '', 'compile_cache_save_format': 'binary', 'backend': 'openxla', 'custom_ops': ['all'], 'splitting_ops': None, 'compile_mm_encoder': True, 'use_inductor': None, 'compile_sizes': None, 'inductor_compile_config': {'enable_auto_functionalized_v2': False}, 'inductor_passes': {}, 'cudagraph_mode': , 'use_cudagraph': True, 'cudagraph_num_of_warmups': 0, 'cudagraph_capture_sizes': None, 'cudagraph_copy_inputs': False, 'full_cuda_graph': False, 'cudagraph_specialize_lora': True, 'use_inductor_graph_partition': False, 'pass_config': {}, 'max_cudagraph_capture_size': 1024, 'local_cache_dir': None} +(EngineCore_DP0 pid=2993997) WARNING 11-13 00:09:43 [tpu_jax.py:228] Pin memory is not supported on TPU. +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +(EngineCore_DP0 pid=2993997) INFO 11-13 00:09:48 [parallel_state.py:1325] rank 0 in world size 1 is assigned as DP rank 0, PP rank 0, TP rank 0, EP rank 0 +(EngineCore_DP0 pid=2993997) INFO 11-13 00:09:48 [tpu_jax_runner.py:278] Creating new model mesh | devices=8, num_slices=1 +(EngineCore_DP0 pid=2993997) INFO 11-13 00:09:48 [tpu_jax_runner.py:273] Init mesh | mesh=Mesh('data': 1, 'attn_dp': 2, 'expert': 1, 'model': 4, axis_types=(Auto, Auto, Auto, Auto)) +(EngineCore_DP0 pid=2993997) INFO 11-13 00:09:48 [utils.py:314] Phased-based profiler enabled. Traces will be saved to: gs://wenxindong-vm/trace/gpt_oss/dp2/attn_dp +(EngineCore_DP0 pid=2993997) INFO 11-13 00:09:48 [utils.py:93] Prepared token paddings: [16, 32, 64, 128, 256, 512, 1024, 2048, 4096, 8192, 16384] +(EngineCore_DP0 pid=2993997) INFO 11-13 00:09:48 [utils.py:59] Prepared request paddings: [8, 16, 32, 64, 128, 256, 512] +(EngineCore_DP0 pid=2993997) INFO 11-13 00:09:48 [compilation_manager.py:34] Enabling JAX compile cache. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:09:48 [tpu_worker_jax.py:152] Init worker | rank=0 | node_id=0 | is_driver_worker=True | hbm=[(0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75)]GiB +(EngineCore_DP0 pid=2993997) INFO 11-13 00:09:48 [model_loader.py:318] Loading model with MODEL_IMPL_TYPE=vllm +(EngineCore_DP0 pid=2993997) WARNING 11-13 00:09:49 [rocm.py:34] Failed to import from amdsmi with ModuleNotFoundError("No module named 'amdsmi'") +(EngineCore_DP0 pid=2993997) WARNING 11-13 00:09:49 [rocm.py:39] Failed to import from vllm._C with ModuleNotFoundError("No module named 'vllm._C'") +(EngineCore_DP0 pid=2993997) WARNING 11-13 00:09:49 [rocm.py:45] Failed to import from vllm._rocm_C with ModuleNotFoundError("No module named 'vllm._rocm_C'") +(EngineCore_DP0 pid=2993997) WARNING 11-13 00:09:49 [registry.py:171] _Backend has been renamed to AttentionBackendEnum. Please update your code to use AttentionBackendEnum instead. _Backend will be removed in a future release. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:09:49 [tpu_jax.py:63] Cannot use None backend on TPU. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:09:49 [tpu_jax.py:66] Using Pallas V1 backend. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:09:49 [layer.py:331] Disabling MoE shared_experts cuda stream +(EngineCore_DP0 pid=2993997) Loading safetensors checkpoint shards: 0% Completed | 0/73 [00:00 {'num_tokens': 16} +(EngineCore_DP0 pid=2993997) /mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torchax/tensor.py:154: UserWarning: Explicitly requested dtype int64 requested in astype is not available, and will be truncated to dtype int32. To enable more dtypes, set the jax_enable_x64 configuration option or the JAX_ENABLE_X64 shell environment variable. See https://github.com/jax-ml/jax#current-gotchas for more. +(EngineCore_DP0 pid=2993997) res = jax_function(self._elem, *args, **kwargs) +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) INFO 11-13 00:11:33 [compilation_manager.py:67] Compilation finished in 11.81 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:11:33 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 32} +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) INFO 11-13 00:11:45 [compilation_manager.py:67] Compilation finished in 12.65 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:11:45 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 64} +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) INFO 11-13 00:12:03 [compilation_manager.py:67] Compilation finished in 17.07 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:12:03 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 128} +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) INFO 11-13 00:12:21 [compilation_manager.py:67] Compilation finished in 18.33 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:12:21 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 256} +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) INFO 11-13 00:12:41 [compilation_manager.py:67] Compilation finished in 19.49 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:12:41 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 512} +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) INFO 11-13 00:13:06 [compilation_manager.py:67] Compilation finished in 25.35 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:13:06 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 1024} +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) INFO 11-13 00:13:31 [compilation_manager.py:67] Compilation finished in 24.97 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:13:31 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 2048} +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) INFO 11-13 00:14:05 [compilation_manager.py:67] Compilation finished in 33.67 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:14:05 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 4096} +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) INFO 11-13 00:14:42 [compilation_manager.py:67] Compilation finished in 36.63 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:14:42 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 8192} +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) INFO 11-13 00:15:19 [compilation_manager.py:67] Compilation finished in 37.42 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:15:19 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 16384} +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:19] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:19] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:17 [compilation_manager.py:67] Compilation finished in 57.90 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:17 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 8} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:17 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:17 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 16} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:18 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:18 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 32} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:18 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:18 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 64} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:18 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:18 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 128} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:18 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:18 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 256} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:18 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:18 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 512} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:18 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:18 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 8} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:18 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:18 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 16} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:19 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:19 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 32} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:19 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:19 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 64} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:19 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:19 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 128} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:19 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:19 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 256} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:19 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:19 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 512} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:19 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:19 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 8} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:19 [compilation_manager.py:67] Compilation finished in 0.16 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:19 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 16} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:20 [compilation_manager.py:67] Compilation finished in 0.16 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 32} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:20 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 64} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:20 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 128} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:20 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 256} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:20 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 512} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:20 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 8} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:20 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 16} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:21 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:21 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 32} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:21 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:21 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 64} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:21 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:21 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 128} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:21 [compilation_manager.py:67] Compilation finished in 0.16 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:21 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 256} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:21 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:21 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 512} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:22 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:22 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 8} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:22 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:22 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 16} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:22 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:22 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 32} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:22 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:22 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 64} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:22 [compilation_manager.py:67] Compilation finished in 0.23 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:22 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 128} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:22 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:22 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 256} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:23 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:23 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 512} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:23 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:23 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 8} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:23 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:23 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 16} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:23 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:23 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 32} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:23 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:23 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 64} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:24 [compilation_manager.py:67] Compilation finished in 0.21 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:24 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 128} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:24 [compilation_manager.py:67] Compilation finished in 0.32 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:24 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 256} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:24 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:24 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 512} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:24 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:24 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 8} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:24 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:24 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 16} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:25 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:25 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 32} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:25 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:25 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 64} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:25 [compilation_manager.py:67] Compilation finished in 0.22 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:25 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 128} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:25 [compilation_manager.py:67] Compilation finished in 0.31 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:25 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 256} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:26 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:26 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 512} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:26 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:26 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 8} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:26 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:26 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 16} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:26 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:26 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 32} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:26 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:26 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 64} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:27 [compilation_manager.py:67] Compilation finished in 0.22 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:27 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 128} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:27 [compilation_manager.py:67] Compilation finished in 0.30 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:27 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 256} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:27 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:27 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 512} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:27 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:27 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 8} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:27 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:27 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 16} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:28 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:28 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 32} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:28 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:28 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 64} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:28 [compilation_manager.py:67] Compilation finished in 0.22 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:28 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 128} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:28 [compilation_manager.py:67] Compilation finished in 0.30 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:28 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 256} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:28 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:28 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 512} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:29 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:29 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 8} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:29 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:29 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 16} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:29 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:29 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 32} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:29 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:29 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 64} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:29 [compilation_manager.py:67] Compilation finished in 0.23 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:29 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 128} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:30 [compilation_manager.py:67] Compilation finished in 0.32 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:30 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 256} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:30 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:30 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 512} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:30 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:30 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 8} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:30 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:30 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 16} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:31 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:31 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 32} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:31 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:31 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 64} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:31 [compilation_manager.py:67] Compilation finished in 0.22 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:31 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 128} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:31 [compilation_manager.py:67] Compilation finished in 0.30 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:31 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 256} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:31 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:31 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 512} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:32 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:32 [compilation_manager.py:325] Compiling select_from_array with different input shapes. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:32 [compilation_manager.py:304] Compiling select_from_array for select all logits. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:32 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16, 'index_size': 8} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:32 [compilation_manager.py:67] Compilation finished in 0.08 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:32 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16, 'index_size': 16} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:32 [compilation_manager.py:67] Compilation finished in 0.09 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:32 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 32, 'index_size': 8} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:32 [compilation_manager.py:67] Compilation finished in 0.09 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:32 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 32, 'index_size': 16} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:32 [compilation_manager.py:67] Compilation finished in 0.09 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:32 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 32, 'index_size': 32} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:32 [compilation_manager.py:67] Compilation finished in 0.10 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:32 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 64, 'index_size': 8} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:33 [compilation_manager.py:67] Compilation finished in 0.09 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:33 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 64, 'index_size': 16} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:33 [compilation_manager.py:67] Compilation finished in 0.10 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:33 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 64, 'index_size': 32} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:33 [compilation_manager.py:67] Compilation finished in 0.11 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:33 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 64, 'index_size': 64} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:33 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:33 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 8} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:33 [compilation_manager.py:67] Compilation finished in 0.09 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:33 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 16} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:33 [compilation_manager.py:67] Compilation finished in 0.10 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:33 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 32} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:33 [compilation_manager.py:67] Compilation finished in 0.11 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:33 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 64} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:34 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:34 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 128} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:34 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:34 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 8} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:34 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:34 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 16} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:34 [compilation_manager.py:67] Compilation finished in 0.11 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:34 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 32} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:34 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:34 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 64} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:34 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:34 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 128} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:35 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:35 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 256} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:35 [compilation_manager.py:67] Compilation finished in 0.30 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:35 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 8} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:35 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:35 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 16} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:35 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:35 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 32} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:35 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:35 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 64} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:36 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:36 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 128} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:36 [compilation_manager.py:67] Compilation finished in 0.22 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:36 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 256} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:36 [compilation_manager.py:67] Compilation finished in 0.38 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:36 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 512} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:37 [compilation_manager.py:67] Compilation finished in 0.71 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:37 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 8} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:37 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:37 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 16} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:38 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:38 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 32} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:38 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:38 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 64} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:38 [compilation_manager.py:67] Compilation finished in 0.22 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:38 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 128} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:38 [compilation_manager.py:67] Compilation finished in 0.27 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:38 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 256} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:39 [compilation_manager.py:67] Compilation finished in 0.38 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:39 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 512} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:39 [compilation_manager.py:67] Compilation finished in 0.64 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:39 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 8} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:40 [compilation_manager.py:67] Compilation finished in 0.26 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:40 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 16} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:40 [compilation_manager.py:67] Compilation finished in 0.26 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:40 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 32} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:40 [compilation_manager.py:67] Compilation finished in 0.28 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:40 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 64} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:41 [compilation_manager.py:67] Compilation finished in 0.31 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:41 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 128} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:41 [compilation_manager.py:67] Compilation finished in 0.35 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:41 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 256} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:41 [compilation_manager.py:67] Compilation finished in 0.54 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:41 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 512} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:42 [compilation_manager.py:67] Compilation finished in 0.78 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:42 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 8} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:43 [compilation_manager.py:67] Compilation finished in 0.49 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:43 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 16} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:43 [compilation_manager.py:67] Compilation finished in 0.46 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:43 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 32} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:44 [compilation_manager.py:67] Compilation finished in 0.47 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:44 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 64} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:45 [compilation_manager.py:67] Compilation finished in 0.80 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:45 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 128} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:45 [compilation_manager.py:67] Compilation finished in 0.59 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:45 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 256} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:46 [compilation_manager.py:67] Compilation finished in 0.78 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:46 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 512} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:47 [compilation_manager.py:67] Compilation finished in 0.99 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:47 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 8} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:47 [compilation_manager.py:67] Compilation finished in 0.16 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:47 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 16} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:48 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:48 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 32} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:48 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:48 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 64} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:48 [compilation_manager.py:67] Compilation finished in 0.16 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:48 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 128} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:48 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:48 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 256} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:49 [compilation_manager.py:67] Compilation finished in 0.40 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:49 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 512} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:49 [compilation_manager.py:67] Compilation finished in 0.69 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:49 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 8} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:50 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:50 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 16} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:50 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:50 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 32} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:50 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:50 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 64} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:50 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:50 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 128} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:50 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:50 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 256} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:50 [compilation_manager.py:67] Compilation finished in 0.34 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:50 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 512} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:51 [compilation_manager.py:67] Compilation finished in 0.59 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:51 [compilation_manager.py:365] Compiling compute_logits with different input shapes. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:51 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 8} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:52 [compilation_manager.py:67] Compilation finished in 1.01 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:52 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 16} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:53 [compilation_manager.py:67] Compilation finished in 1.10 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:53 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 32} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:54 [compilation_manager.py:67] Compilation finished in 1.00 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:54 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 64} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:55 [compilation_manager.py:67] Compilation finished in 0.94 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:55 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 128} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:56 [compilation_manager.py:67] Compilation finished in 1.02 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:56 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 256} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:58 [compilation_manager.py:67] Compilation finished in 1.72 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:58 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 512} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:00 [compilation_manager.py:67] Compilation finished in 2.15 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:00 [compilation_manager.py:387] Compiling sampling with different input shapes. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:01 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 8, 'do_sampling': True} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:04 [compilation_manager.py:67] Compilation finished in 3.50 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:04 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 8, 'do_sampling': False} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:04 [compilation_manager.py:67] Compilation finished in 0.24 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:05 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 16, 'do_sampling': True} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:08 [compilation_manager.py:67] Compilation finished in 3.43 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:08 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 16, 'do_sampling': False} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:09 [compilation_manager.py:67] Compilation finished in 0.22 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:09 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 32, 'do_sampling': True} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:12 [compilation_manager.py:67] Compilation finished in 2.58 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:12 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 32, 'do_sampling': False} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:12 [compilation_manager.py:67] Compilation finished in 0.38 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:13 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 64, 'do_sampling': True} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:16 [compilation_manager.py:67] Compilation finished in 3.50 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:16 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 64, 'do_sampling': False} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:17 [compilation_manager.py:67] Compilation finished in 0.77 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:18 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 128, 'do_sampling': True} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:22 [compilation_manager.py:67] Compilation finished in 3.94 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:22 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 128, 'do_sampling': False} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:27 [compilation_manager.py:67] Compilation finished in 5.03 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:27 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 256, 'do_sampling': True} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:30 [compilation_manager.py:67] Compilation finished in 3.08 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:30 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 256, 'do_sampling': False} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:30 [compilation_manager.py:67] Compilation finished in 0.27 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:30 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 512, 'do_sampling': True} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:33 [compilation_manager.py:67] Compilation finished in 2.88 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:33 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 512, 'do_sampling': False} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:34 [compilation_manager.py:67] Compilation finished in 0.43 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:34 [compilation_manager.py:455] Compiling gather_logprobs with different input shapes. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:34 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 8} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:34 [compilation_manager.py:67] Compilation finished in 0.75 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:34 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 16} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:35 [compilation_manager.py:67] Compilation finished in 0.70 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:35 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 32} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:37 [compilation_manager.py:67] Compilation finished in 1.98 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:37 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 64} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:39 [compilation_manager.py:67] Compilation finished in 2.00 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:39 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 128} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:41 [compilation_manager.py:67] Compilation finished in 1.93 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:41 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 256} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:43 [compilation_manager.py:67] Compilation finished in 2.01 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:43 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 512} +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:45 [compilation_manager.py:67] Compilation finished in 1.96 [secs]. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:45 [compilation_manager.py:751] Compiling structured_decoding with different input shapes. +(EngineCore_DP0 pid=2993997) WARNING 11-13 00:17:45 [compilation_manager.py:754] Structured decoding precompilation skipped since structured decoding is not supported with DP. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:45 [core.py:247] init engine (profile, create kv cache, warmup model) took 388.63 seconds +(EngineCore_DP0 pid=2993997) WARNING 11-13 00:17:46 [scheduler.py:158] Using custom scheduler class . This scheduler interface is not public and compatibility may not be maintained. +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:46 [dp_scheduler.py:93] DPScheduler (Async = True) per-rank limits: max_seqs=256, max_tokens=8192 +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:46 [core.py:181] Batch queue is enabled with size 2 +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:46 [tpu_jax.py:118] Initialized sharding configuration: ShardingConfigManager(total_devices=8, sharding_strategy=ShardingStrategy(tensor_parallelism=4, expert_parallelism=1, sequence_parallelism=1, data_parallelism=1, attention_data_parallelism=2), device_indexes=None) +(EngineCore_DP0 pid=2993997) WARNING 11-13 00:17:46 [tpu_jax.py:156] The model dtype is not properly set for JAX backend. Overwriting it to jnp.bfloat16 +(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:46 [tpu_jax.py:192] Force using UniProcExecutor for JAX on single host. +(APIServer pid=2993839) [INFO] model_hosting_container_standards - decorators.py:76: [PING] Framework handler registered: ping +(APIServer pid=2993839) [2025-11-13 00:17:47] INFO decorators.py:76: [PING] Framework handler registered: ping +(APIServer pid=2993839) [INFO] model_hosting_container_standards.common.transforms.base_factory - base_factory.py:90: [INJECT_ADAPTER_ID] Transform decorator applied to: invocations +(APIServer pid=2993839) [2025-11-13 00:17:47] INFO base_factory.py:90: [INJECT_ADAPTER_ID] Transform decorator applied to: invocations +(APIServer pid=2993839) [INFO] model_hosting_container_standards.common.transforms.base_factory - base_factory.py:115: [INJECT_ADAPTER_ID] Registered transform handler for invocations +(APIServer pid=2993839) [2025-11-13 00:17:47] INFO base_factory.py:115: [INJECT_ADAPTER_ID] Registered transform handler for invocations +(APIServer pid=2993839) [INFO] model_hosting_container_standards.common.transforms.base_factory - base_factory.py:90: [STATEFUL_SESSION_MANAGER] Transform decorator applied to: decorated_func +(APIServer pid=2993839) [2025-11-13 00:17:47] INFO base_factory.py:90: [STATEFUL_SESSION_MANAGER] Transform decorator applied to: decorated_func +(APIServer pid=2993839) [INFO] model_hosting_container_standards.common.transforms.base_factory - base_factory.py:115: [STATEFUL_SESSION_MANAGER] Registered transform handler for decorated_func +(APIServer pid=2993839) [2025-11-13 00:17:47] INFO base_factory.py:115: [STATEFUL_SESSION_MANAGER] Registered transform handler for decorated_func +(APIServer pid=2993839) [INFO] model_hosting_container_standards - decorators.py:76: [INVOKE] Framework handler registered: decorated_func +(APIServer pid=2993839) [2025-11-13 00:17:47] INFO decorators.py:76: [INVOKE] Framework handler registered: decorated_func +(APIServer pid=2993839) [INFO] model_hosting_container_standards - __init__.py:127: Starting SageMaker bootstrap process +(APIServer pid=2993839) [2025-11-13 00:17:47] INFO __init__.py:127: Starting SageMaker bootstrap process +(APIServer pid=2993839) [INFO] model_hosting_container_standards - registry.py:109: [REGISTRY] Middleware resolution and registration complete +(APIServer pid=2993839) [2025-11-13 00:17:47] INFO registry.py:109: [REGISTRY] Middleware resolution and registration complete +(APIServer pid=2993839) [INFO] model_hosting_container_standards - core.py:100: [MIDDLEWARE_LOADER] Middleware stack rebuilt successfully +(APIServer pid=2993839) [2025-11-13 00:17:47] INFO core.py:100: [MIDDLEWARE_LOADER] Middleware stack rebuilt successfully +(APIServer pid=2993839) [INFO] model_hosting_container_standards - core.py:102: [MIDDLEWARE_LOADER] Processed 3 middlewares +(APIServer pid=2993839) [2025-11-13 00:17:47] INFO core.py:102: [MIDDLEWARE_LOADER] Processed 3 middlewares +(APIServer pid=2993839) [WARNING] model_hosting_container_standards.common.custom_code_ref_resolver.function_loader - function_loader.py:73: Failed to load function from spec 'model:custom_sagemaker_invocation_handler': HandlerFileNotFoundError: File '/opt/ml/model/model.py' not found in search paths: ['/opt/ml/model/'] +(APIServer pid=2993839) [2025-11-13 00:17:47] WARNING function_loader.py:73: Failed to load function from spec 'model:custom_sagemaker_invocation_handler': HandlerFileNotFoundError: File '/opt/ml/model/model.py' not found in search paths: ['/opt/ml/model/'] +(APIServer pid=2993839) [WARNING] model_hosting_container_standards.common.custom_code_ref_resolver.function_loader - function_loader.py:73: Failed to load function from spec 'model:custom_sagemaker_ping_handler': HandlerFileNotFoundError: File '/opt/ml/model/model.py' not found in search paths: ['/opt/ml/model/'] +(APIServer pid=2993839) [2025-11-13 00:17:47] WARNING function_loader.py:73: Failed to load function from spec 'model:custom_sagemaker_ping_handler': HandlerFileNotFoundError: File '/opt/ml/model/model.py' not found in search paths: ['/opt/ml/model/'] +(APIServer pid=2993839) [INFO] model_hosting_container_standards.sagemaker.sagemaker_router - sagemaker_router.py:93: Creating SageMaker router with unified route resolver +(APIServer pid=2993839) [2025-11-13 00:17:47] INFO sagemaker_router.py:93: Creating SageMaker router with unified route resolver +(APIServer pid=2993839) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:172: Creating router with prefix='', tags=['sagemaker'] +(APIServer pid=2993839) [2025-11-13 00:17:47] INFO routing.py:172: Creating router with prefix='', tags=['sagemaker'] +(APIServer pid=2993839) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:110: Mounting 2 handlers to router +(APIServer pid=2993839) [2025-11-13 00:17:47] INFO routing.py:110: Mounting 2 handlers to router +(APIServer pid=2993839) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:184: Router created with 0 routes +(APIServer pid=2993839) [2025-11-13 00:17:47] INFO routing.py:184: Router created with 0 routes +(APIServer pid=2993839) [INFO] model_hosting_container_standards.sagemaker.sagemaker_router - sagemaker_router.py:101: SageMaker router created successfully with 0 routes +(APIServer pid=2993839) [2025-11-13 00:17:47] INFO sagemaker_router.py:101: SageMaker router created successfully with 0 routes +(APIServer pid=2993839) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:287: Including router with conflict detection +(APIServer pid=2993839) [2025-11-13 00:17:47] INFO routing.py:287: Including router with conflict detection +(APIServer pid=2993839) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:305: Successfully included router with 0 routes +(APIServer pid=2993839) [2025-11-13 00:17:47] INFO routing.py:305: Successfully included router with 0 routes +(APIServer pid=2993839) [INFO] model_hosting_container_standards - __init__.py:139: SageMaker bootstrap completed successfully +(APIServer pid=2993839) [2025-11-13 00:17:47] INFO __init__.py:139: SageMaker bootstrap completed successfully +(APIServer pid=2993839) INFO 11-13 00:17:47 [api_server.py:1662] Supported tasks: ['generate'] +(APIServer pid=2993839) WARNING 11-13 00:17:47 [serving_responses.py:189] For gpt-oss, we ignore --enable-auto-tool-choice and always enable tool use. +(APIServer pid=2993839) INFO 11-13 00:17:47 [api_server.py:1972] Starting vLLM API server 0 on http://0.0.0.0:8000 +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:38] Available routes are: +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /openapi.json, Methods: GET, HEAD +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /docs, Methods: GET, HEAD +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /docs/oauth2-redirect, Methods: GET, HEAD +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /redoc, Methods: GET, HEAD +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /health, Methods: GET +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /load, Methods: GET +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /tokenize, Methods: POST +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /detokenize, Methods: POST +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /v1/models, Methods: GET +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /version, Methods: GET +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /v1/responses, Methods: POST +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /v1/responses/{response_id}, Methods: GET +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /v1/responses/{response_id}/cancel, Methods: POST +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /v1/messages, Methods: POST +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /v1/chat/completions, Methods: POST +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /v1/completions, Methods: POST +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /v1/embeddings, Methods: POST +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /pooling, Methods: POST +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /classify, Methods: POST +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /score, Methods: POST +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /v1/score, Methods: POST +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /v1/audio/transcriptions, Methods: POST +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /v1/audio/translations, Methods: POST +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /rerank, Methods: POST +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /v1/rerank, Methods: POST +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /v2/rerank, Methods: POST +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /scale_elastic_ep, Methods: POST +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /is_scaling_elastic_ep, Methods: POST +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /ping, Methods: GET +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /ping, Methods: POST +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /invocations, Methods: POST +(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /metrics, Methods: GET +(APIServer pid=2993839) INFO: Started server process [2993839] +(APIServer pid=2993839) INFO: Waiting for application startup. +(APIServer pid=2993839) INFO: Application startup complete. +(APIServer pid=2993839) INFO: 127.0.0.1:36276 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO 11-13 01:08:57 [loggers.py:221] Engine 000: Avg prompt throughput: 204.8 tokens/s, Avg generation throughput: 0.3 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.0%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:09:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 40.6 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.0%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:09:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 40.6 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.0%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:09:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 40.6 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.0%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:09:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 40.5 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:09:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 40.5 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:09:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 40.3 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:10:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 40.4 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:10:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 40.4 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:10:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 40.4 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:10:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 40.4 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:10:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 40.4 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:10:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 40.4 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:11:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 40.4 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:11:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 40.4 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:11:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 40.4 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% +(EngineCore_DP0 pid=2993997) WARNING 11-13 01:11:29 [tpu_jax_runner.py:666] Should not schedule a request that does nothing! +(APIServer pid=2993839) INFO: 127.0.0.1:36276 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54022 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54036 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54038 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54042 - "POST /v1/completions HTTP/1.1" 200 OK +(EngineCore_DP0 pid=2993997) INFO 11-13 01:11:30 [utils.py:358] Starting profiling for prefill_heavy phase +(EngineCore_DP0 pid=2993997) INFO 11-13 01:11:30 [utils.py:359] Batch composition stats: {'total_num_scheduled_tokens': 6144, 'num_prefill_tokens': 8192, 'num_decode_tokens': 1, 'padded_total_num_scheduled_tokens': 16384, 'num_reqs': 5} +(APIServer pid=2993839) INFO: 127.0.0.1:54052 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54060 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54062 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54064 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54068 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54076 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54088 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54094 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54104 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54116 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54124 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54138 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54142 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54156 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54172 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54176 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54188 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54190 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54192 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54200 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54210 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54220 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54232 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54246 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54252 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54254 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54258 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54272 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54274 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54288 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54302 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54312 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54316 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54332 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54342 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54354 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54358 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54374 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54378 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54390 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54406 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54418 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54434 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54448 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54456 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54470 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54474 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54490 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54502 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54518 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54534 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54536 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54542 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54558 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54560 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54570 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54574 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54582 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54594 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54602 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54610 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54622 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54632 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54646 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54658 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54672 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54686 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54702 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54704 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54708 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54718 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54726 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54740 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54754 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54760 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54768 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54784 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54796 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54798 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54810 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54814 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54822 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54838 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54850 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54862 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54874 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54878 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54890 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54906 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54912 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54928 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54940 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54948 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54964 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54978 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54980 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54986 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54988 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:54992 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55000 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55004 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55018 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55034 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55048 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55050 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55066 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55072 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55082 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55098 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55104 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55108 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55112 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55120 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55128 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55140 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55150 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55156 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55160 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55162 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55176 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55186 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55196 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55200 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55210 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55226 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55230 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55240 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55252 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55262 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55278 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55280 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55296 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55302 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55308 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55314 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55324 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55330 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55340 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55348 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55350 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55362 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55378 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55390 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55402 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55414 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55424 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55440 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55452 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55458 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55470 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55480 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55484 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55490 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55500 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55516 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55518 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55532 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55546 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55554 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55568 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55584 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55586 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55598 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55614 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55616 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55620 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55628 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55632 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55640 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55656 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55660 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55676 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55678 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55682 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55692 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55694 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55696 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55708 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55714 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55720 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55726 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55736 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55746 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55760 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55764 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55780 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55788 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55798 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55800 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55814 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55818 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55832 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55834 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55840 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55846 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55862 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55868 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55876 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55890 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55906 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55914 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55920 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55932 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55944 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55956 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55970 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55972 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55978 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:55992 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56008 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56010 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56022 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56036 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56044 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56058 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56068 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56070 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56076 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56080 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56096 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56108 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56114 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56130 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56146 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56160 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56172 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56186 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56192 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56202 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56216 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56222 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56234 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56238 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56240 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56254 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56258 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56262 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56272 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56286 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56296 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56304 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56306 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56320 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56334 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56340 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56356 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56368 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56378 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56390 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56400 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56406 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56416 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56420 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56426 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56430 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56442 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56454 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56456 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56472 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56488 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56498 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56500 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56504 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56512 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56526 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56542 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56548 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56558 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56568 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56576 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56578 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56594 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56600 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56602 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56610 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56620 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56630 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56640 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56642 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56654 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56666 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56676 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56684 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56692 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56700 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56716 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56724 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56736 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56750 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56754 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56766 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56776 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56784 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56790 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56794 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56796 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56800 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56812 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56820 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56828 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56840 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56846 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56858 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56874 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56890 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56896 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56910 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56924 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56938 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56946 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56948 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56952 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56960 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56968 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56970 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56974 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56990 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:56994 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57002 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57016 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57020 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57034 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57050 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57056 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57070 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57076 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57088 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57092 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57098 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57114 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57122 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57134 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57142 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57148 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57154 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57168 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57180 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57188 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57196 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57212 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57214 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57216 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57232 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57246 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57254 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57268 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57276 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57278 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57286 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57300 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57316 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57330 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57334 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57342 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57356 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57368 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57372 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57388 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57396 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57398 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57402 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57410 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57424 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57434 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57444 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57450 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57464 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57466 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57474 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57482 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57490 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57494 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57510 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57526 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57538 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57540 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57544 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57554 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57558 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57572 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57580 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57592 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57596 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57612 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57622 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57626 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57638 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57654 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57662 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57676 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57682 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57684 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57688 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57702 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57708 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57716 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57720 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57734 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57746 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57758 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57766 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57776 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57788 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57802 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57808 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57824 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57828 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57836 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57852 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57860 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57868 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57878 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57882 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57892 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57904 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57920 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57926 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57936 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57942 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57944 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57946 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57958 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57962 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57972 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57982 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57986 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57988 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:57998 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58006 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58010 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58022 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58038 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58050 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58054 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58068 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58070 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58074 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58084 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58100 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58102 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58110 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58116 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58120 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58124 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58138 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58140 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58150 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58154 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58170 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58184 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58186 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58188 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58196 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58204 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58206 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58214 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58216 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58224 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58234 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58248 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58256 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58268 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58278 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58292 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58298 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58312 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58314 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58320 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58334 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58338 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58348 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58364 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58370 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58372 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58388 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58402 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58418 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58424 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58428 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58442 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58454 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58466 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58482 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58494 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58510 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58518 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58520 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58534 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58550 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58554 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58562 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58576 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58580 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58582 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58592 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58594 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58606 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58608 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58618 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58622 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58636 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58652 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58660 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58668 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58674 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58684 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58696 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58710 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58724 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58734 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58748 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58760 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58762 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58766 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58776 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58786 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58798 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58802 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58804 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58806 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58812 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58826 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58828 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58830 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58842 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58846 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58854 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58868 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58874 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58890 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58900 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58914 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58922 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58924 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58932 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58934 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58940 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58948 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58950 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58952 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58964 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58972 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58974 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58980 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:58992 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59008 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59012 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59028 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59034 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59046 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59054 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59062 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59064 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59070 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59074 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59084 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59090 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59098 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59102 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59108 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59110 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59122 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59130 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59140 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59144 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59154 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59166 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59176 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59182 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59188 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59200 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59210 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59220 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59232 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59244 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59258 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59262 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59276 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59280 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59286 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59302 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59314 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59318 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59322 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59328 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59342 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59350 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59354 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59356 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59360 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59364 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59374 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59382 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59388 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59394 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59396 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59406 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59416 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59422 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59426 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59430 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59446 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59458 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59468 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59478 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59490 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59498 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59502 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59510 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59518 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59526 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59542 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59552 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59554 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59558 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59574 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59584 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59590 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59596 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59608 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59616 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59630 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59634 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59646 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59660 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59674 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59686 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59694 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59702 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59710 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59722 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59724 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59726 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59740 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59754 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59758 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59774 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59784 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59788 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59804 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59806 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59818 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59820 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59822 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59832 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59840 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59854 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59868 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59874 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59876 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59878 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59892 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59896 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59910 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59918 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59928 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59944 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59950 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59954 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59968 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59970 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59984 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:59986 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60000 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60006 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60018 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60030 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60040 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60054 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60056 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60068 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60082 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60092 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60100 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60108 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60122 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60134 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60140 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60146 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60162 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60168 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60176 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60178 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60192 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60200 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60204 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60216 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60218 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60224 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60236 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60248 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60250 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60252 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60254 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60268 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60276 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60290 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60302 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60314 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60324 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60338 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60342 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60348 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60352 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60368 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60380 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60392 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60406 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60408 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60412 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60414 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60422 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60434 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60438 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60446 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60452 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60456 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60472 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60474 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60476 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60480 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60492 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60500 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60508 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60518 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60524 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60536 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60550 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60558 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60568 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60582 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60584 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60596 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60606 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60612 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60618 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60628 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60630 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60638 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60646 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60656 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60670 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60684 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60692 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60708 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60712 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60718 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60722 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60730 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60736 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60752 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60762 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60778 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60788 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60790 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60804 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60808 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60816 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60820 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60830 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60832 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60842 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60846 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60862 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60872 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60878 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60888 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60890 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60898 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60904 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60920 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60924 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60934 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60946 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60960 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60972 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60984 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:60990 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:32770 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:32774 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:32776 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:32784 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:32794 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:32802 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:32818 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:32822 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:32834 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:32848 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:32856 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:32868 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:32872 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:32882 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:32896 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:32908 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:32914 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:32920 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:32934 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:32942 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:32958 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:32960 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:32968 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:32972 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:32980 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:32996 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33010 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33012 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33018 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33024 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33040 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33048 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33058 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33072 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33082 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33088 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33102 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33112 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33122 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33126 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33142 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33152 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33154 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33162 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33178 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33188 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33194 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33202 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33218 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33234 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33244 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33256 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33264 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33278 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33290 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33294 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33310 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33320 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33326 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33338 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33348 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33354 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33356 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33358 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33362 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33378 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33380 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33382 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33398 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33406 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33408 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33418 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33422 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33438 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33440 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33452 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33462 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33478 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33490 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33494 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33508 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33512 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33522 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33538 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33548 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33560 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33566 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33572 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33580 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33590 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33592 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33598 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33602 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33618 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33634 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33642 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33644 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33648 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33662 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33676 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33686 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33690 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33692 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33694 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33700 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33702 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33716 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33728 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33744 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33748 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33764 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33770 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33776 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33784 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33794 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33802 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33812 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33816 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33820 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33834 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33848 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33852 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33862 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33878 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33886 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33888 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33892 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33894 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33902 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33908 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33912 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33914 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33916 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33922 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33934 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33950 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33952 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33954 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33964 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33968 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33976 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33980 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33984 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:33996 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34004 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34012 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34024 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34032 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34042 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34054 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34062 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34076 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34080 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34090 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34092 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34096 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34106 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34110 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34120 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34126 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34132 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34142 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34148 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34164 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34170 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34178 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34194 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34198 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34202 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34216 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34232 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34244 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34260 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34272 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34288 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34302 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34312 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34326 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34330 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34336 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34338 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34346 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34362 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34368 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34370 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34372 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34382 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34390 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34392 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34406 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34416 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34426 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34442 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34458 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34464 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34480 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34490 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34500 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34508 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34516 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34526 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34530 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34544 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34556 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34558 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34568 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34578 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34584 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34598 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34614 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34622 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34632 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34646 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34652 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34666 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34676 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34682 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34694 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34706 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34714 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34722 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34732 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34742 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34750 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34764 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34780 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34794 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34806 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34812 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34818 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34824 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34828 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34834 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34846 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34862 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34874 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34876 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34890 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34892 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34908 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO: 127.0.0.1:34916 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=2993839) INFO 11-13 01:11:37 [loggers.py:221] Engine 000: Avg prompt throughput: 3891.0 tokens/s, Avg generation throughput: 11.9 tokens/s, Running: 29 reqs, Waiting: 995 reqs, GPU KV cache usage: 0.9%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:11:47 [loggers.py:221] Engine 000: Avg prompt throughput: 1638.3 tokens/s, Avg generation throughput: 2.7 tokens/s, Running: 37 reqs, Waiting: 987 reqs, GPU KV cache usage: 1.2%, Prefix cache hit rate: 0.0% +(EngineCore_DP0 pid=2993997) INFO 11-13 01:11:56 [utils.py:397] Profiling for prefill_heavy phase finished +(APIServer pid=2993839) INFO 11-13 01:11:57 [loggers.py:221] Engine 000: Avg prompt throughput: 3276.6 tokens/s, Avg generation throughput: 7.8 tokens/s, Running: 53 reqs, Waiting: 971 reqs, GPU KV cache usage: 1.7%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:12:07 [loggers.py:221] Engine 000: Avg prompt throughput: 18023.0 tokens/s, Avg generation throughput: 100.1 tokens/s, Running: 141 reqs, Waiting: 883 reqs, GPU KV cache usage: 4.5%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:12:17 [loggers.py:221] Engine 000: Avg prompt throughput: 18023.9 tokens/s, Avg generation throughput: 196.9 tokens/s, Running: 229 reqs, Waiting: 795 reqs, GPU KV cache usage: 7.3%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:12:27 [loggers.py:221] Engine 000: Avg prompt throughput: 17611.2 tokens/s, Avg generation throughput: 292.4 tokens/s, Running: 315 reqs, Waiting: 709 reqs, GPU KV cache usage: 10.1%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:12:37 [loggers.py:221] Engine 000: Avg prompt throughput: 17613.0 tokens/s, Avg generation throughput: 387.5 tokens/s, Running: 401 reqs, Waiting: 623 reqs, GPU KV cache usage: 12.8%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:12:47 [loggers.py:221] Engine 000: Avg prompt throughput: 17612.1 tokens/s, Avg generation throughput: 481.9 tokens/s, Running: 487 reqs, Waiting: 537 reqs, GPU KV cache usage: 15.6%, Prefix cache hit rate: 0.0% +(EngineCore_DP0 pid=2993997) INFO 11-13 01:12:50 [utils.py:358] Starting profiling for decode_heavy phase +(EngineCore_DP0 pid=2993997) INFO 11-13 01:12:50 [utils.py:359] Batch composition stats: {'total_num_scheduled_tokens': 256, 'num_prefill_tokens': 0, 'num_decode_tokens': 512, 'padded_total_num_scheduled_tokens': 512, 'num_reqs': 512} +(APIServer pid=2993839) INFO 11-13 01:12:57 [loggers.py:221] Engine 000: Avg prompt throughput: 7168.2 tokens/s, Avg generation throughput: 454.8 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 16.4%, Prefix cache hit rate: 0.0% +(EngineCore_DP0 pid=2993997) INFO 11-13 01:13:06 [utils.py:397] Profiling for decode_heavy phase finished +(APIServer pid=2993839) INFO 11-13 01:13:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 716.5 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 16.4%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:13:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6073.4 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 16.4%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:13:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6194.0 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 18.3%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:13:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6092.7 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 18.3%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:13:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6090.0 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 19.7%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:13:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6143.8 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 20.1%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:14:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6091.2 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 21.0%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:14:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6141.7 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 21.9%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:14:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6144.2 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 22.4%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:14:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6194.4 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 23.7%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:14:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6193.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 23.8%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:14:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6193.5 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 25.6%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:15:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6141.7 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 25.6%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:15:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6192.7 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 27.4%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:15:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6142.4 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 27.4%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:15:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6141.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 29.2%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:15:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6143.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 29.2%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:15:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5631.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 31.0%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:16:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 4709.1 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 31.0%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:16:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 4659.3 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 31.0%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:16:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5373.2 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 32.9%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:16:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5528.3 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 32.9%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:16:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5528.2 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 34.5%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:16:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5478.4 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 34.7%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:17:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5528.1 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 35.2%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:17:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5579.0 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 36.5%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:17:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5577.8 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 36.5%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:17:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5478.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 38.3%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:17:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5476.8 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 38.3%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:17:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5527.4 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 39.6%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:18:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5476.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 40.2%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:18:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5528.3 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 40.3%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:18:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5476.7 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 42.0%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:18:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5477.0 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 42.0%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:18:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5478.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 43.8%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:18:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5477.3 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 43.8%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:19:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5478.3 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 44.6%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:19:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5477.1 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 45.6%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:19:28 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5425.5 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 45.6%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:19:38 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5478.0 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 47.5%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:19:48 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5427.0 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 47.5%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:19:58 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5425.7 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 48.8%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:20:08 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5425.4 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 49.3%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:20:18 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5375.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 49.4%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:20:28 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5425.4 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 51.1%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:20:38 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5425.4 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 51.1%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:20:48 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5426.1 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 52.9%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:20:58 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5376.1 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 53.0%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:21:08 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5425.9 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 53.5%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:21:18 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5375.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 54.8%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:21:28 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5427.2 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 54.8%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:21:38 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5424.0 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 56.6%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:21:48 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5376.1 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 56.6%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:21:58 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5323.3 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 57.5%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:22:08 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5375.9 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 58.4%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:22:18 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5424.8 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 58.4%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:22:28 [loggers.py:221] Engine 000: Avg prompt throughput: 13310.5 tokens/s, Avg generation throughput: 1066.2 tokens/s, Running: 504 reqs, Waiting: 437 reqs, GPU KV cache usage: 51.3%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:22:38 [loggers.py:221] Engine 000: Avg prompt throughput: 15564.4 tokens/s, Avg generation throughput: 500.0 tokens/s, Running: 500 reqs, Waiting: 361 reqs, GPU KV cache usage: 44.6%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:22:48 [loggers.py:221] Engine 000: Avg prompt throughput: 17611.5 tokens/s, Avg generation throughput: 547.0 tokens/s, Running: 498 reqs, Waiting: 275 reqs, GPU KV cache usage: 37.3%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:22:58 [loggers.py:221] Engine 000: Avg prompt throughput: 17612.2 tokens/s, Avg generation throughput: 546.3 tokens/s, Running: 498 reqs, Waiting: 189 reqs, GPU KV cache usage: 30.3%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:23:08 [loggers.py:221] Engine 000: Avg prompt throughput: 17612.0 tokens/s, Avg generation throughput: 545.2 tokens/s, Running: 496 reqs, Waiting: 105 reqs, GPU KV cache usage: 23.2%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:23:18 [loggers.py:221] Engine 000: Avg prompt throughput: 17202.6 tokens/s, Avg generation throughput: 544.4 tokens/s, Running: 496 reqs, Waiting: 19 reqs, GPU KV cache usage: 16.1%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:23:28 [loggers.py:221] Engine 000: Avg prompt throughput: 5937.7 tokens/s, Avg generation throughput: 4500.8 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 16.4%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:23:38 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6142.3 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 16.8%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:23:48 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6092.3 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 18.3%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:23:58 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6092.8 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 18.3%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:24:08 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6142.5 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 20.1%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:24:18 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6092.0 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 20.1%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:24:28 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6141.4 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 21.9%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:24:38 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6091.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 21.9%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:24:48 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6193.5 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 23.7%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:24:58 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6142.5 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 23.7%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:25:08 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6193.2 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 25.6%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:25:18 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6142.4 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 25.6%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:25:28 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6143.8 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 27.0%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:25:38 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6193.6 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 27.4%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:25:48 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6143.8 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 28.4%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:25:58 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6143.8 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 29.2%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:26:08 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6092.7 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 29.8%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:26:18 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 4914.9 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 31.0%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:26:28 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 4709.2 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 31.0%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:26:38 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 4863.7 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 32.4%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:26:48 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5580.5 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 32.9%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:26:58 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5528.0 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 33.1%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:27:08 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5478.3 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 34.7%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:27:18 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5529.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 34.7%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:27:28 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5529.3 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 36.5%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:27:38 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5578.2 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 36.5%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:27:48 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5528.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 37.5%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:27:58 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5427.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 38.3%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:28:08 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5527.8 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 38.3%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:28:18 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5478.0 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 40.2%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:28:28 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5529.3 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 40.2%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:28:38 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5478.8 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 41.8%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:28:48 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5477.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 42.0%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:28:58 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5427.5 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 42.5%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:29:08 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5478.3 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 43.8%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:29:18 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5478.4 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 43.8%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:29:28 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5427.4 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 45.6%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:29:38 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5426.7 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 45.6%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:29:48 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5476.5 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 46.7%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:29:58 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5427.3 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 47.5%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:30:08 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5427.2 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 47.5%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:30:18 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5424.8 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 49.3%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:30:28 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5376.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 49.3%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:30:38 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5375.7 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 50.8%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:30:48 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5427.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 51.1%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:30:58 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5374.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 51.4%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:31:08 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5374.6 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 53.0%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:31:18 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5375.7 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 53.0%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:31:28 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5376.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 54.8%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:31:38 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5324.7 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 54.8%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:31:48 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5427.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 55.4%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:31:58 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5306.3 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 56.6%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:32:08 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5374.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 56.6%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:32:18 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5374.5 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 58.4%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:32:28 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5323.0 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 58.4%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:32:38 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 4980.3 tokens/s, Running: 231 reqs, Waiting: 0 reqs, GPU KV cache usage: 26.4%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:32:48 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 353.6 tokens/s, Running: 0 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.0%, Prefix cache hit rate: 0.0% +(APIServer pid=2993839) INFO 11-13 01:32:58 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 0.0 tokens/s, Running: 0 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.0%, Prefix cache hit rate: 0.0% diff --git a/oss_log_baseline.txt b/oss_log_baseline.txt new file mode 100644 index 000000000..d5b06e0f6 --- /dev/null +++ b/oss_log_baseline.txt @@ -0,0 +1,2410 @@ +INFO 11-12 01:19:42 [__init__.py:26] TPU info: node_name=cuiq-infer-v7-2 | tpu_type=tpu7x-8 | worker_id=0 | num_chips=8 | num_cores_per_chip=2 +INFO 11-12 01:19:43 [importing.py:44] Triton is installed but 0 active driver(s) found (expected 1). Disabling Triton to prevent runtime errors. +INFO 11-12 01:19:43 [importing.py:68] Triton not installed or not compatible; certain GPU-related functions will not be available. +WARNING 11-12 01:19:43 [interface.py:197] Failed to import from vllm._C: ModuleNotFoundError("No module named 'vllm._C'") +(APIServer pid=1953096) INFO 11-12 01:19:44 [api_server.py:1897] vLLM API server version 0.11.1rc7.dev48+gdf4d3a44a +(APIServer pid=1953096) INFO 11-12 01:19:44 [utils.py:253] non-default args: {'model_tag': 'unsloth/gpt-oss-120b-BF16', 'model': 'unsloth/gpt-oss-120b-BF16', 'max_model_len': 8192, 'download_dir': '/mnt/disks/persist', 'tensor_parallel_size': 4, 'gpu_memory_utilization': 0.98, 'enable_prefix_caching': False, 'max_num_batched_tokens': 8192, 'max_num_seqs': 256, 'async_scheduling': True} +(APIServer pid=1953096) INFO 11-12 01:19:44 [model.py:630] Resolved architecture: GptOssForCausalLM +(APIServer pid=1953096) INFO 11-12 01:19:44 [model.py:1728] Using max model len 8192 +(APIServer pid=1953096) INFO 11-12 01:19:44 [scheduler.py:254] Chunked prefill is enabled with max_num_batched_tokens=8192. +(APIServer pid=1953096) INFO 11-12 01:19:44 [config.py:272] Overriding max cuda graph capture size to 1024 for performance. +(APIServer pid=1953096) INFO 11-12 01:19:44 [tpu_jax.py:118] Initialized sharding configuration: ShardingConfigManager(total_devices=4, sharding_strategy=ShardingStrategy(tensor_parallelism=4, expert_parallelism=1, sequence_parallelism=1, data_parallelism=1, attention_data_parallelism=1), device_indexes=None) +(APIServer pid=1953096) WARNING 11-12 01:19:44 [tpu_jax.py:156] The model dtype is not properly set for JAX backend. Overwriting it to jnp.bfloat16 +(APIServer pid=1953096) INFO 11-12 01:19:44 [tpu_jax.py:192] Force using UniProcExecutor for JAX on single host. +INFO 11-12 01:19:48 [__init__.py:26] TPU info: node_name=cuiq-infer-v7-2 | tpu_type=tpu7x-8 | worker_id=0 | num_chips=8 | num_cores_per_chip=2 +INFO 11-12 01:19:49 [importing.py:44] Triton is installed but 0 active driver(s) found (expected 1). Disabling Triton to prevent runtime errors. +INFO 11-12 01:19:49 [importing.py:68] Triton not installed or not compatible; certain GPU-related functions will not be available. +WARNING 11-12 01:19:49 [interface.py:197] Failed to import from vllm._C: ModuleNotFoundError("No module named 'vllm._C'") +(EngineCore_DP0 pid=1953269) INFO 11-12 01:19:49 [core.py:94] Initializing a V1 LLM engine (v0.11.1rc7.dev48+gdf4d3a44a) with config: model='unsloth/gpt-oss-120b-BF16', speculative_config=None, tokenizer='unsloth/gpt-oss-120b-BF16', skip_tokenizer_init=False, tokenizer_mode=auto, revision=None, tokenizer_revision=None, trust_remote_code=False, dtype=torch.bfloat16, max_seq_len=8192, download_dir='/mnt/disks/persist', load_format=auto, tensor_parallel_size=4, pipeline_parallel_size=1, data_parallel_size=1, disable_custom_all_reduce=True, quantization=None, enforce_eager=False, kv_cache_dtype=auto, device_config=None, structured_outputs_config=StructuredOutputsConfig(backend='auto', disable_fallback=False, disable_any_whitespace=False, disable_additional_properties=False, reasoning_parser='openai_gptoss', reasoning_parser_plugin='', enable_in_reasoning=False), observability_config=ObservabilityConfig(show_hidden_metrics_for_version=None, otlp_traces_endpoint=None, collect_detailed_traces=None), seed=0, served_model_name=unsloth/gpt-oss-120b-BF16, enable_prefix_caching=False, chunked_prefill_enabled=True, pooler_config=None, compilation_config={'level': None, 'mode': 2, 'debug_dump_path': None, 'cache_dir': '', 'compile_cache_save_format': 'binary', 'backend': 'openxla', 'custom_ops': ['all'], 'splitting_ops': None, 'compile_mm_encoder': True, 'use_inductor': None, 'compile_sizes': None, 'inductor_compile_config': {'enable_auto_functionalized_v2': False}, 'inductor_passes': {}, 'cudagraph_mode': , 'use_cudagraph': True, 'cudagraph_num_of_warmups': 0, 'cudagraph_capture_sizes': None, 'cudagraph_copy_inputs': False, 'full_cuda_graph': False, 'cudagraph_specialize_lora': True, 'use_inductor_graph_partition': False, 'pass_config': {}, 'max_cudagraph_capture_size': 1024, 'local_cache_dir': None} +(EngineCore_DP0 pid=1953269) WARNING 11-12 01:19:50 [tpu_jax.py:228] Pin memory is not supported on TPU. +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +(EngineCore_DP0 pid=1953269) INFO 11-12 01:19:55 [parallel_state.py:1325] rank 0 in world size 1 is assigned as DP rank 0, PP rank 0, TP rank 0, EP rank 0 +(EngineCore_DP0 pid=1953269) INFO 11-12 01:19:55 [tpu_jax_runner.py:273] Init mesh | mesh=Mesh('data': 1, 'model': 4, axis_types=(Auto, Auto)) +(EngineCore_DP0 pid=1953269) INFO 11-12 01:19:55 [utils.py:93] Prepared token paddings: [16, 32, 64, 128, 256, 512, 1024, 2048, 4096, 8192] +(EngineCore_DP0 pid=1953269) INFO 11-12 01:19:55 [utils.py:59] Prepared request paddings: [8, 16, 32, 64, 128, 256] +(EngineCore_DP0 pid=1953269) INFO 11-12 01:19:55 [compilation_manager.py:34] Enabling JAX compile cache. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:19:55 [tpu_worker_jax.py:152] Init worker | rank=0 | node_id=0 | is_driver_worker=True | hbm=[(0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75)]GiB +(EngineCore_DP0 pid=1953269) INFO 11-12 01:19:55 [model_loader.py:318] Loading model with MODEL_IMPL_TYPE=vllm +(EngineCore_DP0 pid=1953269) WARNING 11-12 01:19:56 [rocm.py:34] Failed to import from amdsmi with ModuleNotFoundError("No module named 'amdsmi'") +(EngineCore_DP0 pid=1953269) WARNING 11-12 01:19:56 [rocm.py:39] Failed to import from vllm._C with ModuleNotFoundError("No module named 'vllm._C'") +(EngineCore_DP0 pid=1953269) WARNING 11-12 01:19:56 [rocm.py:45] Failed to import from vllm._rocm_C with ModuleNotFoundError("No module named 'vllm._rocm_C'") +(EngineCore_DP0 pid=1953269) WARNING 11-12 01:19:56 [registry.py:171] _Backend has been renamed to AttentionBackendEnum. Please update your code to use AttentionBackendEnum instead. _Backend will be removed in a future release. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:19:56 [tpu_jax.py:63] Cannot use None backend on TPU. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:19:56 [tpu_jax.py:66] Using Pallas V1 backend. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:19:56 [layer.py:331] Disabling MoE shared_experts cuda stream +(EngineCore_DP0 pid=1953269) Loading safetensors checkpoint shards: 0% Completed | 0/73 [00:00 {'num_tokens': 16} +(EngineCore_DP0 pid=1953269) /mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torchax/tensor.py:154: UserWarning: Explicitly requested dtype int64 requested in astype is not available, and will be truncated to dtype int32. To enable more dtypes, set the jax_enable_x64 configuration option or the JAX_ENABLE_X64 shell environment variable. See https://github.com/jax-ml/jax#current-gotchas for more. +(EngineCore_DP0 pid=1953269) res = jax_function(self._elem, *args, **kwargs) +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) INFO 11-12 01:21:35 [compilation_manager.py:67] Compilation finished in 9.54 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:21:35 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 32} +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:35] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:35] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:35] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) INFO 11-12 01:21:45 [compilation_manager.py:67] Compilation finished in 9.92 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:21:45 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 64} +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) INFO 11-12 01:21:59 [compilation_manager.py:67] Compilation finished in 14.04 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:21:59 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 128} +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) INFO 11-12 01:22:14 [compilation_manager.py:67] Compilation finished in 14.97 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:22:14 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 256} +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) INFO 11-12 01:22:29 [compilation_manager.py:67] Compilation finished in 15.32 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:22:29 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 512} +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:29] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) INFO 11-12 01:22:48 [compilation_manager.py:67] Compilation finished in 18.31 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:22:48 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 1024} +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) INFO 11-12 01:23:04 [compilation_manager.py:67] Compilation finished in 16.58 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:23:04 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 2048} +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) INFO 11-12 01:23:25 [compilation_manager.py:67] Compilation finished in 20.68 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:23:25 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 4096} +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:25] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:25] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:25] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) INFO 11-12 01:23:48 [compilation_manager.py:67] Compilation finished in 23.21 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:23:48 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 8192} +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:16 [compilation_manager.py:67] Compilation finished in 27.73 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:16 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 8} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:16 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:16 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 16} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:16 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:16 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 32} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:17 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:17 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 64} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:17 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:17 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 128} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:17 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:17 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 256} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:17 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:17 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 8} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:17 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:17 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 16} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:17 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:17 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 32} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:17 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:17 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 64} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:17 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:17 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 128} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:18 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:18 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 256} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:18 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:18 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 8} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:18 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:18 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 16} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:18 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:18 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 32} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:18 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:18 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 64} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:18 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:18 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 128} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:18 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:18 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 256} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:19 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:19 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 8} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:19 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:19 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 16} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:19 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:19 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 32} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:19 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:19 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 64} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:19 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:19 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 128} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:19 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:19 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 256} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:19 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:19 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 8} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:20 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 16} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:20 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 32} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:20 [compilation_manager.py:67] Compilation finished in 0.22 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 64} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:20 [compilation_manager.py:67] Compilation finished in 0.16 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 128} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:20 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 256} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:20 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 8} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:21 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:21 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 16} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:21 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:21 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 32} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:21 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:21 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 64} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:21 [compilation_manager.py:67] Compilation finished in 0.29 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:21 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 128} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:21 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:21 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 256} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:22 [compilation_manager.py:67] Compilation finished in 0.16 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:22 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 8} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:22 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:22 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 16} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:22 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:22 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 32} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:22 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:22 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 64} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:22 [compilation_manager.py:67] Compilation finished in 0.30 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:22 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 128} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:23 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:23 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 256} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:23 [compilation_manager.py:67] Compilation finished in 0.16 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:23 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 8} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:23 [compilation_manager.py:67] Compilation finished in 0.26 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:23 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 16} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:23 [compilation_manager.py:67] Compilation finished in 0.26 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:23 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 32} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:24 [compilation_manager.py:67] Compilation finished in 0.30 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:24 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 64} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:24 [compilation_manager.py:67] Compilation finished in 0.39 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:24 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 128} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:24 [compilation_manager.py:67] Compilation finished in 0.24 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:24 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 256} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:25 [compilation_manager.py:67] Compilation finished in 0.24 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:25 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 8} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:25 [compilation_manager.py:67] Compilation finished in 0.25 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:25 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 16} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:25 [compilation_manager.py:67] Compilation finished in 0.27 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:25 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 32} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:25 [compilation_manager.py:67] Compilation finished in 0.29 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:25 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 64} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:26 [compilation_manager.py:67] Compilation finished in 0.37 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:26 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 128} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:26 [compilation_manager.py:67] Compilation finished in 0.25 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:26 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 256} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:26 [compilation_manager.py:67] Compilation finished in 0.26 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:26 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 8} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:26 [compilation_manager.py:67] Compilation finished in 0.25 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:26 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 16} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:27 [compilation_manager.py:67] Compilation finished in 0.26 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:27 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 32} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:27 [compilation_manager.py:67] Compilation finished in 0.29 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:27 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 64} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:27 [compilation_manager.py:67] Compilation finished in 0.37 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:27 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 128} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:28 [compilation_manager.py:67] Compilation finished in 0.24 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:28 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 256} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:28 [compilation_manager.py:67] Compilation finished in 0.23 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:28 [compilation_manager.py:325] Compiling select_from_array with different input shapes. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:28 [compilation_manager.py:304] Compiling select_from_array for select all logits. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:28 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16, 'index_size': 8} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:28 [compilation_manager.py:67] Compilation finished in 0.09 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:28 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16, 'index_size': 16} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:28 [compilation_manager.py:67] Compilation finished in 0.10 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:28 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 32, 'index_size': 8} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:28 [compilation_manager.py:67] Compilation finished in 0.09 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:28 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 32, 'index_size': 16} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:28 [compilation_manager.py:67] Compilation finished in 0.11 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:28 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 32, 'index_size': 32} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:29 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:29 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 64, 'index_size': 8} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:29 [compilation_manager.py:67] Compilation finished in 0.10 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:29 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 64, 'index_size': 16} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:29 [compilation_manager.py:67] Compilation finished in 0.11 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:29 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 64, 'index_size': 32} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:29 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:29 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 64, 'index_size': 64} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:29 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:29 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 8} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:29 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:29 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 16} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:29 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:29 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 32} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:30 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:30 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 64} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:30 [compilation_manager.py:67] Compilation finished in 0.21 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:30 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 128} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:30 [compilation_manager.py:67] Compilation finished in 0.33 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:30 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 8} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:30 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:30 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 16} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:30 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:30 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 32} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:31 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:31 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 64} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:31 [compilation_manager.py:67] Compilation finished in 0.23 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:31 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 128} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:31 [compilation_manager.py:67] Compilation finished in 0.33 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:31 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 256} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:32 [compilation_manager.py:67] Compilation finished in 0.55 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:32 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 8} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:32 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:32 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 16} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:32 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:32 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 32} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:32 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:32 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 64} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:33 [compilation_manager.py:67] Compilation finished in 0.26 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:33 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 128} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:33 [compilation_manager.py:67] Compilation finished in 0.53 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:33 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 256} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:34 [compilation_manager.py:67] Compilation finished in 0.76 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:34 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 8} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:34 [compilation_manager.py:67] Compilation finished in 0.38 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:34 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 16} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:35 [compilation_manager.py:67] Compilation finished in 0.33 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:35 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 32} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:35 [compilation_manager.py:67] Compilation finished in 0.33 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:35 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 64} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:35 [compilation_manager.py:67] Compilation finished in 0.35 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:35 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 128} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:36 [compilation_manager.py:67] Compilation finished in 0.57 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:36 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 256} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:37 [compilation_manager.py:67] Compilation finished in 0.80 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:37 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 8} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:37 [compilation_manager.py:67] Compilation finished in 0.52 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:37 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 16} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:38 [compilation_manager.py:67] Compilation finished in 0.50 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:38 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 32} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:38 [compilation_manager.py:67] Compilation finished in 0.49 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:38 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 64} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:39 [compilation_manager.py:67] Compilation finished in 0.53 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:39 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 128} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:40 [compilation_manager.py:67] Compilation finished in 0.78 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:40 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 256} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:41 [compilation_manager.py:67] Compilation finished in 0.99 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:41 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 8} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:41 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:41 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 16} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:41 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:41 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 32} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:41 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:41 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 64} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:41 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:41 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 128} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:42 [compilation_manager.py:67] Compilation finished in 0.38 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:42 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 256} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:42 [compilation_manager.py:67] Compilation finished in 0.62 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:42 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 8} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:43 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:43 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 16} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:43 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:43 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 32} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:43 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:43 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 64} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:43 [compilation_manager.py:67] Compilation finished in 0.21 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:43 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 128} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:43 [compilation_manager.py:67] Compilation finished in 0.33 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:43 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 256} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:44 [compilation_manager.py:67] Compilation finished in 0.58 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:44 [compilation_manager.py:365] Compiling compute_logits with different input shapes. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:44 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 8} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:44 [compilation_manager.py:67] Compilation finished in 0.27 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:44 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 16} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:45 [compilation_manager.py:67] Compilation finished in 0.65 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:45 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 32} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:45 [compilation_manager.py:67] Compilation finished in 0.31 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:45 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 64} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:46 [compilation_manager.py:67] Compilation finished in 0.39 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:46 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 128} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:47 [compilation_manager.py:67] Compilation finished in 1.34 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:47 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 256} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:48 [compilation_manager.py:67] Compilation finished in 1.22 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:48 [compilation_manager.py:387] Compiling sampling with different input shapes. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:49 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 8, 'do_sampling': True} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:52 [compilation_manager.py:67] Compilation finished in 3.23 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:52 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 8, 'do_sampling': False} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:52 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:52 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 16, 'do_sampling': True} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:55 [compilation_manager.py:67] Compilation finished in 2.43 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:55 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 16, 'do_sampling': False} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:55 [compilation_manager.py:67] Compilation finished in 0.35 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:55 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 32, 'do_sampling': True} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:59 [compilation_manager.py:67] Compilation finished in 3.38 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:59 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 32, 'do_sampling': False} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:59 [compilation_manager.py:67] Compilation finished in 0.57 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:00 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 64, 'do_sampling': True} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:04 [compilation_manager.py:67] Compilation finished in 3.76 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:04 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 64, 'do_sampling': False} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:09 [compilation_manager.py:67] Compilation finished in 5.32 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:09 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 128, 'do_sampling': True} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:12 [compilation_manager.py:67] Compilation finished in 2.75 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:12 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 128, 'do_sampling': False} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:12 [compilation_manager.py:67] Compilation finished in 0.26 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:12 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 256, 'do_sampling': True} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:15 [compilation_manager.py:67] Compilation finished in 2.96 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:15 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 256, 'do_sampling': False} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:16 [compilation_manager.py:67] Compilation finished in 0.30 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:16 [compilation_manager.py:455] Compiling gather_logprobs with different input shapes. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:16 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 8} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:16 [compilation_manager.py:67] Compilation finished in 0.72 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:16 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 16} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:17 [compilation_manager.py:67] Compilation finished in 0.71 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:17 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 32} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:19 [compilation_manager.py:67] Compilation finished in 1.83 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:19 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 64} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:21 [compilation_manager.py:67] Compilation finished in 1.77 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:21 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 128} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:23 [compilation_manager.py:67] Compilation finished in 1.97 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:23 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 256} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:25 [compilation_manager.py:67] Compilation finished in 1.84 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:25 [compilation_manager.py:751] Compiling structured_decoding with different input shapes. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:25 [compilation_manager.py:57] Precompile structured_decode --> {'num_reqs': 8} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:26 [compilation_manager.py:67] Compilation finished in 1.86 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:26 [compilation_manager.py:57] Precompile structured_decode --> {'num_reqs': 16} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:28 [compilation_manager.py:67] Compilation finished in 1.82 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:28 [compilation_manager.py:57] Precompile structured_decode --> {'num_reqs': 32} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:30 [compilation_manager.py:67] Compilation finished in 1.81 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:30 [compilation_manager.py:57] Precompile structured_decode --> {'num_reqs': 64} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:32 [compilation_manager.py:67] Compilation finished in 1.46 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:32 [compilation_manager.py:57] Precompile structured_decode --> {'num_reqs': 128} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:33 [compilation_manager.py:67] Compilation finished in 1.24 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:33 [compilation_manager.py:57] Precompile structured_decode --> {'num_reqs': 256} +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:34 [compilation_manager.py:67] Compilation finished in 1.28 [secs]. +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:34 [core.py:247] init engine (profile, create kv cache, warmup model) took 252.55 seconds +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:35 [core.py:181] Batch queue is enabled with size 2 +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:35 [tpu_jax.py:118] Initialized sharding configuration: ShardingConfigManager(total_devices=4, sharding_strategy=ShardingStrategy(tensor_parallelism=4, expert_parallelism=1, sequence_parallelism=1, data_parallelism=1, attention_data_parallelism=1), device_indexes=None) +(EngineCore_DP0 pid=1953269) WARNING 11-12 01:25:35 [tpu_jax.py:156] The model dtype is not properly set for JAX backend. Overwriting it to jnp.bfloat16 +(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:35 [tpu_jax.py:192] Force using UniProcExecutor for JAX on single host. +(APIServer pid=1953096) [INFO] model_hosting_container_standards - decorators.py:76: [PING] Framework handler registered: ping +(APIServer pid=1953096) [2025-11-12 01:25:36] INFO decorators.py:76: [PING] Framework handler registered: ping +(APIServer pid=1953096) [INFO] model_hosting_container_standards.common.transforms.base_factory - base_factory.py:90: [INJECT_ADAPTER_ID] Transform decorator applied to: invocations +(APIServer pid=1953096) [2025-11-12 01:25:36] INFO base_factory.py:90: [INJECT_ADAPTER_ID] Transform decorator applied to: invocations +(APIServer pid=1953096) [INFO] model_hosting_container_standards.common.transforms.base_factory - base_factory.py:115: [INJECT_ADAPTER_ID] Registered transform handler for invocations +(APIServer pid=1953096) [2025-11-12 01:25:36] INFO base_factory.py:115: [INJECT_ADAPTER_ID] Registered transform handler for invocations +(APIServer pid=1953096) [INFO] model_hosting_container_standards.common.transforms.base_factory - base_factory.py:90: [STATEFUL_SESSION_MANAGER] Transform decorator applied to: decorated_func +(APIServer pid=1953096) [2025-11-12 01:25:36] INFO base_factory.py:90: [STATEFUL_SESSION_MANAGER] Transform decorator applied to: decorated_func +(APIServer pid=1953096) [INFO] model_hosting_container_standards.common.transforms.base_factory - base_factory.py:115: [STATEFUL_SESSION_MANAGER] Registered transform handler for decorated_func +(APIServer pid=1953096) [2025-11-12 01:25:36] INFO base_factory.py:115: [STATEFUL_SESSION_MANAGER] Registered transform handler for decorated_func +(APIServer pid=1953096) [INFO] model_hosting_container_standards - decorators.py:76: [INVOKE] Framework handler registered: decorated_func +(APIServer pid=1953096) [2025-11-12 01:25:36] INFO decorators.py:76: [INVOKE] Framework handler registered: decorated_func +(APIServer pid=1953096) [INFO] model_hosting_container_standards - __init__.py:127: Starting SageMaker bootstrap process +(APIServer pid=1953096) [2025-11-12 01:25:36] INFO __init__.py:127: Starting SageMaker bootstrap process +(APIServer pid=1953096) [INFO] model_hosting_container_standards - registry.py:109: [REGISTRY] Middleware resolution and registration complete +(APIServer pid=1953096) [2025-11-12 01:25:36] INFO registry.py:109: [REGISTRY] Middleware resolution and registration complete +(APIServer pid=1953096) [INFO] model_hosting_container_standards - core.py:100: [MIDDLEWARE_LOADER] Middleware stack rebuilt successfully +(APIServer pid=1953096) [2025-11-12 01:25:36] INFO core.py:100: [MIDDLEWARE_LOADER] Middleware stack rebuilt successfully +(APIServer pid=1953096) [INFO] model_hosting_container_standards - core.py:102: [MIDDLEWARE_LOADER] Processed 3 middlewares +(APIServer pid=1953096) [2025-11-12 01:25:36] INFO core.py:102: [MIDDLEWARE_LOADER] Processed 3 middlewares +(APIServer pid=1953096) [WARNING] model_hosting_container_standards.common.custom_code_ref_resolver.function_loader - function_loader.py:73: Failed to load function from spec 'model:custom_sagemaker_invocation_handler': HandlerFileNotFoundError: File '/opt/ml/model/model.py' not found in search paths: ['/opt/ml/model/'] +(APIServer pid=1953096) [2025-11-12 01:25:36] WARNING function_loader.py:73: Failed to load function from spec 'model:custom_sagemaker_invocation_handler': HandlerFileNotFoundError: File '/opt/ml/model/model.py' not found in search paths: ['/opt/ml/model/'] +(APIServer pid=1953096) [WARNING] model_hosting_container_standards.common.custom_code_ref_resolver.function_loader - function_loader.py:73: Failed to load function from spec 'model:custom_sagemaker_ping_handler': HandlerFileNotFoundError: File '/opt/ml/model/model.py' not found in search paths: ['/opt/ml/model/'] +(APIServer pid=1953096) [2025-11-12 01:25:36] WARNING function_loader.py:73: Failed to load function from spec 'model:custom_sagemaker_ping_handler': HandlerFileNotFoundError: File '/opt/ml/model/model.py' not found in search paths: ['/opt/ml/model/'] +(APIServer pid=1953096) [INFO] model_hosting_container_standards.sagemaker.sagemaker_router - sagemaker_router.py:93: Creating SageMaker router with unified route resolver +(APIServer pid=1953096) [2025-11-12 01:25:36] INFO sagemaker_router.py:93: Creating SageMaker router with unified route resolver +(APIServer pid=1953096) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:172: Creating router with prefix='', tags=['sagemaker'] +(APIServer pid=1953096) [2025-11-12 01:25:36] INFO routing.py:172: Creating router with prefix='', tags=['sagemaker'] +(APIServer pid=1953096) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:110: Mounting 2 handlers to router +(APIServer pid=1953096) [2025-11-12 01:25:36] INFO routing.py:110: Mounting 2 handlers to router +(APIServer pid=1953096) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:184: Router created with 0 routes +(APIServer pid=1953096) [2025-11-12 01:25:36] INFO routing.py:184: Router created with 0 routes +(APIServer pid=1953096) [INFO] model_hosting_container_standards.sagemaker.sagemaker_router - sagemaker_router.py:101: SageMaker router created successfully with 0 routes +(APIServer pid=1953096) [2025-11-12 01:25:36] INFO sagemaker_router.py:101: SageMaker router created successfully with 0 routes +(APIServer pid=1953096) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:287: Including router with conflict detection +(APIServer pid=1953096) [2025-11-12 01:25:36] INFO routing.py:287: Including router with conflict detection +(APIServer pid=1953096) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:305: Successfully included router with 0 routes +(APIServer pid=1953096) [2025-11-12 01:25:36] INFO routing.py:305: Successfully included router with 0 routes +(APIServer pid=1953096) [INFO] model_hosting_container_standards - __init__.py:139: SageMaker bootstrap completed successfully +(APIServer pid=1953096) [2025-11-12 01:25:36] INFO __init__.py:139: SageMaker bootstrap completed successfully +(APIServer pid=1953096) INFO 11-12 01:25:36 [api_server.py:1662] Supported tasks: ['generate'] +(APIServer pid=1953096) WARNING 11-12 01:25:36 [serving_responses.py:189] For gpt-oss, we ignore --enable-auto-tool-choice and always enable tool use. +(APIServer pid=1953096) INFO 11-12 01:25:36 [api_server.py:1972] Starting vLLM API server 0 on http://0.0.0.0:8000 +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:38] Available routes are: +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /openapi.json, Methods: GET, HEAD +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /docs, Methods: GET, HEAD +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /docs/oauth2-redirect, Methods: GET, HEAD +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /redoc, Methods: GET, HEAD +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /health, Methods: GET +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /load, Methods: GET +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /tokenize, Methods: POST +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /detokenize, Methods: POST +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /v1/models, Methods: GET +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /version, Methods: GET +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /v1/responses, Methods: POST +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /v1/responses/{response_id}, Methods: GET +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /v1/responses/{response_id}/cancel, Methods: POST +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /v1/messages, Methods: POST +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /v1/chat/completions, Methods: POST +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /v1/completions, Methods: POST +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /v1/embeddings, Methods: POST +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /pooling, Methods: POST +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /classify, Methods: POST +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /score, Methods: POST +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /v1/score, Methods: POST +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /v1/audio/transcriptions, Methods: POST +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /v1/audio/translations, Methods: POST +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /rerank, Methods: POST +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /v1/rerank, Methods: POST +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /v2/rerank, Methods: POST +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /scale_elastic_ep, Methods: POST +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /is_scaling_elastic_ep, Methods: POST +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /ping, Methods: GET +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /ping, Methods: POST +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /invocations, Methods: POST +(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /metrics, Methods: GET +(APIServer pid=1953096) INFO: Started server process [1953096] +(APIServer pid=1953096) INFO: Waiting for application startup. +(APIServer pid=1953096) INFO: Application startup complete. +(APIServer pid=1953096) INFO: 127.0.0.1:53822 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO 11-12 05:15:57 [loggers.py:221] Engine 000: Avg prompt throughput: 204.8 tokens/s, Avg generation throughput: 9.3 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:16:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 158.7 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.2%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:16:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 158.0 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.3%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:16:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 158.4 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.3%, Prefix cache hit rate: 0.0% +(EngineCore_DP0 pid=1953269) WARNING 11-12 05:16:35 [tpu_jax_runner.py:666] Should not schedule a request that does nothing! +(APIServer pid=1953096) INFO: 127.0.0.1:53822 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52668 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52674 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52678 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52680 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52682 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52690 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52692 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52706 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52710 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52712 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52714 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52718 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52734 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52736 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52740 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52750 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52764 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52774 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52786 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52788 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52798 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52802 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52814 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52828 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52838 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52840 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52848 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52864 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52876 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52880 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52884 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52892 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52900 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52912 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52916 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52922 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52928 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52940 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52952 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52954 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52966 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52982 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:52994 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53008 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53014 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53026 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53034 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53040 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53048 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53054 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53058 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53064 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53076 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53090 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53096 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53104 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53108 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53112 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53118 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53128 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53130 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53138 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53144 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53156 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53170 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53180 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53192 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53206 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53208 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53222 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53236 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53246 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53252 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53260 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53266 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53282 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53286 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53298 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53304 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53318 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53332 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53336 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53344 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53348 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53352 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53360 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53376 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53384 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53390 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53398 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53414 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53424 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53426 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53440 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53450 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53458 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53474 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53486 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53500 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53504 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53518 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53520 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53522 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53526 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53528 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53532 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53546 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53558 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53572 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53578 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53584 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53594 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53610 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53614 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53628 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53632 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53646 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53650 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53656 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53662 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53666 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53680 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53694 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53696 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53708 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53712 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53726 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53730 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53732 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53746 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53762 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53774 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53776 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53778 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53784 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53786 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53792 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53804 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53818 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53832 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53848 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53864 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53868 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53876 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53884 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53900 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53902 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53910 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53912 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53922 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53936 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53938 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53940 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53952 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53966 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53976 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:53990 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54002 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54006 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54012 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54020 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54022 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54026 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54038 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54048 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54056 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54070 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54074 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54084 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54086 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54094 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54108 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54114 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54116 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54126 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54134 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54144 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54148 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54160 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54164 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54180 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54190 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54204 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54218 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54224 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54230 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54242 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54256 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54260 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54276 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54286 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54296 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54312 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54316 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54332 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54342 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54344 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54360 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54362 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54364 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54370 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54378 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54388 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54396 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54398 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54412 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54416 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54420 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54434 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54442 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54452 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54464 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54480 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54482 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54494 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54502 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54518 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54534 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54544 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54548 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54560 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54564 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54568 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54572 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54576 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54582 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54584 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54590 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54592 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54602 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54610 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54624 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54628 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54634 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54638 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54648 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54664 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54672 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54678 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54688 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54702 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54708 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54720 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54732 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54734 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54750 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54762 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54770 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54776 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54786 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54788 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54800 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54814 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54820 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54830 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54842 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54844 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54852 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54860 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54874 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54882 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54884 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54888 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54896 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54912 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54926 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54934 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54948 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54958 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54970 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54986 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:54996 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55004 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55016 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55020 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55026 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55034 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55044 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55056 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55070 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55076 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55090 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55094 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55104 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55106 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55122 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55134 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55144 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55154 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55158 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55168 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55184 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55192 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55202 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55216 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55228 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55230 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55240 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55242 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55252 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55264 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55272 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55288 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55300 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55312 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55314 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55320 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55336 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55346 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55352 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55356 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55368 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55370 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55384 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55392 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55398 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55406 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55420 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55436 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55442 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55456 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55472 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55488 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55492 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55504 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55512 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55518 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55526 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55534 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55536 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55542 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55552 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55554 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55562 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55576 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55588 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55602 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55606 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55616 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55632 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55634 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55636 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55642 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55648 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55660 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55662 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55664 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55668 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55680 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55694 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55708 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55724 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55738 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55740 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55746 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55760 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55762 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55776 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55792 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55798 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55812 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55826 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55828 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55834 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55838 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55846 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55848 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55850 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55862 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55874 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55890 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55894 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55906 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55920 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55928 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55934 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55944 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55954 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55964 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55978 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55984 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:55998 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56006 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56014 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56022 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56032 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56046 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56056 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56058 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56074 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56086 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56094 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56096 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56102 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56104 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56118 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56134 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56140 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56156 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56160 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56172 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56176 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56184 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56200 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56206 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56212 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56224 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56238 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56252 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56254 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56260 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56270 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56282 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56292 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56300 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56302 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56312 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56326 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56332 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56346 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56360 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56364 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56374 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56376 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56382 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56388 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56392 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56402 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56416 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56420 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56430 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56440 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56444 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56460 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56474 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56484 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56488 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56504 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56506 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56512 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56524 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56534 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56542 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56554 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56560 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56566 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56578 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56584 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56600 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56614 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56626 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56630 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56642 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56654 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56666 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56676 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56684 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56700 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56712 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56724 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56734 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56738 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56752 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56766 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56776 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56786 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56802 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56804 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56810 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56822 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56832 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56834 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56838 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56854 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56858 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56872 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56876 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56892 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56898 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56904 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56912 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56922 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56926 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56930 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56932 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56942 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56944 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56960 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56974 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56990 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:56994 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57004 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57020 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57034 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57038 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57052 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57058 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57070 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57086 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57100 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57108 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57122 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57124 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57140 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57152 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57162 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57172 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57188 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57198 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57214 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57230 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57232 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57242 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57258 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57270 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57274 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57278 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57282 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57288 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57302 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57310 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57312 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57318 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57328 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57332 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57348 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57350 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57360 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57364 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57368 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57372 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57376 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57386 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57400 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57416 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57424 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57432 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57446 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57456 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57470 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57486 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57498 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57502 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57510 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57514 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57516 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57520 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57530 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57544 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57560 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57566 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57578 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57580 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57590 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57602 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57604 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57608 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57616 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57626 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57638 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57646 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57660 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57672 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57680 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57694 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57700 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57708 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57724 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57732 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57748 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57762 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57778 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57782 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57798 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57812 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57822 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57838 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57840 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57850 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57862 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57874 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57880 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57882 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57894 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57900 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57912 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57918 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57922 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57938 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57952 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57954 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57962 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57968 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:57984 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58000 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58006 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58008 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58020 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58022 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58036 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58040 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58046 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58050 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58052 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58054 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58060 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58076 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58092 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58096 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58100 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58112 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58118 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58134 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58140 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58146 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58162 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58168 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58182 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58186 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58190 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58204 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58218 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58220 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58230 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58244 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58248 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58262 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58276 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58280 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58290 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58302 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58310 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58324 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58332 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58336 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58352 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58354 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58362 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58374 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58386 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58388 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58402 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58408 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58414 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58430 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58434 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58448 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58452 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58466 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58480 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58492 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58498 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58500 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58512 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58528 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58542 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58554 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58556 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58568 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58570 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58574 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58576 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58586 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58594 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58602 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58606 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58612 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58620 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58634 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58636 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58652 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58654 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58670 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58684 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58688 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58692 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58700 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58716 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58722 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58724 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58740 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58744 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58758 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58770 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58780 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58794 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58808 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58820 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58822 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58824 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58836 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58844 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58852 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58854 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58860 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58872 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58880 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58890 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58896 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58906 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58920 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58936 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58948 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58958 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58972 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:58986 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59000 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59016 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59020 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59030 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59032 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59046 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59048 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59056 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59060 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59062 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59076 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59088 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59104 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59108 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59116 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59124 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59140 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59146 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59150 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59160 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59168 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59172 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59174 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59182 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59190 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59194 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59208 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59216 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59226 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59236 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59244 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59248 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59254 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59266 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59276 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59292 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59308 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59320 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59324 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59330 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59346 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59356 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59370 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59380 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59386 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59390 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59406 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59420 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59428 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59442 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59452 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59456 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59468 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59474 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59480 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59492 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59508 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59514 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59528 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59536 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59548 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59552 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59564 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59576 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59584 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59588 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59592 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59602 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59604 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59620 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59628 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59638 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59652 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59662 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59674 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59686 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59698 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59704 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59714 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59728 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59732 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59736 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59748 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59750 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59764 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59780 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59794 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59802 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59808 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59818 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59822 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59830 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59842 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59850 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59854 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59862 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59874 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59878 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59880 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59896 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59898 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59906 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59908 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59914 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59916 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59926 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59934 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59940 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59950 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59960 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59962 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59970 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59974 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59982 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59992 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:59994 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60004 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60012 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60022 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60024 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60038 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60044 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60046 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60054 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60062 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60070 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60080 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60090 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60102 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60112 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60128 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60144 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60158 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60174 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60184 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60194 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60196 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60200 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60208 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60212 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60222 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60238 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60252 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60254 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60270 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60280 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60292 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60308 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60318 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60326 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60336 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60346 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60348 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60364 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60378 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60394 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60404 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60414 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60430 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60438 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60440 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60452 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60460 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60464 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60466 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60474 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60488 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60490 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60496 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60508 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60512 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60526 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60530 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60540 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60550 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60560 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60566 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60578 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60584 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60596 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60606 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60610 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60620 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60636 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60640 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60650 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60662 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60664 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60668 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60670 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60678 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60680 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60696 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60704 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60716 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60726 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60740 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60744 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60752 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60760 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60766 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60768 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60782 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60794 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60802 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60810 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60812 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60828 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60834 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60842 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60846 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60858 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60862 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60872 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60876 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60882 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60898 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60908 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60918 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60924 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60930 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60936 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60950 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60958 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60968 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60972 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60988 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60992 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60996 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:60998 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32778 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32780 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32782 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32784 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32786 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32790 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32796 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32804 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32806 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32808 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32810 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32814 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32816 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32822 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32838 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32850 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32854 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32866 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32870 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32882 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32886 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32890 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32904 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32910 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32920 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32936 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32948 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32950 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32964 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32968 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32978 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32982 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:32986 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33002 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33008 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33020 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33022 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33026 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33038 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33042 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33054 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33064 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33070 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33072 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33084 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33096 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33104 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33114 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33130 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33146 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33162 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33166 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33182 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33188 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33198 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33202 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33208 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33218 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33230 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33244 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33252 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33264 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33280 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33292 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33294 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33306 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33308 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33324 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33332 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33344 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33350 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33364 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33372 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33384 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33398 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33402 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33418 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33430 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33442 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33450 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33464 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33470 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33480 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33484 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33500 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33504 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO: 127.0.0.1:33508 - "POST /v1/completions HTTP/1.1" 200 OK +(APIServer pid=1953096) INFO 11-12 05:16:37 [loggers.py:221] Engine 000: Avg prompt throughput: 1843.1 tokens/s, Avg generation throughput: 136.6 tokens/s, Running: 14 reqs, Waiting: 934 reqs, GPU KV cache usage: 1.5%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:16:47 [loggers.py:221] Engine 000: Avg prompt throughput: 18840.1 tokens/s, Avg generation throughput: 131.1 tokens/s, Running: 106 reqs, Waiting: 918 reqs, GPU KV cache usage: 11.4%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:16:57 [loggers.py:221] Engine 000: Avg prompt throughput: 17612.6 tokens/s, Avg generation throughput: 321.7 tokens/s, Running: 192 reqs, Waiting: 832 reqs, GPU KV cache usage: 20.8%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:17:07 [loggers.py:221] Engine 000: Avg prompt throughput: 14126.2 tokens/s, Avg generation throughput: 1760.0 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 27.8%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:17:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5988.9 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 30.9%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:17:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5962.8 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 34.0%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:17:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5962.9 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 36.4%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:17:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6040.2 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 38.6%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:17:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6142.1 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 40.9%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:18:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6116.8 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 43.3%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:18:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6065.3 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 46.4%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:18:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6065.5 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 49.5%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:18:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 4913.5 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 52.6%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:18:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 4299.5 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 55.6%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:18:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5477.0 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 56.7%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:19:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5453.0 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 58.7%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:19:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5502.4 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 61.8%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:19:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5399.9 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 64.9%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:19:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5427.0 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 68.0%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:19:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5425.6 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 70.9%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:19:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5349.1 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 71.7%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:20:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5375.0 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 74.2%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:20:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5350.5 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 77.3%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:20:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5349.1 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 80.4%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:20:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5349.3 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 83.5%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:20:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5246.3 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 85.0%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:20:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5297.8 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 86.6%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:21:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5248.1 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 89.7%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:21:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5246.7 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 92.7%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:21:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5247.0 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 95.8%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:21:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5195.4 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 97.4%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:21:47 [loggers.py:221] Engine 000: Avg prompt throughput: 204.7 tokens/s, Avg generation throughput: 5092.9 tokens/s, Running: 256 reqs, Waiting: 767 reqs, GPU KV cache usage: 98.6%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:21:57 [loggers.py:221] Engine 000: Avg prompt throughput: 14129.8 tokens/s, Avg generation throughput: 1116.0 tokens/s, Running: 250 reqs, Waiting: 693 reqs, GPU KV cache usage: 75.7%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:22:07 [loggers.py:221] Engine 000: Avg prompt throughput: 17612.2 tokens/s, Avg generation throughput: 546.6 tokens/s, Running: 249 reqs, Waiting: 607 reqs, GPU KV cache usage: 51.4%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:22:17 [loggers.py:221] Engine 000: Avg prompt throughput: 17408.1 tokens/s, Avg generation throughput: 544.8 tokens/s, Running: 248 reqs, Waiting: 522 reqs, GPU KV cache usage: 27.4%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:22:27 [loggers.py:221] Engine 000: Avg prompt throughput: 3071.2 tokens/s, Avg generation throughput: 5270.4 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 28.4%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:22:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5962.6 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 30.9%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:22:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5990.1 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 34.0%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:22:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6014.1 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 37.1%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:23:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6142.2 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 40.2%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:23:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6167.6 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 43.3%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:23:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6116.4 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 46.4%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:23:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6089.9 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 49.5%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:23:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5502.3 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 52.6%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:23:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 4247.6 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 52.8%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:24:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5401.6 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 55.7%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:24:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5527.8 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 58.7%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:24:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5604.8 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 61.8%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:24:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5554.2 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 64.9%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:24:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5502.5 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 67.7%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:24:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5528.0 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 68.9%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:25:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5425.7 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 71.1%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:25:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5477.0 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 74.2%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:25:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5425.6 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 77.3%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:25:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5400.1 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 80.4%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:25:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5400.2 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 83.0%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:25:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5323.3 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 83.8%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:26:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5348.6 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 86.6%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:26:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5348.7 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 89.7%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:26:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5299.0 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 92.7%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:26:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5323.7 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 95.8%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:26:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5246.2 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 96.8%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:26:57 [loggers.py:221] Engine 000: Avg prompt throughput: 204.7 tokens/s, Avg generation throughput: 5169.5 tokens/s, Running: 256 reqs, Waiting: 511 reqs, GPU KV cache usage: 98.6%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:27:07 [loggers.py:221] Engine 000: Avg prompt throughput: 13311.0 tokens/s, Avg generation throughput: 1297.2 tokens/s, Running: 252 reqs, Waiting: 442 reqs, GPU KV cache usage: 77.9%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:27:17 [loggers.py:221] Engine 000: Avg prompt throughput: 17406.3 tokens/s, Avg generation throughput: 552.5 tokens/s, Running: 252 reqs, Waiting: 356 reqs, GPU KV cache usage: 53.9%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:27:27 [loggers.py:221] Engine 000: Avg prompt throughput: 18226.7 tokens/s, Avg generation throughput: 577.5 tokens/s, Running: 252 reqs, Waiting: 267 reqs, GPU KV cache usage: 29.2%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:27:37 [loggers.py:221] Engine 000: Avg prompt throughput: 3275.9 tokens/s, Avg generation throughput: 5014.8 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 27.9%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:27:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5962.8 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 30.9%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:27:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5937.6 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 34.0%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:28:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6013.4 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 37.1%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:28:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6091.5 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 40.2%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:28:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6117.0 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 43.3%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:28:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6092.4 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 46.4%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:28:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6091.2 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 49.5%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:28:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5606.4 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 52.6%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:29:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 4274.1 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 52.6%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:29:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5298.0 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 55.6%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:29:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5502.1 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 58.7%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:29:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5528.7 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 61.8%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:29:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5553.6 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 64.9%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:29:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5451.8 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 66.6%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:30:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5501.7 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 68.0%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:30:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5400.4 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 71.1%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:30:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5401.6 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 74.2%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:30:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5399.8 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 77.3%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:30:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5350.0 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 80.4%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:30:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5374.3 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 81.5%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:31:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5273.6 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 83.5%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:31:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5323.4 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 86.6%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:31:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5273.1 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 89.7%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:31:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5271.9 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 92.7%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:31:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5272.0 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 94.2%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:31:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5221.0 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 95.8%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:32:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5220.8 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 98.9%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:32:17 [loggers.py:221] Engine 000: Avg prompt throughput: 10034.7 tokens/s, Avg generation throughput: 2195.2 tokens/s, Running: 252 reqs, Waiting: 202 reqs, GPU KV cache usage: 82.3%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:32:27 [loggers.py:221] Engine 000: Avg prompt throughput: 17613.4 tokens/s, Avg generation throughput: 552.8 tokens/s, Running: 252 reqs, Waiting: 117 reqs, GPU KV cache usage: 58.7%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:32:37 [loggers.py:221] Engine 000: Avg prompt throughput: 17407.1 tokens/s, Avg generation throughput: 552.6 tokens/s, Running: 252 reqs, Waiting: 31 reqs, GPU KV cache usage: 34.8%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:32:47 [loggers.py:221] Engine 000: Avg prompt throughput: 7370.0 tokens/s, Avg generation throughput: 3834.5 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 27.8%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:32:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5963.3 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 30.9%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:33:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5962.9 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 34.0%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:33:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6016.0 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 37.1%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:33:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6116.7 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 40.2%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:33:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6141.9 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 43.3%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:33:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6117.0 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 46.4%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:33:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6091.5 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 49.5%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:34:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5913.3 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 51.6%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:34:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 4325.1 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 52.6%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:34:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 4990.2 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 55.6%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:34:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5502.5 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 58.7%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:34:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5502.5 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 61.8%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:34:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5605.7 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 63.5%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:35:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5425.6 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 64.9%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:35:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5527.7 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 68.0%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:35:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5451.1 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 71.1%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:35:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5427.4 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 74.2%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:35:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5451.3 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 77.3%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:35:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5400.0 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 78.8%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:36:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5399.7 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 80.4%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:36:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5324.9 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 83.5%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:36:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5348.6 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 86.6%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:36:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5348.2 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 89.7%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:36:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5297.1 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 92.1%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:36:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5297.6 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 92.9%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:37:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5247.8 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 95.8%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:37:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5271.6 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 98.9%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:37:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 3317.7 tokens/s, Running: 0 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.0%, Prefix cache hit rate: 0.0% +(APIServer pid=1953096) INFO 11-12 05:37:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 0.0 tokens/s, Running: 0 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.0%, Prefix cache hit rate: 0.0% diff --git a/oss_log_numerics.txt b/oss_log_numerics.txt new file mode 100644 index 000000000..698aa9a09 --- /dev/null +++ b/oss_log_numerics.txt @@ -0,0 +1,270 @@ +INFO 11-14 16:36:45 [__init__.py:26] TPU info: node_name=cuiq-infer-v7-2 | tpu_type=tpu7x-8 | worker_id=0 | num_chips=8 | num_cores_per_chip=2 +INFO 11-14 16:36:45 [importing.py:44] Triton is installed but 0 active driver(s) found (expected 1). Disabling Triton to prevent runtime errors. +INFO 11-14 16:36:45 [importing.py:68] Triton not installed or not compatible; certain GPU-related functions will not be available. +WARNING 11-14 16:36:45 [interface.py:197] Failed to import from vllm._C: ModuleNotFoundError("No module named 'vllm._C'") +(APIServer pid=218262) INFO 11-14 16:36:46 [api_server.py:1897] vLLM API server version 0.11.1rc7.dev48+gdf4d3a44a +(APIServer pid=218262) INFO 11-14 16:36:46 [utils.py:253] non-default args: {'model_tag': 'unsloth/gpt-oss-120b-BF16', 'model': 'unsloth/gpt-oss-120b-BF16', 'max_model_len': 8192, 'download_dir': '/mnt/disks/persist', 'tensor_parallel_size': 4, 'data_parallel_size': 2, 'gpu_memory_utilization': 0.98, 'enable_prefix_caching': False, 'max_num_batched_tokens': 8192, 'max_num_seqs': 256, 'async_scheduling': True} +(APIServer pid=218262) INFO 11-14 16:36:47 [model.py:630] Resolved architecture: GptOssForCausalLM +(APIServer pid=218262) INFO 11-14 16:36:47 [model.py:1728] Using max model len 8192 +(APIServer pid=218262) INFO 11-14 16:36:47 [scheduler.py:254] Chunked prefill is enabled with max_num_batched_tokens=8192. +(APIServer pid=218262) INFO 11-14 16:36:47 [config.py:272] Overriding max cuda graph capture size to 1024 for performance. +(APIServer pid=218262) INFO 11-14 16:36:47 [tpu_jax.py:118] Initialized sharding configuration: ShardingConfigManager(total_devices=8, sharding_strategy=ShardingStrategy(tensor_parallelism=4, expert_parallelism=1, sequence_parallelism=1, data_parallelism=2, attention_data_parallelism=1), device_indexes=None) +(APIServer pid=218262) WARNING 11-14 16:36:47 [tpu_jax.py:156] The model dtype is not properly set for JAX backend. Overwriting it to jnp.bfloat16 +(APIServer pid=218262) INFO 11-14 16:36:47 [tpu_jax.py:192] Force using UniProcExecutor for JAX on single host. +INFO 11-14 16:36:51 [__init__.py:26] TPU info: node_name=cuiq-infer-v7-2 | tpu_type=tpu7x-8 | worker_id=0 | num_chips=8 | num_cores_per_chip=2 +INFO 11-14 16:36:51 [importing.py:44] Triton is installed but 0 active driver(s) found (expected 1). Disabling Triton to prevent runtime errors. +INFO 11-14 16:36:51 [importing.py:68] Triton not installed or not compatible; certain GPU-related functions will not be available. +WARNING 11-14 16:36:51 [interface.py:197] Failed to import from vllm._C: ModuleNotFoundError("No module named 'vllm._C'") +(EngineCore_DP0 pid=218428) INFO 11-14 16:36:52 [core.py:94] Initializing a V1 LLM engine (v0.11.1rc7.dev48+gdf4d3a44a) with config: model='unsloth/gpt-oss-120b-BF16', speculative_config=None, tokenizer='unsloth/gpt-oss-120b-BF16', skip_tokenizer_init=False, tokenizer_mode=auto, revision=None, tokenizer_revision=None, trust_remote_code=False, dtype=torch.bfloat16, max_seq_len=8192, download_dir='/mnt/disks/persist', load_format=auto, tensor_parallel_size=4, pipeline_parallel_size=1, data_parallel_size=1, disable_custom_all_reduce=True, quantization=None, enforce_eager=False, kv_cache_dtype=auto, device_config=None, structured_outputs_config=StructuredOutputsConfig(backend='auto', disable_fallback=False, disable_any_whitespace=False, disable_additional_properties=False, reasoning_parser='openai_gptoss', reasoning_parser_plugin='', enable_in_reasoning=False), observability_config=ObservabilityConfig(show_hidden_metrics_for_version=None, otlp_traces_endpoint=None, collect_detailed_traces=None), seed=0, served_model_name=unsloth/gpt-oss-120b-BF16, enable_prefix_caching=False, chunked_prefill_enabled=True, pooler_config=None, compilation_config={'level': None, 'mode': 2, 'debug_dump_path': None, 'cache_dir': '', 'compile_cache_save_format': 'binary', 'backend': 'openxla', 'custom_ops': ['all'], 'splitting_ops': None, 'compile_mm_encoder': True, 'use_inductor': None, 'compile_sizes': None, 'inductor_compile_config': {'enable_auto_functionalized_v2': False}, 'inductor_passes': {}, 'cudagraph_mode': , 'use_cudagraph': True, 'cudagraph_num_of_warmups': 0, 'cudagraph_capture_sizes': None, 'cudagraph_copy_inputs': False, 'full_cuda_graph': False, 'cudagraph_specialize_lora': True, 'use_inductor_graph_partition': False, 'pass_config': {}, 'max_cudagraph_capture_size': 1024, 'local_cache_dir': None} +(EngineCore_DP0 pid=218428) WARNING 11-14 16:36:52 [tpu_jax.py:228] Pin memory is not supported on TPU. +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 +(EngineCore_DP0 pid=218428) INFO 11-14 16:36:57 [parallel_state.py:1325] rank 0 in world size 1 is assigned as DP rank 0, PP rank 0, TP rank 0, EP rank 0 +(EngineCore_DP0 pid=218428) INFO 11-14 16:36:58 [tpu_jax_runner.py:273] Init mesh | mesh=Mesh('data': 2, 'model': 4, axis_types=(Auto, Auto)) +(EngineCore_DP0 pid=218428) INFO 11-14 16:36:58 [utils.py:314] Phased-based profiler enabled. Traces will be saved to: gs://wenxindong-vm/trace/gpt_oss/dp2/numerics +(EngineCore_DP0 pid=218428) INFO 11-14 16:36:58 [utils.py:93] Prepared token paddings: [16, 32, 64, 128, 256, 512, 1024, 2048, 4096, 8192, 16384] +(EngineCore_DP0 pid=218428) INFO 11-14 16:36:58 [utils.py:59] Prepared request paddings: [8, 16, 32, 64, 128, 256, 512] +(EngineCore_DP0 pid=218428) INFO 11-14 16:36:58 [compilation_manager.py:34] Enabling JAX compile cache. +(EngineCore_DP0 pid=218428) INFO 11-14 16:36:58 [tpu_worker_jax.py:152] Init worker | rank=0 | node_id=0 | is_driver_worker=True | hbm=[(0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75)]GiB +(EngineCore_DP0 pid=218428) INFO 11-14 16:36:58 [model_loader.py:318] Loading model with MODEL_IMPL_TYPE=vllm +(EngineCore_DP0 pid=218428) WARNING 11-14 16:36:59 [rocm.py:34] Failed to import from amdsmi with ModuleNotFoundError("No module named 'amdsmi'") +(EngineCore_DP0 pid=218428) WARNING 11-14 16:36:59 [rocm.py:39] Failed to import from vllm._C with ModuleNotFoundError("No module named 'vllm._C'") +(EngineCore_DP0 pid=218428) WARNING 11-14 16:36:59 [rocm.py:45] Failed to import from vllm._rocm_C with ModuleNotFoundError("No module named 'vllm._rocm_C'") +(EngineCore_DP0 pid=218428) WARNING 11-14 16:36:59 [registry.py:171] _Backend has been renamed to AttentionBackendEnum. Please update your code to use AttentionBackendEnum instead. _Backend will be removed in a future release. +(EngineCore_DP0 pid=218428) INFO 11-14 16:36:59 [tpu_jax.py:63] Cannot use None backend on TPU. +(EngineCore_DP0 pid=218428) INFO 11-14 16:36:59 [tpu_jax.py:66] Using Pallas V1 backend. +(EngineCore_DP0 pid=218428) INFO 11-14 16:36:59 [layer.py:331] Disabling MoE shared_experts cuda stream +(EngineCore_DP0 pid=218428) Loading safetensors checkpoint shards: 0% Completed | 0/73 [00:00 +(APIServer pid=218262) sys.exit(main()) +(APIServer pid=218262) ^^^^^^ +(APIServer pid=218262) File "/home/wenxindong_google_com/vllm/vllm/entrypoints/cli/main.py", line 73, in main +(APIServer pid=218262) args.dispatch_function(args) +(APIServer pid=218262) File "/home/wenxindong_google_com/vllm/vllm/entrypoints/cli/serve.py", line 59, in cmd +(APIServer pid=218262) uvloop.run(run_server(args)) +(APIServer pid=218262) File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/uvloop/__init__.py", line 96, in run +(APIServer pid=218262) return __asyncio.run( +(APIServer pid=218262) ^^^^^^^^^^^^^^ +(APIServer pid=218262) File "/mnt/disks/persist/vllm_conda/lib/python3.12/asyncio/runners.py", line 195, in run +(APIServer pid=218262) return runner.run(main) +(APIServer pid=218262) ^^^^^^^^^^^^^^^^ +(APIServer pid=218262) File "/mnt/disks/persist/vllm_conda/lib/python3.12/asyncio/runners.py", line 118, in run +(APIServer pid=218262) return self._loop.run_until_complete(task) +(APIServer pid=218262) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(APIServer pid=218262) File "uvloop/loop.pyx", line 1518, in uvloop.loop.Loop.run_until_complete +(APIServer pid=218262) File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/uvloop/__init__.py", line 48, in wrapper +(APIServer pid=218262) return await main +(APIServer pid=218262) ^^^^^^^^^^ +(APIServer pid=218262) File "/home/wenxindong_google_com/vllm/vllm/entrypoints/openai/api_server.py", line 1944, in run_server +(APIServer pid=218262) await run_server_worker(listen_address, sock, args, **uvicorn_kwargs) +(APIServer pid=218262) File "/home/wenxindong_google_com/vllm/vllm/entrypoints/openai/api_server.py", line 1963, in run_server_worker +(APIServer pid=218262) async with build_async_engine_client( +(APIServer pid=218262) ^^^^^^^^^^^^^^^^^^^^^^^^^^ +(APIServer pid=218262) File "/mnt/disks/persist/vllm_conda/lib/python3.12/contextlib.py", line 210, in __aenter__ +(APIServer pid=218262) return await anext(self.gen) +(APIServer pid=218262) ^^^^^^^^^^^^^^^^^^^^^ +(APIServer pid=218262) File "/home/wenxindong_google_com/vllm/vllm/entrypoints/openai/api_server.py", line 192, in build_async_engine_client +(APIServer pid=218262) async with build_async_engine_client_from_engine_args( +(APIServer pid=218262) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(APIServer pid=218262) File "/mnt/disks/persist/vllm_conda/lib/python3.12/contextlib.py", line 210, in __aenter__ +(APIServer pid=218262) return await anext(self.gen) +(APIServer pid=218262) ^^^^^^^^^^^^^^^^^^^^^ +(APIServer pid=218262) File "/home/wenxindong_google_com/vllm/vllm/entrypoints/openai/api_server.py", line 233, in build_async_engine_client_from_engine_args +(APIServer pid=218262) async_llm = AsyncLLM.from_vllm_config( +(APIServer pid=218262) ^^^^^^^^^^^^^^^^^^^^^^^^^^ +(APIServer pid=218262) File "/home/wenxindong_google_com/vllm/vllm/utils/func_utils.py", line 116, in inner +(APIServer pid=218262) return fn(*args, **kwargs) +(APIServer pid=218262) ^^^^^^^^^^^^^^^^^^^ +(APIServer pid=218262) File "/home/wenxindong_google_com/vllm/vllm/v1/engine/async_llm.py", line 202, in from_vllm_config +(APIServer pid=218262) return cls( +(APIServer pid=218262) ^^^^ +(APIServer pid=218262) File "/home/wenxindong_google_com/vllm/vllm/v1/engine/async_llm.py", line 132, in __init__ +(APIServer pid=218262) self.engine_core = EngineCoreClient.make_async_mp_client( +(APIServer pid=218262) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(APIServer pid=218262) File "/home/wenxindong_google_com/vllm/vllm/v1/engine/core_client.py", line 121, in make_async_mp_client +(APIServer pid=218262) return AsyncMPClient(*client_args) +(APIServer pid=218262) ^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(APIServer pid=218262) File "/home/wenxindong_google_com/vllm/vllm/v1/engine/core_client.py", line 808, in __init__ +(APIServer pid=218262) super().__init__( +(APIServer pid=218262) File "/home/wenxindong_google_com/vllm/vllm/v1/engine/core_client.py", line 469, in __init__ +(APIServer pid=218262) with launch_core_engines(vllm_config, executor_class, log_stats) as ( +(APIServer pid=218262) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ +(APIServer pid=218262) File "/mnt/disks/persist/vllm_conda/lib/python3.12/contextlib.py", line 144, in __exit__ +(APIServer pid=218262) next(self.gen) +(APIServer pid=218262) File "/home/wenxindong_google_com/vllm/vllm/v1/engine/utils.py", line 898, in launch_core_engines +(APIServer pid=218262) wait_for_engine_startup( +(APIServer pid=218262) File "/home/wenxindong_google_com/vllm/vllm/v1/engine/utils.py", line 955, in wait_for_engine_startup +(APIServer pid=218262) raise RuntimeError( +(APIServer pid=218262) RuntimeError: Engine core initialization failed. See root cause above. Failed core proc(s): {} diff --git a/tpu_inference/layers/vllm/fused_moe.py b/tpu_inference/layers/vllm/fused_moe.py index a1c5e5428..809ab16d7 100644 --- a/tpu_inference/layers/vllm/fused_moe.py +++ b/tpu_inference/layers/vllm/fused_moe.py @@ -175,7 +175,7 @@ def _gmm_all_reduce(lhs, rhs, group_sizes): out_specs=(P(ShardingAxisName.MLP_DATA)), check_rep=False, )(lhs, rhs, group_sizes) - jax.debug.print("gmm_result before bias {} {}", gmm_result.sum(), gmm_result.ravel()[:10]) + # jax.debug.print("gmm_result before bias {} {}", gmm_result.sum(), gmm_result.ravel()[:10]) if rhs_bias is not None: rhs_bias = jnp.repeat(rhs_bias, group_sizes_global, 0, total_repeat_length=m) gmm_result = (gmm_result + rhs_bias).astype(gmm_result.dtype) @@ -365,7 +365,7 @@ def fused_moe_func( gating_output = jax.lax.with_sharding_constraint( gating_output, NamedSharding(mesh, P(ShardingAxisName.ATTN_DATA, None))) - jax.debug.print("hidden_state before MoE {} {}", hidden_states.sum(), hidden_states.ravel()[:10]) + # jax.debug.print("hidden_state before MoE {} {}", hidden_states.sum(), hidden_states.ravel()[:10]) hidden_states = hidden_states.reshape(num_tokens, hidden_size) gating_output = gating_output.reshape(num_tokens, global_num_experts) @@ -386,7 +386,7 @@ def _process_tokens_locally(hidden_states_local, topk_indices_local): # Reduce group_sizes once across data parallel shards to get global counts # This is needed for bias addition and should be done only once for efficiency - group_sizes_global = jax.lax.psum(group_sizes_local, axis_name=ShardingAxisName.MLP_DATA) + group_sizes_global = jax.lax.psum(group_sizes_local, axis_name=ShardingAxisName.ATTN_DATA) x = hidden_states_local[token_indices_sorted] return x, group_sizes_local, group_sizes_global, topk_argsort_revert_indices @@ -399,8 +399,8 @@ def _process_tokens_locally(hidden_states_local, topk_indices_local): check_rep=False, )(hidden_states, topk_indices) - jax.debug.print("hidden_state before gmm {} {}", x.sum(), x.ravel()[:10]) - jax.debug.print("group_sizes {} {}", group_sizes.sum(), group_sizes) + # jax.debug.print("hidden_state before gmm {} {}", x.sum(), x.ravel()[:10]) + # jax.debug.print("group_sizes {} {}", group_sizes.sum(), group_sizes) if use_ep: x = expert_sharded_gmm( x, @@ -423,11 +423,11 @@ def _process_tokens_locally(hidden_states_local, topk_indices_local): mesh=mesh, intermediate_size=intermediate_size, ) - jax.debug.print("hidden_state after first gmm x1 {} {}", x1.sum(), x1.ravel()[:10]) - jax.debug.print("hidden_state after first gmm x2 {} {}", x2.sum(), x2.ravel()[:10]) + # jax.debug.print("hidden_state after first gmm x1 {} {}", x1.sum(), x1.ravel()[:10]) + # jax.debug.print("hidden_state after first gmm x2 {} {}", x2.sum(), x2.ravel()[:10]) x = activation_fn(activation, x1, x2) - jax.debug.print("hidden_state after activation {} {}", x.sum(), x.ravel()[:10]) + # jax.debug.print("hidden_state after activation {} {}", x.sum(), x.ravel()[:10]) if use_ep: x = expert_sharded_gmm( x, @@ -450,7 +450,7 @@ def _process_tokens_locally(hidden_states_local, topk_indices_local): transpose_rhs=True, mesh=mesh, ) - jax.debug.print("hidden_state after second gmm {} {}", x.sum(), x.ravel()[:10]) + # jax.debug.print("hidden_state after second gmm {} {}", x.sum(), x.ravel()[:10]) def _finalize_output(x_local, topk_argsort_revert_indices_local, topk_weights_local): x_local = x_local[topk_argsort_revert_indices_local].reshape(-1, topk, hidden_size) @@ -465,12 +465,12 @@ def _finalize_output(x_local, topk_argsort_revert_indices_local, topk_weights_lo out_specs=(P(ShardingAxisName.ATTN_DATA, None)), check_rep=False, )(x, topk_argsort_revert_indices, topk_weights) - jax.debug.print("hidden_state after finalize output {} {}", x.sum(), x.ravel()[:10]) + # jax.debug.print("hidden_state after finalize output {} {}", x.sum(), x.ravel()[:10]) x = x.reshape(orig_shape) if reduce_results: x = jax.lax.with_sharding_constraint(x, NamedSharding(mesh, P(ShardingAxisName.ATTN_DATA))) - jax.debug.print("hidden_state after reducing result {} {}", x.sum(), x.ravel()[:10]) + # jax.debug.print("hidden_state after reducing result {} {}", x.sum(), x.ravel()[:10]) return x From e37a89bbadb3f5655996f85f207387433b586224 Mon Sep 17 00:00:00 2001 From: wenxindongwork Date: Fri, 14 Nov 2025 18:54:12 +0000 Subject: [PATCH 10/17] wip --- tpu_inference/layers/vllm/fused_moe.py | 50 +++++++++++++------------- 1 file changed, 26 insertions(+), 24 deletions(-) diff --git a/tpu_inference/layers/vllm/fused_moe.py b/tpu_inference/layers/vllm/fused_moe.py index 809ab16d7..750c4df84 100644 --- a/tpu_inference/layers/vllm/fused_moe.py +++ b/tpu_inference/layers/vllm/fused_moe.py @@ -103,7 +103,6 @@ def tensor_sharded_gmm_merged_column_parallel( rhs: jax.Array, rhs_bias: jax.Array | None, group_sizes: jax.Array, - group_sizes_global: jax.Array, transpose_rhs: bool, mesh: Mesh, intermediate_size: int, @@ -129,10 +128,18 @@ def tensor_sharded_gmm_merged_column_parallel( check_rep=False, )(lhs, rhs, group_sizes) - if rhs_bias is not None: - rhs_bis = jnp.repeat(rhs_bias, group_sizes_global, 0, total_repeat_length=m) - gmm_result = (gmm_result + rhs_bis).astype(gmm_result.dtype) + def _add_bias(gmm_result_local, rhs_bias_local, group_sizes_global): + rhs_bis = jnp.repeat(rhs_bias_local, group_sizes_global, 0, total_repeat_length=m//mesh.shape["data"]) + return (gmm_result_local + rhs_bis).astype(gmm_result_local.dtype) + + gmm_result = shard_map( + _add_bias, + mesh=mesh, + in_specs=(P(ShardingAxisName.MLP_DATA, ShardingAxisName.MLP_TENSOR), P(None, ShardingAxisName.MLP_TENSOR), P(ShardingAxisName.MLP_DATA)), + out_specs=(P(ShardingAxisName.MLP_DATA, ShardingAxisName.MLP_TENSOR)), + check_rep=False, + )(gmm_result, rhs_bias, group_sizes) n_shards = mesh.shape['model'] * mesh.shape.get('attn_dp', 1) output_sizes = [intermediate_size, intermediate_size] @@ -146,7 +153,6 @@ def tensor_sharded_gmm_row_parallel( rhs: jax.Array, rhs_bias: jax.Array | None, group_sizes: jax.Array, - group_sizes_global: jax.Array, transpose_rhs: bool, mesh: Mesh, ) -> jax.Array: @@ -177,8 +183,17 @@ def _gmm_all_reduce(lhs, rhs, group_sizes): )(lhs, rhs, group_sizes) # jax.debug.print("gmm_result before bias {} {}", gmm_result.sum(), gmm_result.ravel()[:10]) if rhs_bias is not None: - rhs_bias = jnp.repeat(rhs_bias, group_sizes_global, 0, total_repeat_length=m) - gmm_result = (gmm_result + rhs_bias).astype(gmm_result.dtype) + def _add_bias(gmm_result_local, rhs_bias_local, group_sizes_global): + rhs_bis = jnp.repeat(rhs_bias_local, group_sizes_global, 0, total_repeat_length=m//mesh.shape["data"]) + return (gmm_result_local + rhs_bis).astype(gmm_result_local.dtype) + + gmm_result = shard_map( + _add_bias, + mesh=mesh, + in_specs=(P(ShardingAxisName.MLP_DATA), P(), P(ShardingAxisName.MLP_DATA)), + out_specs=(P(ShardingAxisName.MLP_DATA)), + check_rep=False, + )(gmm_result, rhs_bias, group_sizes) return gmm_result @@ -359,13 +374,6 @@ def fused_moe_func( assert (num_tokens * topk) % 16 == 0, ( "The kernel requires num_tokens * topk to be a multiple of " f"16 but got {num_tokens}*{topk}={num_tokens*topk}") - hidden_states = jax.lax.with_sharding_constraint( - hidden_states, NamedSharding(mesh, P(ShardingAxisName.ATTN_DATA, None))) - - gating_output = jax.lax.with_sharding_constraint( - gating_output, NamedSharding(mesh, P(ShardingAxisName.ATTN_DATA, None))) - - # jax.debug.print("hidden_state before MoE {} {}", hidden_states.sum(), hidden_states.ravel()[:10]) hidden_states = hidden_states.reshape(num_tokens, hidden_size) gating_output = gating_output.reshape(num_tokens, global_num_experts) @@ -383,19 +391,15 @@ def _process_tokens_locally(hidden_states_local, topk_indices_local): token_indices = jnp.arange(num_tokens_local, dtype=jnp.int32).repeat(topk) token_indices_sorted = token_indices[topk_argsort_indices] group_sizes_local = jnp.bincount(topk_indices_flat, length=global_num_experts) - - # Reduce group_sizes once across data parallel shards to get global counts - # This is needed for bias addition and should be done only once for efficiency - group_sizes_global = jax.lax.psum(group_sizes_local, axis_name=ShardingAxisName.ATTN_DATA) - + x = hidden_states_local[token_indices_sorted] - return x, group_sizes_local, group_sizes_global, topk_argsort_revert_indices + return x, group_sizes_local, topk_argsort_revert_indices - x, group_sizes, group_sizes_global, topk_argsort_revert_indices = shard_map( + x, group_sizes, topk_argsort_revert_indices = shard_map( _process_tokens_locally, mesh=mesh, in_specs=(P(ShardingAxisName.ATTN_DATA, None), P(ShardingAxisName.ATTN_DATA, None)), - out_specs=(P(ShardingAxisName.ATTN_DATA, None), P(ShardingAxisName.ATTN_DATA), P(), P(ShardingAxisName.ATTN_DATA)), + out_specs=(P(ShardingAxisName.ATTN_DATA, None), P(ShardingAxisName.ATTN_DATA), P(ShardingAxisName.ATTN_DATA)), check_rep=False, )(hidden_states, topk_indices) @@ -418,7 +422,6 @@ def _process_tokens_locally(hidden_states_local, topk_indices_local): w1, w1_bias, group_sizes, - group_sizes_global, transpose_rhs=True, mesh=mesh, intermediate_size=intermediate_size, @@ -446,7 +449,6 @@ def _process_tokens_locally(hidden_states_local, topk_indices_local): w2, w2_bias, group_sizes, - group_sizes_global, transpose_rhs=True, mesh=mesh, ) From 5dcdecbecb7e3af07fc7544e47948db28d80fa90 Mon Sep 17 00:00:00 2001 From: wenxindongwork Date: Sun, 16 Nov 2025 17:54:11 +0000 Subject: [PATCH 11/17] wip --- tpu_inference/layers/vllm/fused_moe.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tpu_inference/layers/vllm/fused_moe.py b/tpu_inference/layers/vllm/fused_moe.py index 750c4df84..9f676f4db 100644 --- a/tpu_inference/layers/vllm/fused_moe.py +++ b/tpu_inference/layers/vllm/fused_moe.py @@ -8,7 +8,7 @@ from tpu_inference.layers.vllm.linear_common import \ slice_sharded_tensor_for_concatenation -from tpu_inference.layers.jax.sharding import ShardingAxisName +from tpu_inference.layers.common.sharding import ShardingAxisName P = PartitionSpec From f3e4b88b896e9da9e076c6a3e3b17f2119dcf040 Mon Sep 17 00:00:00 2001 From: wenxindongwork Date: Sun, 16 Nov 2025 17:54:25 +0000 Subject: [PATCH 12/17] wip --- tpu_inference/layers/vllm/quantization/common.py | 2 +- tpu_inference/layers/vllm/quantization/unquantized.py | 2 +- tpu_inference/layers/vllm/sharding.py | 2 +- 3 files changed, 3 insertions(+), 3 deletions(-) diff --git a/tpu_inference/layers/vllm/quantization/common.py b/tpu_inference/layers/vllm/quantization/common.py index f443d6a26..7872c4aaa 100644 --- a/tpu_inference/layers/vllm/quantization/common.py +++ b/tpu_inference/layers/vllm/quantization/common.py @@ -11,7 +11,7 @@ ReplicatedLinear, RowParallelLinear) -from tpu_inference.layers.jax.sharding import ShardingAxisName +from tpu_inference.layers.common.sharding import ShardingAxisName from tpu_inference.layers.vllm.linear_common import \ get_model_matmul_fusion_assignment from tpu_inference.utils import TPU_SECOND_LAST_MINOR diff --git a/tpu_inference/layers/vllm/quantization/unquantized.py b/tpu_inference/layers/vllm/quantization/unquantized.py index 141b192d3..f666422b9 100644 --- a/tpu_inference/layers/vllm/quantization/unquantized.py +++ b/tpu_inference/layers/vllm/quantization/unquantized.py @@ -25,7 +25,7 @@ from tpu_inference.kernels.fused_moe.v1.kernel import fused_ep_moe from tpu_inference.layers.common.quant_methods import (UNQUANTIZED, get_tpu_quant_method) -from tpu_inference.layers.jax.sharding import ShardingAxisName +from tpu_inference.layers.common.sharding import ShardingAxisName from tpu_inference.layers.vllm.fused_moe import fused_moe_func_padded from tpu_inference.layers.vllm.linear_common import ( diff --git a/tpu_inference/layers/vllm/sharding.py b/tpu_inference/layers/vllm/sharding.py index fc1bc983b..1e28ae745 100644 --- a/tpu_inference/layers/vllm/sharding.py +++ b/tpu_inference/layers/vllm/sharding.py @@ -19,7 +19,7 @@ from vllm.model_executor.layers.vocab_parallel_embedding import ( ParallelLMHead, VocabParallelEmbedding) -from tpu_inference.layers.jax.sharding import ShardingAxisName +from tpu_inference.layers.common.sharding import ShardingAxisName from tpu_inference.logger import init_logger P = PartitionSpec From 70e450306f7875ff8245803ed30176b99a615b61 Mon Sep 17 00:00:00 2001 From: wenxindongwork Date: Mon, 17 Nov 2025 07:25:29 +0000 Subject: [PATCH 13/17] wip --- repro_attention_dp.py | 388 ++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 388 insertions(+) create mode 100644 repro_attention_dp.py diff --git a/repro_attention_dp.py b/repro_attention_dp.py new file mode 100644 index 000000000..dac099ab3 --- /dev/null +++ b/repro_attention_dp.py @@ -0,0 +1,388 @@ +""" +Reproduction script to compare attention kernel performance and HLO +with and without data parallelism. + +Usage: + python repro_attention_dp.py --mode no_dp + python repro_attention_dp.py --mode with_dp +""" + +import argparse +import os +import time +from pathlib import Path +import numpy as np + +import jax +import jax.numpy as jnp +from jax.sharding import Mesh, PartitionSpec as P +from jax import NamedSharding, shard_map + +import sys +sys.path.insert(0, '/home/wenxindong_google_com/tpu-inference') + +from tpu_inference.kernels.ragged_paged_attention.v3.kernel_hd64 import ( + ragged_paged_attention_hd64, + get_kv_cache_shape, +) +from tpu_inference.layers.common.sharding import ShardingAxisName + + +def create_test_inputs( + batch_size: int = 256, + max_num_tokens: int = 256, + num_q_heads: int = 32, + num_kv_heads: int = 8, + head_dim: int = 64, + page_size: int = 256, + pages_per_seq: int = 16, + total_num_pages: int = 8282, + dp_size: int = 1, +): + + # batch_size = batch_size * dp_size + total_num_pages = total_num_pages * dp_size + # Q, K, V tensors - use unique seeds for each DP replica + q = jnp.concatenate([jax.random.normal( + jax.random.PRNGKey(0), # Unique seed per replica + (max_num_tokens, num_q_heads, head_dim), + dtype=jnp.bfloat16, + ) for i in range(dp_size)], axis=0) + k = jnp.concatenate([jax.random.normal( + jax.random.PRNGKey(0), # Unique seed per replica + (max_num_tokens, num_kv_heads, head_dim), + dtype=jnp.bfloat16, + ) for i in range(dp_size)], axis=0) + v = jnp.concatenate([jax.random.normal( + jax.random.PRNGKey(0), # Unique seed per replica + (max_num_tokens, num_kv_heads, head_dim), + dtype=jnp.bfloat16, + ) for i in range(dp_size)], axis=0) + + # KV cache + kv_cache_shape = get_kv_cache_shape( + total_num_pages, + page_size, + num_kv_heads, + head_dim, + jnp.bfloat16, + ) + kv_cache = jnp.zeros(kv_cache_shape, dtype=jnp.bfloat16) + + # kv_lens: each DP rank has its own requests + kv_lens = [] + for dp_rank in range(dp_size): + kv_lens.append([1024 for _ in range(batch_size)]) + kv_lens = jnp.array(kv_lens, dtype=jnp.int32).reshape(-1) + + # Page indices: each DP rank manages its own pages + page_indices = jnp.concatenate([jnp.arange( + batch_size * pages_per_seq, dtype=jnp.int32 + ) for _ in range(dp_size)]) + + # cu_q_lens: cumulative query lengths PER DP RANK + cu_q_lens = [] + for _ in range(dp_size): + cu_q_lens.append([1 * i for i in range(batch_size + 1)]) + cu_q_lens = jnp.array(cu_q_lens, dtype=jnp.int32).reshape(-1) + + # Distribution: per DP rank [decode_end, prefill_end, mixed_end] + distribution_list = [] + for _ in range(dp_size): + distribution_list.extend([0, 0, batch_size]) + distribution = jnp.array(distribution_list, dtype=jnp.int32) + + # Optional attention sink + attention_sink = None + + sm_scale = head_dim ** -0.5 + + print(f"\nInput creation (dp_size={dp_size}):") + print(f" q: {q.shape}") + print(f" kv_cache: {kv_cache.shape}") + print(f" kv_lens: {kv_lens.shape} = {kv_lens}") + print(f" page_indices: {page_indices.shape}", page_indices) + print(f" cu_q_lens: {cu_q_lens.shape} = {cu_q_lens}") + print(f" distribution: {distribution.shape} = {distribution}") + + return { + 'q': q, + 'k': k, + 'v': v, + 'kv_cache': kv_cache, + 'kv_lens': kv_lens, + 'page_indices': page_indices, + 'cu_q_lens': cu_q_lens, + 'distribution': distribution, + 'attention_sink': attention_sink, + 'sm_scale': sm_scale, + } + +def run(inputs, dump_dir, dp_size=2, num_devices=8, dp=True): + """Run attention kernel WITH data parallelism.""" + print("\n" + "="*80) + if dp: + print(f"Running WITH Data Parallelism (dp_size={dp_size}, num_devices={num_devices})") + else: + print(f"Running WITHOUT Data Parallelism (num_devices={num_devices})") + print("="*80) + + print(f"Input shapes:") + for key, val in inputs.items(): + if isinstance(val, jax.Array): + print(f" {key}: {val.shape} {val.dtype}") + + devices = jax.devices() + total_devices = 8 + if dp: + device_array = np.array(devices[:total_devices]).reshape(dp_size, -1) + else: + device_array = np.array(devices[:total_devices//dp_size]).reshape(1, -1) + mesh = Mesh( + device_array, + axis_names=(ShardingAxisName.ATTN_DATA, ShardingAxisName.ATTN_HEAD), + ) + print(f"Mesh: {mesh}") + print(f"Mesh shape: {mesh.shape}") + + + # Define sharding specs (matching the actual implementation) + qkv_spec = P(ShardingAxisName.ATTN_DATA, ShardingAxisName.ATTN_HEAD, None) + kv_cache_spec = P(ShardingAxisName.ATTN_DATA, None, ShardingAxisName.ATTN_HEAD, None, None) + + in_specs = ( + qkv_spec, # q + qkv_spec, # k + qkv_spec, # v + kv_cache_spec, # kv_cache + P(ShardingAxisName.ATTN_DATA), # kv_lens + P(ShardingAxisName.ATTN_DATA), # page_indices + P(ShardingAxisName.ATTN_DATA), # cu_q_lens + P(ShardingAxisName.ATTN_DATA), # distribution + ) + out_specs = (qkv_spec, kv_cache_spec) + + print(f"\nSharding specs:") + print(f" qkv_spec: {qkv_spec}") + print(f" kv_cache_spec: {kv_cache_spec}") + + # Create sharded function + def _ragged_paged_attention(q, k, v, kv_cache, kv_lens, page_indices, cu_q_lens, distribution): + return ragged_paged_attention_hd64( + q, k, v, kv_cache, kv_lens, page_indices, cu_q_lens, distribution, + attention_sink=None, + sm_scale=inputs['sm_scale'], + ) + + sharded_fn = shard_map( + _ragged_paged_attention, + mesh=mesh, + in_specs=in_specs, + out_specs=out_specs, + check_vma=False, + ) + + attention_fn = jax.jit(sharded_fn) + + # Lower and dump HLO + print("\nLowering computation...") + lowered = attention_fn.lower( + inputs['q'], + inputs['k'], + inputs['v'], + inputs['kv_cache'], + inputs['kv_lens'], + inputs['page_indices'], + inputs['cu_q_lens'], + inputs['distribution'], + ) + + # Dump HLO + hlo_text = lowered.as_text() + if dp: + hlo_path = Path(dump_dir) / f"with_dp_{dp_size}_hlo.txt" + else: + hlo_path = Path(dump_dir) / f"no_dp_hlo.txt" + hlo_path.write_text(hlo_text) + print(f"✓ HLO dumped to: {hlo_path}") + + # Compile + print("Compiling...") + compiled = lowered.compile() + + inputs['q'] = jax.device_put(inputs['q'], NamedSharding(mesh, qkv_spec)) + inputs['k'] = jax.device_put(inputs['k'], NamedSharding(mesh, qkv_spec)) + inputs['v'] = jax.device_put(inputs['v'], NamedSharding(mesh, qkv_spec)) + inputs['kv_cache'] = jax.device_put(inputs['kv_cache'], NamedSharding(mesh, kv_cache_spec)) + inputs['kv_lens'] = jax.device_put(inputs['kv_lens'], NamedSharding(mesh, P(ShardingAxisName.ATTN_DATA))) + inputs['page_indices'] = jax.device_put(inputs['page_indices'], NamedSharding(mesh, P(ShardingAxisName.ATTN_DATA))) + inputs['cu_q_lens'] = jax.device_put(inputs['cu_q_lens'], NamedSharding(mesh, P(ShardingAxisName.ATTN_DATA))) + inputs['distribution'] = jax.device_put(inputs['distribution'], NamedSharding(mesh, P(ShardingAxisName.ATTN_DATA))) + + # Warm up + print("Warming up...") + for _ in range(3): + result = attention_fn( + inputs['q'], + inputs['k'], + inputs['v'], + inputs['kv_cache'], + inputs['kv_lens'], + inputs['page_indices'], + inputs['cu_q_lens'], + inputs['distribution'], + ) + jax.block_until_ready(result) + + # Benchmark + print("Benchmarking (10 runs)...") + times = [] + for i in range(10): + start = time.time() + result = attention_fn( + inputs['q'], + inputs['k'], + inputs['v'], + inputs['kv_cache'], + inputs['kv_lens'], + inputs['page_indices'], + inputs['cu_q_lens'], + inputs['distribution'], + ) + jax.block_until_ready(result) + elapsed = time.time() - start + times.append(elapsed) + print(f" Run {i+1}: {elapsed*1000:.2f} ms") + + avg_time = sum(times) / len(times) + print(f"\n✓ Average time: {avg_time*1000:.2f} ms") + print(f"✓ Output shape: {result[0].shape}") + + return result, avg_time + + +def main(): + parser = argparse.ArgumentParser(description="Reproduce attention DP issue") + parser.add_argument( + '--mode', + type=str, + choices=['no_dp', 'with_dp', 'both'], + default='both', + help='Which mode to run' + ) + parser.add_argument( + '--dp_size', + type=int, + default=2, + help='Data parallel size for with_dp mode' + ) + parser.add_argument( + '--num_devices_no_dp', + type=int, + default=4, + help='Number of devices for no_dp mode (head parallelism only)' + ) + parser.add_argument( + '--num_devices_with_dp', + type=int, + default=8, + help='Number of devices for with_dp mode (dp_size * head_parallelism)' + ) + parser.add_argument( + '--dump_dir', + type=str, + default='/tmp/attention_dp_repro', + help='Directory to dump HLO files' + ) + parser.add_argument( + '--batch_size', + type=int, + default=256, + help='Batch size' + ) + args = parser.parse_args() + + # Create dump directory + dump_dir = Path(args.dump_dir) + dump_dir.mkdir(parents=True, exist_ok=True) + print(f"HLO dump directory: {dump_dir}") + + # Create test inputs + print("\nCreating test inputs...") + # Note: We'll create DP-specific inputs when running with_dp mode + inputs_no_dp = None + inputs_with_dp = None + + print(f"\nJAX version: {jax.__version__}") + print(f"Available devices: {jax.devices()}") + print(f"Device count: {jax.device_count()}") + + results = {} + + # Run without DP + if args.mode in ['no_dp', 'both']: + print("\nCreating inputs for no_dp mode...") + inputs_no_dp = create_test_inputs(batch_size=args.batch_size, dp_size=1) + result, avg_time = run(inputs_no_dp, dump_dir, num_devices=args.num_devices_no_dp, dp=False) + results['no_dp'] = {'result': result, 'time': avg_time} + + # Run with DP + if args.mode in ['with_dp', 'both']: + print(f"\nCreating inputs for with_dp mode (dp_size={args.dp_size})...") + inputs_with_dp = create_test_inputs(batch_size=args.batch_size, dp_size=args.dp_size) + result, avg_time = run(inputs_with_dp, dump_dir, dp_size=args.dp_size, num_devices=args.num_devices_with_dp, dp=True) + results['with_dp'] = {'result': result, 'time': avg_time} + + # Compare results + if args.mode == 'both': + print("\n" + "="*80) + print("COMPARISON") + print("="*80) + + no_dp_time = results['no_dp']['time'] + with_dp_time = results['with_dp']['time'] + speedup = no_dp_time / with_dp_time + slowdown = with_dp_time / no_dp_time + + print(f"No DP time: {no_dp_time*1000:.2f} ms") + print(f"With DP time: {with_dp_time*1000:.2f} ms") + + if speedup > 1.0: + print(f"✓ DP is {speedup:.2f}x FASTER") + else: + print(f"✗ DP is {slowdown:.2f}x SLOWER") + + # Check output consistency + total = results['no_dp']['result'][0].shape[0] + for i in range(args.dp_size): + + out_no_dp = np.array(results['no_dp']['result'][0], dtype=np.float32) + out_with_dp = np.array(results['with_dp']['result'][0][total*i : total*(i+1), ...], dtype=np.float32) + + max_diff = np.max(np.abs(out_no_dp - out_with_dp)) + print(f"\nMax output difference for DP rank {i}: {max_diff}") + + if max_diff < 1e-2: + print("✓ Outputs match (within tolerance)") + else: + print("✗ Outputs differ significantly!") + + print("\n" + "="*80) + print("NEXT STEPS") + print("="*80) + print(f"\n1. Compare HLO files in: {dump_dir}") + print(f" - no_dp_hlo.txt") + print(f" - with_dp_{args.dp_size}_hlo.txt") + print(f"\n2. Look for:") + print(f" - all-reduce, all-gather, collective-permute operations") + print(f" - Extra transpose/reshape operations") + print(f" - Different memory layouts") + print(f"\n3. Use diff tool:") + print(f" diff {dump_dir}/no_dp_hlo.txt {dump_dir}/with_dp_{args.dp_size}_hlo.txt") + print(f"\n4. Or use XLA dump for more detail:") + print(f" XLA_FLAGS='--xla_dump_to={dump_dir}/xla_dump --xla_dump_hlo_as_text' python {__file__} --mode {args.mode}") + print() + + +if __name__ == '__main__': + main() From d64b1babd1835abda84d249ae43fc894a6591384 Mon Sep 17 00:00:00 2001 From: wenxindongwork Date: Tue, 18 Nov 2025 21:38:28 +0000 Subject: [PATCH 14/17] wip --- repro_attention_dp.py | 1576 +++++++++++++++++++++++++++++++++++++---- 1 file changed, 1438 insertions(+), 138 deletions(-) diff --git a/repro_attention_dp.py b/repro_attention_dp.py index dac099ab3..6636b8177 100644 --- a/repro_attention_dp.py +++ b/repro_attention_dp.py @@ -3,12 +3,10 @@ with and without data parallelism. Usage: - python repro_attention_dp.py --mode no_dp - python repro_attention_dp.py --mode with_dp + python repro_attention_dp.py """ import argparse -import os import time from pathlib import Path import numpy as np @@ -17,44 +15,42 @@ import jax.numpy as jnp from jax.sharding import Mesh, PartitionSpec as P from jax import NamedSharding, shard_map - -import sys -sys.path.insert(0, '/home/wenxindong_google_com/tpu-inference') +from tpu_inference.layers.vllm.attention import _jax_attn_func +# import sys +# sys.path.insert(0, '/home/wenxindong_google_com/tpu-inference') from tpu_inference.kernels.ragged_paged_attention.v3.kernel_hd64 import ( - ragged_paged_attention_hd64, get_kv_cache_shape, ) from tpu_inference.layers.common.sharding import ShardingAxisName +from tpu_inference.layers.common.attention_metadata import AttentionMetadata def create_test_inputs( - batch_size: int = 256, + batch_size: int = 256, max_num_tokens: int = 256, num_q_heads: int = 32, num_kv_heads: int = 8, head_dim: int = 64, page_size: int = 256, - pages_per_seq: int = 16, total_num_pages: int = 8282, dp_size: int = 1, ): - # batch_size = batch_size * dp_size total_num_pages = total_num_pages * dp_size - # Q, K, V tensors - use unique seeds for each DP replica + # Q, K, V tensors q = jnp.concatenate([jax.random.normal( - jax.random.PRNGKey(0), # Unique seed per replica + jax.random.PRNGKey(0), (max_num_tokens, num_q_heads, head_dim), dtype=jnp.bfloat16, ) for i in range(dp_size)], axis=0) k = jnp.concatenate([jax.random.normal( - jax.random.PRNGKey(0), # Unique seed per replica + jax.random.PRNGKey(0), (max_num_tokens, num_kv_heads, head_dim), dtype=jnp.bfloat16, ) for i in range(dp_size)], axis=0) v = jnp.concatenate([jax.random.normal( - jax.random.PRNGKey(0), # Unique seed per replica + jax.random.PRNGKey(0), (max_num_tokens, num_kv_heads, head_dim), dtype=jnp.bfloat16, ) for i in range(dp_size)], axis=0) @@ -67,34 +63,1385 @@ def create_test_inputs( head_dim, jnp.bfloat16, ) - kv_cache = jnp.zeros(kv_cache_shape, dtype=jnp.bfloat16) + kv_cache = jax.random.normal(jax.random.PRNGKey(0), kv_cache_shape, dtype=jnp.bfloat16) - # kv_lens: each DP rank has its own requests - kv_lens = [] - for dp_rank in range(dp_size): - kv_lens.append([1024 for _ in range(batch_size)]) - kv_lens = jnp.array(kv_lens, dtype=jnp.int32).reshape(-1) + + # Actual seq_lens from the log for step 849 + seq_lens_rank0 = [2897, 2896, 2896, 2896, 2895, 2895, 2895, 2895, 2894, 2894, 2894, 2894, 2893, 2893, + 2893, 2893, 2892, 2892, 2892, 2892, 2891, 2891, 2891, 2891, 2890, 2890, 2890, 2890, + 2889, 2889, 2889, 2889, 2888, 2888, 2888, 2888, 2887, 2887, 2887, 2887, 2886, 2886, + 2886, 2886, 2885, 2885, 2885, 2885, 2884, 2884, 2884, 2884, 2883, 2883, 2883, 2883, + 2882, 2882, 2882, 2882, 2881, 2881, 2881, 2881, 2880, 2880, 2880, 2880, 2879, 2879, + 2879, 2879, 2878, 2878, 2878, 2878, 2877, 2877, 2877, 2877, 2876, 2876, 2876, 2876, + 2875, 2875, 2875, 2875, 2874, 2874, 2874, 2874, 2873, 2873, 2873, 2873, 2872, 2872, + 2872, 2872, 2871, 2871, 2871, 2871, 2870, 2870, 2870, 2870, 2869, 2869, 2869, 2869, + 2868, 2868, 2868, 2868, 2867, 2867, 2867, 2867, 2866, 2866, 2866, 2866, 2865, 2865, + 2865, 2865, 2864, 2864, 2864, 2863, 2863, 2863, 2863, 2862, 2862, 2862, 2862, 2861, + 2861, 2861, 2861, 2860, 2860, 2860, 2860, 2859, 2859, 2859, 2859, 2858, 2858, 2858, + 2858, 2857, 2857, 2857, 2857, 2856, 2856, 2856, 2856, 2855, 2855, 2855, 2855, 2854, + 2854, 2854, 2854, 2853, 2853, 2853, 2853, 2852, 2852, 2852, 2852, 2851, 2851, 2851, + 2850, 2850, 2850, 2850, 2849, 2849, 2849, 2849, 2848, 2848, 2848, 2848, 2847, 2847, + 2847, 2847, 2846, 2846, 2846, 2846, 2845, 2845, 2845, 2845, 2844, 2844, 2844, 2844, + 2843, 2843, 2843, 2843, 2842, 2842, 2842, 2842, 2841, 2841, 2841, 2841, 2840, 2840, + 2840, 2839, 2839, 2839, 2839, 2838, 2838, 2838, 2838, 2837, 2837, 2837, 2837, 2836, + 2836, 2836, 2836, 2835, 2835, 2835, 2835, 2834, 2834, 2834, 2834, 2833, 2833, 2833, + 2833, 2832, 2832, 2832] - # Page indices: each DP rank manages its own pages - page_indices = jnp.concatenate([jnp.arange( - batch_size * pages_per_seq, dtype=jnp.int32 - ) for _ in range(dp_size)]) + seq_lens_rank1 = [2896, 2896, 2896, 2896, 2895, 2895, 2895, 2894, 2894, 2894, 2894, 2893, 2893, 2893, + 2893, 2892, 2892, 2892, 2892, 2891, 2891, 2891, 2891, 2890, 2890, 2890, 2890, 2889, + 2889, 2889, 2889, 2888, 2888, 2888, 2888, 2887, 2887, 2887, 2887, 2886, 2886, 2886, + 2886, 2885, 2885, 2885, 2885, 2884, 2884, 2884, 2884, 2883, 2883, 2883, 2883, 2882, + 2882, 2882, 2882, 2881, 2881, 2881, 2881, 2880, 2880, 2880, 2880, 2879, 2879, 2879, + 2879, 2878, 2878, 2878, 2878, 2877, 2877, 2877, 2877, 2876, 2876, 2876, 2876, 2875, + 2875, 2875, 2875, 2874, 2874, 2874, 2874, 2873, 2873, 2873, 2873, 2872, 2872, 2872, + 2872, 2871, 2871, 2871, 2871, 2870, 2870, 2870, 2870, 2869, 2869, 2869, 2869, 2868, + 2868, 2868, 2868, 2867, 2867, 2867, 2867, 2866, 2866, 2866, 2866, 2865, 2865, 2865, + 2865, 2864, 2864, 2864, 2863, 2863, 2863, 2863, 2862, 2862, 2862, 2862, 2861, 2861, + 2861, 2861, 2860, 2860, 2860, 2860, 2859, 2859, 2859, 2859, 2858, 2858, 2858, 2858, + 2857, 2857, 2857, 2857, 2856, 2856, 2856, 2856, 2855, 2855, 2855, 2855, 2854, 2854, + 2854, 2854, 2853, 2853, 2853, 2853, 2852, 2852, 2852, 2852, 2851, 2851, 2851, 2851, + 2850, 2850, 2850, 2849, 2849, 2849, 2849, 2848, 2848, 2848, 2848, 2847, 2847, 2847, + 2847, 2846, 2846, 2846, 2846, 2845, 2845, 2845, 2845, 2844, 2844, 2844, 2844, 2843, + 2843, 2843, 2843, 2842, 2842, 2842, 2842, 2841, 2841, 2841, 2841, 2840, 2840, 2840, + 2839, 2839, 2839, 2839, 2838, 2838, 2838, 2838, 2837, 2837, 2837, 2837, 2836, 2836, + 2836, 2836, 2835, 2835, 2835, 2835, 2834, 2834, 2834, 2834, 2833, 2833, 2833, 2833, + 2832, 2832, 2832, 2831] + # from step 1698 + seq_len_no_dp = [3745, 3745, 3743, 3743, 3743, 3742, 3742, 3742, 3742, 3741, 3741, + 3741, 3741, 3740, 3740, 3740, 3740, 3739, 3739, 3739, 3739, 3738, + 3738, 3738, 3738, 3737, 3737, 3737, 3737, 3736, 3736, 3736, 3736, + 3735, 3735, 3735, 3735, 3734, 3734, 3734, 3734, 3733, 3733, 3733, + 3733, 3732, 3732, 3732, 3732, 3731, 3731, 3731, 3731, 3730, 3730, + 3730, 3730, 3729, 3729, 3729, 3729, 3728, 3728, 3728, 3728, 3727, + 3727, 3727, 3727, 3726, 3726, 3726, 3726, 3725, 3725, 3725, 3725, + 3724, 3724, 3724, 3724, 3723, 3723, 3723, 3723, 3722, 3722, 3722, + 3722, 3721, 3721, 3721, 3721, 3720, 3720, 3720, 3720, 3719, 3719, + 3719, 3719, 3718, 3718, 3718, 3718, 3717, 3717, 3717, 3717, 3716, + 3716, 3716, 3716, 3715, 3715, 3715, 3715, 3714, 3714, 3714, 3714, + 3713, 3713, 3713, 3713, 3712, 3712, 3712, 3712, 3711, 3711, 3711, + 3710, 3710, 3710, 3710, 3709, 3709, 3709, 3709, 3708, 3708, 3708, + 3708, 3707, 3707, 3707, 3707, 3706, 3706, 3706, 3706, 3705, 3705, + 3705, 3705, 3704, 3704, 3704, 3704, 3703, 3703, 3703, 3703, 3702, + 3702, 3702, 3702, 3701, 3701, 3701, 3701, 3700, 3700, 3700, 3700, + 3699, 3699, 3699, 3699, 3698, 3698, 3698, 3697, 3697, 3697, 3697, + 3696, 3696, 3696, 3696, 3695, 3695, 3695, 3695, 3694, 3694, 3694, + 3694, 3693, 3693, 3693, 3693, 3692, 3692, 3692, 3692, 3691, 3691, + 3691, 3691, 3690, 3690, 3690, 3690, 3689, 3689, 3689, 3689, 3688, + 3688, 3688, 3687, 3687, 3687, 3687, 3686, 3686, 3686, 3686, 3685, + 3685, 3685, 3685, 3684, 3684, 3684, 3684, 3683, 3683, 3683, 3683, + 3682, 3682, 3682, 3682, 3681, 3681, 3681, 3681, 3680, 3680, 3680, + 3680, 3679, 3679] - # cu_q_lens: cumulative query lengths PER DP RANK - cu_q_lens = [] - for _ in range(dp_size): - cu_q_lens.append([1 * i for i in range(batch_size + 1)]) - cu_q_lens = jnp.array(cu_q_lens, dtype=jnp.int32).reshape(-1) - - # Distribution: per DP rank [decode_end, prefill_end, mixed_end] + # query_start_loc is just [0, 1, 2, ..., 256] for both ranks + query_start_loc_per_rank = list(range(257)) + + # Construct kv_lens and cu_q_lens based on dp_size + if dp_size == 1: + kv_lens = jnp.array(seq_len_no_dp, dtype=jnp.int32) + cu_q_lens = jnp.array(query_start_loc_per_rank, dtype=jnp.int32) + elif dp_size == 2: + kv_lens = jnp.array(seq_lens_rank0 + seq_lens_rank1, dtype=jnp.int32) + cu_q_lens = jnp.array(query_start_loc_per_rank + query_start_loc_per_rank, dtype=jnp.int32) + + # Distribution: [0, 0, 256] per rank (all decode mode) distribution_list = [] for _ in range(dp_size): distribution_list.extend([0, 0, batch_size]) distribution = jnp.array(distribution_list, dtype=jnp.int32) + + + page_indices_rank0 = [[ 1, 2, 3, 4, 5, 6, 7 , 8, 9, 2305, 2561, 2817, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 10, 11, 12, 13, 14, 15, 16, 17, 42, 2306, 2562, 2818, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 18, 19, 20, 21, 22, 23, 24, 25, 43, 2307, 2563, 2819, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 26, 27, 28, 29, 30, 31, 32, 33, 44, 2308, 2564, 2820, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 34, 35, 36, 37, 38, 39, 40, 41, 77, 2309, 2565, 2821, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 45, 46, 47, 48, 49, 50, 51, 52, 78, 2310, 2566, 2822, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 53, 54, 55, 56, 57, 58, 59, 60, 79, 2311, 2567, 2823, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 61, 62, 63, 64, 65, 66, 67, 68, 80, 2312, 2568, 2824, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 69, 70, 71, 72, 73, 74, 75, 76, 113, 2313, 2569, 2825, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 81, 82, 83, 84, 85, 86 , 87 , 88, 114, 2314, 2570, 2826, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 89 , 90 , 91 , 92, 93, 94, 95, 96, 115, 2315, 2571, 2827, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 97 , 98 , 99, 100, 101, 102, 103, 104, 116, 2316, 2572, 2828, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 105, 106, 107, 108, 109, 110, 111, 112, 149, 2317, 2573, 2829, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 117, 118, 119, 120, 121, 122, 123, 124, 150, 2318, 2574, 2830, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 125, 126, 127, 128, 129, 130, 131, 132, 151, 2319, 2575, 2831, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 133, 134, 135, 136, 137, 138, 139, 140, 152, 2320, 2576, 2832, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 141, 142, 143, 144, 145, 146, 147, 148, 185, 2321, 2577, 2833, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 153, 154, 155, 156, 157, 158, 159, 160, 186, 2322, 2578, 2834, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 161, 162, 163, 164, 165, 166, 167, 168, 187, 2323, 2579, 2835, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 169, 170, 171, 172, 173, 174, 175, 176, 188, 2324, 2580, 2836, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 177, 178, 179, 180, 181, 182, 183, 184, 221, 2325, 2581, 2837, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 189, 190, 191, 192, 193, 194, 195, 196, 222, 2326, 2582, 2838, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 197, 198, 199, 200, 201, 202, 203, 204, 223, 2327, 2583, 2839, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 205, 206, 207, 208, 209, 210, 211, 212, 224, 2328, 2584, 2840, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 213, 214, 215, 216, 217, 218, 219, 220, 257, 2329, 2585, 2841, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 225, 226, 227, 228, 229, 230, 231, 232, 258, 2330, 2586, 2842, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 233, 234, 235, 236, 237, 238, 239, 240, 259, 2331, 2587, 2843, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 241, 242, 243, 244, 245, 246, 247, 248, 260, 2332, 2588, 2844, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 249, 250, 251, 252, 253, 254, 255, 256, 293, 2333, 2589, 2845, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 261, 262, 263, 264, 265, 266, 267, 268, 294, 2334, 2590, 2846, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 269, 270, 271, 272, 273, 274, 275, 276, 295, 2335, 2591, 2847, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 277, 278, 279, 280, 281, 282, 283, 284, 296, 2336, 2592, 2848, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 285, 286, 287, 288, 289, 290, 291, 292, 329, 2337, 2593, 2849, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 297, 298, 299, 300, 301, 302, 303, 304, 330, 2338, 2594, 2850, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 305, 306, 307, 308, 309, 310, 311, 312, 331, 2339, 2595, 2851, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 313, 314, 315, 316, 317, 318, 319, 320, 332, 2340, 2596, 2852, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 321, 322, 323, 324, 325, 326, 327, 328, 365, 2341, 2597, 2853, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 333, 334, 335, 336, 337, 338, 339, 340, 366, 2342, 2598, 2854, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 341, 342, 343, 344, 345, 346, 347, 348, 367, 2343, 2599, 2855, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 349, 350, 351, 352, 353, 354, 355, 356, 368, 2344, 2600, 2856, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 357, 358, 359, 360, 361, 362, 363, 364, 401, 2345, 2601, 2857, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 369, 370, 371, 372, 373, 374, 375, 376, 402, 2346, 2602, 2858, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 377, 378, 379, 380, 381, 382, 383, 384, 403, 2347, 2603, 2859, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 385, 386, 387, 388, 389, 390, 391, 392, 404, 2348, 2604, 2860, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 393, 394, 395, 396, 397, 398, 399, 400, 436, 2349, 2605, 2861, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 405, 406, 407, 408, 409, 410, 411, 412, 437, 2350, 2606, 2862, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 413, 414, 415, 416, 417, 418, 419, 420, 438, 2351, 2607, 2863, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 421, 422, 423, 424, 425, 426, 427, 428, 439, 2352, 2608, 2864, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 429, 430, 431, 432, 433, 434, 435, 440, 472, 2353, 2609, 2865, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 441, 442, 443, 444, 445, 446, 447, 448, 473, 2354, 2610, 2866, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 449, 450, 451, 452, 453, 454, 455, 456, 474, 2355, 2611, 2867, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 457, 458, 459, 460, 461, 462, 463, 464, 475, 2356, 2612, 2868, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 465, 466, 467, 468, 469, 470, 471, 476, 508, 2357, 2613, 2869, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 477, 478, 479, 480, 481, 482, 483, 484, 509, 2358, 2614, 2870, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 485, 486, 487, 488, 489, 490, 491, 492, 510, 2359, 2615, 2871, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 493, 494, 495, 496, 497, 498, 499, 500, 511, 2360, 2616, 2872, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 501, 502, 503, 504, 505, 506, 507, 512, 544, 2361, 2617, 2873, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 513, 514, 515, 516, 517, 518, 519, 520, 545, 2362, 2618, 2874, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 521, 522, 523, 524, 525, 526, 527, 528, 546, 2363, 2619, 2875, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 529, 530, 531, 532, 533, 534, 535, 536, 547, 2364, 2620, 2876, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 537, 538, 539, 540, 541, 542, 543, 548, 580, 2365, 2621, 2877, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 549, 550, 551, 552, 553, 554, 555, 556, 581, 2366, 2622, 2878, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 557, 558, 559, 560, 561, 562, 563, 564, 582, 2367, 2623, 2879, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 565, 566, 567, 568, 569, 570, 571, 572, 583, 2368, 2624, 2880, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 573, 574, 575, 576, 577, 578, 579, 584, 615, 2369, 2625, 2881, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 585, 586, 587, 588, 589, 590, 591, 592, 616, 2370, 2626, 2882, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 593, 594, 595, 596, 597, 598, 599, 600, 617, 2371, 2627, 2883, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 601, 602, 603, 604, 605, 606, 607, 608, 618, 2372, 2628, 2884, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 609, 610, 611, 612, 613, 614, 619, 620, 651, 2373, 2629, 2885, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 621, 622, 623, 624, 625, 626, 627, 628, 652, 2374, 2630, 2886, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 629, 630, 631, 632, 633, 634, 635, 636, 653, 2375, 2631, 2887, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 637, 638, 639, 640, 641, 642, 643, 644, 654, 2376, 2632, 2888, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 645, 646, 647, 648, 649, 650, 655, 656, 687, 2377, 2633, 2889, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 657, 658, 659, 660, 661, 662, 663, 664, 688, 2378, 2634, 2890, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 665, 666, 667, 668, 669, 670, 671, 672, 689, 2379, 2635, 2891, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 673, 674, 675, 676, 677, 678, 679, 680, 690, 2380, 2636, 2892, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 681, 682, 683, 684, 685, 686, 691, 692, 723, 2381, 2637, 2893, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 693, 694, 695, 696, 697, 698, 699, 700, 724, 2382, 2638, 2894, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 701, 702, 703, 704, 705, 706, 707, 708, 725, 2383, 2639, 2895, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 709, 710, 711, 712, 713, 714, 715, 716, 726, 2384, 2640, 2896, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 717, 718, 719, 720, 721, 722, 727, 728, 758, 2385, 2641, 2897, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 729, 730, 731, 732, 733, 734, 735, 736, 759, 2386, 2642, 2898, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 737, 738, 739, 740, 741, 742, 743, 744, 760, 2387, 2643, 2899, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 745, 746, 747, 748, 749, 750, 751, 752, 761, 2388, 2644, 2900, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 753, 754, 755, 756, 757, 762, 763, 764, 794, 2389, 2645, 2901, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 765, 766, 767, 768, 769, 770, 771, 772, 795, 2390, 2646, 2902, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 773, 774, 775, 776, 777, 778, 779, 780, 796, 2391, 2647, 2903, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 781, 782, 783, 784, 785, 786, 787, 788, 797, 2392, 2648, 2904, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 789, 790, 791, 792, 793, 798, 799, 800, 830, 2393, 2649, 2905, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 801, 802, 803, 804, 805, 806, 807, 808, 831, 2394, 2650, 2906, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 809, 810, 811, 812, 813, 814, 815, 816, 832, 2395, 2651, 2907, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 817, 818, 819, 820, 821, 822, 823, 824, 833, 2396, 2652, 2908, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 825, 826, 827, 828, 829, 834, 835, 836, 865, 2397, 2653, 2909, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 837, 838, 839, 840, 841, 842, 843, 844, 866, 2398, 2654, 2910, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 845, 846, 847, 848, 849, 850, 851, 852, 867, 2399, 2655, 2911, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 853, 854, 855, 856, 857, 858, 859, 860, 868, 2400, 2656, 2912, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 861, 862, 863, 864, 869, 870, 871, 872, 901, 2401, 2657, 2913, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 873, 874, 875, 876, 877, 878, 879, 880, 902, 2402, 2658, 2914, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 881, 882, 883, 884, 885, 886, 887, 888, 903, 2403, 2659, 2915, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 889, 890, 891, 892, 893, 894, 895, 896, 904, 2404, 2660, 2916, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 897, 898, 899, 900, 905, 906, 907, 908, 936, 2405, 2661, 2917, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 909, 910, 911, 912, 913, 914, 915, 916, 937, 2406, 2662, 2918, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 917, 918, 919, 920, 921, 922, 923, 924, 938, 2407, 2663, 2919, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 925, 926, 927, 928, 929, 930, 931, 932, 939, 2408, 2664, 2920, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 933, 934, 935, 940, 941, 942, 943, 944, 972, 2409, 2665, 2921, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 945, 946, 947, 948, 949, 950, 951, 952, 973, 2410, 2666, 2922, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 953, 954, 955, 956, 957, 958, 959, 960, 974, 2411, 2667, 2923, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 961, 962, 963, 964, 965, 966, 967, 968, 975, 2412, 2668, 2924, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 969, 970, 971, 976, 977, 978, 979, 980, 1008, 2413, 2669, 2925, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 981, 982, 983, 984, 985, 986, 987, 988, 1009, 2414, 2670, 2926, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 989, 990, 991, 992, 993, 994, 995, 996, 1010, 2415, 2671, 2927, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 997, 998, 999, 1000, 1001, 1002,1003, 1004, 1011, 2416, 2672, 2928, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1005, 1006, 1007, 1012,1013, 1014, 1015, 1016, 1043, 2417, 2673, 2929, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1017, 1018, 1019, 1020, 1021, 1022,1023, 1024, 1044, 2418, 2674, 2930, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1025, 1026, 1027, 1028, 1029, 1030, 1031, 1032,1045, 2419, 2675, 2931, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1033, 1034, 1035, 1036, 1037, 1038, 1039, 1040, 1046, 2420, 2676, 2932, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1041, 1042,1047, 1048, 1049, 1050, 1051, 1052,1079, 2421, 2677, 2933, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1053, 1054, 1055, 1056, 1057, 1058, 1059, 1060, 1080, 2422, 2678, 2934, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1061, 1062,1063, 1064, 1065, 1066, 1067, 1068, 1081, 2423, 2679, 2935, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1069, 1070, 1071, 1072,1073, 1074, 1075, 1076, 1082, 2424, 2680, 2936, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1077, 1078, 1083, 1084, 1085, 1086, 1087, 1088, 1114, 2425, 2681, 2937, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1089, 1090, 1091, 1092,1093, 1094, 1095, 1096, 1115, 2426, 2682, 2938, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1097, 1098, 1099, 1100, 1101, 1102,1103, 1104, 1116, 2427, 2683, 2939, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1105, 1106, 1107, 1108, 1109, 1110, 1111, 1112,1117, 2428, 2684, 2940, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1113, 1118, 1119, 1120, 1121, 1122,1123, 1124, 1150, 2429, 2685, 2941, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1125, 1126, 1127, 1128, 1129, 1130, 1131, 1132,1151, 2430, 2686, 2942, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1133, 1134, 1135, 1136, 1137, 1138, 1139, 1140, 1152, 2431, 2687, 2943, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1141, 1142,1143, 1144, 1145, 1146, 1147, 1148, 1153, 2432, 2688, 2944, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1149, 1154, 1155, 1156, 1157, 1158, 1159, 1160, 1185, 2433, 2689, 2945, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1161, 1162,1163, 1164, 1165, 1166, 1167, 1168, 1186, 2434, 2690, 2946, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1169, 1170, 1171, 1172,1173, 1174, 1175, 1176, 1187, 2435, 2691, 2947, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1177, 1178, 1179, 1180, 1181, 1182,1183, 1184, 1220, 2436, 2692, 2948, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1188, 1189, 1190, 1191, 1192,1193, 1194, 1195, 1221, 2437, 2693, 2949, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1196, 1197, 1198, 1199, 1200, 1201, 1202,1203, 1222, 2438, 2694, 2950, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1204, 1205, 1206, 1207, 1208, 1209, 1210, 1211, 1223, 2439, 2695, 2951, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1212,1213, 1214, 1215, 1216, 1217, 1218, 1219, 1255, 2440, 2696, 2952, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1224, 1225, 1226, 1227, 1228, 1229, 1230, 1231, 1256, 2441, 2697, 2953, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1232,1233, 1234, 1235, 1236, 1237, 1238, 1239, 1257, 2442, 2698, 2954, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1240, 1241, 1242,1243, 1244, 1245, 1246, 1247, 1258, 2443, 2699, 2955, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1248, 1249, 1250, 1251, 1252,1253, 1254, 1259, 1291, 2444, 2700, 2956, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1260, 1261, 1262,1263, 1264, 1265, 1266, 1267, 1292, 2445, 2701, 2957, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1268, 1269, 1270, 1271, 1272,1273, 1274, 1275, 1293, 2446, 2702, 2958, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1276, 1277, 1278, 1279, 1280, 1281, 1282,1283, 1294, 2447, 2703, 2959, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1284, 1285, 1286, 1287, 1288, 1289, 1290, 1295, 1326, 2448, 2704, 2960, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1296, 1297, 1298, 1299, 1300, 1301, 1302,1303, 1327, 2449, 2705, 2961, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1304, 1305, 1306, 1307, 1308, 1309, 1310, 1311, 1328, 2450, 2706, 2962, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1312,1313, 1314, 1315, 1316, 1317, 1318, 1319, 1329, 2451, 2707, 2963, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1320, 1321, 1322,1323, 1324, 1325, 1330, 1331, 1362, 2452, 2708, 2964, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1332,1333, 1334, 1335, 1336, 1337, 1338, 1339, 1363, 2453, 2709, 2965, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1340, 1341, 1342,1343, 1344, 1345, 1346, 1347, 1364, 2454, 2710, 2966, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1348, 1349, 1350, 1351, 1352,1353, 1354, 1355, 1365, 2455, 2711, 2967, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1356, 1357, 1358, 1359, 1360, 1361, 1366, 1367, 1397, 2456, 2712, 2968, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1368, 1369, 1370, 1371, 1372,1373, 1374, 1375, 1398, 2457, 2713, 2969, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1376, 1377, 1378, 1379, 1380, 1381, 1382,1383, 1399, 2458, 2714, 2970, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1384, 1385, 1386, 1387, 1388, 1389, 1390, 1391, 1400, 2459, 2715, 2971, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1392,1393, 1394, 1395, 1396, 1401, 1402,1403, 1432, 2460, 2716, 2972, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1404, 1405, 1406, 1407, 1408, 1409, 1410, 1411, 1433, 2461, 2717, 2973, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1412,1413, 1414, 1415, 1416, 1417, 1418, 1419, 1434, 2462, 2718, 2974, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1420, 1421, 1422,1423, 1424, 1425, 1426, 1427, 1435, 2463, 2719, 2975, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1428, 1429, 1430, 1431, 1436, 1437, 1438, 1439, 1468, 2464, 2720, 2976, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1440, 1441, 1442,1443, 1444, 1445, 1446, 1447, 1469, 2465, 2721, 2977, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1448, 1449, 1450, 1451, 1452,1453, 1454, 1455, 1470, 2466, 2722, 2978, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1456, 1457, 1458, 1459, 1460, 1461, 1462,1463, 1471, 2467, 2723, 2979, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1464, 1465, 1466, 1467, 1472,1473, 1474, 1475, 1503, 2468, 2724, 2980, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1476, 1477, 1478, 1479, 1480, 1481, 1482,1483, 1504, 2469, 2725, 2981, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1484, 1485, 1486, 1487, 1488, 1489, 1490, 1491, 1505, 2470, 2726, 2982, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1492,1493, 1494, 1495, 1496, 1497, 1498, 1499, 1506, 2471, 2727, 2983, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1500, 1501, 1502,1507, 1508, 1509, 1510, 1511, 1538, 2472, 2728, 2984, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1512,1513, 1514, 1515, 1516, 1517, 1518, 1519, 1539, 2473, 2729, 2985, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1520, 1521, 1522,1523, 1524, 1525, 1526, 1527, 1540, 2474, 2730, 2986, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1528, 1529, 1530, 1531, 1532,1533, 1534, 1535, 1541, 2475, 2731, 2987, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1536, 1537, 1542,1543, 1544, 1545, 1546, 1547, 1574, 2476, 2732, 2988, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1548, 1549, 1550, 1551, 1552,1553, 1554, 1555, 1575, 2477, 2733, 2989, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1556, 1557, 1558, 1559, 1560, 1561, 1562,1563, 1576, 2478, 2734, 2990, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1564, 1565, 1566, 1567, 1568, 1569, 1570, 1571, 1577, 2479, 2735, 2991, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1572,1573, 1578, 1579, 1580, 1581, 1582,1583, 1609, 2480, 2736, 2992, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1584, 1585, 1586, 1587, 1588, 1589, 1590, 1591, 1610, 2481, 2737, 2993, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1592,1593, 1594, 1595, 1596, 1597, 1598, 1599, 1611, 2482, 2738, 2994, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1600, 1601, 1602,1603, 1604, 1605, 1606, 1607, 1612, 2483, 2739, 2995, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1608, 1613, 1614, 1615, 1616, 1617, 1618, 1619, 1644, 2484, 2740, 2996, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1620, 1621, 1622,1623, 1624, 1625, 1626, 1627, 1645, 2485, 2741, 2997, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1628, 1629, 1630, 1631, 1632,1633, 1634, 1635, 1646, 2486, 2742, 2998, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1636, 1637, 1638, 1639, 1640, 1641, 1642,1643, 1679, 2487, 2743, 2999, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1647, 1648, 1649, 1650, 1651, 1652,1653, 1654, 1680, 2488, 2744, 3000, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1655, 1656, 1657, 1658, 1659, 1660, 1661, 1662,1681, 2489, 2745, 3001, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1663, 1664, 1665, 1666, 1667, 1668, 1669, 1670, 1682, 2490, 2746, 3002, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1671, 1672,1673, 1674, 1675, 1676, 1677, 1678, 1714, 2491, 2747, 3003, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1683, 1684, 1685, 1686, 1687, 1688, 1689, 1690, 1715, 2492, 2748, 3004, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1691, 1692,1693, 1694, 1695, 1696, 1697, 1698, 1716, 2493, 2749, 3005, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1699, 1700, 1701, 1702,1703, 1704, 1705, 1706, 1717, 2494, 2750, 3006, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1707, 1708, 1709, 1710, 1711, 1712,1713, 1718, 1749, 2495, 2751, 3007, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1719, 1720, 1721, 1722,1723, 1724, 1725, 1726, 1750, 2496, 2752, 3008, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1727, 1728, 1729, 1730, 1731, 1732,1733, 1734, 1751, 2497, 2753, 3009, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1735, 1736, 1737, 1738, 1739, 1740, 1741, 1742,1752, 2498, 2754, 3010, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1743, 1744, 1745, 1746, 1747, 1748, 1753, 1754, 1784, 2499, 2755, 3011, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1755, 1756, 1757, 1758, 1759, 1760, 1761, 1762,1785, 2500, 2756, 3012, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1763, 1764, 1765, 1766, 1767, 1768, 1769, 1770, 1786, 2501, 2757, 3013, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1771, 1772,1773, 1774, 1775, 1776, 1777, 1778, 1787, 2502, 2758, 3014, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1779, 1780, 1781, 1782,1783, 1788, 1789, 1790, 1820, 2503, 2759, 3015, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1791, 1792,1793, 1794, 1795, 1796, 1797, 1798, 1821, 2504, 2760, 3016, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1799, 1800, 1801, 1802,1803, 1804, 1805, 1806, 1822, 2505, 2761, 3017, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1807, 1808, 1809, 1810, 1811, 1812,1813, 1814, 1823, 2506, 2762, 3018, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1815, 1816, 1817, 1818, 1819, 1824, 1825, 1826, 1855, 2507, 2763, 3019, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1827, 1828, 1829, 1830, 1831, 1832,1833, 1834, 1856, 2508, 2764, 3020, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1835, 1836, 1837, 1838, 1839, 1840, 1841, 1842,1857, 2509, 2765, 3021, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1843, 1844, 1845, 1846, 1847, 1848, 1849, 1850, 1858, 2510, 2766, 3022, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1851, 1852,1853, 1854, 1859, 1860, 1861, 1862,1890, 2511, 2767, 3023, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1863, 1864, 1865, 1866, 1867, 1868, 1869, 1870, 1891, 2512, 2768, 3024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1871, 1872,1873, 1874, 1875, 1876, 1877, 1878, 1892, 2513, 2769, 3025, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1879, 1880, 1881, 1882,1883, 1884, 1885, 1886, 1893, 2514, 2770, 3026, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1887, 1888, 1889, 1894, 1895, 1896, 1897, 1898, 1925, 2515, 2771, 3027, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1899, 1900, 1901, 1902,1903, 1904, 1905, 1906, 1926, 2516, 2772, 3028, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1907, 1908, 1909, 1910, 1911, 1912,1913, 1914, 1927, 2517, 2773, 3029, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1915, 1916, 1917, 1918, 1919, 1920, 1921, 1922,1928, 2518, 2774, 3030, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1923, 1924, 1929, 1930, 1931, 1932,1933, 1934, 1960, 2519, 2775, 3031, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1935, 1936, 1937, 1938, 1939, 1940, 1941, 1942,1961, 2520, 2776, 3032, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1943, 1944, 1945, 1946, 1947, 1948, 1949, 1950, 1962, 2521, 2777, 3033, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1951, 1952,1953, 1954, 1955, 1956, 1957, 1958, 1963, 2522, 2778, 3034, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1959, 1964, 1965, 1966, 1967, 1968, 1969, 1970, 1996, 2523, 2779, 3035, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1971, 1972,1973, 1974, 1975, 1976, 1977, 1978, 1997, 2524, 2780, 3036, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1979, 1980, 1981, 1982,1983, 1984, 1985, 1986, 1998, 2525, 2781, 3037, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1987, 1988, 1989, 1990, 1991, 1992,1993, 1994, 1999, 2526, 2782, 3038, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1995, 2000, 2001, 2002, 2003, 2004, 2005, 2006, 2031, 2527, 2783, 3039, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2007, 2008, 2009, 2010, 2011, 2012, 2013, 2014, 2032, 2528, 2784, 3040, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2015, 2016, 2017, 2018, 2019, 2020, 2021, 2022, 2033, 2529, 2785, 3041, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2023, 2024, 2025, 2026, 2027, 2028, 2029, 2030, 2065, 2530, 2786, 3042, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2034, 2035, 2036, 2037, 2038, 2039, 2040, 2041, 2066, 2531, 2787, 3043, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2042, 2043, 2044, 2045, 2046, 2047, 2048, 2049, 2067, 2532, 2788, 3044, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2050, 2051, 2052, 2053, 2054, 2055, 2056, 2057, 2068, 2533, 2789, 3045, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2058, 2059, 2060, 2061, 2062, 2063, 2064, 2069, 2100, 2534, 2790, 3046, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2070, 2071, 2072, 2073, 2074, 2075, 2076, 2077, 2101, 2535, 2791, 3047, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2078, 2079, 2080, 2081, 2082, 2083, 2084, 2085, 2102, 2536, 2792, 3048, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2086, 2087, 2088, 2089, 2090, 2091, 2092, 2093, 2103, 2537, 2793, 3049, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2094, 2095, 2096, 2097, 2098, 2099, 2104, 2105, 2135, 2538, 2794, 3050, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2106, 2107, 2108, 2109, 2110, 2111, 2112, 2113, 2136, 2539, 2795, 3051, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2114, 2115, 2116, 2117, 2118, 2119, 2120, 2121, 2137, 2540, 2796, 3052, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2122, 2123, 2124, 2125, 2126, 2127, 2128, 2129, 2138, 2541, 2797, 3053, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2130, 2131, 2132, 2133, 2134, 2139, 2140, 2141, 2170, 2542, 2798, 3054, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2142, 2143, 2144, 2145, 2146, 2147, 2148, 2149, 2171, 2543, 2799, 3055, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2150, 2151, 2152, 2153, 2154, 2155, 2156, 2157, 2172, 2544, 2800, 3056, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2158, 2159, 2160, 2161, 2162, 2163, 2164, 2165, 2173, 2545, 2801, 3057, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2166, 2167, 2168, 2169, 2174, 2175, 2176, 2177, 2205, 2546, 2802, 3058, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2178, 2179, 2180, 2181, 2182, 2183, 2184, 2185, 2206, 2547, 2803, 3059, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2186, 2187, 2188, 2189, 2190, 2191, 2192, 2193, 2207, 2548, 2804, 3060, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2194, 2195, 2196, 2197, 2198, 2199, 2200, 2201, 2208, 2549, 2805, 3061, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2202, 2203, 2204, 2209, 2210, 2211, 2212, 2213, 2240, 2550, 2806, 3062, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2214, 2215, 2216, 2217, 2218, 2219, 2220, 2221, 2241, 2551, 2807, 3063, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2222, 2223, 2224, 2225, 2226, 2227, 2228, 2229, 2242, 2552, 2808, 3064, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2230, 2231, 2232, 2233, 2234, 2235, 2236, 2237, 2243, 2553, 2809, 3065, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2238, 2239, 2244, 2245, 2246, 2247, 2248, 2249, 2275, 2554, 2810, 3066, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2250, 2251, 2252, 2253, 2254, 2255, 2256, 2257, 2276, 2555, 2811, 3067, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2258, 2259, 2260, 2261, 2262, 2263, 2264, 2265, 2277, 2556, 2812, 3068, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2266, 2267, 2268, 2269, 2270, 2271, 2272, 2273, 2278, 2557, 2813, 3069, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2274, 2279, 2280, 2281, 2282, 2283, 2284, 2285, 2302, 2558, 2814, 3070, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2286, 2287, 2288, 2289, 2290, 2291, 2292, 2293, 2303, 2559, 2815, 3071, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2294, 2295, 2296, 2297, 2298, 2299, 2300, 2301, 2304, 2560, 2816, 3072, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]] + + + page_indices_rank1 = [[ 1, 2, 3, 4, 5, 6, 7, 8, 33, 2305, 2561, 2817, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 9, 10, 11, 12, 13, 14, 15, 16, 34, 2306, 2562, 2818, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 17, 18, 19, 20, 21, 22, 23, 24, 35, 2307, 2563, 2819, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 25, 26, 27, 28, 29, 30, 31, 32, 36, 2308, 2564, 2820, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 53, 54, 55, 56, 57, 58, 59, 60, 71, 2311, 2567, 2823, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 37, 38, 39, 40, 41, 42, 43, 44, 69, 2309, 2565, 2821, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 45, 46, 47, 48, 49, 50, 51, 52, 70, 2310, 2566, 2822, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 61, 62, 63, 64, 65, 66, 67, 68, 104, 2312, 2568, 2824, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 88, 89 , 90 , 91, 92, 93, 94, 95, 107, 2315, 2571, 2827, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 72, 73, 74, 75, 76, 77, 78, 79, 105, 2313, 2569, 2825, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 80, 81, 82, 83, 84, 85 ,86, 87, 106, 2314, 2570, 2826, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 96, 97, 98, 99, 100, 101, 102, 103, 140, 2316, 2572, 2828, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 124, 125, 126, 127, 128, 129, 130, 131, 143, 2319, 2575, 2831, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 108, 109, 110, 111, 112, 113, 114, 115, 141, 2317, 2573, 2829, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 116, 117, 118, 119, 120, 121, 122, 123, 142, 2318, 2574, 2830, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 132, 133, 134, 135, 136, 137, 138, 139, 176, 2320, 2576, 2832, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 160, 161, 162, 163, 164, 165, 166, 167, 179, 2323, 2579, 2835, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 144, 145, 146, 147, 148, 149, 150, 151, 177, 2321, 2577, 2833, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 152, 153, 154, 155, 156, 157, 158, 159, 178, 2322, 2578, 2834, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 168, 169, 170, 171, 172, 173, 174, 175, 212, 2324, 2580, 2836, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 196, 197, 198, 199, 200, 201, 202, 203, 215, 2327, 2583, 2839, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 180, 181, 182, 183, 184, 185, 186, 187, 213, 2325, 2581, 2837, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 188, 189, 190, 191, 192, 193, 194, 195, 214, 2326, 2582, 2838, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 204, 205, 206, 207, 208, 209, 210, 211, 248, 2328, 2584, 2840, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 232, 233, 234, 235, 236, 237, 238, 239, 251, 2331, 2587, 2843, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 216, 217, 218, 219, 220, 221, 222, 223, 249, 2329, 2585, 2841, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 224, 225, 226, 227, 228, 229, 230, 231, 250, 2330, 2586, 2842, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 240, 241, 242, 243, 244, 245, 246, 247, 284, 2332, 2588, 2844, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 268, 269, 270, 271, 272, 273, 274, 275, 287, 2335, 2591, 2847, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 252, 253, 254, 255, 256, 257, 258, 259, 285, 2333, 2589, 2845, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 260, 261, 262, 263, 264, 265, 266, 267, 286, 2334, 2590, 2846, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 276, 277, 278, 279, 280, 281, 282, 283, 320, 2336, 2592, 2848, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 304, 305, 306, 307, 308, 309, 310, 311, 323, 2339, 2595, 2851, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 288, 289, 290, 291, 292, 293, 294, 295, 321, 2337, 2593, 2849, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 296, 297, 298, 299, 300, 301, 302, 303, 322, 2338, 2594, 2850, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 312, 313, 314, 315, 316, 317, 318, 319, 356, 2340, 2596, 2852, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 340, 341, 342, 343, 344, 345, 346, 347, 359, 2343, 2599, 2855, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 324, 325, 326, 327, 328, 329, 330, 331, 357, 2341, 2597, 2853, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 332, 333, 334, 335, 336, 337, 338, 339, 358, 2342, 2598, 2854, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 348, 349, 350, 351, 352, 353, 354, 355, 392, 2344, 2600, 2856, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 376, 377, 378, 379, 380, 381, 382, 383, 395, 2347, 2603, 2859, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 360, 361, 362, 363, 364, 365, 366, 367, 393, 2345, 2601, 2857, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 368, 369, 370, 371, 372, 373, 374, 375, 394, 2346, 2602, 2858, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 384, 385, 386, 387, 388, 389, 390, 391, 428, 2348, 2604, 2860, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 412, 413, 414, 415, 416, 417, 418, 419, 431, 2351, 2607, 2863, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 396, 397, 398, 399, 400, 401, 402, 403, 429, 2349, 2605, 2861, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 404, 405, 406, 407, 408, 409, 410, 411, 430, 2350, 2606, 2862, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 420, 421, 422, 423, 424, 425, 426, 427, 463, 2352, 2608, 2864, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 448, 449, 450, 451, 452, 453, 454, 455, 466, 2355, 2611, 2867, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 432, 433, 434, 435, 436, 437, 438, 439, 464, 2353, 2609, 2865, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 440, 441, 442, 443, 444, 445, 446, 447, 465, 2354, 2610, 2866, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 456, 457, 458, 459, 460, 461, 462, 467, 499, 2356, 2612, 2868, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 484, 485, 486, 487, 488, 489, 490, 491, 502, 2359, 2615, 2871, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 468, 469, 470, 471, 472, 473, 474, 475, 500, 2357, 2613, 2869, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 476, 477, 478, 479, 480, 481, 482, 483, 501, 2358, 2614, 2870, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 492, 493, 494, 495, 496, 497, 498, 503, 535, 2360, 2616, 2872, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 520, 521, 522, 523, 524, 525, 526, 527, 538, 2363, 2619, 2875, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 504, 505, 506, 507, 508, 509, 510, 511, 536, 2361, 2617, 2873, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 512, 513, 514, 515, 516, 517, 518, 519, 537, 2362, 2618, 2874, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 528, 529, 530, 531, 532, 533, 534, 539, 571, 2364, 2620, 2876, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 556, 557, 558, 559, 560, 561, 562, 563, 574, 2367, 2623, 2879, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 540, 541, 542, 543, 544, 545, 546, 547, 572, 2365, 2621, 2877, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 548, 549, 550, 551, 552, 553, 554, 555, 573, 2366, 2622, 2878, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 564, 565, 566, 567, 568, 569, 570, 575, 606, 2368, 2624, 2880, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 592, 593, 594, 595, 596, 597, 598, 599, 609, 2371, 2627, 2883, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 576, 577, 578, 579, 580, 581, 582, 583, 607, 2369, 2625, 2881, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 584, 585, 586, 587, 588, 589, 590, 591, 608, 2370, 2626, 2882, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 600, 601, 602, 603, 604, 605, 610, 611, 642, 2372, 2628, 2884, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 628, 629, 630, 631, 632, 633, 634, 635, 645, 2375, 2631, 2887, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 612, 613, 614, 615, 616, 617, 618, 619, 643, 2373, 2629, 2885, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 620, 621, 622, 623, 624, 625, 626, 627, 644, 2374, 2630, 2886, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 636, 637, 638, 639, 640, 641, 646, 647, 678, 2376, 2632, 2888, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 664, 665, 666, 667, 668, 669, 670, 671, 681, 2379, 2635, 2891, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 648, 649, 650, 651, 652, 653, 654, 655, 679, 2377, 2633, 2889, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 656, 657, 658, 659, 660, 661, 662, 663, 680, 2378, 2634, 2890, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 672, 673, 674, 675, 676, 677, 682, 683, 714, 2380, 2636, 2892, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 700, 701, 702, 703, 704, 705, 706, 707, 717, 2383, 2639, 2895, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 684, 685, 686, 687, 688, 689, 690, 691, 715, 2381, 2637, 2893, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 692, 693, 694, 695, 696, 697, 698, 699, 716, 2382, 2638, 2894, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 708, 709, 710, 711, 712, 713, 718, 719, 749, 2384, 2640, 2896, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 736, 737, 738, 739, 740, 741, 742, 743, 752, 2387, 2643, 2899, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 720, 721, 722, 723, 724, 725, 726, 727, 750, 2385, 2641, 2897, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 728, 729, 730, 731, 732, 733, 734, 735, 751, 2386, 2642, 2898, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 744, 745, 746, 747, 748, 753, 754, 755, 785, 2388, 2644, 2900, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 772, 773, 774, 775, 776, 777, 778, 779, 788, 2391, 2647, 2903, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 756, 757, 758, 759, 760, 761, 762, 763, 786, 2389, 2645, 2901, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 764, 765, 766, 767, 768, 769, 770, 771, 787, 2390, 2646, 2902, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 780, 781, 782, 783, 784, 789, 790, 791, 821, 2392, 2648, 2904, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 808, 809, 810, 811, 812, 813, 814, 815, 824, 2395, 2651, 2907, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 792, 793, 794, 795, 796, 797, 798, 799, 822, 2393, 2649, 2905, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 800, 801, 802, 803, 804, 805, 806, 807, 823, 2394, 2650, 2906, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 816, 817, 818, 819, 820, 825, 826, 827, 856, 2396, 2652, 2908, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 844, 845, 846, 847, 848, 849, 850, 851, 859, 2399, 2655, 2911, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 828, 829, 830, 831, 832, 833, 834, 835, 857, 2397, 2653, 2909, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 836, 837, 838, 839, 840, 841, 842, 843, 858, 2398, 2654, 2910, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 852, 853, 854, 855, 860, 861, 862, 863, 892, 2400, 2656, 2912, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 880, 881, 882, 883, 884, 885, 886, 887, 895, 2403, 2659, 2915, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 864, 865, 866, 867, 868, 869, 870, 871, 893, 2401, 2657, 2913, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 872, 873, 874, 875, 876, 877, 878, 879, 894, 2402, 2658, 2914, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 888, 889, 890, 891, 896, 897, 898, 899, 928, 2404, 2660, 2916, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 916, 917, 918, 919, 920, 921, 922, 923, 931, 2407, 2663, 2919, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 900, 901, 902, 903, 904, 905, 906, 907, 929, 2405, 2661, 2917, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 908, 909, 910, 911, 912, 913, 914, 915, 930, 2406, 2662, 2918, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 924, 925, 926, 927, 932, 933, 934, 935, 963, 2408, 2664, 2920, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 952, 953, 954, 955, 956, 957, 958, 959, 966, 2411, 2667, 2923, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 936, 937, 938, 939, 940, 941, 942, 943, 964, 2409, 2665, 2921, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 944, 945, 946, 947, 948, 949, 950, 951, 965, 2410, 2666, 2922, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 960, 961, 962, 967, 968, 969, 970, 971, 999, 2412, 2668, 2924, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 988, 989, 990, 991, 992, 993, 994, 995, 1002, 2415, 2671, 2927, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 972, 973, 974, 975, 976, 977, 978, 979, 1000, 2413, 2669, 2925, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 980, 981, 982, 983, 984, 985, 986, 987, 1001, 2414, 2670, 2926, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 996, 997, 998, 1003, 1004, 1005, 1006, 1007, 1034, 2416, 2672, 2928, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1024, 1025, 1026, 1027, 1028, 1029, 1030, 1031, 1037, 2419, 2675, 2931, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1008, 1009, 1010, 1011, 1012,1013, 1014, 1015, 1035, 2417, 2673, 2929, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1016, 1017, 1018, 1019, 1020, 1021, 1022,1023, 1036, 2418, 2674, 2930, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1032,1033, 1038, 1039, 1040, 1041, 1042,1043, 1070, 2420, 2676, 2932, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1060, 1061, 1062,1063, 1064, 1065, 1066, 1067, 1073, 2423, 2679, 2935, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1044, 1045, 1046, 1047, 1048, 1049, 1050, 1051, 1071, 2421, 2677, 2933, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1052,1053, 1054, 1055, 1056, 1057, 1058, 1059, 1072, 2422, 2678, 2934, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1068, 1069, 1074, 1075, 1076, 1077, 1078, 1079, 1105, 2424, 2680, 2936, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1096, 1097, 1098, 1099, 1100, 1101, 1102,1103, 1108, 2427, 2683, 2939, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1080, 1081, 1082,1083, 1084, 1085, 1086, 1087, 1106, 2425, 2681, 2937, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1088, 1089, 1090, 1091, 1092,1093, 1094, 1095, 1107, 2426, 2682, 2938, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1104, 1109, 1110, 1111, 1112,1113, 1114, 1115, 1141, 2428, 2684, 2940, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1132,1133, 1134, 1135, 1136, 1137, 1138, 1139, 1144, 2431, 2687, 2943, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1116, 1117, 1118, 1119, 1120, 1121, 1122,1123, 1142, 2429, 2685, 2941, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1124, 1125, 1126, 1127, 1128, 1129, 1130, 1131, 1143, 2430, 2686, 2942, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1140, 1145, 1146, 1147, 1148, 1149, 1150, 1151, 1176, 2432, 2688, 2944, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1160, 1161, 1162,1163, 1164, 1165, 1166, 1167, 1178, 2434, 2690, 2946, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1152,1153, 1154, 1155, 1156, 1157, 1158, 1159, 1177, 2433, 2689, 2945, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1168, 1169, 1170, 1171, 1172,1173, 1174, 1175, 1211, 2435, 2691, 2947, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1195, 1196, 1197, 1198, 1199, 1200, 1201, 1202,1214, 2438, 2694, 2950, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1179, 1180, 1181, 1182,1183, 1184, 1185, 1186, 1212, 2436, 2692, 2948, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1187, 1188, 1189, 1190, 1191, 1192,1193, 1194, 1213, 2437, 2693, 2949, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1203, 1204, 1205, 1206, 1207, 1208, 1209, 1210, 1246, 2439, 2695, 2951, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1231, 1232,1233, 1234, 1235, 1236, 1237, 1238, 1249, 2442, 2698, 2954, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1215, 1216, 1217, 1218, 1219, 1220, 1221, 1222,1247, 2440, 2696, 2952, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1223, 1224, 1225, 1226, 1227, 1228, 1229, 1230, 1248, 2441, 2697, 2953, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1239, 1240, 1241, 1242,1243, 1244, 1245, 1250, 1282, 2443, 2699, 2955, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1267, 1268, 1269, 1270, 1271, 1272,1273, 1274, 1285, 2446, 2702, 2958, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1251, 1252,1253, 1254, 1255, 1256, 1257, 1258, 1283, 2444, 2700, 2956, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1259, 1260, 1261, 1262,1263, 1264, 1265, 1266, 1284, 2445, 2701, 2957, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1275, 1276, 1277, 1278, 1279, 1280, 1281, 1286, 1317, 2447, 2703, 2959, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1303, 1304, 1305, 1306, 1307, 1308, 1309, 1310, 1320, 2450, 2706, 2962, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1287, 1288, 1289, 1290, 1291, 1292,1293, 1294, 1318, 2448, 2704, 2960, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1295, 1296, 1297, 1298, 1299, 1300, 1301, 1302,1319, 2449, 2705, 2961, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1311, 1312,1313, 1314, 1315, 1316, 1321, 1322,1353, 2451, 2707, 2963, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1339, 1340, 1341, 1342,1343, 1344, 1345, 1346, 1356, 2454, 2710, 2966, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1323, 1324, 1325, 1326, 1327, 1328, 1329, 1330, 1354, 2452, 2708, 2964, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1331, 1332,1333, 1334, 1335, 1336, 1337, 1338, 1355, 2453, 2709, 2965, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1347, 1348, 1349, 1350, 1351, 1352,1357, 1358, 1388, 2455, 2711, 2967, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1375, 1376, 1377, 1378, 1379, 1380, 1381, 1382,1391, 2458, 2714, 2970, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1359, 1360, 1361, 1362,1363, 1364, 1365, 1366, 1389, 2456, 2712, 2968, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1367, 1368, 1369, 1370, 1371, 1372,1373, 1374, 1390, 2457, 2713, 2969, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1383, 1384, 1385, 1386, 1387, 1392,1393, 1394, 1423, 2459, 2715, 2971, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1411, 1412,1413, 1414, 1415, 1416, 1417, 1418, 1426, 2462, 2718, 2974, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1395, 1396, 1397, 1398, 1399, 1400, 1401, 1402,1424, 2460, 2716, 2972, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1403, 1404, 1405, 1406, 1407, 1408, 1409, 1410, 1425, 2461, 2717, 2973, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1419, 1420, 1421, 1422,1427, 1428, 1429, 1430, 1459, 2463, 2719, 2975, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1447, 1448, 1449, 1450, 1451, 1452,1453, 1454, 1462, 2466, 2722, 2978, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1431, 1432,1433, 1434, 1435, 1436, 1437, 1438, 1460, 2464, 2720, 2976, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1439, 1440, 1441, 1442,1443, 1444, 1445, 1446, 1461, 2465, 2721, 2977, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1455, 1456, 1457, 1458, 1463, 1464, 1465, 1466, 1494, 2467, 2723, 2979, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1483, 1484, 1485, 1486, 1487, 1488, 1489, 1490, 1497, 2470, 2726, 2982, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1467, 1468, 1469, 1470, 1471, 1472,1473, 1474, 1495, 2468, 2724, 2980, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1475, 1476, 1477, 1478, 1479, 1480, 1481, 1482,1496, 2469, 2725, 2981, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1491, 1492,1493, 1498, 1499, 1500, 1501, 1502,1530, 2471, 2727, 2983, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1519, 1520, 1521, 1522,1523, 1524, 1525, 1526, 1533, 2474, 2730, 2986, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1503, 1504, 1505, 1506, 1507, 1508, 1509, 1510, 1531, 2472, 2728, 2984, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1511, 1512,1513, 1514, 1515, 1516, 1517, 1518, 1532, 2473, 2729, 2985, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1527, 1528, 1529, 1534, 1535, 1536, 1537, 1538, 1565, 2475, 2731, 2987, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1555, 1556, 1557, 1558, 1559, 1560, 1561, 1562,1568, 2478, 2734, 2990, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1539, 1540, 1541, 1542,1543, 1544, 1545, 1546, 1566, 2476, 2732, 2988, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1547, 1548, 1549, 1550, 1551, 1552,1553, 1554, 1567, 2477, 2733, 2989, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1563, 1564, 1569, 1570, 1571, 1572,1573, 1574, 1600, 2479, 2735, 2991, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1591, 1592,1593, 1594, 1595, 1596, 1597, 1598, 1603, 2482, 2738, 2994, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1575, 1576, 1577, 1578, 1579, 1580, 1581, 1582,1601, 2480, 2736, 2992, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1583, 1584, 1585, 1586, 1587, 1588, 1589, 1590, 1602, 2481, 2737, 2993, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1599, 1604, 1605, 1606, 1607, 1608, 1609, 1610, 1636, 2483, 2739, 2995, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1627, 1628, 1629, 1630, 1631, 1632,1633, 1634, 1639, 2486, 2742, 2998, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1611, 1612,1613, 1614, 1615, 1616, 1617, 1618, 1637, 2484, 2740, 2996, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1619, 1620, 1621, 1622,1623, 1624, 1625, 1626, 1638, 2485, 2741, 2997, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1635, 1640, 1641, 1642,1643, 1644, 1645, 1646, 1671, 2487, 2743, 2999, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1655, 1656, 1657, 1658, 1659, 1660, 1661, 1662,1673, 2489, 2745, 3001, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1647, 1648, 1649, 1650, 1651, 1652,1653, 1654, 1672, 2488, 2744, 3000, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1663, 1664, 1665, 1666, 1667, 1668, 1669, 1670, 1705, 2490, 2746, 3002, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1690, 1691, 1692,1693, 1694, 1695, 1696, 1697, 1708, 2493, 2749, 3005, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1674, 1675, 1676, 1677, 1678, 1679, 1680, 1681, 1706, 2491, 2747, 3003, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1682,1683, 1684, 1685, 1686, 1687, 1688, 1689, 1707, 2492, 2748, 3004, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1698, 1699, 1700, 1701, 1702,1703, 1704, 1709, 1740, 2494, 2750, 3006, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1726, 1727, 1728, 1729, 1730, 1731, 1732,1733, 1743, 2497, 2753, 3009, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1710, 1711, 1712,1713, 1714, 1715, 1716, 1717, 1741, 2495, 2751, 3007, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1718, 1719, 1720, 1721, 1722,1723, 1724, 1725, 1742, 2496, 2752, 3008, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1734, 1735, 1736, 1737, 1738, 1739, 1744, 1745, 1776, 2498, 2754, 3010, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1762,1763, 1764, 1765, 1766, 1767, 1768, 1769, 1779, 2501, 2757, 3013, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1746, 1747, 1748, 1749, 1750, 1751, 1752,1753, 1777, 2499, 2755, 3011, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1754, 1755, 1756, 1757, 1758, 1759, 1760, 1761, 1778, 2500, 2756, 3012, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1770, 1771, 1772,1773, 1774, 1775, 1780, 1781, 1811, 2502, 2758, 3014, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1798, 1799, 1800, 1801, 1802,1803, 1804, 1805, 1814, 2505, 2761, 3017, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1782,1783, 1784, 1785, 1786, 1787, 1788, 1789, 1812, 2503, 2759, 3015, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1790, 1791, 1792,1793, 1794, 1795, 1796, 1797, 1813, 2504, 2760, 3016, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1806, 1807, 1808, 1809, 1810, 1815, 1816, 1817, 1846, 2506, 2762, 3018, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1834, 1835, 1836, 1837, 1838, 1839, 1840, 1841, 1849, 2509, 2765, 3021, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1818, 1819, 1820, 1821, 1822,1823, 1824, 1825, 1847, 2507, 2763, 3019, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1826, 1827, 1828, 1829, 1830, 1831, 1832,1833, 1848, 2508, 2764, 3020, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1842,1843, 1844, 1845, 1850, 1851, 1852,1853, 1881, 2510, 2766, 3022, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1870, 1871, 1872,1873, 1874, 1875, 1876, 1877, 1884, 2513, 2769, 3025, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1854, 1855, 1856, 1857, 1858, 1859, 1860, 1861, 1882, 2511, 2767, 3023, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1862,1863, 1864, 1865, 1866, 1867, 1868, 1869, 1883, 2512, 2768, 3024, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1878, 1879, 1880, 1885, 1886, 1887, 1888, 1889, 1916, 2514, 2770, 3026, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1906, 1907, 1908, 1909, 1910, 1911, 1912,1913, 1919, 2517, 2773, 3029, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1890, 1891, 1892,1893, 1894, 1895, 1896, 1897, 1917, 2515, 2771, 3027, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1898, 1899, 1900, 1901, 1902,1903, 1904, 1905, 1918, 2516, 2772, 3028, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1914, 1915, 1920, 1921, 1922,1923, 1924, 1925, 1952, 2518, 2774, 3030, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1942,1943, 1944, 1945, 1946, 1947, 1948, 1949, 1955, 2521, 2777, 3033, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1926, 1927, 1928, 1929, 1930, 1931, 1932,1933, 1953, 2519, 2775, 3031, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1934, 1935, 1936, 1937, 1938, 1939, 1940, 1941, 1954, 2520, 2776, 3032, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1950, 1951, 1956, 1957, 1958, 1959, 1960, 1961, 1987, 2522, 2778, 3034, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1978, 1979, 1980, 1981, 1982,1983, 1984, 1985, 1990, 2525, 2781, 3037, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1962,1963, 1964, 1965, 1966, 1967, 1968, 1969, 1988, 2523, 2779, 3035, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1970, 1971, 1972,1973, 1974, 1975, 1976, 1977, 1989, 2524, 2780, 3036, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1986, 1991, 1992,1993, 1994, 1995, 1996, 1997, 2022, 2526, 2782, 3038, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2006, 2007, 2008, 2009, 2010, 2011, 2012, 2013, 2024, 2528, 2784, 3040, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1998, 1999, 2000, 2001, 2002, 2003, 2004, 2005, 2023, 2527, 2783, 3039, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2014, 2015, 2016, 2017, 2018, 2019, 2020, 2021, 2056, 2529, 2785, 3041, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2041, 2042, 2043, 2044, 2045, 2046, 2047, 2048, 2059, 2532, 2788, 3044, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2025, 2026, 2027, 2028, 2029, 2030, 2031, 2032, 2057, 2530, 2786, 3042, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2033, 2034, 2035, 2036, 2037, 2038, 2039, 2040, 2058, 2531, 2787, 3043, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2049, 2050, 2051, 2052, 2053, 2054, 2055, 2060, 2091, 2533, 2789, 3045, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2077, 2078, 2079, 2080, 2081, 2082, 2083, 2084, 2094, 2536, 2792, 3048, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2061, 2062, 2063, 2064, 2065, 2066, 2067, 2068, 2092, 2534, 2790, 3046, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2069, 2070, 2071, 2072, 2073, 2074, 2075, 2076, 2093, 2535, 2791, 3047, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2085, 2086, 2087, 2088, 2089, 2090, 2095, 2096, 2126, 2537, 2793, 3049, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2113, 2114, 2115, 2116, 2117, 2118, 2119, 2120, 2129, 2540, 2796, 3052, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2097, 2098, 2099, 2100, 2101, 2102, 2103, 2104, 2127, 2538, 2794, 3050, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2105, 2106, 2107, 2108, 2109, 2110, 2111, 2112, 2128, 2539, 2795, 3051, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2121, 2122, 2123, 2124, 2125, 2130, 2131, 2132, 2161, 2541, 2797, 3053, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2149, 2150, 2151, 2152, 2153, 2154, 2155, 2156, 2164, 2544, 2800, 3056, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2133, 2134, 2135, 2136, 2137, 2138, 2139, 2140, 2162, 2542, 2798, 3054, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2141, 2142, 2143, 2144, 2145, 2146, 2147, 2148, 2163, 2543, 2799, 3055, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2157, 2158, 2159, 2160, 2165, 2166, 2167, 2168, 2196, 2545, 2801, 3057, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2185, 2186, 2187, 2188, 2189, 2190, 2191, 2192, 2199, 2548, 2804, 3060, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2169, 2170, 2171, 2172, 2173, 2174, 2175, 2176, 2197, 2546, 2802, 3058, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2177, 2178, 2179, 2180, 2181, 2182, 2183, 2184, 2198, 2547, 2803, 3059, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2193, 2194, 2195, 2200, 2201, 2202, 2203, 2204, 2231, 2549, 2805, 3061, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2221, 2222, 2223, 2224, 2225, 2226, 2227, 2228, 2234, 2552, 2808, 3064, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2205, 2206, 2207, 2208, 2209, 2210, 2211, 2212, 2232, 2550, 2806, 3062, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2213, 2214, 2215, 2216, 2217, 2218, 2219, 2220, 2233, 2551, 2807, 3063, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2229, 2230, 2235, 2236, 2237, 2238, 2239, 2240, 2266, 2553, 2809, 3065, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2257, 2258, 2259, 2260, 2261, 2262, 2263, 2264, 2269, 2556, 2812, 3068, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2241, 2242, 2243, 2244, 2245, 2246, 2247, 2248, 2267, 2554, 2810, 3066, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2249, 2250, 2251, 2252, 2253, 2254, 2255, 2256, 2268, 2555, 2811, 3067, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2265, 2270, 2271, 2272, 2273, 2274, 2275, 2276, 2301, 2557, 2813, 3069, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2277, 2278, 2279, 2280, 2281, 2282, 2283, 2284, 2302, 2558, 2814, 3070, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2285, 2286, 2287, 2288, 2289, 2290, 2291, 2292, 2303, 2559, 2815, 3071, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2293, 2294, 2295, 2296, 2297, 2298, 2299, 2300, 2304, 2560, 2816, 3072, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]] + page_indices_rank0 = sum(page_indices_rank0, []) + page_indices_rank1 = sum(page_indices_rank1, []) + page_indices_no_dp = [[ 1, 2, 3, 4, 5, 6, 7, 8, 17, 2305, 2561, + 2817, 3073, 3329, 3585, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 9, 10, 11, 12, 13, 14, 15, 16, 18, 2306, 2562, + 2818, 3074, 3330, 3586, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 19, 20, 21, 22, 23, 24, 25, 26, 51, 2307, 2563, + 2819, 3075, 3331, 3587, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 27, 28, 29, 30, 31, 32, 33, 34, 52, 2308, 2564, + 2820, 3076, 3332, 3588, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 35, 36, 37, 38, 39, 40, 41, 42, 53, 2309, 2565, + 2821, 3077, 3333, 3589, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 43, 44, 45, 46, 47, 48, 49, 50, 86, 2310, 2566, + 2822, 3078, 3334, 3590, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 54, 55, 56, 57, 58, 59, 60, 61, 87, 2311, 2567, + 2823, 3079, 3335, 3591, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 62, 63, 64, 65, 66, 67, 68, 69, 88, 2312, 2568, + 2824, 3080, 3336, 3592, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 70, 71, 72, 73, 74, 75, 76, 77, 89, 2313, 2569, + 2825, 3081, 3337, 3593, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 78, 79, 80, 81, 82, 83, 84, 85, 122, 2314, 2570, + 2826, 3082, 3338, 3594, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 90, 91, 92, 93, 94, 95, 96, 97, 123, 2315, 2571, + 2827, 3083, 3339, 3595, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 98, 99, 100, 101, 102, 103, 104, 105, 124, 2316, 2572, + 2828, 3084, 3340, 3596, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 106, 107, 108, 109, 110, 111, 112, 113, 125, 2317, 2573, + 2829, 3085, 3341, 3597, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 114, 115, 116, 117, 118, 119, 120, 121, 158, 2318, 2574, + 2830, 3086, 3342, 3598, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 126, 127, 128, 129, 130, 131, 132, 133, 159, 2319, 2575, + 2831, 3087, 3343, 3599, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 134, 135, 136, 137, 138, 139, 140, 141, 160, 2320, 2576, + 2832, 3088, 3344, 3600, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 142, 143, 144, 145, 146, 147, 148, 149, 161, 2321, 2577, + 2833, 3089, 3345, 3601, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 150, 151, 152, 153, 154, 155, 156, 157, 194, 2322, 2578, + 2834, 3090, 3346, 3602, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 162, 163, 164, 165, 166, 167, 168, 169, 195, 2323, 2579, + 2835, 3091, 3347, 3603, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 170, 171, 172, 173, 174, 175, 176, 177, 196, 2324, 2580, + 2836, 3092, 3348, 3604, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 178, 179, 180, 181, 182, 183, 184, 185, 197, 2325, 2581, + 2837, 3093, 3349, 3605, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 186, 187, 188, 189, 190, 191, 192, 193, 230, 2326, 2582, + 2838, 3094, 3350, 3606, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 198, 199, 200, 201, 202, 203, 204, 205, 231, 2327, 2583, + 2839, 3095, 3351, 3607, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 206, 207, 208, 209, 210, 211, 212, 213, 232, 2328, 2584, + 2840, 3096, 3352, 3608, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 214, 215, 216, 217, 218, 219, 220, 221, 233, 2329, 2585, + 2841, 3097, 3353, 3609, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 222, 223, 224, 225, 226, 227, 228, 229, 266, 2330, 2586, + 2842, 3098, 3354, 3610, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 234, 235, 236, 237, 238, 239, 240, 241, 267, 2331, 2587, + 2843, 3099, 3355, 3611, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 242, 243, 244, 245, 246, 247, 248, 249, 268, 2332, 2588, + 2844, 3100, 3356, 3612, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 250, 251, 252, 253, 254, 255, 256, 257, 269, 2333, 2589, + 2845, 3101, 3357, 3613, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 258, 259, 260, 261, 262, 263, 264, 265, 302, 2334, 2590, + 2846, 3102, 3358, 3614, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 270, 271, 272, 273, 274, 275, 276, 277, 303, 2335, 2591, + 2847, 3103, 3359, 3615, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 278, 279, 280, 281, 282, 283, 284, 285, 304, 2336, 2592, + 2848, 3104, 3360, 3616, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 286, 287, 288, 289, 290, 291, 292, 293, 305, 2337, 2593, + 2849, 3105, 3361, 3617, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 294, 295, 296, 297, 298, 299, 300, 301, 338, 2338, 2594, + 2850, 3106, 3362, 3618, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 306, 307, 308, 309, 310, 311, 312, 313, 339, 2339, 2595, + 2851, 3107, 3363, 3619, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 314, 315, 316, 317, 318, 319, 320, 321, 340, 2340, 2596, + 2852, 3108, 3364, 3620, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 322, 323, 324, 325, 326, 327, 328, 329, 341, 2341, 2597, + 2853, 3109, 3365, 3621, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 330, 331, 332, 333, 334, 335, 336, 337, 374, 2342, 2598, + 2854, 3110, 3366, 3622, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 342, 343, 344, 345, 346, 347, 348, 349, 375, 2343, 2599, + 2855, 3111, 3367, 3623, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 350, 351, 352, 353, 354, 355, 356, 357, 376, 2344, 2600, + 2856, 3112, 3368, 3624, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 358, 359, 360, 361, 362, 363, 364, 365, 377, 2345, 2601, + 2857, 3113, 3369, 3625, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 366, 367, 368, 369, 370, 371, 372, 373, 410, 2346, 2602, + 2858, 3114, 3370, 3626, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 378, 379, 380, 381, 382, 383, 384, 385, 411, 2347, 2603, + 2859, 3115, 3371, 3627, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 386, 387, 388, 389, 390, 391, 392, 393, 412, 2348, 2604, + 2860, 3116, 3372, 3628, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 394, 395, 396, 397, 398, 399, 400, 401, 413, 2349, 2605, + 2861, 3117, 3373, 3629, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 402, 403, 404, 405, 406, 407, 408, 409, 445, 2350, 2606, + 2862, 3118, 3374, 3630, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 414, 415, 416, 417, 418, 419, 420, 421, 446, 2351, 2607, + 2863, 3119, 3375, 3631, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 422, 423, 424, 425, 426, 427, 428, 429, 447, 2352, 2608, + 2864, 3120, 3376, 3632, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 430, 431, 432, 433, 434, 435, 436, 437, 448, 2353, 2609, + 2865, 3121, 3377, 3633, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 438, 439, 440, 441, 442, 443, 444, 449, 481, 2354, 2610, + 2866, 3122, 3378, 3634, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 450, 451, 452, 453, 454, 455, 456, 457, 482, 2355, 2611, + 2867, 3123, 3379, 3635, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 458, 459, 460, 461, 462, 463, 464, 465, 483, 2356, 2612, + 2868, 3124, 3380, 3636, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 466, 467, 468, 469, 470, 471, 472, 473, 484, 2357, 2613, + 2869, 3125, 3381, 3637, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 474, 475, 476, 477, 478, 479, 480, 485, 517, 2358, 2614, + 2870, 3126, 3382, 3638, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 486, 487, 488, 489, 490, 491, 492, 493, 518, 2359, 2615, + 2871, 3127, 3383, 3639, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 494, 495, 496, 497, 498, 499, 500, 501, 519, 2360, 2616, + 2872, 3128, 3384, 3640, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 502, 503, 504, 505, 506, 507, 508, 509, 520, 2361, 2617, + 2873, 3129, 3385, 3641, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 510, 511, 512, 513, 514, 515, 516, 521, 553, 2362, 2618, + 2874, 3130, 3386, 3642, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 522, 523, 524, 525, 526, 527, 528, 529, 554, 2363, 2619, + 2875, 3131, 3387, 3643, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 530, 531, 532, 533, 534, 535, 536, 537, 555, 2364, 2620, + 2876, 3132, 3388, 3644, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 538, 539, 540, 541, 542, 543, 544, 545, 556, 2365, 2621, + 2877, 3133, 3389, 3645, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 546, 547, 548, 549, 550, 551, 552, 557, 589, 2366, 2622, + 2878, 3134, 3390, 3646, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 558, 559, 560, 561, 562, 563, 564, 565, 590, 2367, 2623, + 2879, 3135, 3391, 3647, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 566, 567, 568, 569, 570, 571, 572, 573, 591, 2368, 2624, + 2880, 3136, 3392, 3648, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 574, 575, 576, 577, 578, 579, 580, 581, 592, 2369, 2625, + 2881, 3137, 3393, 3649, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 582, 583, 584, 585, 586, 587, 588, 593, 624, 2370, 2626, + 2882, 3138, 3394, 3650, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 594, 595, 596, 597, 598, 599, 600, 601, 625, 2371, 2627, + 2883, 3139, 3395, 3651, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 602, 603, 604, 605, 606, 607, 608, 609, 626, 2372, 2628, + 2884, 3140, 3396, 3652, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 610, 611, 612, 613, 614, 615, 616, 617, 627, 2373, 2629, + 2885, 3141, 3397, 3653, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 618, 619, 620, 621, 622, 623, 628, 629, 660, 2374, 2630, + 2886, 3142, 3398, 3654, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 630, 631, 632, 633, 634, 635, 636, 637, 661, 2375, 2631, + 2887, 3143, 3399, 3655, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 638, 639, 640, 641, 642, 643, 644, 645, 662, 2376, 2632, + 2888, 3144, 3400, 3656, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 646, 647, 648, 649, 650, 651, 652, 653, 663, 2377, 2633, + 2889, 3145, 3401, 3657, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 654, 655, 656, 657, 658, 659, 664, 665, 696, 2378, 2634, + 2890, 3146, 3402, 3658, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 666, 667, 668, 669, 670, 671, 672, 673, 697, 2379, 2635, + 2891, 3147, 3403, 3659, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 674, 675, 676, 677, 678, 679, 680, 681, 698, 2380, 2636, + 2892, 3148, 3404, 3660, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 682, 683, 684, 685, 686, 687, 688, 689, 699, 2381, 2637, + 2893, 3149, 3405, 3661, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 690, 691, 692, 693, 694, 695, 700, 701, 731, 2382, 2638, + 2894, 3150, 3406, 3662, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 702, 703, 704, 705, 706, 707, 708, 709, 732, 2383, 2639, + 2895, 3151, 3407, 3663, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 710, 711, 712, 713, 714, 715, 716, 717, 733, 2384, 2640, + 2896, 3152, 3408, 3664, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 718, 719, 720, 721, 722, 723, 724, 725, 734, 2385, 2641, + 2897, 3153, 3409, 3665, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 726, 727, 728, 729, 730, 735, 736, 737, 767, 2386, 2642, + 2898, 3154, 3410, 3666, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 738, 739, 740, 741, 742, 743, 744, 745, 768, 2387, 2643, + 2899, 3155, 3411, 3667, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 746, 747, 748, 749, 750, 751, 752, 753, 769, 2388, 2644, + 2900, 3156, 3412, 3668, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 754, 755, 756, 757, 758, 759, 760, 761, 770, 2389, 2645, + 2901, 3157, 3413, 3669, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 762, 763, 764, 765, 766, 771, 772, 773, 803, 2390, 2646, + 2902, 3158, 3414, 3670, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 774, 775, 776, 777, 778, 779, 780, 781, 804, 2391, 2647, + 2903, 3159, 3415, 3671, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 782, 783, 784, 785, 786, 787, 788, 789, 805, 2392, 2648, + 2904, 3160, 3416, 3672, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 790, 791, 792, 793, 794, 795, 796, 797, 806, 2393, 2649, + 2905, 3161, 3417, 3673, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 798, 799, 800, 801, 802, 807, 808, 809, 838, 2394, 2650, + 2906, 3162, 3418, 3674, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 810, 811, 812, 813, 814, 815, 816, 817, 839, 2395, 2651, + 2907, 3163, 3419, 3675, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 818, 819, 820, 821, 822, 823, 824, 825, 840, 2396, 2652, + 2908, 3164, 3420, 3676, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 826, 827, 828, 829, 830, 831, 832, 833, 841, 2397, 2653, + 2909, 3165, 3421, 3677, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 834, 835, 836, 837, 842, 843, 844, 845, 874, 2398, 2654, + 2910, 3166, 3422, 3678, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 846, 847, 848, 849, 850, 851, 852, 853, 875, 2399, 2655, + 2911, 3167, 3423, 3679, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 854, 855, 856, 857, 858, 859, 860, 861, 876, 2400, 2656, + 2912, 3168, 3424, 3680, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 862, 863, 864, 865, 866, 867, 868, 869, 877, 2401, 2657, + 2913, 3169, 3425, 3681, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 870, 871, 872, 873, 878, 879, 880, 881, 910, 2402, 2658, + 2914, 3170, 3426, 3682, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 882, 883, 884, 885, 886, 887, 888, 889, 911, 2403, 2659, + 2915, 3171, 3427, 3683, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 890, 891, 892, 893, 894, 895, 896, 897, 912, 2404, 2660, + 2916, 3172, 3428, 3684, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 898, 899, 900, 901, 902, 903, 904, 905, 913, 2405, 2661, + 2917, 3173, 3429, 3685, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 906, 907, 908, 909, 914, 915, 916, 917, 945, 2406, 2662, + 2918, 3174, 3430, 3686, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 918, 919, 920, 921, 922, 923, 924, 925, 946, 2407, 2663, + 2919, 3175, 3431, 3687, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 926, 927, 928, 929, 930, 931, 932, 933, 947, 2408, 2664, + 2920, 3176, 3432, 3688, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 934, 935, 936, 937, 938, 939, 940, 941, 948, 2409, 2665, + 2921, 3177, 3433, 3689, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 942, 943, 944, 949, 950, 951, 952, 953, 981, 2410, 2666, + 2922, 3178, 3434, 3690, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 954, 955, 956, 957, 958, 959, 960, 961, 982, 2411, 2667, + 2923, 3179, 3435, 3691, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 962, 963, 964, 965, 966, 967, 968, 969, 983, 2412, 2668, + 2924, 3180, 3436, 3692, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 970, 971, 972, 973, 974, 975, 976, 977, 984, 2413, 2669, + 2925, 3181, 3437, 3693, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 978, 979, 980, 985, 986, 987, 988, 989, 1016, 2414, 2670, + 2926, 3182, 3438, 3694, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 990, 991, 992, 993, 994, 995, 996, 997, 1017, 2415, 2671, + 2927, 3183, 3439, 3695, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [ 998, 999, 1000, 1001, 1002, 1003, 1004, 1005, 1018, 2416, 2672, + 2928, 3184, 3440, 3696, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1006, 1007, 1008, 1009, 1010, 1011, 1012, 1013, 1019, 2417, 2673, + 2929, 3185, 3441, 3697, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1014, 1015, 1020, 1021, 1022, 1023, 1024, 1025, 1052, 2418, 2674, + 2930, 3186, 3442, 3698, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1026, 1027, 1028, 1029, 1030, 1031, 1032, 1033, 1053, 2419, 2675, + 2931, 3187, 3443, 3699, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1034, 1035, 1036, 1037, 1038, 1039, 1040, 1041, 1054, 2420, 2676, + 2932, 3188, 3444, 3700, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1042, 1043, 1044, 1045, 1046, 1047, 1048, 1049, 1055, 2421, 2677, + 2933, 3189, 3445, 3701, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1050, 1051, 1056, 1057, 1058, 1059, 1060, 1061, 1088, 2422, 2678, + 2934, 3190, 3446, 3702, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1062, 1063, 1064, 1065, 1066, 1067, 1068, 1069, 1089, 2423, 2679, + 2935, 3191, 3447, 3703, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1070, 1071, 1072, 1073, 1074, 1075, 1076, 1077, 1090, 2424, 2680, + 2936, 3192, 3448, 3704, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1078, 1079, 1080, 1081, 1082, 1083, 1084, 1085, 1091, 2425, 2681, + 2937, 3193, 3449, 3705, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1086, 1087, 1092, 1093, 1094, 1095, 1096, 1097, 1123, 2426, 2682, + 2938, 3194, 3450, 3706, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1098, 1099, 1100, 1101, 1102, 1103, 1104, 1105, 1124, 2427, 2683, + 2939, 3195, 3451, 3707, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1106, 1107, 1108, 1109, 1110, 1111, 1112, 1113, 1125, 2428, 2684, + 2940, 3196, 3452, 3708, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1114, 1115, 1116, 1117, 1118, 1119, 1120, 1121, 1126, 2429, 2685, + 2941, 3197, 3453, 3709, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1122, 1127, 1128, 1129, 1130, 1131, 1132, 1133, 1159, 2430, 2686, + 2942, 3198, 3454, 3710, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1134, 1135, 1136, 1137, 1138, 1139, 1140, 1141, 1160, 2431, 2687, + 2943, 3199, 3455, 3711, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1142, 1143, 1144, 1145, 1146, 1147, 1148, 1149, 1161, 2432, 2688, + 2944, 3200, 3456, 3712, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1150, 1151, 1152, 1153, 1154, 1155, 1156, 1157, 1162, 2433, 2689, + 2945, 3201, 3457, 3713, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1158, 1163, 1164, 1165, 1166, 1167, 1168, 1169, 1194, 2434, 2690, + 2946, 3202, 3458, 3714, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1170, 1171, 1172, 1173, 1174, 1175, 1176, 1177, 1195, 2435, 2691, + 2947, 3203, 3459, 3715, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1178, 1179, 1180, 1181, 1182, 1183, 1184, 1185, 1196, 2436, 2692, + 2948, 3204, 3460, 3716, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1186, 1187, 1188, 1189, 1190, 1191, 1192, 1193, 1229, 2437, 2693, + 2949, 3205, 3461, 3717, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1197, 1198, 1199, 1200, 1201, 1202, 1203, 1204, 1230, 2438, 2694, + 2950, 3206, 3462, 3718, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1205, 1206, 1207, 1208, 1209, 1210, 1211, 1212, 1231, 2439, 2695, + 2951, 3207, 3463, 3719, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1213, 1214, 1215, 1216, 1217, 1218, 1219, 1220, 1232, 2440, 2696, + 2952, 3208, 3464, 3720, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1221, 1222, 1223, 1224, 1225, 1226, 1227, 1228, 1264, 2441, 2697, + 2953, 3209, 3465, 3721, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1233, 1234, 1235, 1236, 1237, 1238, 1239, 1240, 1265, 2442, 2698, + 2954, 3210, 3466, 3722, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1241, 1242, 1243, 1244, 1245, 1246, 1247, 1248, 1266, 2443, 2699, + 2955, 3211, 3467, 3723, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1249, 1250, 1251, 1252, 1253, 1254, 1255, 1256, 1267, 2444, 2700, + 2956, 3212, 3468, 3724, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1257, 1258, 1259, 1260, 1261, 1262, 1263, 1268, 1300, 2445, 2701, + 2957, 3213, 3469, 3725, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1269, 1270, 1271, 1272, 1273, 1274, 1275, 1276, 1301, 2446, 2702, + 2958, 3214, 3470, 3726, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1277, 1278, 1279, 1280, 1281, 1282, 1283, 1284, 1302, 2447, 2703, + 2959, 3215, 3471, 3727, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1285, 1286, 1287, 1288, 1289, 1290, 1291, 1292, 1303, 2448, 2704, + 2960, 3216, 3472, 3728, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1293, 1294, 1295, 1296, 1297, 1298, 1299, 1304, 1335, 2449, 2705, + 2961, 3217, 3473, 3729, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1305, 1306, 1307, 1308, 1309, 1310, 1311, 1312, 1336, 2450, 2706, + 2962, 3218, 3474, 3730, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1313, 1314, 1315, 1316, 1317, 1318, 1319, 1320, 1337, 2451, 2707, + 2963, 3219, 3475, 3731, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1321, 1322, 1323, 1324, 1325, 1326, 1327, 1328, 1338, 2452, 2708, + 2964, 3220, 3476, 3732, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1329, 1330, 1331, 1332, 1333, 1334, 1339, 1340, 1370, 2453, 2709, + 2965, 3221, 3477, 3733, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1341, 1342, 1343, 1344, 1345, 1346, 1347, 1348, 1371, 2454, 2710, + 2966, 3222, 3478, 3734, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1349, 1350, 1351, 1352, 1353, 1354, 1355, 1356, 1372, 2455, 2711, + 2967, 3223, 3479, 3735, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1357, 1358, 1359, 1360, 1361, 1362, 1363, 1364, 1373, 2456, 2712, + 2968, 3224, 3480, 3736, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1365, 1366, 1367, 1368, 1369, 1374, 1375, 1376, 1406, 2457, 2713, + 2969, 3225, 3481, 3737, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1377, 1378, 1379, 1380, 1381, 1382, 1383, 1384, 1407, 2458, 2714, + 2970, 3226, 3482, 3738, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1385, 1386, 1387, 1388, 1389, 1390, 1391, 1392, 1408, 2459, 2715, + 2971, 3227, 3483, 3739, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1393, 1394, 1395, 1396, 1397, 1398, 1399, 1400, 1409, 2460, 2716, + 2972, 3228, 3484, 3740, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1401, 1402, 1403, 1404, 1405, 1410, 1411, 1412, 1441, 2461, 2717, + 2973, 3229, 3485, 3741, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1413, 1414, 1415, 1416, 1417, 1418, 1419, 1420, 1442, 2462, 2718, + 2974, 3230, 3486, 3742, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1421, 1422, 1423, 1424, 1425, 1426, 1427, 1428, 1443, 2463, 2719, + 2975, 3231, 3487, 3743, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1429, 1430, 1431, 1432, 1433, 1434, 1435, 1436, 1444, 2464, 2720, + 2976, 3232, 3488, 3744, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1437, 1438, 1439, 1440, 1445, 1446, 1447, 1448, 1477, 2465, 2721, + 2977, 3233, 3489, 3745, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1449, 1450, 1451, 1452, 1453, 1454, 1455, 1456, 1478, 2466, 2722, + 2978, 3234, 3490, 3746, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1457, 1458, 1459, 1460, 1461, 1462, 1463, 1464, 1479, 2467, 2723, + 2979, 3235, 3491, 3747, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1465, 1466, 1467, 1468, 1469, 1470, 1471, 1472, 1480, 2468, 2724, + 2980, 3236, 3492, 3748, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1473, 1474, 1475, 1476, 1481, 1482, 1483, 1484, 1512, 2469, 2725, + 2981, 3237, 3493, 3749, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1485, 1486, 1487, 1488, 1489, 1490, 1491, 1492, 1513, 2470, 2726, + 2982, 3238, 3494, 3750, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1493, 1494, 1495, 1496, 1497, 1498, 1499, 1500, 1514, 2471, 2727, + 2983, 3239, 3495, 3751, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1501, 1502, 1503, 1504, 1505, 1506, 1507, 1508, 1515, 2472, 2728, + 2984, 3240, 3496, 3752, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1509, 1510, 1511, 1516, 1517, 1518, 1519, 1520, 1547, 2473, 2729, + 2985, 3241, 3497, 3753, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1521, 1522, 1523, 1524, 1525, 1526, 1527, 1528, 1548, 2474, 2730, + 2986, 3242, 3498, 3754, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1529, 1530, 1531, 1532, 1533, 1534, 1535, 1536, 1549, 2475, 2731, + 2987, 3243, 3499, 3755, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1537, 1538, 1539, 1540, 1541, 1542, 1543, 1544, 1550, 2476, 2732, + 2988, 3244, 3500, 3756, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1545, 1546, 1551, 1552, 1553, 1554, 1555, 1556, 1583, 2477, 2733, + 2989, 3245, 3501, 3757, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1557, 1558, 1559, 1560, 1561, 1562, 1563, 1564, 1584, 2478, 2734, + 2990, 3246, 3502, 3758, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1565, 1566, 1567, 1568, 1569, 1570, 1571, 1572, 1585, 2479, 2735, + 2991, 3247, 3503, 3759, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1573, 1574, 1575, 1576, 1577, 1578, 1579, 1580, 1586, 2480, 2736, + 2992, 3248, 3504, 3760, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1581, 1582, 1587, 1588, 1589, 1590, 1591, 1592, 1618, 2481, 2737, + 2993, 3249, 3505, 3761, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1593, 1594, 1595, 1596, 1597, 1598, 1599, 1600, 1619, 2482, 2738, + 2994, 3250, 3506, 3762, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1601, 1602, 1603, 1604, 1605, 1606, 1607, 1608, 1620, 2483, 2739, + 2995, 3251, 3507, 3763, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1609, 1610, 1611, 1612, 1613, 1614, 1615, 1616, 1621, 2484, 2740, + 2996, 3252, 3508, 3764, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1617, 1622, 1623, 1624, 1625, 1626, 1627, 1628, 1653, 2485, 2741, + 2997, 3253, 3509, 3765, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1629, 1630, 1631, 1632, 1633, 1634, 1635, 1636, 1654, 2486, 2742, + 2998, 3254, 3510, 3766, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1637, 1638, 1639, 1640, 1641, 1642, 1643, 1644, 1655, 2487, 2743, + 2999, 3255, 3511, 3767, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1645, 1646, 1647, 1648, 1649, 1650, 1651, 1652, 1687, 2488, 2744, + 3000, 3256, 3512, 3768, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1656, 1657, 1658, 1659, 1660, 1661, 1662, 1663, 1688, 2489, 2745, + 3001, 3257, 3513, 3769, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1664, 1665, 1666, 1667, 1668, 1669, 1670, 1671, 1689, 2490, 2746, + 3002, 3258, 3514, 3770, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1672, 1673, 1674, 1675, 1676, 1677, 1678, 1679, 1690, 2491, 2747, + 3003, 3259, 3515, 3771, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1680, 1681, 1682, 1683, 1684, 1685, 1686, 1691, 1723, 2492, 2748, + 3004, 3260, 3516, 3772, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1692, 1693, 1694, 1695, 1696, 1697, 1698, 1699, 1724, 2493, 2749, + 3005, 3261, 3517, 3773, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1700, 1701, 1702, 1703, 1704, 1705, 1706, 1707, 1725, 2494, 2750, + 3006, 3262, 3518, 3774, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1708, 1709, 1710, 1711, 1712, 1713, 1714, 1715, 1726, 2495, 2751, + 3007, 3263, 3519, 3775, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1716, 1717, 1718, 1719, 1720, 1721, 1722, 1727, 1758, 2496, 2752, + 3008, 3264, 3520, 3776, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1728, 1729, 1730, 1731, 1732, 1733, 1734, 1735, 1759, 2497, 2753, + 3009, 3265, 3521, 3777, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1736, 1737, 1738, 1739, 1740, 1741, 1742, 1743, 1760, 2498, 2754, + 3010, 3266, 3522, 3778, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1744, 1745, 1746, 1747, 1748, 1749, 1750, 1751, 1761, 2499, 2755, + 3011, 3267, 3523, 3779, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1752, 1753, 1754, 1755, 1756, 1757, 1762, 1763, 1793, 2500, 2756, + 3012, 3268, 3524, 3780, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1764, 1765, 1766, 1767, 1768, 1769, 1770, 1771, 1794, 2501, 2757, + 3013, 3269, 3525, 3781, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1772, 1773, 1774, 1775, 1776, 1777, 1778, 1779, 1795, 2502, 2758, + 3014, 3270, 3526, 3782, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1780, 1781, 1782, 1783, 1784, 1785, 1786, 1787, 1796, 2503, 2759, + 3015, 3271, 3527, 3783, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1788, 1789, 1790, 1791, 1792, 1797, 1798, 1799, 1828, 2504, 2760, + 3016, 3272, 3528, 3784, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1800, 1801, 1802, 1803, 1804, 1805, 1806, 1807, 1829, 2505, 2761, + 3017, 3273, 3529, 3785, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1808, 1809, 1810, 1811, 1812, 1813, 1814, 1815, 1830, 2506, 2762, + 3018, 3274, 3530, 3786, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1816, 1817, 1818, 1819, 1820, 1821, 1822, 1823, 1831, 2507, 2763, + 3019, 3275, 3531, 3787, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1824, 1825, 1826, 1827, 1832, 1833, 1834, 1835, 1864, 2508, 2764, + 3020, 3276, 3532, 3788, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1836, 1837, 1838, 1839, 1840, 1841, 1842, 1843, 1865, 2509, 2765, + 3021, 3277, 3533, 3789, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1844, 1845, 1846, 1847, 1848, 1849, 1850, 1851, 1866, 2510, 2766, + 3022, 3278, 3534, 3790, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1852, 1853, 1854, 1855, 1856, 1857, 1858, 1859, 1867, 2511, 2767, + 3023, 3279, 3535, 3791, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1860, 1861, 1862, 1863, 1868, 1869, 1870, 1871, 1899, 2512, 2768, + 3024, 3280, 3536, 3792, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1872, 1873, 1874, 1875, 1876, 1877, 1878, 1879, 1900, 2513, 2769, + 3025, 3281, 3537, 3793, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1880, 1881, 1882, 1883, 1884, 1885, 1886, 1887, 1901, 2514, 2770, + 3026, 3282, 3538, 3794, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1888, 1889, 1890, 1891, 1892, 1893, 1894, 1895, 1902, 2515, 2771, + 3027, 3283, 3539, 3795, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1896, 1897, 1898, 1903, 1904, 1905, 1906, 1907, 1934, 2516, 2772, + 3028, 3284, 3540, 3796, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1908, 1909, 1910, 1911, 1912, 1913, 1914, 1915, 1935, 2517, 2773, + 3029, 3285, 3541, 3797, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1916, 1917, 1918, 1919, 1920, 1921, 1922, 1923, 1936, 2518, 2774, + 3030, 3286, 3542, 3798, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1924, 1925, 1926, 1927, 1928, 1929, 1930, 1931, 1937, 2519, 2775, + 3031, 3287, 3543, 3799, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1932, 1933, 1938, 1939, 1940, 1941, 1942, 1943, 1969, 2520, 2776, + 3032, 3288, 3544, 3800, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1944, 1945, 1946, 1947, 1948, 1949, 1950, 1951, 1970, 2521, 2777, + 3033, 3289, 3545, 3801, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1952, 1953, 1954, 1955, 1956, 1957, 1958, 1959, 1971, 2522, 2778, + 3034, 3290, 3546, 3802, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1960, 1961, 1962, 1963, 1964, 1965, 1966, 1967, 1972, 2523, 2779, + 3035, 3291, 3547, 3803, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1968, 1973, 1974, 1975, 1976, 1977, 1978, 1979, 2004, 2524, 2780, + 3036, 3292, 3548, 3804, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1980, 1981, 1982, 1983, 1984, 1985, 1986, 1987, 2005, 2525, 2781, + 3037, 3293, 3549, 3805, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1988, 1989, 1990, 1991, 1992, 1993, 1994, 1995, 2006, 2526, 2782, + 3038, 3294, 3550, 3806, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [1996, 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2038, 2527, 2783, + 3039, 3295, 3551, 3807, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2007, 2008, 2009, 2010, 2011, 2012, 2013, 2014, 2039, 2528, 2784, + 3040, 3296, 3552, 3808, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2015, 2016, 2017, 2018, 2019, 2020, 2021, 2022, 2040, 2529, 2785, + 3041, 3297, 3553, 3809, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2023, 2024, 2025, 2026, 2027, 2028, 2029, 2030, 2041, 2530, 2786, + 3042, 3298, 3554, 3810, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2031, 2032, 2033, 2034, 2035, 2036, 2037, 2042, 2074, 2531, 2787, + 3043, 3299, 3555, 3811, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2043, 2044, 2045, 2046, 2047, 2048, 2049, 2050, 2075, 2532, 2788, + 3044, 3300, 3556, 3812, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2051, 2052, 2053, 2054, 2055, 2056, 2057, 2058, 2076, 2533, 2789, + 3045, 3301, 3557, 3813, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2059, 2060, 2061, 2062, 2063, 2064, 2065, 2066, 2077, 2534, 2790, + 3046, 3302, 3558, 3814, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2067, 2068, 2069, 2070, 2071, 2072, 2073, 2078, 2109, 2535, 2791, + 3047, 3303, 3559, 3815, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2079, 2080, 2081, 2082, 2083, 2084, 2085, 2086, 2110, 2536, 2792, + 3048, 3304, 3560, 3816, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2087, 2088, 2089, 2090, 2091, 2092, 2093, 2094, 2111, 2537, 2793, + 3049, 3305, 3561, 3817, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2095, 2096, 2097, 2098, 2099, 2100, 2101, 2102, 2112, 2538, 2794, + 3050, 3306, 3562, 3818, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2103, 2104, 2105, 2106, 2107, 2108, 2113, 2114, 2144, 2539, 2795, + 3051, 3307, 3563, 3819, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2115, 2116, 2117, 2118, 2119, 2120, 2121, 2122, 2145, 2540, 2796, + 3052, 3308, 3564, 3820, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2123, 2124, 2125, 2126, 2127, 2128, 2129, 2130, 2146, 2541, 2797, + 3053, 3309, 3565, 3821, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2131, 2132, 2133, 2134, 2135, 2136, 2137, 2138, 2147, 2542, 2798, + 3054, 3310, 3566, 3822, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2139, 2140, 2141, 2142, 2143, 2148, 2149, 2150, 2179, 2543, 2799, + 3055, 3311, 3567, 3823, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2151, 2152, 2153, 2154, 2155, 2156, 2157, 2158, 2180, 2544, 2800, + 3056, 3312, 3568, 3824, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2159, 2160, 2161, 2162, 2163, 2164, 2165, 2166, 2181, 2545, 2801, + 3057, 3313, 3569, 3825, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2167, 2168, 2169, 2170, 2171, 2172, 2173, 2174, 2182, 2546, 2802, + 3058, 3314, 3570, 3826, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2175, 2176, 2177, 2178, 2183, 2184, 2185, 2186, 2214, 2547, 2803, + 3059, 3315, 3571, 3827, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2187, 2188, 2189, 2190, 2191, 2192, 2193, 2194, 2215, 2548, 2804, + 3060, 3316, 3572, 3828, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2195, 2196, 2197, 2198, 2199, 2200, 2201, 2202, 2216, 2549, 2805, + 3061, 3317, 3573, 3829, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2203, 2204, 2205, 2206, 2207, 2208, 2209, 2210, 2217, 2550, 2806, + 3062, 3318, 3574, 3830, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2211, 2212, 2213, 2218, 2219, 2220, 2221, 2222, 2249, 2551, 2807, + 3063, 3319, 3575, 3831, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2223, 2224, 2225, 2226, 2227, 2228, 2229, 2230, 2250, 2552, 2808, + 3064, 3320, 3576, 3832, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2231, 2232, 2233, 2234, 2235, 2236, 2237, 2238, 2251, 2553, 2809, + 3065, 3321, 3577, 3833, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2239, 2240, 2241, 2242, 2243, 2244, 2245, 2246, 2252, 2554, 2810, + 3066, 3322, 3578, 3834, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2247, 2248, 2253, 2254, 2255, 2256, 2257, 2258, 2284, 2555, 2811, + 3067, 3323, 3579, 3835, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2259, 2260, 2261, 2262, 2263, 2264, 2265, 2266, 2285, 2556, 2812, + 3068, 3324, 3580, 3836, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2267, 2268, 2269, 2270, 2271, 2272, 2273, 2274, 2286, 2557, 2813, + 3069, 3325, 3581, 3837, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2275, 2276, 2277, 2278, 2279, 2280, 2281, 2282, 2287, 2558, 2814, + 3070, 3326, 3582, 3838, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2283, 2288, 2289, 2290, 2291, 2292, 2293, 2294, 2303, 2559, 2815, + 3071, 3327, 3583, 3839, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], + [2295, 2296, 2297, 2298, 2299, 2300, 2301, 2302, 2304, 2560, 2816, + 3072, 3328, 3584, 3840, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]] - # Optional attention sink - attention_sink = None + page_indices_no_dp = sum(page_indices_no_dp, [] ) + if dp_size == 1: + page_indices = jnp.array(page_indices_no_dp, dtype=jnp.int32) + elif dp_size == 2: + page_indices = jnp.array(page_indices_rank0 + page_indices_rank1, dtype=jnp.int32) + attention_sink = None sm_scale = head_dim ** -0.5 print(f"\nInput creation (dp_size={dp_size}):") @@ -119,12 +1466,12 @@ def create_test_inputs( } def run(inputs, dump_dir, dp_size=2, num_devices=8, dp=True): - """Run attention kernel WITH data parallelism.""" + print("\n" + "="*80) if dp: print(f"Running WITH Data Parallelism (dp_size={dp_size}, num_devices={num_devices})") else: - print(f"Running WITHOUT Data Parallelism (num_devices={num_devices})") + print(f"Running WITHOUT Data Parallelism (dp_size={dp_size}, num_devices={num_devices})") print("="*80) print(f"Input shapes:") @@ -133,56 +1480,58 @@ def run(inputs, dump_dir, dp_size=2, num_devices=8, dp=True): print(f" {key}: {val.shape} {val.dtype}") devices = jax.devices() - total_devices = 8 + dp_size = 2 if dp: - device_array = np.array(devices[:total_devices]).reshape(dp_size, -1) + device_array = np.array(devices[:8]).reshape(dp_size, -1) else: - device_array = np.array(devices[:total_devices//dp_size]).reshape(1, -1) + device_array = np.array(devices[:4]).reshape(1, -1) mesh = Mesh( device_array, axis_names=(ShardingAxisName.ATTN_DATA, ShardingAxisName.ATTN_HEAD), ) print(f"Mesh: {mesh}") - print(f"Mesh shape: {mesh.shape}") + def _attention_wrapper(q, k, v, kv_cache, kv_lens, page_indices, cu_q_lens, distribution): - # Define sharding specs (matching the actual implementation) - qkv_spec = P(ShardingAxisName.ATTN_DATA, ShardingAxisName.ATTN_HEAD, None) - kv_cache_spec = P(ShardingAxisName.ATTN_DATA, None, ShardingAxisName.ATTN_HEAD, None, None) - - in_specs = ( - qkv_spec, # q - qkv_spec, # k - qkv_spec, # v - kv_cache_spec, # kv_cache - P(ShardingAxisName.ATTN_DATA), # kv_lens - P(ShardingAxisName.ATTN_DATA), # page_indices - P(ShardingAxisName.ATTN_DATA), # cu_q_lens - P(ShardingAxisName.ATTN_DATA), # distribution - ) - out_specs = (qkv_spec, kv_cache_spec) - - print(f"\nSharding specs:") - print(f" qkv_spec: {qkv_spec}") - print(f" kv_cache_spec: {kv_cache_spec}") - - # Create sharded function - def _ragged_paged_attention(q, k, v, kv_cache, kv_lens, page_indices, cu_q_lens, distribution): - return ragged_paged_attention_hd64( - q, k, v, kv_cache, kv_lens, page_indices, cu_q_lens, distribution, - attention_sink=None, - sm_scale=inputs['sm_scale'], + attention_metadata = AttentionMetadata( + input_positions=None, + block_tables=page_indices, + seq_lens=kv_lens, + query_start_loc=cu_q_lens, + request_distribution=distribution, ) + + batch_size, num_heads, head_dim = q.shape + num_kv_heads = k.shape[1] + + # Reshape q, k, v to match _jax_attn_func expectations + q_reshaped = q.reshape(batch_size, num_heads * head_dim) + k_reshaped = k.reshape(batch_size, num_kv_heads * head_dim) + v_reshaped = v.reshape(batch_size, num_kv_heads * head_dim) + + new_kv_cache, outputs = _jax_attn_func( + kv_cache=kv_cache, + q=q_reshaped, + k=k_reshaped, + v=v_reshaped, + sinks=None, + attention_metadata=attention_metadata, + mesh=mesh, + scale=inputs['sm_scale'], + head_size=head_dim, + num_heads=num_heads, + num_kv_heads=num_kv_heads, + q_scale=None, + k_scale=None, + v_scale=None, + sliding_window=None, + ) + + outputs = outputs.reshape(batch_size, num_heads, head_dim) + + return outputs, new_kv_cache - sharded_fn = shard_map( - _ragged_paged_attention, - mesh=mesh, - in_specs=in_specs, - out_specs=out_specs, - check_vma=False, - ) - - attention_fn = jax.jit(sharded_fn) + attention_fn = jax.jit(_attention_wrapper) # Lower and dump HLO print("\nLowering computation...") @@ -205,11 +1554,10 @@ def _ragged_paged_attention(q, k, v, kv_cache, kv_lens, page_indices, cu_q_lens, hlo_path = Path(dump_dir) / f"no_dp_hlo.txt" hlo_path.write_text(hlo_text) print(f"✓ HLO dumped to: {hlo_path}") - - # Compile - print("Compiling...") - compiled = lowered.compile() - + + qkv_spec = P(ShardingAxisName.ATTN_DATA, ShardingAxisName.ATTN_HEAD, None) + kv_cache_spec = P(ShardingAxisName.ATTN_DATA, None, ShardingAxisName.ATTN_HEAD, None, None) + inputs['q'] = jax.device_put(inputs['q'], NamedSharding(mesh, qkv_spec)) inputs['k'] = jax.device_put(inputs['k'], NamedSharding(mesh, qkv_spec)) inputs['v'] = jax.device_put(inputs['v'], NamedSharding(mesh, qkv_spec)) @@ -235,8 +1583,10 @@ def _ragged_paged_attention(q, k, v, kv_cache, kv_lens, page_indices, cu_q_lens, jax.block_until_ready(result) # Benchmark - print("Benchmarking (10 runs)...") + print("Benchmarking ...") times = [] + dump_dir = f"gs://wenxindong-vm/trace/debug/gptoss/kernel/dp{dp}" + jax.profiler.start_trace(dump_dir) for i in range(10): start = time.time() result = attention_fn( @@ -253,10 +1603,9 @@ def _ragged_paged_attention(q, k, v, kv_cache, kv_lens, page_indices, cu_q_lens, elapsed = time.time() - start times.append(elapsed) print(f" Run {i+1}: {elapsed*1000:.2f} ms") - + jax.profiler.stop_trace() avg_time = sum(times) / len(times) print(f"\n✓ Average time: {avg_time*1000:.2f} ms") - print(f"✓ Output shape: {result[0].shape}") return result, avg_time @@ -270,36 +1619,12 @@ def main(): default='both', help='Which mode to run' ) - parser.add_argument( - '--dp_size', - type=int, - default=2, - help='Data parallel size for with_dp mode' - ) - parser.add_argument( - '--num_devices_no_dp', - type=int, - default=4, - help='Number of devices for no_dp mode (head parallelism only)' - ) - parser.add_argument( - '--num_devices_with_dp', - type=int, - default=8, - help='Number of devices for with_dp mode (dp_size * head_parallelism)' - ) parser.add_argument( '--dump_dir', type=str, default='/tmp/attention_dp_repro', help='Directory to dump HLO files' ) - parser.add_argument( - '--batch_size', - type=int, - default=256, - help='Batch size' - ) args = parser.parse_args() # Create dump directory @@ -307,8 +1632,6 @@ def main(): dump_dir.mkdir(parents=True, exist_ok=True) print(f"HLO dump directory: {dump_dir}") - # Create test inputs - print("\nCreating test inputs...") # Note: We'll create DP-specific inputs when running with_dp mode inputs_no_dp = None inputs_with_dp = None @@ -322,15 +1645,15 @@ def main(): # Run without DP if args.mode in ['no_dp', 'both']: print("\nCreating inputs for no_dp mode...") - inputs_no_dp = create_test_inputs(batch_size=args.batch_size, dp_size=1) - result, avg_time = run(inputs_no_dp, dump_dir, num_devices=args.num_devices_no_dp, dp=False) + inputs_no_dp = create_test_inputs(dp_size=1) + result, avg_time = run(inputs_no_dp, dump_dir, dp=False) results['no_dp'] = {'result': result, 'time': avg_time} # Run with DP if args.mode in ['with_dp', 'both']: - print(f"\nCreating inputs for with_dp mode (dp_size={args.dp_size})...") - inputs_with_dp = create_test_inputs(batch_size=args.batch_size, dp_size=args.dp_size) - result, avg_time = run(inputs_with_dp, dump_dir, dp_size=args.dp_size, num_devices=args.num_devices_with_dp, dp=True) + print(f"\nCreating inputs for with_dp mode (dp_size={2})...") + inputs_with_dp = create_test_inputs( dp_size=2) + result, avg_time = run(inputs_with_dp, dump_dir, dp=True) results['with_dp'] = {'result': result, 'time': avg_time} # Compare results @@ -351,35 +1674,12 @@ def main(): print(f"✓ DP is {speedup:.2f}x FASTER") else: print(f"✗ DP is {slowdown:.2f}x SLOWER") - - # Check output consistency - total = results['no_dp']['result'][0].shape[0] - for i in range(args.dp_size): - - out_no_dp = np.array(results['no_dp']['result'][0], dtype=np.float32) - out_with_dp = np.array(results['with_dp']['result'][0][total*i : total*(i+1), ...], dtype=np.float32) - - max_diff = np.max(np.abs(out_no_dp - out_with_dp)) - print(f"\nMax output difference for DP rank {i}: {max_diff}") - - if max_diff < 1e-2: - print("✓ Outputs match (within tolerance)") - else: - print("✗ Outputs differ significantly!") print("\n" + "="*80) - print("NEXT STEPS") - print("="*80) print(f"\n1. Compare HLO files in: {dump_dir}") print(f" - no_dp_hlo.txt") - print(f" - with_dp_{args.dp_size}_hlo.txt") - print(f"\n2. Look for:") - print(f" - all-reduce, all-gather, collective-permute operations") - print(f" - Extra transpose/reshape operations") - print(f" - Different memory layouts") - print(f"\n3. Use diff tool:") - print(f" diff {dump_dir}/no_dp_hlo.txt {dump_dir}/with_dp_{args.dp_size}_hlo.txt") - print(f"\n4. Or use XLA dump for more detail:") + print(f" - with_dp_2_hlo.txt") + print(f"\n2. Or use XLA dump for more detail:") print(f" XLA_FLAGS='--xla_dump_to={dump_dir}/xla_dump --xla_dump_hlo_as_text' python {__file__} --mode {args.mode}") print() From 1c47277566201213c1b10958b19f59eadc537bbf Mon Sep 17 00:00:00 2001 From: wenxindongwork Date: Tue, 18 Nov 2025 21:46:17 +0000 Subject: [PATCH 15/17] wip --- repro_attention_dp.py | 14 ++++++++++++-- 1 file changed, 12 insertions(+), 2 deletions(-) diff --git a/repro_attention_dp.py b/repro_attention_dp.py index 6636b8177..584e676a3 100644 --- a/repro_attention_dp.py +++ b/repro_attention_dp.py @@ -20,8 +20,9 @@ # sys.path.insert(0, '/home/wenxindong_google_com/tpu-inference') from tpu_inference.kernels.ragged_paged_attention.v3.kernel_hd64 import ( - get_kv_cache_shape, + get_kv_cache_shape as get_kv_cache_shape_h64, ) +from tpu_inference.kernels.ragged_paged_attention.v3.kernel import get_kv_cache_shape from tpu_inference.layers.common.sharding import ShardingAxisName from tpu_inference.layers.common.attention_metadata import AttentionMetadata @@ -56,7 +57,8 @@ def create_test_inputs( ) for i in range(dp_size)], axis=0) # KV cache - kv_cache_shape = get_kv_cache_shape( + get_kv_cache_shape_fn = get_kv_cache_shape_h64 if head_dim == 64 else get_kv_cache_shape + kv_cache_shape = get_kv_cache_shape_fn( total_num_pages, page_size, num_kv_heads, @@ -1686,3 +1688,11 @@ def main(): if __name__ == '__main__': main() + + +# ================================================================================ +# COMPARISON +# ================================================================================ +# No DP time: 2.63 ms +# With DP time: 2.62 ms +# ✓ DP is 1.00x FASTER \ No newline at end of file From abb1d9af401abcde44d63ea40059ef1dc34f1b6e Mon Sep 17 00:00:00 2001 From: wenxindongwork Date: Tue, 18 Nov 2025 22:14:09 +0000 Subject: [PATCH 16/17] wip --- debug_attn_dp.txt | 233 ---- debugging.txt | 423 ------- debugging_baseline.txt | 732 ------------ oss_log_98.txt | 2508 --------------------------------------- oss_log_attn_dp.txt | 2564 ---------------------------------------- oss_log_baseline.txt | 2410 ------------------------------------- oss_log_numerics.txt | 270 ----- 7 files changed, 9140 deletions(-) delete mode 100644 debug_attn_dp.txt delete mode 100644 debugging.txt delete mode 100644 debugging_baseline.txt delete mode 100644 oss_log_98.txt delete mode 100644 oss_log_attn_dp.txt delete mode 100644 oss_log_baseline.txt delete mode 100644 oss_log_numerics.txt diff --git a/debug_attn_dp.txt b/debug_attn_dp.txt deleted file mode 100644 index 24e8e7f8d..000000000 --- a/debug_attn_dp.txt +++ /dev/null @@ -1,233 +0,0 @@ -INFO 11-14 05:25:30 [__init__.py:26] TPU info: node_name=cuiq-infer-v7-2 | tpu_type=tpu7x-8 | worker_id=0 | num_chips=8 | num_cores_per_chip=2 -INFO 11-14 05:25:30 [importing.py:44] Triton is installed but 0 active driver(s) found (expected 1). Disabling Triton to prevent runtime errors. -INFO 11-14 05:25:30 [importing.py:68] Triton not installed or not compatible; certain GPU-related functions will not be available. -WARNING 11-14 05:25:30 [interface.py:197] Failed to import from vllm._C: ModuleNotFoundError("No module named 'vllm._C'") -INFO 11-14 05:25:31 [utils.py:253] non-default args: {'download_dir': '/mnt/disks/persist', 'max_model_len': 1024, 'tensor_parallel_size': 8, 'num_redundant_experts': None, 'eplb_window_size': None, 'eplb_step_interval': None, 'eplb_log_balancedness': None, 'gpu_memory_utilization': 0.8, 'enable_lora': None, 'reasoning_parser_plugin': '', 'additional_config': {'sharding': {'sharding_strategy': {'enable_dp_attention': 1}}}, 'async_scheduling': True, 'model': 'unsloth/gpt-oss-120b-BF16'} -INFO 11-14 05:25:32 [model.py:630] Resolved architecture: GptOssForCausalLM -INFO 11-14 05:25:32 [model.py:1728] Using max model len 1024 -WARNING 11-14 05:25:32 [tpu_jax.py:82] Error getting device name: 'NoneType' object has no attribute 'name' -INFO 11-14 05:25:32 [scheduler.py:254] Chunked prefill is enabled with max_num_batched_tokens=8192. -INFO 11-14 05:25:32 [config.py:272] Overriding max cuda graph capture size to 1024 for performance. -INFO 11-14 05:25:32 [tpu_jax.py:118] Initialized sharding configuration: ShardingConfigManager(total_devices=8, sharding_strategy=ShardingStrategy(tensor_parallelism=4, expert_parallelism=1, sequence_parallelism=1, data_parallelism=1, attention_data_parallelism=2), device_indexes=None) -WARNING 11-14 05:25:32 [tpu_jax.py:156] The model dtype is not properly set for JAX backend. Overwriting it to jnp.bfloat16 -INFO 11-14 05:25:32 [tpu_jax.py:192] Force using UniProcExecutor for JAX on single host. -(EngineCore_DP0 pid=4095770) INFO 11-14 05:25:33 [core.py:94] Initializing a V1 LLM engine (v0.11.1rc7.dev48+gdf4d3a44a) with config: model='unsloth/gpt-oss-120b-BF16', speculative_config=None, tokenizer='unsloth/gpt-oss-120b-BF16', skip_tokenizer_init=False, tokenizer_mode=auto, revision=None, tokenizer_revision=None, trust_remote_code=False, dtype=torch.bfloat16, max_seq_len=1024, download_dir='/mnt/disks/persist', load_format=auto, tensor_parallel_size=8, pipeline_parallel_size=1, data_parallel_size=1, disable_custom_all_reduce=True, quantization=None, enforce_eager=False, kv_cache_dtype=auto, device_config=None, structured_outputs_config=StructuredOutputsConfig(backend='auto', disable_fallback=False, disable_any_whitespace=False, disable_additional_properties=False, reasoning_parser='openai_gptoss', reasoning_parser_plugin='', enable_in_reasoning=False), observability_config=ObservabilityConfig(show_hidden_metrics_for_version=None, otlp_traces_endpoint=None, collect_detailed_traces=None), seed=0, served_model_name=unsloth/gpt-oss-120b-BF16, enable_prefix_caching=True, chunked_prefill_enabled=True, pooler_config=None, compilation_config={'level': None, 'mode': 2, 'debug_dump_path': None, 'cache_dir': '', 'compile_cache_save_format': 'binary', 'backend': 'openxla', 'custom_ops': ['all'], 'splitting_ops': None, 'compile_mm_encoder': True, 'use_inductor': None, 'compile_sizes': None, 'inductor_compile_config': {'enable_auto_functionalized_v2': False}, 'inductor_passes': {}, 'cudagraph_mode': , 'use_cudagraph': True, 'cudagraph_num_of_warmups': 0, 'cudagraph_capture_sizes': None, 'cudagraph_copy_inputs': False, 'full_cuda_graph': False, 'cudagraph_specialize_lora': True, 'use_inductor_graph_partition': False, 'pass_config': {}, 'max_cudagraph_capture_size': 1024, 'local_cache_dir': None} -(EngineCore_DP0 pid=4095770) WARNING 11-14 05:25:33 [tpu_jax.py:228] Pin memory is not supported on TPU. -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -(EngineCore_DP0 pid=4095770) INFO 11-14 05:25:38 [parallel_state.py:1325] rank 0 in world size 1 is assigned as DP rank 0, PP rank 0, TP rank 0, EP rank 0 -(EngineCore_DP0 pid=4095770) INFO 11-14 05:25:38 [tpu_jax_runner.py:274] Init mesh | mesh=Mesh('data': 1, 'model': 4, axis_types=(Auto, Auto)) -(EngineCore_DP0 pid=4095770) INFO 11-14 05:25:38 [utils.py:93] Prepared token paddings: [16, 32, 64, 128, 256, 512, 1024, 2048, 4096, 8192, 16384] -(EngineCore_DP0 pid=4095770) INFO 11-14 05:25:38 [utils.py:59] Prepared request paddings: [8, 16, 32, 64, 128, 256, 512] -(EngineCore_DP0 pid=4095770) INFO 11-14 05:25:38 [compilation_manager.py:34] Enabling JAX compile cache. -(EngineCore_DP0 pid=4095770) INFO 11-14 05:25:38 [tpu_worker_jax.py:152] Init worker | rank=0 | node_id=0 | is_driver_worker=True | hbm=[(0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75)]GiB -(EngineCore_DP0 pid=4095770) INFO 11-14 05:25:38 [model_loader.py:318] Loading model with MODEL_IMPL_TYPE=vllm -(EngineCore_DP0 pid=4095770) WARNING 11-14 05:25:39 [rocm.py:34] Failed to import from amdsmi with ModuleNotFoundError("No module named 'amdsmi'") -(EngineCore_DP0 pid=4095770) WARNING 11-14 05:25:39 [rocm.py:39] Failed to import from vllm._C with ModuleNotFoundError("No module named 'vllm._C'") -(EngineCore_DP0 pid=4095770) WARNING 11-14 05:25:39 [rocm.py:45] Failed to import from vllm._rocm_C with ModuleNotFoundError("No module named 'vllm._rocm_C'") -(EngineCore_DP0 pid=4095770) WARNING 11-14 05:25:39 [registry.py:171] _Backend has been renamed to AttentionBackendEnum. Please update your code to use AttentionBackendEnum instead. _Backend will be removed in a future release. -(EngineCore_DP0 pid=4095770) INFO 11-14 05:25:39 [tpu_jax.py:63] Cannot use None backend on TPU. -(EngineCore_DP0 pid=4095770) INFO 11-14 05:25:39 [tpu_jax.py:66] Using Pallas V1 backend. -(EngineCore_DP0 pid=4095770) INFO 11-14 05:25:39 [layer.py:331] Disabling MoE shared_experts cuda stream -(EngineCore_DP0 pid=4095770) Loading safetensors checkpoint shards: 0% Completed | 0/73 [00:00 - main(args) - File "/home/wenxindong_google_com/tpu-inference/examples/offline_inference.py", line 37, in main - llm = LLM(**args) - ^^^^^^^^^^^ - File "/home/wenxindong_google_com/vllm/vllm/entrypoints/llm.py", line 341, in __init__ - self.llm_engine = LLMEngine.from_engine_args( - ^^^^^^^^^^^^^^^^^^^^^^^^^^^ - File "/home/wenxindong_google_com/vllm/vllm/v1/engine/llm_engine.py", line 174, in from_engine_args - return cls( - ^^^^ - File "/home/wenxindong_google_com/vllm/vllm/v1/engine/llm_engine.py", line 108, in __init__ - self.engine_core = EngineCoreClient.make_client( - ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ - File "/home/wenxindong_google_com/vllm/vllm/v1/engine/core_client.py", line 93, in make_client - return SyncMPClient(vllm_config, executor_class, log_stats) - ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ - File "/home/wenxindong_google_com/vllm/vllm/v1/engine/core_client.py", line 640, in __init__ - super().__init__( - File "/home/wenxindong_google_com/vllm/vllm/v1/engine/core_client.py", line 469, in __init__ - with launch_core_engines(vllm_config, executor_class, log_stats) as ( - ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ - File "/mnt/disks/persist/vllm_conda/lib/python3.12/contextlib.py", line 144, in __exit__ - next(self.gen) - File "/home/wenxindong_google_com/vllm/vllm/v1/engine/utils.py", line 898, in launch_core_engines - wait_for_engine_startup( - File "/home/wenxindong_google_com/vllm/vllm/v1/engine/utils.py", line 955, in wait_for_engine_startup - raise RuntimeError( -RuntimeError: Engine core initialization failed. See root cause above. Failed core proc(s): {} diff --git a/debugging.txt b/debugging.txt deleted file mode 100644 index 66da4ea0e..000000000 --- a/debugging.txt +++ /dev/null @@ -1,423 +0,0 @@ -INFO 11-14 06:43:43 [__init__.py:26] TPU info: node_name=cuiq-infer-v7-2 | tpu_type=tpu7x-8 | worker_id=0 | num_chips=8 | num_cores_per_chip=2 -INFO 11-14 06:43:43 [importing.py:44] Triton is installed but 0 active driver(s) found (expected 1). Disabling Triton to prevent runtime errors. -INFO 11-14 06:43:43 [importing.py:68] Triton not installed or not compatible; certain GPU-related functions will not be available. -WARNING 11-14 06:43:43 [interface.py:197] Failed to import from vllm._C: ModuleNotFoundError("No module named 'vllm._C'") -INFO 11-14 06:43:44 [utils.py:253] non-default args: {'download_dir': '/mnt/disks/persist', 'max_model_len': 1024, 'tensor_parallel_size': 4, 'data_parallel_size': 2, 'num_redundant_experts': None, 'eplb_window_size': None, 'eplb_step_interval': None, 'eplb_log_balancedness': None, 'enable_lora': None, 'reasoning_parser_plugin': '', 'model': 'unsloth/gpt-oss-120b-BF16'} -INFO 11-14 06:43:45 [model.py:630] Resolved architecture: GptOssForCausalLM -INFO 11-14 06:43:45 [model.py:1728] Using max model len 1024 -WARNING 11-14 06:43:45 [tpu_jax.py:82] Error getting device name: 'NoneType' object has no attribute 'name' -INFO 11-14 06:43:45 [scheduler.py:254] Chunked prefill is enabled with max_num_batched_tokens=8192. -INFO 11-14 06:43:45 [config.py:272] Overriding max cuda graph capture size to 1024 for performance. -INFO 11-14 06:43:45 [tpu_jax.py:118] Initialized sharding configuration: ShardingConfigManager(total_devices=8, sharding_strategy=ShardingStrategy(tensor_parallelism=4, expert_parallelism=1, sequence_parallelism=1, data_parallelism=2, attention_data_parallelism=1), device_indexes=None) -WARNING 11-14 06:43:45 [tpu_jax.py:156] The model dtype is not properly set for JAX backend. Overwriting it to jnp.bfloat16 -INFO 11-14 06:43:45 [tpu_jax.py:192] Force using UniProcExecutor for JAX on single host. -(EngineCore_DP0 pid=113991) INFO 11-14 06:43:46 [core.py:94] Initializing a V1 LLM engine (v0.11.1rc7.dev48+gdf4d3a44a) with config: model='unsloth/gpt-oss-120b-BF16', speculative_config=None, tokenizer='unsloth/gpt-oss-120b-BF16', skip_tokenizer_init=False, tokenizer_mode=auto, revision=None, tokenizer_revision=None, trust_remote_code=False, dtype=torch.bfloat16, max_seq_len=1024, download_dir='/mnt/disks/persist', load_format=auto, tensor_parallel_size=4, pipeline_parallel_size=1, data_parallel_size=1, disable_custom_all_reduce=True, quantization=None, enforce_eager=False, kv_cache_dtype=auto, device_config=None, structured_outputs_config=StructuredOutputsConfig(backend='auto', disable_fallback=False, disable_any_whitespace=False, disable_additional_properties=False, reasoning_parser='openai_gptoss', reasoning_parser_plugin='', enable_in_reasoning=False), observability_config=ObservabilityConfig(show_hidden_metrics_for_version=None, otlp_traces_endpoint=None, collect_detailed_traces=None), seed=0, served_model_name=unsloth/gpt-oss-120b-BF16, enable_prefix_caching=True, chunked_prefill_enabled=True, pooler_config=None, compilation_config={'level': None, 'mode': 2, 'debug_dump_path': None, 'cache_dir': '', 'compile_cache_save_format': 'binary', 'backend': 'openxla', 'custom_ops': ['all'], 'splitting_ops': None, 'compile_mm_encoder': True, 'use_inductor': None, 'compile_sizes': None, 'inductor_compile_config': {'enable_auto_functionalized_v2': False}, 'inductor_passes': {}, 'cudagraph_mode': , 'use_cudagraph': True, 'cudagraph_num_of_warmups': 0, 'cudagraph_capture_sizes': None, 'cudagraph_copy_inputs': False, 'full_cuda_graph': False, 'cudagraph_specialize_lora': True, 'use_inductor_graph_partition': False, 'pass_config': {}, 'max_cudagraph_capture_size': 1024, 'local_cache_dir': None} -(EngineCore_DP0 pid=113991) WARNING 11-14 06:43:46 [tpu_jax.py:228] Pin memory is not supported on TPU. -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -(EngineCore_DP0 pid=113991) INFO 11-14 06:43:51 [parallel_state.py:1325] rank 0 in world size 1 is assigned as DP rank 0, PP rank 0, TP rank 0, EP rank 0 -(EngineCore_DP0 pid=113991) INFO 11-14 06:43:51 [tpu_jax_runner.py:274] Init mesh | mesh=Mesh('data': 2, 'model': 4, axis_types=(Auto, Auto)) -(EngineCore_DP0 pid=113991) INFO 11-14 06:43:51 [utils.py:93] Prepared token paddings: [16, 32, 64, 128, 256, 512, 1024, 2048, 4096, 8192, 16384] -(EngineCore_DP0 pid=113991) INFO 11-14 06:43:52 [utils.py:59] Prepared request paddings: [8, 16, 32, 64, 128, 256, 512] -(EngineCore_DP0 pid=113991) INFO 11-14 06:43:52 [compilation_manager.py:34] Enabling JAX compile cache. -(EngineCore_DP0 pid=113991) INFO 11-14 06:43:52 [tpu_worker_jax.py:152] Init worker | rank=0 | node_id=0 | is_driver_worker=True | hbm=[(0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75)]GiB -(EngineCore_DP0 pid=113991) INFO 11-14 06:43:52 [model_loader.py:318] Loading model with MODEL_IMPL_TYPE=vllm -(EngineCore_DP0 pid=113991) WARNING 11-14 06:43:53 [rocm.py:34] Failed to import from amdsmi with ModuleNotFoundError("No module named 'amdsmi'") -(EngineCore_DP0 pid=113991) WARNING 11-14 06:43:53 [rocm.py:39] Failed to import from vllm._C with ModuleNotFoundError("No module named 'vllm._C'") -(EngineCore_DP0 pid=113991) WARNING 11-14 06:43:53 [rocm.py:45] Failed to import from vllm._rocm_C with ModuleNotFoundError("No module named 'vllm._rocm_C'") -(EngineCore_DP0 pid=113991) WARNING 11-14 06:43:53 [registry.py:171] _Backend has been renamed to AttentionBackendEnum. Please update your code to use AttentionBackendEnum instead. _Backend will be removed in a future release. -(EngineCore_DP0 pid=113991) INFO 11-14 06:43:53 [tpu_jax.py:63] Cannot use None backend on TPU. -(EngineCore_DP0 pid=113991) INFO 11-14 06:43:53 [tpu_jax.py:66] Using Pallas V1 backend. -(EngineCore_DP0 pid=113991) INFO 11-14 06:43:53 [layer.py:331] Disabling MoE shared_experts cuda stream -(EngineCore_DP0 pid=113991) Loading safetensors checkpoint shards: 0% Completed | 0/73 [00:00. This scheduler interface is not public and compatibility may not be maintained. -(EngineCore_DP0 pid=113991) INFO 11-14 06:45:29 [dp_scheduler.py:93] DPScheduler (Async = False) per-rank limits: max_seqs=256, max_tokens=8192 -(EngineCore_DP0 pid=113991) INFO 11-14 06:45:29 [tpu_jax.py:118] Initialized sharding configuration: ShardingConfigManager(total_devices=4, sharding_strategy=ShardingStrategy(tensor_parallelism=4, expert_parallelism=1, sequence_parallelism=1, data_parallelism=1, attention_data_parallelism=1), device_indexes=None) -(EngineCore_DP0 pid=113991) WARNING 11-14 06:45:29 [tpu_jax.py:156] The model dtype is not properly set for JAX backend. Overwriting it to jnp.bfloat16 -(EngineCore_DP0 pid=113991) INFO 11-14 06:45:29 [tpu_jax.py:192] Force using UniProcExecutor for JAX on single host. -INFO 11-14 06:45:29 [llm.py:350] Supported tasks: ['generate'] - Adding requests: 0%| | 0/35 [00:00, 'use_cudagraph': True, 'cudagraph_num_of_warmups': 0, 'cudagraph_capture_sizes': None, 'cudagraph_copy_inputs': False, 'full_cuda_graph': False, 'cudagraph_specialize_lora': True, 'use_inductor_graph_partition': False, 'pass_config': {}, 'max_cudagraph_capture_size': 1024, 'local_cache_dir': None}, -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [dump_input.py:79] Dumping scheduler output for model execution: DPSchedulerOutput(scheduled_new_reqs=[NewRequestData(req_id=0,prompt_token_ids_len=5,mm_features=[],sampling_params=SamplingParams(n=1, presence_penalty=0.0, frequency_penalty=0.0, repetition_penalty=1.0, temperature=1.0, top_p=1.0, top_k=0, min_p=0.0, seed=None, stop=[], stop_token_ids=[199999], bad_words=[], include_stop_str_in_output=False, ignore_eos=False, max_tokens=16, min_tokens=0, logprobs=None, prompt_logprobs=None, skip_special_tokens=True, spaces_between_special_tokens=True, truncate_prompt_tokens=None, structured_outputs=None, extra_args=None),block_ids=([1],),num_computed_tokens=0,lora_request=None,prompt_embeds_shape=None)], scheduled_cached_reqs=CachedRequestData(req_ids=[], resumed_req_ids=[], new_token_ids=[], all_token_ids=[], new_block_ids=[], num_computed_tokens=[], num_output_tokens=[]), num_scheduled_tokens={0: 5}, total_num_scheduled_tokens=5, scheduled_spec_decode_tokens={}, scheduled_encoder_inputs={}, num_common_prefix_blocks=[1], finished_req_ids=[], free_encoder_mm_hashes=[], pending_structured_output_tokens=false, kv_connector_metadata=null, assigned_dp_rank={0: 0}) -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [dump_input.py:81] Dumping scheduler stats: SchedulerStats(num_running_reqs=1, num_waiting_reqs=0, step_counter=0, current_wave=0, kv_cache_usage=1.9061415881982402e-05, prefix_cache_stats=PrefixCacheStats(reset=False, requests=3, queries=15, hits=0, preempted_requests=0, preempted_queries=0, preempted_hits=0), connector_prefix_cache_stats=None, spec_decoding_stats=None, kv_connector_stats=None, waiting_lora_adapters={}, running_lora_adapters={}) -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] EngineCore encountered a fatal error. -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] Traceback (most recent call last): -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/vllm/vllm/v1/engine/core.py", line 848, in run_engine_core -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] engine_core.run_busy_loop() -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/vllm/vllm/v1/engine/core.py", line 875, in run_busy_loop -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] self._process_engine_step() -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/vllm/vllm/v1/engine/core.py", line 904, in _process_engine_step -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] outputs, model_executed = self.step_fn() -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/vllm/vllm/v1/engine/core.py", line 332, in step -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] model_output = future.result() -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/mnt/disks/persist/vllm_conda/lib/python3.12/concurrent/futures/_base.py", line 449, in result -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return self.__get_result() -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/mnt/disks/persist/vllm_conda/lib/python3.12/concurrent/futures/_base.py", line 401, in __get_result -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] raise self._exception -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/vllm/vllm/v1/executor/uniproc_executor.py", line 79, in collective_rpc -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] result = run_method(self.driver_worker, method, args, kwargs) -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/vllm/vllm/v1/serial_utils.py", line 459, in run_method -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return func(*args, **kwargs) -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/vllm/vllm/v1/worker/worker_base.py", line 367, in execute_model -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return self.worker.execute_model(scheduler_output, *args, **kwargs) -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/tpu-inference/tpu_inference/worker/tpu_worker_jax.py", line 198, in execute_model -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] output = self.model_runner.execute_model(scheduler_output) -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/tpu-inference/tpu_inference/utils.py", line 313, in wrapper -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] result = func(*args, **kwargs) -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/tpu-inference/tpu_inference/runner/tpu_jax_runner.py", line 526, in execute_model -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] _, output = self._execute_model(scheduler_output) -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/tpu-inference/tpu_inference/runner/tpu_jax_runner.py", line 717, in _execute_model -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] aux_hidden_states) = self.model_fn( -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/tpu-inference/tpu_inference/models/vllm/vllm_model_wrapper.py", line 169, in step_fun -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] hidden_states = torch.func.functional_call( -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/_functorch/functional_call.py", line 148, in functional_call -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return nn.utils.stateless._functional_call( -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/utils/stateless.py", line 282, in _functional_call -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return module(*args, **kwargs) -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1773, in _wrapped_call_impl -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return self._call_impl(*args, **kwargs) -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1784, in _call_impl -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return forward_call(*args, **kwargs) -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/tpu-inference/tpu_inference/models/vllm/vllm_model_wrapper.py", line 46, in forward -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return self.compute_hidden_state( -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/tpu-inference/tpu_inference/models/vllm/vllm_model_wrapper.py", line 60, in compute_hidden_state -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] hidden_state = self.vllm_model(input_ids, positions, -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1773, in _wrapped_call_impl -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return self._call_impl(*args, **kwargs) -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1784, in _call_impl -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return forward_call(*args, **kwargs) -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/vllm/vllm/model_executor/models/gpt_oss.py", line 716, in forward -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return self.model(input_ids, positions, intermediate_tensors, inputs_embeds) -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/vllm/vllm/compilation/decorators.py", line 470, in __call__ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] output = self.compiled_callable(*args, **kwargs) -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/_dynamo/eval_frame.py", line 761, in compile_wrapper -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] _maybe_set_eval_frame(prior) -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/vllm/vllm/model_executor/models/gpt_oss.py", line 299, in forward -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] x, residual = layer(x, positions, residual) -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1773, in _wrapped_call_impl -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return self._call_impl(*args, **kwargs) -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1784, in _call_impl -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return forward_call(*args, **kwargs) -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/vllm/vllm/model_executor/models/gpt_oss.py", line 236, in forward -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] output = self.mlp(hidden_states) -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1773, in _wrapped_call_impl -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return self._call_impl(*args, **kwargs) -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1784, in _call_impl -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return forward_call(*args, **kwargs) -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/vllm/vllm/model_executor/models/gpt_oss.py", line 189, in forward -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] x = self.experts(hidden_states=x, router_logits=g) -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1773, in _wrapped_call_impl -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return self._call_impl(*args, **kwargs) -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1784, in _call_impl -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return forward_call(*args, **kwargs) -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/vllm/vllm/model_executor/custom_op.py", line 46, in forward -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return self._forward_method(*args, **kwargs) -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/vllm/vllm/model_executor/custom_op.py", line 76, in forward_tpu -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return self.forward_native(*args, **kwargs) -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/vllm/vllm/model_executor/layers/fused_moe/layer.py", line 1487, in forward_native -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] fused_output = self.forward_impl(hidden_states, router_logits) -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/vllm/vllm/model_executor/layers/fused_moe/layer.py", line 1745, in forward_impl -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] final_hidden_states = self.quant_method.apply( -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/tpu-inference/tpu_inference/layers/vllm/quantization/unquantized.py", line 363, in apply -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] output = fused_moe_func_padded( -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/tpu-inference/tpu_inference/layers/vllm/fused_moe.py", line 491, in fused_moe_func_padded -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] return x -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/tpu-inference/tpu_inference/layers/vllm/fused_moe.py", line 388, in fused_moe_func -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] x1, x2 = tensor_sharded_gmm_merged_column_parallel( -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] File "/home/wenxindong_google_com/tpu-inference/tpu_inference/layers/vllm/fused_moe.py", line 124, in tensor_sharded_gmm_merged_column_parallel -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] gmm_result = shard_map( -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] ValueError: The context mesh AbstractMesh('data': 2, 'model': 4, axis_types=(Manual, Manual), device_kind=TPU7x, num_cores=1) should match the mesh passed to shard_map Mesh('data': 2, 'model': 4, axis_types=(Auto, Auto)) -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] -------------------- -(EngineCore_DP0 pid=113991) ERROR 11-14 06:45:30 [core.py:857] For simplicity, JAX has removed its internal frames from the traceback of the following exception. Set JAX_TRACEBACK_FILTERING=off to include these. -(EngineCore_DP0 pid=113991) Process EngineCore_DP0: -Traceback (most recent call last): - File "/home/wenxindong_google_com/tpu-inference/examples/offline_inference.py", line 113, in - main(args) - File "/home/wenxindong_google_com/tpu-inference/examples/offline_inference.py", line 92, in main - outputs = llm.generate(prompts, sampling_params) - ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ - File "/home/wenxindong_google_com/vllm/vllm/entrypoints/llm.py", line 446, in generate - outputs = self._run_engine(use_tqdm=use_tqdm) - ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ - File "/home/wenxindong_google_com/vllm/vllm/entrypoints/llm.py", line 1736, in _run_engine - step_outputs = self.llm_engine.step() - ^^^^^^^^^^^^^^^^^^^^^^ - File "/home/wenxindong_google_com/vllm/vllm/v1/engine/llm_engine.py", line 285, in step - outputs = self.engine_core.get_output() -(EngineCore_DP0 pid=113991) Traceback (most recent call last): - ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ - File "/home/wenxindong_google_com/vllm/vllm/v1/engine/core_client.py", line 709, in get_output - raise self._format_exception(outputs) from None -vllm.v1.engine.exceptions.EngineDeadError: EngineCore encountered an issue. See stack trace (above) for the root cause. -(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/multiprocessing/process.py", line 314, in _bootstrap -(EngineCore_DP0 pid=113991) self.run() -(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/multiprocessing/process.py", line 108, in run -(EngineCore_DP0 pid=113991) self._target(*self._args, **self._kwargs) -(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/v1/engine/core.py", line 859, in run_engine_core -(EngineCore_DP0 pid=113991) raise e -(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/v1/engine/core.py", line 848, in run_engine_core -(EngineCore_DP0 pid=113991) engine_core.run_busy_loop() -(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/v1/engine/core.py", line 875, in run_busy_loop -(EngineCore_DP0 pid=113991) self._process_engine_step() -(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/v1/engine/core.py", line 904, in _process_engine_step -(EngineCore_DP0 pid=113991) outputs, model_executed = self.step_fn() -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/v1/engine/core.py", line 332, in step -(EngineCore_DP0 pid=113991) model_output = future.result() -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/concurrent/futures/_base.py", line 449, in result -(EngineCore_DP0 pid=113991) return self.__get_result() -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/concurrent/futures/_base.py", line 401, in __get_result -(EngineCore_DP0 pid=113991) raise self._exception -(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/v1/executor/uniproc_executor.py", line 79, in collective_rpc -(EngineCore_DP0 pid=113991) result = run_method(self.driver_worker, method, args, kwargs) -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/v1/serial_utils.py", line 459, in run_method -(EngineCore_DP0 pid=113991) return func(*args, **kwargs) -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/v1/worker/worker_base.py", line 367, in execute_model -(EngineCore_DP0 pid=113991) return self.worker.execute_model(scheduler_output, *args, **kwargs) -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/tpu-inference/tpu_inference/worker/tpu_worker_jax.py", line 198, in execute_model -(EngineCore_DP0 pid=113991) output = self.model_runner.execute_model(scheduler_output) -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/tpu-inference/tpu_inference/utils.py", line 313, in wrapper -(EngineCore_DP0 pid=113991) result = func(*args, **kwargs) -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/tpu-inference/tpu_inference/runner/tpu_jax_runner.py", line 526, in execute_model -(EngineCore_DP0 pid=113991) _, output = self._execute_model(scheduler_output) -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/tpu-inference/tpu_inference/runner/tpu_jax_runner.py", line 717, in _execute_model -(EngineCore_DP0 pid=113991) aux_hidden_states) = self.model_fn( -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/tpu-inference/tpu_inference/models/vllm/vllm_model_wrapper.py", line 169, in step_fun -(EngineCore_DP0 pid=113991) hidden_states = torch.func.functional_call( -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/_functorch/functional_call.py", line 148, in functional_call -(EngineCore_DP0 pid=113991) return nn.utils.stateless._functional_call( -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/utils/stateless.py", line 282, in _functional_call -(EngineCore_DP0 pid=113991) return module(*args, **kwargs) -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1773, in _wrapped_call_impl -(EngineCore_DP0 pid=113991) return self._call_impl(*args, **kwargs) -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1784, in _call_impl -(EngineCore_DP0 pid=113991) return forward_call(*args, **kwargs) -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/tpu-inference/tpu_inference/models/vllm/vllm_model_wrapper.py", line 46, in forward -(EngineCore_DP0 pid=113991) return self.compute_hidden_state( -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/tpu-inference/tpu_inference/models/vllm/vllm_model_wrapper.py", line 60, in compute_hidden_state -(EngineCore_DP0 pid=113991) hidden_state = self.vllm_model(input_ids, positions, -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1773, in _wrapped_call_impl -(EngineCore_DP0 pid=113991) return self._call_impl(*args, **kwargs) -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1784, in _call_impl -(EngineCore_DP0 pid=113991) return forward_call(*args, **kwargs) -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/model_executor/models/gpt_oss.py", line 716, in forward -(EngineCore_DP0 pid=113991) return self.model(input_ids, positions, intermediate_tensors, inputs_embeds) -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/compilation/decorators.py", line 470, in __call__ -(EngineCore_DP0 pid=113991) output = self.compiled_callable(*args, **kwargs) -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/_dynamo/eval_frame.py", line 761, in compile_wrapper -(EngineCore_DP0 pid=113991) _maybe_set_eval_frame(prior) -(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/model_executor/models/gpt_oss.py", line 299, in forward -(EngineCore_DP0 pid=113991) x, residual = layer(x, positions, residual) -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1773, in _wrapped_call_impl -(EngineCore_DP0 pid=113991) return self._call_impl(*args, **kwargs) -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1784, in _call_impl -(EngineCore_DP0 pid=113991) return forward_call(*args, **kwargs) -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/model_executor/models/gpt_oss.py", line 236, in forward -(EngineCore_DP0 pid=113991) output = self.mlp(hidden_states) -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1773, in _wrapped_call_impl -(EngineCore_DP0 pid=113991) return self._call_impl(*args, **kwargs) -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1784, in _call_impl -(EngineCore_DP0 pid=113991) return forward_call(*args, **kwargs) -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/model_executor/models/gpt_oss.py", line 189, in forward -(EngineCore_DP0 pid=113991) x = self.experts(hidden_states=x, router_logits=g) -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1773, in _wrapped_call_impl -(EngineCore_DP0 pid=113991) return self._call_impl(*args, **kwargs) -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torch/nn/modules/module.py", line 1784, in _call_impl -(EngineCore_DP0 pid=113991) return forward_call(*args, **kwargs) -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/model_executor/custom_op.py", line 46, in forward -(EngineCore_DP0 pid=113991) return self._forward_method(*args, **kwargs) -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/model_executor/custom_op.py", line 76, in forward_tpu -(EngineCore_DP0 pid=113991) return self.forward_native(*args, **kwargs) -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/model_executor/layers/fused_moe/layer.py", line 1487, in forward_native -(EngineCore_DP0 pid=113991) fused_output = self.forward_impl(hidden_states, router_logits) -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/vllm/vllm/model_executor/layers/fused_moe/layer.py", line 1745, in forward_impl -(EngineCore_DP0 pid=113991) final_hidden_states = self.quant_method.apply( -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/tpu-inference/tpu_inference/layers/vllm/quantization/unquantized.py", line 363, in apply -(EngineCore_DP0 pid=113991) output = fused_moe_func_padded( -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/tpu-inference/tpu_inference/layers/vllm/fused_moe.py", line 491, in fused_moe_func_padded -(EngineCore_DP0 pid=113991) return x -(EngineCore_DP0 pid=113991) ^^^^ -(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/tpu-inference/tpu_inference/layers/vllm/fused_moe.py", line 388, in fused_moe_func -(EngineCore_DP0 pid=113991) x1, x2 = tensor_sharded_gmm_merged_column_parallel( -(EngineCore_DP0 pid=113991) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(EngineCore_DP0 pid=113991) File "/home/wenxindong_google_com/tpu-inference/tpu_inference/layers/vllm/fused_moe.py", line 124, in tensor_sharded_gmm_merged_column_parallel -(EngineCore_DP0 pid=113991) gmm_result = shard_map( -(EngineCore_DP0 pid=113991) ^^^^^^^^^^ -(EngineCore_DP0 pid=113991) ValueError: The context mesh AbstractMesh('data': 2, 'model': 4, axis_types=(Manual, Manual), device_kind=TPU7x, num_cores=1) should match the mesh passed to shard_map Mesh('data': 2, 'model': 4, axis_types=(Auto, Auto)) -(EngineCore_DP0 pid=113991) -------------------- -(EngineCore_DP0 pid=113991) For simplicity, JAX has removed its internal frames from the traceback of the following exception. Set JAX_TRACEBACK_FILTERING=off to include these. - Processed prompts: 0%| | 0/35 [00:04, 'use_cudagraph': True, 'cudagraph_num_of_warmups': 0, 'cudagraph_capture_sizes': None, 'cudagraph_copy_inputs': False, 'full_cuda_graph': False, 'cudagraph_specialize_lora': True, 'use_inductor_graph_partition': False, 'pass_config': {}, 'max_cudagraph_capture_size': 1024, 'local_cache_dir': None} -(EngineCore_DP0 pid=59613) WARNING 11-14 06:25:59 [tpu_jax.py:228] Pin memory is not supported on TPU. -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -(EngineCore_DP0 pid=59613) INFO 11-14 06:26:05 [parallel_state.py:1325] rank 0 in world size 1 is assigned as DP rank 0, PP rank 0, TP rank 0, EP rank 0 -(EngineCore_DP0 pid=59613) INFO 11-14 06:26:05 [tpu_jax_runner.py:274] Init mesh | mesh=Mesh('data': 1, 'model': 4, axis_types=(Auto, Auto)) -(EngineCore_DP0 pid=59613) INFO 11-14 06:26:05 [utils.py:93] Prepared token paddings: [16, 32, 64, 128, 256, 512, 1024, 2048, 4096, 8192] -(EngineCore_DP0 pid=59613) INFO 11-14 06:26:05 [utils.py:59] Prepared request paddings: [8, 16, 32, 64, 128, 256] -(EngineCore_DP0 pid=59613) INFO 11-14 06:26:05 [compilation_manager.py:34] Enabling JAX compile cache. -(EngineCore_DP0 pid=59613) INFO 11-14 06:26:05 [tpu_worker_jax.py:152] Init worker | rank=0 | node_id=0 | is_driver_worker=True | hbm=[(0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75)]GiB -(EngineCore_DP0 pid=59613) INFO 11-14 06:26:05 [model_loader.py:318] Loading model with MODEL_IMPL_TYPE=vllm -(EngineCore_DP0 pid=59613) WARNING 11-14 06:26:06 [rocm.py:34] Failed to import from amdsmi with ModuleNotFoundError("No module named 'amdsmi'") -(EngineCore_DP0 pid=59613) WARNING 11-14 06:26:06 [rocm.py:39] Failed to import from vllm._C with ModuleNotFoundError("No module named 'vllm._C'") -(EngineCore_DP0 pid=59613) WARNING 11-14 06:26:06 [rocm.py:45] Failed to import from vllm._rocm_C with ModuleNotFoundError("No module named 'vllm._rocm_C'") -(EngineCore_DP0 pid=59613) WARNING 11-14 06:26:06 [registry.py:171] _Backend has been renamed to AttentionBackendEnum. Please update your code to use AttentionBackendEnum instead. _Backend will be removed in a future release. -(EngineCore_DP0 pid=59613) INFO 11-14 06:26:06 [tpu_jax.py:63] Cannot use None backend on TPU. -(EngineCore_DP0 pid=59613) INFO 11-14 06:26:06 [tpu_jax.py:66] Using Pallas V1 backend. -(EngineCore_DP0 pid=59613) INFO 11-14 06:26:06 [layer.py:331] Disabling MoE shared_experts cuda stream -(EngineCore_DP0 pid=59613) Loading safetensors checkpoint shards: 0% Completed | 0/73 [00:00, 'use_cudagraph': True, 'cudagraph_num_of_warmups': 0, 'cudagraph_capture_sizes': None, 'cudagraph_copy_inputs': False, 'full_cuda_graph': False, 'cudagraph_specialize_lora': True, 'use_inductor_graph_partition': False, 'pass_config': {}, 'max_cudagraph_capture_size': 1024, 'local_cache_dir': None} -(EngineCore_DP0 pid=2733848) WARNING 11-12 22:33:02 [tpu_jax.py:228] Pin memory is not supported on TPU. -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -(EngineCore_DP0 pid=2733848) INFO 11-12 22:33:07 [parallel_state.py:1325] rank 0 in world size 1 is assigned as DP rank 0, PP rank 0, TP rank 0, EP rank 0 -(EngineCore_DP0 pid=2733848) INFO 11-12 22:33:08 [tpu_jax_runner.py:278] Creating new model mesh | devices=8, num_slices=1 -(EngineCore_DP0 pid=2733848) INFO 11-12 22:33:08 [tpu_jax_runner.py:273] Init mesh | mesh=Mesh('data': 2, 'attn_dp': 1, 'expert': 1, 'model': 4, axis_types=(Auto, Auto, Auto, Auto)) -(EngineCore_DP0 pid=2733848) INFO 11-12 22:33:08 [utils.py:314] Phased-based profiler enabled. Traces will be saved to: gs://wenxindong-vm/trace/gpt_oss/dp2/kv_98 -(EngineCore_DP0 pid=2733848) INFO 11-12 22:33:08 [utils.py:93] Prepared token paddings: [16, 32, 64, 128, 256, 512, 1024, 2048, 4096, 8192, 16384] -(EngineCore_DP0 pid=2733848) INFO 11-12 22:33:08 [utils.py:59] Prepared request paddings: [8, 16, 32, 64, 128, 256, 512] -(EngineCore_DP0 pid=2733848) INFO 11-12 22:33:08 [compilation_manager.py:34] Enabling JAX compile cache. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:33:08 [tpu_worker_jax.py:152] Init worker | rank=0 | node_id=0 | is_driver_worker=True | hbm=[(0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75)]GiB -(EngineCore_DP0 pid=2733848) INFO 11-12 22:33:08 [model_loader.py:318] Loading model with MODEL_IMPL_TYPE=vllm -(EngineCore_DP0 pid=2733848) WARNING 11-12 22:33:09 [rocm.py:34] Failed to import from amdsmi with ModuleNotFoundError("No module named 'amdsmi'") -(EngineCore_DP0 pid=2733848) WARNING 11-12 22:33:09 [rocm.py:39] Failed to import from vllm._C with ModuleNotFoundError("No module named 'vllm._C'") -(EngineCore_DP0 pid=2733848) WARNING 11-12 22:33:09 [rocm.py:45] Failed to import from vllm._rocm_C with ModuleNotFoundError("No module named 'vllm._rocm_C'") -(EngineCore_DP0 pid=2733848) WARNING 11-12 22:33:09 [registry.py:171] _Backend has been renamed to AttentionBackendEnum. Please update your code to use AttentionBackendEnum instead. _Backend will be removed in a future release. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:33:09 [tpu_jax.py:63] Cannot use None backend on TPU. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:33:09 [tpu_jax.py:66] Using Pallas V1 backend. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:33:09 [layer.py:331] Disabling MoE shared_experts cuda stream -(EngineCore_DP0 pid=2733848) Loading safetensors checkpoint shards: 0% Completed | 0/73 [00:00 {'num_tokens': 16} -(EngineCore_DP0 pid=2733848) /mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torchax/tensor.py:154: UserWarning: Explicitly requested dtype int64 requested in astype is not available, and will be truncated to dtype int32. To enable more dtypes, set the jax_enable_x64 configuration option or the JAX_ENABLE_X64 shell environment variable. See https://github.com/jax-ml/jax#current-gotchas for more. -(EngineCore_DP0 pid=2733848) res = jax_function(self._elem, *args, **kwargs) -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:47] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) INFO 11-12 22:34:57 [compilation_manager.py:67] Compilation finished in 11.39 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:34:57 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 32} -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:57] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:57] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:57] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:34:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) INFO 11-12 22:35:09 [compilation_manager.py:67] Compilation finished in 12.20 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:35:09 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 64} -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:09] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:10] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) INFO 11-12 22:35:22 [compilation_manager.py:67] Compilation finished in 12.88 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:35:22 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 128} -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:24] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:24] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:24] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:24] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:24] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:24] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:24] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:24] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:24] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:24] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:24] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:24] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:24] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:24] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) INFO 11-12 22:35:40 [compilation_manager.py:67] Compilation finished in 17.50 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:35:40 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 256} -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:40] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:40] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:40] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:40] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:40] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:40] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:40] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:40] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:40] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:40] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:40] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) INFO 11-12 22:35:58 [compilation_manager.py:67] Compilation finished in 18.27 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:35:58 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 512} -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:35:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) INFO 11-12 22:36:17 [compilation_manager.py:67] Compilation finished in 19.21 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:36:18 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 1024} -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:18] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:19] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:19] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:19] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:19] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:19] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:19] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:19] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:19] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:19] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:19] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) INFO 11-12 22:36:37 [compilation_manager.py:67] Compilation finished in 19.12 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:36:37 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 2048} -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:37] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:38] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) INFO 11-12 22:36:58 [compilation_manager.py:67] Compilation finished in 21.21 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:36:58 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 4096} -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:58] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:36:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) INFO 11-12 22:37:21 [compilation_manager.py:67] Compilation finished in 23.27 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:37:22 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 8192} -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:23] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) INFO 11-12 22:37:52 [compilation_manager.py:67] Compilation finished in 30.79 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:37:52 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 16384} -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:52] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:53] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:53] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:53] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:53] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:53] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:53] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:53] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:53] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:53] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:53] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:53] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:53] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:53] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:53] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) [2025-11-12 22:37:54] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:30 [compilation_manager.py:67] Compilation finished in 37.26 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:30 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 8} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:30 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:30 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 16} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:30 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:30 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 32} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:30 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:30 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 64} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:30 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:30 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 128} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:31 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:31 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 256} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:31 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:31 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 512} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:31 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:31 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 8} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:31 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:31 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 16} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:31 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:31 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 32} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:31 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:31 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 64} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:31 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:31 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 128} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:32 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:32 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 256} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:32 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:32 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 512} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:32 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:32 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 8} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:32 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:32 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 16} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:32 [compilation_manager.py:67] Compilation finished in 0.16 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:32 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 32} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:32 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:32 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 64} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:32 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:32 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 128} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:33 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:33 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 256} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:33 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:33 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 512} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:33 [compilation_manager.py:67] Compilation finished in 0.16 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:33 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 8} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:33 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:33 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 16} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:33 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:33 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 32} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:33 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:34 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 64} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:34 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:34 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 128} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:34 [compilation_manager.py:67] Compilation finished in 0.16 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:34 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 256} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:34 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:34 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 512} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:34 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:34 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 8} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:34 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:34 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 16} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:35 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:35 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 32} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:35 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:35 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 64} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:35 [compilation_manager.py:67] Compilation finished in 0.23 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:35 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 128} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:35 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:35 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 256} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:35 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:35 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 512} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:35 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:35 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 8} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:36 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:36 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 16} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:36 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:36 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 32} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:36 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:36 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 64} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:36 [compilation_manager.py:67] Compilation finished in 0.22 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:36 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 128} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:37 [compilation_manager.py:67] Compilation finished in 0.30 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:37 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 256} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:37 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:37 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 512} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:37 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:37 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 8} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:37 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:37 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 16} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:37 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:37 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 32} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:37 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:37 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 64} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:38 [compilation_manager.py:67] Compilation finished in 0.22 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:38 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 128} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:38 [compilation_manager.py:67] Compilation finished in 0.29 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:38 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 256} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:38 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:38 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 512} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:38 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:38 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 8} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:39 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:39 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 16} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:39 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:39 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 32} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:39 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:39 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 64} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:39 [compilation_manager.py:67] Compilation finished in 0.23 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:39 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 128} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:39 [compilation_manager.py:67] Compilation finished in 0.34 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:39 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 256} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:40 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:40 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 512} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:40 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:40 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 8} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:40 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:40 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 16} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:40 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:40 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 32} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:40 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:40 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 64} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:41 [compilation_manager.py:67] Compilation finished in 0.21 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:41 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 128} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:41 [compilation_manager.py:67] Compilation finished in 0.29 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:41 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 256} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:41 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:41 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 512} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:41 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:41 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 8} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:41 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:41 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 16} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:42 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:42 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 32} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:42 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:42 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 64} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:42 [compilation_manager.py:67] Compilation finished in 0.21 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:42 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 128} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:42 [compilation_manager.py:67] Compilation finished in 0.29 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:42 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 256} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:42 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:42 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 512} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:43 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:43 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 8} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:43 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:43 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 16} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:43 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:43 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 32} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:43 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:43 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 64} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:43 [compilation_manager.py:67] Compilation finished in 0.21 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:43 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 128} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:44 [compilation_manager.py:67] Compilation finished in 0.29 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:44 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 256} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:44 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:44 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 512} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:44 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:44 [compilation_manager.py:325] Compiling select_from_array with different input shapes. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:44 [compilation_manager.py:304] Compiling select_from_array for select all logits. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:44 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16, 'index_size': 8} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:44 [compilation_manager.py:67] Compilation finished in 0.08 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:44 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16, 'index_size': 16} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:44 [compilation_manager.py:67] Compilation finished in 0.09 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:45 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 32, 'index_size': 8} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:45 [compilation_manager.py:67] Compilation finished in 0.09 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:45 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 32, 'index_size': 16} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:45 [compilation_manager.py:67] Compilation finished in 0.09 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:45 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 32, 'index_size': 32} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:45 [compilation_manager.py:67] Compilation finished in 0.10 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:45 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 64, 'index_size': 8} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:45 [compilation_manager.py:67] Compilation finished in 0.09 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:45 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 64, 'index_size': 16} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:45 [compilation_manager.py:67] Compilation finished in 0.09 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:45 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 64, 'index_size': 32} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:45 [compilation_manager.py:67] Compilation finished in 0.10 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:45 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 64, 'index_size': 64} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:45 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:45 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 8} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:46 [compilation_manager.py:67] Compilation finished in 0.09 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:46 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 16} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:46 [compilation_manager.py:67] Compilation finished in 0.10 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:46 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 32} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:46 [compilation_manager.py:67] Compilation finished in 0.11 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:46 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 64} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:46 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:46 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 128} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:46 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:46 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 8} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:46 [compilation_manager.py:67] Compilation finished in 0.11 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:46 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 16} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:46 [compilation_manager.py:67] Compilation finished in 0.11 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:46 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 32} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:47 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:47 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 64} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:47 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:47 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 128} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:47 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:47 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 256} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:47 [compilation_manager.py:67] Compilation finished in 0.31 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:47 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 8} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:48 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:48 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 16} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:48 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:48 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 32} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:48 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:48 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 64} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:48 [compilation_manager.py:67] Compilation finished in 0.16 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:48 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 128} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:48 [compilation_manager.py:67] Compilation finished in 0.21 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:48 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 256} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:49 [compilation_manager.py:67] Compilation finished in 0.33 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:49 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 512} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:49 [compilation_manager.py:67] Compilation finished in 0.55 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:49 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 8} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:49 [compilation_manager.py:67] Compilation finished in 0.16 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:49 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 16} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:50 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:50 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 32} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:50 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:50 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 64} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:50 [compilation_manager.py:67] Compilation finished in 0.21 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:50 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 128} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:50 [compilation_manager.py:67] Compilation finished in 0.26 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:50 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 256} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:51 [compilation_manager.py:67] Compilation finished in 0.36 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:51 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 512} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:51 [compilation_manager.py:67] Compilation finished in 0.59 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:51 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 8} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:52 [compilation_manager.py:67] Compilation finished in 0.25 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:52 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 16} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:52 [compilation_manager.py:67] Compilation finished in 0.25 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:52 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 32} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:52 [compilation_manager.py:67] Compilation finished in 0.27 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:52 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 64} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:52 [compilation_manager.py:67] Compilation finished in 0.30 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:52 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 128} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:53 [compilation_manager.py:67] Compilation finished in 0.35 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:53 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 256} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:53 [compilation_manager.py:67] Compilation finished in 0.52 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:53 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 512} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:54 [compilation_manager.py:67] Compilation finished in 0.76 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:54 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 8} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:55 [compilation_manager.py:67] Compilation finished in 0.46 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:55 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 16} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:55 [compilation_manager.py:67] Compilation finished in 0.44 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:55 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 32} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:56 [compilation_manager.py:67] Compilation finished in 0.45 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:56 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 64} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:56 [compilation_manager.py:67] Compilation finished in 0.47 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:56 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 128} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:57 [compilation_manager.py:67] Compilation finished in 0.54 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:57 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 256} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:57 [compilation_manager.py:67] Compilation finished in 0.64 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:57 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 512} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:57 [compilation_manager.py:67] Compilation finished in 0.02 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:58 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 8} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:58 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:58 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 16} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:58 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:58 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 32} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:58 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:58 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 64} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:58 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:58 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 128} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:58 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:58 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 256} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:59 [compilation_manager.py:67] Compilation finished in 0.32 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:59 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 512} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:59 [compilation_manager.py:67] Compilation finished in 0.58 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:38:59 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 8} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:00 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:00 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 16} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:00 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:00 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 32} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:00 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:00 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 64} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:00 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:00 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 128} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:00 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:00 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 256} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:00 [compilation_manager.py:67] Compilation finished in 0.31 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:00 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 512} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:01 [compilation_manager.py:67] Compilation finished in 0.60 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:01 [compilation_manager.py:365] Compiling compute_logits with different input shapes. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:01 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 8} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:01 [compilation_manager.py:67] Compilation finished in 0.28 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:01 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 16} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:02 [compilation_manager.py:67] Compilation finished in 0.27 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:02 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 32} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:02 [compilation_manager.py:67] Compilation finished in 0.32 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:02 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 64} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:02 [compilation_manager.py:67] Compilation finished in 0.36 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:02 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 128} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:03 [compilation_manager.py:67] Compilation finished in 0.77 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:03 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 256} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:03 [compilation_manager.py:67] Compilation finished in 0.02 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:03 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 512} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:04 [compilation_manager.py:67] Compilation finished in 0.84 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:04 [compilation_manager.py:387] Compiling sampling with different input shapes. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:05 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 8, 'do_sampling': True} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:05 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:05 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 8, 'do_sampling': False} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:05 [compilation_manager.py:67] Compilation finished in 0.21 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:05 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 16, 'do_sampling': True} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:06 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:06 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 16, 'do_sampling': False} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:06 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:06 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 32, 'do_sampling': True} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:06 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:06 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 32, 'do_sampling': False} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:07 [compilation_manager.py:67] Compilation finished in 0.31 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:07 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 64, 'do_sampling': True} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:07 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:07 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 64, 'do_sampling': False} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:08 [compilation_manager.py:67] Compilation finished in 0.53 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:08 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 128, 'do_sampling': True} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:08 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:08 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 128, 'do_sampling': False} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:08 [compilation_manager.py:67] Compilation finished in 0.02 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:09 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 256, 'do_sampling': True} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:09 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:09 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 256, 'do_sampling': False} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:09 [compilation_manager.py:67] Compilation finished in 0.22 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:09 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 512, 'do_sampling': True} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:09 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:09 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 512, 'do_sampling': False} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:10 [compilation_manager.py:67] Compilation finished in 0.39 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:10 [compilation_manager.py:455] Compiling gather_logprobs with different input shapes. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:10 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 8} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:11 [compilation_manager.py:67] Compilation finished in 0.70 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:11 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 16} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:11 [compilation_manager.py:67] Compilation finished in 0.78 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:11 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 32} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:11 [compilation_manager.py:67] Compilation finished in 0.05 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:11 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 64} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:11 [compilation_manager.py:67] Compilation finished in 0.04 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:11 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 128} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:11 [compilation_manager.py:67] Compilation finished in 0.05 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:11 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 256} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:11 [compilation_manager.py:67] Compilation finished in 0.04 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:11 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 512} -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:12 [compilation_manager.py:67] Compilation finished in 0.04 [secs]. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:12 [compilation_manager.py:751] Compiling structured_decoding with different input shapes. -(EngineCore_DP0 pid=2733848) WARNING 11-12 22:39:12 [compilation_manager.py:754] Structured decoding precompilation skipped since structured decoding is not supported with DP. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:12 [core.py:247] init engine (profile, create kv cache, warmup model) took 270.28 seconds -(EngineCore_DP0 pid=2733848) WARNING 11-12 22:39:12 [scheduler.py:158] Using custom scheduler class . This scheduler interface is not public and compatibility may not be maintained. -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:12 [dp_scheduler.py:93] DPScheduler (Async = True) per-rank limits: max_seqs=256, max_tokens=8192 -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:12 [core.py:181] Batch queue is enabled with size 2 -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:13 [tpu_jax.py:118] Initialized sharding configuration: ShardingConfigManager(total_devices=4, sharding_strategy=ShardingStrategy(tensor_parallelism=4, expert_parallelism=1, sequence_parallelism=1, data_parallelism=1, attention_data_parallelism=1), device_indexes=None) -(EngineCore_DP0 pid=2733848) WARNING 11-12 22:39:13 [tpu_jax.py:156] The model dtype is not properly set for JAX backend. Overwriting it to jnp.bfloat16 -(EngineCore_DP0 pid=2733848) INFO 11-12 22:39:13 [tpu_jax.py:192] Force using UniProcExecutor for JAX on single host. -(APIServer pid=2733675) [INFO] model_hosting_container_standards - decorators.py:76: [PING] Framework handler registered: ping -(APIServer pid=2733675) [2025-11-12 22:39:13] INFO decorators.py:76: [PING] Framework handler registered: ping -(APIServer pid=2733675) [INFO] model_hosting_container_standards.common.transforms.base_factory - base_factory.py:90: [INJECT_ADAPTER_ID] Transform decorator applied to: invocations -(APIServer pid=2733675) [2025-11-12 22:39:13] INFO base_factory.py:90: [INJECT_ADAPTER_ID] Transform decorator applied to: invocations -(APIServer pid=2733675) [INFO] model_hosting_container_standards.common.transforms.base_factory - base_factory.py:115: [INJECT_ADAPTER_ID] Registered transform handler for invocations -(APIServer pid=2733675) [2025-11-12 22:39:13] INFO base_factory.py:115: [INJECT_ADAPTER_ID] Registered transform handler for invocations -(APIServer pid=2733675) [INFO] model_hosting_container_standards.common.transforms.base_factory - base_factory.py:90: [STATEFUL_SESSION_MANAGER] Transform decorator applied to: decorated_func -(APIServer pid=2733675) [2025-11-12 22:39:13] INFO base_factory.py:90: [STATEFUL_SESSION_MANAGER] Transform decorator applied to: decorated_func -(APIServer pid=2733675) [INFO] model_hosting_container_standards.common.transforms.base_factory - base_factory.py:115: [STATEFUL_SESSION_MANAGER] Registered transform handler for decorated_func -(APIServer pid=2733675) [2025-11-12 22:39:13] INFO base_factory.py:115: [STATEFUL_SESSION_MANAGER] Registered transform handler for decorated_func -(APIServer pid=2733675) [INFO] model_hosting_container_standards - decorators.py:76: [INVOKE] Framework handler registered: decorated_func -(APIServer pid=2733675) [2025-11-12 22:39:13] INFO decorators.py:76: [INVOKE] Framework handler registered: decorated_func -(APIServer pid=2733675) [INFO] model_hosting_container_standards - __init__.py:127: Starting SageMaker bootstrap process -(APIServer pid=2733675) [2025-11-12 22:39:13] INFO __init__.py:127: Starting SageMaker bootstrap process -(APIServer pid=2733675) [INFO] model_hosting_container_standards - registry.py:109: [REGISTRY] Middleware resolution and registration complete -(APIServer pid=2733675) [2025-11-12 22:39:13] INFO registry.py:109: [REGISTRY] Middleware resolution and registration complete -(APIServer pid=2733675) [INFO] model_hosting_container_standards - core.py:100: [MIDDLEWARE_LOADER] Middleware stack rebuilt successfully -(APIServer pid=2733675) [2025-11-12 22:39:13] INFO core.py:100: [MIDDLEWARE_LOADER] Middleware stack rebuilt successfully -(APIServer pid=2733675) [INFO] model_hosting_container_standards - core.py:102: [MIDDLEWARE_LOADER] Processed 3 middlewares -(APIServer pid=2733675) [2025-11-12 22:39:13] INFO core.py:102: [MIDDLEWARE_LOADER] Processed 3 middlewares -(APIServer pid=2733675) [WARNING] model_hosting_container_standards.common.custom_code_ref_resolver.function_loader - function_loader.py:73: Failed to load function from spec 'model:custom_sagemaker_invocation_handler': HandlerFileNotFoundError: File '/opt/ml/model/model.py' not found in search paths: ['/opt/ml/model/'] -(APIServer pid=2733675) [2025-11-12 22:39:13] WARNING function_loader.py:73: Failed to load function from spec 'model:custom_sagemaker_invocation_handler': HandlerFileNotFoundError: File '/opt/ml/model/model.py' not found in search paths: ['/opt/ml/model/'] -(APIServer pid=2733675) [WARNING] model_hosting_container_standards.common.custom_code_ref_resolver.function_loader - function_loader.py:73: Failed to load function from spec 'model:custom_sagemaker_ping_handler': HandlerFileNotFoundError: File '/opt/ml/model/model.py' not found in search paths: ['/opt/ml/model/'] -(APIServer pid=2733675) [2025-11-12 22:39:13] WARNING function_loader.py:73: Failed to load function from spec 'model:custom_sagemaker_ping_handler': HandlerFileNotFoundError: File '/opt/ml/model/model.py' not found in search paths: ['/opt/ml/model/'] -(APIServer pid=2733675) [INFO] model_hosting_container_standards.sagemaker.sagemaker_router - sagemaker_router.py:93: Creating SageMaker router with unified route resolver -(APIServer pid=2733675) [2025-11-12 22:39:13] INFO sagemaker_router.py:93: Creating SageMaker router with unified route resolver -(APIServer pid=2733675) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:172: Creating router with prefix='', tags=['sagemaker'] -(APIServer pid=2733675) [2025-11-12 22:39:13] INFO routing.py:172: Creating router with prefix='', tags=['sagemaker'] -(APIServer pid=2733675) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:110: Mounting 2 handlers to router -(APIServer pid=2733675) [2025-11-12 22:39:13] INFO routing.py:110: Mounting 2 handlers to router -(APIServer pid=2733675) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:184: Router created with 0 routes -(APIServer pid=2733675) [2025-11-12 22:39:13] INFO routing.py:184: Router created with 0 routes -(APIServer pid=2733675) [INFO] model_hosting_container_standards.sagemaker.sagemaker_router - sagemaker_router.py:101: SageMaker router created successfully with 0 routes -(APIServer pid=2733675) [2025-11-12 22:39:13] INFO sagemaker_router.py:101: SageMaker router created successfully with 0 routes -(APIServer pid=2733675) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:287: Including router with conflict detection -(APIServer pid=2733675) [2025-11-12 22:39:13] INFO routing.py:287: Including router with conflict detection -(APIServer pid=2733675) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:305: Successfully included router with 0 routes -(APIServer pid=2733675) [2025-11-12 22:39:13] INFO routing.py:305: Successfully included router with 0 routes -(APIServer pid=2733675) [INFO] model_hosting_container_standards - __init__.py:139: SageMaker bootstrap completed successfully -(APIServer pid=2733675) [2025-11-12 22:39:13] INFO __init__.py:139: SageMaker bootstrap completed successfully -(APIServer pid=2733675) INFO 11-12 22:39:13 [api_server.py:1662] Supported tasks: ['generate'] -(APIServer pid=2733675) WARNING 11-12 22:39:13 [serving_responses.py:189] For gpt-oss, we ignore --enable-auto-tool-choice and always enable tool use. -(APIServer pid=2733675) INFO 11-12 22:39:13 [api_server.py:1972] Starting vLLM API server 0 on http://0.0.0.0:8000 -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:38] Available routes are: -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /openapi.json, Methods: GET, HEAD -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /docs, Methods: GET, HEAD -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /docs/oauth2-redirect, Methods: GET, HEAD -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /redoc, Methods: GET, HEAD -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /health, Methods: GET -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /load, Methods: GET -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /tokenize, Methods: POST -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /detokenize, Methods: POST -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /v1/models, Methods: GET -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /version, Methods: GET -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /v1/responses, Methods: POST -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /v1/responses/{response_id}, Methods: GET -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /v1/responses/{response_id}/cancel, Methods: POST -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /v1/messages, Methods: POST -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /v1/chat/completions, Methods: POST -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /v1/completions, Methods: POST -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /v1/embeddings, Methods: POST -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /pooling, Methods: POST -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /classify, Methods: POST -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /score, Methods: POST -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /v1/score, Methods: POST -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /v1/audio/transcriptions, Methods: POST -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /v1/audio/translations, Methods: POST -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /rerank, Methods: POST -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /v1/rerank, Methods: POST -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /v2/rerank, Methods: POST -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /scale_elastic_ep, Methods: POST -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /is_scaling_elastic_ep, Methods: POST -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /ping, Methods: GET -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /ping, Methods: POST -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /invocations, Methods: POST -(APIServer pid=2733675) INFO 11-12 22:39:13 [launcher.py:46] Route: /metrics, Methods: GET -(APIServer pid=2733675) INFO: Started server process [2733675] -(APIServer pid=2733675) INFO: Waiting for application startup. -(APIServer pid=2733675) INFO: Application startup complete. -(APIServer pid=2733675) INFO: 127.0.0.1:46880 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO 11-12 22:39:34 [loggers.py:221] Engine 000: Avg prompt throughput: 204.8 tokens/s, Avg generation throughput: 50.8 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:39:44 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 127.0 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:39:54 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 122.5 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:40:04 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 117.4 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.2%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:40:14 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 118.0 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.2%, Prefix cache hit rate: 0.0% -(EngineCore_DP0 pid=2733848) WARNING 11-12 22:40:20 [tpu_jax_runner.py:666] Should not schedule a request that does nothing! -(APIServer pid=2733675) INFO: 127.0.0.1:46880 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49068 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49078 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49094 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49098 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49112 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49116 - "POST /v1/completions HTTP/1.1" 200 OK -(EngineCore_DP0 pid=2733848) INFO 11-12 22:40:21 [utils.py:358] Starting profiling for prefill_heavy phase -(EngineCore_DP0 pid=2733848) INFO 11-12 22:40:21 [utils.py:359] Batch composition stats: {'total_num_scheduled_tokens': 8192, 'num_prefill_tokens': 12288, 'num_decode_tokens': 1, 'padded_total_num_scheduled_tokens': 16384, 'num_reqs': 7} -(APIServer pid=2733675) INFO: 127.0.0.1:49120 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49124 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49130 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49138 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49146 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49156 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49166 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49178 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49188 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49200 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49204 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49206 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49220 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49228 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49244 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49258 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49274 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49278 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49294 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49304 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49306 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49316 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49324 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49340 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49346 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49358 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49362 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49364 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49366 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49376 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49386 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49392 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49400 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49404 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49416 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49432 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49446 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49456 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49468 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49482 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49484 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49496 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49508 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49510 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49526 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49534 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49548 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49552 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49562 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49568 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49582 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49592 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49594 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49596 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49608 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49622 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49630 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49646 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49662 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49674 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49682 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49696 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49700 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49712 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49720 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49728 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49736 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49738 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49754 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49766 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49768 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49770 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49780 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49788 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49798 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49814 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49830 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49832 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49848 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49854 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49864 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49874 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49876 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49880 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49886 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49896 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49904 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49908 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49914 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49916 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49928 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49932 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49948 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49950 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49960 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49964 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49970 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49976 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49980 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:49996 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50008 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50020 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50026 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50030 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50038 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50054 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50070 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50078 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50090 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50092 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50102 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50106 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50112 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50116 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50120 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50122 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50126 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50142 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50146 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50158 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50174 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50184 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50192 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50196 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50200 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50216 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50218 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50234 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50238 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50242 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50252 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50262 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50268 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50276 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50280 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50288 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50290 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50304 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50314 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50330 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50332 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50336 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50344 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50346 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50350 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50362 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50368 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50384 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50400 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50412 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50428 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50430 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50436 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50438 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50452 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50458 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50466 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50470 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50474 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50484 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50494 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50498 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50506 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50522 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50528 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50530 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50542 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50552 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50558 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50568 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50584 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50590 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50594 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50596 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50612 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50614 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50620 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50628 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50640 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50646 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50662 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50666 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50682 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50690 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50692 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50704 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50714 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50718 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50732 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50740 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50744 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50760 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50768 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50780 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50790 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50798 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50812 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50824 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50834 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50844 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50850 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50862 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50876 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50880 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50886 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50900 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50910 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50924 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50932 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50934 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50936 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50938 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50948 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50950 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50960 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50970 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50982 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50984 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:50986 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51002 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51014 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51030 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51044 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51056 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51058 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51074 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51088 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51090 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51102 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51108 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51124 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51128 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51130 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51132 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51148 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51162 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51174 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51182 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51186 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51198 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51202 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51208 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51216 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51230 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51242 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51252 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51258 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51264 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51280 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51294 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51308 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51310 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51320 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51324 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51326 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51334 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51348 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51364 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51370 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51378 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51390 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51398 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51408 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51420 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51434 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51444 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51454 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51458 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51474 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51482 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51492 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51506 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51512 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51528 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51532 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51538 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51546 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51558 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51566 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51574 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51584 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51594 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51598 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51608 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51622 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51636 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51650 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51658 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51660 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51666 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51672 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51676 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51692 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51694 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51702 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51716 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51724 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51726 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51734 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51748 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51758 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51770 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51776 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51778 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51788 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51794 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51810 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51820 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51826 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51832 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51844 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51846 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51862 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51866 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51882 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51896 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51912 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51926 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51942 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51956 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51958 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51968 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51972 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:51984 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52000 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52012 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52016 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52018 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52032 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52048 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52056 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52062 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52064 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52068 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52078 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52094 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52098 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52106 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52110 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52112 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52126 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52136 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52142 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52156 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52158 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52164 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52176 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52192 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52204 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52212 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52216 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52232 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52234 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52240 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52242 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52258 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52264 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52276 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52278 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52280 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52284 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52292 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52298 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52312 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52324 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52326 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52330 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52344 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52358 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52370 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52378 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52388 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52404 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52408 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52416 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52420 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52436 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52442 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52450 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52456 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52470 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52472 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52488 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52500 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52504 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52520 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52526 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52534 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52540 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52542 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52554 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52566 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52572 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52580 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52586 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52602 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52608 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52614 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52630 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52638 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52642 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52654 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52656 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52664 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52668 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52672 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52680 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52684 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52696 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52706 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52710 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52724 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52732 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52746 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52760 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52774 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52788 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52790 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52800 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52814 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52824 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52840 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52848 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52852 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52856 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52870 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52876 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52878 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52890 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52892 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52906 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52908 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52912 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52926 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52930 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52942 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52948 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52952 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52962 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52972 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52978 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:52992 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53006 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53014 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53030 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53034 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53044 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53060 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53064 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53072 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53082 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53086 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53092 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53096 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53108 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53120 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53132 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53138 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53146 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53158 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53162 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53164 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53174 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53190 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53198 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53210 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53224 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53240 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53248 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53262 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53266 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53270 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53284 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53286 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53300 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53306 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53312 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53320 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53322 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53326 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53340 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53352 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53360 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53376 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53390 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53392 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53406 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53410 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53424 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53432 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53438 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53440 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53450 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53454 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53468 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53474 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53476 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53488 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53500 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53512 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53518 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53532 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53534 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53550 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53562 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53564 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53570 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53586 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53592 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53596 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53602 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53618 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53626 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53628 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53636 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53644 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53658 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53666 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53672 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53674 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53682 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53698 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53714 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53716 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53718 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53730 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53736 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53752 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53758 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53774 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53786 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53790 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53806 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53810 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53822 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53828 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53838 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53850 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53864 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53870 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53876 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53880 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53888 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53904 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53912 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53922 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53936 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53946 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53960 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53970 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53978 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53982 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:53990 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54002 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54008 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54024 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54028 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54034 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54046 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54052 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54056 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54058 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54064 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54080 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54092 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54104 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54114 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54122 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54124 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54132 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54146 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54158 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54164 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54168 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54174 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54180 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54196 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54206 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54216 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54228 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54238 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54254 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54260 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54262 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54264 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54276 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54278 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54288 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54302 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54318 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54320 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54322 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54328 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54330 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54332 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54346 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54350 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54356 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54368 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54380 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54390 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54400 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54402 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54418 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54428 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54436 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54452 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54454 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54456 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54462 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54476 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54480 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54494 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54496 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54498 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54504 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54516 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54518 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54530 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54538 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54540 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54552 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54562 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54576 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54590 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54594 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54598 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54610 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54622 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54638 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54652 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54658 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54660 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54674 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54684 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54692 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54702 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54716 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54722 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54726 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54736 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54738 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54742 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54752 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54754 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54756 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54764 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54776 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54778 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54786 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54788 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54798 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54812 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54824 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54828 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54834 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54850 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54854 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54860 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54862 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54868 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54884 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54896 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54904 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54916 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54930 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54944 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54958 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54966 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54982 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:54996 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55006 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55016 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55020 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55030 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55042 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55058 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55066 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55072 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55082 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55098 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55102 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55118 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55124 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55140 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55146 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55160 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55162 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55176 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55180 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55188 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55204 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55206 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55208 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55224 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55228 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55242 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55254 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55258 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55268 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55284 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55300 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55304 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55308 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55310 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55318 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55334 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55344 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55352 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55354 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55364 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55376 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55390 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55394 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55396 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55406 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55420 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55426 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55432 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55440 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55454 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55470 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55484 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55486 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55500 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55510 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55514 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55522 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55528 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55540 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55556 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55562 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55564 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55574 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55590 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55594 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55598 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55604 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55610 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55620 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55634 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55642 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55648 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55660 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55666 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55674 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55684 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55692 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55698 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55710 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55720 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55726 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55732 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55734 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55740 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55750 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55766 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55780 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55790 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55798 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55804 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55810 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55822 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55828 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55838 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55846 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55862 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55878 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55892 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55894 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55900 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55906 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55910 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55918 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55926 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55938 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55940 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55944 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55954 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55956 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55964 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55970 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55986 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:55992 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56004 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56014 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56016 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56032 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56040 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56056 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56058 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56066 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56080 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56096 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56110 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56120 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56134 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56140 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56150 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56152 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56168 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56172 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56176 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56190 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56206 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56214 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56218 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56228 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56240 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56242 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56248 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56250 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56252 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56256 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56262 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56278 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56282 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56298 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56310 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56318 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56330 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56334 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56336 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56342 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56346 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56354 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56356 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56362 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56370 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56384 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56396 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56412 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56418 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56428 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56444 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56460 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56462 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56472 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56482 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56496 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56506 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56516 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56530 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56536 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56552 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56558 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56568 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56578 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56592 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56602 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56610 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56618 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56626 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56628 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56630 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56632 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56642 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56654 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56660 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56668 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56682 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56690 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56692 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56700 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56714 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56718 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56724 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56734 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56738 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56748 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56752 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56760 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56766 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56782 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56790 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56792 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56798 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56812 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56828 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56844 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56848 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56850 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56862 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56866 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56878 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56880 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56894 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56900 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56912 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56928 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56940 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56942 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56948 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56954 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56968 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56970 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56986 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:56992 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57006 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57012 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57018 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57034 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57044 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57056 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57064 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57070 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57078 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57088 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57104 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57114 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57116 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57128 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57136 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57148 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57150 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57156 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57162 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57174 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57180 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57196 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57198 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57204 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57210 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57218 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57234 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57242 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57244 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57258 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57268 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57274 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57286 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57290 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57300 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57316 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57332 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57338 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57350 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57362 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57374 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57388 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57392 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57400 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57406 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57408 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57422 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57436 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57450 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57458 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57472 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57488 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57496 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57500 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57514 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57516 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57518 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57524 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57540 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57552 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57554 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57556 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57568 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57570 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57582 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57590 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57596 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57612 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57624 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57634 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57648 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57660 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57676 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57686 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57688 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57694 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57698 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57714 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57720 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57728 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57744 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57756 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57772 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57788 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57792 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57804 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57810 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57824 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57836 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57842 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57856 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57866 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57874 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57886 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57888 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57900 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57914 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57930 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57946 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57958 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57972 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57974 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:57990 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:58006 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:58016 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:58024 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:58028 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:58038 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:58050 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:58056 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:58064 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:58066 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:58074 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:58080 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:58088 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:58094 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:58110 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:58124 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO: 127.0.0.1:58136 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2733675) INFO 11-12 22:40:24 [loggers.py:221] Engine 000: Avg prompt throughput: 5938.7 tokens/s, Avg generation throughput: 86.6 tokens/s, Running: 39 reqs, Waiting: 985 reqs, GPU KV cache usage: 2.1%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:40:34 [loggers.py:221] Engine 000: Avg prompt throughput: 8192.1 tokens/s, Avg generation throughput: 26.5 tokens/s, Running: 79 reqs, Waiting: 945 reqs, GPU KV cache usage: 4.2%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:40:44 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 0.0 tokens/s, Running: 79 reqs, Waiting: 945 reqs, GPU KV cache usage: 4.2%, Prefix cache hit rate: 0.0% -(EngineCore_DP0 pid=2733848) INFO 11-12 22:40:45 [utils.py:397] Profiling for prefill_heavy phase finished -(APIServer pid=2733675) INFO 11-12 22:40:54 [loggers.py:221] Engine 000: Avg prompt throughput: 34405.1 tokens/s, Avg generation throughput: 329.7 tokens/s, Running: 247 reqs, Waiting: 777 reqs, GPU KV cache usage: 13.3%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:41:04 [loggers.py:221] Engine 000: Avg prompt throughput: 35225.6 tokens/s, Avg generation throughput: 718.6 tokens/s, Running: 419 reqs, Waiting: 605 reqs, GPU KV cache usage: 22.6%, Prefix cache hit rate: 0.0% -(EngineCore_DP0 pid=2733848) INFO 11-12 22:41:09 [utils.py:358] Starting profiling for decode_heavy phase -(EngineCore_DP0 pid=2733848) INFO 11-12 22:41:09 [utils.py:359] Batch composition stats: {'total_num_scheduled_tokens': 256, 'num_prefill_tokens': 0, 'num_decode_tokens': 512, 'padded_total_num_scheduled_tokens': 512, 'num_reqs': 512} -(APIServer pid=2733675) INFO 11-12 22:41:14 [loggers.py:221] Engine 000: Avg prompt throughput: 21094.6 tokens/s, Avg generation throughput: 1114.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 27.8%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:41:24 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 0.0 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 27.8%, Prefix cache hit rate: 0.0% -(EngineCore_DP0 pid=2733848) INFO 11-12 22:41:28 [utils.py:397] Profiling for decode_heavy phase finished -(APIServer pid=2733675) INFO 11-12 22:41:34 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5579.2 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 27.8%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:41:44 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10390.5 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 30.9%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:41:54 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10338.8 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 34.0%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:42:04 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10285.1 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 35.1%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:42:14 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10291.0 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 37.1%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:42:24 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10238.1 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 40.2%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:42:34 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10185.9 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 43.3%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:42:44 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10135.1 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 45.7%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:42:54 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10134.2 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 46.4%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:43:04 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10084.2 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 49.5%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:43:14 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8445.7 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 52.6%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:43:24 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7679.7 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 52.6%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:43:34 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8448.2 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 55.6%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:43:44 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8394.7 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 58.7%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:43:54 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8394.0 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 58.7%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:44:04 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8345.2 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 61.8%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:44:14 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8259.0 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 63.9%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:44:24 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8343.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 64.9%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:44:34 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8289.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 68.0%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:44:44 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8241.3 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 68.9%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:44:54 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8191.5 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 71.1%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:45:04 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8188.7 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 74.2%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:45:14 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8190.5 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 74.2%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:45:24 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8138.4 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 77.3%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:45:34 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8089.5 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 79.5%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:45:44 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8089.5 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 80.4%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:45:54 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8087.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 83.5%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:46:04 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8036.0 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 83.8%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:46:14 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8036.4 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 86.6%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:46:24 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8034.2 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 89.7%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:46:34 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7983.4 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 89.7%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:46:44 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7933.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 92.7%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:46:54 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7934.3 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 93.7%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:47:04 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7933.4 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 95.8%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:47:14 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7880.3 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 98.9%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:47:24 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7883.3 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 98.9%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:47:34 [loggers.py:221] Engine 000: Avg prompt throughput: 26416.4 tokens/s, Avg generation throughput: 2387.5 tokens/s, Running: 502 reqs, Waiting: 373 reqs, GPU KV cache usage: 77.5%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:47:44 [loggers.py:221] Engine 000: Avg prompt throughput: 33176.0 tokens/s, Avg generation throughput: 1044.4 tokens/s, Running: 498 reqs, Waiting: 211 reqs, GPU KV cache usage: 54.3%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:47:54 [loggers.py:221] Engine 000: Avg prompt throughput: 35224.7 tokens/s, Avg generation throughput: 1090.2 tokens/s, Running: 496 reqs, Waiting: 41 reqs, GPU KV cache usage: 30.4%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:48:04 [loggers.py:221] Engine 000: Avg prompt throughput: 10034.3 tokens/s, Avg generation throughput: 7773.2 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 27.8%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:48:14 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10390.6 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 30.9%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:48:24 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10339.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 34.0%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:48:34 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10391.6 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 36.4%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:48:44 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10288.2 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 37.1%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:48:54 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10289.0 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 40.2%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:49:04 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10188.3 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 43.3%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:49:14 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10186.3 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 46.4%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:49:24 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10183.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 47.6%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:49:34 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 10083.9 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 49.5%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:49:44 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7881.9 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 52.6%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:49:54 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8036.2 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 53.6%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:50:04 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8393.8 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 55.6%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:50:14 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8445.8 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 58.7%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:50:24 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8395.7 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 58.9%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:50:34 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8343.2 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 61.8%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:50:44 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8342.6 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 64.9%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:50:54 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8292.0 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 64.9%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:51:04 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8291.7 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 68.0%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:51:14 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8240.3 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 70.2%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:51:24 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8241.2 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 71.1%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:51:34 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8189.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 74.2%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:51:44 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8189.4 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 74.9%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:51:54 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8138.4 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 77.3%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:52:04 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8136.9 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 80.4%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:52:14 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8088.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 80.4%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:52:24 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8087.2 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 83.5%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:52:34 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8038.6 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 85.3%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:52:44 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8038.8 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 86.6%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:52:54 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 8035.7 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 89.7%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:53:04 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7986.5 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 89.7%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:53:14 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7982.5 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 92.7%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:53:24 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7935.4 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 95.2%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:53:34 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7935.9 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 95.8%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:53:44 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7885.0 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 98.9%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:53:54 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 7925.2 tokens/s, Running: 477 reqs, Waiting: 0 reqs, GPU KV cache usage: 92.2%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:54:04 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 1488.2 tokens/s, Running: 0 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.0%, Prefix cache hit rate: 0.0% -(APIServer pid=2733675) INFO 11-12 22:54:14 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 0.0 tokens/s, Running: 0 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.0%, Prefix cache hit rate: 0.0% diff --git a/oss_log_attn_dp.txt b/oss_log_attn_dp.txt deleted file mode 100644 index 7672ef726..000000000 --- a/oss_log_attn_dp.txt +++ /dev/null @@ -1,2564 +0,0 @@ -INFO 11-13 00:09:36 [__init__.py:26] TPU info: node_name=cuiq-infer-v7-2 | tpu_type=tpu7x-8 | worker_id=0 | num_chips=8 | num_cores_per_chip=2 -INFO 11-13 00:09:36 [importing.py:44] Triton is installed but 0 active driver(s) found (expected 1). Disabling Triton to prevent runtime errors. -INFO 11-13 00:09:36 [importing.py:68] Triton not installed or not compatible; certain GPU-related functions will not be available. -WARNING 11-13 00:09:36 [interface.py:197] Failed to import from vllm._C: ModuleNotFoundError("No module named 'vllm._C'") -(APIServer pid=2993839) INFO 11-13 00:09:37 [api_server.py:1897] vLLM API server version 0.11.1rc7.dev48+gdf4d3a44a -(APIServer pid=2993839) INFO 11-13 00:09:37 [utils.py:253] non-default args: {'model_tag': 'unsloth/gpt-oss-120b-BF16', 'model': 'unsloth/gpt-oss-120b-BF16', 'max_model_len': 8192, 'download_dir': '/mnt/disks/persist', 'tensor_parallel_size': 8, 'gpu_memory_utilization': 0.95, 'enable_prefix_caching': False, 'max_num_batched_tokens': 8192, 'max_num_seqs': 256, 'async_scheduling': True, 'additional_config': {'sharding': {'sharding_strategy': {'enable_dp_attention': 1}}}} -(APIServer pid=2993839) INFO 11-13 00:09:37 [model.py:630] Resolved architecture: GptOssForCausalLM -(APIServer pid=2993839) INFO 11-13 00:09:37 [model.py:1728] Using max model len 8192 -(APIServer pid=2993839) INFO 11-13 00:09:37 [scheduler.py:254] Chunked prefill is enabled with max_num_batched_tokens=8192. -(APIServer pid=2993839) INFO 11-13 00:09:37 [config.py:272] Overriding max cuda graph capture size to 1024 for performance. -(APIServer pid=2993839) INFO 11-13 00:09:37 [tpu_jax.py:118] Initialized sharding configuration: ShardingConfigManager(total_devices=8, sharding_strategy=ShardingStrategy(tensor_parallelism=4, expert_parallelism=1, sequence_parallelism=1, data_parallelism=1, attention_data_parallelism=2), device_indexes=None) -(APIServer pid=2993839) WARNING 11-13 00:09:37 [tpu_jax.py:156] The model dtype is not properly set for JAX backend. Overwriting it to jnp.bfloat16 -(APIServer pid=2993839) INFO 11-13 00:09:37 [tpu_jax.py:192] Force using UniProcExecutor for JAX on single host. -INFO 11-13 00:09:41 [__init__.py:26] TPU info: node_name=cuiq-infer-v7-2 | tpu_type=tpu7x-8 | worker_id=0 | num_chips=8 | num_cores_per_chip=2 -INFO 11-13 00:09:41 [importing.py:44] Triton is installed but 0 active driver(s) found (expected 1). Disabling Triton to prevent runtime errors. -INFO 11-13 00:09:41 [importing.py:68] Triton not installed or not compatible; certain GPU-related functions will not be available. -WARNING 11-13 00:09:41 [interface.py:197] Failed to import from vllm._C: ModuleNotFoundError("No module named 'vllm._C'") -(EngineCore_DP0 pid=2993997) INFO 11-13 00:09:42 [core.py:94] Initializing a V1 LLM engine (v0.11.1rc7.dev48+gdf4d3a44a) with config: model='unsloth/gpt-oss-120b-BF16', speculative_config=None, tokenizer='unsloth/gpt-oss-120b-BF16', skip_tokenizer_init=False, tokenizer_mode=auto, revision=None, tokenizer_revision=None, trust_remote_code=False, dtype=torch.bfloat16, max_seq_len=8192, download_dir='/mnt/disks/persist', load_format=auto, tensor_parallel_size=8, pipeline_parallel_size=1, data_parallel_size=1, disable_custom_all_reduce=True, quantization=None, enforce_eager=False, kv_cache_dtype=auto, device_config=None, structured_outputs_config=StructuredOutputsConfig(backend='auto', disable_fallback=False, disable_any_whitespace=False, disable_additional_properties=False, reasoning_parser='openai_gptoss', reasoning_parser_plugin='', enable_in_reasoning=False), observability_config=ObservabilityConfig(show_hidden_metrics_for_version=None, otlp_traces_endpoint=None, collect_detailed_traces=None), seed=0, served_model_name=unsloth/gpt-oss-120b-BF16, enable_prefix_caching=False, chunked_prefill_enabled=True, pooler_config=None, compilation_config={'level': None, 'mode': 2, 'debug_dump_path': None, 'cache_dir': '', 'compile_cache_save_format': 'binary', 'backend': 'openxla', 'custom_ops': ['all'], 'splitting_ops': None, 'compile_mm_encoder': True, 'use_inductor': None, 'compile_sizes': None, 'inductor_compile_config': {'enable_auto_functionalized_v2': False}, 'inductor_passes': {}, 'cudagraph_mode': , 'use_cudagraph': True, 'cudagraph_num_of_warmups': 0, 'cudagraph_capture_sizes': None, 'cudagraph_copy_inputs': False, 'full_cuda_graph': False, 'cudagraph_specialize_lora': True, 'use_inductor_graph_partition': False, 'pass_config': {}, 'max_cudagraph_capture_size': 1024, 'local_cache_dir': None} -(EngineCore_DP0 pid=2993997) WARNING 11-13 00:09:43 [tpu_jax.py:228] Pin memory is not supported on TPU. -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -(EngineCore_DP0 pid=2993997) INFO 11-13 00:09:48 [parallel_state.py:1325] rank 0 in world size 1 is assigned as DP rank 0, PP rank 0, TP rank 0, EP rank 0 -(EngineCore_DP0 pid=2993997) INFO 11-13 00:09:48 [tpu_jax_runner.py:278] Creating new model mesh | devices=8, num_slices=1 -(EngineCore_DP0 pid=2993997) INFO 11-13 00:09:48 [tpu_jax_runner.py:273] Init mesh | mesh=Mesh('data': 1, 'attn_dp': 2, 'expert': 1, 'model': 4, axis_types=(Auto, Auto, Auto, Auto)) -(EngineCore_DP0 pid=2993997) INFO 11-13 00:09:48 [utils.py:314] Phased-based profiler enabled. Traces will be saved to: gs://wenxindong-vm/trace/gpt_oss/dp2/attn_dp -(EngineCore_DP0 pid=2993997) INFO 11-13 00:09:48 [utils.py:93] Prepared token paddings: [16, 32, 64, 128, 256, 512, 1024, 2048, 4096, 8192, 16384] -(EngineCore_DP0 pid=2993997) INFO 11-13 00:09:48 [utils.py:59] Prepared request paddings: [8, 16, 32, 64, 128, 256, 512] -(EngineCore_DP0 pid=2993997) INFO 11-13 00:09:48 [compilation_manager.py:34] Enabling JAX compile cache. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:09:48 [tpu_worker_jax.py:152] Init worker | rank=0 | node_id=0 | is_driver_worker=True | hbm=[(0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75)]GiB -(EngineCore_DP0 pid=2993997) INFO 11-13 00:09:48 [model_loader.py:318] Loading model with MODEL_IMPL_TYPE=vllm -(EngineCore_DP0 pid=2993997) WARNING 11-13 00:09:49 [rocm.py:34] Failed to import from amdsmi with ModuleNotFoundError("No module named 'amdsmi'") -(EngineCore_DP0 pid=2993997) WARNING 11-13 00:09:49 [rocm.py:39] Failed to import from vllm._C with ModuleNotFoundError("No module named 'vllm._C'") -(EngineCore_DP0 pid=2993997) WARNING 11-13 00:09:49 [rocm.py:45] Failed to import from vllm._rocm_C with ModuleNotFoundError("No module named 'vllm._rocm_C'") -(EngineCore_DP0 pid=2993997) WARNING 11-13 00:09:49 [registry.py:171] _Backend has been renamed to AttentionBackendEnum. Please update your code to use AttentionBackendEnum instead. _Backend will be removed in a future release. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:09:49 [tpu_jax.py:63] Cannot use None backend on TPU. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:09:49 [tpu_jax.py:66] Using Pallas V1 backend. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:09:49 [layer.py:331] Disabling MoE shared_experts cuda stream -(EngineCore_DP0 pid=2993997) Loading safetensors checkpoint shards: 0% Completed | 0/73 [00:00 {'num_tokens': 16} -(EngineCore_DP0 pid=2993997) /mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torchax/tensor.py:154: UserWarning: Explicitly requested dtype int64 requested in astype is not available, and will be truncated to dtype int32. To enable more dtypes, set the jax_enable_x64 configuration option or the JAX_ENABLE_X64 shell environment variable. See https://github.com/jax-ml/jax#current-gotchas for more. -(EngineCore_DP0 pid=2993997) res = jax_function(self._elem, *args, **kwargs) -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) INFO 11-13 00:11:33 [compilation_manager.py:67] Compilation finished in 11.81 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:11:33 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 32} -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:34] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) INFO 11-13 00:11:45 [compilation_manager.py:67] Compilation finished in 12.65 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:11:45 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 64} -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:11:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) INFO 11-13 00:12:03 [compilation_manager.py:67] Compilation finished in 17.07 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:12:03 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 128} -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:03] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) INFO 11-13 00:12:21 [compilation_manager.py:67] Compilation finished in 18.33 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:12:21 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 256} -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:22] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) INFO 11-13 00:12:41 [compilation_manager.py:67] Compilation finished in 19.49 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:12:41 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 512} -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:41] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:12:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) INFO 11-13 00:13:06 [compilation_manager.py:67] Compilation finished in 25.35 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:13:06 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 1024} -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:07] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) INFO 11-13 00:13:31 [compilation_manager.py:67] Compilation finished in 24.97 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:13:31 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 2048} -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:32] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:13:33] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) INFO 11-13 00:14:05 [compilation_manager.py:67] Compilation finished in 33.67 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:14:05 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 4096} -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) INFO 11-13 00:14:42 [compilation_manager.py:67] Compilation finished in 36.63 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:14:42 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 8192} -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:42] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:14:43] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) INFO 11-13 00:15:19 [compilation_manager.py:67] Compilation finished in 37.42 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:15:19 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 16384} -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:19] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:19] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:20] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) [2025-11-13 00:15:21] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:17 [compilation_manager.py:67] Compilation finished in 57.90 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:17 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 8} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:17 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:17 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 16} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:18 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:18 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 32} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:18 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:18 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 64} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:18 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:18 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 128} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:18 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:18 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 256} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:18 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:18 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 512} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:18 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:18 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 8} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:18 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:18 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 16} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:19 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:19 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 32} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:19 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:19 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 64} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:19 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:19 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 128} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:19 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:19 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 256} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:19 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:19 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 512} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:19 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:19 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 8} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:19 [compilation_manager.py:67] Compilation finished in 0.16 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:19 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 16} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:20 [compilation_manager.py:67] Compilation finished in 0.16 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 32} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:20 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 64} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:20 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 128} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:20 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 256} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:20 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 512} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:20 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 8} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:20 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 16} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:21 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:21 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 32} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:21 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:21 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 64} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:21 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:21 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 128} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:21 [compilation_manager.py:67] Compilation finished in 0.16 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:21 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 256} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:21 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:21 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 512} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:22 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:22 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 8} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:22 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:22 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 16} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:22 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:22 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 32} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:22 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:22 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 64} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:22 [compilation_manager.py:67] Compilation finished in 0.23 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:22 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 128} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:22 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:22 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 256} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:23 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:23 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 512} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:23 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:23 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 8} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:23 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:23 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 16} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:23 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:23 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 32} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:23 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:23 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 64} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:24 [compilation_manager.py:67] Compilation finished in 0.21 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:24 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 128} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:24 [compilation_manager.py:67] Compilation finished in 0.32 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:24 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 256} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:24 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:24 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 512} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:24 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:24 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 8} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:24 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:24 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 16} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:25 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:25 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 32} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:25 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:25 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 64} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:25 [compilation_manager.py:67] Compilation finished in 0.22 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:25 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 128} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:25 [compilation_manager.py:67] Compilation finished in 0.31 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:25 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 256} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:26 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:26 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 512} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:26 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:26 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 8} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:26 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:26 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 16} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:26 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:26 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 32} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:26 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:26 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 64} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:27 [compilation_manager.py:67] Compilation finished in 0.22 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:27 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 128} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:27 [compilation_manager.py:67] Compilation finished in 0.30 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:27 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 256} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:27 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:27 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 512} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:27 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:27 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 8} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:27 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:27 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 16} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:28 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:28 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 32} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:28 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:28 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 64} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:28 [compilation_manager.py:67] Compilation finished in 0.22 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:28 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 128} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:28 [compilation_manager.py:67] Compilation finished in 0.30 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:28 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 256} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:28 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:28 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 512} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:29 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:29 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 8} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:29 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:29 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 16} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:29 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:29 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 32} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:29 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:29 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 64} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:29 [compilation_manager.py:67] Compilation finished in 0.23 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:29 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 128} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:30 [compilation_manager.py:67] Compilation finished in 0.32 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:30 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 256} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:30 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:30 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 512} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:30 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:30 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 8} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:30 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:30 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 16} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:31 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:31 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 32} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:31 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:31 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 64} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:31 [compilation_manager.py:67] Compilation finished in 0.22 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:31 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 128} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:31 [compilation_manager.py:67] Compilation finished in 0.30 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:31 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 256} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:31 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:31 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16384, 'num_reqs': 512} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:32 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:32 [compilation_manager.py:325] Compiling select_from_array with different input shapes. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:32 [compilation_manager.py:304] Compiling select_from_array for select all logits. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:32 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16, 'index_size': 8} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:32 [compilation_manager.py:67] Compilation finished in 0.08 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:32 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16, 'index_size': 16} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:32 [compilation_manager.py:67] Compilation finished in 0.09 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:32 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 32, 'index_size': 8} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:32 [compilation_manager.py:67] Compilation finished in 0.09 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:32 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 32, 'index_size': 16} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:32 [compilation_manager.py:67] Compilation finished in 0.09 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:32 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 32, 'index_size': 32} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:32 [compilation_manager.py:67] Compilation finished in 0.10 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:32 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 64, 'index_size': 8} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:33 [compilation_manager.py:67] Compilation finished in 0.09 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:33 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 64, 'index_size': 16} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:33 [compilation_manager.py:67] Compilation finished in 0.10 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:33 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 64, 'index_size': 32} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:33 [compilation_manager.py:67] Compilation finished in 0.11 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:33 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 64, 'index_size': 64} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:33 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:33 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 8} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:33 [compilation_manager.py:67] Compilation finished in 0.09 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:33 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 16} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:33 [compilation_manager.py:67] Compilation finished in 0.10 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:33 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 32} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:33 [compilation_manager.py:67] Compilation finished in 0.11 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:33 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 64} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:34 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:34 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 128} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:34 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:34 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 8} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:34 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:34 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 16} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:34 [compilation_manager.py:67] Compilation finished in 0.11 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:34 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 32} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:34 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:34 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 64} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:34 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:34 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 128} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:35 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:35 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 256} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:35 [compilation_manager.py:67] Compilation finished in 0.30 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:35 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 8} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:35 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:35 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 16} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:35 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:35 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 32} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:35 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:35 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 64} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:36 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:36 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 128} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:36 [compilation_manager.py:67] Compilation finished in 0.22 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:36 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 256} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:36 [compilation_manager.py:67] Compilation finished in 0.38 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:36 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 512} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:37 [compilation_manager.py:67] Compilation finished in 0.71 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:37 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 8} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:37 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:37 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 16} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:38 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:38 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 32} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:38 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:38 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 64} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:38 [compilation_manager.py:67] Compilation finished in 0.22 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:38 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 128} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:38 [compilation_manager.py:67] Compilation finished in 0.27 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:38 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 256} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:39 [compilation_manager.py:67] Compilation finished in 0.38 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:39 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 512} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:39 [compilation_manager.py:67] Compilation finished in 0.64 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:39 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 8} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:40 [compilation_manager.py:67] Compilation finished in 0.26 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:40 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 16} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:40 [compilation_manager.py:67] Compilation finished in 0.26 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:40 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 32} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:40 [compilation_manager.py:67] Compilation finished in 0.28 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:40 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 64} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:41 [compilation_manager.py:67] Compilation finished in 0.31 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:41 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 128} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:41 [compilation_manager.py:67] Compilation finished in 0.35 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:41 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 256} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:41 [compilation_manager.py:67] Compilation finished in 0.54 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:41 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 512} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:42 [compilation_manager.py:67] Compilation finished in 0.78 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:42 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 8} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:43 [compilation_manager.py:67] Compilation finished in 0.49 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:43 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 16} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:43 [compilation_manager.py:67] Compilation finished in 0.46 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:43 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 32} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:44 [compilation_manager.py:67] Compilation finished in 0.47 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:44 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 64} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:45 [compilation_manager.py:67] Compilation finished in 0.80 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:45 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 128} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:45 [compilation_manager.py:67] Compilation finished in 0.59 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:45 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 256} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:46 [compilation_manager.py:67] Compilation finished in 0.78 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:46 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 512} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:47 [compilation_manager.py:67] Compilation finished in 0.99 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:47 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 8} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:47 [compilation_manager.py:67] Compilation finished in 0.16 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:47 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 16} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:48 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:48 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 32} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:48 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:48 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 64} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:48 [compilation_manager.py:67] Compilation finished in 0.16 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:48 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 128} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:48 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:48 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 256} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:49 [compilation_manager.py:67] Compilation finished in 0.40 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:49 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 512} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:49 [compilation_manager.py:67] Compilation finished in 0.69 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:49 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 8} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:50 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:50 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 16} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:50 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:50 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 32} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:50 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:50 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 64} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:50 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:50 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 128} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:50 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:50 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 256} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:50 [compilation_manager.py:67] Compilation finished in 0.34 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:50 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16384, 'index_size': 512} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:51 [compilation_manager.py:67] Compilation finished in 0.59 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:51 [compilation_manager.py:365] Compiling compute_logits with different input shapes. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:51 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 8} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:52 [compilation_manager.py:67] Compilation finished in 1.01 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:52 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 16} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:53 [compilation_manager.py:67] Compilation finished in 1.10 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:53 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 32} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:54 [compilation_manager.py:67] Compilation finished in 1.00 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:54 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 64} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:55 [compilation_manager.py:67] Compilation finished in 0.94 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:55 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 128} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:56 [compilation_manager.py:67] Compilation finished in 1.02 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:56 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 256} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:58 [compilation_manager.py:67] Compilation finished in 1.72 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:16:58 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 512} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:00 [compilation_manager.py:67] Compilation finished in 2.15 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:00 [compilation_manager.py:387] Compiling sampling with different input shapes. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:01 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 8, 'do_sampling': True} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:04 [compilation_manager.py:67] Compilation finished in 3.50 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:04 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 8, 'do_sampling': False} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:04 [compilation_manager.py:67] Compilation finished in 0.24 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:05 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 16, 'do_sampling': True} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:08 [compilation_manager.py:67] Compilation finished in 3.43 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:08 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 16, 'do_sampling': False} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:09 [compilation_manager.py:67] Compilation finished in 0.22 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:09 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 32, 'do_sampling': True} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:12 [compilation_manager.py:67] Compilation finished in 2.58 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:12 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 32, 'do_sampling': False} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:12 [compilation_manager.py:67] Compilation finished in 0.38 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:13 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 64, 'do_sampling': True} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:16 [compilation_manager.py:67] Compilation finished in 3.50 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:16 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 64, 'do_sampling': False} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:17 [compilation_manager.py:67] Compilation finished in 0.77 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:18 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 128, 'do_sampling': True} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:22 [compilation_manager.py:67] Compilation finished in 3.94 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:22 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 128, 'do_sampling': False} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:27 [compilation_manager.py:67] Compilation finished in 5.03 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:27 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 256, 'do_sampling': True} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:30 [compilation_manager.py:67] Compilation finished in 3.08 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:30 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 256, 'do_sampling': False} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:30 [compilation_manager.py:67] Compilation finished in 0.27 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:30 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 512, 'do_sampling': True} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:33 [compilation_manager.py:67] Compilation finished in 2.88 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:33 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 512, 'do_sampling': False} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:34 [compilation_manager.py:67] Compilation finished in 0.43 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:34 [compilation_manager.py:455] Compiling gather_logprobs with different input shapes. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:34 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 8} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:34 [compilation_manager.py:67] Compilation finished in 0.75 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:34 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 16} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:35 [compilation_manager.py:67] Compilation finished in 0.70 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:35 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 32} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:37 [compilation_manager.py:67] Compilation finished in 1.98 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:37 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 64} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:39 [compilation_manager.py:67] Compilation finished in 2.00 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:39 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 128} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:41 [compilation_manager.py:67] Compilation finished in 1.93 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:41 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 256} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:43 [compilation_manager.py:67] Compilation finished in 2.01 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:43 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 512} -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:45 [compilation_manager.py:67] Compilation finished in 1.96 [secs]. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:45 [compilation_manager.py:751] Compiling structured_decoding with different input shapes. -(EngineCore_DP0 pid=2993997) WARNING 11-13 00:17:45 [compilation_manager.py:754] Structured decoding precompilation skipped since structured decoding is not supported with DP. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:45 [core.py:247] init engine (profile, create kv cache, warmup model) took 388.63 seconds -(EngineCore_DP0 pid=2993997) WARNING 11-13 00:17:46 [scheduler.py:158] Using custom scheduler class . This scheduler interface is not public and compatibility may not be maintained. -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:46 [dp_scheduler.py:93] DPScheduler (Async = True) per-rank limits: max_seqs=256, max_tokens=8192 -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:46 [core.py:181] Batch queue is enabled with size 2 -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:46 [tpu_jax.py:118] Initialized sharding configuration: ShardingConfigManager(total_devices=8, sharding_strategy=ShardingStrategy(tensor_parallelism=4, expert_parallelism=1, sequence_parallelism=1, data_parallelism=1, attention_data_parallelism=2), device_indexes=None) -(EngineCore_DP0 pid=2993997) WARNING 11-13 00:17:46 [tpu_jax.py:156] The model dtype is not properly set for JAX backend. Overwriting it to jnp.bfloat16 -(EngineCore_DP0 pid=2993997) INFO 11-13 00:17:46 [tpu_jax.py:192] Force using UniProcExecutor for JAX on single host. -(APIServer pid=2993839) [INFO] model_hosting_container_standards - decorators.py:76: [PING] Framework handler registered: ping -(APIServer pid=2993839) [2025-11-13 00:17:47] INFO decorators.py:76: [PING] Framework handler registered: ping -(APIServer pid=2993839) [INFO] model_hosting_container_standards.common.transforms.base_factory - base_factory.py:90: [INJECT_ADAPTER_ID] Transform decorator applied to: invocations -(APIServer pid=2993839) [2025-11-13 00:17:47] INFO base_factory.py:90: [INJECT_ADAPTER_ID] Transform decorator applied to: invocations -(APIServer pid=2993839) [INFO] model_hosting_container_standards.common.transforms.base_factory - base_factory.py:115: [INJECT_ADAPTER_ID] Registered transform handler for invocations -(APIServer pid=2993839) [2025-11-13 00:17:47] INFO base_factory.py:115: [INJECT_ADAPTER_ID] Registered transform handler for invocations -(APIServer pid=2993839) [INFO] model_hosting_container_standards.common.transforms.base_factory - base_factory.py:90: [STATEFUL_SESSION_MANAGER] Transform decorator applied to: decorated_func -(APIServer pid=2993839) [2025-11-13 00:17:47] INFO base_factory.py:90: [STATEFUL_SESSION_MANAGER] Transform decorator applied to: decorated_func -(APIServer pid=2993839) [INFO] model_hosting_container_standards.common.transforms.base_factory - base_factory.py:115: [STATEFUL_SESSION_MANAGER] Registered transform handler for decorated_func -(APIServer pid=2993839) [2025-11-13 00:17:47] INFO base_factory.py:115: [STATEFUL_SESSION_MANAGER] Registered transform handler for decorated_func -(APIServer pid=2993839) [INFO] model_hosting_container_standards - decorators.py:76: [INVOKE] Framework handler registered: decorated_func -(APIServer pid=2993839) [2025-11-13 00:17:47] INFO decorators.py:76: [INVOKE] Framework handler registered: decorated_func -(APIServer pid=2993839) [INFO] model_hosting_container_standards - __init__.py:127: Starting SageMaker bootstrap process -(APIServer pid=2993839) [2025-11-13 00:17:47] INFO __init__.py:127: Starting SageMaker bootstrap process -(APIServer pid=2993839) [INFO] model_hosting_container_standards - registry.py:109: [REGISTRY] Middleware resolution and registration complete -(APIServer pid=2993839) [2025-11-13 00:17:47] INFO registry.py:109: [REGISTRY] Middleware resolution and registration complete -(APIServer pid=2993839) [INFO] model_hosting_container_standards - core.py:100: [MIDDLEWARE_LOADER] Middleware stack rebuilt successfully -(APIServer pid=2993839) [2025-11-13 00:17:47] INFO core.py:100: [MIDDLEWARE_LOADER] Middleware stack rebuilt successfully -(APIServer pid=2993839) [INFO] model_hosting_container_standards - core.py:102: [MIDDLEWARE_LOADER] Processed 3 middlewares -(APIServer pid=2993839) [2025-11-13 00:17:47] INFO core.py:102: [MIDDLEWARE_LOADER] Processed 3 middlewares -(APIServer pid=2993839) [WARNING] model_hosting_container_standards.common.custom_code_ref_resolver.function_loader - function_loader.py:73: Failed to load function from spec 'model:custom_sagemaker_invocation_handler': HandlerFileNotFoundError: File '/opt/ml/model/model.py' not found in search paths: ['/opt/ml/model/'] -(APIServer pid=2993839) [2025-11-13 00:17:47] WARNING function_loader.py:73: Failed to load function from spec 'model:custom_sagemaker_invocation_handler': HandlerFileNotFoundError: File '/opt/ml/model/model.py' not found in search paths: ['/opt/ml/model/'] -(APIServer pid=2993839) [WARNING] model_hosting_container_standards.common.custom_code_ref_resolver.function_loader - function_loader.py:73: Failed to load function from spec 'model:custom_sagemaker_ping_handler': HandlerFileNotFoundError: File '/opt/ml/model/model.py' not found in search paths: ['/opt/ml/model/'] -(APIServer pid=2993839) [2025-11-13 00:17:47] WARNING function_loader.py:73: Failed to load function from spec 'model:custom_sagemaker_ping_handler': HandlerFileNotFoundError: File '/opt/ml/model/model.py' not found in search paths: ['/opt/ml/model/'] -(APIServer pid=2993839) [INFO] model_hosting_container_standards.sagemaker.sagemaker_router - sagemaker_router.py:93: Creating SageMaker router with unified route resolver -(APIServer pid=2993839) [2025-11-13 00:17:47] INFO sagemaker_router.py:93: Creating SageMaker router with unified route resolver -(APIServer pid=2993839) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:172: Creating router with prefix='', tags=['sagemaker'] -(APIServer pid=2993839) [2025-11-13 00:17:47] INFO routing.py:172: Creating router with prefix='', tags=['sagemaker'] -(APIServer pid=2993839) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:110: Mounting 2 handlers to router -(APIServer pid=2993839) [2025-11-13 00:17:47] INFO routing.py:110: Mounting 2 handlers to router -(APIServer pid=2993839) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:184: Router created with 0 routes -(APIServer pid=2993839) [2025-11-13 00:17:47] INFO routing.py:184: Router created with 0 routes -(APIServer pid=2993839) [INFO] model_hosting_container_standards.sagemaker.sagemaker_router - sagemaker_router.py:101: SageMaker router created successfully with 0 routes -(APIServer pid=2993839) [2025-11-13 00:17:47] INFO sagemaker_router.py:101: SageMaker router created successfully with 0 routes -(APIServer pid=2993839) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:287: Including router with conflict detection -(APIServer pid=2993839) [2025-11-13 00:17:47] INFO routing.py:287: Including router with conflict detection -(APIServer pid=2993839) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:305: Successfully included router with 0 routes -(APIServer pid=2993839) [2025-11-13 00:17:47] INFO routing.py:305: Successfully included router with 0 routes -(APIServer pid=2993839) [INFO] model_hosting_container_standards - __init__.py:139: SageMaker bootstrap completed successfully -(APIServer pid=2993839) [2025-11-13 00:17:47] INFO __init__.py:139: SageMaker bootstrap completed successfully -(APIServer pid=2993839) INFO 11-13 00:17:47 [api_server.py:1662] Supported tasks: ['generate'] -(APIServer pid=2993839) WARNING 11-13 00:17:47 [serving_responses.py:189] For gpt-oss, we ignore --enable-auto-tool-choice and always enable tool use. -(APIServer pid=2993839) INFO 11-13 00:17:47 [api_server.py:1972] Starting vLLM API server 0 on http://0.0.0.0:8000 -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:38] Available routes are: -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /openapi.json, Methods: GET, HEAD -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /docs, Methods: GET, HEAD -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /docs/oauth2-redirect, Methods: GET, HEAD -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /redoc, Methods: GET, HEAD -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /health, Methods: GET -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /load, Methods: GET -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /tokenize, Methods: POST -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /detokenize, Methods: POST -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /v1/models, Methods: GET -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /version, Methods: GET -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /v1/responses, Methods: POST -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /v1/responses/{response_id}, Methods: GET -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /v1/responses/{response_id}/cancel, Methods: POST -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /v1/messages, Methods: POST -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /v1/chat/completions, Methods: POST -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /v1/completions, Methods: POST -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /v1/embeddings, Methods: POST -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /pooling, Methods: POST -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /classify, Methods: POST -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /score, Methods: POST -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /v1/score, Methods: POST -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /v1/audio/transcriptions, Methods: POST -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /v1/audio/translations, Methods: POST -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /rerank, Methods: POST -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /v1/rerank, Methods: POST -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /v2/rerank, Methods: POST -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /scale_elastic_ep, Methods: POST -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /is_scaling_elastic_ep, Methods: POST -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /ping, Methods: GET -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /ping, Methods: POST -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /invocations, Methods: POST -(APIServer pid=2993839) INFO 11-13 00:17:47 [launcher.py:46] Route: /metrics, Methods: GET -(APIServer pid=2993839) INFO: Started server process [2993839] -(APIServer pid=2993839) INFO: Waiting for application startup. -(APIServer pid=2993839) INFO: Application startup complete. -(APIServer pid=2993839) INFO: 127.0.0.1:36276 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO 11-13 01:08:57 [loggers.py:221] Engine 000: Avg prompt throughput: 204.8 tokens/s, Avg generation throughput: 0.3 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.0%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:09:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 40.6 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.0%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:09:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 40.6 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.0%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:09:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 40.6 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.0%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:09:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 40.5 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:09:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 40.5 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:09:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 40.3 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:10:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 40.4 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:10:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 40.4 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:10:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 40.4 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:10:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 40.4 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:10:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 40.4 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:10:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 40.4 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:11:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 40.4 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:11:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 40.4 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:11:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 40.4 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% -(EngineCore_DP0 pid=2993997) WARNING 11-13 01:11:29 [tpu_jax_runner.py:666] Should not schedule a request that does nothing! -(APIServer pid=2993839) INFO: 127.0.0.1:36276 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54022 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54036 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54038 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54042 - "POST /v1/completions HTTP/1.1" 200 OK -(EngineCore_DP0 pid=2993997) INFO 11-13 01:11:30 [utils.py:358] Starting profiling for prefill_heavy phase -(EngineCore_DP0 pid=2993997) INFO 11-13 01:11:30 [utils.py:359] Batch composition stats: {'total_num_scheduled_tokens': 6144, 'num_prefill_tokens': 8192, 'num_decode_tokens': 1, 'padded_total_num_scheduled_tokens': 16384, 'num_reqs': 5} -(APIServer pid=2993839) INFO: 127.0.0.1:54052 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54060 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54062 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54064 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54068 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54076 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54088 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54094 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54104 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54116 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54124 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54138 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54142 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54156 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54172 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54176 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54188 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54190 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54192 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54200 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54210 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54220 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54232 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54246 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54252 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54254 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54258 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54272 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54274 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54288 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54302 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54312 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54316 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54332 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54342 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54354 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54358 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54374 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54378 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54390 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54406 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54418 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54434 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54448 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54456 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54470 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54474 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54490 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54502 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54518 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54534 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54536 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54542 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54558 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54560 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54570 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54574 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54582 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54594 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54602 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54610 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54622 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54632 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54646 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54658 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54672 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54686 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54702 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54704 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54708 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54718 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54726 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54740 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54754 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54760 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54768 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54784 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54796 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54798 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54810 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54814 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54822 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54838 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54850 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54862 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54874 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54878 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54890 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54906 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54912 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54928 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54940 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54948 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54964 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54978 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54980 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54986 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54988 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:54992 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55000 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55004 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55018 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55034 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55048 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55050 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55066 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55072 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55082 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55098 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55104 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55108 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55112 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55120 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55128 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55140 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55150 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55156 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55160 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55162 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55176 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55186 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55196 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55200 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55210 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55226 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55230 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55240 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55252 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55262 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55278 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55280 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55296 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55302 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55308 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55314 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55324 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55330 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55340 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55348 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55350 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55362 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55378 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55390 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55402 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55414 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55424 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55440 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55452 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55458 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55470 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55480 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55484 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55490 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55500 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55516 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55518 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55532 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55546 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55554 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55568 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55584 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55586 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55598 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55614 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55616 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55620 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55628 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55632 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55640 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55656 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55660 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55676 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55678 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55682 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55692 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55694 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55696 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55708 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55714 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55720 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55726 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55736 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55746 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55760 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55764 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55780 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55788 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55798 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55800 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55814 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55818 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55832 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55834 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55840 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55846 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55862 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55868 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55876 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55890 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55906 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55914 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55920 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55932 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55944 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55956 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55970 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55972 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55978 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:55992 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56008 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56010 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56022 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56036 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56044 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56058 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56068 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56070 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56076 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56080 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56096 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56108 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56114 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56130 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56146 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56160 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56172 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56186 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56192 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56202 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56216 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56222 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56234 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56238 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56240 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56254 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56258 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56262 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56272 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56286 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56296 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56304 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56306 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56320 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56334 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56340 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56356 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56368 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56378 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56390 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56400 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56406 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56416 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56420 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56426 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56430 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56442 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56454 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56456 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56472 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56488 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56498 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56500 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56504 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56512 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56526 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56542 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56548 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56558 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56568 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56576 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56578 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56594 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56600 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56602 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56610 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56620 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56630 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56640 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56642 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56654 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56666 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56676 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56684 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56692 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56700 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56716 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56724 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56736 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56750 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56754 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56766 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56776 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56784 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56790 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56794 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56796 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56800 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56812 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56820 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56828 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56840 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56846 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56858 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56874 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56890 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56896 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56910 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56924 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56938 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56946 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56948 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56952 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56960 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56968 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56970 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56974 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56990 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:56994 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57002 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57016 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57020 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57034 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57050 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57056 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57070 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57076 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57088 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57092 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57098 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57114 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57122 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57134 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57142 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57148 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57154 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57168 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57180 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57188 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57196 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57212 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57214 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57216 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57232 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57246 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57254 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57268 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57276 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57278 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57286 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57300 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57316 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57330 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57334 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57342 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57356 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57368 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57372 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57388 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57396 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57398 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57402 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57410 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57424 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57434 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57444 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57450 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57464 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57466 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57474 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57482 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57490 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57494 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57510 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57526 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57538 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57540 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57544 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57554 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57558 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57572 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57580 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57592 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57596 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57612 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57622 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57626 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57638 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57654 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57662 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57676 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57682 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57684 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57688 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57702 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57708 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57716 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57720 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57734 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57746 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57758 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57766 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57776 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57788 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57802 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57808 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57824 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57828 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57836 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57852 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57860 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57868 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57878 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57882 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57892 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57904 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57920 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57926 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57936 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57942 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57944 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57946 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57958 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57962 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57972 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57982 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57986 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57988 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:57998 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58006 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58010 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58022 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58038 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58050 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58054 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58068 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58070 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58074 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58084 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58100 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58102 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58110 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58116 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58120 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58124 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58138 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58140 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58150 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58154 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58170 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58184 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58186 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58188 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58196 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58204 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58206 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58214 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58216 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58224 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58234 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58248 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58256 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58268 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58278 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58292 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58298 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58312 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58314 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58320 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58334 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58338 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58348 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58364 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58370 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58372 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58388 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58402 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58418 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58424 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58428 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58442 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58454 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58466 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58482 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58494 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58510 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58518 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58520 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58534 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58550 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58554 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58562 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58576 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58580 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58582 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58592 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58594 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58606 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58608 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58618 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58622 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58636 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58652 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58660 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58668 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58674 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58684 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58696 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58710 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58724 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58734 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58748 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58760 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58762 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58766 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58776 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58786 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58798 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58802 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58804 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58806 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58812 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58826 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58828 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58830 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58842 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58846 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58854 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58868 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58874 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58890 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58900 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58914 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58922 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58924 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58932 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58934 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58940 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58948 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58950 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58952 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58964 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58972 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58974 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58980 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:58992 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59008 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59012 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59028 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59034 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59046 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59054 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59062 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59064 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59070 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59074 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59084 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59090 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59098 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59102 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59108 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59110 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59122 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59130 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59140 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59144 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59154 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59166 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59176 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59182 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59188 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59200 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59210 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59220 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59232 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59244 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59258 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59262 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59276 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59280 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59286 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59302 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59314 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59318 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59322 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59328 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59342 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59350 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59354 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59356 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59360 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59364 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59374 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59382 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59388 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59394 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59396 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59406 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59416 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59422 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59426 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59430 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59446 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59458 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59468 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59478 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59490 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59498 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59502 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59510 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59518 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59526 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59542 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59552 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59554 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59558 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59574 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59584 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59590 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59596 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59608 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59616 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59630 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59634 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59646 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59660 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59674 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59686 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59694 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59702 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59710 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59722 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59724 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59726 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59740 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59754 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59758 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59774 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59784 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59788 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59804 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59806 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59818 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59820 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59822 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59832 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59840 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59854 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59868 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59874 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59876 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59878 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59892 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59896 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59910 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59918 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59928 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59944 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59950 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59954 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59968 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59970 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59984 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:59986 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60000 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60006 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60018 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60030 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60040 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60054 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60056 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60068 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60082 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60092 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60100 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60108 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60122 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60134 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60140 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60146 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60162 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60168 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60176 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60178 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60192 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60200 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60204 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60216 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60218 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60224 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60236 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60248 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60250 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60252 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60254 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60268 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60276 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60290 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60302 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60314 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60324 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60338 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60342 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60348 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60352 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60368 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60380 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60392 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60406 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60408 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60412 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60414 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60422 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60434 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60438 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60446 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60452 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60456 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60472 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60474 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60476 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60480 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60492 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60500 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60508 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60518 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60524 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60536 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60550 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60558 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60568 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60582 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60584 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60596 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60606 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60612 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60618 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60628 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60630 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60638 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60646 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60656 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60670 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60684 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60692 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60708 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60712 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60718 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60722 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60730 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60736 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60752 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60762 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60778 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60788 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60790 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60804 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60808 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60816 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60820 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60830 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60832 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60842 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60846 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60862 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60872 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60878 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60888 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60890 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60898 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60904 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60920 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60924 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60934 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60946 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60960 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60972 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60984 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:60990 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:32770 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:32774 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:32776 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:32784 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:32794 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:32802 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:32818 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:32822 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:32834 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:32848 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:32856 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:32868 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:32872 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:32882 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:32896 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:32908 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:32914 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:32920 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:32934 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:32942 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:32958 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:32960 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:32968 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:32972 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:32980 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:32996 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33010 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33012 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33018 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33024 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33040 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33048 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33058 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33072 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33082 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33088 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33102 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33112 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33122 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33126 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33142 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33152 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33154 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33162 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33178 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33188 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33194 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33202 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33218 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33234 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33244 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33256 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33264 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33278 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33290 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33294 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33310 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33320 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33326 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33338 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33348 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33354 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33356 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33358 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33362 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33378 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33380 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33382 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33398 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33406 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33408 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33418 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33422 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33438 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33440 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33452 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33462 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33478 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33490 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33494 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33508 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33512 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33522 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33538 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33548 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33560 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33566 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33572 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33580 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33590 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33592 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33598 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33602 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33618 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33634 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33642 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33644 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33648 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33662 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33676 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33686 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33690 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33692 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33694 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33700 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33702 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33716 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33728 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33744 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33748 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33764 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33770 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33776 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33784 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33794 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33802 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33812 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33816 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33820 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33834 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33848 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33852 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33862 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33878 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33886 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33888 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33892 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33894 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33902 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33908 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33912 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33914 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33916 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33922 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33934 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33950 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33952 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33954 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33964 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33968 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33976 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33980 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33984 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:33996 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34004 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34012 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34024 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34032 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34042 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34054 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34062 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34076 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34080 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34090 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34092 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34096 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34106 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34110 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34120 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34126 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34132 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34142 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34148 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34164 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34170 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34178 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34194 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34198 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34202 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34216 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34232 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34244 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34260 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34272 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34288 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34302 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34312 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34326 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34330 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34336 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34338 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34346 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34362 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34368 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34370 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34372 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34382 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34390 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34392 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34406 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34416 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34426 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34442 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34458 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34464 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34480 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34490 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34500 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34508 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34516 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34526 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34530 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34544 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34556 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34558 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34568 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34578 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34584 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34598 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34614 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34622 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34632 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34646 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34652 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34666 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34676 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34682 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34694 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34706 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34714 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34722 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34732 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34742 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34750 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34764 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34780 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34794 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34806 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34812 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34818 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34824 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34828 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34834 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34846 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34862 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34874 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34876 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34890 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34892 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34908 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO: 127.0.0.1:34916 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=2993839) INFO 11-13 01:11:37 [loggers.py:221] Engine 000: Avg prompt throughput: 3891.0 tokens/s, Avg generation throughput: 11.9 tokens/s, Running: 29 reqs, Waiting: 995 reqs, GPU KV cache usage: 0.9%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:11:47 [loggers.py:221] Engine 000: Avg prompt throughput: 1638.3 tokens/s, Avg generation throughput: 2.7 tokens/s, Running: 37 reqs, Waiting: 987 reqs, GPU KV cache usage: 1.2%, Prefix cache hit rate: 0.0% -(EngineCore_DP0 pid=2993997) INFO 11-13 01:11:56 [utils.py:397] Profiling for prefill_heavy phase finished -(APIServer pid=2993839) INFO 11-13 01:11:57 [loggers.py:221] Engine 000: Avg prompt throughput: 3276.6 tokens/s, Avg generation throughput: 7.8 tokens/s, Running: 53 reqs, Waiting: 971 reqs, GPU KV cache usage: 1.7%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:12:07 [loggers.py:221] Engine 000: Avg prompt throughput: 18023.0 tokens/s, Avg generation throughput: 100.1 tokens/s, Running: 141 reqs, Waiting: 883 reqs, GPU KV cache usage: 4.5%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:12:17 [loggers.py:221] Engine 000: Avg prompt throughput: 18023.9 tokens/s, Avg generation throughput: 196.9 tokens/s, Running: 229 reqs, Waiting: 795 reqs, GPU KV cache usage: 7.3%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:12:27 [loggers.py:221] Engine 000: Avg prompt throughput: 17611.2 tokens/s, Avg generation throughput: 292.4 tokens/s, Running: 315 reqs, Waiting: 709 reqs, GPU KV cache usage: 10.1%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:12:37 [loggers.py:221] Engine 000: Avg prompt throughput: 17613.0 tokens/s, Avg generation throughput: 387.5 tokens/s, Running: 401 reqs, Waiting: 623 reqs, GPU KV cache usage: 12.8%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:12:47 [loggers.py:221] Engine 000: Avg prompt throughput: 17612.1 tokens/s, Avg generation throughput: 481.9 tokens/s, Running: 487 reqs, Waiting: 537 reqs, GPU KV cache usage: 15.6%, Prefix cache hit rate: 0.0% -(EngineCore_DP0 pid=2993997) INFO 11-13 01:12:50 [utils.py:358] Starting profiling for decode_heavy phase -(EngineCore_DP0 pid=2993997) INFO 11-13 01:12:50 [utils.py:359] Batch composition stats: {'total_num_scheduled_tokens': 256, 'num_prefill_tokens': 0, 'num_decode_tokens': 512, 'padded_total_num_scheduled_tokens': 512, 'num_reqs': 512} -(APIServer pid=2993839) INFO 11-13 01:12:57 [loggers.py:221] Engine 000: Avg prompt throughput: 7168.2 tokens/s, Avg generation throughput: 454.8 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 16.4%, Prefix cache hit rate: 0.0% -(EngineCore_DP0 pid=2993997) INFO 11-13 01:13:06 [utils.py:397] Profiling for decode_heavy phase finished -(APIServer pid=2993839) INFO 11-13 01:13:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 716.5 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 16.4%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:13:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6073.4 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 16.4%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:13:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6194.0 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 18.3%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:13:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6092.7 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 18.3%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:13:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6090.0 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 19.7%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:13:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6143.8 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 20.1%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:14:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6091.2 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 21.0%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:14:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6141.7 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 21.9%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:14:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6144.2 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 22.4%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:14:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6194.4 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 23.7%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:14:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6193.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 23.8%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:14:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6193.5 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 25.6%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:15:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6141.7 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 25.6%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:15:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6192.7 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 27.4%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:15:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6142.4 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 27.4%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:15:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6141.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 29.2%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:15:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6143.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 29.2%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:15:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5631.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 31.0%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:16:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 4709.1 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 31.0%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:16:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 4659.3 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 31.0%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:16:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5373.2 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 32.9%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:16:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5528.3 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 32.9%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:16:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5528.2 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 34.5%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:16:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5478.4 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 34.7%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:17:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5528.1 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 35.2%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:17:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5579.0 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 36.5%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:17:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5577.8 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 36.5%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:17:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5478.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 38.3%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:17:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5476.8 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 38.3%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:17:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5527.4 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 39.6%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:18:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5476.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 40.2%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:18:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5528.3 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 40.3%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:18:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5476.7 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 42.0%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:18:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5477.0 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 42.0%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:18:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5478.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 43.8%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:18:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5477.3 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 43.8%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:19:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5478.3 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 44.6%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:19:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5477.1 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 45.6%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:19:28 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5425.5 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 45.6%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:19:38 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5478.0 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 47.5%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:19:48 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5427.0 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 47.5%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:19:58 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5425.7 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 48.8%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:20:08 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5425.4 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 49.3%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:20:18 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5375.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 49.4%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:20:28 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5425.4 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 51.1%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:20:38 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5425.4 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 51.1%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:20:48 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5426.1 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 52.9%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:20:58 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5376.1 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 53.0%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:21:08 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5425.9 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 53.5%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:21:18 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5375.6 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 54.8%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:21:28 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5427.2 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 54.8%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:21:38 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5424.0 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 56.6%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:21:48 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5376.1 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 56.6%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:21:58 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5323.3 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 57.5%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:22:08 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5375.9 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 58.4%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:22:18 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5424.8 tokens/s, Running: 512 reqs, Waiting: 512 reqs, GPU KV cache usage: 58.4%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:22:28 [loggers.py:221] Engine 000: Avg prompt throughput: 13310.5 tokens/s, Avg generation throughput: 1066.2 tokens/s, Running: 504 reqs, Waiting: 437 reqs, GPU KV cache usage: 51.3%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:22:38 [loggers.py:221] Engine 000: Avg prompt throughput: 15564.4 tokens/s, Avg generation throughput: 500.0 tokens/s, Running: 500 reqs, Waiting: 361 reqs, GPU KV cache usage: 44.6%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:22:48 [loggers.py:221] Engine 000: Avg prompt throughput: 17611.5 tokens/s, Avg generation throughput: 547.0 tokens/s, Running: 498 reqs, Waiting: 275 reqs, GPU KV cache usage: 37.3%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:22:58 [loggers.py:221] Engine 000: Avg prompt throughput: 17612.2 tokens/s, Avg generation throughput: 546.3 tokens/s, Running: 498 reqs, Waiting: 189 reqs, GPU KV cache usage: 30.3%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:23:08 [loggers.py:221] Engine 000: Avg prompt throughput: 17612.0 tokens/s, Avg generation throughput: 545.2 tokens/s, Running: 496 reqs, Waiting: 105 reqs, GPU KV cache usage: 23.2%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:23:18 [loggers.py:221] Engine 000: Avg prompt throughput: 17202.6 tokens/s, Avg generation throughput: 544.4 tokens/s, Running: 496 reqs, Waiting: 19 reqs, GPU KV cache usage: 16.1%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:23:28 [loggers.py:221] Engine 000: Avg prompt throughput: 5937.7 tokens/s, Avg generation throughput: 4500.8 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 16.4%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:23:38 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6142.3 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 16.8%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:23:48 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6092.3 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 18.3%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:23:58 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6092.8 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 18.3%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:24:08 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6142.5 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 20.1%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:24:18 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6092.0 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 20.1%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:24:28 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6141.4 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 21.9%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:24:38 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6091.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 21.9%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:24:48 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6193.5 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 23.7%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:24:58 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6142.5 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 23.7%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:25:08 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6193.2 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 25.6%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:25:18 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6142.4 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 25.6%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:25:28 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6143.8 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 27.0%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:25:38 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6193.6 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 27.4%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:25:48 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6143.8 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 28.4%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:25:58 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6143.8 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 29.2%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:26:08 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6092.7 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 29.8%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:26:18 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 4914.9 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 31.0%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:26:28 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 4709.2 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 31.0%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:26:38 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 4863.7 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 32.4%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:26:48 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5580.5 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 32.9%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:26:58 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5528.0 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 33.1%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:27:08 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5478.3 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 34.7%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:27:18 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5529.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 34.7%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:27:28 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5529.3 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 36.5%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:27:38 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5578.2 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 36.5%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:27:48 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5528.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 37.5%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:27:58 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5427.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 38.3%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:28:08 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5527.8 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 38.3%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:28:18 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5478.0 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 40.2%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:28:28 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5529.3 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 40.2%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:28:38 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5478.8 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 41.8%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:28:48 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5477.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 42.0%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:28:58 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5427.5 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 42.5%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:29:08 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5478.3 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 43.8%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:29:18 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5478.4 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 43.8%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:29:28 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5427.4 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 45.6%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:29:38 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5426.7 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 45.6%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:29:48 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5476.5 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 46.7%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:29:58 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5427.3 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 47.5%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:30:08 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5427.2 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 47.5%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:30:18 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5424.8 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 49.3%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:30:28 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5376.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 49.3%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:30:38 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5375.7 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 50.8%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:30:48 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5427.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 51.1%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:30:58 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5374.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 51.4%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:31:08 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5374.6 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 53.0%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:31:18 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5375.7 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 53.0%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:31:28 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5376.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 54.8%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:31:38 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5324.7 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 54.8%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:31:48 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5427.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 55.4%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:31:58 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5306.3 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 56.6%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:32:08 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5374.1 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 56.6%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:32:18 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5374.5 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 58.4%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:32:28 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5323.0 tokens/s, Running: 512 reqs, Waiting: 0 reqs, GPU KV cache usage: 58.4%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:32:38 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 4980.3 tokens/s, Running: 231 reqs, Waiting: 0 reqs, GPU KV cache usage: 26.4%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:32:48 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 353.6 tokens/s, Running: 0 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.0%, Prefix cache hit rate: 0.0% -(APIServer pid=2993839) INFO 11-13 01:32:58 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 0.0 tokens/s, Running: 0 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.0%, Prefix cache hit rate: 0.0% diff --git a/oss_log_baseline.txt b/oss_log_baseline.txt deleted file mode 100644 index d5b06e0f6..000000000 --- a/oss_log_baseline.txt +++ /dev/null @@ -1,2410 +0,0 @@ -INFO 11-12 01:19:42 [__init__.py:26] TPU info: node_name=cuiq-infer-v7-2 | tpu_type=tpu7x-8 | worker_id=0 | num_chips=8 | num_cores_per_chip=2 -INFO 11-12 01:19:43 [importing.py:44] Triton is installed but 0 active driver(s) found (expected 1). Disabling Triton to prevent runtime errors. -INFO 11-12 01:19:43 [importing.py:68] Triton not installed or not compatible; certain GPU-related functions will not be available. -WARNING 11-12 01:19:43 [interface.py:197] Failed to import from vllm._C: ModuleNotFoundError("No module named 'vllm._C'") -(APIServer pid=1953096) INFO 11-12 01:19:44 [api_server.py:1897] vLLM API server version 0.11.1rc7.dev48+gdf4d3a44a -(APIServer pid=1953096) INFO 11-12 01:19:44 [utils.py:253] non-default args: {'model_tag': 'unsloth/gpt-oss-120b-BF16', 'model': 'unsloth/gpt-oss-120b-BF16', 'max_model_len': 8192, 'download_dir': '/mnt/disks/persist', 'tensor_parallel_size': 4, 'gpu_memory_utilization': 0.98, 'enable_prefix_caching': False, 'max_num_batched_tokens': 8192, 'max_num_seqs': 256, 'async_scheduling': True} -(APIServer pid=1953096) INFO 11-12 01:19:44 [model.py:630] Resolved architecture: GptOssForCausalLM -(APIServer pid=1953096) INFO 11-12 01:19:44 [model.py:1728] Using max model len 8192 -(APIServer pid=1953096) INFO 11-12 01:19:44 [scheduler.py:254] Chunked prefill is enabled with max_num_batched_tokens=8192. -(APIServer pid=1953096) INFO 11-12 01:19:44 [config.py:272] Overriding max cuda graph capture size to 1024 for performance. -(APIServer pid=1953096) INFO 11-12 01:19:44 [tpu_jax.py:118] Initialized sharding configuration: ShardingConfigManager(total_devices=4, sharding_strategy=ShardingStrategy(tensor_parallelism=4, expert_parallelism=1, sequence_parallelism=1, data_parallelism=1, attention_data_parallelism=1), device_indexes=None) -(APIServer pid=1953096) WARNING 11-12 01:19:44 [tpu_jax.py:156] The model dtype is not properly set for JAX backend. Overwriting it to jnp.bfloat16 -(APIServer pid=1953096) INFO 11-12 01:19:44 [tpu_jax.py:192] Force using UniProcExecutor for JAX on single host. -INFO 11-12 01:19:48 [__init__.py:26] TPU info: node_name=cuiq-infer-v7-2 | tpu_type=tpu7x-8 | worker_id=0 | num_chips=8 | num_cores_per_chip=2 -INFO 11-12 01:19:49 [importing.py:44] Triton is installed but 0 active driver(s) found (expected 1). Disabling Triton to prevent runtime errors. -INFO 11-12 01:19:49 [importing.py:68] Triton not installed or not compatible; certain GPU-related functions will not be available. -WARNING 11-12 01:19:49 [interface.py:197] Failed to import from vllm._C: ModuleNotFoundError("No module named 'vllm._C'") -(EngineCore_DP0 pid=1953269) INFO 11-12 01:19:49 [core.py:94] Initializing a V1 LLM engine (v0.11.1rc7.dev48+gdf4d3a44a) with config: model='unsloth/gpt-oss-120b-BF16', speculative_config=None, tokenizer='unsloth/gpt-oss-120b-BF16', skip_tokenizer_init=False, tokenizer_mode=auto, revision=None, tokenizer_revision=None, trust_remote_code=False, dtype=torch.bfloat16, max_seq_len=8192, download_dir='/mnt/disks/persist', load_format=auto, tensor_parallel_size=4, pipeline_parallel_size=1, data_parallel_size=1, disable_custom_all_reduce=True, quantization=None, enforce_eager=False, kv_cache_dtype=auto, device_config=None, structured_outputs_config=StructuredOutputsConfig(backend='auto', disable_fallback=False, disable_any_whitespace=False, disable_additional_properties=False, reasoning_parser='openai_gptoss', reasoning_parser_plugin='', enable_in_reasoning=False), observability_config=ObservabilityConfig(show_hidden_metrics_for_version=None, otlp_traces_endpoint=None, collect_detailed_traces=None), seed=0, served_model_name=unsloth/gpt-oss-120b-BF16, enable_prefix_caching=False, chunked_prefill_enabled=True, pooler_config=None, compilation_config={'level': None, 'mode': 2, 'debug_dump_path': None, 'cache_dir': '', 'compile_cache_save_format': 'binary', 'backend': 'openxla', 'custom_ops': ['all'], 'splitting_ops': None, 'compile_mm_encoder': True, 'use_inductor': None, 'compile_sizes': None, 'inductor_compile_config': {'enable_auto_functionalized_v2': False}, 'inductor_passes': {}, 'cudagraph_mode': , 'use_cudagraph': True, 'cudagraph_num_of_warmups': 0, 'cudagraph_capture_sizes': None, 'cudagraph_copy_inputs': False, 'full_cuda_graph': False, 'cudagraph_specialize_lora': True, 'use_inductor_graph_partition': False, 'pass_config': {}, 'max_cudagraph_capture_size': 1024, 'local_cache_dir': None} -(EngineCore_DP0 pid=1953269) WARNING 11-12 01:19:50 [tpu_jax.py:228] Pin memory is not supported on TPU. -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -(EngineCore_DP0 pid=1953269) INFO 11-12 01:19:55 [parallel_state.py:1325] rank 0 in world size 1 is assigned as DP rank 0, PP rank 0, TP rank 0, EP rank 0 -(EngineCore_DP0 pid=1953269) INFO 11-12 01:19:55 [tpu_jax_runner.py:273] Init mesh | mesh=Mesh('data': 1, 'model': 4, axis_types=(Auto, Auto)) -(EngineCore_DP0 pid=1953269) INFO 11-12 01:19:55 [utils.py:93] Prepared token paddings: [16, 32, 64, 128, 256, 512, 1024, 2048, 4096, 8192] -(EngineCore_DP0 pid=1953269) INFO 11-12 01:19:55 [utils.py:59] Prepared request paddings: [8, 16, 32, 64, 128, 256] -(EngineCore_DP0 pid=1953269) INFO 11-12 01:19:55 [compilation_manager.py:34] Enabling JAX compile cache. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:19:55 [tpu_worker_jax.py:152] Init worker | rank=0 | node_id=0 | is_driver_worker=True | hbm=[(0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75)]GiB -(EngineCore_DP0 pid=1953269) INFO 11-12 01:19:55 [model_loader.py:318] Loading model with MODEL_IMPL_TYPE=vllm -(EngineCore_DP0 pid=1953269) WARNING 11-12 01:19:56 [rocm.py:34] Failed to import from amdsmi with ModuleNotFoundError("No module named 'amdsmi'") -(EngineCore_DP0 pid=1953269) WARNING 11-12 01:19:56 [rocm.py:39] Failed to import from vllm._C with ModuleNotFoundError("No module named 'vllm._C'") -(EngineCore_DP0 pid=1953269) WARNING 11-12 01:19:56 [rocm.py:45] Failed to import from vllm._rocm_C with ModuleNotFoundError("No module named 'vllm._rocm_C'") -(EngineCore_DP0 pid=1953269) WARNING 11-12 01:19:56 [registry.py:171] _Backend has been renamed to AttentionBackendEnum. Please update your code to use AttentionBackendEnum instead. _Backend will be removed in a future release. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:19:56 [tpu_jax.py:63] Cannot use None backend on TPU. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:19:56 [tpu_jax.py:66] Using Pallas V1 backend. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:19:56 [layer.py:331] Disabling MoE shared_experts cuda stream -(EngineCore_DP0 pid=1953269) Loading safetensors checkpoint shards: 0% Completed | 0/73 [00:00 {'num_tokens': 16} -(EngineCore_DP0 pid=1953269) /mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/torchax/tensor.py:154: UserWarning: Explicitly requested dtype int64 requested in astype is not available, and will be truncated to dtype int32. To enable more dtypes, set the jax_enable_x64 configuration option or the JAX_ENABLE_X64 shell environment variable. See https://github.com/jax-ml/jax#current-gotchas for more. -(EngineCore_DP0 pid=1953269) res = jax_function(self._elem, *args, **kwargs) -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:27] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) INFO 11-12 01:21:35 [compilation_manager.py:67] Compilation finished in 9.54 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:21:35 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 32} -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:35] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:35] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:35] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:36] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) INFO 11-12 01:21:45 [compilation_manager.py:67] Compilation finished in 9.92 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:21:45 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 64} -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:45] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:46] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) INFO 11-12 01:21:59 [compilation_manager.py:67] Compilation finished in 14.04 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:21:59 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 128} -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:21:59] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:00] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) INFO 11-12 01:22:14 [compilation_manager.py:67] Compilation finished in 14.97 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:22:14 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 256} -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:14] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:15] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) INFO 11-12 01:22:29 [compilation_manager.py:67] Compilation finished in 15.32 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:22:29 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 512} -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:29] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:30] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:31] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) INFO 11-12 01:22:48 [compilation_manager.py:67] Compilation finished in 18.31 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:22:48 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 1024} -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:22:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) INFO 11-12 01:23:04 [compilation_manager.py:67] Compilation finished in 16.58 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:23:04 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 2048} -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:04] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:05] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:06] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) INFO 11-12 01:23:25 [compilation_manager.py:67] Compilation finished in 20.68 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:23:25 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 4096} -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:25] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:25] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:25] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:26] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) INFO 11-12 01:23:48 [compilation_manager.py:67] Compilation finished in 23.21 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:23:48 [compilation_manager.py:57] Precompile backbone --> {'num_tokens': 8192} -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:48] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) [2025-11-12 01:23:49] WARNING tensor.py:143: In-place to .data modifications still results a copy on TPU -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:16 [compilation_manager.py:67] Compilation finished in 27.73 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:16 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 8} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:16 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:16 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 16} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:16 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:16 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 32} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:17 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:17 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 64} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:17 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:17 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 128} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:17 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:17 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 16, 'num_reqs': 256} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:17 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:17 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 8} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:17 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:17 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 16} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:17 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:17 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 32} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:17 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:17 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 64} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:17 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:17 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 128} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:18 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:18 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 32, 'num_reqs': 256} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:18 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:18 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 8} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:18 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:18 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 16} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:18 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:18 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 32} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:18 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:18 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 64} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:18 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:18 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 128} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:18 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:18 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 64, 'num_reqs': 256} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:19 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:19 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 8} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:19 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:19 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 16} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:19 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:19 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 32} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:19 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:19 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 64} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:19 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:19 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 128} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:19 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:19 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 128, 'num_reqs': 256} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:19 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:19 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 8} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:20 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 16} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:20 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 32} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:20 [compilation_manager.py:67] Compilation finished in 0.22 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 64} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:20 [compilation_manager.py:67] Compilation finished in 0.16 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 128} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:20 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 256, 'num_reqs': 256} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:20 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:20 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 8} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:21 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:21 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 16} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:21 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:21 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 32} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:21 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:21 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 64} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:21 [compilation_manager.py:67] Compilation finished in 0.29 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:21 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 128} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:21 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:21 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 512, 'num_reqs': 256} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:22 [compilation_manager.py:67] Compilation finished in 0.16 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:22 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 8} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:22 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:22 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 16} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:22 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:22 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 32} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:22 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:22 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 64} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:22 [compilation_manager.py:67] Compilation finished in 0.30 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:22 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 128} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:23 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:23 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 1024, 'num_reqs': 256} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:23 [compilation_manager.py:67] Compilation finished in 0.16 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:23 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 8} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:23 [compilation_manager.py:67] Compilation finished in 0.26 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:23 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 16} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:23 [compilation_manager.py:67] Compilation finished in 0.26 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:23 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 32} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:24 [compilation_manager.py:67] Compilation finished in 0.30 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:24 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 64} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:24 [compilation_manager.py:67] Compilation finished in 0.39 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:24 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 128} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:24 [compilation_manager.py:67] Compilation finished in 0.24 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:24 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 2048, 'num_reqs': 256} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:25 [compilation_manager.py:67] Compilation finished in 0.24 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:25 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 8} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:25 [compilation_manager.py:67] Compilation finished in 0.25 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:25 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 16} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:25 [compilation_manager.py:67] Compilation finished in 0.27 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:25 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 32} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:25 [compilation_manager.py:67] Compilation finished in 0.29 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:25 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 64} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:26 [compilation_manager.py:67] Compilation finished in 0.37 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:26 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 128} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:26 [compilation_manager.py:67] Compilation finished in 0.25 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:26 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 4096, 'num_reqs': 256} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:26 [compilation_manager.py:67] Compilation finished in 0.26 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:26 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 8} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:26 [compilation_manager.py:67] Compilation finished in 0.25 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:26 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 16} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:27 [compilation_manager.py:67] Compilation finished in 0.26 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:27 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 32} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:27 [compilation_manager.py:67] Compilation finished in 0.29 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:27 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 64} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:27 [compilation_manager.py:67] Compilation finished in 0.37 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:27 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 128} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:28 [compilation_manager.py:67] Compilation finished in 0.24 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:28 [compilation_manager.py:57] Precompile _substitute_placeholder_token_fn --> {'num_tokens': 8192, 'num_reqs': 256} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:28 [compilation_manager.py:67] Compilation finished in 0.23 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:28 [compilation_manager.py:325] Compiling select_from_array with different input shapes. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:28 [compilation_manager.py:304] Compiling select_from_array for select all logits. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:28 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16, 'index_size': 8} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:28 [compilation_manager.py:67] Compilation finished in 0.09 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:28 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 16, 'index_size': 16} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:28 [compilation_manager.py:67] Compilation finished in 0.10 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:28 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 32, 'index_size': 8} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:28 [compilation_manager.py:67] Compilation finished in 0.09 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:28 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 32, 'index_size': 16} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:28 [compilation_manager.py:67] Compilation finished in 0.11 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:28 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 32, 'index_size': 32} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:29 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:29 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 64, 'index_size': 8} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:29 [compilation_manager.py:67] Compilation finished in 0.10 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:29 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 64, 'index_size': 16} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:29 [compilation_manager.py:67] Compilation finished in 0.11 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:29 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 64, 'index_size': 32} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:29 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:29 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 64, 'index_size': 64} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:29 [compilation_manager.py:67] Compilation finished in 0.19 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:29 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 8} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:29 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:29 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 16} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:29 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:29 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 32} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:30 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:30 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 64} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:30 [compilation_manager.py:67] Compilation finished in 0.21 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:30 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 128, 'index_size': 128} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:30 [compilation_manager.py:67] Compilation finished in 0.33 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:30 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 8} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:30 [compilation_manager.py:67] Compilation finished in 0.13 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:30 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 16} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:30 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:30 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 32} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:31 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:31 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 64} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:31 [compilation_manager.py:67] Compilation finished in 0.23 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:31 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 128} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:31 [compilation_manager.py:67] Compilation finished in 0.33 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:31 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 256, 'index_size': 256} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:32 [compilation_manager.py:67] Compilation finished in 0.55 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:32 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 8} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:32 [compilation_manager.py:67] Compilation finished in 0.17 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:32 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 16} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:32 [compilation_manager.py:67] Compilation finished in 0.18 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:32 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 32} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:32 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:32 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 64} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:33 [compilation_manager.py:67] Compilation finished in 0.26 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:33 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 128} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:33 [compilation_manager.py:67] Compilation finished in 0.53 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:33 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 512, 'index_size': 256} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:34 [compilation_manager.py:67] Compilation finished in 0.76 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:34 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 8} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:34 [compilation_manager.py:67] Compilation finished in 0.38 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:34 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 16} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:35 [compilation_manager.py:67] Compilation finished in 0.33 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:35 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 32} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:35 [compilation_manager.py:67] Compilation finished in 0.33 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:35 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 64} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:35 [compilation_manager.py:67] Compilation finished in 0.35 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:35 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 128} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:36 [compilation_manager.py:67] Compilation finished in 0.57 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:36 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 1024, 'index_size': 256} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:37 [compilation_manager.py:67] Compilation finished in 0.80 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:37 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 8} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:37 [compilation_manager.py:67] Compilation finished in 0.52 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:37 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 16} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:38 [compilation_manager.py:67] Compilation finished in 0.50 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:38 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 32} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:38 [compilation_manager.py:67] Compilation finished in 0.49 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:38 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 64} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:39 [compilation_manager.py:67] Compilation finished in 0.53 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:39 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 128} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:40 [compilation_manager.py:67] Compilation finished in 0.78 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:40 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 2048, 'index_size': 256} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:41 [compilation_manager.py:67] Compilation finished in 0.99 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:41 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 8} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:41 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:41 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 16} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:41 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:41 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 32} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:41 [compilation_manager.py:67] Compilation finished in 0.15 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:41 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 64} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:41 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:41 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 128} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:42 [compilation_manager.py:67] Compilation finished in 0.38 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:42 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 4096, 'index_size': 256} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:42 [compilation_manager.py:67] Compilation finished in 0.62 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:42 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 8} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:43 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:43 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 16} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:43 [compilation_manager.py:67] Compilation finished in 0.12 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:43 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 32} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:43 [compilation_manager.py:67] Compilation finished in 0.14 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:43 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 64} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:43 [compilation_manager.py:67] Compilation finished in 0.21 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:43 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 128} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:43 [compilation_manager.py:67] Compilation finished in 0.33 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:43 [compilation_manager.py:57] Precompile select_from_array [select all logits] --> {'array_size': 8192, 'index_size': 256} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:44 [compilation_manager.py:67] Compilation finished in 0.58 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:44 [compilation_manager.py:365] Compiling compute_logits with different input shapes. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:44 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 8} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:44 [compilation_manager.py:67] Compilation finished in 0.27 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:44 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 16} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:45 [compilation_manager.py:67] Compilation finished in 0.65 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:45 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 32} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:45 [compilation_manager.py:67] Compilation finished in 0.31 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:45 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 64} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:46 [compilation_manager.py:67] Compilation finished in 0.39 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:46 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 128} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:47 [compilation_manager.py:67] Compilation finished in 1.34 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:47 [compilation_manager.py:57] Precompile compute_logits --> {'num_reqs': 256} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:48 [compilation_manager.py:67] Compilation finished in 1.22 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:48 [compilation_manager.py:387] Compiling sampling with different input shapes. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:49 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 8, 'do_sampling': True} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:52 [compilation_manager.py:67] Compilation finished in 3.23 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:52 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 8, 'do_sampling': False} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:52 [compilation_manager.py:67] Compilation finished in 0.20 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:52 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 16, 'do_sampling': True} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:55 [compilation_manager.py:67] Compilation finished in 2.43 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:55 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 16, 'do_sampling': False} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:55 [compilation_manager.py:67] Compilation finished in 0.35 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:55 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 32, 'do_sampling': True} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:59 [compilation_manager.py:67] Compilation finished in 3.38 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:59 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 32, 'do_sampling': False} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:24:59 [compilation_manager.py:67] Compilation finished in 0.57 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:00 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 64, 'do_sampling': True} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:04 [compilation_manager.py:67] Compilation finished in 3.76 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:04 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 64, 'do_sampling': False} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:09 [compilation_manager.py:67] Compilation finished in 5.32 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:09 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 128, 'do_sampling': True} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:12 [compilation_manager.py:67] Compilation finished in 2.75 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:12 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 128, 'do_sampling': False} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:12 [compilation_manager.py:67] Compilation finished in 0.26 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:12 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 256, 'do_sampling': True} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:15 [compilation_manager.py:67] Compilation finished in 2.96 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:15 [compilation_manager.py:57] Precompile sample --> {'num_reqs': 256, 'do_sampling': False} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:16 [compilation_manager.py:67] Compilation finished in 0.30 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:16 [compilation_manager.py:455] Compiling gather_logprobs with different input shapes. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:16 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 8} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:16 [compilation_manager.py:67] Compilation finished in 0.72 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:16 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 16} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:17 [compilation_manager.py:67] Compilation finished in 0.71 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:17 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 32} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:19 [compilation_manager.py:67] Compilation finished in 1.83 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:19 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 64} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:21 [compilation_manager.py:67] Compilation finished in 1.77 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:21 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 128} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:23 [compilation_manager.py:67] Compilation finished in 1.97 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:23 [compilation_manager.py:57] Precompile gather_logprobs --> {'num_reqs': 256} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:25 [compilation_manager.py:67] Compilation finished in 1.84 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:25 [compilation_manager.py:751] Compiling structured_decoding with different input shapes. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:25 [compilation_manager.py:57] Precompile structured_decode --> {'num_reqs': 8} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:26 [compilation_manager.py:67] Compilation finished in 1.86 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:26 [compilation_manager.py:57] Precompile structured_decode --> {'num_reqs': 16} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:28 [compilation_manager.py:67] Compilation finished in 1.82 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:28 [compilation_manager.py:57] Precompile structured_decode --> {'num_reqs': 32} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:30 [compilation_manager.py:67] Compilation finished in 1.81 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:30 [compilation_manager.py:57] Precompile structured_decode --> {'num_reqs': 64} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:32 [compilation_manager.py:67] Compilation finished in 1.46 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:32 [compilation_manager.py:57] Precompile structured_decode --> {'num_reqs': 128} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:33 [compilation_manager.py:67] Compilation finished in 1.24 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:33 [compilation_manager.py:57] Precompile structured_decode --> {'num_reqs': 256} -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:34 [compilation_manager.py:67] Compilation finished in 1.28 [secs]. -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:34 [core.py:247] init engine (profile, create kv cache, warmup model) took 252.55 seconds -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:35 [core.py:181] Batch queue is enabled with size 2 -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:35 [tpu_jax.py:118] Initialized sharding configuration: ShardingConfigManager(total_devices=4, sharding_strategy=ShardingStrategy(tensor_parallelism=4, expert_parallelism=1, sequence_parallelism=1, data_parallelism=1, attention_data_parallelism=1), device_indexes=None) -(EngineCore_DP0 pid=1953269) WARNING 11-12 01:25:35 [tpu_jax.py:156] The model dtype is not properly set for JAX backend. Overwriting it to jnp.bfloat16 -(EngineCore_DP0 pid=1953269) INFO 11-12 01:25:35 [tpu_jax.py:192] Force using UniProcExecutor for JAX on single host. -(APIServer pid=1953096) [INFO] model_hosting_container_standards - decorators.py:76: [PING] Framework handler registered: ping -(APIServer pid=1953096) [2025-11-12 01:25:36] INFO decorators.py:76: [PING] Framework handler registered: ping -(APIServer pid=1953096) [INFO] model_hosting_container_standards.common.transforms.base_factory - base_factory.py:90: [INJECT_ADAPTER_ID] Transform decorator applied to: invocations -(APIServer pid=1953096) [2025-11-12 01:25:36] INFO base_factory.py:90: [INJECT_ADAPTER_ID] Transform decorator applied to: invocations -(APIServer pid=1953096) [INFO] model_hosting_container_standards.common.transforms.base_factory - base_factory.py:115: [INJECT_ADAPTER_ID] Registered transform handler for invocations -(APIServer pid=1953096) [2025-11-12 01:25:36] INFO base_factory.py:115: [INJECT_ADAPTER_ID] Registered transform handler for invocations -(APIServer pid=1953096) [INFO] model_hosting_container_standards.common.transforms.base_factory - base_factory.py:90: [STATEFUL_SESSION_MANAGER] Transform decorator applied to: decorated_func -(APIServer pid=1953096) [2025-11-12 01:25:36] INFO base_factory.py:90: [STATEFUL_SESSION_MANAGER] Transform decorator applied to: decorated_func -(APIServer pid=1953096) [INFO] model_hosting_container_standards.common.transforms.base_factory - base_factory.py:115: [STATEFUL_SESSION_MANAGER] Registered transform handler for decorated_func -(APIServer pid=1953096) [2025-11-12 01:25:36] INFO base_factory.py:115: [STATEFUL_SESSION_MANAGER] Registered transform handler for decorated_func -(APIServer pid=1953096) [INFO] model_hosting_container_standards - decorators.py:76: [INVOKE] Framework handler registered: decorated_func -(APIServer pid=1953096) [2025-11-12 01:25:36] INFO decorators.py:76: [INVOKE] Framework handler registered: decorated_func -(APIServer pid=1953096) [INFO] model_hosting_container_standards - __init__.py:127: Starting SageMaker bootstrap process -(APIServer pid=1953096) [2025-11-12 01:25:36] INFO __init__.py:127: Starting SageMaker bootstrap process -(APIServer pid=1953096) [INFO] model_hosting_container_standards - registry.py:109: [REGISTRY] Middleware resolution and registration complete -(APIServer pid=1953096) [2025-11-12 01:25:36] INFO registry.py:109: [REGISTRY] Middleware resolution and registration complete -(APIServer pid=1953096) [INFO] model_hosting_container_standards - core.py:100: [MIDDLEWARE_LOADER] Middleware stack rebuilt successfully -(APIServer pid=1953096) [2025-11-12 01:25:36] INFO core.py:100: [MIDDLEWARE_LOADER] Middleware stack rebuilt successfully -(APIServer pid=1953096) [INFO] model_hosting_container_standards - core.py:102: [MIDDLEWARE_LOADER] Processed 3 middlewares -(APIServer pid=1953096) [2025-11-12 01:25:36] INFO core.py:102: [MIDDLEWARE_LOADER] Processed 3 middlewares -(APIServer pid=1953096) [WARNING] model_hosting_container_standards.common.custom_code_ref_resolver.function_loader - function_loader.py:73: Failed to load function from spec 'model:custom_sagemaker_invocation_handler': HandlerFileNotFoundError: File '/opt/ml/model/model.py' not found in search paths: ['/opt/ml/model/'] -(APIServer pid=1953096) [2025-11-12 01:25:36] WARNING function_loader.py:73: Failed to load function from spec 'model:custom_sagemaker_invocation_handler': HandlerFileNotFoundError: File '/opt/ml/model/model.py' not found in search paths: ['/opt/ml/model/'] -(APIServer pid=1953096) [WARNING] model_hosting_container_standards.common.custom_code_ref_resolver.function_loader - function_loader.py:73: Failed to load function from spec 'model:custom_sagemaker_ping_handler': HandlerFileNotFoundError: File '/opt/ml/model/model.py' not found in search paths: ['/opt/ml/model/'] -(APIServer pid=1953096) [2025-11-12 01:25:36] WARNING function_loader.py:73: Failed to load function from spec 'model:custom_sagemaker_ping_handler': HandlerFileNotFoundError: File '/opt/ml/model/model.py' not found in search paths: ['/opt/ml/model/'] -(APIServer pid=1953096) [INFO] model_hosting_container_standards.sagemaker.sagemaker_router - sagemaker_router.py:93: Creating SageMaker router with unified route resolver -(APIServer pid=1953096) [2025-11-12 01:25:36] INFO sagemaker_router.py:93: Creating SageMaker router with unified route resolver -(APIServer pid=1953096) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:172: Creating router with prefix='', tags=['sagemaker'] -(APIServer pid=1953096) [2025-11-12 01:25:36] INFO routing.py:172: Creating router with prefix='', tags=['sagemaker'] -(APIServer pid=1953096) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:110: Mounting 2 handlers to router -(APIServer pid=1953096) [2025-11-12 01:25:36] INFO routing.py:110: Mounting 2 handlers to router -(APIServer pid=1953096) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:184: Router created with 0 routes -(APIServer pid=1953096) [2025-11-12 01:25:36] INFO routing.py:184: Router created with 0 routes -(APIServer pid=1953096) [INFO] model_hosting_container_standards.sagemaker.sagemaker_router - sagemaker_router.py:101: SageMaker router created successfully with 0 routes -(APIServer pid=1953096) [2025-11-12 01:25:36] INFO sagemaker_router.py:101: SageMaker router created successfully with 0 routes -(APIServer pid=1953096) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:287: Including router with conflict detection -(APIServer pid=1953096) [2025-11-12 01:25:36] INFO routing.py:287: Including router with conflict detection -(APIServer pid=1953096) [INFO] model_hosting_container_standards.common.fastapi.routing - routing.py:305: Successfully included router with 0 routes -(APIServer pid=1953096) [2025-11-12 01:25:36] INFO routing.py:305: Successfully included router with 0 routes -(APIServer pid=1953096) [INFO] model_hosting_container_standards - __init__.py:139: SageMaker bootstrap completed successfully -(APIServer pid=1953096) [2025-11-12 01:25:36] INFO __init__.py:139: SageMaker bootstrap completed successfully -(APIServer pid=1953096) INFO 11-12 01:25:36 [api_server.py:1662] Supported tasks: ['generate'] -(APIServer pid=1953096) WARNING 11-12 01:25:36 [serving_responses.py:189] For gpt-oss, we ignore --enable-auto-tool-choice and always enable tool use. -(APIServer pid=1953096) INFO 11-12 01:25:36 [api_server.py:1972] Starting vLLM API server 0 on http://0.0.0.0:8000 -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:38] Available routes are: -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /openapi.json, Methods: GET, HEAD -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /docs, Methods: GET, HEAD -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /docs/oauth2-redirect, Methods: GET, HEAD -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /redoc, Methods: GET, HEAD -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /health, Methods: GET -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /load, Methods: GET -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /tokenize, Methods: POST -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /detokenize, Methods: POST -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /v1/models, Methods: GET -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /version, Methods: GET -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /v1/responses, Methods: POST -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /v1/responses/{response_id}, Methods: GET -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /v1/responses/{response_id}/cancel, Methods: POST -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /v1/messages, Methods: POST -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /v1/chat/completions, Methods: POST -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /v1/completions, Methods: POST -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /v1/embeddings, Methods: POST -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /pooling, Methods: POST -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /classify, Methods: POST -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /score, Methods: POST -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /v1/score, Methods: POST -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /v1/audio/transcriptions, Methods: POST -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /v1/audio/translations, Methods: POST -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /rerank, Methods: POST -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /v1/rerank, Methods: POST -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /v2/rerank, Methods: POST -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /scale_elastic_ep, Methods: POST -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /is_scaling_elastic_ep, Methods: POST -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /ping, Methods: GET -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /ping, Methods: POST -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /invocations, Methods: POST -(APIServer pid=1953096) INFO 11-12 01:25:36 [launcher.py:46] Route: /metrics, Methods: GET -(APIServer pid=1953096) INFO: Started server process [1953096] -(APIServer pid=1953096) INFO: Waiting for application startup. -(APIServer pid=1953096) INFO: Application startup complete. -(APIServer pid=1953096) INFO: 127.0.0.1:53822 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO 11-12 05:15:57 [loggers.py:221] Engine 000: Avg prompt throughput: 204.8 tokens/s, Avg generation throughput: 9.3 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.1%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:16:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 158.7 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.2%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:16:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 158.0 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.3%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:16:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 158.4 tokens/s, Running: 1 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.3%, Prefix cache hit rate: 0.0% -(EngineCore_DP0 pid=1953269) WARNING 11-12 05:16:35 [tpu_jax_runner.py:666] Should not schedule a request that does nothing! -(APIServer pid=1953096) INFO: 127.0.0.1:53822 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52668 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52674 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52678 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52680 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52682 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52690 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52692 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52706 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52710 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52712 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52714 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52718 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52734 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52736 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52740 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52750 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52764 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52774 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52786 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52788 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52798 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52802 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52814 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52828 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52838 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52840 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52848 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52864 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52876 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52880 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52884 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52892 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52900 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52912 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52916 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52922 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52928 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52940 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52952 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52954 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52966 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52982 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:52994 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53008 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53014 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53026 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53034 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53040 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53048 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53054 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53058 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53064 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53076 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53090 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53096 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53104 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53108 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53112 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53118 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53128 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53130 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53138 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53144 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53156 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53170 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53180 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53192 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53206 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53208 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53222 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53236 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53246 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53252 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53260 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53266 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53282 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53286 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53298 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53304 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53318 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53332 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53336 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53344 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53348 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53352 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53360 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53376 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53384 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53390 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53398 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53414 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53424 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53426 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53440 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53450 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53458 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53474 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53486 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53500 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53504 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53518 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53520 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53522 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53526 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53528 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53532 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53546 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53558 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53572 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53578 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53584 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53594 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53610 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53614 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53628 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53632 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53646 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53650 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53656 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53662 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53666 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53680 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53694 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53696 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53708 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53712 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53726 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53730 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53732 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53746 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53762 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53774 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53776 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53778 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53784 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53786 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53792 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53804 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53818 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53832 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53848 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53864 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53868 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53876 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53884 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53900 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53902 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53910 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53912 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53922 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53936 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53938 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53940 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53952 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53966 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53976 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:53990 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54002 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54006 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54012 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54020 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54022 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54026 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54038 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54048 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54056 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54070 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54074 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54084 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54086 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54094 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54108 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54114 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54116 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54126 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54134 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54144 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54148 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54160 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54164 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54180 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54190 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54204 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54218 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54224 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54230 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54242 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54256 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54260 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54276 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54286 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54296 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54312 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54316 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54332 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54342 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54344 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54360 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54362 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54364 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54370 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54378 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54388 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54396 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54398 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54412 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54416 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54420 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54434 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54442 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54452 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54464 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54480 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54482 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54494 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54502 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54518 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54534 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54544 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54548 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54560 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54564 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54568 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54572 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54576 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54582 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54584 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54590 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54592 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54602 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54610 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54624 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54628 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54634 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54638 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54648 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54664 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54672 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54678 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54688 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54702 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54708 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54720 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54732 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54734 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54750 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54762 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54770 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54776 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54786 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54788 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54800 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54814 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54820 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54830 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54842 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54844 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54852 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54860 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54874 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54882 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54884 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54888 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54896 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54912 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54926 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54934 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54948 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54958 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54970 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54986 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:54996 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55004 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55016 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55020 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55026 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55034 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55044 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55056 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55070 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55076 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55090 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55094 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55104 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55106 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55122 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55134 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55144 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55154 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55158 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55168 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55184 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55192 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55202 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55216 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55228 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55230 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55240 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55242 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55252 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55264 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55272 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55288 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55300 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55312 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55314 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55320 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55336 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55346 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55352 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55356 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55368 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55370 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55384 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55392 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55398 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55406 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55420 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55436 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55442 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55456 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55472 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55488 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55492 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55504 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55512 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55518 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55526 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55534 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55536 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55542 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55552 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55554 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55562 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55576 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55588 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55602 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55606 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55616 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55632 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55634 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55636 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55642 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55648 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55660 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55662 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55664 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55668 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55680 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55694 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55708 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55724 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55738 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55740 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55746 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55760 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55762 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55776 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55792 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55798 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55812 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55826 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55828 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55834 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55838 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55846 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55848 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55850 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55862 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55874 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55890 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55894 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55906 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55920 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55928 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55934 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55944 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55954 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55964 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55978 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55984 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:55998 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56006 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56014 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56022 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56032 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56046 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56056 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56058 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56074 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56086 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56094 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56096 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56102 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56104 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56118 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56134 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56140 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56156 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56160 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56172 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56176 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56184 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56200 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56206 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56212 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56224 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56238 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56252 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56254 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56260 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56270 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56282 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56292 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56300 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56302 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56312 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56326 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56332 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56346 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56360 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56364 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56374 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56376 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56382 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56388 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56392 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56402 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56416 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56420 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56430 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56440 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56444 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56460 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56474 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56484 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56488 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56504 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56506 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56512 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56524 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56534 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56542 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56554 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56560 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56566 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56578 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56584 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56600 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56614 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56626 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56630 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56642 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56654 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56666 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56676 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56684 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56700 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56712 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56724 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56734 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56738 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56752 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56766 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56776 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56786 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56802 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56804 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56810 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56822 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56832 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56834 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56838 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56854 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56858 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56872 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56876 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56892 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56898 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56904 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56912 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56922 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56926 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56930 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56932 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56942 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56944 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56960 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56974 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56990 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:56994 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57004 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57020 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57034 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57038 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57052 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57058 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57070 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57086 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57100 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57108 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57122 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57124 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57140 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57152 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57162 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57172 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57188 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57198 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57214 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57230 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57232 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57242 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57258 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57270 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57274 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57278 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57282 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57288 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57302 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57310 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57312 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57318 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57328 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57332 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57348 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57350 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57360 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57364 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57368 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57372 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57376 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57386 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57400 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57416 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57424 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57432 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57446 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57456 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57470 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57486 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57498 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57502 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57510 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57514 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57516 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57520 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57530 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57544 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57560 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57566 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57578 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57580 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57590 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57602 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57604 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57608 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57616 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57626 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57638 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57646 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57660 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57672 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57680 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57694 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57700 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57708 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57724 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57732 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57748 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57762 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57778 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57782 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57798 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57812 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57822 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57838 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57840 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57850 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57862 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57874 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57880 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57882 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57894 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57900 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57912 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57918 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57922 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57938 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57952 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57954 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57962 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57968 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:57984 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58000 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58006 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58008 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58020 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58022 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58036 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58040 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58046 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58050 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58052 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58054 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58060 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58076 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58092 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58096 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58100 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58112 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58118 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58134 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58140 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58146 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58162 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58168 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58182 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58186 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58190 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58204 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58218 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58220 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58230 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58244 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58248 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58262 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58276 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58280 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58290 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58302 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58310 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58324 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58332 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58336 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58352 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58354 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58362 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58374 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58386 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58388 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58402 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58408 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58414 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58430 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58434 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58448 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58452 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58466 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58480 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58492 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58498 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58500 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58512 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58528 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58542 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58554 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58556 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58568 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58570 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58574 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58576 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58586 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58594 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58602 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58606 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58612 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58620 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58634 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58636 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58652 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58654 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58670 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58684 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58688 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58692 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58700 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58716 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58722 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58724 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58740 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58744 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58758 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58770 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58780 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58794 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58808 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58820 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58822 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58824 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58836 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58844 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58852 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58854 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58860 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58872 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58880 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58890 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58896 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58906 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58920 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58936 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58948 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58958 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58972 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:58986 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59000 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59016 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59020 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59030 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59032 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59046 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59048 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59056 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59060 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59062 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59076 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59088 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59104 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59108 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59116 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59124 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59140 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59146 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59150 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59160 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59168 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59172 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59174 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59182 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59190 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59194 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59208 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59216 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59226 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59236 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59244 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59248 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59254 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59266 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59276 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59292 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59308 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59320 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59324 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59330 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59346 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59356 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59370 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59380 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59386 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59390 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59406 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59420 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59428 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59442 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59452 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59456 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59468 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59474 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59480 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59492 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59508 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59514 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59528 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59536 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59548 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59552 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59564 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59576 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59584 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59588 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59592 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59602 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59604 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59620 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59628 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59638 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59652 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59662 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59674 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59686 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59698 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59704 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59714 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59728 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59732 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59736 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59748 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59750 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59764 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59780 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59794 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59802 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59808 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59818 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59822 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59830 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59842 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59850 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59854 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59862 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59874 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59878 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59880 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59896 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59898 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59906 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59908 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59914 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59916 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59926 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59934 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59940 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59950 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59960 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59962 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59970 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59974 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59982 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59992 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:59994 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60004 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60012 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60022 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60024 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60038 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60044 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60046 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60054 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60062 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60070 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60080 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60090 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60102 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60112 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60128 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60144 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60158 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60174 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60184 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60194 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60196 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60200 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60208 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60212 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60222 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60238 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60252 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60254 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60270 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60280 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60292 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60308 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60318 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60326 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60336 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60346 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60348 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60364 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60378 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60394 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60404 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60414 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60430 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60438 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60440 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60452 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60460 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60464 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60466 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60474 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60488 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60490 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60496 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60508 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60512 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60526 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60530 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60540 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60550 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60560 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60566 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60578 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60584 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60596 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60606 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60610 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60620 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60636 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60640 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60650 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60662 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60664 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60668 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60670 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60678 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60680 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60696 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60704 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60716 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60726 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60740 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60744 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60752 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60760 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60766 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60768 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60782 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60794 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60802 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60810 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60812 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60828 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60834 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60842 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60846 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60858 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60862 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60872 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60876 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60882 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60898 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60908 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60918 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60924 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60930 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60936 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60950 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60958 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60968 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60972 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60988 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60992 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60996 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:60998 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32778 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32780 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32782 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32784 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32786 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32790 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32796 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32804 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32806 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32808 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32810 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32814 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32816 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32822 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32838 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32850 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32854 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32866 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32870 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32882 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32886 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32890 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32904 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32910 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32920 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32936 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32948 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32950 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32964 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32968 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32978 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32982 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:32986 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33002 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33008 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33020 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33022 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33026 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33038 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33042 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33054 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33064 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33070 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33072 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33084 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33096 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33104 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33114 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33130 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33146 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33162 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33166 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33182 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33188 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33198 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33202 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33208 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33218 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33230 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33244 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33252 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33264 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33280 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33292 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33294 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33306 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33308 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33324 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33332 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33344 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33350 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33364 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33372 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33384 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33398 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33402 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33418 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33430 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33442 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33450 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33464 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33470 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33480 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33484 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33500 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33504 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO: 127.0.0.1:33508 - "POST /v1/completions HTTP/1.1" 200 OK -(APIServer pid=1953096) INFO 11-12 05:16:37 [loggers.py:221] Engine 000: Avg prompt throughput: 1843.1 tokens/s, Avg generation throughput: 136.6 tokens/s, Running: 14 reqs, Waiting: 934 reqs, GPU KV cache usage: 1.5%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:16:47 [loggers.py:221] Engine 000: Avg prompt throughput: 18840.1 tokens/s, Avg generation throughput: 131.1 tokens/s, Running: 106 reqs, Waiting: 918 reqs, GPU KV cache usage: 11.4%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:16:57 [loggers.py:221] Engine 000: Avg prompt throughput: 17612.6 tokens/s, Avg generation throughput: 321.7 tokens/s, Running: 192 reqs, Waiting: 832 reqs, GPU KV cache usage: 20.8%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:17:07 [loggers.py:221] Engine 000: Avg prompt throughput: 14126.2 tokens/s, Avg generation throughput: 1760.0 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 27.8%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:17:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5988.9 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 30.9%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:17:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5962.8 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 34.0%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:17:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5962.9 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 36.4%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:17:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6040.2 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 38.6%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:17:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6142.1 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 40.9%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:18:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6116.8 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 43.3%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:18:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6065.3 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 46.4%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:18:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6065.5 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 49.5%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:18:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 4913.5 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 52.6%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:18:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 4299.5 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 55.6%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:18:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5477.0 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 56.7%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:19:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5453.0 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 58.7%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:19:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5502.4 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 61.8%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:19:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5399.9 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 64.9%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:19:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5427.0 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 68.0%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:19:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5425.6 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 70.9%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:19:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5349.1 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 71.7%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:20:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5375.0 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 74.2%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:20:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5350.5 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 77.3%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:20:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5349.1 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 80.4%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:20:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5349.3 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 83.5%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:20:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5246.3 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 85.0%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:20:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5297.8 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 86.6%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:21:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5248.1 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 89.7%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:21:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5246.7 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 92.7%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:21:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5247.0 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 95.8%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:21:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5195.4 tokens/s, Running: 256 reqs, Waiting: 768 reqs, GPU KV cache usage: 97.4%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:21:47 [loggers.py:221] Engine 000: Avg prompt throughput: 204.7 tokens/s, Avg generation throughput: 5092.9 tokens/s, Running: 256 reqs, Waiting: 767 reqs, GPU KV cache usage: 98.6%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:21:57 [loggers.py:221] Engine 000: Avg prompt throughput: 14129.8 tokens/s, Avg generation throughput: 1116.0 tokens/s, Running: 250 reqs, Waiting: 693 reqs, GPU KV cache usage: 75.7%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:22:07 [loggers.py:221] Engine 000: Avg prompt throughput: 17612.2 tokens/s, Avg generation throughput: 546.6 tokens/s, Running: 249 reqs, Waiting: 607 reqs, GPU KV cache usage: 51.4%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:22:17 [loggers.py:221] Engine 000: Avg prompt throughput: 17408.1 tokens/s, Avg generation throughput: 544.8 tokens/s, Running: 248 reqs, Waiting: 522 reqs, GPU KV cache usage: 27.4%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:22:27 [loggers.py:221] Engine 000: Avg prompt throughput: 3071.2 tokens/s, Avg generation throughput: 5270.4 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 28.4%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:22:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5962.6 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 30.9%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:22:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5990.1 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 34.0%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:22:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6014.1 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 37.1%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:23:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6142.2 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 40.2%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:23:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6167.6 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 43.3%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:23:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6116.4 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 46.4%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:23:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6089.9 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 49.5%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:23:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5502.3 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 52.6%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:23:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 4247.6 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 52.8%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:24:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5401.6 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 55.7%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:24:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5527.8 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 58.7%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:24:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5604.8 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 61.8%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:24:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5554.2 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 64.9%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:24:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5502.5 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 67.7%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:24:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5528.0 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 68.9%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:25:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5425.7 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 71.1%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:25:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5477.0 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 74.2%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:25:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5425.6 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 77.3%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:25:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5400.1 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 80.4%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:25:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5400.2 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 83.0%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:25:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5323.3 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 83.8%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:26:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5348.6 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 86.6%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:26:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5348.7 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 89.7%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:26:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5299.0 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 92.7%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:26:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5323.7 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 95.8%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:26:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5246.2 tokens/s, Running: 256 reqs, Waiting: 512 reqs, GPU KV cache usage: 96.8%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:26:57 [loggers.py:221] Engine 000: Avg prompt throughput: 204.7 tokens/s, Avg generation throughput: 5169.5 tokens/s, Running: 256 reqs, Waiting: 511 reqs, GPU KV cache usage: 98.6%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:27:07 [loggers.py:221] Engine 000: Avg prompt throughput: 13311.0 tokens/s, Avg generation throughput: 1297.2 tokens/s, Running: 252 reqs, Waiting: 442 reqs, GPU KV cache usage: 77.9%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:27:17 [loggers.py:221] Engine 000: Avg prompt throughput: 17406.3 tokens/s, Avg generation throughput: 552.5 tokens/s, Running: 252 reqs, Waiting: 356 reqs, GPU KV cache usage: 53.9%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:27:27 [loggers.py:221] Engine 000: Avg prompt throughput: 18226.7 tokens/s, Avg generation throughput: 577.5 tokens/s, Running: 252 reqs, Waiting: 267 reqs, GPU KV cache usage: 29.2%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:27:37 [loggers.py:221] Engine 000: Avg prompt throughput: 3275.9 tokens/s, Avg generation throughput: 5014.8 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 27.9%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:27:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5962.8 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 30.9%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:27:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5937.6 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 34.0%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:28:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6013.4 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 37.1%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:28:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6091.5 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 40.2%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:28:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6117.0 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 43.3%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:28:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6092.4 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 46.4%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:28:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6091.2 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 49.5%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:28:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5606.4 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 52.6%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:29:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 4274.1 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 52.6%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:29:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5298.0 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 55.6%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:29:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5502.1 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 58.7%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:29:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5528.7 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 61.8%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:29:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5553.6 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 64.9%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:29:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5451.8 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 66.6%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:30:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5501.7 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 68.0%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:30:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5400.4 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 71.1%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:30:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5401.6 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 74.2%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:30:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5399.8 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 77.3%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:30:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5350.0 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 80.4%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:30:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5374.3 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 81.5%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:31:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5273.6 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 83.5%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:31:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5323.4 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 86.6%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:31:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5273.1 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 89.7%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:31:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5271.9 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 92.7%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:31:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5272.0 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 94.2%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:31:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5221.0 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 95.8%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:32:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5220.8 tokens/s, Running: 256 reqs, Waiting: 256 reqs, GPU KV cache usage: 98.9%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:32:17 [loggers.py:221] Engine 000: Avg prompt throughput: 10034.7 tokens/s, Avg generation throughput: 2195.2 tokens/s, Running: 252 reqs, Waiting: 202 reqs, GPU KV cache usage: 82.3%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:32:27 [loggers.py:221] Engine 000: Avg prompt throughput: 17613.4 tokens/s, Avg generation throughput: 552.8 tokens/s, Running: 252 reqs, Waiting: 117 reqs, GPU KV cache usage: 58.7%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:32:37 [loggers.py:221] Engine 000: Avg prompt throughput: 17407.1 tokens/s, Avg generation throughput: 552.6 tokens/s, Running: 252 reqs, Waiting: 31 reqs, GPU KV cache usage: 34.8%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:32:47 [loggers.py:221] Engine 000: Avg prompt throughput: 7370.0 tokens/s, Avg generation throughput: 3834.5 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 27.8%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:32:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5963.3 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 30.9%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:33:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5962.9 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 34.0%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:33:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6016.0 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 37.1%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:33:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6116.7 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 40.2%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:33:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6141.9 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 43.3%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:33:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6117.0 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 46.4%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:33:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 6091.5 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 49.5%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:34:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5913.3 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 51.6%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:34:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 4325.1 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 52.6%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:34:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 4990.2 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 55.6%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:34:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5502.5 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 58.7%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:34:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5502.5 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 61.8%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:34:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5605.7 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 63.5%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:35:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5425.6 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 64.9%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:35:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5527.7 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 68.0%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:35:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5451.1 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 71.1%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:35:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5427.4 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 74.2%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:35:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5451.3 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 77.3%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:35:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5400.0 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 78.8%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:36:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5399.7 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 80.4%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:36:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5324.9 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 83.5%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:36:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5348.6 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 86.6%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:36:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5348.2 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 89.7%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:36:47 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5297.1 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 92.1%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:36:57 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5297.6 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 92.9%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:37:07 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5247.8 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 95.8%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:37:17 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 5271.6 tokens/s, Running: 256 reqs, Waiting: 0 reqs, GPU KV cache usage: 98.9%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:37:27 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 3317.7 tokens/s, Running: 0 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.0%, Prefix cache hit rate: 0.0% -(APIServer pid=1953096) INFO 11-12 05:37:37 [loggers.py:221] Engine 000: Avg prompt throughput: 0.0 tokens/s, Avg generation throughput: 0.0 tokens/s, Running: 0 reqs, Waiting: 0 reqs, GPU KV cache usage: 0.0%, Prefix cache hit rate: 0.0% diff --git a/oss_log_numerics.txt b/oss_log_numerics.txt deleted file mode 100644 index 698aa9a09..000000000 --- a/oss_log_numerics.txt +++ /dev/null @@ -1,270 +0,0 @@ -INFO 11-14 16:36:45 [__init__.py:26] TPU info: node_name=cuiq-infer-v7-2 | tpu_type=tpu7x-8 | worker_id=0 | num_chips=8 | num_cores_per_chip=2 -INFO 11-14 16:36:45 [importing.py:44] Triton is installed but 0 active driver(s) found (expected 1). Disabling Triton to prevent runtime errors. -INFO 11-14 16:36:45 [importing.py:68] Triton not installed or not compatible; certain GPU-related functions will not be available. -WARNING 11-14 16:36:45 [interface.py:197] Failed to import from vllm._C: ModuleNotFoundError("No module named 'vllm._C'") -(APIServer pid=218262) INFO 11-14 16:36:46 [api_server.py:1897] vLLM API server version 0.11.1rc7.dev48+gdf4d3a44a -(APIServer pid=218262) INFO 11-14 16:36:46 [utils.py:253] non-default args: {'model_tag': 'unsloth/gpt-oss-120b-BF16', 'model': 'unsloth/gpt-oss-120b-BF16', 'max_model_len': 8192, 'download_dir': '/mnt/disks/persist', 'tensor_parallel_size': 4, 'data_parallel_size': 2, 'gpu_memory_utilization': 0.98, 'enable_prefix_caching': False, 'max_num_batched_tokens': 8192, 'max_num_seqs': 256, 'async_scheduling': True} -(APIServer pid=218262) INFO 11-14 16:36:47 [model.py:630] Resolved architecture: GptOssForCausalLM -(APIServer pid=218262) INFO 11-14 16:36:47 [model.py:1728] Using max model len 8192 -(APIServer pid=218262) INFO 11-14 16:36:47 [scheduler.py:254] Chunked prefill is enabled with max_num_batched_tokens=8192. -(APIServer pid=218262) INFO 11-14 16:36:47 [config.py:272] Overriding max cuda graph capture size to 1024 for performance. -(APIServer pid=218262) INFO 11-14 16:36:47 [tpu_jax.py:118] Initialized sharding configuration: ShardingConfigManager(total_devices=8, sharding_strategy=ShardingStrategy(tensor_parallelism=4, expert_parallelism=1, sequence_parallelism=1, data_parallelism=2, attention_data_parallelism=1), device_indexes=None) -(APIServer pid=218262) WARNING 11-14 16:36:47 [tpu_jax.py:156] The model dtype is not properly set for JAX backend. Overwriting it to jnp.bfloat16 -(APIServer pid=218262) INFO 11-14 16:36:47 [tpu_jax.py:192] Force using UniProcExecutor for JAX on single host. -INFO 11-14 16:36:51 [__init__.py:26] TPU info: node_name=cuiq-infer-v7-2 | tpu_type=tpu7x-8 | worker_id=0 | num_chips=8 | num_cores_per_chip=2 -INFO 11-14 16:36:51 [importing.py:44] Triton is installed but 0 active driver(s) found (expected 1). Disabling Triton to prevent runtime errors. -INFO 11-14 16:36:51 [importing.py:68] Triton not installed or not compatible; certain GPU-related functions will not be available. -WARNING 11-14 16:36:51 [interface.py:197] Failed to import from vllm._C: ModuleNotFoundError("No module named 'vllm._C'") -(EngineCore_DP0 pid=218428) INFO 11-14 16:36:52 [core.py:94] Initializing a V1 LLM engine (v0.11.1rc7.dev48+gdf4d3a44a) with config: model='unsloth/gpt-oss-120b-BF16', speculative_config=None, tokenizer='unsloth/gpt-oss-120b-BF16', skip_tokenizer_init=False, tokenizer_mode=auto, revision=None, tokenizer_revision=None, trust_remote_code=False, dtype=torch.bfloat16, max_seq_len=8192, download_dir='/mnt/disks/persist', load_format=auto, tensor_parallel_size=4, pipeline_parallel_size=1, data_parallel_size=1, disable_custom_all_reduce=True, quantization=None, enforce_eager=False, kv_cache_dtype=auto, device_config=None, structured_outputs_config=StructuredOutputsConfig(backend='auto', disable_fallback=False, disable_any_whitespace=False, disable_additional_properties=False, reasoning_parser='openai_gptoss', reasoning_parser_plugin='', enable_in_reasoning=False), observability_config=ObservabilityConfig(show_hidden_metrics_for_version=None, otlp_traces_endpoint=None, collect_detailed_traces=None), seed=0, served_model_name=unsloth/gpt-oss-120b-BF16, enable_prefix_caching=False, chunked_prefill_enabled=True, pooler_config=None, compilation_config={'level': None, 'mode': 2, 'debug_dump_path': None, 'cache_dir': '', 'compile_cache_save_format': 'binary', 'backend': 'openxla', 'custom_ops': ['all'], 'splitting_ops': None, 'compile_mm_encoder': True, 'use_inductor': None, 'compile_sizes': None, 'inductor_compile_config': {'enable_auto_functionalized_v2': False}, 'inductor_passes': {}, 'cudagraph_mode': , 'use_cudagraph': True, 'cudagraph_num_of_warmups': 0, 'cudagraph_capture_sizes': None, 'cudagraph_copy_inputs': False, 'full_cuda_graph': False, 'cudagraph_specialize_lora': True, 'use_inductor_graph_partition': False, 'pass_config': {}, 'max_cudagraph_capture_size': 1024, 'local_cache_dir': None} -(EngineCore_DP0 pid=218428) WARNING 11-14 16:36:52 [tpu_jax.py:228] Pin memory is not supported on TPU. -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0 -(EngineCore_DP0 pid=218428) INFO 11-14 16:36:57 [parallel_state.py:1325] rank 0 in world size 1 is assigned as DP rank 0, PP rank 0, TP rank 0, EP rank 0 -(EngineCore_DP0 pid=218428) INFO 11-14 16:36:58 [tpu_jax_runner.py:273] Init mesh | mesh=Mesh('data': 2, 'model': 4, axis_types=(Auto, Auto)) -(EngineCore_DP0 pid=218428) INFO 11-14 16:36:58 [utils.py:314] Phased-based profiler enabled. Traces will be saved to: gs://wenxindong-vm/trace/gpt_oss/dp2/numerics -(EngineCore_DP0 pid=218428) INFO 11-14 16:36:58 [utils.py:93] Prepared token paddings: [16, 32, 64, 128, 256, 512, 1024, 2048, 4096, 8192, 16384] -(EngineCore_DP0 pid=218428) INFO 11-14 16:36:58 [utils.py:59] Prepared request paddings: [8, 16, 32, 64, 128, 256, 512] -(EngineCore_DP0 pid=218428) INFO 11-14 16:36:58 [compilation_manager.py:34] Enabling JAX compile cache. -(EngineCore_DP0 pid=218428) INFO 11-14 16:36:58 [tpu_worker_jax.py:152] Init worker | rank=0 | node_id=0 | is_driver_worker=True | hbm=[(0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75), (0.0, 94.75)]GiB -(EngineCore_DP0 pid=218428) INFO 11-14 16:36:58 [model_loader.py:318] Loading model with MODEL_IMPL_TYPE=vllm -(EngineCore_DP0 pid=218428) WARNING 11-14 16:36:59 [rocm.py:34] Failed to import from amdsmi with ModuleNotFoundError("No module named 'amdsmi'") -(EngineCore_DP0 pid=218428) WARNING 11-14 16:36:59 [rocm.py:39] Failed to import from vllm._C with ModuleNotFoundError("No module named 'vllm._C'") -(EngineCore_DP0 pid=218428) WARNING 11-14 16:36:59 [rocm.py:45] Failed to import from vllm._rocm_C with ModuleNotFoundError("No module named 'vllm._rocm_C'") -(EngineCore_DP0 pid=218428) WARNING 11-14 16:36:59 [registry.py:171] _Backend has been renamed to AttentionBackendEnum. Please update your code to use AttentionBackendEnum instead. _Backend will be removed in a future release. -(EngineCore_DP0 pid=218428) INFO 11-14 16:36:59 [tpu_jax.py:63] Cannot use None backend on TPU. -(EngineCore_DP0 pid=218428) INFO 11-14 16:36:59 [tpu_jax.py:66] Using Pallas V1 backend. -(EngineCore_DP0 pid=218428) INFO 11-14 16:36:59 [layer.py:331] Disabling MoE shared_experts cuda stream -(EngineCore_DP0 pid=218428) Loading safetensors checkpoint shards: 0% Completed | 0/73 [00:00 -(APIServer pid=218262) sys.exit(main()) -(APIServer pid=218262) ^^^^^^ -(APIServer pid=218262) File "/home/wenxindong_google_com/vllm/vllm/entrypoints/cli/main.py", line 73, in main -(APIServer pid=218262) args.dispatch_function(args) -(APIServer pid=218262) File "/home/wenxindong_google_com/vllm/vllm/entrypoints/cli/serve.py", line 59, in cmd -(APIServer pid=218262) uvloop.run(run_server(args)) -(APIServer pid=218262) File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/uvloop/__init__.py", line 96, in run -(APIServer pid=218262) return __asyncio.run( -(APIServer pid=218262) ^^^^^^^^^^^^^^ -(APIServer pid=218262) File "/mnt/disks/persist/vllm_conda/lib/python3.12/asyncio/runners.py", line 195, in run -(APIServer pid=218262) return runner.run(main) -(APIServer pid=218262) ^^^^^^^^^^^^^^^^ -(APIServer pid=218262) File "/mnt/disks/persist/vllm_conda/lib/python3.12/asyncio/runners.py", line 118, in run -(APIServer pid=218262) return self._loop.run_until_complete(task) -(APIServer pid=218262) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(APIServer pid=218262) File "uvloop/loop.pyx", line 1518, in uvloop.loop.Loop.run_until_complete -(APIServer pid=218262) File "/mnt/disks/persist/vllm_conda/lib/python3.12/site-packages/uvloop/__init__.py", line 48, in wrapper -(APIServer pid=218262) return await main -(APIServer pid=218262) ^^^^^^^^^^ -(APIServer pid=218262) File "/home/wenxindong_google_com/vllm/vllm/entrypoints/openai/api_server.py", line 1944, in run_server -(APIServer pid=218262) await run_server_worker(listen_address, sock, args, **uvicorn_kwargs) -(APIServer pid=218262) File "/home/wenxindong_google_com/vllm/vllm/entrypoints/openai/api_server.py", line 1963, in run_server_worker -(APIServer pid=218262) async with build_async_engine_client( -(APIServer pid=218262) ^^^^^^^^^^^^^^^^^^^^^^^^^^ -(APIServer pid=218262) File "/mnt/disks/persist/vllm_conda/lib/python3.12/contextlib.py", line 210, in __aenter__ -(APIServer pid=218262) return await anext(self.gen) -(APIServer pid=218262) ^^^^^^^^^^^^^^^^^^^^^ -(APIServer pid=218262) File "/home/wenxindong_google_com/vllm/vllm/entrypoints/openai/api_server.py", line 192, in build_async_engine_client -(APIServer pid=218262) async with build_async_engine_client_from_engine_args( -(APIServer pid=218262) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(APIServer pid=218262) File "/mnt/disks/persist/vllm_conda/lib/python3.12/contextlib.py", line 210, in __aenter__ -(APIServer pid=218262) return await anext(self.gen) -(APIServer pid=218262) ^^^^^^^^^^^^^^^^^^^^^ -(APIServer pid=218262) File "/home/wenxindong_google_com/vllm/vllm/entrypoints/openai/api_server.py", line 233, in build_async_engine_client_from_engine_args -(APIServer pid=218262) async_llm = AsyncLLM.from_vllm_config( -(APIServer pid=218262) ^^^^^^^^^^^^^^^^^^^^^^^^^^ -(APIServer pid=218262) File "/home/wenxindong_google_com/vllm/vllm/utils/func_utils.py", line 116, in inner -(APIServer pid=218262) return fn(*args, **kwargs) -(APIServer pid=218262) ^^^^^^^^^^^^^^^^^^^ -(APIServer pid=218262) File "/home/wenxindong_google_com/vllm/vllm/v1/engine/async_llm.py", line 202, in from_vllm_config -(APIServer pid=218262) return cls( -(APIServer pid=218262) ^^^^ -(APIServer pid=218262) File "/home/wenxindong_google_com/vllm/vllm/v1/engine/async_llm.py", line 132, in __init__ -(APIServer pid=218262) self.engine_core = EngineCoreClient.make_async_mp_client( -(APIServer pid=218262) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(APIServer pid=218262) File "/home/wenxindong_google_com/vllm/vllm/v1/engine/core_client.py", line 121, in make_async_mp_client -(APIServer pid=218262) return AsyncMPClient(*client_args) -(APIServer pid=218262) ^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(APIServer pid=218262) File "/home/wenxindong_google_com/vllm/vllm/v1/engine/core_client.py", line 808, in __init__ -(APIServer pid=218262) super().__init__( -(APIServer pid=218262) File "/home/wenxindong_google_com/vllm/vllm/v1/engine/core_client.py", line 469, in __init__ -(APIServer pid=218262) with launch_core_engines(vllm_config, executor_class, log_stats) as ( -(APIServer pid=218262) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ -(APIServer pid=218262) File "/mnt/disks/persist/vllm_conda/lib/python3.12/contextlib.py", line 144, in __exit__ -(APIServer pid=218262) next(self.gen) -(APIServer pid=218262) File "/home/wenxindong_google_com/vllm/vllm/v1/engine/utils.py", line 898, in launch_core_engines -(APIServer pid=218262) wait_for_engine_startup( -(APIServer pid=218262) File "/home/wenxindong_google_com/vllm/vllm/v1/engine/utils.py", line 955, in wait_for_engine_startup -(APIServer pid=218262) raise RuntimeError( -(APIServer pid=218262) RuntimeError: Engine core initialization failed. See root cause above. Failed core proc(s): {} From 4b58b7050be22b7346955f0e2382bd6883f5b2fd Mon Sep 17 00:00:00 2001 From: wenxindongwork Date: Thu, 20 Nov 2025 02:44:36 +0000 Subject: [PATCH 17/17] wip --- repro_attention_dp.py | 61 +++++++++++++++++++++++++++++++++---------- 1 file changed, 47 insertions(+), 14 deletions(-) diff --git a/repro_attention_dp.py b/repro_attention_dp.py index 584e676a3..19b6830c3 100644 --- a/repro_attention_dp.py +++ b/repro_attention_dp.py @@ -7,6 +7,7 @@ """ import argparse +from functools import partial import time from pathlib import Path import numpy as np @@ -15,6 +16,8 @@ import jax.numpy as jnp from jax.sharding import Mesh, PartitionSpec as P from jax import NamedSharding, shard_map +from jax.experimental.layout import Layout, Format + from tpu_inference.layers.vllm.attention import _jax_attn_func # import sys # sys.path.insert(0, '/home/wenxindong_google_com/tpu-inference') @@ -23,14 +26,15 @@ get_kv_cache_shape as get_kv_cache_shape_h64, ) from tpu_inference.kernels.ragged_paged_attention.v3.kernel import get_kv_cache_shape -from tpu_inference.layers.common.sharding import ShardingAxisName +from tpu_inference.layers.common.sharding import MESH_AXIS_NAMES_2D, ShardingAxisName from tpu_inference.layers.common.attention_metadata import AttentionMetadata +from tpu_inference.utils import make_optimized_mesh def create_test_inputs( batch_size: int = 256, max_num_tokens: int = 256, - num_q_heads: int = 32, + num_q_heads: int = 64, num_kv_heads: int = 8, head_dim: int = 64, page_size: int = 256, @@ -1443,7 +1447,17 @@ def create_test_inputs( elif dp_size == 2: page_indices = jnp.array(page_indices_rank0 + page_indices_rank1, dtype=jnp.int32) - attention_sink = None + attention_sink = jnp.array([1.0859375, 1.125, 0.09326172, 1.0859375, 0.91796875, 1.4140625, + 0.953125, 0.38671875, 1.140625, 1.0625, 1.546875, 1.6171875, + 0.69140625, 0.4453125, 1.65625, 1.3359375, 1.4296875, 1.0234375, + 1.3828125, 1.890625, 0.953125, 0.70703125, 0.80078125, 0.953125, + 1.375 , 0.30664062, 1.2265625, 1.203125, 1.265625, 1.03125, + 2.171875, 1.2265625, 0.890625, 0.69140625, 0.44921875, 1.28125, + 0.984375 , 0.87109375, 0.59375, 0.70703125, 1.515625, 1.6796875, + 1.6171875 ,1.2109375, 1.6328125, 1.25, 1.8125, 0.53515625, + 1.4609375 , 0.8828125, 2.34375, 0.91015625, 0.56640625, 1.3125, + 1.125 , 0.75390625, 0.63671875, 2.078125, 1.2890625, 1.3828125, + 0.84765625, 0.64453125, 1.4921875, 1.6484375 ] ) sm_scale = head_dim ** -0.5 print(f"\nInput creation (dp_size={dp_size}):") @@ -1482,18 +1496,34 @@ def run(inputs, dump_dir, dp_size=2, num_devices=8, dp=True): print(f" {key}: {val.shape} {val.dtype}") devices = jax.devices() - dp_size = 2 + dp_size = 2 # don't change + total_devices = 8 if dp: - device_array = np.array(devices[:8]).reshape(dp_size, -1) + device_array = np.array(devices[:total_devices]).reshape(dp_size, -1) + mesh_shape = (dp_size, total_devices // dp_size) else: - device_array = np.array(devices[:4]).reshape(1, -1) - mesh = Mesh( + device_array = np.array(devices[:total_devices//dp_size]).reshape(1, -1) + mesh_shape = (1, total_devices // dp_size) + + mesh = make_optimized_mesh(mesh_shape, + MESH_AXIS_NAMES_2D, + devices=devices) + print("optimal mesh created:", mesh.devices) + mesh_dummy = Mesh( device_array, axis_names=(ShardingAxisName.ATTN_DATA, ShardingAxisName.ATTN_HEAD), ) - print(f"Mesh: {mesh}") + print("dummy mesh created:", mesh_dummy.devices) - def _attention_wrapper(q, k, v, kv_cache, kv_lens, page_indices, cu_q_lens, distribution): + @partial(jax.jit, + compiler_options={ + "xla_tpu_all_gather_collective_matmul_mode": + "post_spmd_conservative", + "xla_tpu_reduce_scatter_collective_matmul_mode": + "post_spmd_conservative" + } +) + def _attention_wrapper(q, k, v, kv_cache, kv_lens, page_indices, cu_q_lens, distribution, attention_sink): attention_metadata = AttentionMetadata( input_positions=None, @@ -1516,7 +1546,7 @@ def _attention_wrapper(q, k, v, kv_cache, kv_lens, page_indices, cu_q_lens, dist q=q_reshaped, k=k_reshaped, v=v_reshaped, - sinks=None, + sinks=attention_sink, attention_metadata=attention_metadata, mesh=mesh, scale=inputs['sm_scale'], @@ -1526,14 +1556,14 @@ def _attention_wrapper(q, k, v, kv_cache, kv_lens, page_indices, cu_q_lens, dist q_scale=None, k_scale=None, v_scale=None, - sliding_window=None, + sliding_window=128, ) outputs = outputs.reshape(batch_size, num_heads, head_dim) return outputs, new_kv_cache - attention_fn = jax.jit(_attention_wrapper) + attention_fn = _attention_wrapper # Lower and dump HLO print("\nLowering computation...") @@ -1546,6 +1576,7 @@ def _attention_wrapper(q, k, v, kv_cache, kv_lens, page_indices, cu_q_lens, dist inputs['page_indices'], inputs['cu_q_lens'], inputs['distribution'], + inputs['attention_sink'], ) # Dump HLO @@ -1568,7 +1599,7 @@ def _attention_wrapper(q, k, v, kv_cache, kv_lens, page_indices, cu_q_lens, dist inputs['page_indices'] = jax.device_put(inputs['page_indices'], NamedSharding(mesh, P(ShardingAxisName.ATTN_DATA))) inputs['cu_q_lens'] = jax.device_put(inputs['cu_q_lens'], NamedSharding(mesh, P(ShardingAxisName.ATTN_DATA))) inputs['distribution'] = jax.device_put(inputs['distribution'], NamedSharding(mesh, P(ShardingAxisName.ATTN_DATA))) - + inputs['attention_sink'] = jax.device_put(inputs['attention_sink'], NamedSharding(mesh, P(ShardingAxisName.ATTN_HEAD))) # Warm up print("Warming up...") for _ in range(3): @@ -1581,13 +1612,14 @@ def _attention_wrapper(q, k, v, kv_cache, kv_lens, page_indices, cu_q_lens, dist inputs['page_indices'], inputs['cu_q_lens'], inputs['distribution'], + inputs['attention_sink'], ) jax.block_until_ready(result) # Benchmark print("Benchmarking ...") times = [] - dump_dir = f"gs://wenxindong-vm/trace/debug/gptoss/kernel/dp{dp}" + dump_dir = f"gs://wenxindong-vm/trace/debug/gptoss/kernel/dp={dp}" jax.profiler.start_trace(dump_dir) for i in range(10): start = time.time() @@ -1600,6 +1632,7 @@ def _attention_wrapper(q, k, v, kv_cache, kv_lens, page_indices, cu_q_lens, dist inputs['page_indices'], inputs['cu_q_lens'], inputs['distribution'], + inputs['attention_sink'], ) jax.block_until_ready(result) elapsed = time.time() - start