Files
LEANN/demo.ipynb
yichuan520030910320 371e3de04e add configuable funcname
2025-07-01 05:02:01 +00:00

1226 lines
92 KiB
Plaintext

{
"cells": [
{
"cell_type": "code",
"execution_count": 1,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Initializing leann-backend-diskann...\n",
"INFO: Registering backend 'diskann'\n",
"INFO: DiskANN backend loaded successfully\n",
"INFO: LeannBuilder initialized with 'diskann' backend.\n"
]
},
{
"name": "stderr",
"output_type": "stream",
"text": [
"/home/ubuntu/LEANN_clean/leann/.venv/lib/python3.11/site-packages/tqdm/auto.py:21: TqdmWarning: IProgress not found. Please update jupyter and ipywidgets. See https://ipywidgets.readthedocs.io/en/stable/user_install.html\n",
" from .autonotebook import tqdm as notebook_tqdm\n"
]
},
{
"name": "stdout",
"output_type": "stream",
"text": [
"INFO: Computing embeddings for 6 chunks using 'sentence-transformers/all-mpnet-base-v2'...\n"
]
},
{
"name": "stderr",
"output_type": "stream",
"text": [
"Batches: 100%|██████████| 1/1 [00:00<00:00, 2.82it/s]\n"
]
},
{
"name": "stdout",
"output_type": "stream",
"text": [
"INFO: Building DiskANN index for 6 vectors with metric Metric.INNER_PRODUCT...\n",
"Using Inner Product search, so need to pre-process base data into temp file. Please ensure there is additional (n*(d+1)*4) bytes for storing pre-processed base vectors, apart from the interim indices created by DiskANN and the final index.\n",
"Pre-processing base file by adding extra coordinate\n",
"✅ DiskANN index built successfully at 'knowledge'\n",
"Writing bin: knowledge_disk.index_max_base_norm.bin\n",
"bin: #pts = 1, #dims = 1, size = 12B\n",
"Finished writing bin.\n",
"Time for preprocessing data for inner product: 0.000163 seconds\n",
"Reading max_norm_of_base from knowledge_disk.index_max_base_norm.bin\n",
"Reading bin file knowledge_disk.index_max_base_norm.bin ...\n",
"Opening bin file knowledge_disk.index_max_base_norm.bin... \n",
"Metadata: #pts = 1, #dims = 1...\n",
"done.\n",
"max_norm_of_base: 1\n",
"! Using prepped_base file at knowledge_prepped_base.bin\n",
"Starting index build: R=32 L=64 Query RAM budget: 4.02653e+09 Indexing ram budget: 8 T: 8\n",
"getting bin metadata\n",
"Time for getting bin metadata: 0.000020 seconds\n",
"Compressing 769-dimensional data into 512 bytes per vector.\n",
"Opened: knowledge_prepped_base.bin, size: 18464, cache_size: 18464\n",
"Training data with 6 samples loaded.\n",
"Reading bin file knowledge_pq_pivots.bin ...\n",
"Opening bin file knowledge_pq_pivots.bin... \n",
"Metadata: #pts = 256, #dims = 769...\n",
"done.\n",
"PQ pivot file exists. Not generating again\n",
"Opened: knowledge_prepped_base.bin, size: 18464, cache_size: 18464\n",
"Reading bin file knowledge_pq_pivots.bin ...\n",
"Opening bin file knowledge_pq_pivots.bin... \n",
"Metadata: #pts = 4, #dims = 1...\n",
"done.\n",
"Reading bin file knowledge_pq_pivots.bin ...\n",
"Opening bin file knowledge_pq_pivots.bin... \n",
"Metadata: #pts = 256, #dims = 769...\n",
"done.\n",
"Reading bin file knowledge_pq_pivots.bin ...\n",
"Opening bin file knowledge_pq_pivots.bin... \n",
"Metadata: #pts = 769, #dims = 1...\n",
"done.\n",
"Reading bin file knowledge_pq_pivots.bin ...\n",
"Opening bin file knowledge_pq_pivots.bin... \n",
"Metadata: #pts = 513, #dims = 1...\n",
"done.\n",
"Loaded PQ pivot information\n",
"Processing points [0, 6)...done.\n",
"Time for generating quantized data: 0.051329 seconds\n",
"Full index fits in RAM budget, should consume at most 2.03973e-05GiBs, so building in one shot\n",
"L2: Using AVX2 distance computation DistanceL2Float\n",
"Passed, empty search_params while creating index config\n",
"Using only first 6 from file.. \n",
"Starting index build with 6 points... \n",
"0% of index build completed.Starting final cleanup..done. Link time: 0.00016s\n",
"Index built with degree: max:5 avg:5 min:5 count(deg<2):0\n",
"Not saving tags as they are not enabled.\n",
"Time taken for save: 0.00015s.\n",
"Time for building merged vamana index: 0.000982 seconds\n",
"Opened: knowledge_prepped_base.bin, size: 18464, cache_size: 18464\n",
"Vamana index file size=168\n",
"Opened: knowledge_disk.index, cache_size: 67108864\n",
"medoid: 0B\n",
"max_node_len: 3100B\n",
"nnodes_per_sector: 1B\n",
"# sectors: 6\n",
"Sector #0written\n",
"Finished writing 28672B\n",
"Writing bin: knowledge_disk.index\n",
"bin: #pts = 9, #dims = 1, size = 80B\n",
"Finished writing bin.\n",
"Output disk index file written to knowledge_disk.index\n",
"Finished writing 28672B\n",
"Time for generating disk layout: 0.044798 seconds\n",
"Opened: knowledge_prepped_base.bin, size: 18464, cache_size: 18464\n",
"Loading base knowledge_prepped_base.bin. #points: 6. #dim: 769.\n",
"Wrote 1 points to sample file: knowledge_sample_data.bin\n",
"Indexing time: 0.0974831\n",
"INFO: Leann metadata saved to knowledge.leann.meta.json\n"
]
},
{
"name": "stderr",
"output_type": "stream",
"text": [
"Opened file : knowledge_disk.index\n"
]
},
{
"name": "stdout",
"output_type": "stream",
"text": [
"✅ DiskANN index loaded successfully.\n",
"INFO: LeannSearcher initialized with 'diskann' backend using index 'knowledge.leann'.\n",
"Since data is floating point, we assume that it has been appropriately pre-processed (normalization for cosine, and convert-to-l2 by adding extra dimension for MIPS). So we shall invoke an l2 distance function.\n",
"L2: Using AVX2 distance computation DistanceL2Float\n",
"L2: Using AVX2 distance computation DistanceL2Float\n",
"Before index load\n",
"Reading bin file knowledge_pq_compressed.bin ...\n",
"Opening bin file knowledge_pq_compressed.bin... \n",
"Metadata: #pts = 6, #dims = 512...\n",
"done.\n",
"Reading bin file knowledge_pq_pivots.bin ...\n",
"Opening bin file knowledge_pq_pivots.bin... \n",
"Metadata: #pts = 4, #dims = 1...\n",
"done.\n",
"Offsets: 4096 791560 794644 796704\n",
"Reading bin file knowledge_pq_pivots.bin ...\n",
"Opening bin file knowledge_pq_pivots.bin... \n",
"Metadata: #pts = 256, #dims = 769...\n",
"done.\n",
"Reading bin file knowledge_pq_pivots.bin ...\n",
"Opening bin file knowledge_pq_pivots.bin... \n",
"Metadata: #pts = 769, #dims = 1...\n",
"done.\n",
"Reading bin file knowledge_pq_pivots.bin ...\n",
"Opening bin file knowledge_pq_pivots.bin... \n",
"Metadata: #pts = 513, #dims = 1...\n",
"done.\n",
"Loaded PQ Pivots: #ctrs: 256, #dims: 769, #chunks: 512\n",
"Loaded PQ centroids and in-memory compressed vectors. #points: 6 #dim: 769 #aligned_dim: 776 #chunks: 512\n",
"Loading index metadata from knowledge_disk.index\n",
"Disk-Index File Meta-data: # nodes per sector: 1, max node len (bytes): 3100, max node degree: 5\n",
"Disk-Index Meta: nodes per sector: 1, max node len: 3100, max node degree: 5\n",
"Setting up thread-specific contexts for nthreads: 8\n",
"allocating ctx: 0x77203100b000 to thread-id:130971745651648\n",
"allocating ctx: 0x77202fc8c000 to thread-id:130971756137280\n",
"allocating ctx: 0x77202fc7b000 to thread-id:130971735166016\n",
"allocating ctx: 0x77202fc6a000 to thread-id:130983600146240\n",
"allocating ctx: 0x77202fc59000 to thread-id:130971766622912\n",
"allocating ctx: 0x77202fc48000 to thread-id:130971703709120\n",
"allocating ctx: 0x77202fc37000 to thread-id:130971714194752\n",
"allocating ctx: 0x77202fc26000 to thread-id:130971724680384\n",
"Loading centroid data from medoids vector data of 1 medoid(s)\n",
"Reading bin file knowledge_disk.index_max_base_norm.bin ...\n",
"Opening bin file knowledge_disk.index_max_base_norm.bin... \n",
"Metadata: #pts = 1, #dims = 1...\n",
"done.\n",
"Setting re-scaling factor of base vectors to 1\n",
"load_from_separate_paths done.\n",
"Reading (with alignment) bin file knowledge_sample_data.bin ...Metadata: #pts = 1, #dims = 769, aligned_dim = 776... allocating aligned memory of 3104 bytes... done. Copying data to mem_aligned buffer... done.\n",
"reserve ratio: 1\n",
"Graph traversal completed, hops: 3\n",
"Loading the cache list into memory....done.\n",
"After index load\n",
"INFO: Computing embeddings for 1 chunks using 'sentence-transformers/all-mpnet-base-v2'...\n"
]
},
{
"name": "stderr",
"output_type": "stream",
"text": [
"Batches: 100%|██████████| 1/1 [00:00<00:00, 56.33it/s]"
]
},
{
"name": "stdout",
"output_type": "stream",
"text": [
"INFO: DiskANN ZMQ mode enabled - ensuring embedding server is running\n",
"INFO: Starting session-level embedding server as a background process...\n",
"INFO: Running command from project root: /home/ubuntu/LEANN_clean/leann\n",
"INFO: Server process started with PID: 313817\n"
]
},
{
"name": "stderr",
"output_type": "stream",
"text": [
"\n"
]
},
{
"name": "stdout",
"output_type": "stream",
"text": [
"✅ Embedding server is up and ready for this session.\n",
"[EmbeddingServer LOG]: Initializing leann-backend-diskann...\n",
"[EmbeddingServer LOG]: WARNING: Could not import DiskANN backend: cannot import name '_diskannpy' from partially initialized module 'packages.leann-backend-diskann.leann_backend_diskann' (most likely due to a circular import) (/home/ubuntu/LEANN_clean/leann/packages/leann-backend-diskann/leann_backend_diskann/__init__.py)\n",
"[EmbeddingServer LOG]: INFO: Initializing embedding server thread on port 5555\n",
"[EmbeddingServer LOG]: INFO: Using CUDA device\n",
"[EmbeddingServer LOG]: INFO: Loading model sentence-transformers/all-mpnet-base-v2\n",
"[EmbeddingServer LOG]: INFO: Using FP16 precision with model: sentence-transformers/all-mpnet-base-v2\n",
"[EmbeddingServer LOG]: INFO: Loaded 6 demo documents\n",
"[EmbeddingServer LOG]: INFO: ZMQ ROUTER server listening on port 5555\n",
"[EmbeddingServer LOG]: INFO: Embedding server ready to serve requests\n",
"reserve ratio: [EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 3 bytes\n",
"1\n",
"Graph traversal completed, hops: 3\n",
"[EmbeddingServer LOG]: INFO: Request for 1 node embeddings: [0]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 0 to 0\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000025 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 1, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 1\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.019455 seconds\n",
"[EmbeddingServer LOG]: Batch size: 1, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000176 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 3.062818 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.052912 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000228 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 3.136761 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 7 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 5 node embeddings: [1, 2, 3, 4, 5]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 5\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000045 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 5, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 5\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.001596 seconds\n",
"[EmbeddingServer LOG]: Batch size: 5, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000094 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 3.517292 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000360 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000155 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 3.520236 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 7 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 5 node embeddings: [3, 4, 2, 1, 0]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 0 to 4\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000031 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 5, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 5\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.001254 seconds\n",
"[EmbeddingServer LOG]: Batch size: 5, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000076 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.009231 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000189 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000087 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.011405 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 7 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 5 node embeddings: [0, 1, 2, 4, 5]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 0 to 5\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000020 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 5, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 5\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.000968 seconds\n",
"[EmbeddingServer LOG]: Batch size: 5, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000071 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.008908 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000148 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000055 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.010627 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 7 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 5 node embeddings: [3, 1, 0, 2, 5]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 0 to 5\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000020 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 5, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 5\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.000959 seconds\n",
"[EmbeddingServer LOG]: Batch size: 5, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000071 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.008822 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000151 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000063 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.010516 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 7 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 5 node embeddings: [0, 2, 3, 4, 5]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 0 to 5\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000019 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 5, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 5\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.001046 seconds\n",
"[EmbeddingServer LOG]: Batch size: 5, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000074 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.008821 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000146 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000059 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.010625 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 7 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 5 node embeddings: [1, 0, 3, 4, 5]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 0 to 5\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000019 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 5, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 5\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.000947 seconds\n",
"[EmbeddingServer LOG]: Batch size: 5, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000071 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.008823 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000143 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000047 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.010491 seconds\n",
"Score: -0.481 - C++ is a powerful programming language\n",
"Score: -1.049 - Java is a powerful programming language\n"
]
},
{
"name": "stdout",
"output_type": "stream",
"text": [
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 3 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 1 node embeddings: [1]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 1\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000020 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 1, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 1\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.000475 seconds\n",
"[EmbeddingServer LOG]: Batch size: 1, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000245 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.005035 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000223 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000076 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.006687 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [41, 3, 40, 35, 27, 11, 2, 34, 7, 17, 53, 36, 10, 5, 6, 23, 39, 38, 15, 29, 25, 20, 4, 13, 26, 37, 33, 28, 21, 32, 12, 50]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 2 to 53\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000034 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.006198 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000091 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043852 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000362 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000303 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.051755 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [35, 40, 25, 12, 1, 2, 20, 24, 53, 9, 3, 6, 36, 11, 27, 41, 34, 26, 29, 33, 28, 5, 21, 17, 13, 7, 32, 30, 15, 31, 39, 4]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 53\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000036 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.006460 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000094 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043777 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000364 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000125 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.051677 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [41, 14, 30, 27, 11, 7, 31, 15, 53, 0, 4, 5, 1, 36, 13, 37, 39, 40, 38, 3, 22, 29, 34, 32, 19, 33, 25, 26, 35, 28, 8, 50]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 0 to 53\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000035 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.005619 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000119 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043553 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000359 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000145 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.050564 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [39, 4, 37, 34, 26, 41, 13, 15, 35, 32, 29, 50, 30, 1, 5, 27, 14, 3, 36, 23, 40, 12, 28, 7, 11, 22, 31, 2, 19, 33, 8, 17]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 50\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000034 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.006054 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000088 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043605 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000357 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000074 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.051038 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [37, 7, 41, 22, 50, 0, 36, 23, 39, 8, 11, 35, 53, 16, 30, 14, 1, 4, 15, 40, 38, 27, 13, 6, 19, 10, 3, 25, 34, 45, 29, 48]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 0 to 53\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000040 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.005921 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000086 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043591 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000359 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000081 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.050846 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [55, 54, 44, 45, 49, 46, 51, 8, 42, 52, 43, 50, 53, 47, 0, 2, 24, 5, 15, 36, 37, 41, 1, 6, 19, 9, 35, 16, 7, 17, 22, 26]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 0 to 55\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000034 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.005599 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000090 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043636 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000369 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000118 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.050578 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [27, 34, 20, 32, 3, 26, 2, 24, 22, 51, 31, 35, 1, 25, 12, 21, 41, 38, 33, 29, 40, 13, 10, 15, 4, 30, 14, 6, 17, 11, 37, 39]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 51\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000036 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.005486 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000090 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043729 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000371 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000092 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.050599 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [31, 3, 8, 32, 34, 12, 41, 21, 27, 2, 10, 24, 45, 13, 40, 1, 35, 29, 20, 28, 15, 4, 17, 14, 26, 25, 36, 38, 23, 37, 11, 30]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 45\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000034 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.005491 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000090 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043680 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000357 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000072 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.050465 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [26, 6, 30, 32, 40, 27, 3, 7, 10, 20, 15, 24, 55, 1, 28, 35, 8, 21, 29, 31, 11, 17, 33, 9, 5, 34, 23, 19, 2, 36, 22, 37]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 55\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000032 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.005579 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000086 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043559 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000372 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000078 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.050408 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [42, 53, 50, 49, 19, 55, 45, 47, 44, 54, 46, 51, 0, 41, 24, 17, 48, 52, 16, 1, 15, 5, 40, 2, 36, 35, 3, 6, 9, 37, 14, 34]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 0 to 55\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000033 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.005751 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000088 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043583 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000354 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000072 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.050691 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [48, 24, 52, 45, 44, 42, 51, 46, 43, 53, 47, 2, 55, 49, 50, 1, 6, 36, 19, 26, 35, 41, 9, 16, 25, 5, 40, 0, 3, 37, 8, 17]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 0 to 55\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000033 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.005239 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000086 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043486 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000374 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000132 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.050063 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [50, 46, 52, 0, 43, 55, 45, 44, 37, 26, 48, 42, 53, 54, 49, 5, 51, 19, 16, 1, 22, 36, 8, 41, 7, 14, 15, 11, 38, 4, 40, 25]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 0 to 55\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000033 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.005200 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000087 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043580 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000364 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000136 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.050169 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [48, 5, 17, 55, 49, 50, 43, 53, 46, 42, 47, 52, 24, 54, 44, 51, 15, 16, 0, 19, 37, 35, 8, 1, 22, 41, 6, 2, 9, 7, 36, 27]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 0 to 55\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000033 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.005379 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000088 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043595 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000364 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000079 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.050286 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [1, 10, 6, 26, 55, 18, 2, 7, 34, 38, 28, 21, 17, 53, 24, 19, 3, 41, 36, 11, 13, 40, 33, 5, 25, 27, 20, 32, 4, 31, 12, 15]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 55\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000034 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.005289 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000087 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043688 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000358 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000075 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.050273 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [15, 9, 5, 22, 13, 25, 29, 48, 18, 19, 7, 37, 16, 6, 21, 17, 41, 39, 14, 26, 27, 1, 32, 20, 38, 4, 34, 33, 36, 35, 11, 31]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 48\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000032 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.005197 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000107 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043549 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000364 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000073 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.050126 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [48, 53, 42, 47, 25, 43, 45, 50, 54, 52, 44, 49, 46, 35, 0, 19, 51, 1, 5, 6, 41, 37, 26, 7, 8, 11, 36, 2, 3, 22, 9, 16]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 0 to 54\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000035 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.004973 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000098 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043565 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000362 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000070 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.050157 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [55, 44, 43, 24, 48, 50, 49, 45, 52, 46, 19, 2, 54, 47, 51, 53, 6, 1, 41, 5, 16, 37, 0, 9, 35, 17, 15, 7, 26, 25, 27, 8]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 0 to 55\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000035 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.005029 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000096 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043512 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000359 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000127 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.050025 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [1, 29, 37, 33, 49, 36, 34, 15, 23, 13, 25, 53, 41, 3, 5, 4, 10, 27, 14, 11, 35, 2, 7, 39, 38, 31, 28, 22, 6, 32, 12, 30]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 53\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000042 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.005203 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000095 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043577 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000357 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000069 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.050252 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [39, 41, 34, 32, 20, 8, 38, 12, 23, 15, 3, 27, 21, 0, 44, 4, 1, 22, 36, 33, 35, 31, 40, 5, 14, 19, 11, 7, 28, 37, 26, 29]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 0 to 44\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000057 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.005057 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000095 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043559 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000358 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000071 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.050047 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [3, 42, 26, 17, 16, 25, 27, 28, 33, 32, 35, 1, 10, 31, 30, 6, 34, 2, 21, 29, 12, 20, 13, 38, 43, 15, 52, 4, 11, 54, 49, 44]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 54\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000035 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.004832 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000093 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043604 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000365 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000072 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.049907 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [21, 12, 28, 6, 18, 3, 15, 13, 34, 32, 2, 10, 29, 52, 17, 1, 33, 31, 25, 35, 27, 26, 9, 4, 40, 8, 19, 38, 39, 22, 36, 23]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 52\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000034 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.004736 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000095 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043551 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000357 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000075 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.049720 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [55, 50, 1, 0, 43, 45, 49, 54, 5, 44, 19, 48, 47, 52, 35, 41, 36, 42, 46, 40, 37, 11, 51, 16, 14, 7, 3, 10, 6, 27, 23, 39]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 0 to 55\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000052 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.005280 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000097 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043612 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000357 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000069 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.050364 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [20, 34, 2, 12, 21, 31, 17, 33, 15, 3, 35, 28, 13, 29, 26, 10, 27, 1, 8, 9, 32, 6, 4, 25, 19, 24, 30, 14, 22, 23, 7, 11]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 35\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000034 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.004933 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000093 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043592 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000362 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000087 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.049905 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [31, 12, 13, 1, 28, 16, 33, 38, 14, 29, 15, 26, 19, 18, 30, 24, 49, 3, 27, 41, 32, 35, 40, 4, 2, 20, 39, 21, 37, 10, 23, 11]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 49\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000034 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.005100 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000088 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043713 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000358 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000132 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.050184 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [8, 22, 17, 21, 41, 25, 45, 27, 14, 19, 7, 32, 6, 34, 2, 18, 0, 13, 1, 5, 20, 39, 38, 37, 40, 4, 9, 23, 31, 3, 29, 36]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 0 to 45\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000034 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.005211 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000086 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043583 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000369 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000082 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.050108 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [47, 43, 45, 36, 53, 55, 42, 49, 46, 37, 51, 19, 26, 48, 5, 44, 41, 54, 1, 7, 40, 52, 11, 35, 4, 0, 14, 22, 38, 23, 8, 6]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 0 to 55\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000034 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.005326 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000088 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043689 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000359 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000077 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.050398 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [51, 44, 54, 6, 0, 48, 49, 53, 47, 24, 55, 42, 45, 46, 43, 50, 2, 35, 1, 25, 16, 26, 9, 17, 36, 10, 15, 20, 19, 34, 3, 41]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 0 to 55\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000033 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.005019 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000086 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043549 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000354 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000076 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.049855 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [1, 33, 12, 26, 28, 24, 30, 35, 27, 4, 32, 21, 13, 34, 2, 29, 7, 19, 53, 41, 40, 20, 31, 10, 25, 36, 38, 6, 23, 15, 11, 39]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 53\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000033 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.004843 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000088 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043592 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000357 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000077 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.049748 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [41, 31, 23, 38, 3, 13, 27, 15, 7, 50, 0, 1, 39, 36, 5, 40, 34, 37, 14, 29, 32, 11, 22, 12, 35, 33, 26, 2, 28, 20, 19, 30]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 0 to 50\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000046 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.004848 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000086 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043578 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000355 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000079 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.049762 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [48, 35, 43, 45, 50, 42, 53, 52, 19, 55, 44, 54, 51, 46, 47, 40, 6, 1, 3, 36, 34, 26, 7, 2, 5, 41, 38, 27, 15, 25, 9, 10]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 55\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000034 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.005006 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000087 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043567 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000356 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000067 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.049898 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [27, 37, 25, 11, 31, 7, 17, 24, 46, 3, 23, 1, 14, 32, 5, 15, 28, 26, 40, 22, 33, 4, 34, 21, 8, 13, 10, 38, 6, 29, 20, 19]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 46\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000035 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.004698 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000088 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043511 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000357 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000079 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.049511 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [19, 0, 45, 9, 15, 5, 53, 24, 8, 22, 37, 6, 7, 14, 43, 50, 39, 25, 47, 34, 1, 23, 48, 13, 36, 26, 27, 32, 42, 55, 21, 11]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 0 to 55\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000034 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.005009 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000087 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043560 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000356 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000067 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.049864 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [5, 35, 27, 9, 23, 1, 11, 8, 39, 31, 50, 37, 14, 41, 15, 22, 6, 36, 25, 4, 40, 3, 26, 38, 30, 13, 32, 29, 10, 19, 2, 34]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 50\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000033 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.004949 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000099 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043564 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000354 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000087 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.049865 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [32, 34, 33, 14, 4, 30, 27, 3, 12, 28, 13, 15, 18, 49, 21, 23, 29, 7, 41, 20, 40, 25, 26, 1, 35, 38, 2, 37, 17, 22, 11, 8]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 49\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000036 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.004950 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000087 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043601 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000355 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000073 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.049895 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [41, 40, 50, 0, 5, 23, 35, 11, 29, 34, 19, 1, 4, 39, 37, 13, 10, 3, 7, 38, 27, 2, 22, 15, 14, 53, 6, 33, 26, 8, 25, 31]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 0 to 53\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000034 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.005066 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000090 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043597 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000358 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000077 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.050019 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [48, 42, 52, 46, 43, 49, 50, 6, 24, 55, 54, 45, 51, 53, 47, 35, 5, 1, 19, 41, 8, 16, 37, 36, 3, 9, 26, 0, 15, 2, 34, 40]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 0 to 55\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000035 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.005022 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000114 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043570 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000364 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000069 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.049988 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [1, 23, 30, 0, 5, 39, 25, 32, 53, 41, 7, 35, 37, 14, 36, 27, 40, 10, 13, 4, 38, 3, 22, 15, 6, 34, 29, 26, 33, 28, 17, 50]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 0 to 53\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000036 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.004957 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000085 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043560 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000357 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000078 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.049927 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [5, 15, 19, 14, 13, 21, 0, 30, 28, 29, 45, 37, 8, 41, 7, 39, 23, 36, 4, 1, 11, 32, 40, 16, 38, 27, 34, 31, 9, 3, 35, 25]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 0 to 45\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000035 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.004693 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000095 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043676 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000356 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000077 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.049752 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [25, 27, 35, 9, 24, 47, 6, 3, 28, 38, 7, 17, 50, 18, 1, 32, 29, 34, 10, 41, 21, 31, 13, 8, 15, 20, 33, 4, 19, 30, 36, 12]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 50\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000034 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.004860 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000106 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043520 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000357 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000085 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.049804 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [37, 23, 31, 15, 22, 7, 11, 40, 38, 19, 30, 0, 53, 5, 41, 34, 4, 13, 27, 1, 39, 36, 8, 33, 32, 28, 29, 35, 3, 16, 50, 25]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 0 to 53\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000034 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.004716 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000087 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043595 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000356 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000070 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.049714 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [52, 50, 48, 6, 24, 54, 44, 55, 49, 42, 45, 43, 46, 53, 47, 26, 9, 25, 35, 16, 2, 36, 1, 10, 3, 19, 5, 41, 40, 27, 7, 8]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 55\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000034 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.004821 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000091 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043538 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000357 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000073 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.049735 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [48, 44, 45, 47, 5, 24, 9, 54, 42, 55, 50, 49, 52, 43, 53, 51, 37, 1, 16, 19, 15, 6, 8, 41, 7, 36, 0, 40, 22, 35, 17, 11]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 0 to 55\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000034 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.004873 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000088 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043572 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000353 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000075 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.049889 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [20, 15, 32, 2, 12, 3, 17, 13, 6, 28, 26, 18, 49, 33, 22, 31, 34, 35, 1, 8, 25, 9, 41, 10, 27, 19, 40, 29, 30, 38, 7, 4]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 49\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000034 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.004954 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000088 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043505 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000355 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000120 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.049897 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [1, 4, 36, 5, 13, 23, 38, 15, 33, 43, 39, 40, 27, 11, 34, 53, 19, 37, 3, 35, 14, 22, 7, 32, 29, 2, 10, 31, 12, 28, 8, 26]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 53\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000041 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.004878 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000087 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043611 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000364 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000075 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.049876 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [35, 25, 9, 20, 52, 2, 7, 15, 40, 53, 24, 1, 26, 10, 21, 17, 3, 8, 5, 41, 19, 11, 36, 13, 12, 28, 34, 27, 16, 32, 29, 38]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 53\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000032 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.004828 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000089 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043607 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000354 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000077 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.049797 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [31, 27, 21, 13, 33, 3, 28, 15, 19, 42, 34, 41, 12, 20, 25, 26, 17, 1, 38, 4, 35, 22, 29, 30, 23, 11, 8, 7, 37, 40, 14, 39]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 42\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000034 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.004633 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000088 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043628 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000354 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000068 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.049742 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [5, 14, 38, 47, 41, 22, 11, 34, 0, 50, 30, 16, 7, 23, 39, 36, 40, 1, 4, 15, 8, 19, 13, 27, 35, 32, 31, 33, 53, 3, 28, 29]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 0 to 53\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000033 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.004749 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000089 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043532 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000355 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000076 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.049615 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [20, 34, 3, 13, 33, 2, 18, 28, 10, 17, 21, 31, 32, 41, 1, 38, 15, 4, 27, 35, 40, 6, 39, 26, 29, 8, 25, 24, 23, 36, 14, 9]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 41\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000035 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.004750 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000088 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043570 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000353 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000073 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.049821 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [19, 8, 6, 17, 16, 21, 26, 48, 15, 20, 25, 7, 22, 35, 1, 2, 10, 32, 3, 5, 13, 12, 27, 29, 33, 43, 28, 31, 55, 45, 42, 18]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 55\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000034 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.004903 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000088 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043492 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000357 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000080 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.049751 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [1, 30, 26, 28, 23, 29, 32, 4, 15, 34, 13, 7, 20, 24, 53, 41, 3, 25, 31, 11, 33, 40, 38, 5, 10, 35, 39, 14, 36, 12, 8, 50]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 53\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000043 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.004987 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000089 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043620 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000353 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000070 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.049956 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [13, 38, 5, 41, 15, 34, 43, 1, 4, 36, 37, 23, 7, 11, 22, 40, 27, 14, 8, 3, 35, 12, 29, 32, 19, 28, 20, 31, 33, 6, 53, 26]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 53\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000034 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.004892 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000089 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043572 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000355 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000077 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.049816 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [15, 2, 24, 21, 9, 1, 32, 25, 18, 45, 20, 6, 35, 8, 3, 33, 12, 34, 26, 27, 10, 40, 28, 19, 31, 30, 11, 38, 13, 22, 4, 29]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 45\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000034 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.004802 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000088 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043615 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000354 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000071 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.049759 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [27, 40, 18, 3, 34, 15, 10, 11, 1, 36, 41, 33, 31, 23, 26, 4, 28, 25, 32, 20, 13, 38, 7, 35, 39, 2, 14, 6, 12, 37, 22, 19]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 41\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000032 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.004797 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000086 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043515 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000362 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000073 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.049675 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [16, 9, 22, 34, 43, 8, 13, 26, 0, 30, 15, 14, 37, 5, 6, 41, 32, 21, 38, 23, 1, 4, 20, 39, 7, 17, 25, 53, 3, 36, 27, 29]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 0 to 53\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000033 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.004681 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000088 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043572 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000356 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000072 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.049589 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [16, 5, 43, 53, 37, 22, 19, 14, 47, 36, 50, 7, 11, 8, 15, 55, 45, 48, 39, 23, 27, 42, 13, 1, 4, 9, 52, 30, 46, 44, 25, 32]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 55\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000033 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.004735 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000088 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043556 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000356 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000068 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.049612 seconds\n",
"[EmbeddingServer LOG]: INFO: Received ZMQ request from client 006b8b45, size 34 bytes\n",
"[EmbeddingServer LOG]: INFO: Request for 32 node embeddings: [1, 12, 52, 6, 34, 17, 18, 24, 43, 35, 10, 3, 21, 20, 40, 41, 36, 15, 33, 28, 31, 38, 4, 29, 7, 27, 32, 13, 25, 9, 26, 11]\n",
"[EmbeddingServer LOG]: DEBUG: Node ID range: 1 to 52\n",
"[EmbeddingServer LOG]: Time taken for text lookup: 0.000033 seconds\n",
"[EmbeddingServer LOG]: INFO: Total batch size: 32, max_batch_size: 128\n",
"[EmbeddingServer LOG]: INFO: Processing batch of size 32\n",
"[EmbeddingServer LOG]: Time taken for tokenization (batch): 0.004743 seconds\n",
"[EmbeddingServer LOG]: Batch size: 32, Sequence length: 256\n",
"[EmbeddingServer LOG]: Time taken for transfer to device (batch): 0.000087 seconds\n",
"[EmbeddingServer LOG]: Time taken for embedding (batch): 0.043615 seconds\n",
"[EmbeddingServer LOG]: Time taken for mean pooling (batch): 0.000354 seconds\n",
"[EmbeddingServer LOG]: INFO: Serialize time: 0.000074 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ E2E time: 0.049773 seconds\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n",
"[EmbeddingServer LOG]: INFO: ZMQ socket timeout, continuing to listen\n"
]
}
],
"source": [
"from leann.api import LeannBuilder, LeannSearcher\n",
"# NOTE(review): presumably imported only for its side effect of registering the\n",
"# 'diskann' backend (the name is never referenced below); confirm before removing.\n",
"import leann_backend_diskann\n",
"\n",
"# Single place for the index location shared by the build and search steps.\n",
"INDEX_PATH = \"knowledge.leann\"\n",
"\n",
"# Tiny demo corpus: one entry per indexed chunk, added in this order.\n",
"SAMPLE_TEXTS = [\n",
"    \"Python is a powerful programming language\",\n",
"    \"Machine learning transforms industries\",\n",
"    \"Neural networks process complex data\",\n",
"    \"Java is a powerful programming language\",\n",
"    \"C++ is a powerful programming language\",\n",
"    \"C# is a powerful programming language\",\n",
"]\n",
"\n",
"# Step 1: build the index with the DiskANN backend (no embeddings stored!)\n",
"builder = LeannBuilder(backend_name=\"diskann\")\n",
"for sample_text in SAMPLE_TEXTS:\n",
"    builder.add_text(sample_text)\n",
"builder.build_index(INDEX_PATH)\n",
"\n",
"# Step 2: search the index, recomputing embeddings at query time\n",
"searcher = LeannSearcher(INDEX_PATH)\n",
"# NOTE(review): 'recompute_beighbor_embeddings' looks like a misspelling of\n",
"# 'neighbor'; it is kept verbatim because it has to match the keyword the leann\n",
"# API accepts. Confirm against the library before renaming it.\n",
"results = searcher.search(\n",
"    \"C++ programming languages\",\n",
"    top_k=2,\n",
"    recompute_beighbor_embeddings=True,\n",
")\n",
"\n",
"# Show the score and the matched text for each returned hit.\n",
"for result in results:\n",
"    print(f\"Score: {result['score']:.3f} - {result['text']}\")"
]
}
],
"metadata": {
"kernelspec": {
"display_name": ".venv",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.11.11"
}
},
"nbformat": 4,
"nbformat_minor": 2
}