From a513d830c06ead1033057cff08466bf5db900af1 Mon Sep 17 00:00:00 2001 From: Arun Isaac Date: Tue, 11 Oct 2022 12:04:48 +0530 Subject: Correct xapian scalability figures for SQL database access. Earlier, the time estimates included the time taken to retrieve the documents from the SQL database. This is now removed giving a clearer picture of xapian scalability. --- topics/xapian-index-building-scalability.svg | 148 +++++++++++++-------------- topics/xapian-scalability.gmi | 21 ++-- 2 files changed, 81 insertions(+), 88 deletions(-) (limited to 'topics') diff --git a/topics/xapian-index-building-scalability.svg b/topics/xapian-index-building-scalability.svg index 5452117..9d525d4 100644 --- a/topics/xapian-index-building-scalability.svg +++ b/topics/xapian-index-building-scalability.svg @@ -46,12 +46,12 @@ - + - - 0.5 + + 0.44 @@ -59,12 +59,12 @@ - + - - 0.51 + + 0.45 @@ -72,12 +72,12 @@ - + - - 0.52 + + 0.46 @@ -85,12 +85,12 @@ - + - - 0.53 + + 0.47 @@ -98,12 +98,12 @@ - + - - 0.54 + + 0.48 @@ -111,12 +111,12 @@ - + - - 0.55 + + 0.49 @@ -124,12 +124,12 @@ - + - - 0.56 + + 0.5 @@ -137,12 +137,12 @@ - + - - 0.57 + + 0.51 @@ -150,12 +150,12 @@ - + - - 0.58 + + 0.52 @@ -163,12 +163,12 @@ - + - - 0.59 + + 0.53 @@ -176,12 +176,12 @@ - + - - 0.6 + + 0.54 @@ -189,53 +189,53 @@ - + - - 10000 + + 10k - - + - - 100000 + + 100k - - + - - 1x106 + + 1M - @@ -245,21 +245,16 @@ - 1x107 + 10M - - - - Time (in ms) - - + - - Index size (in number of documents) + + Xapian index size (in number of documents) @@ -268,17 +263,16 @@ - - - - - - - - - - + + + + + + + + + @@ -286,10 +280,10 @@ - + - - Time per document to build an index of various sizes + + Time (in ms) per document to build a Xapian index of various sizes diff --git a/topics/xapian-scalability.gmi b/topics/xapian-scalability.gmi index 21eb1d4..cfc4e46 100644 --- a/topics/xapian-scalability.gmi +++ b/topics/xapian-scalability.gmi @@ -2,17 +2,16 @@ As the index grows larger, Xapian takes longer to insert new documents. Shown below is the time (in seconds) taken to build indices of various sizes (in number of documents). -* 10k: 5.0 -* 20k: 10.7 -* 40k: 21.1 -* 80k: 42.3 -* 160k: 87.2 -* 320k: 176.4 -* 640k: 353.9 -* 1280k: 727.5 -* 2560k: 1494.3 -* 5120k: 3037.9 +* 10k: 4.45 +* 20k: 9.48 +* 40k: 20.40 +* 80k: 41.70 +* 160k: 81.63 +* 320k: 159.88 +* 640k: 318.84 +* 1280k: 651.47 +* 2560k: 1357.73 -Notice that it takes 607x, not 512x, more time to build the 5120k index than it takes to build the 10k index. In terms of time, the 10k index takes on average 0.5 ms per document while the 5120k index takes on average 0.59 ms per document. We show this graphically below. +Notice that it takes 305x, not 256x, more time to build the 2560k index than it takes to build the 10k index. In terms of time, the 10k index takes on average 0.45 ms per document while the 2560k index takes on average 0.53 ms per document. We show this graphically below. => xapian-index-building-scalability.svg -- cgit v1.2.3