[Tracker] Updating our FTS Version



Hi all,

Jamie, this week we realised that QDBM is really taking a lot of time and is now the most prominent thing to fix to get some speed increase in all areas. Coupled with the fact that we will be trying to move to vstore shortly and FTS right after that, I wanted to have a peek and see what is needed to get FTS going.

First I thought I would check out the code you started and compare it to SQLite's FTS3 version to see what changed. I noticed they have made quite a few changes, but mostly whitespace updates.

I have included in this email a patch with those (mostly whitespace) changes, which we could apply to our version so you can see the real differences which need more care and attention. Those real differences are attached in the two extra patches, which diff the hash file and the fts file.

Are you happy for me to commit the update patch?

Does it look like it is worth updating our FTS support from the upstream changes in SQLite?

--
Regards,
Martyn
--- ../../../sqlite/ext/fts3/fts3.c     2009-03-05 04:20:32.000000000 +0000
+++ tracker-fts.c       2009-03-05 16:48:47.000000000 +0000
@@ -272,29 +272,25 @@
 ** into a single segment.
 */
 
-#if !defined(SQLITE_CORE) || defined(SQLITE_ENABLE_FTS3)
-
-#if defined(SQLITE_ENABLE_FTS3) && !defined(SQLITE_CORE)
-# define SQLITE_CORE 1
-#endif
-
 #include <assert.h>
 #include <stdlib.h>
 #include <stdio.h>
 #include <string.h>
 #include <ctype.h>
+#include <sqlite3ext.h>
 
-#include "fts3.h"
-#include "fts3_expr.h"
-#include "fts3_hash.h"
-#include "fts3_tokenizer.h"
-#ifndef SQLITE_CORE 
-# include "sqlite3ext.h"
-  SQLITE_EXTENSION_INIT1
-#endif
+#define TRACKER_ENABLE_INTERNALS
+#include <libtracker-common/tracker-common.h>
+
+
+#include <libtracker-db/tracker-db-manager.h>
 
+#include "tracker-fts.h"
+#include "tracker-fts-hash.h"
 
-/* TODO(shess) MAN, this thing needs some refactoring.  At minimum, it
+SQLITE_EXTENSION_INIT1
+
+/* TODO(shess) MAN, this thing needs some refactoring. At minimum, it
 ** would be nice to order the file better, perhaps something along the
 ** lines of:
 **
@@ -313,6 +309,109 @@
 # define FTSTRACE(A)
 #endif
 
+static int default_column = 0;
+
+/* Functions from Tracker */
+static TrackerDBResultSet *
+db_metadata_get (TrackerDBInterface *iface, 
+                const gchar        *id, 
+                const gchar        *key)
+{
+       TrackerField *def;
+       const gchar  *proc = NULL;
+
+       g_return_val_if_fail (TRACKER_IS_DB_INTERFACE (iface), NULL);
+       g_return_val_if_fail (id, NULL);
+       g_return_val_if_fail (key, NULL);
+
+       def = tracker_ontology_get_field_by_name (key);
+       
+       if (!def) {
+               g_warning ("Metadata not found for id:'%s' and type:'%s'", id, key);
+               return NULL;
+       }
+
+       switch (tracker_field_get_data_type (def)) {
+       case TRACKER_FIELD_TYPE_INDEX:
+       case TRACKER_FIELD_TYPE_STRING:
+       case TRACKER_FIELD_TYPE_DOUBLE:
+               proc = "GetMetadata";
+               break;
+
+       case TRACKER_FIELD_TYPE_INTEGER:
+       case TRACKER_FIELD_TYPE_DATE:
+               proc = "GetMetadataNumeric";
+               break;
+
+       case TRACKER_FIELD_TYPE_FULLTEXT:
+               proc = "GetContents";
+               break;
+
+       case TRACKER_FIELD_TYPE_KEYWORD:
+               proc = "GetMetadataKeyword";
+               break;
+               
+       default:
+               g_warning ("Metadata could not be retrieved as type:%d is not supported", 
+                          tracker_field_get_data_type (def)); 
+               return NULL;
+       }
+
+       return tracker_db_interface_execute_procedure (iface,
+                                                      NULL, 
+                                                      proc, 
+                                                      id, 
+                                                      tracker_field_get_id (def),
+                                                      NULL);
+}
+
+static gchar *
+db_get_text (const char     *service,
+            const char     *key,    
+            const char     *id) 
+{
+       TrackerDBInterface *iface;
+       gchar              *contents = NULL;
+       TrackerDBResultSet *result_set;
+       
+       if (strcmp (key, "File:Contents") == 0) {
+               iface = tracker_db_manager_get_db_interface_by_type (service,
+                                                                    TRACKER_DB_CONTENT_TYPE_CONTENTS);
+       } else {
+               iface = tracker_db_manager_get_db_interface_by_type (service,
+                                                                    TRACKER_DB_CONTENT_TYPE_METADATA);
+       }
+
+       result_set = db_metadata_get (iface, id, key);
+
+       if (result_set) {
+               tracker_db_result_set_get (result_set, 0, &contents, -1);
+               g_object_unref (result_set);
+       }
+
+       return contents;
+}
+
+static inline int
+get_metadata_weight (int id)
+{
+  if (id == 0) return 1;
+
+  TrackerField *field = tracker_ontology_get_field_by_id (id);
+  
+  if (!field) return 1;
+
+  return tracker_field_get_weight (field);
+
+}
+
+
+
+/*
+ * ** Default span for NEAR operators.
+ * */
+#define SQLITE_FTS3_DEFAULT_NEAR_PARAM 10
+
 /* It is not safe to call isspace(), tolower(), or isalnum() on
 ** hi-bit-set characters.  This is the same solution used in the
 ** tokenizer.
@@ -332,9 +431,18 @@
   return (c&0x80)==0 ? isalnum(c) : 0;
 }
 
+int sqlite3_extension_init(
+  sqlite3 *db,
+  char **pzErrMsg,
+  const sqlite3_api_routines *pApi
+);
+
+
 typedef enum DocListType {
+
   DL_DOCIDS,              /* docids only */
   DL_POSITIONS,           /* docids + positions */
+  DL_POSITIONS_RANK,      /* docids + catid + rank + positions */
   DL_POSITIONS_OFFSETS    /* docids + positions + offsets */
 } DocListType;
 
@@ -588,6 +696,12 @@
   int nData;
 
   sqlite_int64 iDocid;
+  
+#ifdef STORE_CATEGORY
+  int Catid;
+#endif
+  
+  
   int nElement;
 } DLReader;
 
@@ -599,6 +713,14 @@
   assert( !dlrAtEnd(pReader) );
   return pReader->iDocid;
 }
+
+#ifdef STORE_CATEGORY
+static int dlrCatid(DLReader *pReader){
+  //assert( !dlrAtEnd(pReader) );
+  return pReader->Catid;
+}
+#endif
+
 static const char *dlrDocData(DLReader *pReader){
   assert( !dlrAtEnd(pReader) );
   return pReader->pData;
@@ -618,12 +740,24 @@
 static const char *dlrPosData(DLReader *pReader){
   sqlite_int64 iDummy;
   int n = fts3GetVarint(pReader->pData, &iDummy);
+  
+#ifdef STORE_CATEGORY    
+  int Catid;
+  n += fts3GetVarint32(pReader->pData+n, &Catid);
+#endif
+  
   assert( !dlrAtEnd(pReader) );
   return pReader->pData+n;
 }
 static int dlrPosDataLen(DLReader *pReader){
   sqlite_int64 iDummy;
   int n = fts3GetVarint(pReader->pData, &iDummy);
+  
+#ifdef STORE_CATEGORY    
+  int Catid;
+  n += fts3GetVarint32(pReader->pData+n, &Catid);
+#endif
+  
   assert( !dlrAtEnd(pReader) );
   return pReader->nElement-n;
 }
@@ -638,8 +772,16 @@
   /* If there is more data, read the next doclist element. */
   if( pReader->nData!=0 ){
     sqlite_int64 iDocidDelta;
+    
     int iDummy, n = fts3GetVarint(pReader->pData, &iDocidDelta);
     pReader->iDocid += iDocidDelta;
+
+#ifdef STORE_CATEGORY    
+    int Catid;
+    n += fts3GetVarint32(pReader->pData+n, &Catid);
+    pReader->Catid = Catid;
+#endif
+    
     if( pReader->iType>=DL_POSITIONS ){
       assert( n<pReader->nData );
       while( 1 ){
@@ -669,6 +811,10 @@
   pReader->nElement = 0;
   pReader->iDocid = 0;
 
+#ifdef STORE_CATEGORY    
+  pReader->Catid = 0;
+#endif
+
   /* Load the first element's data.  There must be a first element. */
   dlrStep(pReader);
 }
@@ -691,6 +837,12 @@
     sqlite_int64 iDocidDelta;
     int n = fts3GetVarint(pData, &iDocidDelta);
     iPrevDocid += iDocidDelta;
+    
+#ifdef STORE_CATEGORY    
+    int Catid;
+    n += fts3GetVarint32(pData+n, &Catid);
+#endif
+
     if( iType>DL_DOCIDS ){
       int iDummy;
       while( 1 ){
@@ -797,6 +949,29 @@
   dlwAppend(pWriter, dlrDocData(pReader), dlrDocDataBytes(pReader),
             dlrDocid(pReader), dlrDocid(pReader));
 }
+
+
+#ifdef STORE_CATEGORY    
+static void dlwAdd(DLWriter *pWriter, sqlite_int64 iDocid, int Catid){
+  char c[VARINT_MAX];
+  int n = fts3PutVarint(c, iDocid-pWriter->iPrevDocid);
+
+  /* Docids must ascend. */
+  assert( !pWriter->has_iPrevDocid || iDocid>pWriter->iPrevDocid );
+  assert( pWriter->iType==DL_DOCIDS );
+
+  dataBufferAppend(pWriter->b, c, n);
+  pWriter->iPrevDocid = iDocid;
+  
+  n = fts3PutVarint(c, Catid);
+  dataBufferAppend(pWriter->b, c, n);
+  
+#ifndef NDEBUG
+  pWriter->has_iPrevDocid = 1;
+#endif
+}
+#else
+
 static void dlwAdd(DLWriter *pWriter, sqlite_int64 iDocid){
   char c[VARINT_MAX];
   int n = fts3PutVarint(c, iDocid-pWriter->iPrevDocid);
@@ -812,6 +987,8 @@
 #endif
 }
 
+#endif
+
 /*******************************************************************/
 /* PLReader is used to read data from a document's position list.  As
 ** the caller steps through the list, data is cached so that varints
@@ -908,6 +1085,18 @@
   SCRAMBLE(pReader);
 }
 
+
+/* because plrDestroy should only be called when plrAtEnd is true, 
+we create a new convenience function to do this in one call */
+static void plrEndAndDestroy (PLReader *pReader){
+
+       while (!plrAtEnd(pReader)) {
+               plrStep (pReader);
+       }
+       
+       plrDestroy (pReader);
+}
+
 /*******************************************************************/
 /* PLWriter is used in constructing a document's position list.  As a
 ** convenience, if iType is DL_DOCIDS, PLWriter becomes a no-op.
@@ -980,6 +1169,37 @@
   plwAdd(pWriter, plrColumn(pReader), plrPosition(pReader),
          plrStartOffset(pReader), plrEndOffset(pReader));
 }
+
+
+#ifdef STORE_CATEGORY
+static void plwInit(PLWriter *pWriter, DLWriter *dlw, sqlite_int64 iDocid, int Catid){
+  char c[VARINT_MAX];
+  int n;
+
+  pWriter->dlw = dlw;
+
+  /* Docids must ascend. */
+  assert( !pWriter->dlw->has_iPrevDocid || iDocid>pWriter->dlw->iPrevDocid );
+  n = fts3PutVarint(c, iDocid-pWriter->dlw->iPrevDocid);
+  dataBufferAppend(pWriter->dlw->b, c, n);
+  pWriter->dlw->iPrevDocid = iDocid;
+  
+  n = fts3PutVarint(c, Catid);
+  dataBufferAppend(pWriter->dlw->b, c, n);
+    
+#ifndef NDEBUG
+  pWriter->dlw->has_iPrevDocid = 1;
+#endif
+
+  /* [tracker] - the default column (ID = 0) should be that of File:Contents for Files db and Email:Body for email db
+  that way we avoid writing a column ID and consuming more bytes for the most voluminous cases */
+  pWriter->iColumn = default_column;
+  pWriter->iPos = 0;
+  pWriter->iOffset = 0;
+}
+
+#else
+
 static void plwInit(PLWriter *pWriter, DLWriter *dlw, sqlite_int64 iDocid){
   char c[VARINT_MAX];
   int n;
@@ -991,6 +1211,7 @@
   n = fts3PutVarint(c, iDocid-pWriter->dlw->iPrevDocid);
   dataBufferAppend(pWriter->dlw->b, c, n);
   pWriter->dlw->iPrevDocid = iDocid;
+    
 #ifndef NDEBUG
   pWriter->dlw->has_iPrevDocid = 1;
 #endif
@@ -999,7 +1220,13 @@
   pWriter->iPos = 0;
   pWriter->iOffset = 0;
 }
+
+#endif
+
+
+
 /* TODO(shess) Should plwDestroy() also terminate the doclist?  But
+
 ** then plwDestroy() would no longer be just a destructor, it would
 ** also be doing work, which isn't consistent with the overall idiom.
 ** Another option would be for plwAdd() to always append any necessary
@@ -1055,15 +1282,36 @@
     dataBufferAppend(b, pCollector->b.pData, pCollector->b.nData);
   }
 }
+
+static void dlcAddPos(DLCollector *pCollector, int iColumn, int iPos,
+                      int iStartOffset, int iEndOffset){
+  plwAdd(&pCollector->plw, iColumn, iPos, iStartOffset, iEndOffset);
+}
+
+
+#ifdef STORE_CATEGORY
+static void dlcNext(DLCollector *pCollector, sqlite_int64 iDocid, int Catid){
+  plwTerminate(&pCollector->plw);
+  plwDestroy(&pCollector->plw);
+  plwInit(&pCollector->plw, &pCollector->dlw, iDocid, Catid);
+}
+
+
+static DLCollector *dlcNew(sqlite_int64 iDocid, DocListType iType, int Catid){
+  DLCollector *pCollector = sqlite3_malloc(sizeof(DLCollector));
+  dataBufferInit(&pCollector->b, 0);
+  dlwInit(&pCollector->dlw, iType, &pCollector->b);
+  plwInit(&pCollector->plw, &pCollector->dlw, iDocid, Catid);
+  return pCollector;
+}
+
+#else
+
 static void dlcNext(DLCollector *pCollector, sqlite_int64 iDocid){
   plwTerminate(&pCollector->plw);
   plwDestroy(&pCollector->plw);
   plwInit(&pCollector->plw, &pCollector->dlw, iDocid);
 }
-static void dlcAddPos(DLCollector *pCollector, int iColumn, int iPos,
-                      int iStartOffset, int iEndOffset){
-  plwAdd(&pCollector->plw, iColumn, iPos, iStartOffset, iEndOffset);
-}
 
 static DLCollector *dlcNew(sqlite_int64 iDocid, DocListType iType){
   DLCollector *pCollector = sqlite3_malloc(sizeof(DLCollector));
@@ -1072,6 +1320,9 @@
   plwInit(&pCollector->plw, &pCollector->dlw, iDocid);
   return pCollector;
 }
+
+#endif
+
 static void dlcDelete(DLCollector *pCollector){
   plwDestroy(&pCollector->plw);
   dlwDestroy(&pCollector->dlw);
@@ -1110,8 +1361,14 @@
 
     while( !plrAtEnd(&plReader) ){
       if( iColumn==-1 || plrColumn(&plReader)==iColumn ){
+
         if( !match ){
+        
+#ifdef STORE_CATEGORY        
+          plwInit(&plWriter, &dlWriter, dlrDocid(&dlReader), dlrCatid(&dlReader));
+#else
           plwInit(&plWriter, &dlWriter, dlrDocid(&dlReader));
+#endif
           match = 1;
         }
         plwAdd(&plWriter, plrColumn(&plReader), plrPosition(&plReader),
@@ -1300,7 +1557,13 @@
 
   plrInit(&left, pLeft);
   plrInit(&right, pRight);
+  
+#ifdef STORE_CATEGORY        
+  plwInit(&writer, pOut, dlrDocid(pLeft), dlrCatid(pLeft));
+#else
   plwInit(&writer, pOut, dlrDocid(pLeft));
+#endif
+
 
   while( !plrAtEnd(&left) || !plrAtEnd(&right) ){
     int c = posListCmp(&left, &right);
@@ -1393,12 +1656,14 @@
 ** If boolean argument isSaveLeft is true, then positionids are copied
 ** from pLeft instead of pRight. In the example above, the positions "5"
 ** and "20" would be added instead of "6" and "21".
+** If isSaveLeft = 2 then both positions are added, 3 or above and positions are appended to left
 */
 static void posListPhraseMerge(
   DLReader *pLeft, 
   DLReader *pRight,
   int nNear,
   int isSaveLeft,
+  int term_num,
   DLWriter *pOut
 ){
   PLReader left, right;
@@ -1410,6 +1675,8 @@
 
   plrInit(&left, pLeft);
   plrInit(&right, pRight);
+  
+
 
   while( !plrAtEnd(&left) && !plrAtEnd(&right) ){
     if( plrColumn(&left)<plrColumn(&right) ){
@@ -1420,15 +1687,32 @@
       plrStep(&right);
     }else{
       if( (plrPosition(&right)-plrPosition(&left))<=(nNear+1) ){
+
         if( !match ){
-          plwInit(&writer, pOut, dlrDocid(pLeft));
+        
+#ifdef STORE_CATEGORY        
+         plwInit(&writer, pOut, dlrDocid(pLeft), dlrCatid(pLeft));
+#else
+         plwInit(&writer, pOut, dlrDocid(pLeft));
+#endif
           match = 1;
         }
-        if( !isSaveLeft ){
+        if( isSaveLeft == 0 ){
           plwAdd(&writer, plrColumn(&right), plrPosition(&right), 0, 0);
-        }else{
+        }else if( isSaveLeft == 1 ){
           plwAdd(&writer, plrColumn(&left), plrPosition(&left), 0, 0);
+        } else {
+          
+          int iPosRight  = plrPosition(&right);
+          int iColumnRight = plrColumn(&right);
+          int i;
+          
+          for (i=term_num; i>=0; i--) {
+            plwAdd(&writer, iColumnRight, iPosRight - i, 0, 0);
+          }
+          
         }
+        
         plrStep(&right);
       }else{
         plrStep(&left);
@@ -1499,10 +1783,11 @@
 static void docListPhraseMerge(
   const char *pLeft, int nLeft,
   const char *pRight, int nRight,
-  int nNear,            /* 0 for a phrase merge, non-zero for a NEAR merge */
-  int nPhrase,          /* Number of tokens in left+right operands to NEAR */
-  DocListType iType,    /* Type of doclist to write to pOut */
-  DataBuffer *pOut      /* Write the combined doclist here */
+  int nNear,           /* 0 for a phrase merge, non-zero for a NEAR merge */
+  int nPhrase,         /* Number of tokens in left+right operands to NEAR */
+  DocListType iType,   /* Type of doclist to write to pOut */
+  DataBuffer *pOut,    /* Write the combined doclist here */
+  int term             /* (tracker) term number */
 ){
   DLReader left, right;
   DLWriter writer;
@@ -1514,7 +1799,6 @@
   dlrInit(&left, DL_POSITIONS, pLeft, nLeft);
   dlrInit(&right, DL_POSITIONS, pRight, nRight);
   dlwInit(&writer, iType, pOut);
-
   while( !dlrAtEnd(&left) && !dlrAtEnd(&right) ){
     if( dlrDocid(&left)<dlrDocid(&right) ){
       dlrStep(&left);
@@ -1522,34 +1806,40 @@
       dlrStep(&right);
     }else{
       if( nNear==0 ){
-        posListPhraseMerge(&left, &right, 0, 0, &writer);
+        posListPhraseMerge(&left, &right, 0, 2, term,  &writer);
       }else{
-        /* This case occurs when two terms (simple terms or phrases) are
-         * connected by a NEAR operator, span (nNear+1). i.e.
-         *
-         *     '"terrible company" NEAR widget'
-         */
-        DataBuffer one = {0, 0, 0};
-        DataBuffer two = {0, 0, 0};
-
-        DLWriter dlwriter2;
-        DLReader dr1 = {0, 0, 0, 0, 0}; 
-        DLReader dr2 = {0, 0, 0, 0, 0};
-
-        dlwInit(&dlwriter2, iType, &one);
-        posListPhraseMerge(&right, &left, nNear-3+nPhrase, 1, &dlwriter2);
-        dlwInit(&dlwriter2, iType, &two);
-        posListPhraseMerge(&left, &right, nNear-1, 0, &dlwriter2);
-
-        if( one.nData) dlrInit(&dr1, iType, one.pData, one.nData);
-        if( two.nData) dlrInit(&dr2, iType, two.pData, two.nData);
-
-        if( !dlrAtEnd(&dr1) || !dlrAtEnd(&dr2) ){
-          PLReader pr1 = {0};
-          PLReader pr2 = {0};
+       /* This case occurs when two terms (simple terms or phrases) are
+        * connected by a NEAR operator, span (nNear+1). i.e.
+        *
+        *     '"terrible company" NEAR widget'
+        */
+       DataBuffer one = {0, 0, 0};
+       DataBuffer two = {0, 0, 0};
+
+       DLWriter dlwriter2;
+       DLReader dr1 = {0, 0, 0, 0, 0};
+       DLReader dr2 = {0, 0, 0, 0, 0};
+
+       dlwInit(&dlwriter2, iType, &one);
+       posListPhraseMerge(&right, &left, nNear-3+nPhrase, 1, term, &dlwriter2);
+       dlwInit(&dlwriter2, iType, &two);
+       posListPhraseMerge(&left, &right, nNear-1, 0, term, &dlwriter2);
+
+       if( one.nData) dlrInit(&dr1, iType, one.pData, one.nData);
+       if( two.nData) dlrInit(&dr2, iType, two.pData, two.nData);
+
+       if( !dlrAtEnd(&dr1) || !dlrAtEnd(&dr2) ){
+         PLReader pr1 = {0};
+         PLReader pr2 = {0};
 
           PLWriter plwriter;
+          
+            
+#ifdef STORE_CATEGORY        
+          plwInit(&plwriter, &writer, dlrDocid(dlrAtEnd(&dr1)?&dr2:&dr1), dlrCatid(dlrAtEnd(&dr1)?&dr2:&dr1));
+#else
           plwInit(&plwriter, &writer, dlrDocid(dlrAtEnd(&dr1)?&dr2:&dr1));
+#endif
 
           if( one.nData ) plrInit(&pr1, &dr1);
           if( two.nData ) plrInit(&pr2, &dr2);
@@ -1590,6 +1880,42 @@
 ** Write the intersection of these two doclists into pOut as a
 ** DL_DOCIDS doclist.
 */
+#ifdef STORE_CATEGORY
+static void docListAndMerge(
+  const char *pLeft, int nLeft,
+  const char *pRight, int nRight,
+  DataBuffer *pOut     /* Write the combined doclist here */
+){
+  DLReader left, right;
+  DLWriter writer;
+
+  if( nLeft==0 || nRight==0 ) return;
+
+
+  dlrInit(&left, DL_POSITIONS, pLeft, nLeft);
+  dlrInit(&right, DL_POSITIONS, pRight, nRight);
+  dlwInit(&writer, DL_POSITIONS, pOut);
+  
+ 
+
+  while( !dlrAtEnd(&left) && !dlrAtEnd(&right) ){
+    if(dlrDocid(&left)<dlrDocid(&right) ){
+      dlrStep(&left);
+    }else if( dlrDocid(&right)<dlrDocid(&left) ){
+      dlrStep(&right);
+    }else{
+      posListUnion(&left, &right, &writer);
+      dlrStep(&left);
+      dlrStep(&right);
+    }
+  }
+
+  dlrDestroy(&left);
+  dlrDestroy(&right);
+  dlwDestroy(&writer);
+}  
+  
+#else
 static void docListAndMerge(
   const char *pLeft, int nLeft,
   const char *pRight, int nRight,
@@ -1620,11 +1946,69 @@
   dlrDestroy(&right);
   dlwDestroy(&writer);
 }
+#endif
 
 /* We have two DL_DOCIDS doclists:  pLeft and pRight.
 ** Write the union of these two doclists into pOut as a
 ** DL_DOCIDS doclist.
 */
+
+#ifdef STORE_CATEGORY        
+static void docListOrMerge(
+  const char *pLeft, int nLeft,
+  const char *pRight, int nRight,
+  DataBuffer *pOut     /* Write the combined doclist here */
+){
+  DLReader left, right;
+  DLWriter writer;
+
+  if( nLeft==0 ){
+    if( nRight!=0 ) dataBufferAppend(pOut, pRight, nRight);
+    return;
+  }
+  if( nRight==0 ){
+    dataBufferAppend(pOut, pLeft, nLeft);
+    return;
+  }
+
+  dlrInit(&left, DL_POSITIONS, pLeft, nLeft);
+  dlrInit(&right, DL_POSITIONS, pRight, nRight);
+  dlwInit(&writer, DL_POSITIONS, pOut);
+
+  while( !dlrAtEnd(&left) || !dlrAtEnd(&right) ){
+    if( dlrAtEnd(&right) ){
+      dlwCopy (&writer, &left);
+      dlrStep(&left);
+    }else if( dlrAtEnd(&left) ){
+      
+      dlwCopy (&writer, &right);
+      dlrStep(&right);
+    }else if( dlrDocid(&left)<dlrDocid(&right) ){
+
+      dlwCopy (&writer, &left);
+
+      dlrStep(&left);
+    }else if( dlrDocid(&right)<dlrDocid(&left) ){
+
+      dlwCopy (&writer, &right);
+
+      dlrStep(&right);
+    }else{
+
+      posListUnion(&left, &right, &writer);
+
+      dlrStep(&left);
+      dlrStep(&right);
+    }
+  }
+
+  dlrDestroy(&left);
+  dlrDestroy(&right);
+  dlwDestroy(&writer);
+}
+
+#else
+
 static void docListOrMerge(
   const char *pLeft, int nLeft,
   const char *pRight, int nRight,
@@ -1649,18 +2033,32 @@
   while( !dlrAtEnd(&left) || !dlrAtEnd(&right) ){
     if( dlrAtEnd(&right) ){
       dlwAdd(&writer, dlrDocid(&left));
+      
+
       dlrStep(&left);
     }else if( dlrAtEnd(&left) ){
+      
       dlwAdd(&writer, dlrDocid(&right));
+      
       dlrStep(&right);
     }else if( dlrDocid(&left)<dlrDocid(&right) ){
+
       dlwAdd(&writer, dlrDocid(&left));
+
+
       dlrStep(&left);
     }else if( dlrDocid(&right)<dlrDocid(&left) ){
+
       dlwAdd(&writer, dlrDocid(&right));
+
+      
+
       dlrStep(&right);
     }else{
+
       dlwAdd(&writer, dlrDocid(&left));
+
+
       dlrStep(&left);
       dlrStep(&right);
     }
@@ -1670,11 +2068,46 @@
   dlrDestroy(&right);
   dlwDestroy(&writer);
 }
+#endif
 
 /* We have two DL_DOCIDS doclists:  pLeft and pRight.
 ** Write into pOut as DL_DOCIDS doclist containing all documents that
 ** occur in pLeft but not in pRight.
 */
+#ifdef STORE_CATEGORY   
+static void docListExceptMerge(
+  const char *pLeft, int nLeft,
+  const char *pRight, int nRight,
+  DataBuffer *pOut     /* Write the combined doclist here */
+){
+  DLReader left, right;
+  DLWriter writer;
+
+  if( nLeft==0 ) return;
+  if( nRight==0 ){
+    dataBufferAppend(pOut, pLeft, nLeft);
+    return;
+  }
+
+  dlrInit(&left, DL_POSITIONS, pLeft, nLeft);
+  dlrInit(&right, DL_POSITIONS, pRight, nRight);
+  dlwInit(&writer, DL_POSITIONS, pOut);
+
+  while( !dlrAtEnd(&left) ){
+    while( !dlrAtEnd(&right) && dlrDocid(&right)<dlrDocid(&left) ){
+      dlrStep(&right);
+    }
+    if( dlrAtEnd(&right) || dlrDocid(&left)<dlrDocid(&right) ){
+      dlwCopy (&writer, &left);
+    }
+    dlrStep(&left);
+  }
+
+  dlrDestroy(&left);
+  dlrDestroy(&right);
+  dlwDestroy(&writer);
+}
+#else
 static void docListExceptMerge(
   const char *pLeft, int nLeft,
   const char *pRight, int nRight,
@@ -1698,6 +2131,7 @@
       dlrStep(&right);
     }
     if( dlrAtEnd(&right) || dlrDocid(&left)<dlrDocid(&right) ){
+      
       dlwAdd(&writer, dlrDocid(&left));
     }
     dlrStep(&left);
@@ -1707,6 +2141,7 @@
   dlrDestroy(&right);
   dlwDestroy(&writer);
 }
+#endif
 
 static char *string_dup_n(const char *s, int n){
   char *str = sqlite3_malloc(n + 1);
@@ -1784,6 +2219,90 @@
 /* Forward reference */
 typedef struct fulltext_vtab fulltext_vtab;
 
+/* A single term in a query is represented by an instances of
+** the following structure. Each word which may match against
+** document content is a term. Operators, like NEAR or OR, are
+** not terms. Query terms are organized as a flat list stored
+** in the Query.pTerms array.
+**
+** If the QueryTerm.nPhrase variable is non-zero, then the QueryTerm
+** is the first in a contiguous string of terms that are either part
+** of the same phrase, or connected by the NEAR operator.
+**
+** If the QueryTerm.nNear variable is non-zero, then the token is followed
+** by a NEAR operator with span set to (nNear-1). For example, the
+** following query:
+**
+** The QueryTerm.iPhrase variable stores the index of the token within
+** its phrase, indexed starting at 1, or 1 if the token is not part
+** of any phrase.
+**
+** For example, the data structure used to represent the following query:
+**
+**     ... MATCH 'sqlite NEAR/5 google NEAR/2 "search engine"'
+**
+** is:
+**
+**     {nPhrase=4, iPhrase=1, nNear=6, pTerm="sqlite"},
+**     {nPhrase=0, iPhrase=1, nNear=3, pTerm="google"},
+**     {nPhrase=0, iPhrase=1, nNear=0, pTerm="search"},
+**     {nPhrase=0, iPhrase=2, nNear=0, pTerm="engine"},
+**
+** compiling the FTS3 syntax to Query structures is done by the parseQuery()
+** function.
+*/
+typedef struct QueryTerm {
+  short int nPhrase; /* How many following terms are part of the same phrase */
+  short int iPhrase; /* This is the i-th term of a phrase. */
+  short int iColumn; /* Column of the index that must match this term */
+  signed char nNear; /* term followed by a NEAR operator with span=(nNear-1) */
+  signed char isOr;  /* this term is preceded by "OR" */
+  signed char isNot; /* this term is preceded by "-" */
+  signed char isPrefix; /* this term is followed by "*" */
+  char *pTerm;      /* text of the term.  '\000' terminated.  malloced */
+  int nTerm;        /* Number of bytes in pTerm[] */
+} QueryTerm;
+
+
+/* A query string is parsed into a Query structure.
+ *
+ * We could, in theory, allow query strings to be complicated
+ * nested expressions with precedence determined by parentheses.
+ * But none of the major search engines do this.  (Perhaps the
+ * feeling is that an parenthesized expression is two complex of
+ * an idea for the average user to grasp.)  Taking our lead from
+ * the major search engines, we will allow queries to be a list
+ * of terms (with an implied AND operator) or phrases in double-quotes,
+ * with a single optional "-" before each non-phrase term to designate
+ * negation and an optional OR connector.
+ *
+ * OR binds more tightly than the implied AND, which is what the
+ * major search engines seem to do.  So, for example:
+ *
+ *    [one two OR three]     ==>    one AND (two OR three)
+ *    [one OR two three]     ==>    (one OR two) AND three
+ *
+ * A "-" before a term matches all entries that lack that term.
+ * The "-" must occur immediately before the term with in intervening
+ * space.  This is how the search engines do it.
+ *
+ * A NOT term cannot be the right-hand operand of an OR.  If this
+ * occurs in the query string, the NOT is ignored:
+ *
+ *    [one OR -two]         ==>    one OR two
+ *
+ */
+typedef struct Query {
+  fulltext_vtab *pFts; /* The full text index */
+  int nTerms;          /* Number of terms in the query */
+  QueryTerm *pTerms;   /* Array of terms.  Space obtained from malloc() */
+  int nextIsOr;                /* Set the isOr flag on the next inserted term */
+  int nextIsNear;      /* Set the isOr flag on the next inserted term */
+  int nextColumn;      /* Next word parsed must be in this column */
+  int dfltColumn;      /* The default column */
+} Query;
+
+
 /*
 ** An instance of the following structure keeps track of generated
 ** matching-word offset information and snippets.
@@ -1798,6 +2317,7 @@
     int iToken;          /* The index of the matching document token */
     short int nByte;     /* Number of bytes in the term */
     int iStart;          /* The offset to the first character of the term */
+    int rank;           /* the rank of the snippet */
   } *aMatch;      /* Points to space obtained from malloc */
   char *zOffset;  /* Text rendering of aMatch[] */
   int nOffset;    /* strlen(zOffset) */
@@ -1886,14 +2406,15 @@
 ** arguments.
 */
 struct fulltext_vtab {
-  sqlite3_vtab base;               /* Base class used by SQLite core */
-  sqlite3 *db;                     /* The database connection */
-  const char *zDb;                 /* logical database name */
-  const char *zName;               /* virtual table name */
-  int nColumn;                     /* number of columns in virtual table */
-  char **azColumn;                 /* column names.  malloced */
-  char **azContentColumn;          /* column names in content table; malloced */
-  sqlite3_tokenizer *pTokenizer;   /* tokenizer for inserts and queries */
+  sqlite3_vtab base;              /* Base class used by SQLite core */
+  sqlite3 *db;                    /* The database connection */
+  const char *zDb;                /* logical database name */
+  const char *zName;              /* virtual table name */
+  int nColumn;                    /* number of columns in virtual table */
+  char **azColumn;                /* column names.  malloced */
+  char **azContentColumn;         /* column names in content table; malloced */
+  TrackerParser *parser;          /* tokenizer for inserts and queries */
+  int max_words;
 
   /* Precompiled statements which we keep as long as the table is
   ** open.
@@ -1930,18 +2451,22 @@
 ** is destroyed by xClose.
 */
 typedef struct fulltext_cursor {
-  sqlite3_vtab_cursor base;        /* Base class used by SQLite core */
-  QueryType iCursorType;           /* Copy of sqlite3_index_info.idxNum */
-  sqlite3_stmt *pStmt;             /* Prepared statement in use by the cursor */
-  int eof;                         /* True if at End Of Results */
-  Fts3Expr *pExpr;                 /* Parsed MATCH query string */
-  Snippet snippet;                 /* Cached snippet for the current row */
-  int iColumn;                     /* Column being searched */
-  DataBuffer result;               /* Doclist results from fulltextQuery */
-  DLReader reader;                 /* Result reader if result not empty */
+  sqlite3_vtab_cursor base;       /* Base class used by SQLite core */
+  QueryType iCursorType;          /* Copy of sqlite3_index_info.idxNum */
+  sqlite3_stmt *pStmt;            /* Prepared statement in use by the cursor */
+  int eof;                        /* True if at End Of Results */
+  Query q;                        /* Parsed query string */
+  Snippet snippet;                /* Cached snippet for the current row */
+  int iColumn;                    /* Column being searched */
+  DataBuffer result;              /* Doclist results from fulltextQuery */
+  DLReader reader;                /* Result reader if result not empty */
+  sqlite_int64 currentDocid;
+  int currentCatid;              /* (tracker) Category (service type ID) of the document */
+  GString *offsets;              /* (tracker) pre computed offsets from position data in index */
+  double  rank;                          /* (tracker) pre computed rank from position data in index */
 } fulltext_cursor;
 
-static fulltext_vtab *cursor_vtab(fulltext_cursor *c){
+static struct fulltext_vtab *cursor_vtab(fulltext_cursor *c){
   return (fulltext_vtab *) c->base.pVtab;
 }
 
@@ -2442,9 +2967,9 @@
     }
   }
 
-  if( v->pTokenizer!=NULL ){
-    v->pTokenizer->pModule->xDestroy(v->pTokenizer);
-    v->pTokenizer = NULL;
+  if( v->parser!=NULL ){
+    tracker_parser_free (v->parser);
+    v->parser = NULL;
   }
 
   clearPendingTerms(v);
@@ -2475,7 +3000,7 @@
 ** isFtsIdChar[X] must be 1.
 **
 ** Ticket #1066.  the SQL standard does not allow '$' in the
-** middle of identfiers.  But many SQL implementations do. 
+** middle of identifiers.  But many SQL implementations do.
 ** SQLite will allow '$' in identifiers for compatibility.
 ** But the feature is undocumented.
 */
@@ -2869,20 +3394,15 @@
 ** fulltext index defined by spec.
 */
 static int constructVtab(
-  sqlite3 *db,              /* The SQLite database connection */
-  fts3Hash *pHash,          /* Hash table containing tokenizers */
-  TableSpec *spec,          /* Parsed spec information from parseSpec() */
+  sqlite3 *db,             /* The SQLite database connection */
+  TableSpec *spec,         /* Parsed spec information from parseSpec() */
   sqlite3_vtab **ppVTab,    /* Write the resulting vtab structure here */
   char **pzErr              /* Write any error message here */
 ){
   int rc;
-  int n;
   fulltext_vtab *v = 0;
-  const sqlite3_tokenizer_module *m = NULL;
   char *schema;
 
-  char const *zTok;         /* Name of tokenizer to use for this fts table */
-  int nTok;                 /* Length of zTok, including nul terminator */
 
   v = (fulltext_vtab *) sqlite3_malloc(sizeof(fulltext_vtab));
   if( v==0 ) return SQLITE_NOMEM;
@@ -2897,6 +3417,7 @@
   v->azColumn = spec->azColumn;
   spec->azColumn = 0;
 
+/* comment out tokenizer stuff
   if( spec->azTokenizer==0 ){
     return SQLITE_NOMEM;
   }
@@ -2922,7 +3443,23 @@
     rc = m->xCreate(0, 0, &v->pTokenizer);
   }
   if( rc!=SQLITE_OK ) goto err;
-  v->pTokenizer->pModule = m;
+  */
+
+
+  /* set up our parser */
+
+  TrackerConfig *config = tracker_config_new ();
+
+  TrackerLanguage *language = tracker_language_new (config);
+
+  int min_len = tracker_config_get_min_word_length (config);
+  int max_len = tracker_config_get_max_word_length (config);
+  v->max_words = tracker_config_get_max_words_to_index (config);
+
+  v->parser =  tracker_parser_new (language, max_len, min_len);
+
+  g_object_unref (language);
+
 
   /* TODO: verify the existence of backing tables foo_content, foo_term */
 
@@ -2958,7 +3495,7 @@
   int rc = parseSpec(&spec, argc, argv, pzErr);
   if( rc!=SQLITE_OK ) return rc;
 
-  rc = constructVtab(db, (fts3Hash *)pAux, &spec, ppVTab, pzErr);
+  rc = constructVtab(db,  &spec, ppVTab, pzErr);
   clearTableSpec(&spec);
   return rc;
 }
@@ -3009,7 +3546,7 @@
                 ");");
   if( rc!=SQLITE_OK ) goto out;
 
-  rc = constructVtab(db, (fts3Hash *)pAux, &spec, ppVTab, pzErr);
+  rc = constructVtab(db, &spec, ppVTab, pzErr);
 
 out:
   clearTableSpec(&spec);
@@ -3077,11 +3614,15 @@
 static int fulltextOpen(sqlite3_vtab *pVTab, sqlite3_vtab_cursor **ppCursor){
   fulltext_cursor *c;
 
+  fulltext_vtab *v = (fulltext_vtab *)pVTab;
   c = (fulltext_cursor *) sqlite3_malloc(sizeof(fulltext_cursor));
   if( c ){
     memset(c, 0, sizeof(fulltext_cursor));
     /* sqlite will initialize c->base */
     *ppCursor = &c->base;
+    
+    c->offsets = g_string_new ("");
+        
     FTSTRACE(("FTS3 Open %p: %p\n", pVTab, c));
     return SQLITE_OK;
   }else{
@@ -3089,6 +3630,18 @@
   }
 }
 
+
+/* Free all of the dynamically allocated memory held by *q
+*/
+static void queryClear(Query *q){
+  int i;
+  for(i = 0; i < q->nTerms; ++i){
+    sqlite3_free(q->pTerms[i].pTerm);
+  }
+  sqlite3_free(q->pTerms);
+  CLEAR(q);
+}
+
 /* Free all of the dynamically allocated memory held by the
 ** Snippet
 */
@@ -3098,7 +3651,6 @@
   sqlite3_free(p->zSnippet);
   CLEAR(p);
 }
-
 /*
 ** Append a single entry to the p->aMatch[] log.
 */
@@ -3128,6 +3680,7 @@
   pMatch->nByte = nByte;
 }
 
+
 /*
 ** Sizing information for the circular buffer used in snippetOffsetsOfColumn()
 */
@@ -3135,88 +3688,30 @@
 #define FTS3_ROTOR_MASK (FTS3_ROTOR_SZ-1)
 
 /*
-** Function to iterate through the tokens of a compiled expression.
-**
-** Except, skip all tokens on the right-hand side of a NOT operator.
-** This function is used to find tokens as part of snippet and offset
-** generation and we do nt want snippets and offsets to report matches
-** for tokens on the RHS of a NOT.
-*/
-static int fts3NextExprToken(Fts3Expr **ppExpr, int *piToken){
-  Fts3Expr *p = *ppExpr;
-  int iToken = *piToken;
-  if( iToken<0 ){
-    /* In this case the expression p is the root of an expression tree.
-    ** Move to the first token in the expression tree.
-    */
-    while( p->pLeft ){
-      p = p->pLeft;
-    }
-    iToken = 0;
-  }else{
-    assert(p && p->eType==FTSQUERY_PHRASE );
-    if( iToken<(p->pPhrase->nToken-1) ){
-      iToken++;
-    }else{
-      iToken = 0;
-      while( p->pParent && p->pParent->pLeft!=p ){
-        assert( p->pParent->pRight==p );
-        p = p->pParent;
-      }
-      p = p->pParent;
-      if( p ){
-        assert( p->pRight!=0 );
-        p = p->pRight;
-        while( p->pLeft ){
-          p = p->pLeft;
-        }
-      }
-    }
-  }
-
-  *ppExpr = p;
-  *piToken = iToken;
-  return p?1:0;
-}
-
-/*
-** Return TRUE if the expression node pExpr is located beneath the
-** RHS of a NOT operator.
-*/
-static int fts3ExprBeneathNot(Fts3Expr *p){
-  Fts3Expr *pParent;
-  while( p ){
-    pParent = p->pParent;
-    if( pParent && pParent->eType==FTSQUERY_NOT && pParent->pRight==p ){
-      return 1;
-    }
-    p = pParent;
-  }
-  return 0;
-}
-
-/*
 ** Add entries to pSnippet->aMatch[] for every match that occurs against
 ** document zDoc[0..nDoc-1] which is stored in column iColumn.
 */
 static void snippetOffsetsOfColumn(
-  fulltext_cursor *pCur,         /* The fulltest search cursor */
-  Snippet *pSnippet,             /* The Snippet object to be filled in */
-  int iColumn,                   /* Index of fulltext table column */
-  const char *zDoc,              /* Text of the fulltext table column */
-  int nDoc                       /* Length of zDoc in bytes */
+  Query *pQuery,
+  Snippet *pSnippet,
+  int iColumn,
+  const char *zDoc,
+  int nDoc
+#ifdef STORE_CATEGORY
+  , int position
+#endif  
 ){
-  const sqlite3_tokenizer_module *pTModule;  /* The tokenizer module */
-  sqlite3_tokenizer *pTokenizer;             /* The specific tokenizer */
-  sqlite3_tokenizer_cursor *pTCursor;        /* Tokenizer cursor */
-  fulltext_vtab *pVtab;                /* The full text index */
-  int nColumn;                         /* Number of columns in the index */
-  int i, j;                            /* Loop counters */
-  int rc;                              /* Return code */
+
+  fulltext_vtab *pVtab;                       /* The full text index */
+  int nColumn;                        /* Number of columns in the index */
+  const QueryTerm *aTerm;             /* Query string terms */
+  int nTerm;                          /* Number of query string terms */
+  int i, j;                           /* Loop counters */
   unsigned int match, prevMatch;       /* Phrase search bitmasks */
-  const char *zToken;                  /* Next token from the tokenizer */
-  int nToken;                          /* Size of zToken */
-  int iBegin, iEnd, iPos;              /* Offsets of beginning and end */
+  const char *zToken;                 /* Next token from the tokenizer */
+  int nToken;                         /* Size of zToken */
+  int iBegin, iEnd, iPos;             /* Offsets of beginning and end */
+  gboolean new_paragraph, stop_word;
 
   /* The following variables keep a circular buffer of the last
   ** few tokens */
@@ -3224,49 +3719,64 @@
   int iRotorBegin[FTS3_ROTOR_SZ];      /* Beginning offset of token */
   int iRotorLen[FTS3_ROTOR_SZ];        /* Length of token */
 
-  pVtab = cursor_vtab(pCur);
+  pVtab = pQuery->pFts;
   nColumn = pVtab->nColumn;
-  pTokenizer = pVtab->pTokenizer;
-  pTModule = pTokenizer->pModule;
-  rc = pTModule->xOpen(pTokenizer, zDoc, nDoc, &pTCursor);
-  if( rc ) return;
-  pTCursor->pTokenizer = pTokenizer;
+
+  tracker_parser_reset (pVtab->parser, zDoc, nDoc, FALSE, TRUE, TRUE, FALSE);
+
+  aTerm = pQuery->pTerms;
+  nTerm = pQuery->nTerms;
+
+  if( nTerm>=FTS3_ROTOR_SZ ){
+    nTerm = FTS3_ROTOR_SZ - 1;
+  }
 
   prevMatch = 0;
-  while( !pTModule->xNext(pTCursor, &zToken, &nToken, &iBegin, &iEnd, &iPos) ){
-    Fts3Expr *pIter = pCur->pExpr;
-    int iIter = -1;
+
+  while(1){
+//    rc = pTModule->xNext(pTCursor, &zToken, &nToken, &iBegin, &iEnd, &iPos);
+   
+    
+    zToken = tracker_parser_next (pVtab->parser, 
+                                 &iPos,
+                                 &iBegin,
+                                 &iEnd,
+                                 &new_paragraph,
+                                 &stop_word,
+                                 &nToken);
+
+    if (!zToken) break;
+
+    if (stop_word) {
+      continue;
+    }
+    
+ 
     iRotorBegin[iRotor&FTS3_ROTOR_MASK] = iBegin;
     iRotorLen[iRotor&FTS3_ROTOR_MASK] = iEnd-iBegin;
     match = 0;
-    for(i=0; i<(FTS3_ROTOR_SZ-1) && fts3NextExprToken(&pIter, &iIter); i++){
-      int nPhrase;                    /* Number of tokens in current phrase */
-      struct PhraseToken *pToken;     /* Current token */
-      int iCol;                       /* Column index */
-
-      if( fts3ExprBeneathNot(pIter) ) continue;
-      nPhrase = pIter->pPhrase->nToken;
-      pToken = &pIter->pPhrase->aToken[iIter];
-      iCol = pIter->pPhrase->iColumn;
+    for(i=0; i<nTerm; i++){
+      int iCol;
+      iCol = aTerm[i].iColumn;
       if( iCol>=0 && iCol<nColumn && iCol!=iColumn ) continue;
-      if( pToken->n>nToken ) continue;
-      if( !pToken->isPrefix && pToken->n<nToken ) continue;
-      assert( pToken->n<=nToken );
-      if( memcmp(pToken->z, zToken, pToken->n) ) continue;
-      if( iIter>0 && (prevMatch & (1<<i))==0 ) continue;
+      if( aTerm[i].nTerm>nToken ) continue;
+      if( !aTerm[i].isPrefix && aTerm[i].nTerm<nToken ) continue;
+      assert( aTerm[i].nTerm<=nToken );
+      if( memcmp(aTerm[i].pTerm, zToken, aTerm[i].nTerm) ) continue;
+      if( aTerm[i].iPhrase>1 && (prevMatch & (1<<i))==0 ) continue;
       match |= 1<<i;
-      if( i==(FTS3_ROTOR_SZ-2) || nPhrase==iIter+1 ){
-        for(j=nPhrase-1; j>=0; j--){
-          int k = (iRotor-j) & FTS3_ROTOR_MASK;
-          snippetAppendMatch(pSnippet, iColumn, i-j, iPos-j,
-                iRotorBegin[k], iRotorLen[k]);
-        }
+      if( i==nTerm-1 || aTerm[i+1].iPhrase==1 ){
+       for(j=aTerm[i].iPhrase-1; j>=0; j--){
+         int k = (iRotor-j) & FTS3_ROTOR_MASK;
+         snippetAppendMatch(pSnippet, iColumn, i-j, iPos-j,
+               iRotorBegin[k], iRotorLen[k]);
+       }
       }
     }
     prevMatch = match<<1;
     iRotor++;
   }
-  pTModule->xClose(pTCursor);  
+//  pTModule->xClose(pTCursor);
 }
 
 /*
@@ -3283,156 +3793,191 @@
 ** 
 **     A NEAR/0 E
 **
-** then when this function is called the Snippet contains token offsets
-** 0, 4 and 5. This function removes the "0" entry (because the first A
-** is not near enough to an E).
-**
-** When this function is called, the value pointed to by parameter piLeft is
-** the integer id of the left-most token in the expression tree headed by
-** pExpr. This function increments *piLeft by the total number of tokens
-** in the expression tree headed by pExpr.
-**
-** Return 1 if any trimming occurs.  Return 0 if no trimming is required.
-*/
-static int trimSnippetOffsets(
-  Fts3Expr *pExpr,      /* The search expression */
-  Snippet *pSnippet,    /* The set of snippet offsets to be trimmed */
-  int *piLeft           /* Index of left-most token in pExpr */
-){
-  if( pExpr ){
-    if( trimSnippetOffsets(pExpr->pLeft, pSnippet, piLeft) ){
-      return 1;
-    }
-
-    switch( pExpr->eType ){
-      case FTSQUERY_PHRASE:
-        *piLeft += pExpr->pPhrase->nToken;
-        break;
-      case FTSQUERY_NEAR: {
-        /* The right-hand-side of a NEAR operator is always a phrase. The
-        ** left-hand-side is either a phrase or an expression tree that is 
-        ** itself headed by a NEAR operator. The following initializations
-        ** set local variable iLeft to the token number of the left-most
-        ** token in the right-hand phrase, and iRight to the right most
-        ** token in the same phrase. For example, if we had:
-        **
-        **     <col> MATCH '"abc def" NEAR/2 "ghi jkl"'
-        **
-        ** then iLeft will be set to 2 (token number of ghi) and nToken will
-        ** be set to 4.
-        */
-        Fts3Expr *pLeft = pExpr->pLeft;
-        Fts3Expr *pRight = pExpr->pRight;
-        int iLeft = *piLeft;
-        int nNear = pExpr->nNear;
-        int nToken = pRight->pPhrase->nToken;
-        int jj, ii;
-        if( pLeft->eType==FTSQUERY_NEAR ){
-          pLeft = pLeft->pRight;
-        }
-        assert( pRight->eType==FTSQUERY_PHRASE );
-        assert( pLeft->eType==FTSQUERY_PHRASE );
-        nToken += pLeft->pPhrase->nToken;
-
-        for(ii=0; ii<pSnippet->nMatch; ii++){
-          struct snippetMatch *p = &pSnippet->aMatch[ii];
-          if( p->iTerm==iLeft ){
-            int isOk = 0;
-            /* Snippet ii is an occurence of query term iLeft in the document.
-            ** It occurs at position (p->iToken) of the document. We now
-            ** search for an instance of token (iLeft-1) somewhere in the 
-            ** range (p->iToken - nNear)...(p->iToken + nNear + nToken) within 
-            ** the set of snippetMatch structures. If one is found, proceed. 
-            ** If one cannot be found, then remove snippets ii..(ii+N-1) 
-            ** from the matching snippets, where N is the number of tokens 
-            ** in phrase pRight->pPhrase.
-            */
-            for(jj=0; isOk==0 && jj<pSnippet->nMatch; jj++){
-              struct snippetMatch *p2 = &pSnippet->aMatch[jj];
-              if( p2->iTerm==(iLeft-1) ){
-                if( p2->iToken>=(p->iToken-nNear-1) 
-                 && p2->iToken<(p->iToken+nNear+nToken) 
-                ){
-                  isOk = 1;
-                }
-              }
-            }
-            if( !isOk ){
-              int kk;
-              for(kk=0; kk<pRight->pPhrase->nToken; kk++){
-                pSnippet->aMatch[kk+ii].iTerm = -2;
-              }
-              return 1;
-            }
-          }
-          if( p->iTerm==(iLeft-1) ){
-            int isOk = 0;
-            for(jj=0; isOk==0 && jj<pSnippet->nMatch; jj++){
-              struct snippetMatch *p2 = &pSnippet->aMatch[jj];
-              if( p2->iTerm==iLeft ){
-                if( p2->iToken<=(p->iToken+nNear+1) 
-                 && p2->iToken>(p->iToken-nNear-nToken) 
-                ){
-                  isOk = 1;
-                }
-              }
-            }
-            if( !isOk ){
-              int kk;
-              for(kk=0; kk<pLeft->pPhrase->nToken; kk++){
-                pSnippet->aMatch[ii-kk].iTerm = -2;
-              }
-              return 1;
-            }
-          }
-        }
-        break;
+** then when this function is called the Snippet contains token offsets
+** 0, 4 and 5. This function removes the "0" entry (because the first A
+** is not near enough to an E).
+*/
+static void trimSnippetOffsetsForNear(Query *pQuery, Snippet *pSnippet){
+  int ii;
+  int iDir = 1;
+
+  while(iDir>-2) {
+    assert( iDir==1 || iDir==-1 );
+    for(ii=0; ii<pSnippet->nMatch; ii++){
+      int jj;
+      int nNear;
+      struct snippetMatch *pMatch = &pSnippet->aMatch[ii];
+      QueryTerm *pQueryTerm = &pQuery->pTerms[pMatch->iTerm];
+
+      if( (pMatch->iTerm+iDir)<0
+       || (pMatch->iTerm+iDir)>=pQuery->nTerms
+      ){
+       continue;
+      }
+
+      nNear = pQueryTerm->nNear;
+      if( iDir<0 ){
+       nNear = pQueryTerm[-1].nNear;
       }
-    }
 
-    if( trimSnippetOffsets(pExpr->pRight, pSnippet, piLeft) ){
-      return 1;
+      if( pMatch->iTerm>=0 && nNear ){
+       int isOk = 0;
+       int iNextTerm = pMatch->iTerm+iDir;
+       int iPrevTerm = iNextTerm;
+
+       int iEndToken;
+       int iStartToken;
+
+       if( iDir<0 ){
+         int nPhrase = 1;
+         iStartToken = pMatch->iToken;
+         while( (pMatch->iTerm+nPhrase)<pQuery->nTerms
+             && pQuery->pTerms[pMatch->iTerm+nPhrase].iPhrase>1
+         ){
+           nPhrase++;
+         }
+         iEndToken = iStartToken + nPhrase - 1;
+       }else{
+         iEndToken   = pMatch->iToken;
+         iStartToken = pMatch->iToken+1-pQueryTerm->iPhrase;
+       }
+
+       while( pQuery->pTerms[iNextTerm].iPhrase>1 ){
+         iNextTerm--;
+       }
+       while( (iPrevTerm+1)<pQuery->nTerms &&
+              pQuery->pTerms[iPrevTerm+1].iPhrase>1
+       ){
+         iPrevTerm++;
+       }
+
+       for(jj=0; isOk==0 && jj<pSnippet->nMatch; jj++){
+         struct snippetMatch *p = &pSnippet->aMatch[jj];
+         if( p->iCol==pMatch->iCol && ((
+              p->iTerm==iNextTerm &&
+              p->iToken>iEndToken &&
+              p->iToken<=iEndToken+nNear
+         ) || (
+              p->iTerm==iPrevTerm &&
+              p->iToken<iStartToken &&
+              p->iToken>=iStartToken-nNear
+         ))){
+           isOk = 1;
+         }
+       }
+       if( !isOk ){
+         for(jj=1-pQueryTerm->iPhrase; jj<=0; jj++){
+           pMatch[jj].iTerm = -1;
+         }
+         ii = -1;
+         iDir = 1;
+       }
+      }
     }
+    iDir -= 2;
   }
-  return 0;
 }
 
+
+
 /*
 ** Compute all offsets for the current row of the query.  
 ** If the offsets have already been computed, this routine is a no-op.
 */
 static void snippetAllOffsets(fulltext_cursor *p){
-  int nColumn;
   int iColumn, i;
-  int iFirst, iLast;
-  int iTerm = 0;
-  fulltext_vtab *pFts = cursor_vtab(p);
+  fulltext_vtab *pFts;
 
-  if( p->snippet.nMatch || p->pExpr==0 ){
-    return;
+  if( p->snippet.nMatch ) return;
+  if( p->q.nTerms==0 ) return;
+  pFts = p->q.pFts;
+  
+#ifdef STORE_CATEGORY  
+  PLReader plReader;
+  int col_array[255];
+  gpointer pos_array[255];
+  
+  for (i=0; i<255; i++) {
+    col_array[i] = 0;
+    pos_array[i] = NULL;
+  }
+  
+  
+  int iPos = 0;
+  
+  if (dlrAtEnd (&p->reader)) return;
+  
+  plrInit(&plReader, &p->reader);
+  
+  if (plrAtEnd(&plReader)) return;
+  
+  iColumn = -1;
+    
+  for ( ; !plrAtEnd(&plReader); plrStep(&plReader) ){
+        
+    if (plrColumn (&plReader) != iColumn) {
+    
+      iColumn = plrColumn(&plReader);
+      col_array[iColumn] += 1;
+    }
+        
+    iPos = plrPosition(&plReader);
+    GSList *l = pos_array[iColumn];
+    l = g_slist_prepend (l, GINT_TO_POINTER (iPos)); 
+  }
+
+  plrEndAndDestroy(&plReader);
+  
+  
+  /* get the column with most hits */  
+  int hit_column = 0;
+  int hit_column_count = col_array[0];  
+  
+  /*bias field id 0 more as its the main content field */
+ // if (hit_column_count > 0) hit_column_count++;
+  
+  for (i=1; i<255; i++) {
+    if (col_array [i] > hit_column_count) {
+      hit_column = i;
+      hit_column_count =col_array[i];
+    }
+    
+    g_slist_free (pos_array[i]);
   }
+
+
+  const char *zDoc;
+  int nDoc;
+  zDoc = (const char*)sqlite3_column_text(p->pStmt, hit_column+1);
+  nDoc = sqlite3_column_bytes(p->pStmt, hit_column+1);
+  snippetOffsetsOfColumn(&p->q, &p->snippet, hit_column, zDoc, nDoc, iPos);
+  
+  
+#else  
+  int iFirst, iLast;
+  int nColumn;
+      
   nColumn = pFts->nColumn;
   iColumn = (p->iCursorType - QUERY_FULLTEXT);
   if( iColumn<0 || iColumn>=nColumn ){
-    /* Look for matches over all columns of the full-text index */
     iFirst = 0;
     iLast = nColumn-1;
   }else{
-    /* Look for matches in the iColumn-th column of the index only */
     iFirst = iColumn;
     iLast = iColumn;
   }
+  
+    
   for(i=iFirst; i<=iLast; i++){
     const char *zDoc;
     int nDoc;
     zDoc = (const char*)sqlite3_column_text(p->pStmt, i+1);
     nDoc = sqlite3_column_bytes(p->pStmt, i+1);
-    snippetOffsetsOfColumn(p, &p->snippet, i, zDoc, nDoc);
-  }
-
-  while( trimSnippetOffsets(p->pExpr, &p->snippet, &iTerm) ){
-    iTerm = 0;
+    snippetOffsetsOfColumn(&p->q, &p->snippet, i, zDoc, nDoc);
   }
+#endif  
+  
+  trimSnippetOffsetsForNear(&p->q, &p->snippet);
 }
 
 /*
@@ -3553,7 +4098,7 @@
     aMatch[i].snStatus = SNIPPET_IGNORE;
   }
   nDesired = 0;
-  for(i=0; i<FTS3_ROTOR_SZ; i++){
+  for(i=0; i<pCursor->q.nTerms; i++){
     for(j=0; j<nMatch; j++){
       if( aMatch[j].iTerm==i ){
         aMatch[j].snStatus = SNIPPET_DESIRED;
@@ -3641,11 +4186,10 @@
   fulltext_cursor *c = (fulltext_cursor *) pCursor;
   FTSTRACE(("FTS3 Close %p\n", c));
   sqlite3_finalize(c->pStmt);
-  sqlite3Fts3ExprFree(c->pExpr);
+  queryClear(&c->q);
   snippetClear(&c->snippet);
-  if( c->result.nData!=0 ){
-    dlrDestroy(&c->reader);
-  }
+  g_string_free (c->offsets, TRUE);
+  if( c->result.nData!=0 ) dlrDestroy(&c->reader);
   dataBufferDestroy(&c->result);
   sqlite3_free(c);
   return SQLITE_OK;
@@ -3680,7 +4224,38 @@
       return SQLITE_OK;
     }
     rc = sqlite3_bind_int64(c->pStmt, 1, dlrDocid(&c->reader));
+    c->currentDocid = dlrDocid(&c->reader);
+    c->currentCatid = dlrCatid(&c->reader);
+
+    /* (tracker) read position offsets here */
+    
+    PLReader plReader;
+    gboolean first_pos = TRUE;
+   
+    c->offsets = g_string_assign (c->offsets, "");
+    c->rank = 0;
+
+    plrInit(&plReader, &c->reader);
+  
+    
+    for ( ; !plrAtEnd(&plReader); plrStep(&plReader) ){
+     
+      int col = plrColumn (&plReader);
+      
+      c->rank += get_metadata_weight (col);
+      
+      if (first_pos) {
+        g_string_append_printf (c->offsets, "%d,%d", col, plrPosition (&plReader));
+        first_pos = FALSE;
+      } else {
+        g_string_append_printf (c->offsets, ",%d,%d", col, plrPosition (&plReader));
+      }
+    }
+       
+    plrDestroy(&plReader);
+
     dlrStep(&c->reader);
+    
     if( rc!=SQLITE_OK ) return rc;
     /* TODO(shess) Handle SQLITE_SCHEMA AND SQLITE_BUSY. */
     rc = sqlite3_step(c->pStmt);
@@ -3708,121 +4283,300 @@
 ** The resulting DL_DOCIDS doclist is stored in pResult, which is
 ** overwritten.
 */
-static int docListOfPhrase(
-  fulltext_vtab *pTab,   /* The full text index */
-  Fts3Phrase *pPhrase,   /* Phrase to return a doclist corresponding to */
-  DocListType eListType, /* Either DL_DOCIDS or DL_POSITIONS */
-  DataBuffer *pResult    /* Write the result here */
+static int docListOfTerm(
+  fulltext_vtab *v,    /* The full text index */
+  int iColumn,        /* column to restrict to.  No restriction if >=nColumn */
+  QueryTerm *pQTerm,   /* Term we are looking for, or 1st term of a phrase */
+  DataBuffer *pResult  /* Write the result here */
 ){
-  int ii;
-  int rc = SQLITE_OK;
-  int iCol = pPhrase->iColumn;
-  DocListType eType = eListType;
-  assert( eType==DL_POSITIONS || eType==DL_DOCIDS );
-  if( pPhrase->nToken>1 ){
-    eType = DL_POSITIONS;
-  }
+  DataBuffer left, right, new;
+  int i, rc;
+
+  /* No phrase search if no position info. */
+  assert( pQTerm->nPhrase==0 || DL_DEFAULT!=DL_DOCIDS );
 
   /* This code should never be called with buffered updates. */
-  assert( pTab->nPendingData<0 );
+  assert( v->nPendingData<0 );
 
-  for(ii=0; rc==SQLITE_OK && ii<pPhrase->nToken; ii++){
-    DataBuffer tmp;
-    struct PhraseToken *p = &pPhrase->aToken[ii];
-    rc = termSelect(pTab, iCol, p->z, p->n, p->isPrefix, eType, &tmp);
-    if( rc==SQLITE_OK ){
-      if( ii==0 ){
-        *pResult = tmp;
-      }else{
-        DataBuffer res = *pResult;
-        dataBufferInit(pResult, 0);
-        if( ii==(pPhrase->nToken-1) ){
-          eType = eListType;
-        }
-        docListPhraseMerge(
-          res.pData, res.nData, tmp.pData, tmp.nData, 0, 0, eType, pResult
-        );
-        dataBufferDestroy(&res);
-        dataBufferDestroy(&tmp);
-      }
+  dataBufferInit(&left, 0);
+  
+  #ifdef STORE_CATEGORY
+  rc = termSelect(v, iColumn, pQTerm->pTerm, pQTerm->nTerm, pQTerm->isPrefix,
+                  DL_POSITIONS, &left);
+  #else
+  rc = termSelect(v, iColumn, pQTerm->pTerm, pQTerm->nTerm, pQTerm->isPrefix,
+                  (0<pQTerm->nPhrase ? DL_POSITIONS : DL_DOCIDS), &left);
+  #endif                
+                  
+  if( rc ) return rc;
+  for(i=1; i<=pQTerm->nPhrase && left.nData>0; i++){
+    /* If this token is connected to the next by a NEAR operator, and
+    ** the next token is the start of a phrase, then set nPhraseRight
+    ** to the number of tokens in the phrase. Otherwise leave it at 1.
+    */
+    int nPhraseRight = 1;
+    while( (i+nPhraseRight)<=pQTerm->nPhrase
+       && pQTerm[i+nPhraseRight].nNear==0
+    ){
+      nPhraseRight++;
     }
+
+    dataBufferInit(&right, 0);
+    rc = termSelect(v, iColumn, pQTerm[i].pTerm, pQTerm[i].nTerm,
+                   pQTerm[i].isPrefix, DL_POSITIONS, &right);
+    if( rc ){
+      dataBufferDestroy(&left);
+      return rc;
+    }
+    dataBufferInit(&new, 0);
+
+    #ifdef STORE_CATEGORY
+    docListPhraseMerge(left.pData, left.nData, right.pData, right.nData,
+                       pQTerm[i-1].nNear, pQTerm[i-1].iPhrase + nPhraseRight,
+                       DL_POSITIONS,
+                       &new, i);
+    
+    #else
+    docListPhraseMerge(left.pData, left.nData, right.pData, right.nData,
+                       pQTerm[i-1].nNear, pQTerm[i-1].iPhrase + nPhraseRight,
+                       ((i<pQTerm->nPhrase) ? DL_POSITIONS : DL_DOCIDS),
+                       &new, i);
+
+    #endif                   
+    dataBufferDestroy(&left);
+    dataBufferDestroy(&right);
+    left = new;
   }
+  *pResult = left;
+  return SQLITE_OK;
+}
 
-  return rc;
+/* Add a new term pTerm[0..nTerm-1] to the query *q.
+*/
+static void queryAdd(Query *q, const char *pTerm, int nTerm){
+  QueryTerm *t;
+  ++q->nTerms;
+  q->pTerms = sqlite3_realloc(q->pTerms, q->nTerms * sizeof(q->pTerms[0]));
+  if( q->pTerms==0 ){
+    q->nTerms = 0;
+    return;
+  }
+  t = &q->pTerms[q->nTerms - 1];
+  CLEAR(t);
+  t->pTerm = sqlite3_malloc(nTerm+1);
+  memcpy(t->pTerm, pTerm, nTerm);
+  t->pTerm[nTerm] = 0;
+  t->nTerm = nTerm;
+  t->isOr = q->nextIsOr;
+  t->isPrefix = 0;
+  q->nextIsOr = 0;
+  t->iColumn = q->nextColumn;
+  q->nextColumn = q->dfltColumn;
 }
 
 /*
-** Evaluate the full-text expression pExpr against fts3 table pTab. Write
-** the results into pRes.
-*/
-static int evalFts3Expr(
-  fulltext_vtab *pTab,           /* Fts3 Virtual table object */
-  Fts3Expr *pExpr,               /* Parsed fts3 expression */
-  DataBuffer *pRes               /* OUT: Write results of the expression here */
+** Check to see if the string zToken[0...nToken-1] matches any
+** column name in the virtual table.   If it does,
+** return the zero-indexed column number.  If not, return -1.
+*/
+static int checkColumnSpecifier(
+  fulltext_vtab *pVtab,    /* The virtual table */
+  const char *zToken,     /* Text of the token */
+  int nToken              /* Number of characters in the token */
 ){
-  int rc = SQLITE_OK;
+  int i;
+  for(i=0; i<pVtab->nColumn; i++){
+    if( memcmp(pVtab->azColumn[i], zToken, nToken)==0
+       && pVtab->azColumn[i][nToken]==0 ){
+      return i;
+    }
+  }
+  return -1;
+}
 
-  /* Initialize the output buffer. If this is an empty query (pExpr==0), 
-  ** this is all that needs to be done. Empty queries produce empty 
-  ** result sets.
-  */
-  dataBufferInit(pRes, 0);
-
-  if( pExpr ){
-    if( pExpr->eType==FTSQUERY_PHRASE ){
-      DocListType eType = DL_DOCIDS;
-      if( pExpr->pParent && pExpr->pParent->eType==FTSQUERY_NEAR ){
-        eType = DL_POSITIONS;
-      }
-      rc = docListOfPhrase(pTab, pExpr->pPhrase, eType, pRes);
-    }else{
-      DataBuffer lhs;
-      DataBuffer rhs;
+/*
+** Parse the text at pSegment[0..nSegment-1].  Add additional terms
+** to the query being assemblied in pQuery.
+**
+** inPhrase is true if pSegment[0..nSegment-1] is contained within
+** double-quotes.  If inPhrase is true, then the first term
+** is marked with the number of terms in the phrase less one and
+** OR and "-" syntax is ignored.  If inPhrase is false, then every
+** term found is marked with nPhrase=0 and OR and "-" syntax is significant.
+*/
+static int tokenizeSegment(
+  TrackerParser *parser,                 /* The tokenizer to use */
+  const char *pSegment, int nSegment,    /* Query expression being parsed */
+  int inPhrase,                                  /* True if within "..." */
+  Query *pQuery                                  /* Append results here */
+){
+  int firstIndex = pQuery->nTerms;
+  int iCol;
+  int nTerm = 1;
 
-      dataBufferInit(&rhs, 0);
-      if( SQLITE_OK==(rc = evalFts3Expr(pTab, pExpr->pLeft, &lhs)) 
-       && SQLITE_OK==(rc = evalFts3Expr(pTab, pExpr->pRight, &rhs)) 
+  tracker_parser_reset (parser, pSegment, nSegment, FALSE, TRUE, TRUE, TRUE);
+
+  while( 1 ){
+    const char *pToken;
+    int nToken, iBegin, iEnd, iPos, stop_word, new_paragraph;
+
+
+    pToken = tracker_parser_next (parser, &iPos,
+                                    &iBegin,
+                                    &iEnd,
+                                    &new_paragraph,
+                                    &stop_word,
+                                    &nToken);
+    if (!pToken) {
+      break;
+     }
+
+//   printf("token being indexed  is %s, pos is %d, begin is %d, end is %d and length is %d\n", pToken, iPos, iBegin, iEnd, nToken);
+
+    if( !inPhrase &&
+       pSegment[iEnd]==':') {
+
+       int len = iEnd - iBegin;
+       char *field = g_strndup (pSegment + iBegin, len);
+
+    //   printf ("field is %s\n", field);
+
+       if ((iCol = checkColumnSpecifier(pQuery->pFts, field, len))>=0 ){
+          pQuery->nextColumn = iCol;
+          g_free (field);
+          continue;
+       }
+    }
+    if( !inPhrase && pQuery->nTerms>0 && nToken==2
+     && pToken[0] == 'o' && pToken[1] == 'r'
+    ){
+      pQuery->nextIsOr = 1;
+      continue;
+    }
+    if( !inPhrase && pQuery->nTerms>0 && !pQuery->nextIsOr && nToken==4
+      && pToken[0]=='n'
+      && pToken[1]=='e'
+      && pToken[2]=='a'
+      && pToken[3]=='r'
+    ){
+      QueryTerm *pTerm = &pQuery->pTerms[pQuery->nTerms-1];
+      if( (iBegin+6)<nSegment
+       && pSegment[iBegin+4] == '/'
+       && pSegment[iBegin+5]>='0' && pSegment[iBegin+5]<='9'
       ){
-        switch( pExpr->eType ){
-          case FTSQUERY_NEAR: {
-            int nToken;
-            Fts3Expr *pLeft;
-            DocListType eType = DL_DOCIDS;
-            if( pExpr->pParent && pExpr->pParent->eType==FTSQUERY_NEAR ){
-              eType = DL_POSITIONS;
-            }
-            pLeft = pExpr->pLeft;
-            while( pLeft->eType==FTSQUERY_NEAR ){ 
-              pLeft=pLeft->pRight;
-            }
-            assert( pExpr->pRight->eType==FTSQUERY_PHRASE );
-            assert( pLeft->eType==FTSQUERY_PHRASE );
-            nToken = pLeft->pPhrase->nToken + pExpr->pRight->pPhrase->nToken;
-            docListPhraseMerge(lhs.pData, lhs.nData, rhs.pData, rhs.nData, 
-                pExpr->nNear+1, nToken, eType, pRes
-            );
-            break;
-          }
-          case FTSQUERY_NOT: {
-            docListExceptMerge(lhs.pData, lhs.nData, rhs.pData, rhs.nData,pRes);
-            break;
-          }
-          case FTSQUERY_AND: {
-            docListAndMerge(lhs.pData, lhs.nData, rhs.pData, rhs.nData, pRes);
-            break;
-          }
-          case FTSQUERY_OR: {
-            docListOrMerge(lhs.pData, lhs.nData, rhs.pData, rhs.nData, pRes);
-            break;
-          }
-        }
+       pTerm->nNear = (pSegment[iBegin+5] - '0');
+       nToken += 2;
+       if( pSegment[iBegin+6]>='0' && pSegment[iBegin+6]<='9' ){
+         pTerm->nNear = pTerm->nNear * 10 + (pSegment[iBegin+6] - '0');
+         iEnd++;
+       }
+       pToken = tracker_parser_next (parser, &iPos,
+                                    &iBegin,
+                                    &iEnd,
+                                    &new_paragraph,
+                                    &stop_word,
+                                    &nToken);
+       if (!pToken) {
+         break;
+       }
+
+
+      } else {
+       pTerm->nNear = SQLITE_FTS3_DEFAULT_NEAR_PARAM;
       }
-      dataBufferDestroy(&lhs);
-      dataBufferDestroy(&rhs);
+      pTerm->nNear++;
+      continue;
+    }
+
+    if (stop_word != 0) {
+       continue;
+    }
+
+    queryAdd(pQuery, pToken, nToken);
+    if( !inPhrase && iBegin>0) {
+
+   //  printf("first char is %c, prev char is %c\n", pSegment[iBegin], pSegment[iBegin-1]);
+
+      if (pSegment[iBegin-1]=='-' ){
+       pQuery->pTerms[pQuery->nTerms-1].isNot = 1;
+      }
+    }
+    if( iEnd<nSegment && pSegment[iEnd]=='*' ){
+      pQuery->pTerms[pQuery->nTerms-1].isPrefix = 1;
+    }
+    pQuery->pTerms[pQuery->nTerms-1].iPhrase = nTerm;
+    if( inPhrase ){
+      nTerm++;
     }
   }
 
-  return rc;
+  if( inPhrase && pQuery->nTerms>firstIndex ){
+    pQuery->pTerms[firstIndex].nPhrase = pQuery->nTerms - firstIndex - 1;
+  }
+
+  return SQLITE_OK;
+}
+
+/* Parse a query string, yielding a Query object pQuery.
+**
+** The calling function will need to queryClear() to clean up
+** the dynamically allocated memory held by pQuery.
+*/
+static int parseQuery(
+  fulltext_vtab *v,       /* The fulltext index */
+  const char *zInput,     /* Input text of the query string */
+  int nInput,             /* Size of the input text */
+  int dfltColumn,         /* Default column of the index to match against */
+  Query *pQuery                   /* Write the parse results here. */
+){
+  int iInput, inPhrase = 0;
+  int ii;
+  QueryTerm *aTerm;
+
+  if( zInput==0 ) nInput = 0;
+  if( nInput<0 ) nInput = strlen(zInput);
+  pQuery->nTerms = 0;
+  pQuery->pTerms = NULL;
+  pQuery->nextIsOr = 0;
+  pQuery->nextColumn = dfltColumn;
+  pQuery->dfltColumn = dfltColumn;
+  pQuery->pFts = v;
+
+  for(iInput=0; iInput<nInput; ++iInput){
+    int i;
+    for(i=iInput; i<nInput && zInput[i]!='"'; ++i){}
+    if( i>iInput ){
+      tokenizeSegment(v->parser, zInput+iInput, i-iInput, inPhrase,
+                      pQuery);
+    }
+    iInput = i;
+    if( i<nInput ){
+      assert( zInput[i]=='"' );
+      inPhrase = !inPhrase;
+    }
+  }
+
+  if( inPhrase ){
+    /* unmatched quote */
+    queryClear(pQuery);
+    return SQLITE_ERROR;
+  }
+
+  /* Modify the values of the QueryTerm.nPhrase variables to account for
+  ** the NEAR operator. For the purposes of QueryTerm.nPhrase, phrases
+  ** and tokens connected by the NEAR operator are handled as a single
+  ** phrase. See comments above the QueryTerm structure for details.
+  */
+  aTerm = pQuery->pTerms;
+  for(ii=0; ii<pQuery->nTerms; ii++){
+    if( aTerm[ii].nNear || aTerm[ii].nPhrase ){
+      while (aTerm[ii+aTerm[ii].nPhrase].nNear) {
+       aTerm[ii].nPhrase += (1 + aTerm[ii+aTerm[ii].nPhrase+1].nPhrase);
+      }
+    }
+  }
+
+  return SQLITE_OK;
 }
 
 /* TODO(shess) Refactor the code to remove this forward decl. */
@@ -3836,14 +4590,17 @@
 ** they are allowed to match against any column.
 */
 static int fulltextQuery(
-  fulltext_vtab *v,      /* The full text index */
-  int iColumn,           /* Match against this column by default */
-  const char *zInput,    /* The query string */
-  int nInput,            /* Number of bytes in zInput[] */
-  DataBuffer *pResult,   /* Write the result doclist here */
-  Fts3Expr **ppExpr        /* Put parsed query string here */
+  fulltext_vtab *v,     /* The full text index */
+  int iColumn,          /* Match against this column by default */
+  const char *zInput,   /* The query string */
+  int nInput,           /* Number of bytes in zInput[] */
+  DataBuffer *pResult,  /* Write the result doclist here */
+  Query *pQuery                 /* Put parsed query string here */
 ){
-  int rc;
+  int i, iNext, rc;
+  DataBuffer left, right, or, new;
+  int nNot = 0;
+  QueryTerm *aTerm;
 
   /* TODO(shess) Instead of flushing pendingTerms, we could query for
   ** the relevant term and merge the doclist into what we receive from
@@ -3855,20 +4612,86 @@
 
   /* Flush any buffered updates before executing the query. */
   rc = flushPendingTerms(v);
-  if( rc!=SQLITE_OK ){
-    return rc;
+  if( rc!=SQLITE_OK ) return rc;
+
+  /* TODO(shess) I think that the queryClear() calls below are not
+  ** necessary, because fulltextClose() already clears the query.
+  */
+  rc = parseQuery(v, zInput, nInput, iColumn, pQuery);
+  if( rc!=SQLITE_OK ) return rc;
+
+  /* Empty or NULL queries return no results. */
+  if( pQuery->nTerms==0 ){
+    dataBufferInit(pResult, 0);
+    return SQLITE_OK;
   }
 
-  /* Parse the query passed to the MATCH operator. */
-  rc = sqlite3Fts3ExprParse(v->pTokenizer, 
-      v->azColumn, v->nColumn, iColumn, zInput, nInput, ppExpr
-  );
-  if( rc!=SQLITE_OK ){
-    assert( 0==(*ppExpr) );
-    return rc;
+  /* Merge AND terms. */
+  /* TODO(shess) I think we can early-exit if( i>nNot && left.nData==0 ). */
+  aTerm = pQuery->pTerms;
+  for(i = 0; i<pQuery->nTerms; i=iNext){
+    if( aTerm[i].isNot ){
+      /* Handle all NOT terms in a separate pass */
+      nNot++;
+      iNext = i + aTerm[i].nPhrase+1;
+      continue;
+    }
+    iNext = i + aTerm[i].nPhrase + 1;
+    rc = docListOfTerm(v, aTerm[i].iColumn, &aTerm[i], &right);
+    if( rc ){
+      if( i!=nNot ) dataBufferDestroy(&left);
+      queryClear(pQuery);
+      return rc;
+    }
+    while( iNext<pQuery->nTerms && aTerm[iNext].isOr ){
+      rc = docListOfTerm(v, aTerm[iNext].iColumn, &aTerm[iNext], &or);
+      iNext += aTerm[iNext].nPhrase + 1;
+      if( rc ){
+       if( i!=nNot ) dataBufferDestroy(&left);
+       dataBufferDestroy(&right);
+       queryClear(pQuery);
+       return rc;
+      }
+      dataBufferInit(&new, 0);
+      docListOrMerge(right.pData, right.nData, or.pData, or.nData, &new);
+      dataBufferDestroy(&right);
+      dataBufferDestroy(&or);
+      right = new;
+    }
+    if( i==nNot ){          /* first term processed. */
+      left = right;
+    }else{
+      dataBufferInit(&new, 0);
+      docListAndMerge(left.pData, left.nData, right.pData, right.nData, &new);
+      dataBufferDestroy(&right);
+      dataBufferDestroy(&left);
+      left = new;
+    }
+  }
+
+  if( nNot==pQuery->nTerms ){
+    /* We do not yet know how to handle a query of only NOT terms */
+    return SQLITE_ERROR;
   }
 
-  return evalFts3Expr(v, *ppExpr, pResult);
+  /* Do the EXCEPT terms */
+  for(i=0; i<pQuery->nTerms;  i += aTerm[i].nPhrase + 1){
+    if( !aTerm[i].isNot ) continue;
+    rc = docListOfTerm(v, aTerm[i].iColumn, &aTerm[i], &right);
+    if( rc ){
+      queryClear(pQuery);
+      dataBufferDestroy(&left);
+      return rc;
+    }
+    dataBufferInit(&new, 0);
+    docListExceptMerge(left.pData, left.nData, right.pData, right.nData, &new);
+    dataBufferDestroy(&right);
+    dataBufferDestroy(&left);
+    left = new;
+  }
+
+  *pResult = left;
+  return rc;
 }
 
 /*
@@ -3900,43 +4723,21 @@
   fulltext_cursor *c = (fulltext_cursor *) pCursor;
   fulltext_vtab *v = cursor_vtab(c);
   int rc;
+  StringBuffer sb;
 
   FTSTRACE(("FTS3 Filter %p\n",pCursor));
 
-  /* If the cursor has a statement that was not prepared according to
-  ** idxNum, clear it.  I believe all calls to fulltextFilter with a
-  ** given cursor will have the same idxNum , but in this case it's
-  ** easy to be safe.
-  */
-  if( c->pStmt && c->iCursorType!=idxNum ){
-    sqlite3_finalize(c->pStmt);
-    c->pStmt = NULL;
-  }
-
-  /* Get a fresh statement appropriate to idxNum. */
-  /* TODO(shess): Add a prepared-statement cache in the vt structure.
-  ** The cache must handle multiple open cursors.  Easier to cache the
-  ** statement variants at the vt to reduce malloc/realloc/free here.
-  ** Or we could have a StringBuffer variant which allowed stack
-  ** construction for small values.
-  */
-  if( !c->pStmt ){
-    StringBuffer sb;
-    initStringBuffer(&sb);
-    append(&sb, "SELECT docid, ");
-    appendList(&sb, v->nColumn, v->azContentColumn);
-    append(&sb, " FROM %_content");
-    if( idxNum!=QUERY_GENERIC ) append(&sb, " WHERE docid = ?");
-    rc = sql_prepare(v->db, v->zDb, v->zName, &c->pStmt,
-                     stringBufferData(&sb));
-    stringBufferDestroy(&sb);
-    if( rc!=SQLITE_OK ) return rc;
-    c->iCursorType = idxNum;
-  }else{
-    sqlite3_reset(c->pStmt);
-    assert( c->iCursorType==idxNum );
-  }
+  initStringBuffer(&sb);
+  append(&sb, "SELECT docid, ");
+  appendList(&sb, v->nColumn, v->azContentColumn);
+  append(&sb, " FROM %_content");
+  if( idxNum!=QUERY_GENERIC ) append(&sb, " WHERE docid = ?");
+  sqlite3_finalize(c->pStmt);
+  rc = sql_prepare(v->db, v->zDb, v->zName, &c->pStmt, stringBufferData(&sb));
+  stringBufferDestroy(&sb);
+  if( rc!=SQLITE_OK ) return rc;
 
+  c->iCursorType = idxNum;
   switch( idxNum ){
     case QUERY_GENERIC:
       break;
@@ -3948,10 +4749,10 @@
 
     default:   /* full-text search */
     {
-      int iCol = idxNum-QUERY_FULLTEXT;
       const char *zQuery = (const char *)sqlite3_value_text(argv[0]);
       assert( idxNum<=QUERY_FULLTEXT+v->nColumn);
       assert( argc==1 );
+      queryClear(&c->q);
       if( c->result.nData!=0 ){
         /* This case happens if the same cursor is used repeatedly. */
         dlrDestroy(&c->reader);
@@ -3959,10 +4760,17 @@
       }else{
         dataBufferInit(&c->result, 0);
       }
-      rc = fulltextQuery(v, iCol, zQuery, -1, &c->result, &c->pExpr);
+      rc = fulltextQuery(v, idxNum-QUERY_FULLTEXT, zQuery, -1, &c->result, &c->q);
       if( rc!=SQLITE_OK ) return rc;
       if( c->result.nData!=0 ){
+
+#ifdef STORE_CATEGORY
+        dlrInit(&c->reader, DL_POSITIONS, c->result.pData, c->result.nData);
+#else      
         dlrInit(&c->reader, DL_DOCIDS, c->result.pData, c->result.nData);
+
+#endif   
+        
       }
       break;
     }
@@ -3991,6 +4799,13 @@
   fulltext_cursor *c = (fulltext_cursor *) pCursor;
   fulltext_vtab *v = cursor_vtab(c);
 
+#ifdef STORE_CATEGORY 
+  if (idxCol == 0) {
+    sqlite3_result_int (pContext, c->currentCatid);
+    return SQLITE_OK;
+  }
+#endif
+       
   if( idxCol<v->nColumn ){
     sqlite3_value *pVal = sqlite3_column_value(c->pStmt, idxCol+1);
     sqlite3_result_value(pContext, pVal);
@@ -4023,25 +4838,46 @@
 ** we also store positions and offsets in the hash table using that
 ** column number.
 */
-static int buildTerms(fulltext_vtab *v, sqlite_int64 iDocid,
-                      const char *zText, int iColumn){
-  sqlite3_tokenizer *pTokenizer = v->pTokenizer;
-  sqlite3_tokenizer_cursor *pCursor;
+static int buildTerms(fulltext_vtab *v, sqlite_int64 iDocid, 
+
+#ifdef STORE_CATEGORY      
+int Catid,
+#endif
+                     const char *zText, int iColumn){
+                     
   const char *pToken;
   int nTokenBytes;
-  int iStartOffset, iEndOffset, iPosition;
+  int iStartOffset, iEndOffset, iPosition, stop_word, new_paragraph;
   int rc;
+  TrackerParser *parser = v->parser;
+
+  if (!zText) return SQLITE_OK;
+
+  tracker_parser_reset (parser, zText, strlen (zText), FALSE, TRUE, TRUE, FALSE);
+
+  while( 1 ){
+
+    pToken = tracker_parser_next (parser, &iPosition,
+                                    &iStartOffset,
+                                    &iEndOffset,
+                                    &new_paragraph,
+                                    &stop_word,
+                                    &nTokenBytes);
+   if (!pToken) {
+       break;
+   }
+
+  // printf("token being indexed  is %s, begin is %d, end is %d and length is %d\n", pToken, iStartOffset, iEndOffset, nTokenBytes);
+
+   if (stop_word) {
+       continue;
+   }
+
+
 
-  rc = pTokenizer->pModule->xOpen(pTokenizer, zText, -1, &pCursor);
-  if( rc!=SQLITE_OK ) return rc;
 
-  pCursor->pTokenizer = pTokenizer;
-  while( SQLITE_OK==(rc=pTokenizer->pModule->xNext(pCursor,
-                                                   &pToken, &nTokenBytes,
-                                                   &iStartOffset, &iEndOffset,
-                                                   &iPosition)) ){
     DLCollector *p;
-    int nData;                   /* Size of doclist before our update. */
+    int nData;                  /* Size of doclist before our update. */
 
     /* Positions can't be negative; we use -1 as a terminator
      * internally.  Token can't be NULL or empty. */
@@ -4053,14 +4889,28 @@
     p = fts3HashFind(&v->pendingTerms, pToken, nTokenBytes);
     if( p==NULL ){
       nData = 0;
+      
+#ifdef STORE_CATEGORY       
+      p = dlcNew(iDocid, DL_DEFAULT, Catid);
+#else
       p = dlcNew(iDocid, DL_DEFAULT);
+#endif
+
       fts3HashInsert(&v->pendingTerms, pToken, nTokenBytes, p);
 
       /* Overhead for our hash table entry, the key, and the value. */
       v->nPendingData += sizeof(struct fts3HashElem)+sizeof(*p)+nTokenBytes;
     }else{
       nData = p->b.nData;
-      if( p->dlw.iPrevDocid!=iDocid ) dlcNext(p, iDocid);
+      if( p->dlw.iPrevDocid!=iDocid ) {
+#ifdef STORE_CATEGORY       
+        dlcNext(p, iDocid, Catid);
+#else
+        dlcNext(p, iDocid);
+#endif
+
+      
+      }
     }
     if( iColumn>=0 ){
       dlcAddPos(p, iColumn, iPosition, iStartOffset, iEndOffset);
@@ -4075,20 +4925,38 @@
   ** though one could argue that failure there means that the data is
   ** not durable.  *ponder*
   */
-  pTokenizer->pModule->xClose(pCursor);
-  if( SQLITE_DONE == rc ) return SQLITE_OK;
-  return rc;
+
+  return SQLITE_OK;
+
 }
 
 /* Add doclists for all terms in [pValues] to pendingTerms table. */
 static int insertTerms(fulltext_vtab *v, sqlite_int64 iDocid,
                        sqlite3_value **pValues){
   int i;
+  
+#ifdef STORE_CATEGORY   
+  
+  /* tracker - category is at column 0 so we don't want to add that value to index */
+  for(i = 1; i < v->nColumn ; ++i){
+    char *zText = (char*)sqlite3_value_text(pValues[i]);
+    
+    /* tracker - as for col id we want col 0 to be the default metadata field (file:contents or email:body),
+    col 1 to be metadata id 1, col 2 to be metadata id 2 etc so need to decrement i here */
+    int rc = buildTerms(v, iDocid, sqlite3_value_int (pValues[0]), zText, i-1);
+    if( rc!=SQLITE_OK ) return rc;
+  }
+  
+#else
+
   for(i = 0; i < v->nColumn ; ++i){
     char *zText = (char*)sqlite3_value_text(pValues[i]);
     int rc = buildTerms(v, iDocid, zText, i);
     if( rc!=SQLITE_OK ) return rc;
   }
+  
+#endif  
+
   return SQLITE_OK;
 }
 
@@ -4105,10 +4973,19 @@
   rc = content_select(v, iDocid, &pValues);
   if( rc!=SQLITE_OK ) return rc;
 
+#ifdef STORE_CATEGORY   
+  
+  for(i = 1 ; i < v->nColumn; ++i) {
+    rc = buildTerms(v, iDocid, atoi(pValues[0]), pValues[i], -1);
+    if( rc!=SQLITE_OK ) break;
+  }
+
+#else
   for(i = 0 ; i < v->nColumn; ++i) {
     rc = buildTerms(v, iDocid, pValues[i], -1);
     if( rc!=SQLITE_OK ) break;
   }
+#endif
 
   freeStringArray(v->nColumn, pValues);
   return SQLITE_OK;
@@ -5843,14 +6720,9 @@
 /* Scan the database and merge together the posting lists for the term
 ** into *out.
 */
-static int termSelect(
-  fulltext_vtab *v, 
-  int iColumn,
-  const char *pTerm, int nTerm,             /* Term to query for */
-  int isPrefix,                             /* True for a prefix search */
-  DocListType iType, 
-  DataBuffer *out                           /* Write results here */
-){
+static int termSelect(fulltext_vtab *v, int iColumn,
+                     const char *pTerm, int nTerm, int isPrefix,
+                     DocListType iType, DataBuffer *out){
   DataBuffer doclist;
   sqlite3_stmt *s;
   int rc = sql_get_statement(v, SEGDIR_SELECT_ALL_STMT, &s);
@@ -5860,7 +6732,6 @@
   assert( v->nPendingData<0 );
 
   dataBufferInit(&doclist, 0);
-  dataBufferInit(out, 0);
 
   /* Traverse the segments from oldest to newest so that newer doclist
   ** elements for given docids overwrite older elements.
@@ -6147,12 +7018,37 @@
     snippetAllOffsets(pCursor);
     snippetText(pCursor, zStart, zEnd, zEllipsis);
     sqlite3_result_text(pContext, pCursor->snippet.zSnippet,
-                        pCursor->snippet.nSnippet, SQLITE_STATIC);
+                       pCursor->snippet.nSnippet, SQLITE_STATIC);
+  }
+}
+
+
+/*
+** Implementation of the rank() function for FTS3
+*/
+static void rankFunc(
+  sqlite3_context *pContext,
+  int argc,
+  sqlite3_value **argv
+){
+
+       // TODO
+
+  fulltext_cursor *pCursor;
+  if( argc<1 ) return;
+  if( sqlite3_value_type(argv[0])!=SQLITE_BLOB ||
+      sqlite3_value_bytes(argv[0])!=sizeof(pCursor) ){
+    sqlite3_result_error(pContext, "illegal first argument to rank",-1);
+  }else{
+    memcpy(&pCursor, sqlite3_value_blob(argv[0]), sizeof(pCursor));
+    sqlite3_result_double(pContext, pCursor->rank);
   }
 }
 
 /*
 ** Implementation of the offsets() function for FTS3
+** altered by tracker to omit query term position as that
+** info is not stored in the position data in the index
 */
 static void snippetOffsetsFunc(
   sqlite3_context *pContext,
@@ -6166,11 +7062,11 @@
     sqlite3_result_error(pContext, "illegal first argument to offsets",-1);
   }else{
     memcpy(&pCursor, sqlite3_value_blob(argv[0]), sizeof(pCursor));
-    snippetAllOffsets(pCursor);
-    snippetOffsetText(&pCursor->snippet);
+    
+    /* (tracker) output caches position data in column, position string format */
     sqlite3_result_text(pContext,
-                        pCursor->snippet.zOffset, pCursor->snippet.nOffset,
-                        SQLITE_STATIC);
+                       pCursor->offsets->str, pCursor->offsets->len,
+                       SQLITE_STATIC);
   }
 }
 
@@ -6850,6 +7746,9 @@
   }else if( strcmp(zName,"offsets")==0 ){
     *pxFunc = snippetOffsetsFunc;
     return 1;
+  }else if( strcmp(zName,"rank")==0 ){
+    *pxFunc = rankFunc;
+    return 1;
   }else if( strcmp(zName,"optimize")==0 ){
     *pxFunc = optimizeFunc;
     return 1;
@@ -6918,27 +7817,6 @@
   /* xRename */       fulltextRename,
 };
 
-static void hashDestroy(void *p){
-  fts3Hash *pHash = (fts3Hash *)p;
-  sqlite3Fts3HashClear(pHash);
-  sqlite3_free(pHash);
-}
-
-/*
-** The fts3 built-in tokenizers - "simple" and "porter" - are implemented
-** in files fts3_tokenizer1.c and fts3_porter.c respectively. The following
-** two forward declarations are for functions declared in these files
-** used to retrieve the respective implementations.
-**
-** Calling sqlite3Fts3SimpleTokenizerModule() sets the value pointed
-** to by the argument to point a the "simple" tokenizer implementation.
-** Function ...PorterTokenizerModule() sets *pModule to point to the
-** porter tokenizer/stemmer implementation.
-*/
-void sqlite3Fts3SimpleTokenizerModule(sqlite3_tokenizer_module const**ppModule);
-void sqlite3Fts3PorterTokenizerModule(sqlite3_tokenizer_module const**ppModule);
-void sqlite3Fts3IcuTokenizerModule(sqlite3_tokenizer_module const**ppModule);
-
 int sqlite3Fts3InitHashTable(sqlite3 *, fts3Hash *, const char *);
 
 /*
@@ -6949,45 +7827,13 @@
 */
 int sqlite3Fts3Init(sqlite3 *db){
   int rc = SQLITE_OK;
-  fts3Hash *pHash = 0;
-  const sqlite3_tokenizer_module *pSimple = 0;
-  const sqlite3_tokenizer_module *pPorter = 0;
-  const sqlite3_tokenizer_module *pIcu = 0;
-
-  sqlite3Fts3SimpleTokenizerModule(&pSimple);
-  sqlite3Fts3PorterTokenizerModule(&pPorter);
-#ifdef SQLITE_ENABLE_ICU
-  sqlite3Fts3IcuTokenizerModule(&pIcu);
-#endif
 
-  /* Allocate and initialise the hash-table used to store tokenizers. */
-  pHash = sqlite3_malloc(sizeof(fts3Hash));
-  if( !pHash ){
-    rc = SQLITE_NOMEM;
-  }else{
-    sqlite3Fts3HashInit(pHash, FTS3_HASH_STRING, 1);
-  }
-
-  /* Load the built-in tokenizers into the hash table */
-  if( rc==SQLITE_OK ){
-    if( sqlite3Fts3HashInsert(pHash, "simple", 7, (void *)pSimple)
-     || sqlite3Fts3HashInsert(pHash, "porter", 7, (void *)pPorter) 
-     || (pIcu && sqlite3Fts3HashInsert(pHash, "icu", 4, (void *)pIcu))
-    ){
-      rc = SQLITE_NOMEM;
-    }
-  }
-
-#ifdef SQLITE_TEST
-  sqlite3Fts3ExprInitTestInterface(db);
-#endif
-
-  /* Create the virtual table wrapper around the hash-table and overload 
+  /* Create the virtual table wrapper around the hash-table and overload
   ** the two scalar functions. If this is successful, register the
   ** module with sqlite.
   */
-  if( SQLITE_OK==rc 
-   && SQLITE_OK==(rc = sqlite3Fts3InitHashTable(db, pHash, "fts3_tokenizer"))
+  if( SQLITE_OK==rc
+   && SQLITE_OK==(rc = sqlite3_overload_function(db, "rank", -1))
    && SQLITE_OK==(rc = sqlite3_overload_function(db, "snippet", -1))
    && SQLITE_OK==(rc = sqlite3_overload_function(db, "offsets", -1))
    && SQLITE_OK==(rc = sqlite3_overload_function(db, "optimize", -1))
@@ -6997,28 +7843,23 @@
 #endif
   ){
     return sqlite3_create_module_v2(
-        db, "fts3", &fts3Module, (void *)pHash, hashDestroy
+       db, "trackerfts", &fts3Module, 0, 0
     );
   }
 
-  /* An error has occurred. Delete the hash table and return the error code. */
+  /* An error has occurred. Return the error code. */
   assert( rc!=SQLITE_OK );
-  if( pHash ){
-    sqlite3Fts3HashClear(pHash);
-    sqlite3_free(pHash);
-  }
+
   return rc;
 }
 
-#if !SQLITE_CORE
+
 int sqlite3_extension_init(
-  sqlite3 *db, 
+  sqlite3 *db,
   char **pzErrMsg,
   const sqlite3_api_routines *pApi
 ){
   SQLITE_EXTENSION_INIT2(pApi)
   return sqlite3Fts3Init(db);
 }
-#endif
 
-#endif /* !defined(SQLITE_CORE) || defined(SQLITE_ENABLE_FTS3) */
--- ../../../sqlite/ext/fts3/fts3_hash.c        2008-11-13 19:12:35.000000000 +0000
+++ tracker-fts-hash.c  2009-03-05 16:53:34.000000000 +0000
@@ -23,14 +23,13 @@
 **     * The FTS3 module is being built into the core of
 **       SQLite (in which case SQLITE_ENABLE_FTS3 is defined).
 */
-#if !defined(SQLITE_CORE) || defined(SQLITE_ENABLE_FTS3)
 
 #include <assert.h>
 #include <stdlib.h>
 #include <string.h>
 
-#include "sqlite3.h"
-#include "fts3_hash.h"
+#include <sqlite3.h>
+#include "tracker-fts-hash.h"
 
 /*
 ** Malloc and Free functions
@@ -338,13 +337,6 @@
     return old_data;
   }
   if( data==0 ) return 0;
-  if( pH->htsize==0 ){
-    fts3Rehash(pH,8);
-    if( pH->htsize==0 ){
-      pH->count = 0;
-      return data;
-    }
-  }
   new_elem = (fts3HashElem*)fts3HashMalloc( sizeof(fts3HashElem) );
   if( new_elem==0 ) return data;
   if( pH->copyKey && pKey!=0 ){
@@ -359,6 +351,14 @@
   }
   new_elem->nKey = nKey;
   pH->count++;
+  if( pH->htsize==0 ){
+    fts3Rehash(pH,8);
+    if( pH->htsize==0 ){
+      pH->count = 0;
+      fts3HashFree(new_elem);
+      return data;
+    }
+  }
   if( pH->count > pH->htsize ){
     fts3Rehash(pH,pH->htsize*2);
   }
@@ -370,4 +370,4 @@
   return 0;
 }
 
-#endif /* !defined(SQLITE_CORE) || defined(SQLITE_ENABLE_FTS3) */
+
Index: tracker-fts.c
===================================================================
--- tracker-fts.c       (revision 3021)
+++ tracker-fts.c       (working copy)
@@ -1,7 +1,7 @@
 /*
 ** 2006 Oct 10
 **
-** The author disclaims copyright to this source code. In place of
+** The author disclaims copyright to this source code.  In place of
 ** a legal notice, here is a blessing:
 **
 **    May you do good and not evil.
@@ -13,20 +13,14 @@
 ** This is an SQLite module implementing full-text search.
 */
 
-
-// gcc -shared -o tracker-fts *.c
-//gcc -Wall -fPIC -c *.c
-
-//gcc -shared -Wl,-soname,libtracker-fts.so.1 -o libtracker-fts.so.1.0  *.o
-
 /*
 ** The code in this file is only compiled if:
 **
 **     * The FTS3 module is being built as an extension
-**      (in which case SQLITE_CORE is not defined), or
+**       (in which case SQLITE_CORE is not defined), or
 **
 **     * The FTS3 module is being built into the core of
-**      SQLite (in which case SQLITE_ENABLE_FTS3 is defined).
+**       SQLite (in which case SQLITE_ENABLE_FTS3 is defined).
 */
 
 /* TODO(shess) Consider exporting this comment to an HTML file or the
@@ -35,7 +29,7 @@
 /* The full-text index is stored in a series of b+tree (-like)
 ** structures called segments which map terms to doclists.  The
 ** structures are like b+trees in layout, but are constructed from the
-** bottom up in optimal fashion and are not updatable. Since trees
+** bottom up in optimal fashion and are not updatable.  Since trees
 ** are built from the bottom up, things will be described from the
 ** bottom up.
 **
@@ -46,8 +40,8 @@
 ** using seven bits * per byte as follows:
 **
 ** KEY:
-**        A = 0xxxxxxx    7 bits of data and one flag bit
-**        B = 1xxxxxxx    7 bits of data and one flag bit
+**         A = 0xxxxxxx    7 bits of data and one flag bit
+**         B = 1xxxxxxx    7 bits of data and one flag bit
 **
 **  7 bits - A
 ** 14 bits - BA
@@ -59,28 +53,28 @@
 **
 **** Document lists ****
 ** A doclist (document list) holds a docid-sorted list of hits for a
-** given term. Doclists hold docids, and can optionally associate
+** given term.  Doclists hold docids, and can optionally associate
 ** token positions and offsets with docids.
 **
 ** A DL_POSITIONS_OFFSETS doclist is stored like this:
 **
 ** array {
 **   varint docid;
-**   array {               (position list for column 0)
+**   array {                (position list for column 0)
 **     varint position;     (delta from previous position plus POS_BASE)
 **     varint startOffset;  (delta from previous startOffset)
 **     varint endOffset;    (delta from startOffset)
 **   }
 **   array {
 **     varint POS_COLUMN;   (marks start of position list for new column)
-**     varint column;      (index of new column)
+**     varint column;       (index of new column)
 **     array {
-**      varint position;   (delta from previous position plus POS_BASE)
-**      varint startOffset;(delta from previous startOffset)
-**      varint endOffset;  (delta from startOffset)
+**       varint position;   (delta from previous position plus POS_BASE)
+**       varint startOffset;(delta from previous startOffset)
+**       varint endOffset;  (delta from startOffset)
 **     }
 **   }
-**   varint POS_END;       (marks end of positions for this document.
+**   varint POS_END;        (marks end of positions for this document.
 ** }
 **
 ** Here, array { X } means zero or more occurrences of X, adjacent in
@@ -106,17 +100,17 @@
 ** iterate through a segment's entire leaf layer).  Leaf nodes have
 ** the format:
 **
-** varint iHeight;            (height from leaf level, always 0)
-** varint nTerm;              (length of first term)
-** char pTerm[nTerm];         (content of first term)
-** varint nDoclist;           (length of term's associated doclist)
+** varint iHeight;             (height from leaf level, always 0)
+** varint nTerm;               (length of first term)
+** char pTerm[nTerm];          (content of first term)
+** varint nDoclist;            (length of term's associated doclist)
 ** char pDoclist[nDoclist];    (content of doclist)
 ** array {
-**                            (further terms are delta-encoded)
-**   varint nPrefix;          (length of prefix shared with previous term)
-**   varint nSuffix;          (length of unshared suffix)
+**                             (further terms are delta-encoded)
+**   varint nPrefix;           (length of prefix shared with previous term)
+**   varint nSuffix;           (length of unshared suffix)
 **   char pTermSuffix[nSuffix];(unshared suffix of next term)
-**   varint nDoclist;         (length of term's associated doclist)
+**   varint nDoclist;          (length of term's associated doclist)
 **   char pDoclist[nDoclist];  (content of doclist)
 ** }
 **
@@ -152,15 +146,15 @@
 ** itself grows too big and must be split.  The format of interior
 ** nodes:
 **
-** varint iHeight;          (height from leaf level, always >0)
-** varint iBlockid;         (block id of node's leftmost subtree)
+** varint iHeight;           (height from leaf level, always >0)
+** varint iBlockid;          (block id of node's leftmost subtree)
 ** optional {
-**   varint nTerm;          (length of first term)
+**   varint nTerm;           (length of first term)
 **   char pTerm[nTerm];      (content of first term)
 **   array {
-**                               (further terms are delta-encoded)
-**     varint nPrefix;           (length of shared prefix with previous term)
-**     varint nSuffix;           (length of unshared suffix)
+**                                (further terms are delta-encoded)
+**     varint nPrefix;            (length of shared prefix with previous term)
+**     varint nSuffix;            (length of unshared suffix)
 **     char pTermSuffix[nSuffix]; (unshared suffix of next term)
 **   }
 ** }
@@ -170,11 +164,11 @@
 **
 ** An interior node encodes n terms separating n+1 subtrees.  The
 ** subtree blocks are contiguous, so only the first subtree's blockid
-** is encoded. The subtree at iBlockid will contain all terms less
+** is encoded.  The subtree at iBlockid will contain all terms less
 ** than the first term encoded (or all terms if no term is encoded).
 ** Otherwise, for terms greater than or equal to pTerm[i] but less
 ** than pTerm[i+1], the subtree for that term will be rooted at
-** iBlockid+i. Interior nodes only store enough term data to
+** iBlockid+i.  Interior nodes only store enough term data to
 ** distinguish adjacent children (if the rightmost term of the left
 ** child is "something", and the leftmost term of the right child is
 ** "wicked", only "w" is stored).
@@ -201,21 +195,21 @@
 ** height and the blockid of the previous root).
 **
 ** The meta-information in the segment directory is:
-**   level              - segment level (see below)
-**   idx                - index within level
-**                      - (level,idx uniquely identify a segment)
-**   start_block        - first leaf node
-**   leaves_end_block   - last leaf node
-**   end_block          - last block (including interior nodes)
-**   root               - contents of root node
+**   level               - segment level (see below)
+**   idx                 - index within level
+**                       - (level,idx uniquely identify a segment)
+**   start_block         - first leaf node
+**   leaves_end_block    - last leaf node
+**   end_block           - last block (including interior nodes)
+**   root                - contents of root node
 **
 ** If the root node is a leaf node, then start_block,
 ** leaves_end_block, and end_block are all 0.
 **
 **
 **** Segment merging ****
-** To amortize update costs, segments are groups into levels and
-** merged in matches.  Each increase in level represents exponentially
+** To amortize update costs, segments are grouped into levels and
+** merged in batches.  Each increase in level represents exponentially
 ** more documents.
 **
 ** New documents (actually, document updates) are tokenized and
@@ -234,7 +228,7 @@
 ** deleted.
 **
 ** MERGE_COUNT controls how often we merge segments.  16 seems to be
-** somewhat of a sweet spot for insertion performance. 32 and 64 show
+** somewhat of a sweet spot for insertion performance.  32 and 64 show
 ** very similar performance numbers to 16 on insertion, though they're
 ** a tiny bit slower (perhaps due to more overhead in merge-time
 ** sorting).  8 is about 20% slower than 16, 4 about 50% slower than
@@ -245,10 +239,10 @@
 ** inserted:
 **
 **    MERGE_COUNT   segments
-**      16           25
-**       8           12
-**       4           10
-**       2            6
+**       16           25
+**        8           12
+**        4           10
+**        2            6
 **
 ** This appears to have only a moderate impact on queries for very
 ** frequent terms (which are somewhat dominated by segment merge
@@ -269,12 +263,12 @@
 ** write an empty doclist (varint(docid) varint(POS_END)), for updates
 ** we simply write the new doclist.  Segment merges overwrite older
 ** data for a particular docid with newer data, so deletes or updates
-** will eventually overtake the earlier data and knock it out. The
+** will eventually overtake the earlier data and knock it out.  The
 ** query logic likewise merges doclists so that newer data knocks out
 ** older data.
 **
 ** TODO(shess) Provide a VACUUM type operation to clear out all
-** deletions and duplications. This would basically be a forced merge
+** deletions and duplications.  This would basically be a forced merge
 ** into a single segment.
 */
 
@@ -296,8 +290,6 @@
 
 SQLITE_EXTENSION_INIT1
 
-
-
 /* TODO(shess) MAN, this thing needs some refactoring. At minimum, it
 ** would be nice to order the file better, perhaps something along the
 ** lines of:
@@ -317,11 +309,9 @@
 # define FTSTRACE(A)
 #endif
 
-
 static int default_column = 0;
 
-/*  functions needed from tracker */
-
+/* Functions from Tracker */
 static TrackerDBResultSet *
 db_metadata_get (TrackerDBInterface *iface, 
                 const gchar        *id, 
@@ -375,8 +365,6 @@
                                                       NULL);
 }
 
-
-
 static gchar *
 db_get_text (const char     *service,
             const char     *key,    
@@ -420,8 +408,8 @@
 
 
 /*
-** Default span for NEAR operators.
-*/
+** Default span for NEAR operators.
+*/
 #define SQLITE_FTS3_DEFAULT_NEAR_PARAM 10
 
 /* It is not safe to call isspace(), tolower(), or isalnum() on
@@ -462,7 +450,7 @@
 ** By default, only positions and not offsets are stored in the doclists.
 ** To change this so that offsets are stored too, compile with
 **
-**         -DDL_DEFAULT=DL_POSITIONS_OFFSETS
+**          -DDL_DEFAULT=DL_POSITIONS_OFFSETS
 **
 ** If DL_DEFAULT is set to DL_DOCIDS, your table can only be inserted
 ** into (no deletes or updates).
@@ -472,8 +460,8 @@
 #endif
 
 enum {
-  POS_END = 0,       /* end of this position list */
-  POS_COLUMN,        /* followed by new column number */
+  POS_END = 0,        /* end of this position list */
+  POS_COLUMN,         /* followed by new column number */
   POS_BASE
 };
 
@@ -560,9 +548,9 @@
 ** dataBufferReplace - replace buffer's data.
 */
 typedef struct DataBuffer {
-  char *pData;         /* Pointer to malloc'ed buffer. */
-  int nCapacity;       /* Size of pData buffer. */
-  int nData;           /* End of data loaded into pData. */
+  char *pData;          /* Pointer to malloc'ed buffer. */
+  int nCapacity;        /* Size of pData buffer. */
+  int nData;            /* End of data loaded into pData. */
 } DataBuffer;
 
 static void dataBufferInit(DataBuffer *pBuffer, int nCapacity){
@@ -585,7 +573,7 @@
 }
 static void dataBufferExpand(DataBuffer *pBuffer, int nAddCapacity){
   assert( nAddCapacity>0 );
-  /* TODO(shess) Consider expanding more aggressively. Note that the
+  /* TODO(shess) Consider expanding more aggressively.  Note that the
   ** underlying malloc implementation may take care of such things for
   ** us already.
   */
@@ -595,15 +583,15 @@
   }
 }
 static void dataBufferAppend(DataBuffer *pBuffer,
-                            const char *pSource, int nSource){
+                             const char *pSource, int nSource){
   assert( nSource>0 && pSource!=NULL );
   dataBufferExpand(pBuffer, nSource);
   memcpy(pBuffer->pData+pBuffer->nData, pSource, nSource);
   pBuffer->nData += nSource;
 }
 static void dataBufferAppend2(DataBuffer *pBuffer,
-                             const char *pSource1, int nSource1,
-                             const char *pSource2, int nSource2){
+                              const char *pSource1, int nSource1,
+                              const char *pSource2, int nSource2){
   assert( nSource1>0 && pSource1!=NULL );
   assert( nSource2>0 && pSource2!=NULL );
   dataBufferExpand(pBuffer, nSource1+nSource2);
@@ -612,14 +600,14 @@
   pBuffer->nData += nSource1+nSource2;
 }
 static void dataBufferReplace(DataBuffer *pBuffer,
-                             const char *pSource, int nSource){
+                              const char *pSource, int nSource){
   dataBufferReset(pBuffer);
   dataBufferAppend(pBuffer, pSource, nSource);
 }
 
 /* StringBuffer is a null-terminated version of DataBuffer. */
 typedef struct StringBuffer {
-  DataBuffer b;                   /* Includes null terminator. */
+  DataBuffer b;            /* Includes null terminator. */
 } StringBuffer;
 
 static void initStringBuffer(StringBuffer *sb){
@@ -746,7 +734,7 @@
   return pReader->nData;
 }
 /* TODO(shess) Consider adding a field to track iDocid varint length
-** to make these two functions faster. This might matter (a tiny bit)
+** to make these two functions faster.  This might matter (a tiny bit)
 ** for queries.
 */
 static const char *dlrPosData(DLReader *pReader){
@@ -797,17 +785,17 @@
     if( pReader->iType>=DL_POSITIONS ){
       assert( n<pReader->nData );
       while( 1 ){
-       n += fts3GetVarint32(pReader->pData+n, &iDummy);
-       assert( n<=pReader->nData );
-       if( iDummy==POS_END ) break;
-       if( iDummy==POS_COLUMN ){
-         n += fts3GetVarint32(pReader->pData+n, &iDummy);
-         assert( n<pReader->nData );
-       }else if( pReader->iType==DL_POSITIONS_OFFSETS ){
-         n += fts3GetVarint32(pReader->pData+n, &iDummy);
-         n += fts3GetVarint32(pReader->pData+n, &iDummy);
-         assert( n<pReader->nData );
-       }
+        n += fts3GetVarint32(pReader->pData+n, &iDummy);
+        assert( n<=pReader->nData );
+        if( iDummy==POS_END ) break;
+        if( iDummy==POS_COLUMN ){
+          n += fts3GetVarint32(pReader->pData+n, &iDummy);
+          assert( n<pReader->nData );
+        }else if( pReader->iType==DL_POSITIONS_OFFSETS ){
+          n += fts3GetVarint32(pReader->pData+n, &iDummy);
+          n += fts3GetVarint32(pReader->pData+n, &iDummy);
+          assert( n<pReader->nData );
+        }
       }
     }
     pReader->nElement = n;
@@ -815,7 +803,7 @@
   }
 }
 static void dlrInit(DLReader *pReader, DocListType iType,
-                   const char *pData, int nData){
+                    const char *pData, int nData){
   assert( pData!=NULL && nData!=0 );
   pReader->iType = iType;
   pReader->pData = pData;
@@ -840,7 +828,7 @@
 ** DLWriter.
 */
 static void docListValidate(DocListType iType, const char *pData, int nData,
-                           sqlite_int64 *pLastDocid){
+                            sqlite_int64 *pLastDocid){
   sqlite_int64 iPrevDocid = 0;
   assert( nData>0 );
   assert( pData!=0 );
@@ -858,15 +846,15 @@
     if( iType>DL_DOCIDS ){
       int iDummy;
       while( 1 ){
-       n += fts3GetVarint32(pData+n, &iDummy);
-       if( iDummy==POS_END ) break;
-       if( iDummy==POS_COLUMN ){
-         n += fts3GetVarint32(pData+n, &iDummy);
-       }else if( iType>DL_POSITIONS ){
-         n += fts3GetVarint32(pData+n, &iDummy);
-         n += fts3GetVarint32(pData+n, &iDummy);
-       }
-       assert( n<=nData );
+        n += fts3GetVarint32(pData+n, &iDummy);
+        if( iDummy==POS_END ) break;
+        if( iDummy==POS_COLUMN ){
+          n += fts3GetVarint32(pData+n, &iDummy);
+        }else if( iType>DL_POSITIONS ){
+          n += fts3GetVarint32(pData+n, &iDummy);
+          n += fts3GetVarint32(pData+n, &iDummy);
+        }
+        assert( n<=nData );
       }
     }
     assert( n<=nData );
@@ -925,11 +913,11 @@
 ** Consider a refactor to make this cleaner.
 */
 static void dlwAppend(DLWriter *pWriter,
-                     const char *pData, int nData,
-                     sqlite_int64 iFirstDocid, sqlite_int64 iLastDocid){
+                      const char *pData, int nData,
+                      sqlite_int64 iFirstDocid, sqlite_int64 iLastDocid){
   sqlite_int64 iDocid = 0;
   char c[VARINT_MAX];
-  int nFirstOld, nFirstNew;    /* Old and new varint len of first docid. */
+  int nFirstOld, nFirstNew;     /* Old and new varint len of first docid. */
 #ifndef NDEBUG
   sqlite_int64 iLastDocidDelta;
 #endif
@@ -946,12 +934,12 @@
   ASSERT_VALID_DOCLIST(pWriter->iType, pData, nData, &iLastDocidDelta);
   assert( iLastDocid==iFirstDocid-iDocid+iLastDocidDelta );
 
-  /* Append recoded initial docid and everything else. Rest of docids
+  /* Append recoded initial docid and everything else.  Rest of docids
   ** should have been delta-encoded from previous initial docid.
   */
   if( nFirstOld<nData ){
     dataBufferAppend2(pWriter->b, c, nFirstNew,
-                     pData+nFirstOld, nData-nFirstOld);
+                      pData+nFirstOld, nData-nFirstOld);
   }else{
     dataBufferAppend(pWriter->b, c, nFirstNew);
   }
@@ -959,7 +947,7 @@
 }
 static void dlwCopy(DLWriter *pWriter, DLReader *pReader){
   dlwAppend(pWriter, dlrDocData(pReader), dlrDocDataBytes(pReader),
-           dlrDocid(pReader), dlrDocid(pReader));
+            dlrDocid(pReader), dlrDocid(pReader));
 }
 
 
@@ -1020,7 +1008,7 @@
   int nData;
 
   DocListType iType;
-  int iColumn;        /* the last column read */
+  int iColumn;         /* the last column read */
   int iPosition;       /* the last position read */
   int iStartOffset;    /* the last start offset read */
   int iEndOffset;      /* the last end offset read */
@@ -1087,7 +1075,7 @@
   pReader->pData = dlrPosData(pDLReader);
   pReader->nData = dlrPosDataLen(pDLReader);
   pReader->iType = pDLReader->iType;
-  pReader->iColumn = default_column;
+  pReader->iColumn = 0;
   pReader->iPosition = 0;
   pReader->iStartOffset = 0;
   pReader->iEndOffset = 0;
@@ -1136,9 +1124,9 @@
 typedef struct PLWriter {
   DLWriter *dlw;
 
-  int iColumn;   /* the last column written */
-  int iPos;      /* the last position written */
-  int iOffset;   /* the last start offset written */
+  int iColumn;    /* the last column written */
+  int iPos;       /* the last position written */
+  int iOffset;    /* the last start offset written */
 } PLWriter;
 
 /* TODO(shess) In the case where the parent is reading these values
@@ -1146,7 +1134,7 @@
 ** the same type as pWriter.
 */
 static void plwAdd(PLWriter *pWriter, int iColumn, int iPos,
-                  int iStartOffset, int iEndOffset){
+                   int iStartOffset, int iEndOffset){
   /* Worst-case space for POS_COLUMN, iColumn, iPosDelta,
   ** iStartOffsetDelta, and iEndOffsetDelta.
   */
@@ -1179,7 +1167,7 @@
 }
 static void plwCopy(PLWriter *pWriter, PLReader *pReader){
   plwAdd(pWriter, plrColumn(pReader), plrPosition(pReader),
-        plrStartOffset(pReader), plrEndOffset(pReader));
+         plrStartOffset(pReader), plrEndOffset(pReader));
 }
 
 
@@ -1278,7 +1266,7 @@
 } DLCollector;
 
 /* TODO(shess) This could also be done by calling plwTerminate() and
-** dataBufferAppend(). I tried that, expecting nominal performance
+** dataBufferAppend().  I tried that, expecting nominal performance
 ** differences, but it seemed to pretty reliably be worth 1% to code
 ** it this way.  I suspect it is the incremental malloc overhead (some
 ** percentage of the plwTerminate() calls will cause a realloc), so
@@ -1355,7 +1343,7 @@
 ** during the merge.
 */
 static void docListTrim(DocListType iType, const char *pData, int nData,
-                       int iColumn, DocListType iOutType, DataBuffer *out){
+                        int iColumn, DocListType iOutType, DataBuffer *out){
   DLReader dlReader;
   DLWriter dlWriter;
 
@@ -1417,7 +1405,7 @@
 static int orderedDLReaderCmp(OrderedDLReader *r1, OrderedDLReader *r2){
   if( dlrAtEnd(r1->pReader) ){
     if( dlrAtEnd(r2->pReader) ) return 0;  /* Both atEnd(). */
-    return 1;                             /* Only r1 atEnd(). */
+    return 1;                              /* Only r1 atEnd(). */
   }
   if( dlrAtEnd(r2->pReader) ) return -1;   /* Only r2 atEnd(). */
 
@@ -1455,7 +1443,7 @@
 ** be fixed.
 */
 static void docListMerge(DataBuffer *out,
-                        DLReader *pReaders, int nReaders){
+                         DLReader *pReaders, int nReaders){
   OrderedDLReader readers[MERGE_COUNT];
   DLWriter writer;
   int i, n;
@@ -1499,7 +1487,7 @@
       nStart += dlrDocDataBytes(readers[0].pReader);
     }else{
       if( pStart!=0 ){
-       dlwAppend(&writer, pStart, nStart, iFirstDocid, iLastDocid);
+        dlwAppend(&writer, pStart, nStart, iFirstDocid, iLastDocid);
       }
       pStart = dlrDocData(readers[0].pReader);
       nStart = dlrDocDataBytes(readers[0].pReader);
@@ -1510,8 +1498,8 @@
 
     /* Drop all of the older elements with the same docid. */
     for(i=1; i<nReaders &&
-            !dlrAtEnd(readers[i].pReader) &&
-            dlrDocid(readers[i].pReader)==iDocid; i++){
+             !dlrAtEnd(readers[i].pReader) &&
+             dlrDocid(readers[i].pReader)==iDocid; i++){
       dlrStep(readers[i].pReader);
     }
 
@@ -1526,9 +1514,9 @@
   dlwDestroy(&writer);
 }
 
-/* Helper function for posListUnion(). Compares the current position
+/* Helper function for posListUnion().  Compares the current position
 ** between left and right, returning as standard C idiom of <0 if
-** left<right, >0 if left>right, and 0 if left==right. "End" always
+** left<right, >0 if left>right, and 0 if left==right.  "End" always
 ** compares greater.
 */
 static int posListCmp(PLReader *pLeft, PLReader *pRight){
@@ -1605,7 +1593,7 @@
 static void docListUnion(
   const char *pLeft, int nLeft,
   const char *pRight, int nRight,
-  DataBuffer *pOut     /* Write the combined doclist here */
+  DataBuffer *pOut      /* Write the combined doclist here */
 ){
   DLReader left, right;
   DLWriter writer;
@@ -1648,14 +1636,14 @@
   dlwDestroy(&writer);
 }
 
-/*
+/* 
 ** This function is used as part of the implementation of phrase and
 ** NEAR matching.
 **
 ** pLeft and pRight are DLReaders positioned to the same docid in
 ** lists of type DL_POSITION. This function writes an entry to the
 ** DLWriter pOut for each position in pRight that is less than
-** (nNear+1) greater (but not equal to or smaller) than a position
+** (nNear+1) greater (but not equal to or smaller) than a position 
 ** in pLeft. For example, if nNear is 0, and the positions contained
 ** by pLeft and pRight are:
 **
@@ -1665,13 +1653,13 @@
 ** then the docid is added to pOut. If pOut is of type DL_POSITIONS,
 ** then a positionids "6" and "21" are also added to pOut.
 **
-** If boolean argument isSaveLeft = 1, then positionids are copied
+** If boolean argument isSaveLeft is true, then positionids are copied
 ** from pLeft instead of pRight. In the example above, the positions "5"
 ** and "20" would be added instead of "6" and "21".
 ** If isSaveLeft = 2 then both positions are added, 3 or above and postions are appended to left
 */
 static void posListPhraseMerge(
-  DLReader *pLeft,
+  DLReader *pLeft, 
   DLReader *pRight,
   int nNear,
   int isSaveLeft,
@@ -1727,7 +1715,7 @@
         
         plrStep(&right);
       }else{
-       plrStep(&left);
+        plrStep(&left);
       }
     }
   }
@@ -1742,7 +1730,7 @@
 }
 
 /*
-** Compare the values pointed to by the PLReaders passed as arguments.
+** Compare the values pointed to by the PLReaders passed as arguments. 
 ** Return -1 if the value pointed to by pLeft is considered less than
 ** the value pointed to by pRight, +1 if it is considered greater
 ** than it, or 0 if it is equal. i.e.
@@ -1777,17 +1765,17 @@
 ** A phrase intersection means that two documents only match
 ** if pLeft.iPos+1==pRight.iPos.
 **
-** A NEAR intersection means that two documents only match if
+** A NEAR intersection means that two documents only match if 
 ** (abs(pLeft.iPos-pRight.iPos)<nNear).
 **
 ** If a NEAR intersection is requested, then the nPhrase argument should
 ** be passed the number of tokens in the two operands to the NEAR operator
 ** combined. For example:
 **
-**      Query syntax               nPhrase
-**     ------------------------------------
-**      "A B C" NEAR "D E"         5
-**      A NEAR B                   2
+**       Query syntax               nPhrase
+**      ------------------------------------
+**       "A B C" NEAR "D E"         5
+**       A NEAR B                   2
 **
 ** iType controls the type of data written to pOut.  If iType is
 ** DL_POSITIONS, the positions are those from pRight.
@@ -1811,7 +1799,6 @@
   dlrInit(&left, DL_POSITIONS, pLeft, nLeft);
   dlrInit(&right, DL_POSITIONS, pRight, nRight);
   dlwInit(&writer, iType, pOut);
-  
   while( !dlrAtEnd(&left) && !dlrAtEnd(&right) ){
     if( dlrDocid(&left)<dlrDocid(&right) ){
       dlrStep(&left);
@@ -1854,7 +1841,7 @@
           plwInit(&plwriter, &writer, dlrDocid(dlrAtEnd(&dr1)?&dr2:&dr1));
 #endif
 
-          if( one.nData ) plrInit(&pr1, &dr1); 
+          if( one.nData ) plrInit(&pr1, &dr1);
           if( two.nData ) plrInit(&pr2, &dr2);
           while( !plrAtEnd(&pr1) || !plrAtEnd(&pr2) ){
             int iCompare = plrCompare(&pr1, &pr2);
@@ -1878,7 +1865,6 @@
         }
         dataBufferDestroy(&one);
         dataBufferDestroy(&two);
-
       }
       dlrStep(&left);
       dlrStep(&right);
@@ -1940,7 +1926,6 @@
 
   if( nLeft==0 || nRight==0 ) return;
 
-
   dlrInit(&left, DL_DOCIDS, pLeft, nLeft);
   dlrInit(&right, DL_DOCIDS, pRight, nRight);
   dlwInit(&writer, DL_DOCIDS, pOut);
@@ -1951,9 +1936,7 @@
     }else if( dlrDocid(&right)<dlrDocid(&left) ){
       dlrStep(&right);
     }else{
-   
       dlwAdd(&writer, dlrDocid(&left));
-      
       dlrStep(&left);
       dlrStep(&right);
     }
@@ -2179,7 +2162,7 @@
  * when one string is used repeatedly in a format string.
  * The caller must free() the returned string. */
 static char *string_format(const char *zFormat,
-                          const char *zDb, const char *zName){
+                           const char *zDb, const char *zName){
   const char *p;
   size_t len = 0;
   size_t nDb = strlen(zDb);
@@ -2212,7 +2195,7 @@
 }
 
 static int sql_exec(sqlite3 *db, const char *zDb, const char *zName,
-                   const char *zFormat){
+                    const char *zFormat){
   char *zCommand = string_format(zFormat, zDb, zName);
   int rc;
   FTSTRACE(("FTS3 sql: %s\n", zCommand));
@@ -2222,7 +2205,7 @@
 }
 
 static int sql_prepare(sqlite3 *db, const char *zDb, const char *zName,
-                      sqlite3_stmt **ppStmt, const char *zFormat){
+                       sqlite3_stmt **ppStmt, const char *zFormat){
   char *zCommand = string_format(zFormat, zDb, zName);
   int rc;
   FTSTRACE(("FTS3 prepare: %s\n", zCommand));
@@ -2325,8 +2308,8 @@
 ** matching-word offset information and snippets.
 */
 typedef struct Snippet {
-  int nMatch;    /* Total number of matches */
-  int nAlloc;    /* Space allocated for aMatch[] */
+  int nMatch;     /* Total number of matches */
+  int nAlloc;     /* Space allocated for aMatch[] */
   struct snippetMatch { /* One entry for each matching term */
     char snStatus;       /* Status flag for use while constructing snippets */
     short int iCol;      /* The column that contains the match */
@@ -2337,7 +2320,7 @@
     int rank;           /* the rank of the snippet */
   } *aMatch;      /* Points to space obtained from malloc */
   char *zOffset;  /* Text rendering of aMatch[] */
-  int nOffset;   /* strlen(zOffset) */
+  int nOffset;    /* strlen(zOffset) */
   char *zSnippet; /* Snippet text */
   int nSnippet;   /* strlen(zSnippet) */
 } Snippet;
@@ -2345,7 +2328,7 @@
 
 typedef enum QueryType {
   QUERY_GENERIC,   /* table scan */
-  QUERY_DOCID,    /* lookup by docid */
+  QUERY_DOCID,     /* lookup by docid */
   QUERY_FULLTEXT   /* QUERY_FULLTEXT + [i] is a full-text search for column i*/
 } QueryType;
 
@@ -2371,7 +2354,7 @@
   SEGDIR_DELETE_ALL_STMT,
   SEGDIR_COUNT_STMT,
 
-  MAX_STMT                    /* Always at end! */
+  MAX_STMT                     /* Always at end! */
 } fulltext_statement;
 
 /* These must exactly match the enum above. */
@@ -2449,7 +2432,7 @@
   /* These buffer pending index updates during transactions.
   ** nPendingData estimates the memory size of the pending data.  It
   ** doesn't include the hash-bucket overhead, nor any malloc
-  ** overhead. When nPendingData exceeds kPendingThreshold, the
+  ** overhead.  When nPendingData exceeds kPendingThreshold, the
   ** buffer is flushed even before the transaction closes.
   ** pendingTerms stores the data, and is only valid when nPendingData
   ** is >=0 (nPendingData<0 means pendingTerms has not been
@@ -2520,7 +2503,7 @@
 
 /* Return a dynamically generated statement of the form
  *   update %_content set [col_0] = ?, [col_1] = ?, ...
- *                   where docid = ?
+ *                    where docid = ?
  */
 static const char *contentUpdateStatement(fulltext_vtab *v){
   StringBuffer sb;
@@ -2544,23 +2527,23 @@
 ** and cached, otherwise the cached version is reset.
 */
 static int sql_get_statement(fulltext_vtab *v, fulltext_statement iStmt,
-                            sqlite3_stmt **ppStmt){
+                             sqlite3_stmt **ppStmt){
   assert( iStmt<MAX_STMT );
   if( v->pFulltextStatements[iStmt]==NULL ){
     const char *zStmt;
     int rc;
     switch( iStmt ){
       case CONTENT_INSERT_STMT:
-       zStmt = contentInsertStatement(v); break;
+        zStmt = contentInsertStatement(v); break;
       case CONTENT_SELECT_STMT:
-       zStmt = contentSelectStatement(v); break;
+        zStmt = contentSelectStatement(v); break;
       case CONTENT_UPDATE_STMT:
-       zStmt = contentUpdateStatement(v); break;
+        zStmt = contentUpdateStatement(v); break;
       default:
-       zStmt = fulltext_zStatement[iStmt];
+        zStmt = fulltext_zStatement[iStmt];
     }
     rc = sql_prepare(v->db, v->zDb, v->zName, &v->pFulltextStatements[iStmt],
-                        zStmt);
+                         zStmt);
     if( zStmt != fulltext_zStatement[iStmt]) sqlite3_free((void *) zStmt);
     if( rc!=SQLITE_OK ) return rc;
   } else {
@@ -2573,7 +2556,7 @@
 }
 
 /* Like sqlite3_step(), but convert SQLITE_DONE to SQLITE_OK and
-** SQLITE_ROW to SQLITE_ERROR. Useful for statements like UPDATE,
+** SQLITE_ROW to SQLITE_ERROR.  Useful for statements like UPDATE,
 ** where we expect no results.
 */
 static int sql_single_step(sqlite3_stmt *s){
@@ -2582,20 +2565,20 @@
 }
 
 /* Like sql_get_statement(), but for special replicated LEAF_SELECT
-** statements. idx -1 is a special case for an uncached version of
+** statements.  idx -1 is a special case for an uncached version of
 ** the statement (used in the optimize implementation).
 */
 /* TODO(shess) Write version for generic statements and then share
 ** that between the cached-statement functions.
 */
 static int sql_get_leaf_statement(fulltext_vtab *v, int idx,
-                                 sqlite3_stmt **ppStmt){
+                                  sqlite3_stmt **ppStmt){
   assert( idx>=-1 && idx<MERGE_COUNT );
   if( idx==-1 ){
     return sql_prepare(v->db, v->zDb, v->zName, ppStmt, LEAF_SELECT);
   }else if( v->pLeafSelectStmts[idx]==NULL ){
     int rc = sql_prepare(v->db, v->zDb, v->zName, &v->pLeafSelectStmts[idx],
-                        LEAF_SELECT);
+                         LEAF_SELECT);
     if( rc!=SQLITE_OK ) return rc;
   }else{
     int rc = sqlite3_reset(v->pLeafSelectStmts[idx]);
@@ -2611,7 +2594,7 @@
 ** generated.
 */
 static int content_insert(fulltext_vtab *v, sqlite3_value *docid,
-                         sqlite3_value **pValues){
+                          sqlite3_value **pValues){
   sqlite3_stmt *s;
   int i;
   int rc = sql_get_statement(v, CONTENT_INSERT_STMT, &s);
@@ -2629,9 +2612,9 @@
 }
 
 /* update %_content set col0 = pValues[0], col1 = pValues[1], ...
- *                 where docid = [iDocid] */
+ *                  where docid = [iDocid] */
 static int content_update(fulltext_vtab *v, sqlite3_value **pValues,
-                         sqlite_int64 iDocid){
+                          sqlite_int64 iDocid){
   sqlite3_stmt *s;
   int i;
   int rc = sql_get_statement(v, CONTENT_UPDATE_STMT, &s);
@@ -2664,7 +2647,7 @@
  * TODO: Perhaps we should return pointer/length strings here for consistency
  * with other code which uses pointer/length. */
 static int content_select(fulltext_vtab *v, sqlite_int64 iDocid,
-                         const char ***pValues){
+                          const char ***pValues){
   sqlite3_stmt *s;
   const char **values;
   int i;
@@ -2737,7 +2720,7 @@
 **   returns assigned blockid in *piBlockid
 */
 static int block_insert(fulltext_vtab *v, const char *pData, int nData,
-                       sqlite_int64 *piBlockid){
+                        sqlite_int64 *piBlockid){
   sqlite3_stmt *s;
   int rc = sql_get_statement(v, BLOCK_INSERT_STMT, &s);
   if( rc!=SQLITE_OK ) return rc;
@@ -2761,7 +2744,7 @@
 ** which form a segment.
 */
 static int block_delete(fulltext_vtab *v,
-                       sqlite_int64 iStartBlockid, sqlite_int64 iEndBlockid){
+                        sqlite_int64 iStartBlockid, sqlite_int64 iEndBlockid){
   sqlite3_stmt *s;
   int rc = sql_get_statement(v, BLOCK_DELETE_STMT, &s);
   if( rc!=SQLITE_OK ) return rc;
@@ -2816,10 +2799,10 @@
 ** )
 */
 static int segdir_set(fulltext_vtab *v, int iLevel, int idx,
-                     sqlite_int64 iStartBlockid,
-                     sqlite_int64 iLeavesEndBlockid,
-                     sqlite_int64 iEndBlockid,
-                     const char *pRootData, int nRootData){
+                      sqlite_int64 iStartBlockid,
+                      sqlite_int64 iLeavesEndBlockid,
+                      sqlite_int64 iEndBlockid,
+                      const char *pRootData, int nRootData){
   sqlite3_stmt *s;
   int rc = sql_get_statement(v, SEGDIR_SET_STMT, &s);
   if( rc!=SQLITE_OK ) return rc;
@@ -2850,8 +2833,8 @@
 ** SQLITE_ROW if there are blocks, else an error.
 */
 static int segdir_span(fulltext_vtab *v, int iLevel,
-                      sqlite_int64 *piStartBlockid,
-                      sqlite_int64 *piEndBlockid){
+                       sqlite_int64 *piStartBlockid,
+                       sqlite_int64 *piEndBlockid){
   sqlite3_stmt *s;
   int rc = sql_get_statement(v, SEGDIR_SPAN_STMT, &s);
   if( rc!=SQLITE_OK ) return rc;
@@ -2865,7 +2848,7 @@
 
   /* This happens if all segments at this level are entirely inline. */
   if( SQLITE_NULL==sqlite3_column_type(s, 0) ){
-    /* We expect only one row. We must execute another sqlite3_step()
+    /* We expect only one row.  We must execute another sqlite3_step()
      * to complete the iteration; otherwise the table will remain locked. */
     int rc2 = sqlite3_step(s);
     if( rc2==SQLITE_ROW ) return SQLITE_ERROR;
@@ -3002,18 +2985,18 @@
 /*
 ** Token types for parsing the arguments to xConnect or xCreate.
 */
-#define TOKEN_EOF        0    /* End of file */
-#define TOKEN_SPACE      1    /* Any kind of whitespace */
-#define TOKEN_ID         2    /* An identifier */
-#define TOKEN_STRING     3    /* A string literal */
-#define TOKEN_PUNCT      4    /* A single punctuation character */
+#define TOKEN_EOF         0    /* End of file */
+#define TOKEN_SPACE       1    /* Any kind of whitespace */
+#define TOKEN_ID          2    /* An identifier */
+#define TOKEN_STRING      3    /* A string literal */
+#define TOKEN_PUNCT       4    /* A single punctuation character */
 
 /*
 ** If X is a character that can be used in an identifier then
 ** ftsIdChar(X) will be true.  Otherwise it is false.
 **
 ** For ASCII, any character with the high-order bit set is
-** allowed in an identifier.  For 7-bit characters,
+** allowed in an identifier.  For 7-bit characters, 
 ** isFtsIdChar[X] must be 1.
 **
 ** Ticket #1066.  the SQL standard does not allow '$' in the
@@ -3034,7 +3017,7 @@
 
 
 /*
-** Return the length of the token that begins at z[0].
+** Return the length of the token that begins at z[0]. 
 ** Store the token type in *tokenType before returning.
 */
 static int ftsGetToken(const char *z, int *tokenType){
@@ -3054,13 +3037,13 @@
     case '"': {
       int delim = z[0];
       for(i=1; (c=z[i])!=0; i++){
-       if( c==delim ){
-         if( z[i+1]==delim ){
-           i++;
-         }else{
-           break;
-         }
-       }
+        if( c==delim ){
+          if( z[i+1]==delim ){
+            i++;
+          }else{
+            break;
+          }
+        }
       }
       *tokenType = TOKEN_STRING;
       return i + (c!=0);
@@ -3072,7 +3055,7 @@
     }
     default: {
       if( !ftsIdChar(*z) ){
-       break;
+        break;
       }
       for(i=1; ftsIdChar(z[i]); i++){}
       *tokenType = TOKEN_ID;
@@ -3089,7 +3072,7 @@
 */
 typedef struct FtsToken {
   const char *z;       /* Pointer to token text.  Not '\000' terminated */
-  short int n;        /* Length of the token text in bytes. */
+  short int n;         /* Length of the token text in bytes. */
 } FtsToken;
 
 /*
@@ -3147,10 +3130,10 @@
 **
 ** Examples:
 **
-**     "abc"   becomes  abc
-**     'xyz'   becomes  xyz
-**     [pqr]   becomes  pqr
-**     `mno`   becomes  mno
+**     "abc"   becomes   abc
+**     'xyz'   becomes   xyz
+**     [pqr]   becomes   pqr
+**     `mno`   becomes   mno
 */
 static void dequoteString(char *z){
   int quote;
@@ -3158,20 +3141,20 @@
   if( z==0 ) return;
   quote = z[0];
   switch( quote ){
-    case '\'': break;
-    case '"':  break;
-    case '`':  break;                /* For MySQL compatibility */
-    case '[':  quote = ']';  break;  /* For MS SqlServer compatibility */
-    default:   return;
+    case '\'':  break;
+    case '"':   break;
+    case '`':   break;                /* For MySQL compatibility */
+    case '[':   quote = ']';  break;  /* For MS SqlServer compatibility */
+    default:    return;
   }
   for(i=1, j=0; z[i]; i++){
     if( z[i]==quote ){
       if( z[i+1]==quote ){
-       z[j++] = quote;
-       i++;
+        z[j++] = quote;
+        i++;
       }else{
-       z[j++] = 0;
-       break;
+        z[j++] = 0;
+        break;
       }
     }else{
       z[j++] = z[i];
@@ -3180,30 +3163,30 @@
 }
 
 /*
-** The input azIn is a NULL-terminated list of tokens. Remove the first
+** The input azIn is a NULL-terminated list of tokens.  Remove the first
 ** token and all punctuation tokens.  Remove the quotes from
 ** around string literal tokens.
 **
 ** Example:
 **
-**     input:     tokenize chinese ( 'simplifed' , 'mixed' )
-**     output:    chinese simplifed mixed
+**     input:      tokenize chinese ( 'simplifed' , 'mixed' )
+**     output:     chinese simplifed mixed
 **
 ** Another example:
 **
-**     input:     delimiters ( '[' , ']' , '...' )
-**     output:    [ ] ...
+**     input:      delimiters ( '[' , ']' , '...' )
+**     output:     [ ] ...
 */
 static void tokenListToIdList(char **azIn){
   int i, j;
   if( azIn ){
     for(i=0, j=-1; azIn[i]; i++){
       if( safe_isalnum(azIn[i][0]) || azIn[i][1] ){
-       dequoteString(azIn[i]);
-       if( j>=0 ){
-         azIn[j] = azIn[i];
-       }
-       j++;
+        dequoteString(azIn[i]);
+        if( j>=0 ){
+          azIn[j] = azIn[i];
+        }
+        j++;
       }
     }
     azIn[j] = 0;
@@ -3213,7 +3196,7 @@
 
 /*
 ** Find the first alphanumeric token in the string zIn.  Null-terminate
-** this token. Remove any quotation marks.  And return a pointer to
+** this token.  Remove any quotation marks.  And return a pointer to
 ** the result.
 */
 static char *firstToken(char *zIn, char **pzTail){
@@ -3237,10 +3220,10 @@
 
 /* Return true if...
 **
-**   * s begins with the string t, ignoring case
-**   * s is longer than t
-**   * The first character of s beyond t is not a alphanumeric
-**
+**   *  s begins with the string t, ignoring case
+**   *  s is longer than t
+**   *  The first character of s beyond t is not a alphanumeric
+** 
 ** Ignore leading space in *s.
 **
 ** To put it another way, return true if the first token of
@@ -3260,12 +3243,12 @@
 ** and use by fulltextConnect and fulltextCreate.
 */
 typedef struct TableSpec {
-  const char *zDb;        /* Logical database name */
-  const char *zName;      /* Name of the full-text index */
-  int nColumn;            /* Number of columns to be indexed */
-  char **azColumn;        /* Original names of columns to be indexed */
+  const char *zDb;         /* Logical database name */
+  const char *zName;       /* Name of the full-text index */
+  int nColumn;             /* Number of columns to be indexed */
+  char **azColumn;         /* Original names of columns to be indexed */
   char **azContentColumn;  /* Column names for %_content */
-  char **azTokenizer;     /* Name of tokenizer and its arguments */
+  char **azTokenizer;      /* Name of tokenizer and its arguments */
 } TableSpec;
 
 /*
@@ -3280,17 +3263,17 @@
 /* Parse a CREATE VIRTUAL TABLE statement, which looks like this:
  *
  * CREATE VIRTUAL TABLE email
- *       USING fts3(subject, body, tokenize mytokenizer(myarg))
+ *        USING fts3(subject, body, tokenize mytokenizer(myarg))
  *
  * We return parsed information in a TableSpec structure.
- *
+ * 
  */
 static int parseSpec(TableSpec *pSpec, int argc, const char *const*argv,
-                    char**pzErr){
+                     char**pzErr){
   int i, n;
   char *z, *zDummy;
   char **azArg;
-  const char *zTokenizer = 0;   /* argv[] entry describing the tokenizer */
+  const char *zTokenizer = 0;    /* argv[] entry describing the tokenizer */
 
   assert( argc>=3 );
   /* Current interface:
@@ -3298,7 +3281,7 @@
   ** argv[1] - database name
   ** argv[2] - table name
   ** argv[3..] - columns, optionally followed by tokenizer specification
-  **            and snippet delimiters specification.
+  **             and snippet delimiters specification.
   */
 
   /* Make a copy of the complete argv[][] array in a single allocation.
@@ -3347,7 +3330,7 @@
   ** Each content column name will be of the form cNNAAAA
   ** where NN is the column number and AAAA is the sanitized
   ** column name.  "sanitized" means that special characters are
-  ** converted to "_". The cNN prefix guarantees that all column
+  ** converted to "_".  The cNN prefix guarantees that all column
   ** names are unique.
   **
   ** The AAAA suffix is not strictly necessary.  It is included
@@ -3384,9 +3367,9 @@
 ** using sqlite3_free().
 */
 static char *fulltextSchema(
-  int nColumn,                 /* Number of columns */
-  const char *const* azColumn, /* List of columns */
-  const char *zTableName       /* Name of the table */
+  int nColumn,                  /* Number of columns */
+  const char *const* azColumn,  /* List of columns */
+  const char *zTableName        /* Name of the table */
 ){
   int i;
   char *zSchema, *zNext;
@@ -3414,7 +3397,7 @@
   sqlite3 *db,             /* The SQLite database connection */
   TableSpec *spec,         /* Parsed spec information from parseSpec() */
   sqlite3_vtab **ppVTab,    /* Write the resulting vtab structure here */
-  char **pzErr             /* Write any error message here */
+  char **pzErr              /* Write any error message here */
 ){
   int rc;
   fulltext_vtab *v = 0;
@@ -3426,7 +3409,7 @@
   CLEAR(v);
   /* sqlite will initialize v->base */
   v->db = db;
-  v->zDb = spec->zDb;      /* Freed when azColumn is freed */
+  v->zDb = spec->zDb;       /* Freed when azColumn is freed */
   v->zName = spec->zName;   /* Freed when azColumn is freed */
   v->nColumn = spec->nColumn;
   v->azContentColumn = spec->azContentColumn;
@@ -3439,7 +3422,7 @@
     return SQLITE_NOMEM;
   }
 
-  zTok = spec->azTokenizer[0];
+  zTok = spec->azTokenizer[0]; 
   if( !zTok ){
     zTok = "simple";
   }
@@ -3455,7 +3438,7 @@
   for(n=0; spec->azTokenizer[n]; n++){}
   if( n ){
     rc = m->xCreate(n-1, (const char*const*)&spec->azTokenizer[1],
-                   &v->pTokenizer);
+                    &v->pTokenizer);
   }else{
     rc = m->xCreate(0, 0, &v->pTokenizer);
   }
@@ -3481,7 +3464,7 @@
   /* TODO: verify the existence of backing tables foo_content, foo_term */
 
   schema = fulltextSchema(v->nColumn, (const char*const*)v->azColumn,
-                         spec->zName);
+                          spec->zName);
   rc = sqlite3_declare_vtab(db, schema);
   sqlite3_free(schema);
   if( rc!=SQLITE_OK ) goto err;
@@ -3524,8 +3507,8 @@
 ** code.  Work it into the top-of-file comment at that time.
 */
 static int fulltextCreate(sqlite3 *db, void *pAux,
-                         int argc, const char * const *argv,
-                         sqlite3_vtab **ppVTab, char **pzErr){
+                          int argc, const char * const *argv,
+                          sqlite3_vtab **ppVTab, char **pzErr){
   int rc;
   TableSpec spec;
   StringBuffer schema;
@@ -3544,23 +3527,23 @@
   if( rc!=SQLITE_OK ) goto out;
 
   rc = sql_exec(db, spec.zDb, spec.zName,
-               "create table %_segments("
-               "  blockid INTEGER PRIMARY KEY,"
-               "  block blob"
-               ");"
-               );
+                "create table %_segments("
+                "  blockid INTEGER PRIMARY KEY,"
+                "  block blob"
+                ");"
+                );
   if( rc!=SQLITE_OK ) goto out;
 
   rc = sql_exec(db, spec.zDb, spec.zName,
-               "create table %_segdir("
-               "  level integer,"
-               "  idx integer,"
-               "  start_block integer,"
-               "  leaves_end_block integer,"
-               "  end_block integer,"
-               "  root blob,"
-               "  primary key(level, idx)"
-               ");");
+                "create table %_segdir("
+                "  level integer,"
+                "  idx integer,"
+                "  start_block integer,"
+                "  leaves_end_block integer,"
+                "  end_block integer,"
+                "  root blob,"
+                "  primary key(level, idx)"
+                ");");
   if( rc!=SQLITE_OK ) goto out;
 
   rc = constructVtab(db, &spec, ppVTab, pzErr);
@@ -3581,14 +3564,14 @@
     pConstraint = &pInfo->aConstraint[i];
     if( pConstraint->usable ) {
       if( (pConstraint->iColumn==-1 || pConstraint->iColumn==v->nColumn+1) &&
-         pConstraint->op==SQLITE_INDEX_CONSTRAINT_EQ ){
-       pInfo->idxNum = QUERY_DOCID;      /* lookup by docid */
-       FTSTRACE(("FTS3 QUERY_DOCID\n"));
+          pConstraint->op==SQLITE_INDEX_CONSTRAINT_EQ ){
+        pInfo->idxNum = QUERY_DOCID;      /* lookup by docid */
+        FTSTRACE(("FTS3 QUERY_DOCID\n"));
       } else if( pConstraint->iColumn>=0 && pConstraint->iColumn<=v->nColumn &&
-                pConstraint->op==SQLITE_INDEX_CONSTRAINT_MATCH ){
-       /* full-text search */
-       pInfo->idxNum = QUERY_FULLTEXT + pConstraint->iColumn;
-       FTSTRACE(("FTS3 QUERY_FULLTEXT %d\n", pConstraint->iColumn));
+                 pConstraint->op==SQLITE_INDEX_CONSTRAINT_MATCH ){
+        /* full-text search */
+        pInfo->idxNum = QUERY_FULLTEXT + pConstraint->iColumn;
+        FTSTRACE(("FTS3 QUERY_FULLTEXT %d\n", pConstraint->iColumn));
       } else continue;
 
       pInfo->aConstraintUsage[i].argvIndex = 1;
@@ -3597,7 +3580,7 @@
       /* An arbitrary value for now.
        * TODO: Perhaps docid matches should be considered cheaper than
        * full-text searches. */
-      pInfo->estimatedCost = 1.0;
+      pInfo->estimatedCost = 1.0;   
 
       return SQLITE_OK;
     }
@@ -3618,10 +3601,10 @@
 
   FTSTRACE(("FTS3 Destroy %p\n", pVTab));
   rc = sql_exec(v->db, v->zDb, v->zName,
-               "drop table if exists %_content;"
-               "drop table if exists %_segments;"
-               "drop table if exists %_segdir;"
-               );
+                "drop table if exists %_content;"
+                "drop table if exists %_segments;"
+                "drop table if exists %_segdir;"
+                );
   if( rc!=SQLITE_OK ) return rc;
 
   fulltext_vtab_destroy((fulltext_vtab *)pVTab);
@@ -3672,9 +3655,9 @@
 ** Append a single entry to the p->aMatch[] log.
 */
 static void snippetAppendMatch(
-  Snippet *p,              /* Append the entry to this snippet */
-  int iCol, int iTerm,     /* The column and query term */
-  int iToken,              /* Matching token in document */
+  Snippet *p,               /* Append the entry to this snippet */
+  int iCol, int iTerm,      /* The column and query term */
+  int iToken,               /* Matching token in document */
   int iStart, int nByte     /* Offset and size of the match */
 ){
   int i;
@@ -3701,7 +3684,7 @@
 /*
 ** Sizing information for the circular buffer used in snippetOffsetsOfColumn()
 */
-#define FTS3_ROTOR_SZ  (32)
+#define FTS3_ROTOR_SZ   (32)
 #define FTS3_ROTOR_MASK (FTS3_ROTOR_SZ-1)
 
 /*
@@ -3732,7 +3715,7 @@
 
   /* The following variables keep a circular buffer of the last
   ** few tokens */
-  unsigned int iRotor = 0;            /* Index of current token */
+  unsigned int iRotor = 0;             /* Index of current token */
   int iRotorBegin[FTS3_ROTOR_SZ];      /* Beginning offset of token */
   int iRotorLen[FTS3_ROTOR_SZ];        /* Length of token */
 
@@ -3798,7 +3781,7 @@
 
 /*
 ** Remove entries from the pSnippet structure to account for the NEAR
-** operator. When this is called, pSnippet contains the list of token
+** operator. When this is called, pSnippet contains the list of token 
 ** offsets produced by treating all NEAR operators as AND operators.
 ** This function removes any entries that should not be present after
 ** accounting for the NEAR restriction. For example, if the queried
@@ -3807,7 +3790,7 @@
 **     "A B C D E A"
 **
 ** and the query is:
-**
+** 
 **     A NEAR/0 E
 **
 ** then when this function is called the Snippet contains token offsets
@@ -3898,7 +3881,7 @@
 
 
 /*
-** Compute all offsets for the current row of the query.
+** Compute all offsets for the current row of the query.  
 ** If the offsets have already been computed, this routine is a no-op.
 */
 static void snippetAllOffsets(fulltext_cursor *p){
@@ -3999,7 +3982,8 @@
 
 /*
 ** Convert the information in the aMatch[] array of the snippet
-** into the string zOffset[0..nOffset-1].
+** into the string zOffset[0..nOffset-1]. This string is used as
+** the return of the SQL offsets() function.
 */
 static void snippetOffsetText(Snippet *p){
   int i;
@@ -4011,14 +3995,14 @@
   for(i=0; i<p->nMatch; i++){
     struct snippetMatch *pMatch = &p->aMatch[i];
     if( pMatch->iTerm>=0 ){
-      /* If snippetMatch.iTerm is less than 0, then the match was
-      ** discarded as part of processing the NEAR operator (see the
-      ** trimSnippetOffsetsForNear() function for details). Ignore
+      /* If snippetMatch.iTerm is less than 0, then the match was 
+      ** discarded as part of processing the NEAR operator (see the 
+      ** trimSnippetOffsetsForNear() function for details). Ignore 
       ** it in this case
       */
       zBuf[0] = ' ';
       sqlite3_snprintf(sizeof(zBuf)-1, &zBuf[cnt>0], "%d %d %d %d",
-         pMatch->iCol, pMatch->iTerm, pMatch->iStart, pMatch->nByte);
+          pMatch->iCol, pMatch->iTerm, pMatch->iStart, pMatch->nByte);
       append(&sb, zBuf);
       cnt++;
     }
@@ -4037,12 +4021,12 @@
 ** to be a little left or right so that the break point is better.
 */
 static int wordBoundary(
-  int iBreak,                  /* The suggested break point */
-  const char *zDoc,            /* Document text */
-  int nDoc,                    /* Number of bytes in zDoc[] */
-  struct snippetMatch *aMatch, /* Matching words */
-  int nMatch,                  /* Number of entries in aMatch[] */
-  int iCol                     /* The column number for zDoc[] */
+  int iBreak,                   /* The suggested break point */
+  const char *zDoc,             /* Document text */
+  int nDoc,                     /* Number of bytes in zDoc[] */
+  struct snippetMatch *aMatch,  /* Matching words */
+  int nMatch,                   /* Number of entries in aMatch[] */
+  int iCol                      /* The column number for zDoc[] */
 ){
   int i;
   if( iBreak<=10 ){
@@ -4077,7 +4061,7 @@
 /*
 ** Allowed values for Snippet.aMatch[].snStatus
 */
-#define SNIPPET_IGNORE 0   /* It is ok to omit this match from the snippet */
+#define SNIPPET_IGNORE  0   /* It is ok to omit this match from the snippet */
 #define SNIPPET_DESIRED 1   /* We want to include this match in the snippet */
 
 /*
@@ -4102,7 +4086,7 @@
   int iStart, iEnd;
   int tailEllipsis = 0;
   int iMatch;
-
+  
 
   sqlite3_free(pCursor->snippet.zSnippet);
   pCursor->snippet.zSnippet = 0;
@@ -4117,9 +4101,9 @@
   for(i=0; i<pCursor->q.nTerms; i++){
     for(j=0; j<nMatch; j++){
       if( aMatch[j].iTerm==i ){
-       aMatch[j].snStatus = SNIPPET_DESIRED;
-       nDesired++;
-       break;
+        aMatch[j].snStatus = SNIPPET_DESIRED;
+        nDesired++;
+        break;
       }
     }
   }
@@ -4158,27 +4142,27 @@
     while( iMatch<nMatch && aMatch[iMatch].iCol<iCol ){ iMatch++; }
     while( iStart<iEnd ){
       while( iMatch<nMatch && aMatch[iMatch].iStart<iStart
-            && aMatch[iMatch].iCol<=iCol ){
-       iMatch++;
+             && aMatch[iMatch].iCol<=iCol ){
+        iMatch++;
       }
       if( iMatch<nMatch && aMatch[iMatch].iStart<iEnd
-            && aMatch[iMatch].iCol==iCol ){
-       nappend(&sb, &zDoc[iStart], aMatch[iMatch].iStart - iStart);
-       iStart = aMatch[iMatch].iStart;
-       append(&sb, zStartMark);
-       nappend(&sb, &zDoc[iStart], aMatch[iMatch].nByte);
-       append(&sb, zEndMark);
-       iStart += aMatch[iMatch].nByte;
-       for(j=iMatch+1; j<nMatch; j++){
-         if( aMatch[j].iTerm==aMatch[iMatch].iTerm
-             && aMatch[j].snStatus==SNIPPET_DESIRED ){
-           nDesired--;
-           aMatch[j].snStatus = SNIPPET_IGNORE;
-         }
-       }
+             && aMatch[iMatch].iCol==iCol ){
+        nappend(&sb, &zDoc[iStart], aMatch[iMatch].iStart - iStart);
+        iStart = aMatch[iMatch].iStart;
+        append(&sb, zStartMark);
+        nappend(&sb, &zDoc[iStart], aMatch[iMatch].nByte);
+        append(&sb, zEndMark);
+        iStart += aMatch[iMatch].nByte;
+        for(j=iMatch+1; j<nMatch; j++){
+          if( aMatch[j].iTerm==aMatch[iMatch].iTerm
+              && aMatch[j].snStatus==SNIPPET_DESIRED ){
+            nDesired--;
+            aMatch[j].snStatus = SNIPPET_IGNORE;
+          }
+        }
       }else{
-       nappend(&sb, &zDoc[iStart], iEnd - iStart);
-       iStart = iEnd;
+        nappend(&sb, &zDoc[iStart], iEnd - iStart);
+        iStart = iEnd;
       }
     }
     tailCol = iCol;
@@ -4222,14 +4206,14 @@
     rc = sqlite3_step(c->pStmt);
     switch( rc ){
       case SQLITE_ROW:
-       c->eof = 0;
-       return SQLITE_OK;
+        c->eof = 0;
+        return SQLITE_OK;
       case SQLITE_DONE:
-       c->eof = 1;
-       return SQLITE_OK;
+        c->eof = 1;
+        return SQLITE_OK;
       default:
-       c->eof = 1;
-       return rc;
+        c->eof = 1;
+        return rc;
     }
   } else {  /* full-text query */
     rc = sqlite3_reset(c->pStmt);
@@ -4290,12 +4274,11 @@
 ** docListOfTerm().
 */
 static int termSelect(fulltext_vtab *v, int iColumn,
-                     const char *pTerm, int nTerm, int isPrefix,
-                     DocListType iType, DataBuffer *out);
+                      const char *pTerm, int nTerm, int isPrefix,
+                      DocListType iType, DataBuffer *out);
 
-/* Return a DocList corresponding to the query term *pTerm.  If *pTerm
-** is the first term of a phrase query, go ahead and evaluate the phrase
-** query and return the doclist for the entire phrase query.
+/* 
+** Return a DocList corresponding to the phrase *pPhrase.
 **
 ** The resulting DL_DOCIDS doclist is stored in pResult, which is
 ** overwritten.
@@ -4729,7 +4712,7 @@
 */
 /* TODO(shess) Upgrade the cursor initialization and destruction to
 ** account for fulltextFilter() being called multiple times on the
-** same cursor.  The current solution is very fragile. Apply fix to
+** same cursor.  The current solution is very fragile.  Apply fix to
 ** fts3 as appropriate.
 */
 static int fulltextFilter(
@@ -4771,11 +4754,11 @@
       assert( argc==1 );
       queryClear(&c->q);
       if( c->result.nData!=0 ){
-       /* This case happens if the same cursor is used repeatedly. */
-       dlrDestroy(&c->reader);
-       dataBufferReset(&c->result);
+        /* This case happens if the same cursor is used repeatedly. */
+        dlrDestroy(&c->reader);
+        dataBufferReset(&c->result);
       }else{
-       dataBufferInit(&c->result, 0);
+        dataBufferInit(&c->result, 0);
       }
       rc = fulltextQuery(v, idxNum-QUERY_FULLTEXT, zQuery, -1, &c->result, &c->q);
       if( rc!=SQLITE_OK ) return rc;
@@ -4807,12 +4790,12 @@
 
 /* This is the xColumn method of the virtual table.  The SQLite
 ** core calls this method during a query when it needs the value
-** of a column from the virtual table. This method needs to use
+** of a column from the virtual table.  This method needs to use
 ** one of the sqlite3_result_*() routines to store the requested
 ** value back in the pContext.
 */
 static int fulltextColumn(sqlite3_vtab_cursor *pCursor,
-                         sqlite3_context *pContext, int idxCol){
+                          sqlite3_context *pContext, int idxCol){
   fulltext_cursor *c = (fulltext_cursor *) pCursor;
   fulltext_vtab *v = cursor_vtab(c);
 
@@ -4841,7 +4824,7 @@
 
 /* This is the xRowid method.  The SQLite core calls this routine to
 ** retrieve the rowid for the current row of the result set.  fts3
-** exposes %_content.docid as the rowid for the virtual table. The
+** exposes %_content.docid as the rowid for the virtual table.  The
 ** rowid should be written to *pRowid.
 */
 static int fulltextRowid(sqlite3_vtab_cursor *pCursor, sqlite_int64 *pRowid){
@@ -4937,7 +4920,7 @@
     v->nPendingData += p->b.nData-nData;
   }
 
-  /* TODO(shess) Check return? Should this be able to cause errors at
+  /* TODO(shess) Check return?  Should this be able to cause errors at
   ** this point?  Actually, same question about sqlite3_finalize(),
   ** though one could argue that failure there means that the data is
   ** not durable.  *ponder*
@@ -4949,7 +4932,7 @@
 
 /* Add doclists for all terms in [pValues] to pendingTerms table. */
 static int insertTerms(fulltext_vtab *v, sqlite_int64 iDocid,
-                      sqlite3_value **pValues){
+                       sqlite3_value **pValues){
   int i;
   
 #ifdef STORE_CATEGORY   
@@ -5015,7 +4998,7 @@
 ** new row.  Add doclists for terms to pendingTerms.
 */
 static int index_insert(fulltext_vtab *v, sqlite3_value *pRequestDocid,
-                       sqlite3_value **pValues, sqlite_int64 *piDocid){
+                        sqlite3_value **pValues, sqlite_int64 *piDocid){
   int rc;
 
   rc = content_insert(v, pRequestDocid, pValues);  /* execute an SQL INSERT */
@@ -5047,7 +5030,7 @@
 ** to pendingTerms for terms in the new data.
 */
 static int index_update(fulltext_vtab *v, sqlite_int64 iRow,
-                       sqlite3_value **pValues){
+                        sqlite3_value **pValues){
   int rc = initPendingTerms(v, iRow);
   if( rc!=SQLITE_OK ) return rc;
 
@@ -5099,13 +5082,13 @@
 ** layer is being constructed.
 */
 typedef struct InteriorBlock {
-  DataBuffer term;          /* Leftmost term in block's subtree. */
-  DataBuffer data;          /* Accumulated data for the block. */
+  DataBuffer term;           /* Leftmost term in block's subtree. */
+  DataBuffer data;           /* Accumulated data for the block. */
   struct InteriorBlock *next;
 } InteriorBlock;
 
 static InteriorBlock *interiorBlockNew(int iHeight, sqlite_int64 iChildBlock,
-                                      const char *pTerm, int nTerm){
+                                       const char *pTerm, int nTerm){
   InteriorBlock *block = sqlite3_malloc(sizeof(InteriorBlock));
   char c[VARINT_MAX+VARINT_MAX];
   int n;
@@ -5188,11 +5171,11 @@
 #endif
 
 typedef struct InteriorWriter {
-  int iHeight;                  /* from 0 at leaves. */
+  int iHeight;                   /* from 0 at leaves. */
   InteriorBlock *first, *last;
   struct InteriorWriter *parentWriter;
 
-  DataBuffer term;              /* Last term written to block "last". */
+  DataBuffer term;               /* Last term written to block "last". */
   sqlite_int64 iOpeningChildBlock; /* First child block in block "last". */
 #ifndef NDEBUG
   sqlite_int64 iLastChildBlock;  /* for consistency checks. */
@@ -5204,8 +5187,8 @@
 ** next level down the tree.
 */
 static void interiorWriterInit(int iHeight, const char *pTerm, int nTerm,
-                              sqlite_int64 iChildBlock,
-                              InteriorWriter *pWriter){
+                               sqlite_int64 iChildBlock,
+                               InteriorWriter *pWriter){
   InteriorBlock *block;
   assert( iHeight>0 );
   CLEAR(pWriter);
@@ -5225,8 +5208,8 @@
 ** with pTerm[nTerm] as the leftmost term in iChildBlock's subtree.
 */
 static void interiorWriterAppend(InteriorWriter *pWriter,
-                                const char *pTerm, int nTerm,
-                                sqlite_int64 iChildBlock){
+                                 const char *pTerm, int nTerm,
+                                 sqlite_int64 iChildBlock){
   char c[VARINT_MAX+VARINT_MAX];
   int n, nPrefix = 0;
 
@@ -5242,7 +5225,7 @@
     n = fts3PutVarint(c, nTerm);
   }else{
     while( nPrefix<pWriter->term.nData &&
-          pTerm[nPrefix]==pWriter->term.pData[nPrefix] ){
+           pTerm[nPrefix]==pWriter->term.pData[nPrefix] ){
       nPrefix++;
     }
 
@@ -5261,13 +5244,13 @@
   if( pWriter->last->data.nData+n+nTerm-nPrefix>INTERIOR_MAX &&
       iChildBlock-pWriter->iOpeningChildBlock>INTERIOR_MIN_TERMS ){
     pWriter->last->next = interiorBlockNew(pWriter->iHeight, iChildBlock,
-                                          pTerm, nTerm);
+                                           pTerm, nTerm);
     pWriter->last = pWriter->last->next;
     pWriter->iOpeningChildBlock = iChildBlock;
     dataBufferReset(&pWriter->term);
   }else{
     dataBufferAppend2(&pWriter->last->data, c, n,
-                     pTerm+nPrefix, nTerm-nPrefix);
+                      pTerm+nPrefix, nTerm-nPrefix);
     dataBufferReplace(&pWriter->term, pTerm, nTerm);
   }
   ASSERT_VALID_INTERIOR_BLOCK(pWriter->last);
@@ -5301,8 +5284,8 @@
 ** recursively ask for their root into.
 */
 static int interiorWriterRootInfo(fulltext_vtab *v, InteriorWriter *pWriter,
-                                 char **ppRootInfo, int *pnRootInfo,
-                                 sqlite_int64 *piEndBlockid){
+                                  char **ppRootInfo, int *pnRootInfo,
+                                  sqlite_int64 *piEndBlockid){
   InteriorBlock *block = pWriter->first;
   sqlite_int64 iBlockid = 0;
   int rc;
@@ -5324,8 +5307,8 @@
 
   pWriter->parentWriter = sqlite3_malloc(sizeof(*pWriter->parentWriter));
   interiorWriterInit(pWriter->iHeight+1,
-                    block->term.pData, block->term.nData,
-                    iBlockid, pWriter->parentWriter);
+                     block->term.pData, block->term.nData,
+                     iBlockid, pWriter->parentWriter);
 
   /* Flush additional blocks and append to the higher interior
   ** node.
@@ -5337,12 +5320,12 @@
     *piEndBlockid = iBlockid;
 
     interiorWriterAppend(pWriter->parentWriter,
-                        block->term.pData, block->term.nData, iBlockid);
+                         block->term.pData, block->term.nData, iBlockid);
   }
 
   /* Parent node gets the chance to be the root. */
   return interiorWriterRootInfo(v, pWriter->parentWriter,
-                               ppRootInfo, pnRootInfo, piEndBlockid);
+                                ppRootInfo, pnRootInfo, piEndBlockid);
 }
 
 /****************************************************************/
@@ -5353,7 +5336,7 @@
   const char *pData;
   int nData;
 
-  DataBuffer term;         /* previous term, for decoding term delta. */
+  DataBuffer term;          /* previous term, for decoding term delta. */
 
   sqlite_int64 iBlockid;
 } InteriorReader;
@@ -5367,7 +5350,7 @@
 ** and the blob is empty or otherwise contains suspect data?
 */
 static void interiorReaderInit(const char *pData, int nData,
-                              InteriorReader *pReader){
+                               InteriorReader *pReader){
   int n, nTerm;
 
   /* Require at least the leading flag byte */
@@ -5445,7 +5428,7 @@
 ** results.  If isPrefix, equality means equal through nTerm bytes.
 */
 static int interiorReaderTermCmp(InteriorReader *pReader,
-                                const char *pTerm, int nTerm, int isPrefix){
+                                 const char *pTerm, int nTerm, int isPrefix){
   const char *pReaderTerm = interiorReaderTerm(pReader);
   int nReaderTerm = interiorReaderTermBytes(pReader);
   int c, n = nReaderTerm<nTerm ? nReaderTerm : nTerm;
@@ -5496,18 +5479,18 @@
 typedef struct LeafWriter {
   int iLevel;
   int idx;
-  sqlite_int64 iStartBlockid;    /* needed to create the root info */
-  sqlite_int64 iEndBlockid;      /* when we're done writing. */
+  sqlite_int64 iStartBlockid;     /* needed to create the root info */
+  sqlite_int64 iEndBlockid;       /* when we're done writing. */
 
-  DataBuffer term;               /* previous encoded term */
-  DataBuffer data;               /* encoding buffer */
+  DataBuffer term;                /* previous encoded term */
+  DataBuffer data;                /* encoding buffer */
 
   /* bytes of first term in the current node which distinguishes that
   ** term from the last term of the previous node.
   */
   int nTermDistinct;
 
-  InteriorWriter parentWriter;   /* if we overflow */
+  InteriorWriter parentWriter;    /* if we overflow */
   int has_parent;
 } LeafWriter;
 
@@ -5595,7 +5578,7 @@
 ** contain it.
 */
 static int leafWriterInternalFlush(fulltext_vtab *v, LeafWriter *pWriter,
-                                  int iData, int nData){
+                                   int iData, int nData){
   sqlite_int64 iBlockid = 0;
   const char *pStartingTerm;
   int nStartingTerm, rc, n;
@@ -5624,10 +5607,10 @@
 
   if( pWriter->has_parent ){
     interiorWriterAppend(&pWriter->parentWriter,
-                        pStartingTerm, nStartingTerm, iBlockid);
+                         pStartingTerm, nStartingTerm, iBlockid);
   }else{
     interiorWriterInit(1, pStartingTerm, nStartingTerm, iBlockid,
-                      &pWriter->parentWriter);
+                       &pWriter->parentWriter);
     pWriter->has_parent = 1;
   }
 
@@ -5659,8 +5642,8 @@
 ** all).
 */
 static int leafWriterRootInfo(fulltext_vtab *v, LeafWriter *pWriter,
-                             char **ppRootInfo, int *pnRootInfo,
-                             sqlite_int64 *piEndBlockid){
+                              char **ppRootInfo, int *pnRootInfo,
+                              sqlite_int64 *piEndBlockid){
   /* we can fit the segment entirely inline */
   if( !pWriter->has_parent && pWriter->data.nData<ROOT_MAX ){
     *ppRootInfo = pWriter->data.pData;
@@ -5686,7 +5669,7 @@
   *piEndBlockid = pWriter->iEndBlockid;
 
   return interiorWriterRootInfo(v, &pWriter->parentWriter,
-                               ppRootInfo, pnRootInfo, piEndBlockid);
+                                ppRootInfo, pnRootInfo, piEndBlockid);
 }
 
 /* Collect the rootInfo data and store it into the segment directory.
@@ -5705,8 +5688,8 @@
   if( iEndBlockid==0 && nRootInfo==0 ) return SQLITE_OK;
 
   return segdir_set(v, pWriter->iLevel, pWriter->idx,
-                   pWriter->iStartBlockid, pWriter->iEndBlockid,
-                   iEndBlockid, pRootInfo, nRootInfo);
+                    pWriter->iStartBlockid, pWriter->iEndBlockid,
+                    iEndBlockid, pRootInfo, nRootInfo);
 }
 
 static void leafWriterDestroy(LeafWriter *pWriter){
@@ -5721,13 +5704,13 @@
 ** boundary is crossed.
 */
 static int leafWriterEncodeTerm(LeafWriter *pWriter,
-                               const char *pTerm, int nTerm){
+                                const char *pTerm, int nTerm){
   char c[VARINT_MAX+VARINT_MAX];
   int n, nPrefix = 0;
 
   assert( nTerm>0 );
   while( nPrefix<pWriter->term.nData &&
-        pTerm[nPrefix]==pWriter->term.pData[nPrefix] ){
+         pTerm[nPrefix]==pWriter->term.pData[nPrefix] ){
     nPrefix++;
     /* Failing this implies that the terms weren't in order. */
     assert( nPrefix<nTerm );
@@ -5735,18 +5718,18 @@
 
   if( pWriter->data.nData==0 ){
     /* Encode the node header and leading term as:
-    ** varint(0)
-    ** varint(nTerm)
-    ** char pTerm[nTerm]
+    **  varint(0)
+    **  varint(nTerm)
+    **  char pTerm[nTerm]
     */
     n = fts3PutVarint(c, '\0');
     n += fts3PutVarint(c+n, nTerm);
     dataBufferAppend2(&pWriter->data, c, n, pTerm, nTerm);
   }else{
     /* Delta-encode the term as:
-    ** varint(nPrefix)
-    ** varint(nSuffix)
-    ** char pTermSuffix[nSuffix]
+    **  varint(nPrefix)
+    **  varint(nSuffix)
+    **  char pTermSuffix[nSuffix]
     */
     n = fts3PutVarint(c, nPrefix);
     n += fts3PutVarint(c+n, nTerm-nPrefix);
@@ -5758,13 +5741,13 @@
 }
 
 /* Used to avoid a memmove when a large amount of doclist data is in
-** the buffer. This constructs a node and term header before
+** the buffer.  This constructs a node and term header before
 ** iDoclistData and flushes the resulting complete node using
 ** leafWriterInternalFlush().
 */
 static int leafWriterInlineFlush(fulltext_vtab *v, LeafWriter *pWriter,
-                                const char *pTerm, int nTerm,
-                                int iDoclistData){
+                                 const char *pTerm, int nTerm,
+                                 int iDoclistData){
   char c[VARINT_MAX+VARINT_MAX];
   int iData, n = fts3PutVarint(c, 0);
   n += fts3PutVarint(c+n, nTerm);
@@ -5787,8 +5770,8 @@
 ** %_segments.
 */
 static int leafWriterStepMerge(fulltext_vtab *v, LeafWriter *pWriter,
-                              const char *pTerm, int nTerm,
-                              DLReader *pReaders, int nReaders){
+                               const char *pTerm, int nTerm,
+                               DLReader *pReaders, int nReaders){
   char c[VARINT_MAX+VARINT_MAX];
   int iTermData = pWriter->data.nData, iDoclistData;
   int i, nData, n, nActualData, nActual, rc, nTermDistinct;
@@ -5812,8 +5795,8 @@
 
   docListMerge(&pWriter->data, pReaders, nReaders);
   ASSERT_VALID_DOCLIST(DL_DEFAULT,
-                      pWriter->data.pData+iDoclistData+n,
-                      pWriter->data.nData-iDoclistData-n, NULL);
+                       pWriter->data.pData+iDoclistData+n,
+                       pWriter->data.nData-iDoclistData-n, NULL);
 
   /* The actual amount of doclist data at this point could be smaller
   ** than the length we encoded.  Additionally, the space required to
@@ -5862,8 +5845,8 @@
   */
   if( nActual<n ){
     memmove(pWriter->data.pData+iDoclistData+nActual,
-           pWriter->data.pData+iDoclistData+n,
-           pWriter->data.nData-(iDoclistData+n));
+            pWriter->data.pData+iDoclistData+n,
+            pWriter->data.nData-(iDoclistData+n));
     pWriter->data.nData -= n-nActual;
   }
 
@@ -5899,8 +5882,8 @@
     assert( 2*STANDALONE_MIN<=LEAF_MAX );
     assert( n+pWriter->data.nData-iDoclistData<iDoclistData );
     memcpy(pWriter->data.pData+n,
-          pWriter->data.pData+iDoclistData,
-          pWriter->data.nData-iDoclistData);
+           pWriter->data.pData+iDoclistData,
+           pWriter->data.nData-iDoclistData);
     pWriter->data.nData -= iDoclistData-n;
   }
   ASSERT_VALID_LEAF_NODE(pWriter->data.pData, pWriter->data.nData);
@@ -5915,8 +5898,8 @@
 ** constructed directly in pWriter->data.
 */
 static int leafWriterStep(fulltext_vtab *v, LeafWriter *pWriter,
-                         const char *pTerm, int nTerm,
-                         const char *pData, int nData){
+                          const char *pTerm, int nTerm,
+                          const char *pData, int nData){
   int rc;
   DLReader reader;
 
@@ -5931,9 +5914,9 @@
 /****************************************************************/
 /* LeafReader is used to iterate over an individual leaf node. */
 typedef struct LeafReader {
-  DataBuffer term;         /* copy of current term. */
+  DataBuffer term;          /* copy of current term. */
 
-  const char *pData;       /* data for current term. */
+  const char *pData;        /* data for current term. */
   int nData;
 } LeafReader;
 
@@ -5970,7 +5953,7 @@
 }
 
 static void leafReaderInit(const char *pData, int nData,
-                          LeafReader *pReader){
+                           LeafReader *pReader){
   int nTerm, n;
 
   assert( nData>0 );
@@ -6019,7 +6002,7 @@
 ** If isPrefix, equality means equal through nTerm bytes.
 */
 static int leafReaderTermCmp(LeafReader *pReader,
-                            const char *pTerm, int nTerm, int isPrefix){
+                             const char *pTerm, int nTerm, int isPrefix){
   int c, n = pReader->term.nData<nTerm ? pReader->term.nData : nTerm;
   if( n==0 ){
     if( pReader->term.nData>0 ) return -1;
@@ -6039,13 +6022,13 @@
 ** leaf layer of the tree.
 */
 typedef struct LeavesReader {
-  int idx;                 /* Index within the segment. */
+  int idx;                  /* Index within the segment. */
 
-  sqlite3_stmt *pStmt;     /* Statement we're streaming leaves from. */
-  int eof;                 /* we've seen SQLITE_DONE from pStmt. */
+  sqlite3_stmt *pStmt;      /* Statement we're streaming leaves from. */
+  int eof;                  /* we've seen SQLITE_DONE from pStmt. */
 
   LeafReader leafReader;    /* reader for the current leaf. */
-  DataBuffer rootData;     /* root data for inline. */
+  DataBuffer rootData;      /* root data for inline. */
 } LeavesReader;
 
 /* Access the current term. */
@@ -6106,11 +6089,11 @@
 ** stream of blocks between iStartBlockid and iEndBlockid, inclusive.
 */
 static int leavesReaderInit(fulltext_vtab *v,
-                           int idx,
-                           sqlite_int64 iStartBlockid,
-                           sqlite_int64 iEndBlockid,
-                           const char *pRootData, int nRootData,
-                           LeavesReader *pReader){
+                            int idx,
+                            sqlite_int64 iStartBlockid,
+                            sqlite_int64 iEndBlockid,
+                            const char *pRootData, int nRootData,
+                            LeavesReader *pReader){
   CLEAR(pReader);
   pReader->idx = idx;
 
@@ -6119,7 +6102,7 @@
     /* Entire leaf level fit in root data. */
     dataBufferReplace(&pReader->rootData, pRootData, nRootData);
     leafReaderInit(pReader->rootData.pData, pReader->rootData.nData,
-                  &pReader->leafReader);
+                   &pReader->leafReader);
   }else{
     sqlite3_stmt *s;
     int rc = sql_get_leaf_statement(v, idx, &s);
@@ -6140,8 +6123,8 @@
 
     pReader->pStmt = s;
     leafReaderInit(sqlite3_column_blob(pReader->pStmt, 0),
-                  sqlite3_column_bytes(pReader->pStmt, 0),
-                  &pReader->leafReader);
+                   sqlite3_column_bytes(pReader->pStmt, 0),
+                   &pReader->leafReader);
   }
   return SQLITE_OK;
 }
@@ -6166,8 +6149,8 @@
     }
     leafReaderDestroy(&pReader->leafReader);
     leafReaderInit(sqlite3_column_blob(pReader->pStmt, 0),
-                  sqlite3_column_bytes(pReader->pStmt, 0),
-                  &pReader->leafReader);
+                   sqlite3_column_bytes(pReader->pStmt, 0),
+                   &pReader->leafReader);
   }
   return SQLITE_OK;
 }
@@ -6183,8 +6166,8 @@
   if( leavesReaderAtEnd(lr2) ) return -1;
 
   return leafReaderTermCmp(&lr1->leafReader,
-                          leavesReaderTerm(lr2), leavesReaderTermBytes(lr2),
-                          0);
+                           leavesReaderTerm(lr2), leavesReaderTermBytes(lr2),
+                           0);
 }
 
 /* Similar to leavesReaderTermCmp(), with additional ordering by idx
@@ -6214,7 +6197,7 @@
 ** order.
 */
 static int leavesReadersInit(fulltext_vtab *v, int iLevel,
-                            LeavesReader *pReaders, int *piReaders){
+                             LeavesReader *pReaders, int *piReaders){
   sqlite3_stmt *s;
   int i, rc = sql_get_statement(v, SEGDIR_SELECT_LEVEL_STMT, &s);
   if( rc!=SQLITE_OK ) return rc;
@@ -6231,7 +6214,7 @@
 
     assert( i<MERGE_COUNT );
     rc = leavesReaderInit(v, i, iStart, iEnd, pRootData, nRootData,
-                         &pReaders[i]);
+                          &pReaders[i]);
     if( rc!=SQLITE_OK ) break;
 
     i++;
@@ -6258,8 +6241,8 @@
 */
 /* TODO(shess) Consider putting this inline in segmentMerge(). */
 static int leavesReadersMerge(fulltext_vtab *v,
-                             LeavesReader *pReaders, int nReaders,
-                             LeafWriter *pWriter){
+                              LeavesReader *pReaders, int nReaders,
+                              LeafWriter *pWriter){
   DLReader dlReaders[MERGE_COUNT];
   const char *pTerm = leavesReaderTerm(pReaders);
   int i, nTerm = leavesReaderTermBytes(pReaders);
@@ -6268,8 +6251,8 @@
 
   for(i=0; i<nReaders; i++){
     dlrInit(&dlReaders[i], DL_DEFAULT,
-           leavesReaderData(pReaders+i),
-           leavesReaderDataBytes(pReaders+i));
+            leavesReaderData(pReaders+i),
+            leavesReaderDataBytes(pReaders+i));
   }
 
   return leafWriterStepMerge(v, pWriter, pTerm, nTerm, dlReaders, nReaders);
@@ -6284,7 +6267,7 @@
 */
 static int segdirNextIndex(fulltext_vtab *v, int iLevel, int *pidx){
   int rc = segdir_max_index(v, iLevel, pidx);
-  if( rc==SQLITE_DONE ){             /* No segments at iLevel. */
+  if( rc==SQLITE_DONE ){              /* No segments at iLevel. */
     *pidx = 0;
   }else if( rc==SQLITE_ROW ){
     if( *pidx==(MERGE_COUNT-1) ){
@@ -6370,7 +6353,7 @@
 
 /* Accumulate the union of *acc and *pData into *acc. */
 static void docListAccumulateUnion(DataBuffer *acc,
-                                  const char *pData, int nData) {
+                                   const char *pData, int nData) {
   DataBuffer tmp = *acc;
   dataBufferInit(acc, tmp.nData+nData);
   docListUnion(tmp.pData, tmp.nData, pData, nData, acc);
@@ -6393,8 +6376,8 @@
 ** Internal function for loadSegmentLeaf().
 */
 static int loadSegmentLeavesInt(fulltext_vtab *v, LeavesReader *pReader,
-                               const char *pTerm, int nTerm, int isPrefix,
-                               DataBuffer *out){
+                                const char *pTerm, int nTerm, int isPrefix,
+                                DataBuffer *out){
   /* doclist data is accumulated into pBuffers similar to how one does
   ** increment in binary arithmetic.  If index 0 is empty, the data is
   ** stored there.  If there is data there, it is merged and the
@@ -6414,38 +6397,38 @@
     ** use a confusing name.]
     */
     int c = leafReaderTermCmp(&pReader->leafReader, pTerm, nTerm, isPrefix);
-    if( c>0 ) break;     /* Past any possible matches. */
+    if( c>0 ) break;      /* Past any possible matches. */
     if( c==0 ){
       const char *pData = leavesReaderData(pReader);
       int iBuffer, nData = leavesReaderDataBytes(pReader);
 
       /* Find the first empty buffer. */
       for(iBuffer=0; iBuffer<nBuffers; ++iBuffer){
-       if( 0==pBuffers[iBuffer].nData ) break;
+        if( 0==pBuffers[iBuffer].nData ) break;
       }
 
       /* Out of buffers, add an empty one. */
       if( iBuffer==nBuffers ){
-       if( nBuffers==nMaxBuffers ){
-         DataBuffer *p;
-         nMaxBuffers += 20;
-
-         /* Manual realloc so we can handle NULL appropriately. */
-         p = sqlite3_malloc(nMaxBuffers*sizeof(*pBuffers));
-         if( p==NULL ){
-           rc = SQLITE_NOMEM;
-           break;
-         }
+        if( nBuffers==nMaxBuffers ){
+          DataBuffer *p;
+          nMaxBuffers += 20;
+
+          /* Manual realloc so we can handle NULL appropriately. */
+          p = sqlite3_malloc(nMaxBuffers*sizeof(*pBuffers));
+          if( p==NULL ){
+            rc = SQLITE_NOMEM;
+            break;
+          }
 
-         if( nBuffers>0 ){
-           assert(pBuffers!=NULL);
-           memcpy(p, pBuffers, nBuffers*sizeof(*pBuffers));
-           sqlite3_free(pBuffers);
-         }
-         pBuffers = p;
-       }
-       dataBufferInit(&(pBuffers[nBuffers]), 0);
-       nBuffers++;
+          if( nBuffers>0 ){
+            assert(pBuffers!=NULL);
+            memcpy(p, pBuffers, nBuffers*sizeof(*pBuffers));
+            sqlite3_free(pBuffers);
+          }
+          pBuffers = p;
+        }
+        dataBufferInit(&(pBuffers[nBuffers]), 0);
+        nBuffers++;
       }
 
       /* At this point, must have an empty at iBuffer. */
@@ -6453,32 +6436,32 @@
 
       /* If empty was first buffer, no need for merge logic. */
       if( iBuffer==0 ){
-       dataBufferReplace(&(pBuffers[0]), pData, nData);
+        dataBufferReplace(&(pBuffers[0]), pData, nData);
       }else{
-       /* pAcc is the empty buffer the merged data will end up in. */
-       DataBuffer *pAcc = &(pBuffers[iBuffer]);
-       DataBuffer *p = &(pBuffers[0]);
-
-       /* Handle position 0 specially to avoid need to prime pAcc
-       ** with pData/nData.
-       */
-       dataBufferSwap(p, pAcc);
-       docListAccumulateUnion(pAcc, pData, nData);
-
-       /* Accumulate remaining doclists into pAcc. */
-       for(++p; p<pAcc; ++p){
-         docListAccumulateUnion(pAcc, p->pData, p->nData);
-
-         /* dataBufferReset() could allow a large doclist to blow up
-         ** our memory requirements.
-         */
-         if( p->nCapacity<1024 ){
-           dataBufferReset(p);
-         }else{
-           dataBufferDestroy(p);
-           dataBufferInit(p, 0);
-         }
-       }
+        /* pAcc is the empty buffer the merged data will end up in. */
+        DataBuffer *pAcc = &(pBuffers[iBuffer]);
+        DataBuffer *p = &(pBuffers[0]);
+
+        /* Handle position 0 specially to avoid need to prime pAcc
+        ** with pData/nData.
+        */
+        dataBufferSwap(p, pAcc);
+        docListAccumulateUnion(pAcc, pData, nData);
+
+        /* Accumulate remaining doclists into pAcc. */
+        for(++p; p<pAcc; ++p){
+          docListAccumulateUnion(pAcc, p->pData, p->nData);
+
+          /* dataBufferReset() could allow a large doclist to blow up
+          ** our memory requirements.
+          */
+          if( p->nCapacity<1024 ){
+            dataBufferReset(p);
+          }else{
+            dataBufferDestroy(p);
+            dataBufferInit(p, 0);
+          }
+        }
       }
     }
   }
@@ -6489,12 +6472,12 @@
     int iBuffer;
     for(iBuffer=0; iBuffer<nBuffers; ++iBuffer){
       if( pBuffers[iBuffer].nData>0 ){
-       if( out->nData==0 ){
-         dataBufferSwap(out, &(pBuffers[iBuffer]));
-       }else{
-         docListAccumulateUnion(out, pBuffers[iBuffer].pData,
-                                pBuffers[iBuffer].nData);
-       }
+        if( out->nData==0 ){
+          dataBufferSwap(out, &(pBuffers[iBuffer]));
+        }else{
+          docListAccumulateUnion(out, pBuffers[iBuffer].pData,
+                                 pBuffers[iBuffer].nData);
+        }
       }
     }
   }
@@ -6509,8 +6492,8 @@
 
 /* Call loadSegmentLeavesInt() with pData/nData as input. */
 static int loadSegmentLeaf(fulltext_vtab *v, const char *pData, int nData,
-                          const char *pTerm, int nTerm, int isPrefix,
-                          DataBuffer *out){
+                           const char *pTerm, int nTerm, int isPrefix,
+                           DataBuffer *out){
   LeavesReader reader;
   int rc;
 
@@ -6530,9 +6513,9 @@
 ** out.
 */
 static int loadSegmentLeaves(fulltext_vtab *v,
-                            sqlite_int64 iStartLeaf, sqlite_int64 iEndLeaf,
-                            const char *pTerm, int nTerm, int isPrefix,
-                            DataBuffer *out){
+                             sqlite_int64 iStartLeaf, sqlite_int64 iEndLeaf,
+                             const char *pTerm, int nTerm, int isPrefix,
+                             DataBuffer *out){
   int rc;
   LeavesReader reader;
 
@@ -6558,9 +6541,9 @@
 ** it is not worthwhile.
 */
 static void getChildrenContaining(const char *pData, int nData,
-                                 const char *pTerm, int nTerm, int isPrefix,
-                                 sqlite_int64 *piStartChild,
-                                 sqlite_int64 *piEndChild){
+                                  const char *pTerm, int nTerm, int isPrefix,
+                                  sqlite_int64 *piStartChild,
+                                  sqlite_int64 *piEndChild){
   InteriorReader reader;
 
   assert( nData>1 );
@@ -6605,7 +6588,7 @@
 
   assert( iBlockid!=0 );
   assert( pTerm!=NULL );
-  assert( nTerm!=0 );       /* TODO(shess) Why not allow this? */
+  assert( nTerm!=0 );        /* TODO(shess) Why not allow this? */
   assert( piStartChild!=NULL );
   assert( piEndChild!=NULL );
 
@@ -6620,7 +6603,7 @@
   if( rc!=SQLITE_ROW ) return rc;
 
   getChildrenContaining(sqlite3_column_blob(s, 0), sqlite3_column_bytes(s, 0),
-                       pTerm, nTerm, isPrefix, piStartChild, piEndChild);
+                        pTerm, nTerm, isPrefix, piStartChild, piEndChild);
 
   /* We expect only one row.  We must execute another sqlite3_step()
    * to complete the iteration; otherwise the table will remain
@@ -6637,9 +6620,9 @@
 ** loadSegment() to make error-handling cleaner.
 */
 static int loadSegmentInt(fulltext_vtab *v, const char *pData, int nData,
-                         sqlite_int64 iLeavesEnd,
-                         const char *pTerm, int nTerm, int isPrefix,
-                         DataBuffer *out){
+                          sqlite_int64 iLeavesEnd,
+                          const char *pTerm, int nTerm, int isPrefix,
+                          DataBuffer *out){
   /* Special case where root is a leaf. */
   if( *pData=='\0' ){
     return loadSegmentLeaf(v, pData, nData, pTerm, nTerm, isPrefix, out);
@@ -6651,19 +6634,19 @@
     ** until we find the set of leaf nodes to scan for the term.
     */
     getChildrenContaining(pData, nData, pTerm, nTerm, isPrefix,
-                         &iStartChild, &iEndChild);
+                          &iStartChild, &iEndChild);
     while( iStartChild>iLeavesEnd ){
       sqlite_int64 iNextStart, iNextEnd;
       rc = loadAndGetChildrenContaining(v, iStartChild, pTerm, nTerm, isPrefix,
-                                       &iNextStart, &iNextEnd);
+                                        &iNextStart, &iNextEnd);
       if( rc!=SQLITE_OK ) return rc;
 
       /* If we've branched, follow the end branch, too. */
       if( iStartChild!=iEndChild ){
-       sqlite_int64 iDummy;
-       rc = loadAndGetChildrenContaining(v, iEndChild, pTerm, nTerm, isPrefix,
-                                         &iDummy, &iNextEnd);
-       if( rc!=SQLITE_OK ) return rc;
+        sqlite_int64 iDummy;
+        rc = loadAndGetChildrenContaining(v, iEndChild, pTerm, nTerm, isPrefix,
+                                          &iDummy, &iNextEnd);
+        if( rc!=SQLITE_OK ) return rc;
       }
 
       assert( iNextStart<=iNextEnd );
@@ -6675,7 +6658,7 @@
 
     /* Scan through the leaf segments for doclists. */
     return loadSegmentLeaves(v, iStartChild, iEndChild,
-                            pTerm, nTerm, isPrefix, out);
+                             pTerm, nTerm, isPrefix, out);
   }
 }
 
@@ -6691,15 +6674,15 @@
 */
 /* TODO(shess) The current merge is likely to be slow for large
 ** doclists (though it should process from newest/smallest to
-** oldest/largest, so it may not be that bad). It might be useful to
+** oldest/largest, so it may not be that bad).  It might be useful to
 ** modify things to allow for N-way merging.  This could either be
 ** within a segment, with pairwise merges across segments, or across
 ** all segments at once.
 */
 static int loadSegment(fulltext_vtab *v, const char *pData, int nData,
-                      sqlite_int64 iLeavesEnd,
-                      const char *pTerm, int nTerm, int isPrefix,
-                      DataBuffer *out){
+                       sqlite_int64 iLeavesEnd,
+                       const char *pTerm, int nTerm, int isPrefix,
+                       DataBuffer *out){
   DataBuffer result;
   int rc;
 
@@ -6710,7 +6693,7 @@
 
   dataBufferInit(&result, 0);
   rc = loadSegmentInt(v, pData, nData, iLeavesEnd,
-                     pTerm, nTerm, isPrefix, &result);
+                      pTerm, nTerm, isPrefix, &result);
   if( rc==SQLITE_OK && result.nData>0 ){
     if( out->nData==0 ){
       DataBuffer tmp = *out;
@@ -6758,7 +6741,7 @@
     const int nData = sqlite3_column_bytes(s, 2);
     const sqlite_int64 iLeavesEnd = sqlite3_column_int64(s, 1);
     rc = loadSegment(v, pData, nData, iLeavesEnd, pTerm, nTerm, isPrefix,
-                    &doclist);
+                     &doclist);
     if( rc!=SQLITE_OK ) goto err;
   }
   if( rc==SQLITE_DONE ){
@@ -6770,7 +6753,7 @@
       */
       if( iColumn==v->nColumn) iColumn = -1;
       docListTrim(DL_DEFAULT, doclist.pData, doclist.nData,
-                 iColumn, iType, out);
+                  iColumn, iType, out);
     }
     rc = SQLITE_OK;
   }
@@ -6839,7 +6822,7 @@
     dataBufferReset(&dl);
     dlcAddDoclist(pData[i].pCollector, &dl);
     rc = leafWriterStep(v, &writer,
-                       pData[i].pTerm, pData[i].nTerm, dl.pData, dl.nData);
+                        pData[i].pTerm, pData[i].nTerm, dl.pData, dl.nData);
     if( rc!=SQLITE_OK ) goto err;
   }
   rc = leafWriterFinalize(v, &writer);
@@ -6901,7 +6884,7 @@
 /* This function implements the xUpdate callback; it is the top-level entry
  * point for inserting, deleting or updating a row in a full-text table. */
 static int fulltextUpdate(sqlite3_vtab *pVtab, int nArg, sqlite3_value **ppArg,
-                         sqlite_int64 *pRowid){
+                          sqlite_int64 *pRowid){
   fulltext_vtab *v = (fulltext_vtab *) pVtab;
   int rc;
 
@@ -6915,15 +6898,15 @@
       */
       rc = content_exists(v);
       if( rc==SQLITE_ROW ){
-       rc = SQLITE_OK;
+        rc = SQLITE_OK;
       }else if( rc==SQLITE_DONE ){
-       /* Clear the pending terms so we don't flush a useless level-0
-       ** segment when the transaction closes.
-       */
-       rc = clearPendingTerms(v);
-       if( rc==SQLITE_OK ){
-         rc = segdir_delete_all(v);
-       }
+        /* Clear the pending terms so we don't flush a useless level-0
+        ** segment when the transaction closes.
+        */
+        rc = clearPendingTerms(v);
+        if( rc==SQLITE_OK ){
+          rc = segdir_delete_all(v);
+        }
       }
     }
   } else if( sqlite3_value_type(ppArg[0]) != SQLITE_NULL ){
@@ -6936,10 +6919,10 @@
      */
     sqlite_int64 rowid = sqlite3_value_int64(ppArg[0]);
     if( sqlite3_value_type(ppArg[1]) != SQLITE_INTEGER ||
-       sqlite3_value_int64(ppArg[1]) != rowid ){
+        sqlite3_value_int64(ppArg[1]) != rowid ){
       rc = SQLITE_ERROR;  /* we don't allow changing the rowid */
     }else if( sqlite3_value_type(ppArg[2+v->nColumn+1]) != SQLITE_INTEGER ||
-             sqlite3_value_int64(ppArg[2+v->nColumn+1]) != rowid ){
+              sqlite3_value_int64(ppArg[2+v->nColumn+1]) != rowid ){
       rc = SQLITE_ERROR;  /* we don't allow changing the docid */
     }else{
       assert( nArg==2+v->nColumn+2);
@@ -6955,7 +6938,7 @@
     sqlite3_value *pRequestDocid = ppArg[2+v->nColumn+1];
     assert( nArg==2+v->nColumn+2);
     if( SQLITE_NULL != sqlite3_value_type(pRequestDocid) &&
-       SQLITE_NULL != sqlite3_value_type(ppArg[1]) ){
+        SQLITE_NULL != sqlite3_value_type(ppArg[1]) ){
       /* TODO(shess) Consider allowing this to work if the values are
       ** identical.  I'm inclined to discourage that usage, though,
       ** given that both rowid and docid are special columns.  Better
@@ -6966,7 +6949,7 @@
       rc = SQLITE_ERROR;
     }else{
       if( SQLITE_NULL == sqlite3_value_type(pRequestDocid) ){
-       pRequestDocid = ppArg[1];
+        pRequestDocid = ppArg[1];
       }
       rc = index_insert(v, pRequestDocid, &ppArg[2], pRowid);
     }
@@ -7026,10 +7009,10 @@
     if( argc>=2 ){
       zStart = (const char*)sqlite3_value_text(argv[1]);
       if( argc>=3 ){
-       zEnd = (const char*)sqlite3_value_text(argv[2]);
-       if( argc>=4 ){
-         zEllipsis = (const char*)sqlite3_value_text(argv[3]);
-       }
+        zEnd = (const char*)sqlite3_value_text(argv[2]);
+        if( argc>=4 ){
+          zEllipsis = (const char*)sqlite3_value_text(argv[3]);
+        }
       }
     }
     snippetAllOffsets(pCursor);
@@ -7153,14 +7136,14 @@
   }
 }
 
-/* optimize() helper function. Put the readers in order and iterate
+/* optimize() helper function.  Put the readers in order and iterate
 ** through them, merging doclists for matching terms into pWriter.
 ** Returns SQLITE_OK on success, or the SQLite error code which
 ** prevented success.
 */
 static int optimizeInternal(fulltext_vtab *v,
-                           OptLeavesReader *readers, int nReaders,
-                           LeafWriter *pWriter){
+                            OptLeavesReader *readers, int nReaders,
+                            LeafWriter *pWriter){
   int i, rc = SQLITE_OK;
   DataBuffer doclist, merged, tmp;
 
@@ -7188,9 +7171,9 @@
       /* Trim deletions from the doclist. */
       dataBufferReset(&merged);
       docListTrim(DL_DEFAULT,
-                 optLeavesReaderData(&readers[0]),
-                 optLeavesReaderDataBytes(&readers[0]),
-                 -1, DL_DEFAULT, &merged);
+                  optLeavesReaderData(&readers[0]),
+                  optLeavesReaderDataBytes(&readers[0]),
+                  -1, DL_DEFAULT, &merged);
     }else{
       DLReader dlReaders[MERGE_COUNT];
       int iReader, nReaders;
@@ -7199,33 +7182,33 @@
       ** one pass index 0 will reference the accumulated doclist.
       */
       dlrInit(&dlReaders[0], DL_DEFAULT,
-             optLeavesReaderData(&readers[0]),
-             optLeavesReaderDataBytes(&readers[0]));
+              optLeavesReaderData(&readers[0]),
+              optLeavesReaderDataBytes(&readers[0]));
       iReader = 1;
 
       assert( iReader<i );  /* Must execute the loop at least once. */
       while( iReader<i ){
-       /* Merge 16 inputs per pass. */
-       for( nReaders=1; iReader<i && nReaders<MERGE_COUNT;
-            iReader++, nReaders++ ){
-         dlrInit(&dlReaders[nReaders], DL_DEFAULT,
-                 optLeavesReaderData(&readers[iReader]),
-                 optLeavesReaderDataBytes(&readers[iReader]));
-       }
+        /* Merge 16 inputs per pass. */
+        for( nReaders=1; iReader<i && nReaders<MERGE_COUNT;
+             iReader++, nReaders++ ){
+          dlrInit(&dlReaders[nReaders], DL_DEFAULT,
+                  optLeavesReaderData(&readers[iReader]),
+                  optLeavesReaderDataBytes(&readers[iReader]));
+        }
 
-       /* Merge doclists and swap result into accumulator. */
-       dataBufferReset(&merged);
-       docListMerge(&merged, dlReaders, nReaders);
-       tmp = merged;
-       merged = doclist;
-       doclist = tmp;
+        /* Merge doclists and swap result into accumulator. */
+        dataBufferReset(&merged);
+        docListMerge(&merged, dlReaders, nReaders);
+        tmp = merged;
+        merged = doclist;
+        doclist = tmp;
 
-       while( nReaders-- > 0 ){
-         dlrDestroy(&dlReaders[nReaders]);
-       }
+        while( nReaders-- > 0 ){
+          dlrDestroy(&dlReaders[nReaders]);
+        }
 
-       /* Accumulated doclist to reader 0 for next pass. */
-       dlrInit(&dlReaders[0], DL_DEFAULT, doclist.pData, doclist.nData);
+        /* Accumulated doclist to reader 0 for next pass. */
+        dlrInit(&dlReaders[0], DL_DEFAULT, doclist.pData, doclist.nData);
       }
 
       /* Destroy reader that was left in the pipeline. */
@@ -7234,15 +7217,15 @@
       /* Trim deletions from the doclist. */
       dataBufferReset(&merged);
       docListTrim(DL_DEFAULT, doclist.pData, doclist.nData,
-                 -1, DL_DEFAULT, &merged);
+                  -1, DL_DEFAULT, &merged);
     }
 
     /* Only pass doclists with hits (skip if all hits deleted). */
     if( merged.nData>0 ){
       rc = leafWriterStep(v, pWriter,
-                         optLeavesReaderTerm(&readers[0]),
-                         optLeavesReaderTermBytes(&readers[0]),
-                         merged.pData, merged.nData);
+                          optLeavesReaderTerm(&readers[0]),
+                          optLeavesReaderTermBytes(&readers[0]),
+                          merged.pData, merged.nData);
       if( rc!=SQLITE_OK ) goto err;
     }
 
@@ -7266,12 +7249,12 @@
 ** table-named column.
 */
 static void optimizeFunc(sqlite3_context *pContext,
-                        int argc, sqlite3_value **argv){
+                         int argc, sqlite3_value **argv){
   fulltext_cursor *pCursor;
   if( argc>1 ){
     sqlite3_result_error(pContext, "excess arguments to optimize()",-1);
   }else if( sqlite3_value_type(argv[0])!=SQLITE_BLOB ||
-           sqlite3_value_bytes(argv[0])!=sizeof(pCursor) ){
+            sqlite3_value_bytes(argv[0])!=sizeof(pCursor) ){
     sqlite3_result_error(pContext, "illegal first argument to optimize",-1);
   }else{
     fulltext_vtab *v;
@@ -7292,7 +7275,7 @@
     if( rc!=SQLITE_OK ) goto err;
     if( nReaders==0 || nReaders==1 ){
       sqlite3_result_text(pContext, "Index already optimal", -1,
-                         SQLITE_STATIC);
+                          SQLITE_STATIC);
       return;
     }
 
@@ -7316,14 +7299,14 @@
 
       assert( i<nReaders );
       rc = leavesReaderInit(v, -1, iStart, iEnd, pRootData, nRootData,
-                           &readers[i].reader);
+                            &readers[i].reader);
       if( rc!=SQLITE_OK ) break;
 
       readers[i].segment = i;
       i++;
     }
 
-    /* If we managed to succesfully read them all, optimize them. */
+    /* If we managed to successfully read them all, optimize them. */
     if( rc==SQLITE_DONE ){
       assert( i==nReaders );
       rc = optimizeInternal(v, readers, nReaders, &writer);
@@ -7339,8 +7322,8 @@
     */
     if( rc==SQLITE_OK ){
       for( i=0; i<=iMaxLevel; i++ ){
-       rc = segdir_delete(v, i);
-       if( rc!=SQLITE_OK ) break;
+        rc = segdir_delete(v, i);
+        if( rc!=SQLITE_OK ) break;
       }
 
       if( rc==SQLITE_OK ) rc = leafWriterFinalize(v, &writer);
@@ -7360,7 +7343,7 @@
     {
       char buf[512];
       sqlite3_snprintf(sizeof(buf), buf, "Error in optimize: %s",
-                      sqlite3_errmsg(sqlite3_context_db_handle(pContext)));
+                       sqlite3_errmsg(sqlite3_context_db_handle(pContext)));
       sqlite3_result_error(pContext, buf, -1);
     }
   }
@@ -7371,7 +7354,7 @@
 ** pull the error from the context's db handle.
 */
 static void generateError(sqlite3_context *pContext,
-                         const char *prefix, const char *msg){
+                          const char *prefix, const char *msg){
   char buf[512];
   if( msg==NULL ) msg = sqlite3_errmsg(sqlite3_context_db_handle(pContext));
   sqlite3_snprintf(sizeof(buf), buf, "%s: %s", prefix, msg);
@@ -7385,14 +7368,14 @@
 ** fit in a leaf).
 */
 static int collectSegmentTerms(fulltext_vtab *v, sqlite3_stmt *s,
-                              fts3Hash *pTerms){
+                               fts3Hash *pTerms){
   const sqlite_int64 iStartBlockid = sqlite3_column_int64(s, 0);
   const sqlite_int64 iEndBlockid = sqlite3_column_int64(s, 1);
   const char *pRootData = sqlite3_column_blob(s, 2);
   const int nRootData = sqlite3_column_bytes(s, 2);
   LeavesReader reader;
   int rc = leavesReaderInit(v, 0, iStartBlockid, iEndBlockid,
-                           pRootData, nRootData, &reader);
+                            pRootData, nRootData, &reader);
   if( rc!=SQLITE_OK ) return rc;
 
   while( rc==SQLITE_OK && !leavesReaderAtEnd(&reader) ){
@@ -7436,7 +7419,7 @@
     assert( iTerm<nTerms );
     pData[iTerm].pTerm = fts3HashKey(e);
     pData[iTerm].nTerm = fts3HashKeysize(e);
-    pData[iTerm].pCollector = fts3HashData(e); /* unused */
+    pData[iTerm].pCollector = fts3HashData(e);  /* unused */
   }
   assert( iTerm==nTerms );
 
@@ -7481,7 +7464,7 @@
   if( argc!=3 && argc!=1 ){
     generateError(pContext, "dump_terms", "incorrect arguments");
   }else if( sqlite3_value_type(argv[0])!=SQLITE_BLOB ||
-           sqlite3_value_bytes(argv[0])!=sizeof(pCursor) ){
+            sqlite3_value_bytes(argv[0])!=sizeof(pCursor) ){
     generateError(pContext, "dump_terms", "illegal first argument");
   }else{
     fulltext_vtab *v;
@@ -7500,10 +7483,10 @@
     }else{
       rc = sql_get_statement(v, SEGDIR_SELECT_SEGMENT_STMT, &s);
       if( rc==SQLITE_OK ){
-       rc = sqlite3_bind_int(s, 1, sqlite3_value_int(argv[1]));
-       if( rc==SQLITE_OK ){
-         rc = sqlite3_bind_int(s, 2, sqlite3_value_int(argv[2]));
-       }
+        rc = sqlite3_bind_int(s, 1, sqlite3_value_int(argv[1]));
+        if( rc==SQLITE_OK ){
+          rc = sqlite3_bind_int(s, 2, sqlite3_value_int(argv[2]));
+        }
       }
     }
 
@@ -7525,22 +7508,22 @@
     }else{
       const int nTerms = fts3HashCount(&terms);
       if( nTerms>0 ){
-       rc = generateTermsResult(pContext, &terms);
-       if( rc==SQLITE_NOMEM ){
-         generateError(pContext, "dump_terms", "out of memory");
-       }else{
-         assert( rc==SQLITE_OK );
-       }
+        rc = generateTermsResult(pContext, &terms);
+        if( rc==SQLITE_NOMEM ){
+          generateError(pContext, "dump_terms", "out of memory");
+        }else{
+          assert( rc==SQLITE_OK );
+        }
       }else if( argc==3 ){
-       /* The specific segment asked for could not be found. */
-       generateError(pContext, "dump_terms", "segment not found");
+        /* The specific segment asked for could not be found. */
+        generateError(pContext, "dump_terms", "segment not found");
       }else{
-       /* No segments found. */
-       /* TODO(shess): It should be impossible to reach this.  This
-       ** case can only happen for an empty table, in which case
-       ** SQLite has no rows to call this function on.
-       */
-       sqlite3_result_null(pContext);
+        /* No segments found. */
+        /* TODO(shess): It should be impossible to reach this.  This
+        ** case can only happen for an empty table, in which case
+        ** SQLite has no rows to call this function on.
+        */
+        sqlite3_result_null(pContext);
       }
     }
     sqlite3Fts3HashClear(&terms);
@@ -7551,7 +7534,7 @@
 ** pContext.
 */
 static void createDoclistResult(sqlite3_context *pContext,
-                               const char *pData, int nData){
+                                const char *pData, int nData){
   DataBuffer dump;
   DLReader dlReader;
 
@@ -7571,33 +7554,33 @@
       int iColumn = plrColumn(&plReader);
 
       sqlite3_snprintf(sizeof(buf), buf, "[%lld %d[",
-                      dlrDocid(&dlReader), iColumn);
+                       dlrDocid(&dlReader), iColumn);
       dataBufferAppend(&dump, buf, strlen(buf));
 
       for( ; !plrAtEnd(&plReader); plrStep(&plReader) ){
-       if( plrColumn(&plReader)!=iColumn ){
-         iColumn = plrColumn(&plReader);
-         sqlite3_snprintf(sizeof(buf), buf, "] %d[", iColumn);
-         assert( dump.nData>0 );
-         dump.nData--;                     /* Overwrite trailing space. */
-         assert( dump.pData[dump.nData]==' ');
-         dataBufferAppend(&dump, buf, strlen(buf));
-       }
-       if( DL_DEFAULT==DL_POSITIONS_OFFSETS ){
-         sqlite3_snprintf(sizeof(buf), buf, "%d,%d,%d ",
-                          plrPosition(&plReader),
-                          plrStartOffset(&plReader), plrEndOffset(&plReader));
-       }else if( DL_DEFAULT==DL_POSITIONS ){
-         sqlite3_snprintf(sizeof(buf), buf, "%d ", plrPosition(&plReader));
-       }else{
-         assert( NULL=="Unhandled DL_DEFAULT value");
-       }
-       dataBufferAppend(&dump, buf, strlen(buf));
+        if( plrColumn(&plReader)!=iColumn ){
+          iColumn = plrColumn(&plReader);
+          sqlite3_snprintf(sizeof(buf), buf, "] %d[", iColumn);
+          assert( dump.nData>0 );
+          dump.nData--;                     /* Overwrite trailing space. */
+          assert( dump.pData[dump.nData]==' ');
+          dataBufferAppend(&dump, buf, strlen(buf));
+        }
+        if( DL_DEFAULT==DL_POSITIONS_OFFSETS ){
+          sqlite3_snprintf(sizeof(buf), buf, "%d,%d,%d ",
+                           plrPosition(&plReader),
+                           plrStartOffset(&plReader), plrEndOffset(&plReader));
+        }else if( DL_DEFAULT==DL_POSITIONS ){
+          sqlite3_snprintf(sizeof(buf), buf, "%d ", plrPosition(&plReader));
+        }else{
+          assert( NULL=="Unhandled DL_DEFAULT value");
+        }
+        dataBufferAppend(&dump, buf, strlen(buf));
       }
       plrDestroy(&plReader);
 
       assert( dump.nData>0 );
-      dump.nData--;                    /* Overwrite trailing space. */
+      dump.nData--;                     /* Overwrite trailing space. */
       assert( dump.pData[dump.nData]==' ');
       dataBufferAppend(&dump, "]] ", 3);
     }
@@ -7605,7 +7588,7 @@
   dlrDestroy(&dlReader);
 
   assert( dump.nData>0 );
-  dump.nData--;                            /* Overwrite trailing space. */
+  dump.nData--;                     /* Overwrite trailing space. */
   assert( dump.pData[dump.nData]==' ');
   dump.pData[dump.nData] = '\0';
   assert( dump.nData>0 );
@@ -7645,10 +7628,10 @@
   if( argc!=2 && argc!=4 ){
     generateError(pContext, "dump_doclist", "incorrect arguments");
   }else if( sqlite3_value_type(argv[0])!=SQLITE_BLOB ||
-           sqlite3_value_bytes(argv[0])!=sizeof(pCursor) ){
+            sqlite3_value_bytes(argv[0])!=sizeof(pCursor) ){
     generateError(pContext, "dump_doclist", "illegal first argument");
   }else if( sqlite3_value_text(argv[1])==NULL ||
-           sqlite3_value_text(argv[1])[0]=='\0' ){
+            sqlite3_value_text(argv[1])[0]=='\0' ){
     generateError(pContext, "dump_doclist", "empty second argument");
   }else{
     const char *pTerm = (const char *)sqlite3_value_text(argv[1]);
@@ -7673,45 +7656,45 @@
       /* Get our specific segment's information. */
       rc = sql_get_statement(v, SEGDIR_SELECT_SEGMENT_STMT, &s);
       if( rc==SQLITE_OK ){
-       rc = sqlite3_bind_int(s, 1, sqlite3_value_int(argv[2]));
-       if( rc==SQLITE_OK ){
-         rc = sqlite3_bind_int(s, 2, sqlite3_value_int(argv[3]));
-       }
+        rc = sqlite3_bind_int(s, 1, sqlite3_value_int(argv[2]));
+        if( rc==SQLITE_OK ){
+          rc = sqlite3_bind_int(s, 2, sqlite3_value_int(argv[3]));
+        }
       }
 
       if( rc==SQLITE_OK ){
-       rc = sqlite3_step(s);
+        rc = sqlite3_step(s);
 
-       if( rc==SQLITE_DONE ){
-         dataBufferDestroy(&doclist);
-         generateError(pContext, "dump_doclist", "segment not found");
-         return;
-       }
+        if( rc==SQLITE_DONE ){
+          dataBufferDestroy(&doclist);
+          generateError(pContext, "dump_doclist", "segment not found");
+          return;
+        }
 
-       /* Found a segment, load it into doclist. */
-       if( rc==SQLITE_ROW ){
-         const sqlite_int64 iLeavesEnd = sqlite3_column_int64(s, 1);
-         const char *pData = sqlite3_column_blob(s, 2);
-         const int nData = sqlite3_column_bytes(s, 2);
-
-         /* loadSegment() is used by termSelect() to load each
-         ** segment's data.
-         */
-         rc = loadSegment(v, pData, nData, iLeavesEnd, pTerm, nTerm, 0,
-                          &doclist);
-         if( rc==SQLITE_OK ){
-           rc = sqlite3_step(s);
-
-           /* Should not have more than one matching segment. */
-           if( rc!=SQLITE_DONE ){
-             sqlite3_reset(s);
-             dataBufferDestroy(&doclist);
-             generateError(pContext, "dump_doclist", "invalid segdir");
-             return;
-           }
-           rc = SQLITE_OK;
-         }
-       }
+        /* Found a segment, load it into doclist. */
+        if( rc==SQLITE_ROW ){
+          const sqlite_int64 iLeavesEnd = sqlite3_column_int64(s, 1);
+          const char *pData = sqlite3_column_blob(s, 2);
+          const int nData = sqlite3_column_bytes(s, 2);
+
+          /* loadSegment() is used by termSelect() to load each
+          ** segment's data.
+          */
+          rc = loadSegment(v, pData, nData, iLeavesEnd, pTerm, nTerm, 0,
+                           &doclist);
+          if( rc==SQLITE_OK ){
+            rc = sqlite3_step(s);
+
+            /* Should not have more than one matching segment. */
+            if( rc!=SQLITE_DONE ){
+              sqlite3_reset(s);
+              dataBufferDestroy(&doclist);
+              generateError(pContext, "dump_doclist", "invalid segdir");
+              return;
+            }
+            rc = SQLITE_OK;
+          }
+        }
       }
 
       sqlite3_reset(s);
@@ -7719,14 +7702,14 @@
 
     if( rc==SQLITE_OK ){
       if( doclist.nData>0 ){
-       createDoclistResult(pContext, doclist.pData, doclist.nData);
+        createDoclistResult(pContext, doclist.pData, doclist.nData);
       }else{
-       /* TODO(shess): This can happen if the term is not present, or
-       ** if all instances of the term have been deleted and this is
-       ** an all-index dump.  It may be interesting to distinguish
-       ** these cases.
-       */
-       sqlite3_result_text(pContext, "", 0, SQLITE_STATIC);
+        /* TODO(shess): This can happen if the term is not present, or
+        ** if all instances of the term have been deleted and this is
+        ** an all-index dump.  It may be interesting to distinguish
+        ** these cases.
+        */
+        sqlite3_result_text(pContext, "", 0, SQLITE_STATIC);
       }
     }else if( rc==SQLITE_NOMEM ){
       /* Handle out-of-memory cases specially because if they are
@@ -7800,8 +7783,8 @@
     "ALTER TABLE %Q.'%q_content'  RENAME TO '%q_content';"
     "ALTER TABLE %Q.'%q_segments' RENAME TO '%q_segments';"
     "ALTER TABLE %Q.'%q_segdir'   RENAME TO '%q_segdir';"
-    , p->zDb, p->zName, zName
-    , p->zDb, p->zName, zName
+    , p->zDb, p->zName, zName 
+    , p->zDb, p->zName, zName 
     , p->zDb, p->zName, zName
   );
   if( zSql ){
@@ -7812,24 +7795,24 @@
 }
 
 static const sqlite3_module fts3Module = {
-  /* iVersion     */ 0,
-  /* xCreate      */ fulltextCreate,
-  /* xConnect     */ fulltextConnect,
+  /* iVersion      */ 0,
+  /* xCreate       */ fulltextCreate,
+  /* xConnect      */ fulltextConnect,
   /* xBestIndex    */ fulltextBestIndex,
   /* xDisconnect   */ fulltextDisconnect,
-  /* xDestroy     */ fulltextDestroy,
-  /* xOpen        */ fulltextOpen,
-  /* xClose       */ fulltextClose,
-  /* xFilter      */ fulltextFilter,
-  /* xNext        */ fulltextNext,
-  /* xEof         */ fulltextEof,
-  /* xColumn      */ fulltextColumn,
-  /* xRowid       */ fulltextRowid,
-  /* xUpdate      */ fulltextUpdate,
-  /* xBegin       */ fulltextBegin,
-  /* xSync        */ fulltextSync,
-  /* xCommit      */ fulltextCommit,
-  /* xRollback    */ fulltextRollback,
+  /* xDestroy      */ fulltextDestroy,
+  /* xOpen         */ fulltextOpen,
+  /* xClose        */ fulltextClose,
+  /* xFilter       */ fulltextFilter,
+  /* xNext         */ fulltextNext,
+  /* xEof          */ fulltextEof,
+  /* xColumn       */ fulltextColumn,
+  /* xRowid        */ fulltextRowid,
+  /* xUpdate       */ fulltextUpdate,
+  /* xBegin        */ fulltextBegin,
+  /* xSync         */ fulltextSync,
+  /* xCommit       */ fulltextCommit,
+  /* xRollback     */ fulltextRollback,
   /* xFindFunction */ fulltextFindFunction,
   /* xRename */       fulltextRename,
 };
Index: tracker-fts-hash.c
===================================================================
--- tracker-fts-hash.c  (revision 3021)
+++ tracker-fts-hash.c  (working copy)
@@ -1,7 +1,7 @@
 /*
 ** 2001 September 22
 **
-** The author disclaims copyright to this source code. In place of
+** The author disclaims copyright to this source code.  In place of
 ** a legal notice, here is a blessing:
 **
 **    May you do good and not evil.
@@ -18,10 +18,10 @@
 ** The code in this file is only compiled if:
 **
 **     * The FTS3 module is being built as an extension
-**      (in which case SQLITE_CORE is not defined), or
+**       (in which case SQLITE_CORE is not defined), or
 **
 **     * The FTS3 module is being built into the core of
-**      SQLite (in which case SQLITE_ENABLE_FTS3 is defined).
+**       SQLite (in which case SQLITE_ENABLE_FTS3 is defined).
 */
 
 #include <assert.h>
@@ -49,8 +49,8 @@
 ** fields of the Hash structure.
 **
 ** "pNew" is a pointer to the hash table that is to be initialized.
-** keyClass is one of the constants
-** FTS3_HASH_BINARY or FTS3_HASH_STRING.  The value of keyClass
+** keyClass is one of the constants 
+** FTS3_HASH_BINARY or FTS3_HASH_STRING.  The value of keyClass 
 ** determines what kind of key the hash table will use.  "copyKey" is
 ** true if the hash table should make its own private copy of keys and
 ** false if it should just use the supplied pointer.
@@ -71,7 +71,7 @@
 ** to the empty state.
 */
 void sqlite3Fts3HashClear(fts3Hash *pH){
-  fts3HashElem *elem;        /* For looping over all elements of the table */
+  fts3HashElem *elem;         /* For looping over all elements of the table */
 
   assert( pH!=0 );
   elem = pH->first;
@@ -127,7 +127,7 @@
 /*
 ** Return a pointer to the appropriate hash function given the key class.
 **
-** The C syntax in this function definition may be unfamilar to some
+** The C syntax in this function definition may be unfamilar to some 
 ** programmers, so we provide the following additional explanation:
 **
 ** The name of the function is "ftsHashFunction".  The function takes a
@@ -163,17 +163,17 @@
 /* Link an element into the hash table
 */
 static void fts3HashInsertElement(
-  fts3Hash *pH,                   /* The complete hash table */
+  fts3Hash *pH,            /* The complete hash table */
   struct _fts3ht *pEntry,  /* The entry into which pNew is inserted */
-  fts3HashElem *pNew      /* The element to be inserted */
+  fts3HashElem *pNew       /* The element to be inserted */
 ){
-  fts3HashElem *pHead;    /* First element already in pEntry */
+  fts3HashElem *pHead;     /* First element already in pEntry */
   pHead = pEntry->chain;
   if( pHead ){
     pNew->next = pHead;
     pNew->prev = pHead->prev;
     if( pHead->prev ){ pHead->prev->next = pNew; }
-    else            { pH->first = pNew; }
+    else             { pH->first = pNew; }
     pHead->prev = pNew;
   }else{
     pNew->next = pH->first;
@@ -187,11 +187,11 @@
 
 
 /* Resize the hash table so that it cantains "new_size" buckets.
-** "new_size" must be a power of 2.  The hash table might fail
+** "new_size" must be a power of 2.  The hash table might fail 
 ** to resize if sqliteMalloc() fails.
 */
 static void fts3Rehash(fts3Hash *pH, int new_size){
-  struct _fts3ht *new_ht;         /* The new hash table */
+  struct _fts3ht *new_ht;          /* The new hash table */
   fts3HashElem *elem, *next_elem;  /* For looping over existing elements */
   int (*xHash)(const void*,int);   /* The hash function */
 
@@ -217,10 +217,10 @@
   const fts3Hash *pH, /* The pH to be searched */
   const void *pKey,   /* The key we are searching for */
   int nKey,
-  int h                      /* The hash for this key. */
+  int h               /* The hash for this key. */
 ){
-  fts3HashElem *elem;           /* Used to loop thru the element list */
-  int count;                    /* Number of elements left to test */
+  fts3HashElem *elem;            /* Used to loop thru the element list */
+  int count;                     /* Number of elements left to test */
   int (*xCompare)(const void*,int,const void*,int);  /* comparison function */
 
   if( pH->ht ){
@@ -229,8 +229,8 @@
     count = pEntry->count;
     xCompare = ftsCompareFunction(pH->keyClass);
     while( count-- && elem ){
-      if( (*xCompare)(elem->pKey,elem->nKey,pKey,nKey)==0 ){
-       return elem;
+      if( (*xCompare)(elem->pKey,elem->nKey,pKey,nKey)==0 ){ 
+        return elem;
       }
       elem = elem->next;
     }
@@ -242,13 +242,13 @@
 ** element and a hash on the element's key.
 */
 static void fts3RemoveElementByHash(
-  fts3Hash *pH,                /* The pH containing "elem" */
-  fts3HashElem* elem,  /* The element to be removed from the pH */
-  int h                        /* Hash value for the element */
+  fts3Hash *pH,         /* The pH containing "elem" */
+  fts3HashElem* elem,   /* The element to be removed from the pH */
+  int h                 /* Hash value for the element */
 ){
   struct _fts3ht *pEntry;
   if( elem->prev ){
-    elem->prev->next = elem->next;
+    elem->prev->next = elem->next; 
   }else{
     pH->first = elem->next;
   }
@@ -280,8 +280,8 @@
 ** found, or NULL if there is no match.
 */
 void *sqlite3Fts3HashFind(const fts3Hash *pH, const void *pKey, int nKey){
-  int h;                /* A hash on key */
-  fts3HashElem *elem;   /* The element that matches key */
+  int h;                 /* A hash on key */
+  fts3HashElem *elem;    /* The element that matches key */
   int (*xHash)(const void*,int);  /* The hash function */
 
   if( pH==0 || pH->ht==0 ) return 0;
@@ -297,7 +297,7 @@
 ** and the data is "data".
 **
 ** If no element exists with a matching key, then a new
-** element is created. A copy of the key is made if the copyKey
+** element is created.  A copy of the key is made if the copyKey
 ** flag is set.  NULL is returned.
 **
 ** If another element already exists with the same key, then the
@@ -311,12 +311,12 @@
 void *sqlite3Fts3HashInsert(
   fts3Hash *pH,        /* The hash table to insert into */
   const void *pKey,    /* The key */
-  int nKey,           /* Number of bytes in the key */
-  void *data          /* The data */
+  int nKey,            /* Number of bytes in the key */
+  void *data           /* The data */
 ){
-  int hraw;                /* Raw hash value of the key */
-  int h;                   /* the hash of the key modulo hash table size */
-  fts3HashElem *elem;      /* Used to loop thru the element list */
+  int hraw;                 /* Raw hash value of the key */
+  int h;                    /* the hash of the key modulo hash table size */
+  fts3HashElem *elem;       /* Used to loop thru the element list */
   fts3HashElem *new_elem;   /* New element added to the pH */
   int (*xHash)(const void*,int);  /* The hash function */
 


[Date Prev][Date Next]   [Thread Prev][Thread Next]   [Thread Index] [Date Index] [Author Index]