fts2.c

来自「sqlite database for embed linux」· C语言代码 · 共 1,979 行 · 第 1/5 页
1,979 行
    */    if( dlrDocData(readers[0].pReader)==pStart+nStart ){      nStart += dlrDocDataBytes(readers[0].pReader);    }else{      if( pStart!=0 ){        dlwAppend(&writer, pStart, nStart, iFirstDocid, iLastDocid);      }      pStart = dlrDocData(readers[0].pReader);      nStart = dlrDocDataBytes(readers[0].pReader);      iFirstDocid = iDocid;    }    iLastDocid = iDocid;    dlrStep(readers[0].pReader);    /* Drop all of the older elements with the same docid. */    for(i=1; i<nReaders &&             !dlrAtEnd(readers[i].pReader) &&             dlrDocid(readers[i].pReader)==iDocid; i++){      dlrStep(readers[i].pReader);    }    /* Get the readers back into order. */    while( i-->0 ){      orderedDLReaderReorder(readers+i, nReaders-i);    }  }  /* Copy over any remaining elements. */  if( nStart>0 ) dlwAppend(&writer, pStart, nStart, iFirstDocid, iLastDocid);  dlwDestroy(&writer);}/* pLeft and pRight are DLReaders positioned to the same docid.**** If there are no instances in pLeft or pRight where the position** of pLeft is one less than the position of pRight, then this** routine adds nothing to pOut.**** If there are one or more instances where positions from pLeft** are exactly one less than positions from pRight, then add a new** document record to pOut.  If pOut wants to hold positions, then** include the positions from pRight that are one more than a** position in pLeft.  In other words:  pRight.iPos==pLeft.iPos+1.*/static void mergePosList(DLReader *pLeft, DLReader *pRight, DLWriter *pOut){  PLReader left, right;  PLWriter writer;  int match = 0;  assert( dlrDocid(pLeft)==dlrDocid(pRight) );  assert( pOut->iType!=DL_POSITIONS_OFFSETS );  plrInit(&left, pLeft);  plrInit(&right, pRight);  while( !plrAtEnd(&left) && !plrAtEnd(&right) ){    if( plrColumn(&left)<plrColumn(&right) ){      plrStep(&left);    }else if( plrColumn(&left)>plrColumn(&right) ){      plrStep(&right);    }else if( plrPosition(&left)+1<plrPosition(&right) ){      plrStep(&left);    }else if( plrPosition(&left)+1>plrPosition(&right) ){      plrStep(&right);    }else{      if( !match ){        plwInit(&writer, pOut, dlrDocid(pLeft));        match = 1;      }      plwAdd(&writer, plrColumn(&right), plrPosition(&right), 0, 0);      plrStep(&left);      plrStep(&right);    }  }  if( match ){    plwTerminate(&writer);    plwDestroy(&writer);  }  plrDestroy(&left);  plrDestroy(&right);}/* We have two doclists with positions:  pLeft and pRight.** Write the phrase intersection of these two doclists into pOut.**** A phrase intersection means that two documents only match** if pLeft.iPos+1==pRight.iPos.**** iType controls the type of data written to pOut.  If iType is** DL_POSITIONS, the positions are those from pRight.*/static void docListPhraseMerge(  const char *pLeft, int nLeft,  const char *pRight, int nRight,  DocListType iType,  DataBuffer *pOut      /* Write the combined doclist here */){  DLReader left, right;  DLWriter writer;  if( nLeft==0 || nRight==0 ) return;  assert( iType!=DL_POSITIONS_OFFSETS );  dlrInit(&left, DL_POSITIONS, pLeft, nLeft);  dlrInit(&right, DL_POSITIONS, pRight, nRight);  dlwInit(&writer, iType, pOut);  while( !dlrAtEnd(&left) && !dlrAtEnd(&right) ){    if( dlrDocid(&left)<dlrDocid(&right) ){      dlrStep(&left);    }else if( dlrDocid(&right)<dlrDocid(&left) ){      dlrStep(&right);    }else{      mergePosList(&left, &right, &writer);      dlrStep(&left);      dlrStep(&right);    }  }  dlrDestroy(&left);  dlrDestroy(&right);  dlwDestroy(&writer);}/* We have two DL_DOCIDS doclists:  pLeft and pRight.** Write the intersection of these two doclists into pOut as a** DL_DOCIDS doclist.*/static void docListAndMerge(  const char *pLeft, int nLeft,  const char *pRight, int nRight,  DataBuffer *pOut      /* Write the combined doclist here */){  DLReader left, right;  DLWriter writer;  if( nLeft==0 || nRight==0 ) return;  dlrInit(&left, DL_DOCIDS, pLeft, nLeft);  dlrInit(&right, DL_DOCIDS, pRight, nRight);  dlwInit(&writer, DL_DOCIDS, pOut);  while( !dlrAtEnd(&left) && !dlrAtEnd(&right) ){    if( dlrDocid(&left)<dlrDocid(&right) ){      dlrStep(&left);    }else if( dlrDocid(&right)<dlrDocid(&left) ){      dlrStep(&right);    }else{      dlwAdd(&writer, dlrDocid(&left));      dlrStep(&left);      dlrStep(&right);    }  }  dlrDestroy(&left);  dlrDestroy(&right);  dlwDestroy(&writer);}/* We have two DL_DOCIDS doclists:  pLeft and pRight.** Write the union of these two doclists into pOut as a** DL_DOCIDS doclist.*/static void docListOrMerge(  const char *pLeft, int nLeft,  const char *pRight, int nRight,  DataBuffer *pOut      /* Write the combined doclist here */){  DLReader left, right;  DLWriter writer;  if( nLeft==0 ){    dataBufferAppend(pOut, pRight, nRight);    return;  }  if( nRight==0 ){    dataBufferAppend(pOut, pLeft, nLeft);    return;  }  dlrInit(&left, DL_DOCIDS, pLeft, nLeft);  dlrInit(&right, DL_DOCIDS, pRight, nRight);  dlwInit(&writer, DL_DOCIDS, pOut);  while( !dlrAtEnd(&left) || !dlrAtEnd(&right) ){    if( dlrAtEnd(&right) ){      dlwAdd(&writer, dlrDocid(&left));      dlrStep(&left);    }else if( dlrAtEnd(&left) ){      dlwAdd(&writer, dlrDocid(&right));      dlrStep(&right);    }else if( dlrDocid(&left)<dlrDocid(&right) ){      dlwAdd(&writer, dlrDocid(&left));      dlrStep(&left);    }else if( dlrDocid(&right)<dlrDocid(&left) ){      dlwAdd(&writer, dlrDocid(&right));      dlrStep(&right);    }else{      dlwAdd(&writer, dlrDocid(&left));      dlrStep(&left);      dlrStep(&right);    }  }  dlrDestroy(&left);  dlrDestroy(&right);  dlwDestroy(&writer);}/* We have two DL_DOCIDS doclists:  pLeft and pRight.** Write into pOut as DL_DOCIDS doclist containing all documents that** occur in pLeft but not in pRight.*/static void docListExceptMerge(  const char *pLeft, int nLeft,  const char *pRight, int nRight,  DataBuffer *pOut      /* Write the combined doclist here */){  DLReader left, right;  DLWriter writer;  if( nLeft==0 ) return;  if( nRight==0 ){    dataBufferAppend(pOut, pLeft, nLeft);    return;  }  dlrInit(&left, DL_DOCIDS, pLeft, nLeft);  dlrInit(&right, DL_DOCIDS, pRight, nRight);  dlwInit(&writer, DL_DOCIDS, pOut);  while( !dlrAtEnd(&left) ){    while( !dlrAtEnd(&right) && dlrDocid(&right)<dlrDocid(&left) ){      dlrStep(&right);    }    if( dlrAtEnd(&right) || dlrDocid(&left)<dlrDocid(&right) ){      dlwAdd(&writer, dlrDocid(&left));    }    dlrStep(&left);  }  dlrDestroy(&left);  dlrDestroy(&right);  dlwDestroy(&writer);}static char *string_dup_n(const char *s, int n){  char *str = malloc(n + 1);  memcpy(str, s, n);  str[n] = '\0';  return str;}/* Duplicate a string; the caller must free() the returned string. * (We don't use strdup() since it's not part of the standard C library and * may not be available everywhere.) */static char *string_dup(const char *s){  return string_dup_n(s, strlen(s));}/* Format a string, replacing each occurrence of the % character with * zDb.zName.  This may be more convenient than sqlite_mprintf() * when one string is used repeatedly in a format string. * The caller must free() the returned string. */static char *string_format(const char *zFormat,                           const char *zDb, const char *zName){  const char *p;  size_t len = 0;  size_t nDb = strlen(zDb);  size_t nName = strlen(zName);  size_t nFullTableName = nDb+1+nName;  char *result;  char *r;  /* first compute length needed */  for(p = zFormat ; *p ; ++p){    len += (*p=='%' ? nFullTableName : 1);  }  len += 1;  /* for null terminator */  r = result = malloc(len);  for(p = zFormat; *p; ++p){    if( *p=='%' ){      memcpy(r, zDb, nDb);      r += nDb;      *r++ = '.';      memcpy(r, zName, nName);      r += nName;    } else {      *r++ = *p;    }  }  *r++ = '\0';  assert( r == result + len );  return result;}static int sql_exec(sqlite3 *db, const char *zDb, const char *zName,                    const char *zFormat){  char *zCommand = string_format(zFormat, zDb, zName);  int rc;  TRACE(("FTS2 sql: %s\n", zCommand));  rc = sqlite3_exec(db, zCommand, NULL, 0, NULL);  free(zCommand);  return rc;}static int sql_prepare(sqlite3 *db, const char *zDb, const char *zName,                       sqlite3_stmt **ppStmt, const char *zFormat){  char *zCommand = string_format(zFormat, zDb, zName);  int rc;  TRACE(("FTS2 prepare: %s\n", zCommand));  rc = sqlite3_prepare(db, zCommand, -1, ppStmt, NULL);  free(zCommand);  return rc;}/* end utility functions *//* Forward reference */typedef struct fulltext_vtab fulltext_vtab;/* A single term in a query is represented by an instances of** the following structure.*/typedef struct QueryTerm {  short int nPhrase; /* How many following terms are part of the same phrase */  short int iPhrase; /* This is the i-th term of a phrase. */  short int iColumn; /* Column of the index that must match this term */  signed char isOr;  /* this term is preceded by "OR" */  signed char isNot; /* this term is preceded by "-" */  char *pTerm;       /* text of the term.  '\000' terminated.  malloced */  int nTerm;         /* Number of bytes in pTerm[] */} QueryTerm;/* A query string is parsed into a Query structure. * * We could, in theory, allow query strings to be complicated * nested expressions with precedence determined by parentheses. * But none of the major search engines do this.  (Perhaps the * feeling is that an parenthesized expression is two complex of * an idea for the average user to grasp.)  Taking our lead from * the major search engines, we will allow queries to be a list * of terms (with an implied AND operator) or phrases in double-quotes, * with a single optional "-" before each non-phrase term to designate * negation and an optional OR connector. * * OR binds more tightly than the implied AND, which is what the * major search engines seem to do.  So, for example: *  *    [one two OR three]     ==>    one AND (two OR three) *    [one OR two three]     ==>    (one OR two) AND three * * A "-" before a term matches all entries that lack that term. * The "-" must occur immediately before the term with in intervening * space.  This is how the search engines do it. * * A NOT term cannot be the right-hand operand of an OR.  If this * occurs in the query string, the NOT is ignored: * *    [one OR -two]          ==>    one OR two * */typedef struct Query {  fulltext_vtab *pFts;  /* The full text index */  int nTerms;           /* Number of terms in the query */  QueryTerm *pTerms;    /* Array of terms.  Space obtained from malloc() */  int nextIsOr;         /* Set the isOr flag on the next inserted term */  int nextColumn;       /* Next word parsed must be in this column */  int dfltColumn;       /* The default column */} Query;/*** An instance of the following structure keeps track of generated** matching-word offset information and snippets.*/typedef struct Snippet {  int nMatch;     /* Total number of matches */  int nAlloc;     /* Space allocated for aMatch[] */  struct snippetMatch { /* One entry for each matching term */    char snStatus;       /* Status flag for use while constructing snippets */    short int iCol;      /* The column that contains the match */    short int iTerm;     /* The index in Query.pTerms[] of the matching term */    short int nByte;     /* Number of bytes in the term */    int iStart;          /* The offset to the first character of the term */  } *aMatch;      /* Points to space obtained from malloc */  char *zOffset;  /* Text rendering of aMatch[] */  int nOffset;    /* strlen(zOffset) */  char *zSnippet; /* Snippet text */  int nSnippet;   /* strlen(zSnippet) */} Snippet;
fts2.c - 源码说明

本页面展示了「sqlite database for embed linux」中的 fts2.c 源码文件，采用 C语言编程语言编写，共 1,979 行代码。您可以在线阅读完整代码内容，也可以返回资源详情页下载完整源码包进行本地学习和开发。
虫虫下载站收录了大量与database相关的技术资源，包括源代码、技术文档、电路图等，是电子工程师和嵌入式开发者的专业学习平台。
⌨️ 快捷键说明

复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?