fts5origintext6.test 7.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210
  1. # 2014 Jan 08
  2. #
  3. # The author disclaims copyright to this source code. In place of
  4. # a legal notice, here is a blessing:
  5. #
  6. # May you do good and not evil.
  7. # May you find forgiveness for yourself and forgive others.
  8. # May you share freely, never taking more than you give.
  9. #
  10. #***********************************************************************
  11. #
  12. # Tests focused on phrase queries.
  13. #
  14. source [file join [file dirname [info script]] fts5_common.tcl]
  15. set testprefix fts5origintext6
  16. # If SQLITE_ENABLE_FTS5 is not defined, omit this file.
  17. ifcapable !fts5 {
  18. finish_test
  19. return
  20. }
  21. proc insert_data {tbl} {
  22. db eval "
  23. INSERT INTO $tbl (rowid, x, y) VALUES
  24. (1, 'ChH BDd HhG efc BjJ BGi GBG FdD','ciJ AFf ADf fBJ fhC GFI JEH fcA'),
  25. (2, 'deg AIG Fie jII cCd Hbf igF fEE','GeA Ija gJg EDc HFi DDI dCf aDd'),
  26. (3, 'IJC hga deC Jfa Aeg hfh CcH dfb','ajD hgC Jaf IfH CHe jIG AjD adF'),
  27. (4, 'FiH GJH IDA AiG bBc CGG Eih bIH','hHg JaH aii IHE Ggd gcH gji CGc'),
  28. (5, 'ceg CAd jFI GAB BGg EeC IdH acG','bBC eIG ifH eDE Adj bjb GCj ebA'),
  29. (6, 'Eac Fbh aFF Eea jeG EIj HCc JJH','hbd giE Gfe eiI dEF abE cJf cAb'),
  30. (7, 'dic hAc jEC AiG FEF jHc HiD HBI','aEd ebE Gfi AJG EBA faj GiG jjE'),
  31. (8, 'Fca iEe EgE jjJ gce ijf EGc EBi','gaI dhH bFg CFc HeC CjI Jfg ccH'),
  32. (9, 'cfd iaa HCf iHJ HjG ffh ABb ibi','CfG bia Dai eii Ejg Jeg fCg hDb'),
  33. (10, 'Jjf hJC IID HJj bGB EbJ cgg eBj','jci jhi JAF jIg Bei Bcd cAC AJd'),
  34. (11, 'egG Cdi bFf fEB hfH jDH jia Efd','FAd eCg fAi aiC baC eJG acF iGE'),
  35. (12, 'Ada Gde CJI ADG gJA Cbb ccF iAB','eAE ajC FBB ccd Jgh fJg ieg hGE'),
  36. (13, 'gBb fDG Jdd HdD fiJ Bed Cig iGg','heC FeI iaj gdg ebB giC HaD FIe'),
  37. (14, 'FiI iDd Ffe igI bgB EJf FHG hDF','cjC AeI abf Fah cbJ ffH jEb aib'),
  38. (15, 'jaF hBI jIH Gdh FEc Fij hgj jFh','dGA ADH feh AAI AfJ DbC gBi hGH'),
  39. (16, 'gjH BGg iGj aFE CAH edI idf HEH','hIf DDg fjB hGi cHF BCH FjG Bgd'),
  40. (17, 'iaI JGH hji gcj Dda eeG jDd CBi','cHg jeh caG gIc feF ihG hgJ Abj'),
  41. (18, 'jHI iDB eFf AiH EFB CDb IAj GbC','Ghe dEI gdI jai gib dAG BIa djb'),
  42. (19, 'abI fHG Ccf aAc FDa fiC agF bdB','afi hde IgE bGF cfg DHD diE aca'),
  43. (20, 'IFh eDJ jfh cDg dde JGJ GAf fIJ','IBa EfH faE aeI FIF baJ FGj EIH'),
  44. (21, 'Dee bFC bBA dEI CEj aJI ghA dCH','hBA ddA HJh dfj egI Dij dFE bGE'),
  45. (22, 'JFE BCj FgA afc Jda FGD iHJ HDh','eAI jHe BHD Gah bbD Bgj gbh eGB'),
  46. (23, 'edE CJE FjG aFI edA Cea FId iFe','ABG jcA ddj EEc Dcg hAI agA biA'),
  47. (24, 'AgE cfc eef cGh aFB DcH efJ hcH','eGF HaB diG fgi bdc iGJ FGJ fFB'),
  48. (25, 'aCa AgI GhC DDI hGJ Hgc Gcg bbG','iID Fga jHa jIj idj DFD bAC AFJ'),
  49. (26, 'gjC JGh Fge faa eCA iGG gHE Gai','bDi hFE BbI DHD Adb Fgi hCa Hij'),
  50. (27, 'Eji jEI jhF DFC afH cDh AGc dHA','IDe GcA ChF DIb Bif HfH agD DGh'),
  51. (28, 'gDD AEE Dfg ICf Cbi JdE jgH eEi','eEb dBG FDE jgf cAI FaJ jaA cDd'),
  52. (29, 'cbe Gec hgB Egi bca dHg bAJ jBf','EFB DgD GJc fDb EeE bBA GFC Hbe'),
  53. (30, 'Adc eHB afI hDc Bhh baE hcJ BBd','JAH deg bcF Dab Bgj Gbb JHi FIB'),
  54. (31, 'agF dIj AJJ Hfg cCG hED Igc fHC','JEf eia dHf Ggc Agj geD bEE Gei'),
  55. (32, 'DAd cCe cbJ FjG gJe gba dJA GCf','eAf hFc bGE ABI hHA IcE abF CCE'),
  56. (33, 'fFh jJe DhJ cDJ EBi AfD eFI IhG','fEG GCc Bjd EFF ggg CFe EHd ciB'),
  57. (34, 'Ejb BjI eAF HaD eEJ FaG Eda AHC','Iah hgD EJG fdD cIE Daj IFf eJh'),
  58. (35, 'aHG eCe FjA djJ dAJ jiJ IaE GGB','Acg iEF JfB FIC Eei ggj dic Iii'),
  59. (36, 'Fdb EDF GaF JjB ehH IgC hgi DCG','cag DHI Fah hAJ bbh egG Hia hgJ'),
  60. (37, 'HGg icC JEC AFJ Ddh dhi hfC Ich','fEg bED Bff hCJ EiA cIf bfG cGA'),
  61. (38, 'aEJ jGI BCi FaA ebA BHj cIJ GcC','dCH ADd bGB cFE AgF geD cbG jIc'),
  62. (39, 'JFB bBi heA BFA hgB Ahj EIE CgI','EIJ JFG FJE GeA Hdg HeH ACh GiA'),
  63. (40, 'agB DDC CED igC Dfc DhI eiC fHi','dAB dcg iJF cej Fcc cAc AfB Fdd'),
  64. (41, 'BdF DHj Ege hcG DEd eFa dCf gBb','FBG ChB cej iGd Hbh fCc Ibe Abh'),
  65. (42, 'Bgc DjI cbC jGD bdb hHB IJA IJH','heg cii abb IGf eDe hJc dii fcE'),
  66. (43, 'fhf ECa FiA aDh Jbf CiB Jhe ajD','GFE bIF aeD gDE BIE Jea DfC BEc'),
  67. (44, 'GjE dBj DbJ ICF aDh EEH Ejb jFb','dJj aEc IBg bEG Faf fjA hjf FAF'),
  68. (45, 'BfA efd IIJ AHG dDF eGg dIJ Gcb','Bfj jeb Ahc dAE ACH Dfb ieb dhC'),
  69. (46, 'Ibj ege geC dJh CIi hbD EAG fGA','DEb BFe Bjg FId Fhg HeF JAc BbE'),
  70. (47, 'dhB afC hgG bEJ aIe Cbe iEE JCD','bdg Ajc FGA jbh Jge iAj fIA jbE'),
  71. (48, 'egH iDi bfH iiI hGC jFF Hfd AHB','bjE Beb iCc haB gIH Dea bga dfd'),
  72. (49, 'jgf chc jGc Baj HBb jdE hgh heI','FFB aBd iEB EIG HGf Bbj EIi JbI'),
  73. (50, 'jhe EGi ajA fbH geh EHe FdC bij','jDE bBC gbH HeE dcH iBH IFE AHi'),
  74. (51, 'aCb JiD cgJ Bjj iAI Hbe IAF FhH','ijf bhE Jdf FED dCH bbG HcJ ebH');
  75. "
  76. }
  77. foreach_detail_mode $testprefix {
  78. foreach external {0 1 2} {
  79. reset_db
  80. proc tokens {cmd} {
  81. set ret [list]
  82. for {set iTok 0} {$iTok < [$cmd xInstCount]} {incr iTok} {
  83. set txt [$cmd xInstToken $iTok 0]
  84. set txt [string map [list "\0" "."] $txt]
  85. lappend ret $txt
  86. }
  87. set ret
  88. }
  89. sqlite3_fts5_create_function db tokens tokens
  90. sqlite3_fts5_register_origintext db
  91. set E(0) internal
  92. set E(1) external
  93. set E(2) contentless
  94. set e $E($external)
  95. db eval { CREATE TABLE ex(x, y) }
  96. switch -- $external {
  97. 0 {
  98. do_execsql_test 1.$e.0 {
  99. CREATE VIRTUAL TABLE ft USING fts5(
  100. x, y, tokenize="origintext unicode61", tokendata=1, detail=%DETAIL%
  101. );
  102. }
  103. }
  104. 1 {
  105. do_execsql_test 1.$e.0 {
  106. CREATE VIRTUAL TABLE ft USING fts5(
  107. x, y, tokenize="origintext unicode61", tokendata=1, detail=%DETAIL%,
  108. content=ex
  109. );
  110. }
  111. }
  112. 2 {
  113. do_execsql_test 1.$e.0 {
  114. CREATE VIRTUAL TABLE ft USING fts5(
  115. x, y, tokenize="origintext unicode61", tokendata=1, detail=%DETAIL%,
  116. content=
  117. );
  118. }
  119. }
  120. }
  121. insert_data ex
  122. insert_data ft
  123. proc prefixquery {prefix bInst bYOnly} {
  124. set ret [list]
  125. db eval { SELECT rowid, x, y FROM ex ORDER BY rowid } {
  126. set row [list]
  127. set bSeen 0
  128. set T [concat $x $y]
  129. if {$bYOnly} { set T $y }
  130. foreach w $T {
  131. if {[string match -nocase $prefix $w]} {
  132. set bSeen 1
  133. if {$bInst} {
  134. set v [string tolower $w]
  135. if {$w != $v} { append v ".$w" }
  136. lappend row $v
  137. }
  138. }
  139. }
  140. if {$bSeen} {
  141. lappend ret $rowid
  142. lappend ret $row
  143. }
  144. }
  145. set ret
  146. }
  147. proc do_prefixquery_test {tn prefix} {
  148. set bInst [expr {$::e!="contentless" || "%DETAIL%"=="full"}]
  149. set expect [prefixquery $prefix $bInst 0]
  150. set expect2 [prefixquery $prefix $bInst 1]
  151. uplevel [list do_execsql_test $tn.1 "
  152. SELECT rowid, tokens(ft) FROM ft('$prefix')
  153. " $expect]
  154. uplevel [list do_execsql_test $tn.2 "
  155. SELECT rowid, tokens(ft) FROM ft(fts5_insttoken('$prefix'))
  156. " $expect]
  157. db eval { INSERT INTO ft(ft, rank) VALUES('insttoken', 1) }
  158. uplevel [list do_execsql_test $tn.3 "
  159. SELECT rowid, tokens(ft) FROM ft('$prefix')
  160. " $expect]
  161. db eval { INSERT INTO ft(ft, rank) VALUES('insttoken', 0) }
  162. if {"%DETAIL%"!="none"} {
  163. uplevel [list do_execsql_test $tn.4 "
  164. SELECT rowid, tokens(ft) FROM ft('y: $prefix')
  165. " $expect2]
  166. uplevel [list do_execsql_test $tn.5 "
  167. SELECT rowid, tokens(ft) FROM ft(fts5_insttoken('y: $prefix'))
  168. " $expect2]
  169. db eval { INSERT INTO ft(ft, rank) VALUES('insttoken', 1) }
  170. uplevel [list do_execsql_test $tn.6 "
  171. SELECT rowid, tokens(ft) FROM ft('y: $prefix')
  172. " $expect2]
  173. db eval { INSERT INTO ft(ft, rank) VALUES('insttoken', 0) }
  174. }
  175. }
  176. do_prefixquery_test 1.$e.1 a*
  177. do_prefixquery_test 1.$e.2 b*
  178. do_prefixquery_test 1.$e.3 c*
  179. do_prefixquery_test 1.$e.4 d*
  180. do_prefixquery_test 1.$e.5 e*
  181. do_prefixquery_test 1.$e.6 f*
  182. do_prefixquery_test 1.$e.7 g*
  183. do_prefixquery_test 1.$e.8 h*
  184. do_prefixquery_test 1.$e.9 i*
  185. do_prefixquery_test 1.$e.10 j*
  186. }}
  187. finish_test