2
0

SegmentInfoTest.php 32 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551
  1. <?php
  2. /**
  3. * @category Zend
  4. * @package Zend_Search_Lucene
  5. * @subpackage UnitTests
  6. */
  7. /**
  8. * Zend_Search_Lucene_Index_SegmentInfo
  9. */
  10. require_once 'Zend/Search/Lucene/Index/SegmentInfo.php';
  11. /**
  12. * PHPUnit test case
  13. */
  14. require_once 'PHPUnit/Framework/TestCase.php';
  15. /**
  16. * @category Zend
  17. * @package Zend_Search_Lucene
  18. * @subpackage UnitTests
  19. */
  20. class Zend_Search_Lucene_Index_SegmentInfoTest extends PHPUnit_Framework_TestCase
  21. {
  22. public function testCreate()
  23. {
  24. $directory = new Zend_Search_Lucene_Storage_Directory_Filesystem(dirname(__FILE__) . '/_source/_files');
  25. $segmentInfo = new Zend_Search_Lucene_Index_SegmentInfo($directory, '_1', 2);
  26. $this->assertTrue($segmentInfo instanceof Zend_Search_Lucene_Index_SegmentInfo);
  27. }
  28. public function testOpenCompoundFile()
  29. {
  30. $directory = new Zend_Search_Lucene_Storage_Directory_Filesystem(dirname(__FILE__) . '/_source/_files');
  31. $segmentInfo = new Zend_Search_Lucene_Index_SegmentInfo($directory, '_1', 2);
  32. $file1 = $segmentInfo->openCompoundFile('.fnm');
  33. $this->assertTrue($file1 instanceof Zend_Search_Lucene_Storage_File);
  34. $file2 = $segmentInfo->openCompoundFile('.tii');
  35. $file3 = $segmentInfo->openCompoundFile('.tii');
  36. $file4 = $segmentInfo->openCompoundFile('.tii', false);
  37. $this->assertTrue($file2 instanceof Zend_Search_Lucene_Storage_File);
  38. $this->assertTrue($file2 === $file3);
  39. $this->assertTrue($file4 instanceof Zend_Search_Lucene_Storage_File);
  40. $this->assertTrue($file2 !== $file4);
  41. }
  42. public function testCompoundFileLength()
  43. {
  44. $directory = new Zend_Search_Lucene_Storage_Directory_Filesystem(dirname(__FILE__) . '/_source/_files');
  45. $segmentInfo = new Zend_Search_Lucene_Index_SegmentInfo($directory, '_1', 2);
  46. $this->assertEquals($segmentInfo->compoundFileLength('.tii'), 58);
  47. }
  48. public function testGetFieldNum()
  49. {
  50. $directory = new Zend_Search_Lucene_Storage_Directory_Filesystem(dirname(__FILE__) . '/_source/_files');
  51. $segmentInfo = new Zend_Search_Lucene_Index_SegmentInfo($directory, '_1', 2);
  52. $this->assertEquals($segmentInfo->getFieldNum('contents'), 2);
  53. $this->assertEquals($segmentInfo->getFieldNum('non-presented-field'), -1);
  54. }
  55. public function testGetField()
  56. {
  57. $directory = new Zend_Search_Lucene_Storage_Directory_Filesystem(dirname(__FILE__) . '/_source/_files');
  58. $segmentInfo = new Zend_Search_Lucene_Index_SegmentInfo($directory, '_1', 2);
  59. $fieldInfo = $segmentInfo->getField(2);
  60. $this->assertEquals($fieldInfo->name, 'contents');
  61. $this->assertTrue((boolean)$fieldInfo->isIndexed);
  62. $this->assertEquals($fieldInfo->number, 2);
  63. $this->assertFalse((boolean)$fieldInfo->storeTermVector);
  64. }
  65. public function testGetFields()
  66. {
  67. $directory = new Zend_Search_Lucene_Storage_Directory_Filesystem(dirname(__FILE__) . '/_source/_files');
  68. $segmentInfo = new Zend_Search_Lucene_Index_SegmentInfo($directory, '_1', 2);
  69. $this->assertTrue($segmentInfo->getFields() == array('path' => 'path', 'modified' => 'modified', 'contents' => 'contents'));
  70. $this->assertTrue($segmentInfo->getFields(true) == array('path' => 'path', 'modified' => 'modified', 'contents' => 'contents'));
  71. }
  72. public function testGetFieldInfos()
  73. {
  74. $directory = new Zend_Search_Lucene_Storage_Directory_Filesystem(dirname(__FILE__) . '/_source/_files');
  75. $segmentInfo = new Zend_Search_Lucene_Index_SegmentInfo($directory, '_1', 2);
  76. $fieldInfos = $segmentInfo->getFieldInfos();
  77. $this->assertEquals($fieldInfos[0]->name, 'path');
  78. $this->assertTrue((boolean)$fieldInfos[0]->isIndexed);
  79. $this->assertEquals($fieldInfos[0]->number, 0);
  80. $this->assertFalse((boolean)$fieldInfos[0]->storeTermVector);
  81. $this->assertEquals($fieldInfos[1]->name, 'modified');
  82. $this->assertTrue((boolean)$fieldInfos[1]->isIndexed);
  83. $this->assertEquals($fieldInfos[1]->number, 1);
  84. $this->assertFalse((boolean)$fieldInfos[1]->storeTermVector);
  85. $this->assertEquals($fieldInfos[2]->name, 'contents');
  86. $this->assertTrue((boolean)$fieldInfos[2]->isIndexed);
  87. $this->assertEquals($fieldInfos[2]->number, 2);
  88. $this->assertFalse((boolean)$fieldInfos[2]->storeTermVector);
  89. }
  90. public function testCount()
  91. {
  92. $directory = new Zend_Search_Lucene_Storage_Directory_Filesystem(dirname(__FILE__) . '/_source/_files');
  93. $segmentInfo = new Zend_Search_Lucene_Index_SegmentInfo($directory, '_1', 2);
  94. $this->assertEquals($segmentInfo->count(), 2);
  95. }
  96. public function testNumDocs()
  97. {
  98. $directory = new Zend_Search_Lucene_Storage_Directory_Filesystem(dirname(__FILE__) . '/_source/_files');
  99. $segmentInfo = new Zend_Search_Lucene_Index_SegmentInfo($directory, '_3', 2);
  100. $this->assertEquals($segmentInfo->count(), 2);
  101. $this->assertEquals($segmentInfo->numDocs(), 1);
  102. }
  103. public function testGetName()
  104. {
  105. $directory = new Zend_Search_Lucene_Storage_Directory_Filesystem(dirname(__FILE__) . '/_source/_files');
  106. $segmentInfo = new Zend_Search_Lucene_Index_SegmentInfo($directory, '_1', 2);
  107. $this->assertEquals($segmentInfo->getName(), '_1');
  108. }
  109. public function testGetTermInfo()
  110. {
  111. $directory = new Zend_Search_Lucene_Storage_Directory_Filesystem(dirname(__FILE__) . '/_source/_files');
  112. $segmentInfo = new Zend_Search_Lucene_Index_SegmentInfo($directory, '_1', 2);
  113. $termInfo = $segmentInfo->getTermInfo(new Zend_Search_Lucene_Index_Term('apart', 'contents'));
  114. $this->assertEquals($termInfo->docFreq, 1);
  115. $this->assertEquals($termInfo->freqPointer, 29);
  116. $this->assertEquals($termInfo->proxPointer, 119);
  117. $this->assertEquals($termInfo->skipOffset, 0);
  118. $this->assertEquals($termInfo->indexPointer, null);
  119. $termInfo1 = $segmentInfo->getTermInfo(new Zend_Search_Lucene_Index_Term('apart', 'contents'));
  120. // test for requesting cached information
  121. $this->assertTrue($termInfo === $termInfo1);
  122. // request for non-existing term
  123. $this->assertTrue($segmentInfo->getTermInfo(new Zend_Search_Lucene_Index_Term('nonusedterm', 'contents')) === null);
  124. }
  125. public function testTermFreqs()
  126. {
  127. $directory = new Zend_Search_Lucene_Storage_Directory_Filesystem(dirname(__FILE__) . '/_source/_files');
  128. $segmentInfo = new Zend_Search_Lucene_Index_SegmentInfo($directory, '_1', 2);
  129. $termPositions = $segmentInfo->termFreqs(new Zend_Search_Lucene_Index_Term('bgcolor', 'contents'));
  130. $this->assertTrue($termPositions == array(0 => 3, 1 => 1));
  131. $termPositions = $segmentInfo->termFreqs(new Zend_Search_Lucene_Index_Term('bgcolor', 'contents'), 10);
  132. $this->assertTrue($termPositions == array(10 => 3, 11 => 1));
  133. }
  134. public function testTermPositions()
  135. {
  136. $directory = new Zend_Search_Lucene_Storage_Directory_Filesystem(dirname(__FILE__) . '/_source/_files');
  137. $segmentInfo = new Zend_Search_Lucene_Index_SegmentInfo($directory, '_1', 2);
  138. $termPositions = $segmentInfo->termPositions(new Zend_Search_Lucene_Index_Term('bgcolor', 'contents'));
  139. $this->assertTrue($termPositions == array(0 => array(69, 239, 370),
  140. 1 => array(58)
  141. ));
  142. $termPositions = $segmentInfo->termPositions(new Zend_Search_Lucene_Index_Term('bgcolor', 'contents'), 10);
  143. $this->assertTrue($termPositions == array(10 => array(69, 239, 370),
  144. 11 => array(58)
  145. ));
  146. }
  147. public function testNorm()
  148. {
  149. $directory = new Zend_Search_Lucene_Storage_Directory_Filesystem(dirname(__FILE__) . '/_source/_files');
  150. $segmentInfo = new Zend_Search_Lucene_Index_SegmentInfo($directory, '_1', 2);
  151. $this->assertTrue(abs($segmentInfo->norm(1, 'contents') - 0.0546875) < 0.000001);
  152. }
  153. public function testNormVector()
  154. {
  155. $directory = new Zend_Search_Lucene_Storage_Directory_Filesystem(dirname(__FILE__) . '/_source/_files');
  156. $segmentInfo = new Zend_Search_Lucene_Index_SegmentInfo($directory, '_1', 2);
  157. $this->assertEquals($segmentInfo->normVector('contents'), "\x69\x6B");
  158. }
  159. public function testHasDeletions()
  160. {
  161. $directory = new Zend_Search_Lucene_Storage_Directory_Filesystem(dirname(__FILE__) . '/_source/_files');
  162. $segmentInfo = new Zend_Search_Lucene_Index_SegmentInfo($directory, '_1', 2);
  163. $this->assertFalse($segmentInfo->hasDeletions());
  164. $segmentInfo1 = new Zend_Search_Lucene_Index_SegmentInfo($directory, '_3', 2);
  165. $this->assertTrue($segmentInfo1->hasDeletions());
  166. }
  167. public function testDelete()
  168. {
  169. $directory = new Zend_Search_Lucene_Storage_Directory_Filesystem(dirname(__FILE__) . '/_source/_files');
  170. $segmentInfo = new Zend_Search_Lucene_Index_SegmentInfo($directory, '_1', 2, 0 /* search for _1.del file */);
  171. $this->assertFalse($segmentInfo->hasDeletions());
  172. $segmentInfo->delete(0);
  173. $this->assertTrue($segmentInfo->hasDeletions());
  174. $delGen = $segmentInfo->getDelGen();
  175. // don't write changes
  176. unset($segmentInfo);
  177. $segmentInfo1 = new Zend_Search_Lucene_Index_SegmentInfo($directory, '_1', 2, $delGen);
  178. // Changes wasn't written, segment still has no deletions
  179. $this->assertFalse($segmentInfo1->hasDeletions());
  180. $segmentInfo1->delete(0);
  181. $segmentInfo1->writeChanges();
  182. $delGen = $segmentInfo1->getDelGen();
  183. unset($segmentInfo1);
  184. $segmentInfo2 = new Zend_Search_Lucene_Index_SegmentInfo($directory, '_1', 2, $delGen);
  185. $this->assertTrue($segmentInfo2->hasDeletions());
  186. unset($segmentInfo2);
  187. $directory->deleteFile('_1_' . base_convert($delGen, 10, 36) . '.del');
  188. $segmentInfo3 = new Zend_Search_Lucene_Index_SegmentInfo($directory, '_1', 2, -1 /* no detetions file */);
  189. $this->assertFalse($segmentInfo3->hasDeletions());
  190. }
  191. public function testIsDeleted()
  192. {
  193. $directory = new Zend_Search_Lucene_Storage_Directory_Filesystem(dirname(__FILE__) . '/_source/_files');
  194. $segmentInfo = new Zend_Search_Lucene_Index_SegmentInfo($directory, '_2', 2);
  195. $this->assertFalse($segmentInfo->isDeleted(0));
  196. $segmentInfo1 = new Zend_Search_Lucene_Index_SegmentInfo($directory, '_3', 2);
  197. $this->assertTrue($segmentInfo1->isDeleted(0));
  198. $this->assertFalse($segmentInfo1->isDeleted(1));
  199. }
  200. public function testTermStreamStyleReading()
  201. {
  202. $directory = new Zend_Search_Lucene_Storage_Directory_Filesystem(dirname(__FILE__) . '/_source/_files');
  203. $segmentInfo = new Zend_Search_Lucene_Index_SegmentInfo($directory, '_3', 2);
  204. $this->assertEquals($segmentInfo->resetTermsStream(6, Zend_Search_Lucene_Index_SegmentInfo::SM_FULL_INFO), 8);
  205. $terms = array();
  206. $terms[] = $segmentInfo->currentTerm();
  207. $firstTermPositions = $segmentInfo->currentTermPositions();
  208. $this->assertEquals(count($firstTermPositions), 1);
  209. reset($firstTermPositions); // go to the first element
  210. $this->assertEquals(key($firstTermPositions), 7);
  211. $this->assertTrue(current($firstTermPositions) ==
  212. array(105, 113, 130, 138, 153, 168, 171, 216, 243, 253, 258, 265, 302, 324,
  213. 331, 351, 359, 366, 370, 376, 402, 410, 418, 425, 433, 441, 460, 467));
  214. while (($term = $segmentInfo->nextTerm()) != null) {
  215. $terms[] = $term;
  216. }
  217. $this->assertTrue($terms ==
  218. array(new Zend_Search_Lucene_Index_Term('a', 'contents'),
  219. new Zend_Search_Lucene_Index_Term('about', 'contents'),
  220. new Zend_Search_Lucene_Index_Term('accesskey', 'contents'),
  221. new Zend_Search_Lucene_Index_Term('align', 'contents'),
  222. new Zend_Search_Lucene_Index_Term('alink', 'contents'),
  223. new Zend_Search_Lucene_Index_Term('already', 'contents'),
  224. new Zend_Search_Lucene_Index_Term('and', 'contents'),
  225. new Zend_Search_Lucene_Index_Term('are', 'contents'),
  226. new Zend_Search_Lucene_Index_Term('at', 'contents'),
  227. new Zend_Search_Lucene_Index_Term('b', 'contents'),
  228. new Zend_Search_Lucene_Index_Term('be', 'contents'),
  229. new Zend_Search_Lucene_Index_Term('been', 'contents'),
  230. new Zend_Search_Lucene_Index_Term('bgcolor', 'contents'),
  231. new Zend_Search_Lucene_Index_Term('body', 'contents'),
  232. new Zend_Search_Lucene_Index_Term('border', 'contents'),
  233. new Zend_Search_Lucene_Index_Term('bottom', 'contents'),
  234. new Zend_Search_Lucene_Index_Term('bug', 'contents'),
  235. new Zend_Search_Lucene_Index_Term('bugs', 'contents'),
  236. new Zend_Search_Lucene_Index_Term('can', 'contents'),
  237. new Zend_Search_Lucene_Index_Term('care', 'contents'),
  238. new Zend_Search_Lucene_Index_Term('cellpadding', 'contents'),
  239. new Zend_Search_Lucene_Index_Term('cellspacing', 'contents'),
  240. new Zend_Search_Lucene_Index_Term('center', 'contents'),
  241. new Zend_Search_Lucene_Index_Term('chapter', 'contents'),
  242. new Zend_Search_Lucene_Index_Term('charset', 'contents'),
  243. new Zend_Search_Lucene_Index_Term('check', 'contents'),
  244. new Zend_Search_Lucene_Index_Term('class', 'contents'),
  245. new Zend_Search_Lucene_Index_Term('click', 'contents'),
  246. new Zend_Search_Lucene_Index_Term('colspan', 'contents'),
  247. new Zend_Search_Lucene_Index_Term('contains', 'contents'),
  248. new Zend_Search_Lucene_Index_Term('content', 'contents'),
  249. new Zend_Search_Lucene_Index_Term('contributing', 'contents'),
  250. new Zend_Search_Lucene_Index_Term('developers', 'contents'),
  251. new Zend_Search_Lucene_Index_Term('div', 'contents'),
  252. new Zend_Search_Lucene_Index_Term('docbook', 'contents'),
  253. new Zend_Search_Lucene_Index_Term('documentation', 'contents'),
  254. new Zend_Search_Lucene_Index_Term('does', 'contents'),
  255. new Zend_Search_Lucene_Index_Term('don', 'contents'),
  256. new Zend_Search_Lucene_Index_Term('double', 'contents'),
  257. new Zend_Search_Lucene_Index_Term('easiest', 'contents'),
  258. new Zend_Search_Lucene_Index_Term('equiv', 'contents'),
  259. new Zend_Search_Lucene_Index_Term('existing', 'contents'),
  260. new Zend_Search_Lucene_Index_Term('explanations', 'contents'),
  261. new Zend_Search_Lucene_Index_Term('ff', 'contents'),
  262. new Zend_Search_Lucene_Index_Term('ffffff', 'contents'),
  263. new Zend_Search_Lucene_Index_Term('fill', 'contents'),
  264. new Zend_Search_Lucene_Index_Term('find', 'contents'),
  265. new Zend_Search_Lucene_Index_Term('fixed', 'contents'),
  266. new Zend_Search_Lucene_Index_Term('footer', 'contents'),
  267. new Zend_Search_Lucene_Index_Term('for', 'contents'),
  268. new Zend_Search_Lucene_Index_Term('form', 'contents'),
  269. new Zend_Search_Lucene_Index_Term('found', 'contents'),
  270. new Zend_Search_Lucene_Index_Term('generator', 'contents'),
  271. new Zend_Search_Lucene_Index_Term('guide', 'contents'),
  272. new Zend_Search_Lucene_Index_Term('h', 'contents'),
  273. new Zend_Search_Lucene_Index_Term('hasn', 'contents'),
  274. new Zend_Search_Lucene_Index_Term('have', 'contents'),
  275. new Zend_Search_Lucene_Index_Term('head', 'contents'),
  276. new Zend_Search_Lucene_Index_Term('header', 'contents'),
  277. new Zend_Search_Lucene_Index_Term('hesitate', 'contents'),
  278. new Zend_Search_Lucene_Index_Term('home', 'contents'),
  279. new Zend_Search_Lucene_Index_Term('homepage', 'contents'),
  280. new Zend_Search_Lucene_Index_Term('how', 'contents'),
  281. new Zend_Search_Lucene_Index_Term('hr', 'contents'),
  282. new Zend_Search_Lucene_Index_Term('href', 'contents'),
  283. new Zend_Search_Lucene_Index_Term('html', 'contents'),
  284. new Zend_Search_Lucene_Index_Term('http', 'contents'),
  285. new Zend_Search_Lucene_Index_Term('if', 'contents'),
  286. new Zend_Search_Lucene_Index_Term('in', 'contents'),
  287. new Zend_Search_Lucene_Index_Term('index', 'contents'),
  288. new Zend_Search_Lucene_Index_Term('information', 'contents'),
  289. new Zend_Search_Lucene_Index_Term('is', 'contents'),
  290. new Zend_Search_Lucene_Index_Term('iso', 'contents'),
  291. new Zend_Search_Lucene_Index_Term('it', 'contents'),
  292. new Zend_Search_Lucene_Index_Term('latest', 'contents'),
  293. new Zend_Search_Lucene_Index_Term('left', 'contents'),
  294. new Zend_Search_Lucene_Index_Term('link', 'contents'),
  295. new Zend_Search_Lucene_Index_Term('list', 'contents'),
  296. new Zend_Search_Lucene_Index_Term('manual', 'contents'),
  297. new Zend_Search_Lucene_Index_Term('meet', 'contents'),
  298. new Zend_Search_Lucene_Index_Term('meta', 'contents'),
  299. new Zend_Search_Lucene_Index_Term('modular', 'contents'),
  300. new Zend_Search_Lucene_Index_Term('more', 'contents'),
  301. new Zend_Search_Lucene_Index_Term('n', 'contents'),
  302. new Zend_Search_Lucene_Index_Term('name', 'contents'),
  303. new Zend_Search_Lucene_Index_Term('navfooter', 'contents'),
  304. new Zend_Search_Lucene_Index_Term('navheader', 'contents'),
  305. new Zend_Search_Lucene_Index_Term('navigation', 'contents'),
  306. new Zend_Search_Lucene_Index_Term('net', 'contents'),
  307. new Zend_Search_Lucene_Index_Term('new', 'contents'),
  308. new Zend_Search_Lucene_Index_Term('newpackage', 'contents'),
  309. new Zend_Search_Lucene_Index_Term('next', 'contents'),
  310. new Zend_Search_Lucene_Index_Term('of', 'contents'),
  311. new Zend_Search_Lucene_Index_Term('on', 'contents'),
  312. new Zend_Search_Lucene_Index_Term('out', 'contents'),
  313. new Zend_Search_Lucene_Index_Term('p', 'contents'),
  314. new Zend_Search_Lucene_Index_Term('package', 'contents'),
  315. new Zend_Search_Lucene_Index_Term('packages', 'contents'),
  316. new Zend_Search_Lucene_Index_Term('page', 'contents'),
  317. new Zend_Search_Lucene_Index_Term('patches', 'contents'),
  318. new Zend_Search_Lucene_Index_Term('pear', 'contents'),
  319. new Zend_Search_Lucene_Index_Term('persists', 'contents'),
  320. new Zend_Search_Lucene_Index_Term('php', 'contents'),
  321. new Zend_Search_Lucene_Index_Term('please', 'contents'),
  322. new Zend_Search_Lucene_Index_Term('prev', 'contents'),
  323. new Zend_Search_Lucene_Index_Term('previous', 'contents'),
  324. new Zend_Search_Lucene_Index_Term('proper', 'contents'),
  325. new Zend_Search_Lucene_Index_Term('quote', 'contents'),
  326. new Zend_Search_Lucene_Index_Term('read', 'contents'),
  327. new Zend_Search_Lucene_Index_Term('rel', 'contents'),
  328. new Zend_Search_Lucene_Index_Term('report', 'contents'),
  329. new Zend_Search_Lucene_Index_Term('reported', 'contents'),
  330. new Zend_Search_Lucene_Index_Term('reporting', 'contents'),
  331. new Zend_Search_Lucene_Index_Term('requirements', 'contents'),
  332. new Zend_Search_Lucene_Index_Term('right', 'contents'),
  333. new Zend_Search_Lucene_Index_Term('sect', 'contents'),
  334. new Zend_Search_Lucene_Index_Term('span', 'contents'),
  335. new Zend_Search_Lucene_Index_Term('still', 'contents'),
  336. new Zend_Search_Lucene_Index_Term('stylesheet', 'contents'),
  337. new Zend_Search_Lucene_Index_Term('submitting', 'contents'),
  338. new Zend_Search_Lucene_Index_Term('summary', 'contents'),
  339. new Zend_Search_Lucene_Index_Term('system', 'contents'),
  340. new Zend_Search_Lucene_Index_Term('t', 'contents'),
  341. new Zend_Search_Lucene_Index_Term('table', 'contents'),
  342. new Zend_Search_Lucene_Index_Term('take', 'contents'),
  343. new Zend_Search_Lucene_Index_Term('target', 'contents'),
  344. new Zend_Search_Lucene_Index_Term('td', 'contents'),
  345. new Zend_Search_Lucene_Index_Term('text', 'contents'),
  346. new Zend_Search_Lucene_Index_Term('th', 'contents'),
  347. new Zend_Search_Lucene_Index_Term('that', 'contents'),
  348. new Zend_Search_Lucene_Index_Term('the', 'contents'),
  349. new Zend_Search_Lucene_Index_Term('think', 'contents'),
  350. new Zend_Search_Lucene_Index_Term('this', 'contents'),
  351. new Zend_Search_Lucene_Index_Term('tips', 'contents'),
  352. new Zend_Search_Lucene_Index_Term('title', 'contents'),
  353. new Zend_Search_Lucene_Index_Term('to', 'contents'),
  354. new Zend_Search_Lucene_Index_Term('top', 'contents'),
  355. new Zend_Search_Lucene_Index_Term('tr', 'contents'),
  356. new Zend_Search_Lucene_Index_Term('translating', 'contents'),
  357. new Zend_Search_Lucene_Index_Term('type', 'contents'),
  358. new Zend_Search_Lucene_Index_Term('u', 'contents'),
  359. new Zend_Search_Lucene_Index_Term('unable', 'contents'),
  360. new Zend_Search_Lucene_Index_Term('up', 'contents'),
  361. new Zend_Search_Lucene_Index_Term('using', 'contents'),
  362. new Zend_Search_Lucene_Index_Term('valign', 'contents'),
  363. new Zend_Search_Lucene_Index_Term('version', 'contents'),
  364. new Zend_Search_Lucene_Index_Term('vlink', 'contents'),
  365. new Zend_Search_Lucene_Index_Term('way', 'contents'),
  366. new Zend_Search_Lucene_Index_Term('which', 'contents'),
  367. new Zend_Search_Lucene_Index_Term('width', 'contents'),
  368. new Zend_Search_Lucene_Index_Term('will', 'contents'),
  369. new Zend_Search_Lucene_Index_Term('with', 'contents'),
  370. new Zend_Search_Lucene_Index_Term('writing', 'contents'),
  371. new Zend_Search_Lucene_Index_Term('you', 'contents'),
  372. new Zend_Search_Lucene_Index_Term('your', 'contents'),
  373. new Zend_Search_Lucene_Index_Term('1178009946', 'modified'),
  374. new Zend_Search_Lucene_Index_Term('bugs', 'path'),
  375. new Zend_Search_Lucene_Index_Term('contributing', 'path'),
  376. new Zend_Search_Lucene_Index_Term('html', 'path'),
  377. new Zend_Search_Lucene_Index_Term('indexsource', 'path'),
  378. new Zend_Search_Lucene_Index_Term('newpackage', 'path'),
  379. ));
  380. unset($segmentInfo);
  381. $segmentInfo1 = new Zend_Search_Lucene_Index_SegmentInfo($directory, '_3', 2);
  382. $this->assertEquals($segmentInfo1->resetTermsStream(6, Zend_Search_Lucene_Index_SegmentInfo::SM_MERGE_INFO), 7);
  383. }
  384. public function testTermStreamStyleReadingSkipTo()
  385. {
  386. $directory = new Zend_Search_Lucene_Storage_Directory_Filesystem(dirname(__FILE__) . '/_source/_files');
  387. $segmentInfo = new Zend_Search_Lucene_Index_SegmentInfo($directory, '_3', 2);
  388. $this->assertEquals($segmentInfo->resetTermsStream(6, Zend_Search_Lucene_Index_SegmentInfo::SM_FULL_INFO), 8);
  389. $segmentInfo->skipTo(new Zend_Search_Lucene_Index_Term('prefetch', 'contents'));
  390. $terms = array();
  391. $terms[] = $segmentInfo->currentTerm();
  392. $firstTermPositions = $segmentInfo->currentTermPositions();
  393. $this->assertEquals(count($firstTermPositions), 1);
  394. reset($firstTermPositions); // go to the first element
  395. $this->assertEquals(key($firstTermPositions), 7);
  396. $this->assertTrue(current($firstTermPositions) == array(112, 409));
  397. while (($term = $segmentInfo->nextTerm()) != null) {
  398. $terms[] = $term;
  399. }
  400. $this->assertTrue($terms ==
  401. array(new Zend_Search_Lucene_Index_Term('prev', 'contents'),
  402. new Zend_Search_Lucene_Index_Term('previous', 'contents'),
  403. new Zend_Search_Lucene_Index_Term('proper', 'contents'),
  404. new Zend_Search_Lucene_Index_Term('quote', 'contents'),
  405. new Zend_Search_Lucene_Index_Term('read', 'contents'),
  406. new Zend_Search_Lucene_Index_Term('rel', 'contents'),
  407. new Zend_Search_Lucene_Index_Term('report', 'contents'),
  408. new Zend_Search_Lucene_Index_Term('reported', 'contents'),
  409. new Zend_Search_Lucene_Index_Term('reporting', 'contents'),
  410. new Zend_Search_Lucene_Index_Term('requirements', 'contents'),
  411. new Zend_Search_Lucene_Index_Term('right', 'contents'),
  412. new Zend_Search_Lucene_Index_Term('sect', 'contents'),
  413. new Zend_Search_Lucene_Index_Term('span', 'contents'),
  414. new Zend_Search_Lucene_Index_Term('still', 'contents'),
  415. new Zend_Search_Lucene_Index_Term('stylesheet', 'contents'),
  416. new Zend_Search_Lucene_Index_Term('submitting', 'contents'),
  417. new Zend_Search_Lucene_Index_Term('summary', 'contents'),
  418. new Zend_Search_Lucene_Index_Term('system', 'contents'),
  419. new Zend_Search_Lucene_Index_Term('t', 'contents'),
  420. new Zend_Search_Lucene_Index_Term('table', 'contents'),
  421. new Zend_Search_Lucene_Index_Term('take', 'contents'),
  422. new Zend_Search_Lucene_Index_Term('target', 'contents'),
  423. new Zend_Search_Lucene_Index_Term('td', 'contents'),
  424. new Zend_Search_Lucene_Index_Term('text', 'contents'),
  425. new Zend_Search_Lucene_Index_Term('th', 'contents'),
  426. new Zend_Search_Lucene_Index_Term('that', 'contents'),
  427. new Zend_Search_Lucene_Index_Term('the', 'contents'),
  428. new Zend_Search_Lucene_Index_Term('think', 'contents'),
  429. new Zend_Search_Lucene_Index_Term('this', 'contents'),
  430. new Zend_Search_Lucene_Index_Term('tips', 'contents'),
  431. new Zend_Search_Lucene_Index_Term('title', 'contents'),
  432. new Zend_Search_Lucene_Index_Term('to', 'contents'),
  433. new Zend_Search_Lucene_Index_Term('top', 'contents'),
  434. new Zend_Search_Lucene_Index_Term('tr', 'contents'),
  435. new Zend_Search_Lucene_Index_Term('translating', 'contents'),
  436. new Zend_Search_Lucene_Index_Term('type', 'contents'),
  437. new Zend_Search_Lucene_Index_Term('u', 'contents'),
  438. new Zend_Search_Lucene_Index_Term('unable', 'contents'),
  439. new Zend_Search_Lucene_Index_Term('up', 'contents'),
  440. new Zend_Search_Lucene_Index_Term('using', 'contents'),
  441. new Zend_Search_Lucene_Index_Term('valign', 'contents'),
  442. new Zend_Search_Lucene_Index_Term('version', 'contents'),
  443. new Zend_Search_Lucene_Index_Term('vlink', 'contents'),
  444. new Zend_Search_Lucene_Index_Term('way', 'contents'),
  445. new Zend_Search_Lucene_Index_Term('which', 'contents'),
  446. new Zend_Search_Lucene_Index_Term('width', 'contents'),
  447. new Zend_Search_Lucene_Index_Term('will', 'contents'),
  448. new Zend_Search_Lucene_Index_Term('with', 'contents'),
  449. new Zend_Search_Lucene_Index_Term('writing', 'contents'),
  450. new Zend_Search_Lucene_Index_Term('you', 'contents'),
  451. new Zend_Search_Lucene_Index_Term('your', 'contents'),
  452. new Zend_Search_Lucene_Index_Term('1178009946', 'modified'),
  453. new Zend_Search_Lucene_Index_Term('bugs', 'path'),
  454. new Zend_Search_Lucene_Index_Term('contributing', 'path'),
  455. new Zend_Search_Lucene_Index_Term('html', 'path'),
  456. new Zend_Search_Lucene_Index_Term('indexsource', 'path'),
  457. new Zend_Search_Lucene_Index_Term('newpackage', 'path'),
  458. ));
  459. unset($segmentInfo);
  460. $segmentInfo1 = new Zend_Search_Lucene_Index_SegmentInfo($directory, '_3', 2);
  461. $this->assertEquals($segmentInfo1->resetTermsStream(6, Zend_Search_Lucene_Index_SegmentInfo::SM_MERGE_INFO), 7);
  462. }
  463. }