[Zope-CVS] CVS: Products/ZCTextIndex/tests - testIndex.py:1.1.2.1 test_index.py:NONE
Guido van Rossum
guido@python.org
Wed, 1 May 2002 10:25:42 -0400
Update of /cvs-repository/Products/ZCTextIndex/tests
In directory cvs.zope.org:/tmp/cvs-serv26338
Added Files:
Tag: TextIndexDS9-branch
testIndex.py
Removed Files:
Tag: TextIndexDS9-branch
test_index.py
Log Message:
Rename test_index.py to testIndex.py
=== Added File Products/ZCTextIndex/tests/testIndex.py ===
##############################################################################
#
# Copyright (c) 2001, 2002 Zope Corporation and Contributors.
# All Rights Reserved.
#
# This software is subject to the provisions of the Zope Public License,
# Version 2.0 (ZPL). A copy of the ZPL should accompany this distribution.
# THIS SOFTWARE IS PROVIDED "AS IS" AND ANY AND ALL EXPRESS OR IMPLIED
# WARRANTIES ARE DISCLAIMED, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
# WARRANTIES OF TITLE, MERCHANTABILITY, AGAINST INFRINGEMENT, AND FITNESS
# FOR A PARTICULAR PURPOSE.
#
##############################################################################
from unittest import TestCase, TestSuite, main, makeSuite
from Products.ZCTextIndex.Index import Index
class SimpleLexicon:
def __init__(self):
self._words = {}
def sourceToWordIds(self, text):
words = text.split()
wids = []
for word in words:
wid = self._words.get(word)
if wid is None:
wid = len(self._words)
self._words[word] = wid
wids.append(wid)
return wids
def termToWordIds(self, text):
words = text.split()
wids = []
for word in words:
wid = self._words.get(word)
if wid is None:
continue
wids.append(wid)
return wids
class Indexable:
def __init__(self, text):
self.text = text
class MethodIndexable:
def __init__(self, text):
self._text = text
def text(self):
return self._text
class IndexTest(TestCase):
def setUp(self):
self.lexicon = SimpleLexicon()
self.index = Index(self.lexicon, "text")
def test_index_document(self, DOCID=1):
doc = Indexable("this is a simple document")
self.index.index_object(DOCID, doc)
self.assert_(self.index._docweight[DOCID])
self.assertEqual(len(self.index._wordinfo), 5)
self.assertEqual(len(self.index._docwords), 1)
self.assertEqual(len(self.index._docwords[DOCID]), 5)
for docfreq, map in self.index._wordinfo.values():
self.assertEqual(docfreq, 1)
self.assertEqual(len(map), 1)
self.assert_(map.has_key(DOCID))
def test_unindex_document(self):
DOCID = 1
self.test_index_document(DOCID)
self.index.unindex_object(DOCID)
self.assertEqual(len(self.index._docweight), 0)
self.assertEqual(len(self.index._wordinfo), 0)
self.assertEqual(len(self.index._docwords), 0)
def test_index_two_documents(self):
self.test_index_document()
doc = MethodIndexable('not the same document')
DOCID = 2
self.index.index_object(DOCID, doc)
self.assert_(self.index._docweight[DOCID])
self.assertEqual(len(self.index._wordinfo), 8)
self.assertEqual(len(self.index._docwords), 2)
self.assertEqual(len(self.index._docwords[DOCID]), 4)
document_wid = self.lexicon._words["document"]
for wid, (docfreq, map) in self.index._wordinfo.items():
if wid == document_wid:
self.assertEqual(docfreq, 2)
self.assertEqual(len(map), 2)
self.assert_(map.has_key(1))
self.assert_(map.has_key(DOCID))
else:
self.assertEqual(docfreq, 1)
self.assertEqual(len(map), 1)
def test_index_two_unindex_one(self):
# index two documents, unindex one, and test the results
self.test_index_two_documents()
self.index.unindex_object(1)
DOCID = 2
self.assertEqual(len(self.index._docweight), 1)
self.assert_(self.index._docweight[DOCID])
self.assertEqual(len(self.index._wordinfo), 4)
self.assertEqual(len(self.index._docwords), 1)
self.assertEqual(len(self.index._docwords[DOCID]), 4)
for docfreq, map in self.index._wordinfo.values():
self.assertEqual(docfreq, 1)
self.assertEqual(len(map), 1)
self.assert_(map.has_key(DOCID))
def test_index_duplicated_words(self, DOCID=1):
doc = Indexable("this is a repititive repititive repititive document")
self.index.index_object(DOCID, doc)
self.assert_(self.index._docweight[DOCID])
self.assertEqual(len(self.index._wordinfo), 5)
self.assertEqual(len(self.index._docwords), 1)
self.assertEqual(len(self.index._docwords[DOCID]), 5)
repititive_wid = self.lexicon._words["repititive"]
for wid, (docfreq, map) in self.index._wordinfo.items():
if wid == repititive_wid:
self.assertEqual(docfreq, 1)
else:
self.assertEqual(docfreq, 1)
self.assertEqual(len(map), 1)
self.assert_(map.has_key(DOCID))
def test_simple_query_oneresult(self):
self.index.index_object(1, MethodIndexable('not the same document'))
results = self.index.search("document")
self.assertEqual(len(results), 1)
self.assert_(results.has_key(1))
def test_simple_query_noresults(self):
self.index.index_object(1, MethodIndexable('not the same document'))
results = self.index.search("frobnicate")
self.assertEqual(len(results), 0)
def test_query_oneresult(self):
self.index.index_object(1, Indexable(
'not the same document'))
self.index.index_object(2, MethodIndexable(
'something about something else'))
results = self.index.search("document")
self.assertEqual(len(results), 1)
self.assert_(results.has_key(1))
def test_suite():
return makeSuite(IndexTest)
if __name__=='__main__':
main(defaultTest='test_suite')
=== Removed File Products/ZCTextIndex/tests/test_index.py ===