[Zope-CVS] CVS: Products/ZCTextIndex/tests - testIndex.py:1.1.2.1 test_index.py:NONE

Guido van Rossum guido@python.org
Wed, 1 May 2002 10:25:42 -0400


Update of /cvs-repository/Products/ZCTextIndex/tests
In directory cvs.zope.org:/tmp/cvs-serv26338

Added Files:
      Tag: TextIndexDS9-branch
	testIndex.py 
Removed Files:
      Tag: TextIndexDS9-branch
	test_index.py 
Log Message:
Rename test_index.py to testIndex.py

=== Added File Products/ZCTextIndex/tests/testIndex.py ===
##############################################################################
#
# Copyright (c) 2001, 2002 Zope Corporation and Contributors.
# All Rights Reserved.
# 
# This software is subject to the provisions of the Zope Public License,
# Version 2.0 (ZPL).  A copy of the ZPL should accompany this distribution.
# THIS SOFTWARE IS PROVIDED "AS IS" AND ANY AND ALL EXPRESS OR IMPLIED
# WARRANTIES ARE DISCLAIMED, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
# WARRANTIES OF TITLE, MERCHANTABILITY, AGAINST INFRINGEMENT, AND FITNESS
# FOR A PARTICULAR PURPOSE.
# 
##############################################################################

from unittest import TestCase, TestSuite, main, makeSuite

from Products.ZCTextIndex.Index import Index


class SimpleLexicon:
    def __init__(self):
        self._words = {}

    def sourceToWordIds(self, text):
        words = text.split()
        wids = []
        for word in words:
            wid = self._words.get(word)
            if wid is None:
                wid = len(self._words)
                self._words[word] = wid
            wids.append(wid)
        return wids

    def termToWordIds(self, text):
        words = text.split()
        wids = []
        for word in words:
            wid = self._words.get(word)
            if wid is None:
                continue
            wids.append(wid)
        return wids


class Indexable:
    def __init__(self, text):
        self.text = text

class MethodIndexable:
    def __init__(self, text):
        self._text = text

    def text(self):
        return self._text


class IndexTest(TestCase):
    def setUp(self):
        self.lexicon = SimpleLexicon()
        self.index = Index(self.lexicon, "text")

    def test_index_document(self, DOCID=1):
        doc = Indexable("this is a simple document")
        self.index.index_object(DOCID, doc)
        self.assert_(self.index._docweight[DOCID])
        self.assertEqual(len(self.index._wordinfo), 5)
        self.assertEqual(len(self.index._docwords), 1)
        self.assertEqual(len(self.index._docwords[DOCID]), 5)
        for docfreq, map in self.index._wordinfo.values():
            self.assertEqual(docfreq, 1)
            self.assertEqual(len(map), 1)
            self.assert_(map.has_key(DOCID))

    def test_unindex_document(self):
        DOCID = 1
        self.test_index_document(DOCID)
        self.index.unindex_object(DOCID)
        self.assertEqual(len(self.index._docweight), 0)
        self.assertEqual(len(self.index._wordinfo), 0)
        self.assertEqual(len(self.index._docwords), 0)

    def test_index_two_documents(self):
        self.test_index_document()
        doc = MethodIndexable('not the same document')
        DOCID = 2
        self.index.index_object(DOCID, doc)
        self.assert_(self.index._docweight[DOCID])
        self.assertEqual(len(self.index._wordinfo), 8)
        self.assertEqual(len(self.index._docwords), 2)
        self.assertEqual(len(self.index._docwords[DOCID]), 4)
        document_wid = self.lexicon._words["document"]
        for wid, (docfreq, map) in self.index._wordinfo.items():
            if wid == document_wid:
                self.assertEqual(docfreq, 2)
                self.assertEqual(len(map), 2)
                self.assert_(map.has_key(1))
                self.assert_(map.has_key(DOCID))
            else:
                self.assertEqual(docfreq, 1)
                self.assertEqual(len(map), 1)

    def test_index_two_unindex_one(self):
        # index two documents, unindex one, and test the results
        self.test_index_two_documents()
        self.index.unindex_object(1)
        DOCID = 2
        self.assertEqual(len(self.index._docweight), 1)
        self.assert_(self.index._docweight[DOCID])
        self.assertEqual(len(self.index._wordinfo), 4)
        self.assertEqual(len(self.index._docwords), 1)
        self.assertEqual(len(self.index._docwords[DOCID]), 4)
        for docfreq, map in self.index._wordinfo.values():
            self.assertEqual(docfreq, 1)
            self.assertEqual(len(map), 1)
            self.assert_(map.has_key(DOCID))

    def test_index_duplicated_words(self, DOCID=1):
        doc = Indexable("this is a repititive repititive repititive document")
        self.index.index_object(DOCID, doc)
        self.assert_(self.index._docweight[DOCID])
        self.assertEqual(len(self.index._wordinfo), 5)
        self.assertEqual(len(self.index._docwords), 1)
        self.assertEqual(len(self.index._docwords[DOCID]), 5)
        repititive_wid = self.lexicon._words["repititive"]
        for wid, (docfreq, map) in self.index._wordinfo.items():
            if wid == repititive_wid:
                self.assertEqual(docfreq, 1)
            else:
                self.assertEqual(docfreq, 1)
            self.assertEqual(len(map), 1)
            self.assert_(map.has_key(DOCID))

    def test_simple_query_oneresult(self):
        self.index.index_object(1, MethodIndexable('not the same document'))
        results = self.index.search("document")
        self.assertEqual(len(results), 1)
        self.assert_(results.has_key(1))

    def test_simple_query_noresults(self):
        self.index.index_object(1, MethodIndexable('not the same document'))
        results = self.index.search("frobnicate")
        self.assertEqual(len(results), 0)

    def test_query_oneresult(self):
        self.index.index_object(1, Indexable(
            'not the same document'))
        self.index.index_object(2, MethodIndexable(
            'something about something else'))
        results = self.index.search("document")
        self.assertEqual(len(results), 1)
        self.assert_(results.has_key(1))

def test_suite():
    return makeSuite(IndexTest)

if __name__=='__main__':
    main(defaultTest='test_suite')

=== Removed File Products/ZCTextIndex/tests/test_index.py ===