Changeset 159:e4e3160be9c0 for classifier/classifier.py
- Timestamp:
- 08/19/07 10:34:17 (15 months ago)
- Files:
-
- 1 modified
-
classifier/classifier.py (modified) (3 diffs)
Legend:
- Unmodified
- Added
- Removed
-
classifier/classifier.py
r157 r159 42 42 wich means: store words in categories 43 43 """ 44 self.backend.addCategory(name=category, title=category) 44 self.backend.add_category(name=category) 45 45 data = self.tokenizer.transform(data, self.options) 46 46 for element in data: 47 self.backend.addWord(element, self.language, category) 47 self.backend.add_word(element, self.language, category) 48 48 49 49 def unlearn(self, data, category): … … 116 116 117 117 def corpusSize(self, language=None): 118 return self.backend.wordCount(language=language) 118 119 return self.backend.word_count(language=language) 119 120 120 121 def categorySize(self, category, language=None): 121 return self.backend.wordCount(category=category, language=language) 122 return self.backend.word_count(category=category, language=language) 122 123 123 124 def _buildWordProbabilities(self, language=None): 124 125 probs = {} 125 for cat in self.backend.listCategories(): 126 for cat in self.backend.list_categories(): 126 127 probs[cat] = self._buildCategoryWordProbabilities(cat, language) 127 128 return probs … … 138 139 them_count = float(max(corpus_size - category_size, 1)) 139 140 probabilities = {} 140 words = self.backend.listWords(language, complete=True) 141 words = self.backend.list_words(language, complete=True) 141 142 142 143 for word in words:
