#!/usr/bin/env python """ popindex.py - generate a popcon index to be used by the recommender as the users repository, based on filters provided by config """ __author__ = "Tassia Camoes Araujo " __copyright__ = "Copyright (C) 2011 Tassia Camoes Araujo" __license__ = """ This program is free software: you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation, either version 3 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program. If not, see . """ import os import sys sys.path.insert(0,'../') import logging import datetime from config import Config from data import PopconXapianIndex if __name__ == '__main__': cfg = Config() begin_time = datetime.datetime.now() logging.info("Popcon indexing started at %s" % begin_time) # use config file or command line options popindex = PopconXapianIndex(cfg) end_time = datetime.datetime.now() logging.info("Popcon indexing completed at %s" % end_time) logging.info("Number of documents (submissions): %d" % popindex.get_doccount()) delta = end_time - begin_time logging.info("Time elapsed: %d seconds." % delta.seconds) if cfg.index_mode=="cluster" or cfg.index_mode=="recluster": logging.info("Medoids: %d\tDispersion:%f" % (cfg.k_medoids,popindex.cluster_dispersion))