Source code for lerot.experiment.LearningExperiment

# This file is part of Lerot.
#
# Lerot is free software: you can redistribute it and/or modify
# it under the terms of the GNU Lesser General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# Lerot is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU Lesser General Public License for more details.
#
# You should have received a copy of the GNU Lesser General Public License
# along with Lerot.  If not, see <http://www.gnu.org/licenses/>.

# KH, 2012/06/14
"""
Runs an online learning experiment. The "environment" logic is located here,
e.g., sampling queries, observing user clicks, external evaluation of result
lists
"""

import sys
import logging
import warnings
from numpy.linalg import norm

from ..utils import get_cosine_similarity
from .AbstractLearningExperiment import AbstractLearningExperiment


class LearningExperiment(AbstractLearningExperiment):
    """
    Represents an experiment in which a retrieval system learns from
    implicit user feedback. The experiment is initialized as specified in
    the provided arguments or config file.
    """

    def run(self):
        """A single run of the experiment."""
        query_keys = sorted(self.training_queries.keys())
        query_length = len(query_keys)
        online_evaluation = {}
        offline_test_evaluation = {}
        # offline_train_evaluation = {}
        for eval_name, eval_dict in self.evaluations:
            dict_name = eval_name + '@' + str(eval_dict['cutoff'])
            # Skip duplicate evaluations
            if dict_name in online_evaluation:
                warnings.warn("Duplicate evaluation arguments, omitting..")
                continue
            online_evaluation[dict_name] = []
            offline_test_evaluation[dict_name] = []
            # offline_train_evaluation[dict_name] = []
        similarities = [.0]

        # Process queries
        for query_count in xrange(self.num_queries):
            logging.debug("Query nr: {}".format(query_count))
            previous_solution_w = self.system.get_solution().w
            qid = self._sample_qid(query_keys, query_count, query_length)
            query = self.training_queries[qid]

            # Get result list for the current query from the system
            result_list = self.system.get_ranked_list(query)

            # Online evaluation
            for eval_name, eval_dict in self.evaluations:
                a = float(eval_dict['eval_class'].evaluate_ranking(
                    result_list, query, eval_dict['cutoff']))
                online_evaluation[
                    eval_name + '@' + str(eval_dict['cutoff'])].append(a)

            # Generate click feedback
            clicks = self.um.get_clicks(result_list, query.get_labels())

            # Send feedback to system
            current_solution = self.system.update_solution(clicks)

            # Compute current offline performance (over all documents)
            for eval_name, eval_dict in self.evaluations:
                # Create dict name as done above
                dict_name = eval_name + '@' + str(eval_dict['cutoff'])
                if (not (previous_solution_w == current_solution.w).all()) \
                        or len(offline_test_evaluation[dict_name]) == 0:
                    e1 = eval_dict['eval_class'].evaluate_all(
                        current_solution, self.test_queries,
                        eval_dict['cutoff'])
                    # e2 = eval_dict['eval_class'].evaluate_all(
                    #     current_solution, self.training_queries,
                    #     eval_dict['cutoff'])
                    offline_test_evaluation[dict_name].append(float(e1))
                    # offline_train_evaluation[dict_name].append(float(e2))
                else:
                    offline_test_evaluation[dict_name].append(
                        offline_test_evaluation[dict_name][-1])
                    # offline_train_evaluation[dict_name].append(
                    #     offline_train_evaluation[dict_name][-1])

            similarities.append(float(get_cosine_similarity(
                previous_solution_w, current_solution.w)))

        # Print a newline for the next run
        sys.stdout.write('\nDone')
        sys.stdout.write('\n')
        sys.stdout.flush()

        # Finalize evaluation measures after training is done
        summary = {"weight_sim": similarities,
                   "final_weights": previous_solution_w.tolist()}
        for eval_name, eval_dict in self.evaluations:
            dict_name = eval_name + '@' + str(eval_dict['cutoff'])
            logging.info("Final offline %s = %.3f" % (
                dict_name, offline_test_evaluation[dict_name][-1]))
            summary["online_" + dict_name] = online_evaluation[dict_name]
            summary["offline_test_" + dict_name] = \
                offline_test_evaluation[dict_name]
            # summary["offline_train_" + dict_name] = \
            #     offline_train_evaluation[dict_name]
        logging.info("Length of final weight vector = %.3f" %
                     norm(current_solution.w))
        return summary
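

# ---------------------------------------------------------------------------
# Illustration only -- not part of Lerot. A minimal, hypothetical sketch of
# the collaborator contract that run() relies on: a retrieval system exposing
# get_solution()/get_ranked_list()/update_solution(), and a user model
# exposing get_clicks(). The _Stub* classes, _stub_feedback_round(), and the
# dict-based labels are invented for this example and do not mirror the real
# Lerot class signatures; get_cosine_similarity is the module-level import
# used by run() above.
# ---------------------------------------------------------------------------

import numpy as np


class _StubSolution(object):
    """Wraps a weight vector; run() only reads the .w attribute."""

    def __init__(self, w):
        self.w = np.asarray(w, dtype=float)


class _StubSystem(object):
    """Stand-in retrieval system keeping a weight vector and faking
    learning updates."""

    def __init__(self, feature_count):
        self._solution = _StubSolution(np.ones(feature_count))

    def get_solution(self):
        return self._solution

    def get_ranked_list(self, docids):
        # A real system ranks the query's documents by its current weights;
        # this stub simply returns the input order.
        return list(docids)

    def update_solution(self, clicks):
        # A real system learns new weights from the click feedback; this
        # stub perturbs the weights so the similarity below is informative.
        self._solution = _StubSolution(
            self._solution.w + 0.1 * np.arange(self._solution.w.size))
        return self._solution


class _StubUserModel(object):
    """Stand-in user model that clicks every positively labeled document."""

    def get_clicks(self, result_list, labels):
        return [1 if labels.get(docid, 0) > 0 else 0
                for docid in result_list]


def _stub_feedback_round(system, user_model, docids, labels):
    """One simulated interaction, mirroring the body of run()'s query loop."""
    previous_w = system.get_solution().w
    result_list = system.get_ranked_list(docids)
    clicks = user_model.get_clicks(result_list, labels)
    current_solution = system.update_solution(clicks)
    return float(get_cosine_similarity(previous_w, current_solution.w))


# Example usage (hypothetical data):
#     sim = _stub_feedback_round(_StubSystem(5), _StubUserModel(),
#                                ["d1", "d2", "d3"],
#                                {"d1": 1, "d2": 0, "d3": 0})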