/* * Copyright 2011 Steven Gribble * * This file is part of the UW CSE 333 course project sequence * (333proj). * * 333proj is free software: you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation, either version 3 of the License, or * (at your option) any later version. * * 333proj is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with 333proj. If not, see . */ #ifndef HW3_QUERYPROCESSOR_H_ #define HW3_QUERYPROCESSOR_H_ #include #include #include #include #include "./fileindexutil.h" #include "./DocIDTableReader.h" #include "./DocTableReader.h" #include "./FileIndexReader.h" #include "./IndexTableReader.h" using std::list; using std::vector; using std::string; namespace hw3 { // A QueryProcessor is a class that is given a set of names of index // files, and uses the various FileIndexReader and HashTableReader // classes to process queries against the indices. class QueryProcessor { public: // Construct a QueryProcessor. Arguments: // // - indexlist: a std::list containing a list of index // filenames that the QueryProcessor should use. // // - validate: a bool indicating whether or not to validate the // checksums in the index files. Defaults to true. QueryProcessor(list indexlist, bool validate = true); // The destructor. ~QueryProcessor(); // This structure defines a single query result. As with HW2, // the rank of a query result is the sum of the number of occurrences // of query words within the document. class QueryResult { public: bool operator<(const QueryResult &rhs) const { return rank > rhs.rank; } std::string document_name; // The name of a matching document. uint32_t rank; // The rank of the matching document. }; // This method processes a query against the indices and returns a // vector of QueryResults, sorted in descending order of rank. If no // documents match the query, then a valid but empty vector will be // returned. std::vector ProcessQuery(const std::vector &query); protected: // The list of index files we process. std::list indexlist_; // The arrays of pointers to DocTableReader and IndexTableReader // objects. uint32_t arraylen_; DocTableReader **dtr_array_; IndexTableReader **itr_array_; private: // Disable the copy constructor and assignment operator. DISALLOW_COPY_AND_ASSIGN(QueryProcessor); }; } // namespace hw3 #endif // HW3_QUERYPROCESSOR_H_