Handle <title> in SVG
[xapian.git] / xapian-core / api / vectortermlist.h
blob8fc810db411f859809a64391517668ac9d51af2e
/** @file
 * @brief A vector-like container of terms which can be iterated.
 */
/* Copyright (C) 2011,2012,2017 Olly Betts
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License as
 * published by the Free Software Foundation; either version 2 of the
 * License, or (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301 USA
 */
21 #ifndef XAPIAN_INCLUDED_VECTORTERMLIST_H
22 #define XAPIAN_INCLUDED_VECTORTERMLIST_H
24 #include "xapian/types.h"
26 #include "net/length.h"
27 #include "termlist.h"
29 /** This class stores a list of terms.
31 * To be memory efficient, we store the terms in a single string using a
32 * suitable simple encoding. This way the number of bytes needed will
33 * usually be the sum of the lengths of all the terms plus the number of
34 * terms. If we used std::vector<std::string> here like we used to, that
35 * would need something like an additional 30 bytes per term (30 calculated
36 * for GCC 4.x on x86_64).
38 class VectorTermList : public TermList {
39 /// The encoded terms.
40 std::string data;
42 /// Pointer to the next term's data, or NULL if we are at end.
43 const char * p;
45 /// The number of terms in the list.
46 Xapian::termcount num_terms;
48 /// The current term.
49 std::string current_term;
51 public:
52 template<typename I>
53 VectorTermList(I begin, I end) : num_terms(0)
55 // First calculate how much space we'll need so we can reserve it.
56 size_t total_size = 0;
57 for (I i = begin; i != end; ++i) {
58 ++num_terms;
59 const std::string & s = *i;
60 total_size += s.size() + 1;
61 if (s.size() >= 255) {
62 // Not a common case, so just assume the worst case rather than
63 // trying to carefully calculate the exact size.
64 total_size += 5;
67 data.reserve(total_size);
69 // Now encode all the terms into data.
70 for (I i = begin; i != end; ++i) {
71 const std::string & s = *i;
72 data += encode_length(s.size());
73 data += s;
76 p = data.data();
79 Xapian::termcount get_approx_size() const;
81 std::string get_termname() const;
83 Xapian::termcount get_wdf() const;
85 Xapian::doccount get_termfreq() const;
87 TermList * next();
89 TermList * skip_to(const std::string &);
91 bool at_end() const;
93 Xapian::termcount positionlist_count() const;
95 Xapian::PositionIterator positionlist_begin() const;
98 #endif // XAPIAN_INCLUDED_VECTORTERMLIST_H