| 1 | /**************************************************************************** |
| 2 | ** |
| 3 | ** Copyright (C) 2016 The Qt Company Ltd. |
| 4 | ** Contact: https://www.qt.io/licensing/ |
| 5 | ** |
| 6 | ** This file is part of the QtXmlPatterns module of the Qt Toolkit. |
| 7 | ** |
| 8 | ** $QT_BEGIN_LICENSE:LGPL$ |
| 9 | ** Commercial License Usage |
| 10 | ** Licensees holding valid commercial Qt licenses may use this file in |
| 11 | ** accordance with the commercial license agreement provided with the |
| 12 | ** Software or, alternatively, in accordance with the terms contained in |
| 13 | ** a written agreement between you and The Qt Company. For licensing terms |
| 14 | ** and conditions see https://www.qt.io/terms-conditions. For further |
| 15 | ** information use the contact form at https://www.qt.io/contact-us. |
| 16 | ** |
| 17 | ** GNU Lesser General Public License Usage |
| 18 | ** Alternatively, this file may be used under the terms of the GNU Lesser |
| 19 | ** General Public License version 3 as published by the Free Software |
| 20 | ** Foundation and appearing in the file LICENSE.LGPL3 included in the |
| 21 | ** packaging of this file. Please review the following information to |
| 22 | ** ensure the GNU Lesser General Public License version 3 requirements |
| 23 | ** will be met: https://www.gnu.org/licenses/lgpl-3.0.html. |
| 24 | ** |
| 25 | ** GNU General Public License Usage |
| 26 | ** Alternatively, this file may be used under the terms of the GNU |
| 27 | ** General Public License version 2.0 or (at your option) the GNU General |
| 28 | ** Public license version 3 or any later version approved by the KDE Free |
| 29 | ** Qt Foundation. The licenses are as published by the Free Software |
| 30 | ** Foundation and appearing in the file LICENSE.GPL2 and LICENSE.GPL3 |
| 31 | ** included in the packaging of this file. Please review the following |
| 32 | ** information to ensure the GNU General Public License requirements will |
| 33 | ** be met: https://www.gnu.org/licenses/gpl-2.0.html and |
| 34 | ** https://www.gnu.org/licenses/gpl-3.0.html. |
| 35 | ** |
| 36 | ** $QT_END_LICENSE$ |
| 37 | ** |
| 38 | ****************************************************************************/ |
| 39 | |
| 40 | // |
| 41 | // W A R N I N G |
| 42 | // ------------- |
| 43 | // |
| 44 | // This file is not part of the Qt API. It exists purely as an |
| 45 | // implementation detail. This header file may change from version to |
| 46 | // version without notice, or even be removed. |
| 47 | // |
| 48 | // We mean it. |
| 49 | |
| 50 | #ifndef Patternist_AccelTree_H |
| 51 | #define Patternist_AccelTree_H |
| 52 | |
| 53 | #include <QHash> |
| 54 | #include <QUrl> |
| 55 | #include <QVector> |
| 56 | #include <QXmlName> |
| 57 | |
| 58 | #include <private/qitem_p.h> |
| 59 | #include <private/qnamepool_p.h> |
| 60 | |
| 61 | QT_BEGIN_NAMESPACE |
| 62 | |
| 63 | namespace QPatternist |
| 64 | { |
| 65 | template<bool> class AccelTreeBuilder; |
| 66 | |
| 67 | /** |
| 68 | * @short Stores an XML document using the XPath Accelerator scheme, also |
| 69 | * known as pre/post numbering. |
| 70 | * |
| 71 | * Working on this code will be destructive without a proper understanding of |
| 72 | * the Accelerator scheme, so do check out the links. We don't implement any form |
| 73 | * of staircase join, although that is only due to time constraints. |
| 74 | * |
| 75 | * @author Frans Englich <frans.englich@nokia.com> |
| 76 | * @see <a href="http://www.pathfinder-xquery.org/?q=research/xpath-accel">XPath |
| 77 | * Accelerator</a> |
| 78 | * @see <a href="http://www.pathfinder-xquery.org/files/xpath-accel.pdf">Accelerating |
| 79 | * XPath Location Steps, Torsten Grust</a> |
| 80 | * @see <a href="http://citeseer.ist.psu.edu/cache/papers/cs/29367/http:zSzzSzwww.informatik.uni-konstanz.dezSz~grustzSzfileszSzstaircase-join.pdf/grust03staircase.pdf">Staircase Join: |
| 81 | * Teach a Relational DBMS to Watch its (Axis) Steps</a> |
| 82 | * @see <a href="http://ftp.cwi.nl/CWIreports/INS/INS-E0510.pdf">Loop-lifted |
| 83 | * staircase join: from XPath to XQuery, Torsten Grust</a> |
| 84 | * @see <a href="http://englich.wordpress.com/2007/01/09/xmlstat/">xmlstat, Frans Englich</a> |
| 85 | * @see <a href"http://www.inf.uni-konstanz.de/dbis/publications/download/accelerating-locsteps.pdf">Accelerating |
| 86 | * XPath Evaluation in Any RDBMS, Torsten Grust</a> |
| 87 | */ |
| 88 | class Q_AUTOTEST_EXPORT AccelTree : public QAbstractXmlNodeModel |
| 89 | { |
| 90 | friend class AccelTreePrivate; |
| 91 | public: |
| 92 | using QAbstractXmlNodeModel::createIndex; |
| 93 | |
| 94 | typedef QExplicitlySharedDataPointer<AccelTree> Ptr; |
| 95 | typedef qint32 PreNumber; |
| 96 | typedef PreNumber PostNumber; |
| 97 | typedef qint8 Depth; |
| 98 | |
| 99 | AccelTree(const QUrl &docURI, const QUrl &bURI); |
| 100 | |
| 101 | /** |
| 102 | * @short Houses data for a node, and that all node kinds have. |
| 103 | * |
| 104 | * BasicNodeData is internal to the Accel tree implementation, and is |
| 105 | * only used by those classes. |
| 106 | * |
| 107 | * @author Frans Englich <frans.englich@nokia.com> |
| 108 | * @todo Can't m_kind be coded somewhere else? If m_name is invalid, |
| 109 | * its bits can be used to distinguish the node types that doesn't have |
| 110 | * names, and for elements, attributes and processing instructions, we need |
| 111 | * two bits, somewhere. Attributes and processing instructions can't have a |
| 112 | * size, is that of help? There's also certain rules for the names. For instance, |
| 113 | * a processing instruction will never have a prefix nor namespace. Neither |
| 114 | * will an attribute node have a default, non-empty namespace, right? |
| 115 | * @todo Compress text nodes, add general support for it in Patternist. |
| 116 | */ |
| 117 | class BasicNodeData |
| 118 | { |
| 119 | public: |
| 120 | /* No need to initialize the members. See AccelTreeBuilder. */ |
| 121 | inline BasicNodeData() |
| 122 | { |
| 123 | } |
| 124 | |
| 125 | inline BasicNodeData(const PreNumber aDepth, |
| 126 | const PreNumber aParent, |
| 127 | const QXmlNodeModelIndex::NodeKind k, |
| 128 | const PreNumber s, |
| 129 | const QXmlName n = QXmlName()) : m_parent(aParent) |
| 130 | , m_size(s) |
| 131 | , m_name(n) |
| 132 | , m_depth(aDepth) |
| 133 | , m_kind(k) |
| 134 | { |
| 135 | } |
| 136 | |
| 137 | inline Depth depth() const |
| 138 | { |
| 139 | return m_depth; |
| 140 | } |
| 141 | |
| 142 | inline PreNumber parent() const |
| 143 | { |
| 144 | return m_parent; |
| 145 | } |
| 146 | |
| 147 | /** |
| 148 | * @see AccelTree::size() |
| 149 | */ |
| 150 | inline PreNumber size() const |
| 151 | { |
| 152 | /* Remember that we use the m_size to signal compression if |
| 153 | * we're a text node. */ |
| 154 | if(m_kind == QXmlNodeModelIndex::Text) |
| 155 | return 0; |
| 156 | else |
| 157 | return m_size; |
| 158 | } |
| 159 | |
| 160 | inline void setSize(const PreNumber aSize) |
| 161 | { |
| 162 | m_size = aSize; |
| 163 | } |
| 164 | |
| 165 | inline QXmlNodeModelIndex::NodeKind kind() const |
| 166 | { |
| 167 | return m_kind; |
| 168 | } |
| 169 | |
| 170 | inline QXmlName name() const |
| 171 | { |
| 172 | return m_name; |
| 173 | } |
| 174 | |
| 175 | inline bool isCompressed() const |
| 176 | { |
| 177 | Q_ASSERT_X(m_kind == QXmlNodeModelIndex::Text, Q_FUNC_INFO, |
| 178 | "Currently, only text nodes are compressed." ); |
| 179 | /* Note, we don't call size() here, since it has logic for text |
| 180 | * nodes. */ |
| 181 | return m_size == IsCompressed; |
| 182 | } |
| 183 | |
| 184 | private: |
| 185 | /** |
| 186 | * This is the pre number of the parent. |
| 187 | */ |
| 188 | PreNumber m_parent; |
| 189 | |
| 190 | /** |
| 191 | * This is the count of children this node has. |
| 192 | * |
| 193 | * In the case of a text node, which cannot have children, |
| 194 | * it is set to IsCompressed, if the content has been the result |
| 195 | * of CompressedWhitespace::compress(). If it's not compressed, |
| 196 | * it is zero. |
| 197 | */ |
| 198 | PreNumber m_size; |
| 199 | |
| 200 | /** |
| 201 | * For text nodes, and less importantly, comments, |
| 202 | * this variable is not used. |
| 203 | */ |
| 204 | QXmlName m_name; |
| 205 | |
| 206 | Depth m_depth; |
| 207 | |
| 208 | /** |
| 209 | * Technically it is sufficient with 7 bits. However, at least MSVC |
| 210 | * 2005 miscompiles it such that QXmlNodeModelIndex::Text becomes |
| 211 | * -64 instead of 64 with hilarious crashes as result. |
| 212 | * |
| 213 | * Fortunately this extra bit would be padded anyway. |
| 214 | */ |
| 215 | QXmlNodeModelIndex::NodeKind m_kind : 8; |
| 216 | }; |
| 217 | |
| 218 | virtual QUrl baseUri(const QXmlNodeModelIndex &ni) const; |
| 219 | virtual QUrl documentUri(const QXmlNodeModelIndex &ni) const; |
| 220 | virtual QXmlNodeModelIndex::NodeKind kind(const QXmlNodeModelIndex &ni) const; |
| 221 | virtual QXmlNodeModelIndex::DocumentOrder compareOrder(const QXmlNodeModelIndex &ni1, |
| 222 | const QXmlNodeModelIndex &ni2) const; |
| 223 | |
| 224 | /** |
| 225 | * @short Returns the root node. |
| 226 | * |
| 227 | * This function does not use @p n, so a default constructed |
| 228 | * QXmlNodeModelIndex may be passed. |
| 229 | */ |
| 230 | virtual QXmlNodeModelIndex root(const QXmlNodeModelIndex &n) const; |
| 231 | |
| 232 | virtual QXmlNodeModelIndex parent(const QXmlNodeModelIndex &ni) const; |
| 233 | virtual QXmlNodeModelIndex::Iterator::Ptr iterate(const QXmlNodeModelIndex &ni, |
| 234 | QXmlNodeModelIndex::Axis axis) const; |
| 235 | virtual QXmlName name(const QXmlNodeModelIndex &ni) const; |
| 236 | virtual QVector<QXmlName> namespaceBindings(const QXmlNodeModelIndex &n) const; |
| 237 | virtual void sendNamespaces(const QXmlNodeModelIndex &n, |
| 238 | QAbstractXmlReceiver *const receiver) const; |
| 239 | virtual QString stringValue(const QXmlNodeModelIndex &n) const; |
| 240 | virtual QVariant typedValue(const QXmlNodeModelIndex &n) const; |
| 241 | virtual Item::Iterator::Ptr sequencedTypedValue(const QXmlNodeModelIndex &n) const; |
| 242 | virtual ItemType::Ptr type(const QXmlNodeModelIndex &ni) const; |
| 243 | virtual QXmlNodeModelIndex elementById(const QXmlName &id) const; |
| 244 | virtual QVector<QXmlNodeModelIndex> nodesByIdref(const QXmlName &idref) const; |
| 245 | virtual void copyNodeTo(const QXmlNodeModelIndex &node, |
| 246 | QAbstractXmlReceiver *const receiver, |
| 247 | const NodeCopySettings &settings) const; |
| 248 | |
| 249 | friend class AccelTreeBuilder<false>; |
| 250 | friend class AccelTreeBuilder<true>; |
| 251 | |
| 252 | enum Constants |
| 253 | { |
| 254 | IsCompressed = 1 |
| 255 | }; |
| 256 | |
| 257 | /** |
| 258 | * The key is the pre number of an element, and the value is a vector |
| 259 | * containing the namespace declarations being declared on that |
| 260 | * element. Therefore, it does not reflect the namespaces being in |
| 261 | * scope for that element. For that, a walk along axis ancestor is |
| 262 | * necessary. |
| 263 | */ |
| 264 | QHash<PreNumber, QVector<QXmlName> > namespaces; |
| 265 | |
| 266 | /** |
| 267 | * Stores data for nodes. The QHash's value is the data of the processing instruction, and the |
| 268 | * content of a text node or comment. |
| 269 | */ |
| 270 | QHash<PreNumber, QString> data; |
| 271 | |
| 272 | QVector<BasicNodeData> basicData; |
| 273 | QHash<PreNumber, QPair<qint64, qint64> > sourcePositions; |
| 274 | |
| 275 | inline QUrl documentUri() const |
| 276 | { |
| 277 | return m_documentURI; |
| 278 | } |
| 279 | |
| 280 | inline QUrl baseUri() const |
| 281 | { |
| 282 | return m_baseURI; |
| 283 | } |
| 284 | |
| 285 | /** |
| 286 | * @short Returns @c true if the node identified by @p pre has child |
| 287 | * nodes(in the sense of the XDM), but also if it has namespace nodes, |
| 288 | * or attribute nodes. |
| 289 | */ |
| 290 | inline bool hasChildren(const PreNumber pre) const |
| 291 | { |
| 292 | return basicData.at(i: pre).size() > 0; |
| 293 | } |
| 294 | |
| 295 | /** |
| 296 | * @short Returns the parent node of @p pre. |
| 297 | * |
| 298 | * If @p pre parent doesn't have a parent node, the return value is |
| 299 | * undefined. |
| 300 | * |
| 301 | * @see hasParent() |
| 302 | */ |
| 303 | inline PreNumber parent(const PreNumber pre) const |
| 304 | { |
| 305 | return basicData.at(i: pre).parent(); |
| 306 | } |
| 307 | |
| 308 | inline bool hasParent(const PreNumber pre) const |
| 309 | { |
| 310 | return basicData.at(i: pre).depth() > 0; |
| 311 | } |
| 312 | |
| 313 | inline bool hasFollowingSibling(const PreNumber pre) const |
| 314 | { |
| 315 | return pre < maximumPreNumber(); |
| 316 | } |
| 317 | |
| 318 | inline PostNumber postNumber(const PreNumber pre) const |
| 319 | { |
| 320 | const BasicNodeData &b = basicData.at(i: pre); |
| 321 | return pre + b.size() - b.depth(); |
| 322 | } |
| 323 | |
| 324 | inline QXmlNodeModelIndex::NodeKind kind(const PreNumber pre) const |
| 325 | { |
| 326 | return basicData.at(i: pre).kind(); |
| 327 | } |
| 328 | |
| 329 | inline PreNumber maximumPreNumber() const |
| 330 | { |
| 331 | return basicData.count() - 1; |
| 332 | } |
| 333 | |
| 334 | inline PreNumber toPreNumber(const QXmlNodeModelIndex n) const |
| 335 | { |
| 336 | return n.data(); |
| 337 | } |
| 338 | |
| 339 | inline PreNumber size(const PreNumber pre) const |
| 340 | { |
| 341 | Q_ASSERT_X(basicData.at(pre).size() != -1, Q_FUNC_INFO, |
| 342 | "The size cannot be -1. That means an uninitialized value is attempted to be used." ); |
| 343 | return basicData.at(i: pre).size(); |
| 344 | } |
| 345 | |
| 346 | inline Depth depth(const PreNumber pre) const |
| 347 | { |
| 348 | return basicData.at(i: pre).depth(); |
| 349 | } |
| 350 | |
| 351 | void printStats(const NamePool::Ptr &np) const; |
| 352 | |
| 353 | inline QXmlName name(const PreNumber pre) const |
| 354 | { |
| 355 | return basicData.at(i: pre).name(); |
| 356 | } |
| 357 | |
| 358 | inline bool isCompressed(const PreNumber pre) const |
| 359 | { |
| 360 | return basicData.at(i: pre).isCompressed(); |
| 361 | } |
| 362 | |
| 363 | static inline bool hasPrefix(const QVector<QXmlName> &nbs, const QXmlName::PrefixCode prefix); |
| 364 | |
| 365 | QUrl m_documentURI; |
| 366 | QUrl m_baseURI; |
| 367 | |
| 368 | protected: |
| 369 | virtual QXmlNodeModelIndex nextFromSimpleAxis(QAbstractXmlNodeModel::SimpleAxis, |
| 370 | const QXmlNodeModelIndex&) const; |
| 371 | virtual QVector<QXmlNodeModelIndex> attributes(const QXmlNodeModelIndex &element) const; |
| 372 | |
| 373 | private: |
| 374 | /** |
| 375 | * Returns the source location for the object with the given @p index. |
| 376 | */ |
| 377 | QSourceLocation sourceLocation(const QXmlNodeModelIndex &index) const; |
| 378 | |
| 379 | /** |
| 380 | * Copies the children of @p node to @p receiver. |
| 381 | */ |
| 382 | inline void copyChildren(const QXmlNodeModelIndex &node, |
| 383 | QAbstractXmlReceiver *const receiver, |
| 384 | const NodeCopySettings &settings) const; |
| 385 | |
| 386 | /** |
| 387 | * The key is the xml:id value, and the value is the element |
| 388 | * with that value. |
| 389 | */ |
| 390 | QHash<QXmlName::LocalNameCode, PreNumber> m_IDs; |
| 391 | }; |
| 392 | } |
| 393 | |
| 394 | Q_DECLARE_TYPEINFO(QPatternist::AccelTree::BasicNodeData, Q_MOVABLE_TYPE); |
| 395 | |
| 396 | QT_END_NAMESPACE |
| 397 | |
| 398 | #endif |
| 399 | |