1 // SVNReportParser -- parser for SVN report XML data
3 // Copyright (C) 2012 James Turner <zakalawe@mac.com>
5 // This program is free software; you can redistribute it and/or
6 // modify it under the terms of the GNU General Public License as
7 // published by the Free Software Foundation; either version 2 of the
8 // License, or (at your option) any later version.
10 // This program is distributed in the hope that it will be useful, but
11 // WITHOUT ANY WARRANTY; without even the implied warranty of
12 // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 // General Public License for more details.
15 // You should have received a copy of the GNU General Public License
16 // along with this program; if not, write to the Free Software
17 // Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
20 # include <simgear_config.h>
23 #include "SVNReportParser.hxx"
32 #include <boost/foreach.hpp>
34 #include "simgear/misc/sg_path.hxx"
35 #include "simgear/misc/sg_dir.hxx"
36 #include "simgear/debug/logstream.hxx"
37 #include "simgear/xml/easyxml.hxx"
38 #include "simgear/misc/strutils.hxx"
39 #include "simgear/package/md5.h"
44 # include "sg_expat.h"
47 #include "SVNDirectory.hxx"
48 #include "SVNRepository.hxx"
49 #include "DAVMultiStatus.hxx"
56 using namespace simgear;
58 #define DAV_NS "DAV::"
59 #define SVN_NS "svn::"
60 #define SUBVERSION_DAV_NS "http://subversion.tigris.org/xmlns/dav/"
64 #define MAX_ENCODED_INT_LEN 10
67 decode_size(unsigned char* &p,
68 const unsigned char *end)
70 if (p + MAX_ENCODED_INT_LEN < end)
71 end = p + MAX_ENCODED_INT_LEN;
72 /* Decode bytes until we're done. */
76 result = (result << 7) | (*p & 0x7f);
77 if (((*p++ >> 7) & 0x1) == 0) {
86 try_decode_size(unsigned char* &p,
87 const unsigned char *end)
89 if (p + MAX_ENCODED_INT_LEN < end)
90 end = p + MAX_ENCODED_INT_LEN;
93 if (((*p++ >> 7) & 0x1) == 0) {
101 // const char* SVN_UPDATE_REPORT_TAG = SVN_NS "update-report";
102 // const char* SVN_TARGET_REVISION_TAG = SVN_NS "target-revision";
103 const char* SVN_OPEN_DIRECTORY_TAG = SVN_NS "open-directory";
104 const char* SVN_OPEN_FILE_TAG = SVN_NS "open-file";
105 const char* SVN_ADD_DIRECTORY_TAG = SVN_NS "add-directory";
106 const char* SVN_ADD_FILE_TAG = SVN_NS "add-file";
107 const char* SVN_TXDELTA_TAG = SVN_NS "txdelta";
108 const char* SVN_SET_PROP_TAG = SVN_NS "set-prop";
109 const char* SVN_DELETE_ENTRY_TAG = SVN_NS "delete-entry";
111 const char* SVN_DAV_MD5_CHECKSUM = SUBVERSION_DAV_NS ":md5-checksum";
113 const char* DAV_HREF_TAG = DAV_NS "href";
114 const char* DAV_CHECKED_IN_TAG = SVN_NS "checked-in";
117 const int svn_txdelta_source = 0;
118 const int svn_txdelta_target = 1;
119 const int svn_txdelta_new = 2;
121 const size_t DELTA_HEADER_SIZE = 4;
124 * helper struct to decode and store the SVN delta header
127 struct SVNDeltaWindow
131 static bool isWindowComplete(unsigned char* buffer, size_t bytes)
133 unsigned char* p = buffer;
134 unsigned char* pEnd = p + bytes;
135 // if we can't decode five sizes, certainly incomplete
136 for (int i=0; i<5; i++) {
137 if (!try_decode_size(p, pEnd)) {
143 // ignore these three
144 decode_size(p, pEnd);
145 decode_size(p, pEnd);
146 decode_size(p, pEnd);
147 size_t instructionLen = decode_size(p, pEnd);
148 size_t newLength = decode_size(p, pEnd);
149 size_t headerLength = p - buffer;
151 return (bytes >= (instructionLen + newLength + headerLength));
154 SVNDeltaWindow(unsigned char* p) :
158 sourceViewOffset = decode_size(p, p+20);
159 sourceViewLength = decode_size(p, p+20);
160 targetViewLength = decode_size(p, p+20);
161 instructionLength = decode_size(p, p+20);
162 newLength = decode_size(p, p+20);
164 headerLength = p - _ptr;
168 bool apply(std::vector<char>& output, std::istream& source)
170 unsigned char* pEnd = _ptr + instructionLength;
171 unsigned char* newData = pEnd;
173 while (_ptr < pEnd) {
174 int op = ((*_ptr >> 6) & 0x3);
176 SG_LOG(SG_IO, SG_INFO, "SVNDeltaWindow: bad opcode:" << op);
180 int length = *_ptr++ & 0x3f;
184 length = decode_size(_ptr, pEnd);
188 SG_LOG(SG_IO, SG_INFO, "SVNDeltaWindow: malformed stream, 0 length" << op);
192 // if op != new, decode another size value
193 if (op != svn_txdelta_new) {
194 offset = decode_size(_ptr, pEnd);
197 if (op == svn_txdelta_target) {
199 output.push_back(output[offset++]);
202 } else if (op == svn_txdelta_new) {
203 output.insert(output.end(), newData, newData + length);
204 } else if (op == svn_txdelta_source) {
205 source.seekg(offset);
206 char* sourceBuf = (char*) malloc(length);
208 source.read(sourceBuf, length);
209 output.insert(output.end(), sourceBuf, sourceBuf + length);
212 } // of instruction loop
219 return headerLength + instructionLength + newLength;
222 unsigned int sourceViewOffset;
223 size_t sourceViewLength,
234 } // of anonymous namespace
236 class SVNReportParser::SVNReportParserPrivate
239 SVNReportParserPrivate(SVNRepository* repo) :
241 status(SVNRepository::SVN_NO_ERROR),
243 currentPath(repo->fsBase())
246 currentDir = repo->rootDir();
249 ~SVNReportParserPrivate()
253 void startElement (const char * name, const char** attributes)
255 if (status != SVNRepository::SVN_NO_ERROR) {
259 ExpatAtts attrs(attributes);
260 tagStack.push_back(name);
261 if (!strcmp(name, SVN_TXDELTA_TAG)) {
263 } else if (!strcmp(name, SVN_ADD_FILE_TAG)) {
264 string fileName(attrs.getValue("name"));
265 SGPath filePath(currentDir->fsDir().file(fileName));
266 currentPath = filePath;
268 } else if (!strcmp(name, SVN_OPEN_FILE_TAG)) {
269 string fileName(attrs.getValue("name"));
270 SGPath filePath(Dir(currentPath).file(fileName));
271 currentPath = filePath;
273 DAVResource* res = currentDir->collection()->childWithName(fileName);
274 if (!res || !filePath.exists()) {
275 // set error condition
279 } else if (!strcmp(name, SVN_ADD_DIRECTORY_TAG)) {
280 string dirName(attrs.getValue("name"));
281 Dir d(currentDir->fsDir().file(dirName));
283 // policy decision : if we're doing an add, wipe the existing
287 currentDir = currentDir->addChildDirectory(dirName);
288 currentPath = currentDir->fsPath();
289 currentDir->beginUpdateReport();
290 //cout << "addDir:" << currentPath << endl;
291 } else if (!strcmp(name, SVN_SET_PROP_TAG)) {
292 setPropName = attrs.getValue("name");
293 setPropValue.clear();
294 } else if (!strcmp(name, SVN_DAV_MD5_CHECKSUM)) {
296 } else if (!strcmp(name, SVN_OPEN_DIRECTORY_TAG)) {
298 if (attrs.getValue("name")) {
299 dirName = string(attrs.getValue("name"));
301 openDirectory(dirName);
302 } else if (!strcmp(name, SVN_DELETE_ENTRY_TAG)) {
303 string entryName(attrs.getValue("name"));
304 deleteEntry(entryName);
305 } else if (!strcmp(name, DAV_CHECKED_IN_TAG) || !strcmp(name, DAV_HREF_TAG)) {
306 // don't warn on these ones
308 //std::cerr << "unhandled element:" << name << std::endl;
312 void openDirectory(const std::string& dirName)
314 if (dirName.empty()) {
315 // root directory, we shall assume
316 currentDir = tree->rootDir();
319 currentDir = currentDir->child(dirName);
323 currentPath = currentDir->fsPath();
324 currentDir->beginUpdateReport();
327 void deleteEntry(const std::string& entryName)
329 currentDir->deleteChildByName(entryName);
332 bool decodeTextDelta(const SGPath& outputPath)
334 string decoded = strutils::decodeBase64(txDeltaData);
335 size_t bytesToDecode = decoded.size();
336 std::vector<char> output;
337 unsigned char* p = (unsigned char*) decoded.data();
338 if (memcmp(p, "SVN\0", DELTA_HEADER_SIZE) != 0) {
339 return false; // bad header
342 bytesToDecode -= DELTA_HEADER_SIZE;
343 p += DELTA_HEADER_SIZE;
344 std::ifstream source;
345 source.open(outputPath.c_str(), std::ios::in | std::ios::binary);
347 while (bytesToDecode > 0) {
348 if (!SVNDeltaWindow::isWindowComplete(p, bytesToDecode)) {
349 SG_LOG(SG_IO, SG_WARN, "SVN txdelta broken window");
353 SVNDeltaWindow window(p);
354 assert(bytesToDecode >= window.size());
355 window.apply(output, source);
356 bytesToDecode -= window.size();
363 f.open(outputPath.c_str(),
364 std::ios::out | std::ios::trunc | std::ios::binary);
365 f.write(output.data(), output.size());
367 // compute MD5 while we have the file in memory
368 memset(&md5Context, 0, sizeof(SG_MD5_CTX));
369 SG_MD5Init(&md5Context);
370 SG_MD5Update(&md5Context, (unsigned char*) output.data(), output.size());
371 SG_MD5Final(&md5Context);
372 decodedFileMd5 = strutils::encodeHex(md5Context.digest, 16);
377 void endElement (const char * name)
379 if (status != SVNRepository::SVN_NO_ERROR) {
383 assert(tagStack.back() == name);
386 if (!strcmp(name, SVN_TXDELTA_TAG)) {
387 if (!decodeTextDelta(currentPath)) {
388 fail(SVNRepository::SVN_ERROR_TXDELTA);
390 } else if (!strcmp(name, SVN_ADD_FILE_TAG)) {
391 finishFile(currentDir->addChildFile(currentPath.file()));
392 } else if (!strcmp(name, SVN_OPEN_FILE_TAG)) {
393 DAVResource* res = currentDir->collection()->childWithName(currentPath.file());
396 } else if (!strcmp(name, SVN_ADD_DIRECTORY_TAG)) {
398 currentPath = currentPath.dir();
399 currentDir->updateReportComplete();
400 currentDir = currentDir->parent();
401 } else if (!strcmp(name, SVN_SET_PROP_TAG)) {
402 if (setPropName == "svn:entry:committed-rev") {
403 revision = strutils::to_int(setPropValue);
404 currentVersionName = setPropValue;
406 // for directories we have the resource already
407 // for adding files, we might not; we set the version name
408 // above when ending the add/open-file element
409 currentDir->collection()->setVersionName(currentVersionName);
412 } else if (!strcmp(name, SVN_DAV_MD5_CHECKSUM)) {
413 // validate against (presumably) just written file
414 if (decodedFileMd5 != md5Sum) {
415 fail(SVNRepository::SVN_ERROR_CHECKSUM);
417 } else if (!strcmp(name, SVN_OPEN_DIRECTORY_TAG)) {
418 if (currentDir->parent()) {
419 // pop the collection stack
420 currentDir = currentDir->parent();
423 currentDir->updateReportComplete();
424 currentPath = currentDir->fsPath();
426 // std::cout << "element:" << name;
430 void finishFile(DAVResource* res)
432 res->setVersionName(currentVersionName);
434 currentPath = currentPath.dir();
438 void data (const char * s, int length)
440 if (status != SVNRepository::SVN_NO_ERROR) {
444 if (tagStack.back() == SVN_SET_PROP_TAG) {
445 setPropValue += string(s, length);
446 } else if (tagStack.back() == SVN_TXDELTA_TAG) {
447 txDeltaData += string(s, length);
448 } else if (tagStack.back() == SVN_DAV_MD5_CHECKSUM) {
449 md5Sum += string(s, length);
453 void pi (const char * target, const char * data) {}
455 string tagN(const unsigned int n) const
457 size_t sz = tagStack.size();
462 return tagStack[sz - (1 + n)];
465 void fail(SVNRepository::ResultCode err)
471 DAVCollection* rootCollection;
472 SVNDirectory* currentDir;
473 SVNRepository::ResultCode status;
476 XML_Parser xmlParser;
479 string_list tagStack;
480 string currentVersionName;
485 unsigned int revision;
486 SG_MD5_CTX md5Context;
487 string md5Sum, decodedFileMd5;
488 std::string setPropName, setPropValue;
492 ////////////////////////////////////////////////////////////////////////
493 // Static callback functions for Expat.
494 ////////////////////////////////////////////////////////////////////////
496 #define VISITOR static_cast<SVNReportParser::SVNReportParserPrivate *>(userData)
499 start_element (void * userData, const char * name, const char ** atts)
501 VISITOR->startElement(name, atts);
505 end_element (void * userData, const char * name)
507 VISITOR->endElement(name);
511 character_data (void * userData, const char * s, int len)
513 VISITOR->data(s, len);
517 processing_instruction (void * userData,
521 VISITOR->pi(target, data);
526 ///////////////////////////////////////////////////////////////////////////////
528 SVNReportParser::SVNReportParser(SVNRepository* repo) :
529 _d(new SVNReportParserPrivate(repo))
534 SVNReportParser::~SVNReportParser()
538 SVNRepository::ResultCode
539 SVNReportParser::innerParseXML(const char* data, int size)
541 if (_d->status != SVNRepository::SVN_NO_ERROR) {
545 bool isEnd = (data == NULL);
546 if (!XML_Parse(_d->xmlParser, data, size, isEnd)) {
547 SG_LOG(SG_IO, SG_INFO, "SVN parse error:" << XML_ErrorString(XML_GetErrorCode(_d->xmlParser))
548 << " at line:" << XML_GetCurrentLineNumber(_d->xmlParser)
549 << " column " << XML_GetCurrentColumnNumber(_d->xmlParser));
551 XML_ParserFree(_d->xmlParser);
552 _d->parserInited = false;
553 return SVNRepository::SVN_ERROR_XML;
555 XML_ParserFree(_d->xmlParser);
556 _d->parserInited = false;
562 SVNRepository::ResultCode
563 SVNReportParser::parseXML(const char* data, int size)
565 if (_d->status != SVNRepository::SVN_NO_ERROR) {
569 if (!_d->parserInited) {
570 _d->xmlParser = XML_ParserCreateNS(0, ':');
571 XML_SetUserData(_d->xmlParser, _d.get());
572 XML_SetElementHandler(_d->xmlParser, start_element, end_element);
573 XML_SetCharacterDataHandler(_d->xmlParser, character_data);
574 XML_SetProcessingInstructionHandler(_d->xmlParser, processing_instruction);
575 _d->parserInited = true;
578 return innerParseXML(data, size);
581 SVNRepository::ResultCode SVNReportParser::finishParse()
583 if (_d->status != SVNRepository::SVN_NO_ERROR) {
587 return innerParseXML(NULL, 0);
590 std::string SVNReportParser::etagFromRevision(unsigned int revision)
592 // etags look like W/"7//", hopefully this is stable
593 // across different servers and similar
594 std::ostringstream os;
595 os << "W/\"" << revision << "//";