1

2

3

4

5

6

7

8

9

10

11

12

13

14

15

16

17

18

19

20

21

22

23

24

25

26

27

28

29

30

31

32

33

34

35

36

37

38

39

40

41

42

43

44

45

46

47

48

49

50

51

52

53

54

55

56

57

58

59

60

61

62

63

64

65

66

67

68

69

70

71

72

73

74

75

76

77

78

79

80

81

82

83

84

85

86

87

88

89

90

91

92

93

94

95

96

97

98

99

100

101

102

103

104

105

106

107

108

109

110

111

112

113

114

115

116

117

118

119

120

121

122

123

124

125

126

127

128

129

130

131

132

133

134

135

136

137

138

139

140

141

142

143

144

145

146

147

148

149

150

151

152

153

154

155

156

157

158

159

160

161

162

163

164

165

166

167

168

169

170

171

172

173

174

175

176

177

178

179

180

181

182

183

184

185

186

187

188

189

190

191

192

193

194

195

196

197

198

199

200

201

202

203

204

205

206

207

208

209

210

211

212

213

214

215

216

217

218

219

220

221

222

223

224

225

226

227

228

229

230

231

232

233

234

235

236

237

238

239

240

241

242

243

244

245

246

247

248

249

250

251

252

253

254

255

256

257

258

259

260

261

262

263

264

265

266

267

268

269

270

271

272

273

274

275

276

277

278

279

280

281

282

283

284

285

286

287

288

289

290

291

292

293

294

295

296

297

298

299

300

301

302

303

304

305

306

307

308

309

310

311

312

313

314

315

316

317

318

319

320

321

322

323

324

325

326

327

328

329

330

331

332

333

334

335

336

337

338

339

340

341

342

343

344

345

346

347

348

349

350

351

352

353

354

355

356

357

358

359

360

361

362

363

364

365

366

# This file is part of Buildbot.  Buildbot is free software: you can 

# redistribute it and/or modify it under the terms of the GNU General Public 

# License as published by the Free Software Foundation, version 2. 

# 

# This program is distributed in the hope that it will be useful, but WITHOUT 

# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS 

# FOR A PARTICULAR PURPOSE.  See the GNU General Public License for more 

# details. 

# 

# You should have received a copy of the GNU General Public License along with 

# this program; if not, write to the Free Software Foundation, Inc., 51 

# Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. 

# 

# Copyright Buildbot Team Members 

 

from __future__ import with_statement 

 

 

# Based on the work of Dave Peticolas for the P4poll 

# Changed to svn (using xml.dom.minidom) by Niklaus Giger 

# Hacked beyond recognition by Brian Warner 

 

from twisted.python import log 

from twisted.internet import defer, utils 

 

from buildbot import util 

from buildbot.changes import base 

 

import xml.dom.minidom 

import os, urllib 

 

# these split_file_* functions are available for use as values to the 

# split_file= argument. 

def split_file_alwaystrunk(path): 

    return (None, path) 

 

def split_file_branches(path): 

    # turn trunk/subdir/file.c into (None, "subdir/file.c") 

    # and branches/1.5.x/subdir/file.c into ("branches/1.5.x", "subdir/file.c") 

    pieces = path.split('/') 

    if pieces[0] == 'trunk': 

        return (None, '/'.join(pieces[1:])) 

    elif pieces[0] == 'branches': 

        return ('/'.join(pieces[0:2]), '/'.join(pieces[2:])) 

    else: 

        return None 

 

 

class SVNPoller(base.PollingChangeSource, util.ComparableMixin): 

    """ 

    Poll a Subversion repository for changes and submit them to the change 

    master. 

    """ 

 

    compare_attrs = ["svnurl", "split_file", 

                     "svnuser", "svnpasswd", "project", 

                     "pollInterval", "histmax", 

                     "svnbin", "category", "cachepath"] 

 

    parent = None # filled in when we're added 

    last_change = None 

    loop = None 

 

    def __init__(self, svnurl, split_file=None, 

                 svnuser=None, svnpasswd=None, 

                 pollInterval=10*60, histmax=100, 

                 svnbin='svn', revlinktmpl='', category=None, 

                 project='', cachepath=None, pollinterval=-2, 

                 extra_args=None): 

        # for backward compatibility; the parameter used to be spelled with 'i' 

        if pollinterval != -2: 

            pollInterval = pollinterval 

 

        if svnurl.endswith("/"): 

            svnurl = svnurl[:-1] # strip the trailing slash 

        self.svnurl = svnurl 

        self.extra_args = extra_args 

        self.split_file = split_file or split_file_alwaystrunk 

        self.svnuser = svnuser 

        self.svnpasswd = svnpasswd 

 

        self.revlinktmpl = revlinktmpl 

 

        self.environ = os.environ.copy() # include environment variables 

                                         # required for ssh-agent auth 

 

        self.svnbin = svnbin 

        self.pollInterval = pollInterval 

        self.histmax = histmax 

        self._prefix = None 

        self.category = category 

        self.project = project 

 

        self.cachepath = cachepath 

        if self.cachepath and os.path.exists(self.cachepath): 

            try: 

                with open(self.cachepath, "r") as f: 

                    self.last_change = int(f.read().strip()) 

                    log.msg("SVNPoller: SVNPoller(%s) setting last_change to %s" % (self.svnurl, self.last_change)) 

                # try writing it, too 

                with open(self.cachepath, "w") as f: 

                    f.write(str(self.last_change)) 

            except: 

                self.cachepath = None 

                log.msg(("SVNPoller: SVNPoller(%s) cache file corrupt or unwriteable; " + 

                        "skipping and not using") % self.svnurl) 

                log.err() 

 

    def describe(self): 

        return "SVNPoller: watching %s" % self.svnurl 

 

    def poll(self): 

        # Our return value is only used for unit testing. 

 

        # we need to figure out the repository root, so we can figure out 

        # repository-relative pathnames later. Each SVNURL is in the form 

        # (ROOT)/(PROJECT)/(BRANCH)/(FILEPATH), where (ROOT) is something 

        # like svn://svn.twistedmatrix.com/svn/Twisted (i.e. there is a 

        # physical repository at /svn/Twisted on that host), (PROJECT) is 

        # something like Projects/Twisted (i.e. within the repository's 

        # internal namespace, everything under Projects/Twisted/ has 

        # something to do with Twisted, but these directory names do not 

        # actually appear on the repository host), (BRANCH) is something like 

        # "trunk" or "branches/2.0.x", and (FILEPATH) is a tree-relative 

        # filename like "twisted/internet/defer.py". 

 

        # our self.svnurl attribute contains (ROOT)/(PROJECT) combined 

        # together in a way that we can't separate without svn's help. If the 

        # user is not using the split_file= argument, then self.svnurl might 

        # be (ROOT)/(PROJECT)/(BRANCH) . In any case, the filenames we will 

        # get back from 'svn log' will be of the form 

        # (PROJECT)/(BRANCH)/(FILEPATH), but we want to be able to remove 

        # that (PROJECT) prefix from them. To do this without requiring the 

        # user to tell us how svnurl is split into ROOT and PROJECT, we do an 

        # 'svn info --xml' command at startup. This command will include a 

        # <root> element that tells us ROOT. We then strip this prefix from 

        # self.svnurl to determine PROJECT, and then later we strip the 

        # PROJECT prefix from the filenames reported by 'svn log --xml' to 

        # get a (BRANCH)/(FILEPATH) that can be passed to split_file() to 

        # turn into separate BRANCH and FILEPATH values. 

 

        # whew. 

 

        if self.project: 

            log.msg("SVNPoller: polling " + self.project) 

        else: 

            log.msg("SVNPoller: polling") 

 

        d = defer.succeed(None) 

        if not self._prefix: 

            d.addCallback(lambda _ : self.get_prefix()) 

            def set_prefix(prefix): 

                self._prefix = prefix 

            d.addCallback(set_prefix) 

 

        d.addCallback(self.get_logs) 

        d.addCallback(self.parse_logs) 

        d.addCallback(self.get_new_logentries) 

        d.addCallback(self.create_changes) 

        d.addCallback(self.submit_changes) 

        d.addCallback(self.finished_ok) 

        d.addErrback(log.err, 'SVNPoller: Error in  while polling') # eat errors 

        return d 

 

    def getProcessOutput(self, args): 

        # this exists so we can override it during the unit tests 

        d = utils.getProcessOutput(self.svnbin, args, self.environ) 

        return d 

 

    def get_prefix(self): 

        args = ["info", "--xml", "--non-interactive", self.svnurl] 

        if self.svnuser: 

            args.extend(["--username=%s" % self.svnuser]) 

        if self.svnpasswd: 

            args.extend(["--password=%s" % self.svnpasswd]) 

        if self.extra_args: 

            args.extend(self.extra_args) 

        d = self.getProcessOutput(args) 

        def determine_prefix(output): 

            try: 

                doc = xml.dom.minidom.parseString(output) 

            except xml.parsers.expat.ExpatError: 

                log.msg("SVNPoller: SVNPoller._determine_prefix_2: ExpatError in '%s'" 

                        % output) 

                raise 

            rootnodes = doc.getElementsByTagName("root") 

            if not rootnodes: 

                # this happens if the URL we gave was already the root. In this 

                # case, our prefix is empty. 

                self._prefix = "" 

                return self._prefix 

            rootnode = rootnodes[0] 

            root = "".join([c.data for c in rootnode.childNodes]) 

            # root will be a unicode string 

            assert self.svnurl.startswith(root), \ 

                    ("svnurl='%s' doesn't start with <root>='%s'" % 

                    (self.svnurl, root)) 

            prefix = self.svnurl[len(root):] 

            if prefix.startswith("/"): 

                prefix = prefix[1:] 

            log.msg("SVNPoller: svnurl=%s, root=%s, so prefix=%s" % 

                    (self.svnurl, root, prefix)) 

            return prefix 

        d.addCallback(determine_prefix) 

        return d 

 

    def get_logs(self, _): 

        args = [] 

        args.extend(["log", "--xml", "--verbose", "--non-interactive"]) 

        if self.svnuser: 

            args.extend(["--username=%s" % self.svnuser]) 

        if self.svnpasswd: 

            args.extend(["--password=%s" % self.svnpasswd]) 

        if self.extra_args: 

            args.extend(self.extra_args) 

        args.extend(["--limit=%d" % (self.histmax), self.svnurl]) 

        d = self.getProcessOutput(args) 

        return d 

 

    def parse_logs(self, output): 

        # parse the XML output, return a list of <logentry> nodes 

        try: 

            doc = xml.dom.minidom.parseString(output) 

        except xml.parsers.expat.ExpatError: 

            log.msg("SVNPoller: SVNPoller.parse_logs: ExpatError in '%s'" % output) 

            raise 

        logentries = doc.getElementsByTagName("logentry") 

        return logentries 

 

 

    def get_new_logentries(self, logentries): 

        last_change = old_last_change = self.last_change 

 

        # given a list of logentries, calculate new_last_change, and 

        # new_logentries, where new_logentries contains only the ones after 

        # last_change 

 

        new_last_change = None 

        new_logentries = [] 

        if logentries: 

            new_last_change = int(logentries[0].getAttribute("revision")) 

 

            if last_change is None: 

                # if this is the first time we've been run, ignore any changes 

                # that occurred before now. This prevents a build at every 

                # startup. 

                log.msg('SVNPoller: starting at change %s' % new_last_change) 

            elif last_change == new_last_change: 

                # an unmodified repository will hit this case 

                log.msg('SVNPoller: no changes') 

            else: 

                for el in logentries: 

                    if last_change == int(el.getAttribute("revision")): 

                        break 

                    new_logentries.append(el) 

                new_logentries.reverse() # return oldest first 

 

        self.last_change = new_last_change 

        log.msg('SVNPoller: _process_changes %s .. %s' % 

                (old_last_change, new_last_change)) 

        return new_logentries 

 

 

    def _get_text(self, element, tag_name): 

        try: 

            child_nodes = element.getElementsByTagName(tag_name)[0].childNodes 

            text = "".join([t.data for t in child_nodes]) 

        except: 

            text = "<unknown>" 

        return text 

 

    def _transform_path(self, path): 

        assert path.startswith(self._prefix), \ 

                ("filepath '%s' should start with prefix '%s'" % 

                (path, self._prefix)) 

        relative_path = path[len(self._prefix):] 

        if relative_path.startswith("/"): 

            relative_path = relative_path[1:] 

        where = self.split_file(relative_path) 

        # 'where' is either None or (branch, final_path) 

        return where 

 

    def create_changes(self, new_logentries): 

        changes = [] 

 

        for el in new_logentries: 

            revision = str(el.getAttribute("revision")) 

 

            revlink='' 

 

            if self.revlinktmpl: 

                if revision: 

                    revlink = self.revlinktmpl % urllib.quote_plus(revision) 

 

            log.msg("Adding change revision %s" % (revision,)) 

            author   = self._get_text(el, "author") 

            comments = self._get_text(el, "msg") 

            # there is a "date" field, but it provides localtime in the 

            # repository's timezone, whereas we care about buildmaster's 

            # localtime (since this will get used to position the boxes on 

            # the Waterfall display, etc). So ignore the date field, and 

            # addChange will fill in with the current time 

            branches = {} 

            try: 

                pathlist = el.getElementsByTagName("paths")[0] 

            except IndexError: # weird, we got an empty revision 

                log.msg("ignoring commit with no paths") 

                continue 

 

            for p in pathlist.getElementsByTagName("path"): 

                action = p.getAttribute("action") 

                path = "".join([t.data for t in p.childNodes]) 

                # the rest of buildbot is certaily not yet ready to handle 

                # unicode filenames, because they get put in RemoteCommands 

                # which get sent via PB to the buildslave, and PB doesn't 

                # handle unicode. 

                path = path.encode("ascii") 

                if path.startswith("/"): 

                    path = path[1:] 

                where = self._transform_path(path) 

 

                # if 'where' is None, the file was outside any project that 

                # we care about and we should ignore it 

                if where: 

                    branch, filename = where 

                    if not branch in branches: 

                        branches[branch] = { 'files': []} 

                    branches[branch]['files'].append(filename) 

 

                    if not branches[branch].has_key('action'): 

                        branches[branch]['action'] = action 

 

            for branch in branches.keys(): 

                action = branches[branch]['action'] 

                files  = branches[branch]['files'] 

                number_of_files_changed = len(files) 

 

                if action == u'D' and number_of_files_changed == 1 and files[0] == '': 

                    log.msg("Ignoring deletion of branch '%s'" % branch) 

                else: 

                    chdict = dict( 

                            author=author, 

                            files=files, 

                            comments=comments, 

                            revision=revision, 

                            branch=branch, 

                            revlink=revlink, 

                            category=self.category, 

                            repository=self.svnurl, 

                            project = self.project) 

                    changes.append(chdict) 

 

        return changes 

 

    @defer.inlineCallbacks 

    def submit_changes(self, changes): 

        for chdict in changes: 

            yield self.master.addChange(src='svn', **chdict) 

 

    def finished_ok(self, res): 

        if self.cachepath: 

            with open(self.cachepath, "w") as f: 

                f.write(str(self.last_change)) 

 

        log.msg("SVNPoller: finished polling %s" % res) 

        return res