apibuild.py 98.8 KB
Newer Older
1
#!/usr/bin/env python
2 3 4 5 6 7 8 9
#
# This is the API builder: it parses the C sources and builds the
# formal API description in XML.
#
# See Copyright for the status of this software.
#
# daniel@veillard.com
#
10 11 12

from __future__ import print_function

13 14
import os
import sys
15
import glob
16
import re
17

18 19 20 21
# When true, the "if not quiet" guards in this file suppress their
# informational and debug output.
quiet = True
# Running count of warnings; incremented by the warning() methods below.
warnings = 0
# NOTE(review): not referenced in the visible part of the file; presumably a
# general debug switch - confirm against the rest of the script.
debug = False
# Name of a symbol to trace: identifier/index print extra "=> define",
# "=> update", "New ref" and "New symbol" lines for it when quiet is false.
debugsym = None
22 23 24 25

#
# C parser analysis code
#
26
# Source files handled for the main libvirt API, mapped to a one-line
# description of each file.
included_files = {
    # public headers
    "libvirt-common.h": "header with general libvirt API definitions",
    "libvirt-domain.h": "header with general libvirt API definitions",
    "libvirt-domain-snapshot.h": "header with general libvirt API definitions",
    "libvirt-event.h": "header with general libvirt API definitions",
    "libvirt-host.h": "header with general libvirt API definitions",
    "libvirt-interface.h": "header with general libvirt API definitions",
    "libvirt-network.h": "header with general libvirt API definitions",
    "libvirt-nodedev.h": "header with general libvirt API definitions",
    "libvirt-nwfilter.h": "header with general libvirt API definitions",
    "libvirt-secret.h": "header with general libvirt API definitions",
    "libvirt-storage.h": "header with general libvirt API definitions",
    "libvirt-stream.h": "header with general libvirt API definitions",
    "virterror.h": "header with error specific API definitions",
    # implementation files
    "libvirt.c": "Main interfaces for the libvirt library",
    "libvirt-domain.c": "Domain interfaces for the libvirt library",
    "libvirt-domain-snapshot.c": "Domain snapshot interfaces for the libvirt library",
    "libvirt-host.c": "Host interfaces for the libvirt library",
    "libvirt-interface.c": "Interface interfaces for the libvirt library",
    "libvirt-network.c": "Network interfaces for the libvirt library",
    "libvirt-nodedev.c": "Node device interfaces for the libvirt library",
    "libvirt-nwfilter.c": "NWFilter interfaces for the libvirt library",
    "libvirt-secret.c": "Secret interfaces for the libvirt library",
    "libvirt-storage.c": "Storage interfaces for the libvirt library",
    "libvirt-stream.c": "Stream interfaces for the libvirt library",
    "virerror.c": "implements error handling and reporting code for libvirt",
    "virevent.c": "event loop for monitoring file handles",
    "virtypedparam.c": "virTypedParameters APIs",
}

56 57 58 59 60
# Files handled for the QEMU-specific API, mapped to their description.
qemu_included_files = {
    "libvirt-qemu.h": "header with QEMU specific API definitions",
    "libvirt-qemu.c": "Implementations for the QEMU specific APIs",
}

# Files handled for the LXC-specific API, mapped to their description.
lxc_included_files = {
    "libvirt-lxc.h": "header with LXC specific API definitions",
    "libvirt-lxc.c": "Implementations for the LXC specific APIs",
}

# Files handled for the admin API, mapped to their description.
admin_included_files = {
    "libvirt-admin.h": "header with admin specific API definitions",
    "libvirt-admin.c": "Implementations for the admin specific APIs",
}

71 72
# Words to ignore in the C sources, mapped to a (count, description) pair.
# NOTE(review): the integer is presumably the number of following tokens to
# skip along with the word - confirm against the parser code that reads it.
ignored_words = {
    # macro keywords
    "ATTRIBUTE_UNUSED": (0, "macro keyword"),
    "ATTRIBUTE_SENTINEL": (0, "macro keyword"),
    "VIR_DEPRECATED": (0, "macro keyword"),
    "VIR_EXPORT_VAR": (0, "macro keyword"),
    # Windows keywords
    "WINAPI": (0, "Windows keyword"),
    "__declspec": (3, "Windows keyword"),
    "__stdcall": (0, "Windows keyword"),
}

D
Daniel Veillard 已提交
81
# Functions that are not part of the public API, mapped to the reason why
# each one is ignored.
ignored_functions = {
    "virConnectSupportsFeature": "private function for remote access",
    # migration protocol, v1/v2
    "virDomainMigrateFinish": "private function for migration",
    "virDomainMigrateFinish2": "private function for migration",
    "virDomainMigratePerform": "private function for migration",
    "virDomainMigratePrepare": "private function for migration",
    "virDomainMigratePrepare2": "private function for migration",
    "virDomainMigratePrepareTunnel": "private function for tunnelled migration",
    # migration protocol, v3
    "virDomainMigrateBegin3": "private function for migration",
    "virDomainMigrateFinish3": "private function for migration",
    "virDomainMigratePerform3": "private function for migration",
    "virDomainMigratePrepare3": "private function for migration",
    "virDomainMigrateConfirm3": "private function for migration",
    "virDomainMigratePrepareTunnel3": "private function for tunnelled migration",
    "DllMain": "specific function for Win32",
    # typed parameter helpers
    "virTypedParamsValidate": "internal function in virtypedparam.c",
    "virTypedParameterValidateSet": "internal function in virtypedparam.c",
    "virTypedParameterAssign": "internal function in virtypedparam.c",
    "virTypedParameterAssignFromStr": "internal function in virtypedparam.c",
    "virTypedParameterToString": "internal function in virtypedparam.c",
    "virTypedParamsCheck": "internal function in virtypedparam.c",
    "virTypedParamsCopy": "internal function in virtypedparam.c",
    # migration protocol, v3 with typed parameters
    "virDomainMigrateBegin3Params": "private function for migration",
    "virDomainMigrateFinish3Params": "private function for migration",
    "virDomainMigratePerform3Params": "private function for migration",
    "virDomainMigratePrepare3Params": "private function for migration",
    "virDomainMigrateConfirm3Params": "private function for migration",
    "virDomainMigratePrepareTunnel3Params": "private function for tunnelled migration",
    "virErrorCopyNew": "private",
}

112 113 114 115 116 117
# Macros for which parseMacroComment() stays quiet about comment problems.
ignored_macros = {
    "_virSchedParameter": "backward compatibility macro for virTypedParameter",
    "_virBlkioParameter": "backward compatibility macro for virTypedParameter",
    "_virMemoryParameter": "backward compatibility macro for virTypedParameter",
}

# Macros that should be completely skipped.
hidden_macros = {
    "VIR_DEPRECATED": "internal macro to mark deprecated apis",
    "VIR_EXPORT_VAR": "internal macro to mark exported vars",
}

124
def escape(raw):
    """Return raw with the five XML special characters replaced by entities.

    '&', '<', '>', "'" and '"' become '&amp;', '&lt;', '&gt;', '&apos;' and
    '&quot;' respectively.
    """
    # '&' has to be handled first, otherwise the ampersands introduced by
    # the other replacements would be escaped a second time.
    raw = raw.replace('&', '&amp;')
    raw = raw.replace('<', '&lt;')
    raw = raw.replace('>', '&gt;')
    raw = raw.replace("'", '&apos;')
    raw = raw.replace('"', '&quot;')
    return raw

def uniq(items):
    """Return the distinct elements of items as a sorted list."""
    distinct = list(set(items))
    distinct.sort()
    return distinct
134 135

class identifier:
    """Record describing one named symbol found while parsing.

    Attributes:
        name: the symbol name.
        header: the header the symbol was declared in, or None.
        module: the module (source file) the symbol belongs to, or None.
        type: kind of symbol as a string (e.g. "function", "macro").
        lineno: line number recorded when the symbol was registered.
        info, extra: additional data attached by the parser.
        static: 1 when the symbol was flagged static, 0 otherwise.
        conditionals: private copy of the list of preprocessor conditions
            in effect for the symbol, or None when there are none.
    """

    def __init__(self, name, header=None, module=None, type=None, lineno=0,
                 info=None, extra=None, conditionals=None):
        self.name = name
        self.header = header
        self.module = module
        self.type = type
        self.info = info
        self.extra = extra
        self.lineno = lineno
        self.static = 0
        self.set_conditionals(conditionals)
        if self.name == debugsym and not quiet:
            print("=> define %s : %s" % (debugsym, (module, type, info,
                                         extra, conditionals)))

    def __repr__(self):
        r = "%s %s:" % (self.type, self.name)
        if self.static:
            r = r + " static"
        if self.module is not None:
            r = r + " from %s" % (self.module)
        if self.info is not None:
            r = r + " " + repr(self.info)
        if self.extra is not None:
            r = r + " " + repr(self.extra)
        if self.conditionals is not None:
            r = r + " " + repr(self.conditionals)
        return r

    def set_header(self, header):
        self.header = header

    def set_module(self, module):
        self.module = module

    def set_type(self, type):
        self.type = type

    def set_info(self, info):
        self.info = info

    def set_extra(self, extra):
        self.extra = extra

    def set_lineno(self, lineno):
        self.lineno = lineno

    def set_static(self, static):
        self.static = static

    def set_conditionals(self, conditionals):
        """Store a copy of conditionals; None or an empty list is stored as None."""
        if conditionals is None or len(conditionals) == 0:
            self.conditionals = None
        else:
            # copy, so later changes to the caller's list do not leak in
            self.conditionals = conditionals[:]

    def get_name(self):
        return self.name

    def get_header(self):
        # Fixed: this used to return self.module.
        return self.header

    def get_module(self):
        return self.module

    def get_type(self):
        return self.type

    def get_info(self):
        return self.info

    def get_lineno(self):
        return self.lineno

    def get_extra(self):
        return self.extra

    def get_static(self):
        return self.static

    def get_conditionals(self):
        return self.conditionals

    def update(self, header, module, type=None, info=None, extra=None,
               conditionals=None):
        """Merge new information into this identifier.

        header and type only fill in values that are still None. module is
        set when none is recorded yet or when the recorded module equals the
        header. info, extra and conditionals overwrite the current value
        whenever a non-None value is passed.
        """
        if self.name == debugsym and not quiet:
            print("=> update %s : %s" % (debugsym, (module, type, info,
                                         extra, conditionals)))
        if header is not None and self.header is None:
            # Fixed: this used to store `module` as the header.
            self.set_header(header)
        if module is not None and (self.module is None or self.header == self.module):
            self.set_module(module)
        if type is not None and self.type is None:
            self.set_type(type)
        if info is not None:
            self.set_info(info)
        if extra is not None:
            self.set_extra(extra)
        if conditionals is not None:
            self.set_conditionals(conditionals)
225 226

class index:
    """Collection of the identifiers found in one or several source files.

    Every symbol is stored in self.identifiers and, depending on its type,
    in one of the per-kind tables (functions, variables, includes, structs,
    unions, enums, typedefs, macros). References registered with add_ref()
    go to self.references. self.info holds the fields parsed from the top
    comment of a file.
    """

    def __init__(self, name="noname"):
        self.name = name
        self.identifiers = {}
        self.functions = {}
        self.variables = {}
        self.includes = {}
        self.structs = {}
        self.unions = {}
        self.enums = {}
        self.typedefs = {}
        self.macros = {}
        self.references = {}
        self.info = {}

    def warning(self, msg):
        """Print msg and bump the module-level warning counter."""
        global warnings
        warnings = warnings + 1
        print(msg)

    def _register(self, name, header, module, static, type, lineno,
                  info, extra, conditionals):
        """Create the identifier for name and store it in self.identifiers.

        Returns None for names starting with '__', the new identifier
        otherwise.
        """
        if name[0:2] == '__':
            return None
        # NOTE(review): the previous code tried to update() an already known
        # identifier first, but passed one argument too many (lineno); the
        # resulting TypeError was swallowed by a bare "except:", so a fresh
        # identifier always replaced the old one. That effective behaviour
        # is kept here on purpose - switching to a real in-place update
        # would change which type/lineno/static values survive.
        d = identifier(name, header, module, type, lineno, info, extra,
                       conditionals)
        self.identifiers[name] = d
        if static == 1:
            d.set_static(1)
        return d

    def add_ref(self, name, header, module, static, type, lineno, info=None, extra=None, conditionals=None):
        """Register a reference to name; returns the identifier or None."""
        d = self._register(name, header, module, static, type, lineno,
                           info, extra, conditionals)
        if d is None:
            return None

        if type is not None:
            self.references[name] = d

        if name == debugsym and not quiet:
            print("New ref: %s" % (d))

        return d

    def add(self, name, header, module, static, type, lineno, info=None, extra=None, conditionals=None):
        """Register the definition of name in the table matching type.

        Returns the identifier, or None for names starting with '__'. An
        unknown type is reported through warning().
        """
        d = self._register(name, header, module, static, type, lineno,
                           info, extra, conditionals)
        if d is None:
            return None

        if type is not None:
            tables = {
                "function": self.functions,
                "functype": self.functions,
                "variable": self.variables,
                "include": self.includes,
                "struct": self.structs,
                "union": self.unions,
                "enum": self.enums,
                "typedef": self.typedefs,
                "macro": self.macros,
            }
            table = tables.get(type)
            if table is not None:
                table[name] = d
            else:
                # Fixed: warning() takes a single message argument; the old
                # two-argument call raised TypeError instead of warning.
                self.warning("Unable to register type %s" % type)

        if name == debugsym and not quiet:
            print("New symbol: %s" % (d))

        return d

    def _merge_table(self, kind, mine, theirs, overrides_macro=False):
        """Copy the entries of theirs into mine and self.identifiers.

        An entry already present in mine is kept and reported as redeclared.
        With overrides_macro set, a macro of the same name is dropped first.
        """
        for name in theirs.keys():
            if overrides_macro and name in self.macros:
                del self.macros[name]
            if name in mine:
                self.warning("%s %s from %s redeclared in %s" % (
                    kind, name, mine[name].header, theirs[name].header))
            else:
                mine[name] = theirs[name]
                self.identifiers[name] = theirs[name]

    def merge(self, idx):
        """Merge the symbols of idx into this index.

        The order of the steps matters: macros are merged after functions
        and variables but before enums.
        """
        # macro might be used to override functions or variables definitions
        self._merge_table("function", self.functions, idx.functions, True)
        self._merge_table("variable", self.variables, idx.variables, True)
        self._merge_table("struct", self.structs, idx.structs)
        # Fixed: a redeclared union used to be print()ed only, unlike every
        # other table; it now goes through warning() and is counted.
        self._merge_table("union", self.unions, idx.unions)
        self._merge_table("typedef", self.typedefs, idx.typedefs)
        for name in idx.macros.keys():
            # a macro overriding a known variable, function or enum is
            # silently dropped
            if name in self.variables:
                continue
            if name in self.functions:
                continue
            if name in self.enums:
                continue
            if name in self.macros:
                self.warning("macro %s from %s redeclared in %s" % (
                    name, self.macros[name].header, idx.macros[name].header))
            else:
                self.macros[name] = idx.macros[name]
                self.identifiers[name] = idx.macros[name]
        self._merge_table("enum", self.enums, idx.enums)

    def merge_public(self, idx):
        """Update the functions already known here with the data from idx.

        Functions of idx that are not known to this index are ignored.
        """
        for name in idx.functions.keys():
            if name not in self.functions:
                continue
            up = idx.functions[name]
            mine = self.functions[name]
            # check that function condition agrees with header
            if up.conditionals != mine.conditionals:
                self.warning("Header condition differs from Function for %s:"
                             % name)
                self.warning("  H: %s" % mine.conditionals)
                self.warning("  C: %s" % up.conditionals)
            mine.update(None, up.module, up.type, up.info, up.extra)
        # TODO: do the same for variables.

    def analyze_dict(self, type, dict):
        """Print how many entries of dict there are and how many are public."""
        count = 0
        public = 0
        for name in dict.keys():
            count = count + 1
            if dict[name].static == 0:
                public = public + 1
        if count != public:
            print("  %d %s , %d public" % (count, type, public))
        elif count != 0:
            print("  %d public %s" % (count, type))

    def analyze(self):
        """Print per-table statistics unless quiet is set."""
        if not quiet:
            self.analyze_dict("functions", self.functions)
            self.analyze_dict("variables", self.variables)
            self.analyze_dict("structs", self.structs)
            self.analyze_dict("unions", self.unions)
            self.analyze_dict("typedefs", self.typedefs)
            self.analyze_dict("macros", self.macros)
420

421 422 423 424 425
class CLexer:
    """A lexer for the C language, tokenize the input by reading and
       analyzing it line by line.

       Tokens are (kind, text) tuples where kind is one of 'preproc',
       'string', 'comment', 'name', 'sep' or 'op'. token() returns None
       once the input is exhausted."""

    def __init__(self, input):
        self.input = input
        self.tokens = []      # tokens already split off but not yet returned
        self.line = ""        # unprocessed remainder of the current line
        self.lineno = 0
        # Fixed: initialised here so debug() also works before the first
        # token has been returned.
        self.last = None

    def getline(self):
        """Return the next non-blank line, stripped, or None at end of input.

        Lines ending in a backslash are joined with the following line(s).
        """
        line = ''
        while line == '':
            line = self.input.readline()
            if not line:
                return None
            self.lineno = self.lineno + 1
            line = line.lstrip()
            line = line.rstrip()
            if line == '':
                continue
            while line[-1] == '\\':
                line = line[:-1]
                n = self.input.readline()
                self.lineno = self.lineno + 1
                n = n.lstrip()
                n = n.rstrip()
                if not n:
                    break
                else:
                    line = line + n
        return line

    def getlineno(self):
        return self.lineno

    def push(self, token):
        """Put token back so that it is the next one returned by token()."""
        self.tokens.insert(0, token)

    def debug(self):
        print("Last token: ", self.last)
        print("Token queue: ", self.tokens)
        print("Line %d end: " % (self.lineno), self.line)

    def token(self):
        """Return the next token, or None when the input is exhausted."""
        while self.tokens == []:
            if self.line == "":
                line = self.getline()
            else:
                line = self.line
                self.line = ""
            if line is None:
                return None

            if line[0] == '#':
                # a preprocessor line: every whitespace separated word
                # becomes one 'preproc' token
                self.tokens = list(map((lambda x: ('preproc', x)),
                                       line.split()))

                # We might have whitespace between the '#' and preproc
                # macro name, so instead of having a single token element
                # of '#define' we might end up with '#' and 'define'. This
                # merges them back together
                # Fixed: a line holding only '#' has nothing to merge with
                # and used to raise IndexError.
                if self.tokens[0][1] == "#" and len(self.tokens) > 1:
                    self.tokens[0] = ('preproc', self.tokens[0][1] + self.tokens[1][1])
                    self.tokens = self.tokens[:1] + self.tokens[2:]
                break
            l = len(line)
            if line[0] == '"' or line[0] == "'":
                # string or character literal, possibly spanning lines
                end = line[0]
                line = line[1:]
                found = 0
                tok = ""
                while found == 0:
                    i = 0
                    l = len(line)
                    while i < l:
                        if line[i] == end:
                            self.line = line[i+1:]
                            line = line[:i]
                            l = i
                            found = 1
                            break
                        if line[i] == '\\':
                            # skip the escaped character
                            i = i + 1
                        i = i + 1
                    tok = tok + line
                    if found == 0:
                        line = self.getline()
                        if line is None:
                            return None
                self.last = ('string', tok)
                return self.last

            if line.startswith("/*"):
                # block comment, lines are joined with '\n'
                line = line[2:]
                found = 0
                tok = ""
                while found == 0:
                    i = 0
                    l = len(line)
                    while i < l:
                        if line[i] == '*' and i+1 < l and line[i+1] == '/':
                            self.line = line[i+2:]
                            # also drops the character just before '*/'
                            # NOTE(review): for i == 0 this is line[:-1];
                            # kept as-is since the comment parsers may
                            # depend on the resulting text.
                            line = line[:i-1]
                            l = i
                            found = 1
                            break
                        i = i + 1
                    if tok != "":
                        tok = tok + "\n"
                    tok = tok + line
                    if found == 0:
                        line = self.getline()
                        if line is None:
                            return None
                self.last = ('comment', tok)
                return self.last
            if line.startswith("//"):
                line = line[2:]
                self.last = ('comment', line)
                return self.last
            # plain code: cut the line at the first comment or literal and
            # keep the rest for the next round
            i = 0
            while i < l:
                if line[i] == '/' and i+1 < l and line[i+1] == '/':
                    self.line = line[i:]
                    line = line[:i]
                    break
                if line[i] == '/' and i+1 < l and line[i+1] == '*':
                    self.line = line[i:]
                    line = line[:i]
                    break
                if line[i] == '"' or line[i] == "'":
                    self.line = line[i:]
                    line = line[:i]
                    break
                i = i + 1
            l = len(line)
            i = 0
            while i < l:
                if line[i] == ' ' or line[i] == '\t':
                    i = i + 1
                    continue
                if line[i].isalnum():
                    s = i
                    while i < l:
                        if line[i] not in " \t(){}:;,+-*/%&!|[]=><":
                            i = i + 1
                        else:
                            break
                    self.tokens.append(('name', line[s:i]))
                    continue
                if line[i] in "(){}:;,[]":
                    self.tokens.append(('sep', line[i]))
                    i = i + 1
                    continue
                if line[i] in "+-*><=/%&!|.":
                    if line[i] == '.' and i + 2 < l and \
                       line[i+1] == '.' and line[i+2] == '.':
                        self.tokens.append(('name', '...'))
                        i = i + 3
                        continue

                    # an operator is one or two operator characters long
                    j = i + 1
                    if j < l and line[j] in "+-*><=/%&!|":
                        self.tokens.append(('op', line[i:j+1]))
                        i = j + 1
                    else:
                        self.tokens.append(('op', line[i]))
                        i = i + 1
                    continue
                # anything else (e.g. a leading '_') starts a name
                s = i
                while i < l:
                    if line[i] not in " \t(){}:;,+-*/%&!|[]=><":
                        i = i + 1
                    else:
                        break
                self.tokens.append(('name', line[s:i]))

        tok = self.tokens[0]
        self.tokens = self.tokens[1:]
        self.last = tok
        return tok
625

626 627
class CParser:
    """The C module parser"""
628
    def __init__(self, filename, idx=None):
        """Open filename and prepare a lexer and the parser state for it.

        idx is the index to fill; a new one is created when it is None.
        The opened file is handed to the lexer and stays open afterwards;
        nothing in this method closes it.
        """
        self.filename = filename
        # a header is any name longer than two characters ending in '.h'
        looks_like_header = len(filename) > 2 and filename[-2:] == '.h'
        self.is_header = 1 if looks_like_header else 0
        self.input = open(filename)
        self.lexer = CLexer(self.input)
        self.index = index() if idx is None else idx
        self.top_comment = ""
        self.last_comment = ""
        self.comment = None
        self.collect_ref = 0
        self.no_error = 0
        self.conditionals = []
        self.defines = []
647 648 649 650 651 652 653 654 655 656 657 658 659

    def collect_references(self):
        self.collect_ref = 1

    def stop_error(self):
        self.no_error = 1

    def start_error(self):
        self.no_error = 0

    def lineno(self):
        return self.lexer.getlineno()

660
    def index_add(self, name, module, static, type, info=None, extra=None):
661 662 663 664 665 666
        if self.is_header == 1:
            self.index.add(name, module, module, static, type, self.lineno(),
                           info, extra, self.conditionals)
        else:
            self.index.add(name, None, module, static, type, self.lineno(),
                           info, extra, self.conditionals)
667 668

    def index_add_ref(self, name, module, static, type, info=None,
669
                      extra=None):
670 671 672 673 674 675
        if self.is_header == 1:
            self.index.add_ref(name, module, module, static, type,
                               self.lineno(), info, extra, self.conditionals)
        else:
            self.index.add_ref(name, None, module, static, type, self.lineno(),
                               info, extra, self.conditionals)
676 677

    def warning(self, msg):
        """Count a warning; print msg unless reporting is disabled.

        The module-level counter is incremented even while no_error is set.
        """
        global warnings
        warnings += 1
        if not self.no_error:
            print(msg)
683 684 685

    def error(self, msg, token=-1):
        if self.no_error:
686
            return
687

688
        print("Parse Error: " + msg)
689
        if token != -1:
690
            print("Got token ", token)
691 692
        self.lexer.debug()
        sys.exit(1)
693 694

    def debug(self, msg, token=-1):
695
        print("Debug: " + msg)
696
        if token != -1:
697
            print("Got token ", token)
698
        self.lexer.debug()
699 700

    def parseTopComment(self, comment):
701
        res = {}
702
        lines = comment.split("\n")
703 704
        item = None
        for line in lines:
C
Claudio Bley 已提交
705
            line = line.lstrip().lstrip('*').lstrip()
706 707 708 709 710 711 712

            m = re.match('([_.a-zA-Z0-9]+):(.*)', line)
            if m:
                item = m.group(1)
                line = m.group(2).lstrip()

            if item:
A
Andrea Bolognani 已提交
713
                if item in res:
714 715 716 717
                    res[item] = res[item] + " " + line
                else:
                    res[item] = line
        self.index.info = res
718

719 720 721 722 723 724 725 726 727 728 729 730 731
    def strip_lead_star(self, line):
        """Remove the first '*' of line when only blanks precede it.

        The blanks themselves are kept; any other line is returned as is.
        """
        for pos, char in enumerate(line):
            if char == '*':
                return line[:pos] + line[pos + 1:]
            if char != ' ' and char != '\t':
                break
        return line

    def cleanupComment(self):
732
        if not isinstance(self.comment, str):
733 734 735 736 737 738 739 740
            return
        # remove the leading * on multi-line comments
        lines = self.comment.splitlines(True)
        com = ""
        for line in lines:
            com = com + self.strip_lead_star(line)
        self.comment = com.strip()

741
    def parseComment(self, token):
742
        com = token[1]
743
        if self.top_comment == "":
744
            self.top_comment = com
745
        if self.comment is None or com[0] == '*':
746
            self.comment = com
747
        else:
748
            self.comment = self.comment + com
749
        token = self.lexer.token()
750

751
        if self.comment.find("DOC_DISABLE") != -1:
752
            self.stop_error()
753

754
        if self.comment.find("DOC_ENABLE") != -1:
755
            self.start_error()
756

757
        return token
758 759 760 761

    #
    # Parse a comment block associated with a typedef
    #
762
    def parseTypeComment(self, name, quiet=0):
        """Extract the description of type `name` from self.comment.

        The comment is expected to start with '*', optionally followed by a
        lone '*' line, then a '* <name>:' header line and the description.
        Description lines have their leading '*' characters and surrounding
        blanks removed and are joined with single spaces.

        Warnings are suppressed when `quiet` is true or `name` starts with
        '__'.

        Returns the description string on success.
        NOTE: when the comment is missing or misformatted the historical
        return value is the tuple ([], ""); it is kept unchanged here so
        existing callers see the same values.
        """
        if name[0:2] == '__':
            quiet = 1

        args = []
        desc = ""

        if self.comment is None:
            if not quiet:
                self.warning("Missing comment for type %s" % (name))
            return (args, desc)
        # startswith() so that an empty comment does not raise IndexError
        if not self.comment.startswith('*'):
            if not quiet:
                self.warning("Missing * in type comment for %s" % (name))
            return (args, desc)

        lines = self.comment.split('\n')
        if lines[0] == '*':
            del lines[0]
        header = "* %s:" % (name)
        # `lines` may be empty here when the whole comment was just "*"
        if not lines or lines[0] != header:
            if not quiet:
                self.warning("Misformatted type comment for %s" % (name))
                self.warning("  Expecting '%s' got '%s'" %
                             (header, lines[0] if lines else ""))
            return (args, desc)

        # Leading '*'-only lines contribute nothing once the result is
        # stripped, so they need no special handling.
        desc = " ".join(line.lstrip('*').strip() for line in lines[1:])
        desc = desc.strip()

        if quiet == 0:
            if desc == "":
                self.warning("Type comment for %s lacks description of the type" % (name))

        return desc
804 805 806
    #
    # Parse a comment block associated with a macro
    #
807
    def parseMacroComment(self, name, quiet=0):
        """Extract argument and general descriptions of macro `name`.

        self.comment is expected to look like::

            * <name>:
            * @arg: description, possibly continued
            *       on following lines
            *
            * general description

        Warnings are suppressed when `quiet` is true, when `name` starts
        with '__' or when `name` is listed in ignored_macros.

        Returns (args, desc) where args is a list of (argname, description)
        tuples and desc is the general description; both are empty when the
        comment is missing or misformatted.
        """
        if name[0:2] == '__':
            quiet = 1
        if name in ignored_macros:
            quiet = 1

        args = []
        desc = ""

        if self.comment is None:
            if not quiet:
                self.warning("Missing comment for macro %s" % (name))
            return (args, desc)
        # startswith() so that an empty comment does not raise IndexError
        if not self.comment.startswith('*'):
            if not quiet:
                self.warning("Missing * in macro comment for %s" % (name))
            return (args, desc)

        lines = self.comment.split('\n')
        if lines[0] == '*':
            del lines[0]
        header = "* %s:" % (name)
        if not lines or lines[0] != header:
            if not quiet:
                self.warning("Misformatted macro comment for %s" % (name))
                self.warning("  Expecting '%s' got '%s'" %
                             (header, lines[0] if lines else ""))
            return (args, desc)
        del lines[0]
        while lines and lines[0] == '*':
            del lines[0]

        # '* @arg: description' entries
        while lines and lines[0][0:3] == '* @':
            l = lines[0][3:]
            try:
                (arg, desc) = l.split(':', 1)
            except ValueError:
                # no ':' on the line
                if not quiet:
                    self.warning("Misformatted macro comment for %s" % (name))
                    self.warning("  problem with '%s'" % (lines[0]))
                del lines[0]
                continue
            desc = desc.strip()
            arg = arg.strip()
            del lines[0]

            # Continuation lines: anything longer than a bare '*' that does
            # not start a new '@arg'.  The comment may end right after the
            # '@arg' line, hence the emptiness checks.
            l = lines[0].strip() if lines else ""
            while len(l) > 2 and l[0:3] != '* @':
                desc = desc + ' ' + l.lstrip('*').strip()
                del lines[0]
                if not lines:
                    break
                l = lines[0]
            args.append((arg, desc))

        # Whatever remains is the general description
        desc = " ".join(line.lstrip('*').strip() for line in lines)
        desc = desc.strip()

        if quiet == 0:
            if desc == "":
                self.warning("Macro comment for %s lack description of the macro" % (name))

        return (args, desc)
878 879

     #
     # Parse a comment block and merge the information found in the
     # parameter descriptions; finally return a block as complete
     # as possible.
     #
884
    def mergeFunctionComment(self, name, description, quiet=0):
        """Merge the documentation in self.comment into a function description.

        `description` is (ret, args): ret[0] is the return type and args is
        a list of tuples whose first two items are the argument type and
        name.  Entries of `args` matched by an '* @name: text' line are
        replaced in place by (type, name, text).

        The comment layout is a '* <name>:' header, the '@arg' entries, the
        free-form description (indentation after '* ' is preserved so code
        examples keep their shape) and an optional 'Returns ...' paragraph
        that runs to the end of the comment.

        Warnings are suppressed when `quiet` is true, for 'main', for names
        starting with '__' and for names listed in ignored_functions.

        Returns ((return type, return description), args, description).
        """
        if name == 'main':
            quiet = 1
        if name[0:2] == '__':
            quiet = 1
        if name in ignored_functions:
            quiet = 1

        (ret, args) = description
        desc = ""
        retdesc = ""

        if self.comment is None:
            if not quiet:
                self.warning("Missing comment for function %s" % (name))
            return ((ret[0], retdesc), args, desc)
        # startswith() so that an empty comment does not raise IndexError
        if not self.comment.startswith('*'):
            if not quiet:
                self.warning("Missing * in function comment for %s" % (name))
            return ((ret[0], retdesc), args, desc)

        lines = self.comment.split('\n')
        if lines[0] == '*':
            del lines[0]
        header = "* %s:" % (name)
        if not lines or lines[0] != header:
            if not quiet:
                self.warning("Misformatted function comment for %s" % (name))
                self.warning("  Expecting '%s' got '%s'" %
                             (header, lines[0] if lines else ""))
            return ((ret[0], retdesc), args, desc)
        del lines[0]
        while lines and lines[0] == '*':
            del lines[0]

        # '* @arg: description' entries
        nbargs = len(args)
        while lines and lines[0][0:3] == '* @':
            l = lines[0][3:]
            try:
                (arg, desc) = l.split(':', 1)
            except ValueError:
                # no ':' on the line
                if not quiet:
                    self.warning("Misformatted function comment for %s" % (name))
                    self.warning("  problem with '%s'" % (lines[0]))
                del lines[0]
                continue
            desc = desc.strip()
            arg = arg.strip()
            del lines[0]

            # Continuation lines of the argument description; the comment
            # may end right after the '@arg' line.
            l = lines[0].strip() if lines else ""
            while len(l) > 2 and l[0:3] != '* @':
                desc = desc + ' ' + l.lstrip('*').strip()
                del lines[0]
                if not lines:
                    break
                l = lines[0]

            for i in range(nbargs):
                if args[i][1] == arg:
                    args[i] = (args[i][0], arg, desc)
                    break
            else:
                if not quiet:
                    self.warning("Unable to find arg %s from function comment for %s" % (
                       arg, name))

        while lines and lines[0] == '*':
            del lines[0]

        desc_lines = []
        for pos, raw in enumerate(lines):
            # Remove all leading '*', followed by at most one ' ' character
            # since we need to preserve correct indentation of code examples
            text = raw.lstrip('*')
            if len(text) != len(raw) and text.startswith(' '):
                text = text[1:]
            if text.startswith("Returns"):
                # Everything from here to the end describes the return value
                parts = [text.partition(' ')[2].strip()]
                parts.extend(rest.lstrip('*').strip()
                             for rest in lines[pos + 1:])
                retdesc = " ".join(parts)
                break
            desc_lines.append(text)

        retdesc = retdesc.strip()
        desc = "\n".join(desc_lines).strip()

        if quiet == 0:
            #
            # report missing comments
            #
            for arg_info in args[:nbargs]:
                if (arg_info[2] is None and arg_info[0] != "void" and
                        arg_info[1] is not None):
                    self.warning("Function comment for %s lacks description of arg %s" % (name, arg_info[1]))
            if retdesc == "" and ret[0] != "void":
                self.warning("Function comment for %s lacks description of return value" % (name))
            if desc == "":
                self.warning("Function comment for %s lacks description of the function" % (name))

        return ((ret[0], retdesc), args, desc)
1006 1007

    def parsePreproc(self, token):
        """Handle one preprocessor directive and return the following token.

        `token` is the 'preproc' token holding the directive itself.

        * #include: the included name is recorded with index_add().
        * #define: the macro name (text before any '(') is recorded with
          its parsed comment and, when the body is a single quoted string,
          that string's content.  Names in hidden_macros are skipped.
        * #ifdef / #ifndef / #if / #else / #endif: self.defines tracks
          every open conditional while self.conditionals only tracks those
          whose expression contains 'ENABLED'.

        Remaining 'preproc' tokens that do not start a new directive are
        skipped before returning.  Returns None at end of input.
        """
        if debug:
            print("=> preproc ", token, self.lexer.tokens)
        name = token[1]
        if name == "#include":
            token = self.lexer.token()
            if token is None:
                return None
            if token[0] == 'preproc':
                self.index_add(token[1], self.filename, not self.is_header,
                               "include")
                return self.lexer.token()
            return token
        if name == "#define":
            token = self.lexer.token()
            if token is None:
                return None
            if token[0] == 'preproc':
                # TODO macros with arguments
                name = token[1]
                lst = []
                token = self.lexer.token()
                while (token is not None and token[0] == 'preproc' and
                       not token[1].startswith('#')):
                    lst.append(token[1])
                    token = self.lexer.token()
                name = name.split('(')[0]

                # skip hidden macros
                if name in hidden_macros:
                    return token

                strValue = None
                if (len(lst) == 1 and lst[0].startswith('"') and
                        lst[0].endswith('"')):
                    strValue = lst[0][1:-1]
                (args, desc) = self.parseMacroComment(name, not self.is_header)
                self.index_add(name, self.filename, not self.is_header,
                               "macro", (args, desc, strValue))
                return token

        #
        # Processing of conditionals modified by Bill 1/1/05
        #
        # We process conditionals (i.e. tokens from #ifdef, #ifndef,
        # #if, #else and #endif) for headers and mainline code,
        # store the ones from the header in libxml2-api.xml, and later
        # (in the routine merge_public) verify that the two (header and
        # mainline code) agree.
        #
        # There is a small problem with processing the headers. Some of
        # the variables are not concerned with enabling / disabling of
        # library functions (e.g. '__XML_PARSER_H__'), and we don't want
        # them to be included in libxml2-api.xml, or involved in
        # the check between the header and the mainline code.  To
        # accomplish this, we ignore any conditional which doesn't include
        # the string 'ENABLED'
        #
        if name in ("#ifdef", "#ifndef"):
            # A directive without operand leaves nothing pending; still
            # push an entry so the matching #endif pops the right level.
            pending = self.lexer.tokens
            apstr = pending[0][1] if pending else ""
            self.defines.append(apstr)
            if 'ENABLED' in apstr:
                if name == "#ifdef":
                    self.conditionals.append("defined(%s)" % apstr)
                else:
                    self.conditionals.append("!defined(%s)" % apstr)
        elif name == "#if":
            apstr = " ".join(tok[1] for tok in self.lexer.tokens)
            self.defines.append(apstr)
            if 'ENABLED' in apstr:
                self.conditionals.append(apstr)
        elif name == "#else":
            if (self.conditionals and self.defines and
                    'ENABLED' in self.defines[-1]):
                self.conditionals[-1] = "!(%s)" % self.conditionals[-1]
        elif name == "#endif":
            if (self.conditionals and self.defines and
                    'ENABLED' in self.defines[-1]):
                self.conditionals = self.conditionals[:-1]
            self.defines = self.defines[:-1]

        # Skip the rest of the directive's own tokens
        token = self.lexer.token()
        while (token is not None and token[0] == 'preproc' and
               not token[1].startswith('#')):
            token = self.lexer.token()
        return token
1109 1110 1111 1112 1113 1114

     #
     # Token acquisition on top of the lexer; it handles preprocessor
     # directives and comments internally since they are logically not
     # part of the program structure.
     #
1115 1116 1117
    def push(self, tok):
        """Hand `tok` to the underlying lexer's push()."""
        lexer = self.lexer
        lexer.push(tok)

1118 1119 1120 1121
    def token(self):
        """Return the next token relevant to the parser, or None at the end.

        Comment and preprocessor tokens are consumed through parseComment()
        and parsePreproc().  '__const' is reported as 'const'.  After
        '__attribute' everything up to the next ';' is skipped and that ';'
        token (or None) is returned.  A name found in ignored_words is
        dropped together with the number of following tokens given by the
        first item of its ignored_words entry.
        """
        token = self.lexer.token()
        while token is not None:
            kind = token[0]
            if kind == 'comment':
                token = self.parseComment(token)
            elif kind == 'preproc':
                token = self.parsePreproc(token)
            elif kind == "name" and token[1] == "__const":
                return ("name", "const")
            elif kind == "name" and token[1] == "__attribute":
                token = self.lexer.token()
                while token is not None and token[1] != ";":
                    token = self.lexer.token()
                return token
            elif kind == "name" and token[1] in ignored_words:
                # Only the skip count of the entry is needed here
                skip = ignored_words[token[1]][0]
                for _ in range(skip):
                    self.lexer.token()
                token = self.lexer.token()
            else:
                if debug:
                    print("=> ", token)
                return token
        return None
1150 1151 1152 1153 1154

     #
     # Parse a typedef, it records the type and its name.
     #
    def parseTypedef(self, token):
        """Parse the declarators of a typedef and index each declared name.

        parseType() is run first; every following name is then recorded
        with index_add() as a "functype" (when parseType() left a
        signature), a "struct" (when the base type is exactly "struct") or
        a plain "typedef".  Several names separated by ',' are accepted,
        with any 'op' tokens after the comma appended to the type.

        Returns the token following the terminating ';', the offending
        token after a reported error, or None at end of input.
        """
        if token is None:
            return None
        token = self.parseType(token)
        if token is None:
            self.error("parsing typedef")
            return None
        base_type = self.type
        cur_type = base_type
        while token is not None:
            if token[0] != "name":
                self.error("parsing typedef: expecting a name")
                return token

            name = token[1]
            signature = self.signature
            if signature is not None:
                cur_type = cur_type.split('(')[0]
                d = self.mergeFunctionComment(name,
                        ((cur_type, None), signature), 1)
                self.index_add(name, self.filename, not self.is_header,
                               "functype", d)
            elif base_type == "struct":
                self.index_add(name, self.filename, not self.is_header,
                               "struct", cur_type)
                base_type = "struct " + name
            else:
                # TODO report missing or misformatted comments
                info = self.parseTypeComment(name, 1)
                self.index_add(name, self.filename, not self.is_header,
                               "typedef", cur_type, info)
            token = self.token()

            if token is not None and token[0] == 'sep' and token[1] == ',':
                cur_type = base_type
                token = self.token()
                while token is not None and token[0] == "op":
                    cur_type = cur_type + token[1]
                    token = self.token()
            elif token is not None and token[0] == 'sep' and token[1] == ';':
                break
            elif token is not None and token[0] == 'name':
                cur_type = base_type
                continue
            else:
                self.error("parsing typedef: expecting ';'", token)
                return token
        token = self.token()
        return token
1205

1206 1207 1208 1209 1210
     #
     # Parse a C code block, used for functions; it parses up to and
     # including the balancing }
     #
    def parseBlock(self, token):
        """Skip a C code block up to and including its balancing '}'.

        Nested '{ ... }' blocks are handled recursively.  self.comment is
        reset when the closing brace is met.  When self.collect_ref is 1,
        references are recorded with index_add_ref() on the way:
        'vir*' names followed by '(' as "function", 'vir*' names followed
        by another name and then ';', ',' or '=' as "type", and 'XEN_*' /
        'LIBXEN_*' names as "typedef".

        Returns the token after the closing '}', or None when the input
        ends first.
        """
        while token is not None:
            if token[0] == "sep" and token[1] == "{":
                token = self.token()
                token = self.parseBlock(token)
            elif token[0] == "sep" and token[1] == "}":
                self.comment = None
                token = self.token()
                return token
            elif self.collect_ref == 1:
                oldtok = token
                token = self.token()
                if oldtok[0] != "name":
                    continue
                ident = oldtok[1]
                if ident[0:3] == "vir":
                    # The input may end right after the identifier
                    if token is None:
                        continue
                    if token[0] == "sep" and token[1] == "(":
                        self.index_add_ref(ident, self.filename,
                                           0, "function")
                        token = self.token()
                    elif token[0] == "name":
                        token = self.token()
                        if (token is not None and token[0] == "sep" and
                                token[1] in (";", ",", "=")):
                            self.index_add_ref(ident, self.filename,
                                               0, "type")
                elif ident[0:4] == "XEN_":
                    self.index_add_ref(ident, self.filename,
                                       0, "typedef")
                elif ident[0:7] == "LIBXEN_":
                    self.index_add_ref(ident, self.filename,
                                       0, "typedef")
            else:
                token = self.token()
        return token
1244 1245 1246 1247 1248 1249

     #
     # Parse a C struct definition till the balancing }
     #
    def parseStruct(self, token):
        """Parse the body of a C struct up to its balancing '}'.

        Each 'type name;' member is stored as (type, name, comment), or as
        (type, name, comment, union_fields) when the member type is
        "union".  The comment is whatever self.comment holds after the
        token following the ';' has been read, cleaned by cleanupComment().
        Anonymous '{ ... }' members are skipped.  The collected list is
        stored in self.struct_fields.

        Returns the token after the closing '}', or None when the input
        ends first.
        """
        fields = []
        while token is not None:
            if token[0] == "sep" and token[1] == "{":
                token = self.token()
                token = self.parseTypeBlock(token)
            elif token[0] == "sep" and token[1] == "}":
                self.struct_fields = fields
                token = self.token()
                return token
            else:
                base_type = self.type
                token = self.parseType(token)
                if token is not None and token[0] == "name":
                    fname = token[1]
                    token = self.token()
                    # token is None when the input ends after the name
                    if (token is not None and token[0] == "sep" and
                            token[1] == ";"):
                        # Reset first so only a comment read together with
                        # the next token is attached to this field
                        self.comment = None
                        token = self.token()
                        self.cleanupComment()
                        if self.type == "union":
                            fields.append((self.type, fname, self.comment,
                                           self.union_fields))
                            self.union_fields = []
                        else:
                            fields.append((self.type, fname, self.comment))
                        self.comment = None
                    else:
                        self.error("parseStruct: expecting ;", token)
                elif token is not None and token[0] == "sep" and token[1] == "{":
                    token = self.token()
                    token = self.parseTypeBlock(token)
                    if token is not None and token[0] == "name":
                        token = self.token()
                    if token is not None and token[0] == "sep" and token[1] == ";":
                        token = self.token()
                    else:
                        self.error("parseStruct: expecting ;", token)
                else:
                    self.error("parseStruct: name", token)
                    token = self.token()
                self.type = base_type
        self.struct_fields = fields
        return token
1299

1300 1301 1302 1303 1304 1305
     #
     # Parse a C union definition till the balancing }
     #
    def parseUnion(self, token):
        """Parse the body of a C union up to its balancing '}'.

        Each 'type name;' member is stored as (type, name, comment), the
        comment being whatever self.comment holds after the token
        following the ';' has been read, cleaned by cleanupComment().
        Anonymous '{ ... }' members are skipped.  The collected list is
        stored in self.union_fields.

        Returns the token after the closing '}', or None when the input
        ends first.
        """
        fields = []
        while token is not None:
            if token[0] == "sep" and token[1] == "{":
                token = self.token()
                token = self.parseTypeBlock(token)
            elif token[0] == "sep" and token[1] == "}":
                self.union_fields = fields
                token = self.token()
                return token
            else:
                base_type = self.type
                token = self.parseType(token)
                if token is not None and token[0] == "name":
                    fname = token[1]
                    token = self.token()
                    # token is None when the input ends after the name
                    if (token is not None and token[0] == "sep" and
                            token[1] == ";"):
                        # Reset first so only a comment read together with
                        # the next token is attached to this field
                        self.comment = None
                        token = self.token()
                        self.cleanupComment()
                        fields.append((self.type, fname, self.comment))
                        self.comment = None
                    else:
                        self.error("parseUnion: expecting ;", token)
                elif token is not None and token[0] == "sep" and token[1] == "{":
                    token = self.token()
                    token = self.parseTypeBlock(token)
                    if token is not None and token[0] == "name":
                        token = self.token()
                    if token is not None and token[0] == "sep" and token[1] == ";":
                        token = self.token()
                    else:
                        self.error("parseUnion: expecting ;", token)
                else:
                    self.error("parseUnion: name", token)
                    token = self.token()
                self.type = base_type
        self.union_fields = fields
        return token

1350 1351 1352 1353 1354
     #
     # Parse a C enum block, parse till the balancing }
     #
    def parseEnumBlock(self, token):
        """Parse the body of a C enum up to its balancing '}'.

        self.enums is filled with (name, value, comment) tuples.  An
        explicit '= expr' value is stored as the concatenated expression
        tokens, with a trailing 'U' removed from plain integer literals;
        otherwise the value is the previous value plus one, or "" (with a
        warning) when the previous value is not a plain integer.

        When a comment is already pending on entry, comments are taken to
        precede their enumerator and each entry is emitted as soon as its
        ',' is seen; otherwise an entry is emitted when the next name or
        the closing '}' is reached, using the comment read in between.

        Returns the token after the closing '}', or None when the input
        ends first.
        """
        self.enums = []
        name = None
        comment = ""
        value = "-1"
        commentsBeforeVal = self.comment is not None
        while token is not None:
            if token[0] == "sep" and token[1] == "{":
                token = self.token()
                token = self.parseTypeBlock(token)
            elif token[0] == "sep" and token[1] == "}":
                if name is not None:
                    self.cleanupComment()
                    if self.comment is not None:
                        comment = self.comment
                        self.comment = None
                    self.enums.append((name, value, comment))
                token = self.token()
                return token
            elif token[0] == "name":
                self.cleanupComment()
                if name is not None:
                    if self.comment is not None:
                        comment = self.comment.strip()
                        self.comment = None
                    self.enums.append((name, value, comment))
                name = token[1]
                comment = ""
                token = self.token()
                if (token is not None and token[0] == "op" and
                        token[1][0] == "="):
                    value = ""
                    if len(token[1]) > 1:
                        value = token[1][1:]
                    token = self.token()
                    # Collect the expression up to the next ',' or '}';
                    # stop as well if the input ends in the middle of it
                    while token is not None and (
                            token[0] != "sep" or
                            (token[1] != ',' and token[1] != '}')):
                        # We might be dealing with '1U << 12' here
                        value = value + re.sub(r"^(\d+)U$", "\\1", token[1])
                        token = self.token()
                else:
                    try:
                        value = "%d" % (int(value) + 1)
                    except ValueError:
                        self.warning("Failed to compute value of enum %s" % (name))
                        value = ""
                if token is not None and token[0] == "sep" and token[1] == ",":
                    if commentsBeforeVal:
                        self.cleanupComment()
                        self.enums.append((name, value, self.comment))
                        name = comment = self.comment = None
                    token = self.token()
            else:
                token = self.token()
        return token
1407

1408 1409 1410 1411 1412 1413 1414 1415 1416 1417 1418 1419 1420 1421 1422 1423 1424 1425 1426 1427 1428 1429 1430 1431 1432 1433 1434 1435 1436 1437 1438 1439 1440 1441 1442 1443 1444 1445 1446 1447 1448 1449 1450 1451 1452 1453 1454 1455 1456 1457 1458 1459 1460 1461 1462 1463 1464 1465 1466 1467 1468 1469 1470 1471 1472 1473 1474 1475 1476 1477 1478 1479 1480 1481 1482 1483 1484 1485 1486 1487 1488 1489 1490 1491 1492 1493 1494 1495 1496
    def parseVirEnumDecl(self, token):
        """Consume the remainder of a VIR_ENUM_DECL invocation.

        Expects `token` to be a name, followed by ')' and an optional ';'.
        Each mismatch is reported once through self.error().

        Returns the token following the construct, or None when the input
        ends first.
        """
        if token is None or token[0] != "name":
            self.error("parsing VIR_ENUM_DECL: expecting name", token)
        if token is None:
            return None

        token = self.token()
        if token is None or token[0] != "sep" or token[1] != ')':
            self.error("parsing VIR_ENUM_DECL: expecting ')'", token)
        if token is None:
            return None

        token = self.token()
        if token is not None and token[0] == "sep" and token[1] == ';':
            token = self.token()

        return token

    def parseVirEnumImpl(self, token):
        """Consume the remainder of a VIR_ENUM_IMPL invocation.

        Expects `token` to be the type name, followed by ',', the sentinel
        name, ',' and a list of strings, each optionally wrapped in N_(...),
        then the closing ')' and an optional ';'.  Mismatches are reported
        through self.error().

        Returns the token following the construct, or None when the input
        ends first.
        """
        # Type name, ',', sentinel name, ','
        header = (("name", None, "expecting name"),
                  ("sep", ',', "expecting ','"),
                  ("name", None, "expecting name"),
                  ("sep", ',', "expecting ','"))
        for kind, text, expected in header:
            if (token is None or token[0] != kind or
                    (text is not None and token[1] != text)):
                self.error("parsing VIR_ENUM_IMPL: " + expected, token)
            if token is None:
                return None
            token = self.token()

        # Now a list of strings (optional comments)
        while token is not None:
            isGettext = False
            consumed = False
            # First a string, optionally with N_(...)
            if token[0] == 'name':
                if token[1] != 'N_':
                    self.error("parsing VIR_ENUM_IMPL: expecting 'N_'", token)
                token = self.token()
                if token is None or token[0] != "sep" or token[1] != '(':
                    self.error("parsing VIR_ENUM_IMPL: expecting '('", token)
                if token is None:
                    return None
                token = self.token()
                isGettext = True

                if token is None or token[0] != "string":
                    self.error("parsing VIR_ENUM_IMPL: expecting a string", token)
                if token is None:
                    return None
                token = self.token()
                consumed = True
            elif token[0] == "string":
                token = self.token()
                consumed = True
            else:
                self.error("parsing VIR_ENUM_IMPL: expecting a string", token)

            if token is None:
                return None

            # Then a separator
            if token[0] == "sep":
                if isGettext and token[1] == ')':
                    token = self.token()
                    consumed = True

                if token is not None and token[1] == ',':
                    token = self.token()
                    consumed = True

                if token is not None and token[1] == ')':
                    token = self.token()
                    break

            # Then an optional comment
            if token is not None and token[0] == "comment":
                token = self.token()
                consumed = True

            # When error() returns instead of aborting, an unexpected token
            # would otherwise be examined forever: always move forward.
            if not consumed and token is not None:
                token = self.token()

        if token is not None and token[0] == "sep" and token[1] == ';':
            token = self.token()

        return token

1497 1498 1499 1500 1501 1502 1503 1504 1505 1506 1507 1508 1509 1510 1511 1512 1513 1514
    def parseVirLogInit(self, token):
        """Consume the remainder of a VIR_LOG_INIT invocation.

        Expects `token` to be a string, followed by ')' and an optional
        ';'.  Each mismatch is reported once through self.error().

        Returns the token following the construct, or None when the input
        ends first.
        """
        if token is None or token[0] != "string":
            self.error("parsing VIR_LOG_INIT: expecting string", token)
        if token is None:
            return None

        token = self.token()
        if token is None or token[0] != "sep" or token[1] != ')':
            self.error("parsing VIR_LOG_INIT: expecting ')'", token)
        if token is None:
            return None

        token = self.token()
        if token is not None and token[0] == "sep" and token[1] == ';':
            token = self.token()

        return token

1515
     #
1516
     # Parse a C definition block, used for structs or unions it parse till
1517 1518 1519
     # the balancing }
     #
    def parseTypeBlock(self, token):
        """Skip tokens up to and including the '}' balancing the open block.

        Nested '{ ... }' pairs are tracked with a depth counter instead of
        recursion, so the nesting level is not bounded by the interpreter's
        recursion limit.

        Returns the token after the balancing '}', or None when the input
        ends first.
        """
        depth = 0
        while token is not None:
            is_sep = token[0] == "sep"
            if is_sep and token[1] == "{":
                depth += 1
                token = self.token()
            elif is_sep and token[1] == "}":
                token = self.token()
                if depth == 0:
                    return token
                depth -= 1
            else:
                token = self.token()
        return token
1530 1531 1532 1533 1534 1535 1536 1537

     #
     # Parse a type: the fact that the type name can either occur after
     #    the definition or within the definition makes it a little harder
     #    if inside, the name token is pushed back before returning
     #
    def parseType(self, token):
        """Parse a C type specification starting at `token`.

        The textual form of the type is accumulated in self.type;
        self.struct_fields, self.union_fields and self.signature are reset
        on entry.  Because the declared name may appear inside the type
        (function pointers, arrays, bitfields), some lookahead is needed:
        when the name has been read it is returned as the result and the
        token that followed it is pushed back on the lexer.

        Returns the next token to process (usually the declared name), or
        None at end of input.
        """
        self.type = ""
        self.struct_fields = []
        self.union_fields = []
        self.signature = None
        if token is None:
            return token

        def add_word(word):
            # Append a keyword to self.type, space separated.
            if self.type == "":
                self.type = word
            else:
                self.type = self.type + " " + word

        while (token is not None and token[0] == "name" and
               token[1] in ["const", "unsigned", "signed"]):
            add_word(token[1])
            token = self.token()

        if token is None:
            # The input ended right after a qualifier.
            self.error("parsing type %s: expecting a name" % (self.type),
                       token)
            return token

        if token[0] == "name" and token[1] == "long":
            add_word(token[1])

            # some read ahead for long long
            oldtmp = token
            token = self.token()
            if token is not None and token[0] == "name" and token[1] == "long":
                self.type = self.type + " " + token[1]
            else:
                self.push(token)
                token = oldtmp

            # ... and for an optional trailing int
            oldtmp = token
            token = self.token()
            if token is not None and token[0] == "name" and token[1] == "int":
                self.type = self.type + " " + token[1]
            else:
                self.push(token)
                token = oldtmp

        elif token[0] == "name" and token[1] == "short":
            add_word(token[1])

        elif token[0] == "name" and token[1] == "struct":
            add_word(token[1])
            token = self.token()
            nametok = None
            if token is not None and token[0] == "name":
                nametok = token
                token = self.token()
            if token is not None and token[0] == "sep" and token[1] == "{":
                token = self.token()
                token = self.parseStruct(token)
            elif token is not None and token[0] == "op" and token[1] == "*":
                if nametok is None:
                    # "struct *" without a tag cannot be described
                    self.error("struct : expecting name", token)
                    return token
                self.type = self.type + " " + nametok[1] + " *"
                token = self.token()
                while token is not None and token[0] == "op" and token[1] == "*":
                    self.type = self.type + " *"
                    token = self.token()
                if token is not None and token[0] == "name":
                    nametok = token
                    token = self.token()
                else:
                    self.error("struct : expecting name", token)
                    return token
            elif token is not None and token[0] == "name" and nametok is not None:
                self.type = self.type + " " + nametok[1]
                return token

            if nametok is not None:
                self.lexer.push(token)
                token = nametok
            return token

        elif token[0] == "name" and token[1] == "union":
            add_word(token[1])
            token = self.token()
            nametok = None
            if token is not None and token[0] == "name":
                nametok = token
                token = self.token()
            if token is not None and token[0] == "sep" and token[1] == "{":
                token = self.token()
                token = self.parseUnion(token)
            elif token is not None and token[0] == "name" and nametok is not None:
                self.type = self.type + " " + nametok[1]
                return token

            if nametok is not None:
                self.lexer.push(token)
                token = nametok
            return token

        elif token[0] == "name" and token[1] == "enum":
            add_word(token[1])
            self.enums = []
            token = self.token()
            if token is not None and token[0] == "sep" and token[1] == "{":
                # drop comments before the enum block
                self.comment = None
                token = self.token()
                token = self.parseEnumBlock(token)
            else:
                self.error("parsing enum: expecting '{'", token)
            enum_type = None
            if token is not None and token[0] == "name":
                enum_type = token[1]
            elif token is not None:
                # anonymous enum: hand back a placeholder name and keep
                # the real token for the caller
                self.lexer.push(token)
                token = ("name", "enum")
            for enum in self.enums:
                self.index_add(enum[0], self.filename,
                               not self.is_header, "enum",
                               (enum[1], enum[2], enum_type))
            return token

        elif token[0] == "name" and token[1] == "VIR_ENUM_DECL":
            token = self.token()
            if token is not None and token[0] == "sep" and token[1] == "(":
                token = self.token()
                token = self.parseVirEnumDecl(token)
            else:
                self.error("parsing VIR_ENUM_DECL: expecting '('", token)
            if token is not None:
                self.lexer.push(token)
                token = ("name", "virenumdecl")
            return token

        elif token[0] == "name" and token[1] == "VIR_ENUM_IMPL":
            token = self.token()
            if token is not None and token[0] == "sep" and token[1] == "(":
                token = self.token()
                token = self.parseVirEnumImpl(token)
            else:
                self.error("parsing VIR_ENUM_IMPL: expecting '('", token)
            if token is not None:
                self.lexer.push(token)
                token = ("name", "virenumimpl")
            return token

        elif token[0] == "name" and token[1] == "VIR_LOG_INIT":
            token = self.token()
            if token is not None and token[0] == "sep" and token[1] == "(":
                token = self.token()
                token = self.parseVirLogInit(token)
            else:
                self.error("parsing VIR_LOG_INIT: expecting '('", token)
            if token is not None:
                self.lexer.push(token)
                token = ("name", "virloginit")
            return token

        elif token[0] == "name":
            add_word(token[1])
        else:
            self.error("parsing type %s: expecting a name" % (self.type),
                       token)
            return token
        token = self.token()
        while token is not None and (token[0] == "op" or
              token[0] == "name" and token[1] == "const"):
            self.type = self.type + " " + token[1]
            token = self.token()

        #
        # if there is a parenthesis here, this means a function type
        #
        if token is not None and token[0] == "sep" and token[1] == '(':
            self.type = self.type + token[1]
            token = self.token()
            while token is not None and token[0] == "op" and token[1] == '*':
                self.type = self.type + token[1]
                token = self.token()
            if token is None or token[0] != "name":
                self.error("parsing function type, name expected", token)
                return token
            self.type = self.type + token[1]
            nametok = token
            token = self.token()
            if token is not None and token[0] == "sep" and token[1] == ')':
                self.type = self.type + token[1]
                token = self.token()
                if token is not None and token[0] == "sep" and token[1] == '(':
                    token = self.token()
                    # parseSignature() parses types itself and therefore
                    # overwrites self.type; keep ours and restore it.
                    saved_type = self.type
                    token = self.parseSignature(token)
                    self.type = saved_type
                else:
                    self.error("parsing function type, '(' expected", token)
                    return token
            else:
                self.error("parsing function type, ')' expected", token)
                return token
            self.lexer.push(token)
            token = nametok
            return token

        #
        # do some lookahead for arrays
        #
        if token is not None and token[0] == "name":
            nametok = token
            token = self.token()
            if token is not None and token[0] == "sep" and token[1] == '[':
                self.type = self.type + " " + nametok[1]
                while token is not None and token[0] == "sep" and token[1] == '[':
                    self.type = self.type + token[1]
                    token = self.token()
                    while token is not None and token[0] != 'sep' and \
                          token[1] != ']' and token[1] != ';':
                        self.type = self.type + token[1]
                        token = self.token()
                if token is not None and token[0] == 'sep' and token[1] == ']':
                    self.type = self.type + token[1]
                    token = self.token()
                else:
                    self.error("parsing array type, ']' expected", token)
                    return token
            elif token is not None and token[0] == "sep" and token[1] == ':':
                # remove :12 in case it's a limited int size
                token = self.token()
                token = self.token()
            self.lexer.push(token)
            token = nametok

        return token
1775 1776 1777 1778 1779 1780

     #
     # Parse a signature: '(' has been parsed and we scan the type definition
     #    up to the ')' included
    def parseSignature(self, token):
        """Parse a parameter list whose opening '(' was already consumed.

        Each parameter is recorded as a (type, name, None) tuple; a
        parameter given only as a type gets None as its name, except that
        the type "..." is recorded with the name "...".  The result is
        stored in self.signature and the token following the closing ')'
        is returned.
        """
        def is_sep(tok, value):
            return tok is not None and tok[0] == "sep" and tok[1] == value

        if is_sep(token, ')'):
            # empty parameter list
            self.signature = []
            return self.token()

        # Collected locally: parseType() resets self.signature each time.
        params = []
        while token is not None:
            token = self.parseType(token)
            if token is None:
                continue
            if token[0] == "name":
                params.append((self.type, token[1], None))
                token = self.token()
            elif is_sep(token, ','):
                token = self.token()
                continue
            elif is_sep(token, ')'):
                # only the type was provided
                label = "..." if self.type == "..." else None
                params.append((self.type, label, None))

            if is_sep(token, ','):
                token = self.token()
            elif is_sep(token, ')'):
                token = self.token()
                break
        self.signature = params
        return token
1808

1809 1810 1811
    # this dict contains the functions that are allowed to use [unsigned]
    # long for legacy reasons in their signature and return type. this list is
    # fixed. new procedures and public APIs have to use [unsigned] long long
1812 1813 1814 1815 1816 1817 1818 1819 1820 1821 1822 1823 1824 1825 1826 1827 1828 1829 1830 1831 1832 1833 1834 1835 1836 1837 1838 1839 1840 1841 1842 1843 1844 1845 1846 1847
    long_legacy_functions = {
        "virGetVersion": (False, ("libVer", "typeVer")),
        "virConnectGetLibVersion": (False, ("libVer")),
        "virConnectGetVersion": (False, ("hvVer")),
        "virDomainGetMaxMemory": (True, ()),
        "virDomainMigrate": (False, ("flags", "bandwidth")),
        "virDomainMigrate2": (False, ("flags", "bandwidth")),
        "virDomainMigrateBegin3": (False, ("flags", "bandwidth")),
        "virDomainMigrateConfirm3": (False, ("flags", "bandwidth")),
        "virDomainMigrateDirect": (False, ("flags", "bandwidth")),
        "virDomainMigrateFinish": (False, ("flags")),
        "virDomainMigrateFinish2": (False, ("flags")),
        "virDomainMigrateFinish3": (False, ("flags")),
        "virDomainMigratePeer2Peer": (False, ("flags", "bandwidth")),
        "virDomainMigratePerform": (False, ("flags", "bandwidth")),
        "virDomainMigratePerform3": (False, ("flags", "bandwidth")),
        "virDomainMigratePrepare": (False, ("flags", "bandwidth")),
        "virDomainMigratePrepare2": (False, ("flags", "bandwidth")),
        "virDomainMigratePrepare3": (False, ("flags", "bandwidth")),
        "virDomainMigratePrepareTunnel": (False, ("flags", "bandwidth")),
        "virDomainMigratePrepareTunnel3": (False, ("flags", "bandwidth")),
        "virDomainMigrateToURI": (False, ("flags", "bandwidth")),
        "virDomainMigrateToURI2": (False, ("flags", "bandwidth")),
        "virDomainMigrateVersion1": (False, ("flags", "bandwidth")),
        "virDomainMigrateVersion2": (False, ("flags", "bandwidth")),
        "virDomainMigrateVersion3": (False, ("flags", "bandwidth")),
        "virDomainMigrateSetMaxSpeed": (False, ("bandwidth")),
        "virDomainSetMaxMemory": (False, ("memory")),
        "virDomainSetMemory": (False, ("memory")),
        "virDomainSetMemoryFlags": (False, ("memory")),
        "virDomainBlockCommit": (False, ("bandwidth")),
        "virDomainBlockJobSetSpeed": (False, ("bandwidth")),
        "virDomainBlockPull": (False, ("bandwidth")),
        "virDomainBlockRebase": (False, ("bandwidth")),
        "virDomainMigrateGetMaxSpeed": (False, ("bandwidth"))
    }
1848 1849 1850 1851 1852 1853 1854 1855 1856 1857 1858 1859 1860 1861 1862 1863 1864 1865 1866 1867 1868 1869 1870

    def checkLongLegacyFunction(self, name, return_type, signature):
        if "long" in return_type and "long long" not in return_type:
            try:
                if not CParser.long_legacy_functions[name][0]:
                    raise Exception()
            except:
                self.error(("function '%s' is not allowed to return long, "
                            "use long long instead") % (name))

        for param in signature:
            if "long" in param[0] and "long long" not in param[0]:
                try:
                    if param[1] not in CParser.long_legacy_functions[name][1]:
                        raise Exception()
                except:
                    self.error(("function '%s' is not allowed to take long "
                                "parameter '%s', use long long instead")
                               % (name, param[1]))

    # this dict contains the structs that are allowed to use [unsigned]
    # long for legacy reasons. this list is fixed. new structs have to use
    # [unsigned] long long
1871 1872 1873 1874 1875
    long_legacy_struct_fields = {
        "_virDomainInfo": ("maxMem", "memory"),
        "_virNodeInfo": ("memory"),
        "_virDomainBlockJobInfo": ("bandwidth")
    }
1876 1877 1878 1879 1880 1881 1882 1883 1884 1885 1886 1887

    def checkLongLegacyStruct(self, name, fields):
        for field in fields:
            if "long" in field[0] and "long long" not in field[0]:
                try:
                    if field[1] not in CParser.long_legacy_struct_fields[name]:
                        raise Exception()
                except:
                    self.error(("struct '%s' is not allowed to contain long "
                                "field '%s', use long long instead") \
                               % (name, field[1]))

1888 1889 1890 1891 1892 1893 1894
     #
     # Parse a global definition, be it a type, variable or function
     # the extern "C" blocks are a bit nasty and require it to recurse.
     #
    def parseGlobal(self, token):
        """Parse one top-level definition: a type, variable or function.

        `token` is the first token of the definition.  extern "C" { ... }
        blocks are handled by recursing on their content, typedefs are
        delegated to parseTypedef(), and variables, structs and functions
        are registered through index_add().

        Returns the first token after the definition, or None at end of
        input.
        """
        static = 0
        if token[1] == 'extern':
            token = self.token()
            if token is None:
                return token
            if token[0] == 'string':
                if token[1] == 'C':
                    token = self.token()
                    if token is None:
                        return token
                    if token[0] == 'sep' and token[1] == "{":
                        token = self.token()
                        while token is not None and (token[0] != 'sep' or
                              token[1] != "}"):
                            if token[0] != 'name':
                                self.error(
                                 "token %s %s unexpected at the top level" % (
                                        token[0], token[1]))
                            token = self.parseGlobal(token)
                        token = self.token()
                        return token
                else:
                    return token
        elif token[1] == 'static':
            static = 1
            token = self.token()
            if token is None or token[0] != 'name':
                return token

        if token[1] == 'typedef':
            token = self.token()
            return self.parseTypedef(token)

        token = self.parseType(token)
        type_orig = self.type
        if token is None or token[0] != "name":
            return token
        decl_type = type_orig
        self.name = token[1]
        token = self.token()
        while token is not None and (token[0] == "sep" or token[0] == "op"):
            if token[0] == "op" and token[1] != "=":
                # Nothing below consumes such a token; stop here instead of
                # spinning on it forever and let the caller deal with it.
                break

            if token[0] == "sep":
                if token[1] == "[":
                    decl_type = decl_type + token[1]
                    token = self.token()
                    while token is not None and (token[0] != "sep" or
                          token[1] != ";"):
                        decl_type = decl_type + token[1]
                        token = self.token()

            if token is not None and token[0] == "op" and token[1] == "=":
                #
                # Skip the initialization of the variable
                #
                token = self.token()
                if (token is not None and token[0] == 'sep' and
                        token[1] == '{'):
                    token = self.token()
                    token = self.parseBlock(token)
                else:
                    self.comment = None
                    while token is not None and (token[0] != "sep" or
                          (token[1] != ';' and token[1] != ',')):
                        token = self.token()
                self.comment = None
                if token is None or token[0] != "sep" or (token[1] != ';' and
                   token[1] != ','):
                    self.error("missing ';' or ',' after value")

            if token is not None and token[0] == "sep":
                if token[1] == ";":
                    self.comment = None
                    token = self.token()
                    if decl_type == "struct":
                        self.checkLongLegacyStruct(self.name, self.struct_fields)
                        self.index_add(self.name, self.filename,
                             not self.is_header, "struct", self.struct_fields)
                    else:
                        self.index_add(self.name, self.filename,
                             not self.is_header, "variable", decl_type)
                    break
                elif token[1] == "(":
                    token = self.token()
                    token = self.parseSignature(token)
                    if token is None:
                        return None
                    if token[0] == "sep" and token[1] == ";":
                        # prototype only
                        self.checkLongLegacyFunction(self.name, decl_type,
                                                     self.signature)
                        d = self.mergeFunctionComment(self.name,
                                ((decl_type, None), self.signature), 1)
                        self.index_add(self.name, self.filename, static,
                                        "function", d)
                        token = self.token()
                    elif token[0] == "sep" and token[1] == "{":
                        # definition: register it, then skip the body
                        self.checkLongLegacyFunction(self.name, decl_type,
                                                     self.signature)
                        d = self.mergeFunctionComment(self.name,
                                ((decl_type, None), self.signature), static)
                        self.index_add(self.name, self.filename, static,
                                        "function", d)
                        token = self.token()
                        token = self.parseBlock(token)
                elif token[1] == ',':
                    # several variables declared in one statement
                    self.comment = None
                    self.index_add(self.name, self.filename, static,
                                    "variable", decl_type)
                    decl_type = type_orig
                    token = self.token()
                    while token is not None and token[0] == "sep":
                        decl_type = decl_type + token[1]
                        token = self.token()
                    if token is not None and token[0] == "name":
                        self.name = token[1]
                        token = self.token()
                else:
                    break

        return token
2013 2014

    def parse(self):
        """Parse the whole file, one global definition at a time.

        Returns self.index once the input is exhausted and the top comment
        has been processed.  When a token that is not a name shows up at
        the top level, the error is reported, the token is still handed to
        parseGlobal(), and None is returned.
        """
        if not quiet:
            print("Parsing %s" % (self.filename))

        token = self.token()
        while token is not None:
            if token[0] != 'name':
                self.error("token %s %s unexpected at the top level" % (
                       token[0], token[1]))
                self.parseGlobal(token)
                return None
            token = self.parseGlobal(token)

        self.parseTopComment(self.top_comment)
        return self.index
2028

2029 2030 2031

class docBuilder:
    """A documentation builder"""
J
Jiri Denemark 已提交
2032
    def __init__(self, name, path='.', directories=None, includes=None):
        """Set up a builder for the project `name`.

        `directories` lists the directories to scan (default ['.']) and
        `includes` gives extra file names to consider on top of the
        built-in list for the known projects "libvirt", "libvirt-qemu",
        "libvirt-lxc" and "libvirt-admin".
        """
        # None stands in for the former mutable defaults so that no list
        # object is shared between instances.
        if directories is None:
            directories = ['.']
        if includes is None:
            includes = []

        self.name = name
        self.path = path
        self.directories = directories
        # Unknown project names keep only the caller-supplied list, so the
        # attribute always exists.
        self.includes = list(includes)
        if name == "libvirt":
            self.includes = includes + list(included_files.keys())
        elif name == "libvirt-qemu":
            self.includes = includes + list(qemu_included_files.keys())
        elif name == "libvirt-lxc":
            self.includes = includes + list(lxc_included_files.keys())
        elif name == "libvirt-admin":
            self.includes = includes + list(admin_included_files.keys())
        self.modules = {}
        self.headers = {}
        self.idx = index()
        self.xref = {}
        self.index = {}
        self.basename = name
        self.errors = 0
2051

2052 2053 2054
    def warning(self, msg):
        """Count a warning in the module-wide counter and print `msg`."""
        global warnings
        warnings += 1
        print(msg)
2056

2057 2058
    def error(self, msg):
        """Count an error on this builder and report `msg` on stderr."""
        self.errors = self.errors + 1
        print("Error:", msg, file=sys.stderr)
2060

2061
    def indexString(self, id, str):
        """Record `id` in self.xref under each significant word of `str`.

        Punctuation is replaced by spaces before splitting.  Words that do
        not start with an ASCII letter, are shorter than three characters,
        or are "and"/"the" in any letter case are ignored.  Does nothing
        when `str` is None.
        """
        if str is None:
            return

        cleaned = re.sub(r"['\"/*\[\]()<>&#,.;]", ' ', str)
        for word in cleaned.split():
            if not re.match(r"[a-zA-Z]", word[0]):
                continue
            if len(word) < 3:
                continue
            # TODO: generalize this a bit
            if word.lower() in ('and', 'the'):
                continue
            self.xref.setdefault(word, []).append(id)
2095 2096

    def analyze(self):
        """Print a project summary unless quiet, then analyze the index."""
        if not quiet:
            header_count = len(self.headers.keys())
            module_count = len(self.modules.keys())
            print("Project %s : %d headers, %d modules" % (
                  self.name, header_count, module_count))
        self.idx.analyze()
2100 2101

    def scanHeaders(self):
        """Parse every registered header and merge it into the index.

        The parse result replaces the placeholder stored in self.headers
        and is merged into self.idx with merge().
        """
        for path in self.headers:
            parsed = CParser(path).parse()
            self.headers[path] = parsed
            self.idx.merge(parsed)
2107 2108

    def scanModules(self):
        """Parse every registered C module and merge it into the index.

        The parse result replaces the placeholder stored in self.modules
        and is merged into self.idx with merge_public().
        """
        for path in self.modules:
            parsed = CParser(path).parse()
            self.modules[path] = parsed
            self.idx.merge_public(parsed)
2115 2116 2117

    def scan(self):
        """Collect the sources to process, then parse them.

        Every *.c and *.h file of self.directories whose path contains one
        of self.includes as a substring is registered in self.modules or
        self.headers respectively; headers are then scanned before
        modules.
        """
        for directory in self.directories:
            targets = (("/*.c", self.modules), ("/*.h", self.headers))
            for pattern, registry in targets:
                for path in glob.glob(directory + pattern):
                    if any(incl in path for incl in self.includes):
                        registry[path] = None
        self.scanHeaders()
        self.scanModules()
2138

2139 2140
    def modulename_file(self, file):
        """Return the base name of `file` without a trailing .h or .c."""
        base = os.path.basename(file)
        if base.endswith('.h') or base.endswith('.c'):
            return base[:-2]
        return base
2146 2147 2148 2149

    def serialize_enum(self, output, name):
        """Write the <enum/> element describing the enum value `name`.

        The entry's info, when present, is indexed as (value, comment,
        type).  The value is evaluated as an expression when possible and
        written as text otherwise.
        """
        entry = self.idx.enums[name]
        output.write("    <enum name='%s' file='%s'" % (name,
                     self.modulename_file(entry.header)))
        if entry.info is not None:
            info = entry.info
            if info[0] is not None and info[0] != '':
                # NOTE(review): eval() is applied to text taken from the
                # parsed sources.  It runs with an empty namespace so that
                # a value spelled like a Python builtin or a global of this
                # script cannot resolve to a Python object; anything that
                # is not a plain constant expression is kept as text.
                try:
                    val = eval(info[0], {"__builtins__": {}}, {})
                except Exception:
                    val = info[0]
                output.write(" value='%s'" % (val))
            if info[2] is not None and info[2] != '':
                output.write(" type='%s'" % info[2])
            if info[1] is not None and info[1] != '':
                output.write(" info='%s'" % escape(info[1]))
        output.write("/>\n")

    def serialize_macro(self, output, name):
        """Write the <macro> element describing the macro `name`.

        The entry's info, when present, is an (args, description,
        string value) triple.  The description is written as CDATA and
        indexed under the macro name; each argument is written as an <arg>
        element and its description indexed under the argument name.
        """
        entry = self.idx.macros[name]
        emit = output.write
        emit("    <macro name='%s' file='%s'" % (name,
             self.modulename_file(entry.header)))

        args, desc, strValue = [], None, None
        if entry.info is not None:
            (args, desc, strValue) = entry.info

        if strValue is not None:
            emit(" string='%s'" % strValue)
        emit(">\n")

        if desc is not None and desc != "":
            emit("      <info><![CDATA[%s]]></info>\n" % (desc))
            self.indexString(name, desc)

        for (arg_name, arg_desc) in args:
            if arg_desc is None or arg_desc == "":
                emit("      <arg name='%s'/>\n" % (arg_name))
                continue
            emit("      <arg name='%s' info='%s'/>\n" % (
                 arg_name, escape(arg_desc)))
            self.indexString(arg_name, arg_desc)

        emit("    </macro>\n")

2193
    def serialize_union(self, output, field, desc):
        """Write a union-typed struct field together with its members.

        `field[1]` is the field name and `field[3]` the member list, each
        member being indexed as (type, name, description).  `desc` is
        written as given; member descriptions are escaped and a missing
        one becomes the empty string.
        """
        emit = output.write
        emit("      <field name='%s' type='union' info='%s'>\n" % (field[1], desc))
        emit("        <union>\n")
        for member in field[3]:
            member_doc = member[2]
            info = '' if member_doc is None else escape(member_doc)
            emit("          <field name='%s' type='%s' info='%s'/>\n" % (
                 member[1], member[0], info))

        emit("        </union>\n")
        emit("      </field>\n")

2207 2208
    def serialize_typedef(self, output, name):
        """Write the <struct> or <typedef> element for the typedef `name`.

        A typedef whose type text starts with "struct " is written as a
        <struct> element, with one <field> per known field when the struct
        itself was indexed with a field list.  Any other typedef is written
        as a <typedef> element, with its extra description as CDATA when
        there is one.
        """
        entry = self.idx.typedefs[name]
        if entry.info[0:7] == 'struct ':
            output.write("    <struct name='%s' file='%s' type='%s'" % (
                     name, self.modulename_file(entry.header), entry.info))
            # From here on `name` is the struct tag, not the typedef name.
            name = entry.info[7:]
            if (name in self.idx.structs and
                    isinstance(self.idx.structs[name].info, (list, tuple))):
                output.write(">\n")
                # Best effort: a malformed field aborts the field list with
                # a warning, but interrupts and exits are not swallowed.
                try:
                    for field in self.idx.structs[name].info:
                        desc = field[2]
                        self.indexString(name, desc)
                        if desc is None:
                            desc = ''
                        else:
                            desc = escape(desc)
                        if field[0] == "union":
                            self.serialize_union(output, field, desc)
                        else:
                            output.write("      <field name='%s' type='%s' info='%s'/>\n" % (field[1], field[0], desc))
                except Exception:
                    self.warning("Failed to serialize struct %s" % (name))
                output.write("    </struct>\n")
            else:
                output.write("/>\n")
        else:
            output.write("    <typedef name='%s' file='%s' type='%s'" % (
                         name, self.modulename_file(entry.header), entry.info))
            # Only the attribute lookup is guarded, so a failing write is
            # not answered with yet another write.
            try:
                desc = entry.extra
            except Exception:
                desc = None
            if desc is not None and desc != "":
                output.write(">\n      <info><![CDATA[%s]]></info>\n" % (desc))
                output.write("    </typedef>\n")
            else:
                output.write("/>\n")
2245 2246 2247

    def serialize_variable(self, output, name):
        """Write the <variable> element for the variable `name`.

        The type attribute is only emitted when the entry's info is not
        None.
        """
        entry = self.idx.variables[name]
        var_type = entry.info
        module = self.modulename_file(entry.header)
        if var_type is None:
            line = "    <variable name='%s' file='%s'/>\n" % (name, module)
        else:
            line = "    <variable name='%s' file='%s' type='%s'/>\n" % (
                   name, module, var_type)
        output.write(line)
2254

2255 2256
    def serialize_function(self, output, name):
        """Write the XML element describing the function `name`.

        The element is named after the entry's `type` attribute and carries
        the header and module the symbol comes from.  Inside it go an
        optional <cond> holding the entry's conditionals joined by an
        escaped '&&', the description as <info>, a <return> element and
        one <arg> per parameter whose type is not 'void'.

        A missing return or parameter description on a function that is
        not listed in ignored_functions is reported through self.error.
        Any other failure while writing these details is printed to stderr
        and reported through self.warning; the element is closed either
        way.  Only Exception subclasses are handled that way:
        KeyboardInterrupt and SystemExit propagate.
        """
        func = self.idx.functions[name]
        if name == debugsym and not quiet:
            print("=>", func)

        # NB: this is consumed by a regex in 'getAPIFilenames' in hvsupport.pl
        output.write("    <%s name='%s' file='%s' module='%s'>\n" % (func.type,
                     name, self.modulename_file(func.header),
                     self.modulename_file(func.module)))
        #
        # Processing of conditionals modified by Bill 1/1/05
        #
        if func.conditionals is not None:
            output.write("      <cond>%s</cond>\n" % (
                         " &amp;&amp; ".join(func.conditionals)))
        try:
            (ret, params, desc) = func.info
            output.write("      <info><![CDATA[%s]]></info>\n" % (desc))
            self.indexString(name, desc)
            if ret[0] is not None:
                if ret[0] == "void":
                    output.write("      <return type='void'/>\n")
                elif (ret[1] is None or ret[1] == '') and name not in ignored_functions:
                    self.error("Missing documentation for return of function `%s'" % name)
                else:
                    output.write("      <return type='%s' info='%s'/>\n" % (
                                 ret[0], escape(ret[1])))
                    self.indexString(name, ret[1])
            for param in params:
                if param[0] == 'void':
                    continue
                if param[2] is None or param[2] == '':
                    # Undocumented argument: tolerated (with an empty
                    # info) only for explicitly ignored functions.
                    if name in ignored_functions:
                        output.write("      <arg name='%s' type='%s' info=''/>\n" % (
                                     param[1], param[0]))
                    else:
                        self.error("Missing documentation for arg `%s' of function `%s'" % (
                                   param[1], name))
                else:
                    output.write("      <arg name='%s' type='%s' info='%s'/>\n" % (
                                 param[1], param[0], escape(param[2])))
                    self.indexString(name, param[2])
        except Exception as exc:
            print("Exception:", exc, file=sys.stderr)
            self.warning("Failed to save function %s info: %s" % (name, repr(func.info)))
        output.write("    </%s>\n" % (func.type))

    def serialize_exports(self, output, file):
        """Write the <file> element listing what the header `file` exports.

        When the header has an info mapping, its Summary, Description and
        Author entries are written first (a missing one is reported through
        self.warning), followed by a <deprecated/> marker if the
        description contains the word DEPRECATED.  Then comes one <exports>
        element per macro, enum, typedef, struct, variable and function.
        """
        module = self.modulename_file(file)
        output.write("    <file name='%s'>\n" % (module))
        header = self.headers[file]
        if header.info is not None:
            for key in ('Summary', 'Description', 'Author'):
                try:
                    output.write("     <%s>%s</%s>\n" % (
                                 key.lower(),
                                 escape(header.info[key]),
                                 key.lower()))
                except KeyError:
                    self.warning("Header %s lacks a %s description" % (module, key))
            if ('Description' in header.info and
                    "DEPRECATED" in header.info['Description']):
                output.write("     <deprecated/>\n")

        for symbol in uniq(header.macros.keys()):
            # Macros are sometime used to masquerade other types.
            masquerades = (symbol in header.functions or
                           symbol in header.variables or
                           symbol in header.typedefs or
                           symbol in header.structs or
                           symbol in header.unions or
                           symbol in header.enums)
            if not masquerades:
                output.write("     <exports symbol='%s' type='macro'/>\n" % (symbol))

        remaining = (('enum', header.enums),
                     ('typedef', header.typedefs),
                     ('struct', header.structs),
                     ('variable', header.variables),
                     ('function', header.functions))
        for kind, table in remaining:
            for symbol in uniq(table.keys()):
                output.write("     <exports symbol='%s' type='%s'/>\n" % (symbol, kind))
        output.write("    </file>\n")
2347 2348

    def serialize_xrefs_files(self, output):
        """Write, for each header in sorted order, a <file> element holding
        a <ref> for every function, variable, macro, typedef, struct and
        enum it declares (as filtered by uniq()).
        """
        for path in sorted(self.headers.keys()):
            output.write("    <file name='%s'>\n" % (self.modulename_file(path)))
            header = self.headers[path]
            symbols = []
            for table in (header.functions, header.variables, header.macros,
                          header.typedefs, header.structs, header.enums):
                symbols.extend(table.keys())
            for symbol in uniq(symbols):
                output.write("      <ref name='%s'/>\n" % (symbol))
            output.write("    </file>\n")

    def serialize_xrefs_functions(self, output):
        """Write, per parameter type, the functions taking that type.

        Every function's parameter list is scanned and the function is
        recorded under each parameter type other than 'void'.  The types
        are then written in sorted order as <type> elements holding one
        <ref> per function, also sorted.  The empty type and the common
        types void, int, char * and const char * are not written.

        Functions whose info cannot be unpacked as
        (return, parameters, description) are skipped silently.
        """
        users = {}
        for name in self.idx.functions.keys():
            entry = self.idx.functions[name]
            try:
                (ret, params, desc) = entry.info
                for param in params:
                    if param[0] == 'void':
                        continue
                    # A set, because a function taking the same type
                    # twice must still be listed only once.
                    users.setdefault(param[0], set()).add(name)
            except Exception:
                # Best effort: malformed entries are left out of the
                # cross references.  KeyboardInterrupt and SystemExit
                # are deliberately not caught.
                pass
        for ptype in sorted(users.keys()):
            if ptype in ('', "void", "int", "char *", "const char *"):
                continue
            output.write("    <type name='%s'>\n" % (ptype))
            for name in sorted(users[ptype]):
                output.write("      <ref name='%s'/>\n" % (name))
            output.write("    </type>\n")
2393 2394 2395

    def serialize_xrefs_constructors(self, output):
        """Write, per return type, the functions returning that type.

        Every function whose return type is not 'void' is recorded under
        that type.  The types are then written in sorted order as <type>
        elements holding one <ref> per function, also sorted.  The empty
        type and the common types void, int, char * and const char * are
        not written.

        Functions whose info cannot be unpacked as
        (return, parameters, description) are skipped silently.
        """
        producers = {}
        for name in self.idx.functions.keys():
            entry = self.idx.functions[name]
            try:
                (ret, params, desc) = entry.info
                if ret[0] == "void":
                    continue
                producers.setdefault(ret[0], []).append(name)
            except Exception:
                # Best effort: malformed entries are left out of the
                # cross references.  KeyboardInterrupt and SystemExit
                # are deliberately not caught.
                pass
        for rtype in sorted(producers.keys()):
            if rtype in ('', "void", "int", "char *", "const char *"):
                continue
            output.write("    <type name='%s'>\n" % (rtype))
            for name in sorted(producers[rtype]):
                output.write("      <ref name='%s'/>\n" % (name))
            output.write("    </type>\n")
2417 2418

    def serialize_xrefs_alpha(self, output):
        """Write every identifier as a <ref>, grouped by first character.

        Identifiers are visited in sorted order and a new <letter> element
        is opened each time the first character changes.
        """
        current = None          # first character of the <letter> now open
        for ident in sorted(self.idx.identifiers.keys()):
            initial = ident[0]
            if initial != current:
                if current is not None:
                    output.write("    </letter>\n")
                current = initial
                output.write("    <letter name='%s'>\n" % (current))
            output.write("      <ref name='%s'/>\n" % (ident))
        if current is not None:
            output.write("    </letter>\n")
2430 2431

    def serialize_xrefs_references(self, output):
        """Write a <reference> element for every identifier, in sorted order.

        The href is built from self.basename, the module name of the
        header declaring the identifier, and the identifier itself used as
        the anchor.
        """
        for symbol in sorted(self.idx.identifiers.keys()):
            entry = self.idx.identifiers[symbol]
            href = ('html/' + self.basename + '-' +
                    self.modulename_file(entry.header) + '.html#' + symbol)
            output.write("    <reference name='%s' href='%s'/>\n" % (symbol, href))
2440 2441 2442

    def serialize_xrefs_index(self, output):
        """Write the word index held in self.xref, split into chunks.

        Words are visited in sorted order; a word with more than 30
        entries is left out.  Words are grouped into <letter> elements by
        first character, and letters into <chunk> elements: a new chunk is
        started at a letter boundary once more than 200 <ref> elements
        have been written to the current one.  A final <chunks> element
        lists each chunk with the first and last letter it covers.

        The entry list of every word written is sorted in place.
        """
        xref = self.xref
        current = None          # first character of the <letter> now open
        refs_in_chunk = 0       # <ref> elements written to the open chunk
        next_chunk = 0          # number the next <chunk> will be given
        summary = []            # [chunk name, first letter, last letter]
        for word in sorted(xref.keys()):
            if len(xref[word]) > 30:
                continue
            if word[0] != current:
                # Letter boundary: close what is open and decide whether
                # the new letter also starts a new chunk.
                new_chunk = current is None
                if current is not None:
                    output.write("      </letter>\n")
                    if refs_in_chunk > 200:
                        output.write("    </chunk>\n")
                        refs_in_chunk = 0
                        summary.append(["chunk%s" % (next_chunk - 1),
                                        first_letter, current])
                        new_chunk = True
                if new_chunk:
                    output.write("    <chunk name='chunk%s'>\n" % (next_chunk))
                    first_letter = word[0]
                    next_chunk = next_chunk + 1
                current = word[0]
                output.write("      <letter name='%s'>\n" % (current))
            output.write("        <word name='%s'>\n" % (word))
            entries = xref[word]
            entries.sort()
            previous = None
            for entry in entries:
                # The list is sorted, so duplicates are adjacent.
                if previous == entry:
                    continue
                previous = entry
                output.write("          <ref name='%s'/>\n" % (entry))
                refs_in_chunk = refs_in_chunk + 1
            output.write("        </word>\n")
        if current is None:
            # Nothing was written at all.
            return
        output.write("      </letter>\n")
        output.write("    </chunk>\n")
        if refs_in_chunk != 0:
            summary.append(["chunk%s" % (next_chunk - 1), first_letter, current])
        output.write("    <chunks>\n")
        for chunk_name, start, end in summary:
            output.write("      <chunk name='%s' start='%s' end='%s'/>\n" % (
                         chunk_name, start, end))
        output.write("    </chunks>\n")
2486 2487

    def serialize_xrefs(self, output):
        """Write all cross-reference sections, each wrapped in its own
        element, in a fixed order: references, alpha, constructors,
        functions, files and index.
        """
        sections = (
            ("references", self.serialize_xrefs_references),
            ("alpha", self.serialize_xrefs_alpha),
            ("constructors", self.serialize_xrefs_constructors),
            ("functions", self.serialize_xrefs_functions),
            ("files", self.serialize_xrefs_files),
            ("index", self.serialize_xrefs_index),
        )
        for tag, write_section in sections:
            output.write("  <%s>\n" % (tag))
            write_section(output)
            output.write("  </%s>\n" % (tag))
2506 2507

    def serialize(self):
        """Write the <name>-api.xml and <name>-refs.xml files under self.path.

        The API description lists the exports of every header, then all
        macros, enums, typedefs, variables and functions, each group in
        sorted order.  If self.errors is greater than zero once that file
        has been written, a summary is printed to stderr and the process
        exits with status 3 before the cross-reference file is produced.

        Both files are written inside `with` blocks so that they are closed
        even when one of the serializers raises.
        """
        filename = "%s/%s-api.xml" % (self.path, self.name)
        if not quiet:
            print("Saving XML description %s" % (filename))
        # NOTE(review): the XML declaration says ISO-8859-1 while the file
        # is opened with the platform default encoding - confirm that only
        # ASCII text is ever written.
        with open(filename, "w") as output:
            output.write('<?xml version="1.0" encoding="ISO-8859-1"?>\n')
            output.write("<api name='%s'>\n" % self.name)
            output.write("  <files>\n")
            for file in sorted(self.headers.keys()):
                self.serialize_exports(output, file)
            output.write("  </files>\n")
            output.write("  <symbols>\n")
            for macro in sorted(self.idx.macros.keys()):
                self.serialize_macro(output, macro)
            for enum in sorted(self.idx.enums.keys()):
                self.serialize_enum(output, enum)
            for typedef in sorted(self.idx.typedefs.keys()):
                self.serialize_typedef(output, typedef)
            for variable in sorted(self.idx.variables.keys()):
                self.serialize_variable(output, variable)
            for function in sorted(self.idx.functions.keys()):
                self.serialize_function(output, function)
            output.write("  </symbols>\n")
            output.write("</api>\n")

        if self.errors > 0:
            print("apibuild.py: %d error(s) encountered during generation" % self.errors, file=sys.stderr)
            sys.exit(3)

        filename = "%s/%s-refs.xml" % (self.path, self.name)
        if not quiet:
            print("Saving XML Cross References %s" % (filename))
        with open(filename, "w") as output:
            output.write('<?xml version="1.0" encoding="ISO-8859-1"?>\n')
            output.write("<apirefs name='%s'>\n" % self.name)
            self.serialize_xrefs(output)
            output.write("</apirefs>\n")


A
Andrea Bolognani 已提交
2554 2555 2556 2557
class app:
    """Driver used when the file is run as a script: rebuilds the XML API
    description of a module, or runs the C parser on a single file.
    """

    def warning(self, msg):
        """Print `msg` and increment the module-level warning counter."""
        global warnings
        warnings += 1
        print(msg)

    def rebuild(self, name):
        """Regenerate the XML API description of the module `name`.

        The source and build directories are read from the `srcdir` and
        `builddir` environment variables.  The sources are looked for
        relative to srcdir first, then relative to the current directory.

        Returns the docBuilder that was run, or None (after a warning)
        when `name` is not a known module or the sources cannot be found.
        """
        known_modules = ("libvirt", "libvirt-qemu", "libvirt-lxc", "libvirt-admin")
        if name not in known_modules:
            self.warning("rebuild() failed, unknown module %s" % name)
            return None

        srcdir = os.path.abspath(os.environ["srcdir"])
        builddir = os.path.abspath(os.environ["builddir"])
        if srcdir == builddir:
            builddir = None

        if glob.glob(srcdir + "/../src/libvirt.c"):
            dirs = [srcdir + "/../src",
                    srcdir + "/../src/util",
                    srcdir + "/../include/libvirt"]
            # With a separate build tree, libvirt-common.h may only exist
            # there, so scan the build tree's headers as well.
            common_header = srcdir + "/../include/libvirt/libvirt-common.h"
            if builddir and not os.path.exists(common_header):
                dirs.append(builddir + "/../include/libvirt")
        elif glob.glob("src/libvirt.c"):
            dirs = ["src", "src/util", "include/libvirt"]
        else:
            self.warning("rebuild() failed, unable to guess the module")
            return None

        if not quiet:
            print("Rebuilding API description for %s" % name)
        builder = docBuilder(name, srcdir, dirs, [])
        builder.scan()
        builder.analyze()
        builder.serialize()
        return builder

    #
    # for debugging the parser
    #
    def parse(self, filename):
        """Run CParser on `filename` and return the result of its parse()."""
        return CParser(filename).parse()
2600 2601 2602


if __name__ == "__main__":
    app = app()
    if len(sys.argv) > 1:
        # A file name was given: only run the parser on it, with
        # debugging switched on.
        debug = 1
        app.parse(sys.argv[1])
    else:
        for modname in ("libvirt", "libvirt-qemu", "libvirt-lxc", "libvirt-admin"):
            app.rebuild(modname)
    # Exit status 2 tells the caller that warnings were reported.
    sys.exit(2 if warnings > 0 else 0)