File: find-duplicated-sids.py

package info (click to toggle)
libreoffice 1%3A5.2.7-1%2Bdeb9u11
  • links: PTS, VCS
  • area: main
  • in suites: stretch
  • size: 2,603,628 kB
  • sloc: cpp: 4,054,182; java: 289,998; xml: 272,393; ansic: 48,279; python: 37,075; perl: 33,686; yacc: 12,078; sh: 9,840; makefile: 8,917; cs: 6,600; objc: 2,388; lex: 2,178; asm: 1,348; awk: 882; pascal: 876; php: 79; csh: 20; sed: 5
file content (92 lines) | stat: -rwxr-xr-x 3,328 bytes parent folder | download | duplicates (6)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
#!/usr/bin/python


# Scan .hrc files for conflicting SID constants
#
# This is not as easy as it sounds because some of the constants depend on other constants whose names do not start with SID_
#

import subprocess
import sys

sidNameToValue = dict()
sidNameToOriginalLine = dict()


def extractSidValue(sidValue):
    if isinstance(sidValue, int):
        return sidValue
    if sidValue.isdigit():
        return int(sidValue)
    if sidValue[0:2] == "0x":
        return int(sidValue, 16)
    if sidValue.find("+") != -1:
        tokens = sidValue.split("+")
        tokens1 = tokens[0].strip()
        tokens2 = tokens[1].strip()
        return extractSidValue(tokens1) + extractSidValue(tokens2)
    rv = extractSidValue(sidNameToValue[sidValue])
    sidNameToValue[sidValue] = rv
    return rv


#a = subprocess.Popen("git grep -P '#define\s+(SID_|SC_|DETECTIVE_|DRAWTEXTBAR_|DRAW_BAR_|RID_|OBJBAR_FORMAT_|TAB_POPUP_|DATA_MENU_|EXTRA_MENU_|FORMAT_MENU_|INSERT_MENU_|VIEW_MENU_|EDIT_MENU_|FILE_MENU_|SC_FUNCTION_|RC_)'", stdout=subprocess.PIPE, shell=True)
a = subprocess.Popen("git grep -Pn '#define\s+(\S+)' -- *.hrc", stdout=subprocess.PIPE, shell=True)

with a.stdout as txt:
    for line in txt:
        originalLine = line.strip()
        # strip the '#define' off the front
        idx1 = line.find(" ")
        line = line[idx1 : len(line)].strip()
        # extract the name
        idx1 = line.find(" ")
        if (idx1 == -1): continue
        sidName = line[0 : idx1].strip()
        line = line[idx1 : len(line)].strip()
        # strip any trailing comments
        idx1 = line.find("//")
        if (idx1 != -1):
            line = line[0 : idx1].strip()
        idx1 = line.find("/*")
        if (idx1 != -1):
            line = line[0 : idx1].strip()
        if len(line) == 0: continue
        # strip brackets
        if line[0] == "(": line = line[1:]
        if line[len(line)-1] == ")": line = line[0:len(line)-1]
        sidTextValue = line.strip()
        # ignore the #define strings
        if (sidTextValue.find("\"") != -1): continue
        # ignore the multiline macros
        if (sidTextValue.find("\\") != -1): continue
        # check for redefinitions
        if sidName[0:4] == "SID_" and sidNameToValue.has_key(sidName):
            print "Redefinition:\n\t",  sidNameToOriginalLine[sidName], "\n\t" , originalLine
        else:
            sidNameToValue[sidName] = sidTextValue
        sidNameToOriginalLine[sidName] = originalLine

    # decode the constants into their numeric values recursively
    sidNamesToIgnore = set()
    for sidName in sidNameToValue:
        sidTextValue = sidNameToValue[sidName]
        try:
            sidValueNum = extractSidValue(sidTextValue)
            sidNameToValue[sidName] = sidValueNum
        except KeyError:
            sidNamesToIgnore.add(sidName)

    # check for conflicts    
    sidValueToName = dict()
    for sidName in sidNameToValue:
        if sidName in sidNamesToIgnore: continue
        if sidName[0:4] != "SID_": continue
        sidValue = sidNameToValue[sidName]
        if sidValueToName.has_key(sidValue):
            print "conflict:\n\t", sidNameToOriginalLine[sidName], "\n\t", sidNameToOriginalLine[sidValueToName[sidValue]]
        else:
            sidValueToName[sidValue] = sidName