summaryrefslogtreecommitdiff
path: root/cad/src/tools/packageData_checker.py
blob: 42af2c5af8519d18169ec17e76216583be2c376e (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
#!/usr/bin/env python
# Copyright 2007-2008 Nanorex, Inc.  See LICENSE file for details. 
"""
packageData_checker.py - script for checking and reporting on packageData.py

Note: some of this code might be moved into packageData
if all users of that data should use this code to canonicalize it
before making other use of it (eg for import graphing).

@author: Bruce
@version: $Id$
@copyright: 2007-2008 Nanorex, Inc.  See LICENSE file for details.
"""

import sys
import os

# When true, print_listings also lists each .py file named on the command line
# which has no entry in packageMapping_for_files (as " NOT YET CLASSIFIED: ").
LIST_UNCLASSIFIED_FILES = True


#bruce 080107 temporary debug prints to find out why SEMBot run of this seems to do nothing
# print >> sys.stderr, "packageData_checker.py debug: starting import"

from packageData import packageMapping, layer_aliases, topic_mapping
from packageData import packageMapping_for_files
from packageData import packageMapping_for_packages

from packageData import needs_renaming_for_clarity
from packageData import needs_refactoring # use this someday?
from packageData import listing_order # use this? (it's not yet well ordered as of 080104)
from packageData import subdir_notes
 

# utils for looking at output of AllPyFiles, not yet used within this file

def source_path_parts(path):
    """
    Split a '/'-separated path which starts with './' into its components,
    leaving out the leading '.'.

    @param path: a string such as "./subdir/module.py"
    @return: list of the pathname components after the leading '.'
    """
    components = path.split('/')
    first, rest = components[0], components[1:]
    assert first == '.'
    return rest

def topmodule(pathparts):
    """
    Return the module name for a path which consists of a single
    "name.py" component, or None if the path has any other number
    of components.

    @param pathparts: list of pathname components (e.g. from source_path_parts)
    """
    if len(pathparts) != 1:
        return None
    filename = pathparts[0]
    extension = '.py'
    assert filename.endswith(extension)
    return filename[:-len(extension)]

#e should add routine to look for toplevel files not present in packageMapping

# ==

# flags for packageClassification
# (it treats any value other than LAYER_ONLY or TOPIC_ONLY as LAYER_AND_TOPIC)
LAYER_ONLY = 'LAYER_ONLY' # return only the canonicalized layer
TOPIC_ONLY = 'TOPIC_ONLY' # return only the canonicalized topic
LAYER_AND_TOPIC = 'LAYER_AND_TOPIC' # return "layer|topic", or just layer if they are equal

def packageClassification(value, flags):
    """
    Split a packageMapping value into its layer and topic, canonicalize both,
    and return the part(s) selected by flags.

    @param value: a string value from the packageMapping global variable,
                  e.g. "ui/propmgr|commands/BuildSomething" or "widget" or ...
                  which has a layer and an optional |topic
                  both of which might be word or word/word etc

    @param flags: LAYER_ONLY or TOPIC_ONLY; anything else is treated
                  as LAYER_AND_TOPIC

    @return: the canonical layer, the canonical topic, or "layer|topic"
             (just the layer, if layer and topic are equal)
    """
    pieces = value.split('|')
    assert len(pieces) in (1,2)
    layer = canonicalize(pieces[0], layer_aliases)
    if len(pieces) == 2:
        raw_topic = pieces[1]
    else:
        # no explicit topic: default to the (already canonicalized) layer
        raw_topic = layer # or, "dflt_" + layer??
    topic = canonicalize(raw_topic, topic_mapping)
    if flags == LAYER_ONLY:
        return layer
    if flags == TOPIC_ONLY:
        return topic
    # LAYER_AND_TOPIC
    if layer == topic:
        return layer
    return layer + "|" + topic

def canonicalize(value, dict1):
    """
    Canonicalize value by repeatedly doing value = dict1[value],
    but if this enters a cycle, report error and return original value.

    @param value: the value to canonicalize (used as a key of dict1)
    @param dict1: dict mapping a value to its replacement
    @return: the first value reached which is not a key of dict1,
             or the original value if a cycle was found
             (in which case an error is also written to sys.stderr)
    """
    orig_value = value
    # a list rather than a set, since the error message shows the chain in order
    prior_values = [value]
    while value in dict1:
        value = dict1[value]
        if value in prior_values:
            # sys.stderr.write emits the same text as "print >> sys.stderr"
            # and does not depend on print being a statement
            sys.stderr.write("error: canonicalize loop: %r\n" % (prior_values + [value],))
            return orig_value
        prior_values.append(value)
    return value

def check_basename(basename):
    """
    Validate a basename taken from the package data and return a cleaned-up
    version of it.

    A basename containing a space is reported on sys.stderr and then fails
    an assertion. A trailing ".py" or "/" is reported on sys.stderr and
    stripped (each suffix is checked once, in that order).

    @param basename: the name to check (a string)
    @return: basename without the disallowed suffix, if it had one
    """
    cleaned = basename
    if ' ' in cleaned:
        print >> sys.stderr, "error: basename should not contain %r: %r" % (' ', cleaned,)
        assert 0 # can't handle this error
    for bad_suffix in (".py", "/"):
        if not cleaned.endswith( bad_suffix):
            continue
        print >> sys.stderr, "error: basename should not end with %r: %r" % (bad_suffix, cleaned,)
        cleaned = cleaned[:-len(bad_suffix)]
        print >> sys.stderr, " (using %r instead)" % cleaned
    return cleaned
        
def summarize_packageMapping( flags):

    counts = {}
    
    for basename, value in packageMapping.items():
        basename = check_basename(basename)
        classification = packageClassification(value, flags)
        countnow = counts.setdefault(classification, 0)
        countnow += 1
        counts[classification] = countnow

    items = counts.items()
    items.sort() # by classification

    print
    print "classication: count (for %s)" % (flags,)
    print
    for classification, count in items:
        print "%s: %d" % (classification, count)
    return

def summarize_packageMapping_using_default_flags():
    """
    Print the packageMapping summary using the default flags
    (currently TOPIC_ONLY).
    """
    default_flags = TOPIC_ONLY ## or LAYER_ONLY
    summarize_packageMapping( default_flags)

# ==

# ftype values (see collect_virtual_listing)
T_MODULE = "module" # item is listed as "<basename>.py"
T_PACKAGE = "package" # item is a preexisting package, listed as an "inlined contents" note
T_SUBDIR_NOTE = "subdir note" # not referenced by the rest of the code visible in this file

# sortorder values
# (stored as the first element of each value in a _VirtualSubdir;
#  print_listing sorts a directory's items by this, then by lowercased name)
ORDER_ERROR = -2 # item whose ftype was not recognized
ORDER_SUBDIR_NOTE = -1 # note from subdir_notes
ORDER_INLINE_NOTE = 0 # "inlined contents" note for a T_PACKAGE item
ORDER_MODULE = 1 # T_MODULE item
ORDER_NEW_SUBPACKAGE = 2 # child _VirtualSubdir (the only kind whose explan is an object, not a string)

class _VirtualSubdir(type({})):
    
    def __init__(self, basename):
        self.__basename = basename
        super(_VirtualSubdir, self).__init__()
        
    def print_listing(self, indent = "", skip_toplevel_indent = False):
        if not skip_toplevel_indent:
            print indent + self.__basename + "/" + "   (%d)" % len(self)
            subindent = indent + "    "
        else:
            print indent + self.__basename + "/" + "   (%d)" % len(self) + " contains:"
            print
            subindent = indent
        items = [(sortorder, basename.lower(), basename, explan) for (basename, (sortorder, explan)) in self.items()]
        items.sort()
        last_sortorder = None
        for sortorder, basename_tolower, basename, explan in items:
            ## if last_sortorder is not None and ...
            if (sortorder != last_sortorder or sortorder == ORDER_NEW_SUBPACKAGE):
                print subindent # blank line before subdirs or between types of item
            last_sortorder = sortorder
            if type(explan) == type(""):
                print_with_word_wrapping(subindent, explan, 80)
            else:
                child = explan
                # assert isinstance(child, _VirtualSubdir)
                child.print_listing(subindent)
    pass

def print_with_word_wrapping(indent, line, limit):
    """
    Print the words of line to sys.stdout, each output line starting with
    indent, starting a new output line whenever adding the next word
    (and a separating space) would make the current one longer than limit.

    A word which is too long to fit even by itself is printed alone on
    its own (overlong) line. Nothing is printed if line contains no words.

    @param indent: string to start each output line with
    @param line: the text to print; split into words at whitespace
    @param limit: maximum desired length of an output line, including indent
    """
    # sys.stdout.write emits the same text as the print statement
    # and does not depend on print being a statement
    sofar = indent # the output line being built; indent alone means no words yet
    for word in line.split():
        if sofar == indent:
            # the first word of an output line always goes onto it, even if it
            # is too long; otherwise an indent-only line would be printed first
            sofar = indent + word
            continue
        trial = sofar + ' ' + word
        if len(trial) > limit:
            # word won't fit, print prior line and use word to start next line
            sys.stdout.write(sofar + "\n")
            sofar = indent + word
        else:
            sofar = trial
    if sofar != indent:
        sys.stdout.write(sofar + "\n")
    return

# root of the tree of virtual subdirs; get_virtual_subdir adds subdirs under it
# and print_listings prints it
_toplevel_virtual_subdir = _VirtualSubdir("cad/src")

def get_virtual_subdir(parts, assert_already_there = False): # should be a method in _toplevel_virtual_subdir
    """
    Return the _VirtualSubdir found by following parts downward from
    _toplevel_virtual_subdir, creating it (and any missing parent subdirs)
    unless assert_already_there is true.

    @param parts: list of 1 or more pathname components

    @param assert_already_there: if true, fail an assertion instead of
           creating a subdir, if any component of parts is missing.
           (Nothing is added to the tree in that case.)

    @return: the _VirtualSubdir for the last component of parts

    @raise IndexError: if parts is empty
    @raise AssertionError: if an existing item with one of the given names
           is not a subdir, or if a subdir is missing and
           assert_already_there is true
    """
    if not parts:
        raise IndexError("parts must contain at least one pathname component")
    current = _toplevel_virtual_subdir
    for basename in parts:
        if basename in current:
            sortorder, child = current[basename]
            assert sortorder == ORDER_NEW_SUBPACKAGE
            assert isinstance(child, _VirtualSubdir)
        else:
            # checked before creating anything at this level, so a failed
            # lookup doesn't leave newly created parent subdirs behind
            assert not assert_already_there, "missing subdir: %r" % (parts,)
            child = _VirtualSubdir(basename)
            # for a subdir the explan is the child object itself;
            # for other sortorders it's a string
            current[basename] = (ORDER_NEW_SUBPACKAGE, child)
        current = child
    return current

def collect_virtual_listing( packageDict, ftype ):
    """
    Add an item for each entry of packageDict to the virtual subdir named
    by that entry's topic (creating virtual subdirs as needed).

    @param packageDict: packageMapping_for_files or packageMapping_for_packages
    @param ftype: T_MODULE or T_PACKAGE
                  (any other value is reported on sys.stderr, and the
                   error text is used as the item's listing text)
    """
    for raw_basename, value in packageDict.items():
        basename = check_basename(raw_basename)
        topic = packageClassification(value, TOPIC_ONLY)
        # also adds items for subdir into its parent dirs
        dir1 = get_virtual_subdir(topic.split('/'))
        if ftype == T_PACKAGE: # preexisting package
            # someday: add number of files in there, or even list the first 5 files as children
            sortorder = ORDER_INLINE_NOTE
            explan = " [ inlined contents of %s/ ]" % basename
        elif ftype == T_MODULE:
            sortorder = ORDER_MODULE
            explan = "%s.py" % basename
            if basename in needs_renaming_for_clarity:
                explan += " (rename to %s)" % needs_renaming_for_clarity[basename]
        else:
            sortorder = ORDER_ERROR
            explan = " [ error: unrecognized ftype %r, basename = %r]" % (ftype, basename)
            print >>sys.stderr, explan
        assert basename not in dir1, "duplicate basename: %r" % (basename,)
        dir1[basename] = (sortorder, explan)

def print_listings():
    """
    """
    
    global packageMapping_for_files

    if LIST_UNCLASSIFIED_FILES: #bruce 080223; usage: pass cad/src/*.py == ../*.py as arguments
        packageMapping_for_files = dict(packageMapping_for_files)
        for pyfile in sys.argv[1:]:
            if pyfile.endswith('.py'):
                basename_ext = os.path.basename(pyfile)
                basename, ext = os.path.splitext(basename_ext)
                if not packageMapping_for_files.has_key(basename):
                    packageMapping_for_files[basename] = " NOT YET CLASSIFIED: "
                    # print "missing file:", basename
            else:
                print "unrecognized argument: %r" % (pyfile,)
            continue
    
    collect_virtual_listing( packageMapping_for_files, T_MODULE)
    collect_virtual_listing( packageMapping_for_packages, T_PACKAGE)

    for subdirname, note in subdir_notes.items():
        parts = subdirname.split('/')
        dir1 = get_virtual_subdir(parts, assert_already_there = True)
        FAKENAME_NOTE = " FAKENAME_NOTE " # not a valid basename, but a string (since .lower() gets called on it)
        sort_order = ORDER_SUBDIR_NOTE
        dir1[FAKENAME_NOTE] = (sort_order, note)
        
    _toplevel_virtual_subdir.print_listing(skip_toplevel_indent = True)
    return

# print >> sys.stderr, "packageData_checker.py debug: done with most of import"

# When run as a script: print the listing of virtual subdirs, then an end marker.
# (Command-line arguments are read by print_listings, from sys.argv.)
if __name__ == '__main__':
    # print >> sys.stderr, "packageData_checker.py debug: starting __main__ section"
    ## summarize_packageMapping_using_default_flags()
    print_listings()
    print
    print "[end]"
    # print >> sys.stderr, "packageData_checker.py debug: ending __main__ section"

# print >> sys.stderr, "packageData_checker.py debug: done with all of import"

# end