1 | #!/usr/bin/env python2
|
2 | """src_tree.py: Publish a directory tree as HTML.
|
3 |
|
4 | TODO:
|
5 |
|
6 | - dir listing:
|
7 | - should have columns
|
8 | - or add line counts, and file counts?
|
9 | - render README.md - would be nice
|
10 |
|
11 | - Could use JSON Template {.template} like test/wild_report.py
|
12 | - for consistent header and all that
|
13 |
|
14 | AUTO
|
15 |
|
16 | - overview.html and for-translation.html should link to these files, not Github
|
17 | """
|
18 | from __future__ import print_function
|
19 |
|
20 | import json
|
21 | import os
|
22 | import shutil
|
23 | import sys
|
24 |
|
25 | from doctools.util import log
|
26 | from doctools import html_head
|
27 | from test import wild_report
|
28 | from vendor import jsontemplate
|
29 |
|
30 | T = jsontemplate.Template
|
31 |
|
32 |
|
33 | def DetectType(path):
|
34 |
|
35 | # Most support moved to src-tree.sh and micro-syntax
|
36 |
|
37 | if path.endswith('.test.sh'):
|
38 | return 'spec'
|
39 |
|
40 | else:
|
41 | return 'other'
|
42 |
|
43 |
|
44 | def Breadcrumb(rel_path, out_f, is_file=False):
|
45 | offset = -1 if is_file else 0
|
46 | data = wild_report.MakeNav(rel_path, root_name='OILS', offset=offset)
|
47 | out_f.write(wild_report.NAV_TEMPLATE.expand({'nav': data}))
|
48 |
|
49 |
|
50 | # CSS class .line has white-space: pre
|
51 |
|
52 | # To avoid copy-paste problem, you could try the <div> solutions like this:
|
53 | # https://gitlab.com/gitlab-examples/python-getting-started/-/blob/master/manage.py?ref_type=heads
|
54 |
|
55 | # Note: we are compressing some stuff
|
56 |
|
57 | ROW_T = T("""\
|
58 | <tr>
|
59 | <td class=num>{line_num}</td>
|
60 | <td id=L{line_num}>
|
61 | <span class="line {.section line_class}{@}{.end}">{line}</span>
|
62 | </td>
|
63 | </tr>
|
64 | """,
|
65 | default_formatter='html')
|
66 |
|
67 | LISTING_T = T("""\
|
68 | {.section dirs}
|
69 | <h1>Dirs</h1>
|
70 | <div id="dirs" class="listing">
|
71 | {.repeated section @}
|
72 | <a href="{name|htmltag}/index.html">{name|html}/</a> <br/>
|
73 | {.end}
|
74 | </div>
|
75 | {.end}
|
76 |
|
77 | {.section files}
|
78 | <h1>Files</h1>
|
79 | <div id="files" class="listing">
|
80 | {.repeated section @}
|
81 | <a href="{url|htmltag}">{anchor|html}</a> <br/>
|
82 | {.end}
|
83 | </div>
|
84 | {.end}
|
85 |
|
86 | </body>
|
87 | """)
|
88 |
|
89 | FILE_COUNTS_T = T("""\
|
90 | <div id="file-counts"> {num_lines} lines, {num_sig_lines} significant </div>
|
91 | """,
|
92 | default_formatter='html')
|
93 |
|
94 |
|
95 | def SpecFiles(pairs, attrs_f):
|
96 |
|
97 | for i, (path, html_out) in enumerate(pairs):
|
98 | #log(path)
|
99 |
|
100 | try:
|
101 | os.makedirs(os.path.dirname(html_out))
|
102 | except OSError:
|
103 | pass
|
104 |
|
105 | with open(path) as in_f, open(html_out, 'w') as out_f:
|
106 | title = path
|
107 |
|
108 | # How deep are we?
|
109 | n = path.count('/') + 2
|
110 | base_dir = '/'.join(['..'] * n)
|
111 |
|
112 | #css_urls = ['%s/web/base.css' % base_dir, '%s/web/src-tree.css' % base_dir]
|
113 | css_urls = ['%s/web/src-tree.css' % base_dir]
|
114 |
|
115 | html_head.Write(out_f, title, css_urls=css_urls)
|
116 |
|
117 | out_f.write('''
|
118 | <body class="">
|
119 | <div id="home-link">
|
120 | <a href="https://github.com/oilshell/oil/blob/master/%s">View on Github</a>
|
121 | |
|
122 | <a href="/">oils.pub</a>
|
123 | </div>
|
124 | <table>
|
125 | ''' % path)
|
126 |
|
127 | file_type = DetectType(path)
|
128 |
|
129 | line_num = 1 # 1-based
|
130 | for line in in_f:
|
131 | if line.endswith('\n'):
|
132 | line = line[:-1]
|
133 |
|
134 | # Write line numbers
|
135 | row = {'line_num': line_num, 'line': line}
|
136 |
|
137 | s = line.lstrip()
|
138 |
|
139 | if file_type == 'spec':
|
140 | if s.startswith('####'):
|
141 | row['line_class'] = 'spec-comment'
|
142 | elif s.startswith('#'):
|
143 | row['line_class'] = 'comm'
|
144 |
|
145 | out_f.write(ROW_T.expand(row))
|
146 |
|
147 | line_num += 1
|
148 |
|
149 | # could be parsed by 'dirs'
|
150 | print('%s lines=%d' % (path, line_num), file=attrs_f)
|
151 |
|
152 | out_f.write('''
|
153 | </table>
|
154 | </body>
|
155 | </html>''')
|
156 |
|
157 | return i + 1
|
158 |
|
159 |
|
160 | def ReadFragments(in_f):
|
161 | while True:
|
162 | path = ReadNetString(in_f)
|
163 | if path is None:
|
164 | break
|
165 |
|
166 | html_frag = ReadNetString(in_f)
|
167 | if html_frag is None:
|
168 | raise RuntimeError('Expected 2nd record (HTML fragment)')
|
169 |
|
170 | s = ReadNetString(in_f)
|
171 | if s is None:
|
172 | raise RuntimeError('Expected 3rd record (file summary)')
|
173 |
|
174 | summary = json.loads(s)
|
175 |
|
176 | yield path, html_frag, summary
|
177 |
|
178 |
|
179 | def WriteHtmlFragments(in_f, out_dir, attrs_f=sys.stdout):
|
180 |
|
181 | i = 0
|
182 | for rel_path, html_frag, summary in ReadFragments(in_f):
|
183 | html_size = len(html_frag)
|
184 | if html_size > 300000:
|
185 | out_path = os.path.join(out_dir, rel_path)
|
186 | try:
|
187 | os.makedirs(os.path.dirname(out_path))
|
188 | except OSError:
|
189 | pass
|
190 |
|
191 | shutil.copyfile(rel_path, out_path)
|
192 |
|
193 | # Attrs are parsed by MakeTree(), and then used by WriteDirsHtml().
|
194 | # So we can print the right link.
|
195 | print('%s raw=1' % rel_path, file=attrs_f)
|
196 |
|
197 | file_size = os.path.getsize(rel_path)
|
198 | log('Big HTML fragment of %.1f KB', float(html_size) / 1000)
|
199 | log('Copied %s -> %s, %.1f KB', rel_path, out_path,
|
200 | float(file_size) / 1000)
|
201 |
|
202 | continue
|
203 |
|
204 | html_out = os.path.join(out_dir, rel_path + '.html')
|
205 |
|
206 | try:
|
207 | os.makedirs(os.path.dirname(html_out))
|
208 | except OSError:
|
209 | pass
|
210 |
|
211 | with open(html_out, 'w') as out_f:
|
212 | title = rel_path
|
213 |
|
214 | # How deep are we?
|
215 | n = rel_path.count('/') + 2
|
216 | base_dir = '/'.join(['..'] * n)
|
217 |
|
218 | #css_urls = ['%s/web/base.css' % base_dir, '%s/web/src-tree.css' % base_dir]
|
219 | css_urls = ['%s/web/src-tree.css' % base_dir]
|
220 | html_head.Write(out_f, title, css_urls=css_urls)
|
221 |
|
222 | out_f.write('''
|
223 | <body class="">
|
224 | <p>
|
225 | ''')
|
226 | Breadcrumb(rel_path, out_f, is_file=True)
|
227 |
|
228 | out_f.write('''
|
229 | <span id="home-link">
|
230 | <a href="https://github.com/oilshell/oil/blob/master/%s">View on Github</a>
|
231 | |
|
232 | <a href="/">oils.pub</a>
|
233 | </span>
|
234 | </p>
|
235 | ''' % rel_path)
|
236 |
|
237 | out_f.write(FILE_COUNTS_T.expand(summary))
|
238 |
|
239 | out_f.write('<table>')
|
240 | out_f.write(html_frag)
|
241 |
|
242 | print('%s lines=%d' % (rel_path, summary['num_lines']),
|
243 | file=attrs_f)
|
244 |
|
245 | out_f.write('''
|
246 | </table>
|
247 | </body>
|
248 | </html>''')
|
249 |
|
250 | i += 1
|
251 |
|
252 | log('Wrote %d HTML fragments', i)
|
253 |
|
254 |
|
255 | class DirNode:
|
256 | """Entry in the file system tree.
|
257 |
|
258 | Similar to test/wild_report.py
|
259 | """
|
260 |
|
261 | def __init__(self):
|
262 | self.files = {} # filename -> attrs dict
|
263 | self.dirs = {} # subdir name -> DirNode object
|
264 |
|
265 | # Can accumulate total lines here
|
266 | self.subtree_stats = {} # name -> value
|
267 |
|
268 |
|
269 | def DebugPrint(node, indent=0):
|
270 | """Pretty-print our tree data structure."""
|
271 | ind = indent * ' '
|
272 | #print('FILES', node.files.keys())
|
273 | for name in node.files:
|
274 | print('%s%s - %s' % (ind, name, node.files[name]))
|
275 |
|
276 | for name, child in node.dirs.iteritems():
|
277 | print('%s%s/ - %s' % (ind, name, child.subtree_stats))
|
278 | DebugPrint(child, indent=indent + 1)
|
279 |
|
280 |
|
281 | def UpdateNodes(node, path_parts, attrs):
|
282 | """Similar to test/wild_report.py."""
|
283 |
|
284 | first = path_parts[0]
|
285 | rest = path_parts[1:]
|
286 |
|
287 | if rest: # update an intermediate node
|
288 | if first in node.dirs:
|
289 | child = node.dirs[first]
|
290 | else:
|
291 | child = DirNode()
|
292 | node.dirs[first] = child
|
293 |
|
294 | UpdateNodes(child, rest, attrs)
|
295 | # TODO: Update subtree_stats
|
296 |
|
297 | else:
|
298 | # leaf node
|
299 | node.files[first] = attrs
|
300 |
|
301 |
|
302 | def MakeTree(stdin, root_node):
|
303 | """Reads a stream of lines Each line contains a path and key=value attrs.
|
304 |
|
305 | - Doesn't handle filenames with spaces
|
306 | - Doesn't handle empty dirs that are leaves (since only files are first
|
307 | class)
|
308 | """
|
309 | for line in sys.stdin:
|
310 | parts = line.split()
|
311 | path = parts[0]
|
312 |
|
313 | # Examples:
|
314 | # {'lines': '345'}
|
315 | # {'raw': '1'}
|
316 | attrs = {}
|
317 | for part in parts[1:]:
|
318 | k, v = part.split('=')
|
319 | attrs[k] = v
|
320 |
|
321 | path_parts = path.split('/')
|
322 | UpdateNodes(root_node, path_parts, attrs)
|
323 |
|
324 |
|
325 | def WriteDirsHtml(node, out_dir, rel_path='', base_url=''):
|
326 | #log('WriteDirectory %s %s %s', out_dir, rel_path, base_url)
|
327 |
|
328 | files = []
|
329 | for name in sorted(node.files):
|
330 | attrs = node.files[name]
|
331 |
|
332 | # Big files are raw, e.g. match.re2c.h and syntax_asdl.py
|
333 | url = name if attrs.get('raw') else '%s.html' % name
|
334 | f = {'url': url, 'anchor': name}
|
335 | files.append(f)
|
336 |
|
337 | dirs = []
|
338 | for name in sorted(node.dirs):
|
339 | dirs.append({'name': name})
|
340 |
|
341 | data = {'files': files, 'dirs': dirs}
|
342 | body = LISTING_T.expand(data)
|
343 |
|
344 | path = os.path.join(out_dir, 'index.html')
|
345 | with open(path, 'w') as f:
|
346 |
|
347 | title = '%s - Listing' % rel_path
|
348 | prefix = '%s../..' % base_url
|
349 | css_urls = ['%s/web/base.css' % prefix, '%s/web/src-tree.css' % prefix]
|
350 | html_head.Write(f, title, css_urls=css_urls)
|
351 |
|
352 | f.write('''
|
353 | <body>
|
354 | <p>
|
355 | ''')
|
356 | Breadcrumb(rel_path, f)
|
357 |
|
358 | f.write('''
|
359 | <span id="home-link">
|
360 | <a href="/">oils.pub</a>
|
361 | </span>
|
362 | </p>
|
363 | ''')
|
364 |
|
365 | f.write(body)
|
366 |
|
367 | f.write('</html>')
|
368 |
|
369 | # Recursive
|
370 | for name, child in node.dirs.iteritems():
|
371 | child_out = os.path.join(out_dir, name)
|
372 | child_rel = os.path.join(rel_path, name)
|
373 | child_base = base_url + '../'
|
374 | WriteDirsHtml(child,
|
375 | child_out,
|
376 | rel_path=child_rel,
|
377 | base_url=child_base)
|
378 |
|
379 |
|
380 | def ReadNetString(in_f):
|
381 |
|
382 | digits = []
|
383 | for i in xrange(10): # up to 10 digits
|
384 | c = in_f.read(1)
|
385 | if c == '':
|
386 | return None # EOF
|
387 |
|
388 | if c == ':':
|
389 | break
|
390 |
|
391 | if not c.isdigit():
|
392 | raise RuntimeError('Bad byte %r' % c)
|
393 |
|
394 | digits.append(c)
|
395 |
|
396 | if c != ':':
|
397 | raise RuntimeError('Expected colon, got %r' % c)
|
398 |
|
399 | n = int(''.join(digits))
|
400 |
|
401 | s = in_f.read(n)
|
402 | if len(s) != n:
|
403 | raise RuntimeError('Expected %d bytes, got %d' % (n, len(s)))
|
404 |
|
405 | c = in_f.read(1)
|
406 | if c != ',':
|
407 | raise RuntimeError('Expected comma, got %r' % c)
|
408 |
|
409 | return s
|
410 |
|
411 |
|
412 | def main(argv):
|
413 | action = argv[1]
|
414 |
|
415 | if action == 'spec-files':
|
416 | # Policy for _tmp/spec/osh-minimal/foo.test.html
|
417 | # This just changes the HTML names?
|
418 |
|
419 | out_dir = argv[2]
|
420 | spec_names = argv[3:]
|
421 |
|
422 | pairs = []
|
423 | for name in spec_names:
|
424 | src = 'spec/%s.test.sh' % name
|
425 | html_out = os.path.join(out_dir, '%s.test.html' % name)
|
426 | pairs.append((src, html_out))
|
427 |
|
428 | attrs_f = sys.stdout
|
429 | n = SpecFiles(pairs, attrs_f)
|
430 | log('%s: Wrote %d HTML files -> %s', os.path.basename(sys.argv[0]), n,
|
431 | out_dir)
|
432 |
|
433 | elif action == 'smoosh-file':
|
434 | # TODO: Should fold this generated code into the source tree, and run in CI
|
435 |
|
436 | in_path = argv[2]
|
437 | out_path = argv[3]
|
438 | pairs = [(in_path, out_path)]
|
439 |
|
440 | attrs_f = sys.stdout
|
441 | n = SpecFiles(pairs, attrs_f)
|
442 | log('%s: %s -> %s', os.path.basename(sys.argv[0]), in_path, out_path)
|
443 |
|
444 | elif action == 'write-html-fragments':
|
445 |
|
446 | out_dir = argv[2]
|
447 | WriteHtmlFragments(sys.stdin, out_dir)
|
448 |
|
449 | elif action == 'dirs':
|
450 | # stdin: a bunch of merged ATTRs file?
|
451 |
|
452 | # We load them, and write a whole tree?
|
453 | out_dir = argv[2]
|
454 |
|
455 | # I think we make a big data structure here
|
456 |
|
457 | root_node = DirNode()
|
458 | MakeTree(sys.stdin, root_node)
|
459 |
|
460 | if 0:
|
461 | DebugPrint(root_node)
|
462 |
|
463 | WriteDirsHtml(root_node, out_dir)
|
464 |
|
465 | else:
|
466 | raise RuntimeError('Invalid action %r' % action)
|
467 |
|
468 |
|
469 | if __name__ == '__main__':
|
470 | main(sys.argv)
|