OILS / doctools / html_lib.py View on Github | oils.pub

48 lines, 18 significant
1#!/usr/bin/env python2
2"""html_lib.py.
3
4Shared between HTML processors.
5
6TODO: Write a "pull parser" API!
7"""
8from __future__ import print_function
9
10import cgi
11import re
12
13
14def AttrsToString(attrs):
15 if not attrs:
16 return ''
17
18 # Important: there's a leading space here.
19 # TODO: Change href="$help:command" to href="help.html#command"
20 return ''.join(' %s="%s"' % (k, cgi.escape(v)) for (k, v) in attrs)
21
22
23def PrettyHref(s, preserve_anchor_case=False):
24 """Turn arbitrary heading text into href with no special characters.
25
26 This is modeled after what github does. It makes everything lower case.
27 """
28 # Split by whitespace or hyphen
29 words = re.split(r'[\s\-]+', s)
30
31 if preserve_anchor_case:
32 # doc/ref: Keep only alphanumeric and /, for List/append, cmd/append
33 # Note that "preserve_anchor_case" could be renamed
34 keep_re = r'[\w/]+'
35 else:
36 # Keep only alphanumeric
37 keep_re = r'\w+'
38
39 keep = [''.join(re.findall(keep_re, w)) for w in words]
40
41 # Join with - and lowercase. And then remove empty words, unlike Github.
42 # This is SIMILAR to what Github does, but there's no need to be 100%
43 # compatible.
44
45 pretty = '-'.join(p for p in keep if p)
46 if not preserve_anchor_case:
47 pretty = pretty.lower()
48 return pretty