1 | #!/usr/bin/env python2
|
2 | # coding=utf8
|
3 | # Copyright 2016 Andy Chu. All rights reserved.
|
4 | # Licensed under the Apache License, Version 2.0 (the "License");
|
5 | # you may not use this file except in compliance with the License.
|
6 | # You may obtain a copy of the License at
|
7 | #
|
8 | # http://www.apache.org/licenses/LICENSE-2.0
|
9 | from __future__ import print_function
|
10 | """
|
11 | libc_test.py: Tests for libc.py
|
12 | """
|
13 | import unittest
|
14 | import sys
|
15 |
|
16 | import libc # module under test
|
17 |
|
# Guard some tests that fail on Darwin: True when sys.platform is 'darwin'.
# Test tables below use it to drop individual cases on that platform.
IS_DARWIN = sys.platform == 'darwin'
|
20 |
|
class LibcTest(unittest.TestCase):
  """Tests for the functions exposed by the libc module.

  Some methods assert on exact results; others (testGlob, testPrintTime,
  testGethostname, testGetTerminalWidth) only print what libc returns and
  therefore act as smoke tests.
  """

  def testFnmatch(self):
    """Check libc.fnmatch() against a table of (pattern, string, result)."""

    cases = [
        # (pattern, string, result)

        ('', '', 1),  # no pattern is valid
        ('a', 'a', 1),
        ('?', 'a', 1),

        # Test escaping of glob operator chars
        ('\\?', '-', 0),
        ('\\?', '?', 1),

        ('\\*', '-', 0),
        ('\\*', '*', 1),

        ('\\[', '-', 0),
        ('\\[', '[', 1),

        ('\\!', '-', 0),
        ('\\!', '!', 1),

        # What if we also escape extended glob chars?
        # Extra escaping is OK, so we should ALWAYS escape them.
        ('\\(', '(', 1),
        ('\\(', 'x', 0),
        ('\\(', '\\', 0),
        ('\\(', '\\(', 0),

        ('\\|', '|', 1),
        ('\\|', 'x', 0),

        ('\\\\', '\\', 1),
        ('\\\\', 'x', 0),
        ('\\\\', '\\extra', 0),

        ('\\f', '\\', 0),  # no match

        # Hm this is weird, c is not a special character
        ('\\c', 'c', 1),
        ('\\c', '\\c', 0),
        ('\\\\c', '\\c', 1),  # the proper way to match

        ('c:\\foo', 'c:\\foo', 0),
        ('c:\\foo', 'c:foo', 1),

        ('strange]one', 'strange]one', 1),

        # What is another error?  Invalid escape is OK?
        # A pattern that is a lone backslash does not match a backslash.
        None if IS_DARWIN else ('\\', '\\', 0),

        ('[[:alpha:]]', 'a', 1),
        ('[^[:alpha:]]', 'a', 0),  # negate
        ('[[:alpha:]]', 'aa', 0),  # exact match fails

        # Combining char class and a literal character
        ('[[:alpha:]7]', '7', 1),
        ('[[:alpha:]][[:alpha:]]', 'az', 1),

        ('[a]', 'a', 1),
        # Hm [] is treated as a constant string, not an empty char class.
        # Should we change LooksLikeGlob?
        ('[]', '', 0),

        ('[a-z]', 'a', 1),
        ('[a-z]', '-', 0),

        # THIS IS INCONSISTENT WITH REGEX!
        # Somehow in regexes (at least ERE) GNU libc treats [a\-z] as [a-z].
        # See below.
        ('[a\-z]', '-', 1),
        ('[a\-z]', 'b', 0),

        # Need double backslash in character class
        ('[\\\\]', '\\', 1),

        # Can you escape ] with \?  Yes in fnmatch
        ('[\\]]', '\\', 0),
        ('[\\]]', ']', 1),


        None if IS_DARWIN else ('[]', 'a', 0),
        None if IS_DARWIN else ('[]', '[]', 1),

        ('?.c', 'a.c', 1),
        ('?.c', 'aa.c', 0),
        # mu character
        ('?.c', '\xce\xbc.c', 1),
    ]

    # Entries disabled on Darwin are None in the table; filter() drops them.
    for pat, s, expected in filter(None, cases):
      actual = libc.fnmatch(pat, s)
      self.assertEqual(
          expected, actual, '%r %r -> got %d' % (pat, s, actual))

  def testFnmatchExtglob(self):
    """Check libc.fnmatch() on extended glob patterns like @(a|b)."""
    # NOTE: We always use FNM_EXTMATCH when available

    # With GNU extension.
    cases = [
        # One of these
        ('--@(help|verbose)', '--verbose', 1),
        ('--@(help|verbose)', '--foo', 0),

        ('--*(help|verbose)', '--verbose', 1),
        ('--*(help|verbose)', '--', 1),
        ('--*(help|verbose)', '--helpverbose', 1),  # Not what we want

        ('--+(help|verbose)', '--verbose', 1),
        ('--+(help|verbose)', '--', 0),
        ('--+(help|verbose)', '--helpverbose', 1),  # Not what we want

        ('--?(help|verbose)', '--verbose', 1),
        ('--?(help|verbose)', '--helpverbose', 0),

        # Neither of these
        ('--!(help|verbose)', '--verbose', 0),

        # escaping *
        ('@(ab\*)', 'ab*', 1),
        ('@(ab\*)', 'abc', 0),
        # escaping ?
        ('@(ab\?)', 'ab?', 1),
        ('@(ab\?)', 'abc', 0),

        # escaping []
        ('@(ab\[\])', 'ab[]', 1),
        ('@(ab\[\])', 'abcd', 0),

        # escaping :
        ('@(ab\:)', 'ab:', 1),
        ('@(ab\:)', 'abc', 0),

        # escaping a is no-op
        (r'@(\ab)', 'ab', 1),
        (r'@(\ab)', r'\ab', 0),

        #('@(ab\|)', 'ab|', 1),  # GNU libc bug?  THIS SHOULD WORK

        # There's no way to escape | in extended glob???  wtf.
        #('@(ab\|)', 'ab', 1),
        #('@(ab\|)', 'ab\\', 1),
        #('@(ab\|)', 'ab\\|', 1),
    ]
    for pat, s, expected in cases:
      actual = libc.fnmatch(pat, s)
      self.assertEqual(expected, actual,
                       "Matching %s against %s: got %s but expected %s" %
                       (pat, s, actual, expected))

  def testGlob(self):
    """Smoke test: print libc.glob() results; nothing is asserted."""
    print(libc.glob('*.py', 0))

    # This will not match anything!
    print(libc.glob('\\', 0))
    # This one will match a file named \
    print(libc.glob('\\\\', 0))
    print(libc.glob('[[:punct:]]', 0))

  def testRegexMatchError(self):
    """libc.regex_search() must raise ValueError for the invalid regex '*'."""
    # See core/util_test.py for more tests
    try:
      libc.regex_search(r'*', 0, 'abcd', 0)
    except ValueError as e:
      print(e)
    else:
      self.fail('Expected ValueError')

  def testRegexFirstGroupMatch(self):
    """Check the (start, end) span of the first group from several offsets."""
    s = 'oXooXoooXoX'
    self.assertEqual(
        (1, 3),
        libc.regex_first_group_match('(X.)', s, 0))

    # Match from position 3
    self.assertEqual(
        (4, 6),
        libc.regex_first_group_match('(X.)', s, 3))

    # Match from position 6
    self.assertEqual(
        (8, 10),
        libc.regex_first_group_match('(X.)', s, 6))

    # Syntax Error
    self.assertRaises(
        RuntimeError, libc.regex_first_group_match, r'*', 'abcd', 0)

  def testRegexFirstGroupMatchError(self):
    """Placeholder for debugging issue #291; the call is disabled."""
    # Helping to debug issue #291
    s = ''
    if 0:  # deliberately off: flip to 1 to reproduce by hand
      # Invalid regex syntax
      libc.regex_first_group_match("(['+-'])", s, 6)

  def testSpecialCharsInCharClass(self):
    """Check how backslash, '-' and ']' behave inside regex char classes."""
    CASES = [
        ("([a-z]+)", '123abc123', (3, 6)),

        # Uh what the heck, \- means the same thing as -?  It's just ignored.
        # At least in GNU libc.

        # https://stackoverflow.com/questions/28495913/how-do-you-escape-a-hyphen-as-character-range-in-a-posix-regex
        # The <hyphen> character shall be treated as itself if it occurs first
        # (after an initial '^', if any) or last in the list, or as an ending
        # range point in a range expression

        ("([a\-z]+)", '123abc123', (3, 6)),

        # This is an inverted range.  TODO: Need to fix the error message.
        #("([a\-.]+)", '123abc123', None),

        ("([\\\\]+)", 'a\\b', (1, 2)),

        # Can you escape ] with \?  Yes in fnmatch, but NO here!!!
        ('([\\]])', '\\', None),
        ('([\\]])', ']', None),

        # Weird parsing!!!
        ('([\\]])', '\\]', (0, 2)),

    ]

    for pat, s, expected in CASES:
      result = libc.regex_first_group_match(pat, s, 0)
      self.assertEqual(expected, result,
                       "FAILED: pat %r s %r result %s" % (pat, s, result))

  def testRealpathFailOnNonexistentDirectory(self):
    """libc.realpath() returns None for paths that do not exist."""
    # This behaviour is actually inconsistent with GNU readlink,
    # but matches behaviour of busybox readlink
    # (https://github.com/jgunthorpe/busybox)
    self.assertEqual(None, libc.realpath('_tmp/nonexistent'))

    # Consistent with GNU
    self.assertEqual(None, libc.realpath('_tmp/nonexistent/supernonexistent'))

  def testPrintTime(self):
    """Smoke test: call libc.print_time() between two blank stderr lines."""
    print('', file=sys.stderr)
    libc.print_time(0.1, 0.2, 0.3)
    print('', file=sys.stderr)

  def testGethostname(self):
    """Smoke test: print the result of libc.gethostname()."""
    print(libc.gethostname())

  def testGetTerminalWidth(self):
    """Smoke test: print the terminal width, or the IOError if it fails."""
    try:
      width = libc.get_terminal_width()
    except IOError as e:
      print('error getting terminal width: %s' % e)
    else:
      # Was 'width % d': the stray space flag padded positive widths.
      print('width %d' % width)

  def testWcsWidth(self):
    """Check libc.wcswidth() on UTF-8 input and on invalid input."""
    if not IS_DARWIN:
      self.assertEqual(1, libc.wcswidth("▶️"))
      self.assertEqual(28, libc.wcswidth("(osh) ~/.../unchanged/oil ▶️ "))

    mu = u"\u03bc".encode('utf-8')
    print(repr(mu))
    print(mu)
    print(len(mu))
    self.assertEqual(1, libc.wcswidth(mu))

    self.assertEqual(2, libc.wcswidth("→ "))

    # mbstowcs fails on invalid utf-8
    try:
      # first byte of mu
      libc.wcswidth("\xce")
    except UnicodeError as e:
      # str(e) rather than e.message: the attribute is deprecated (PEP 352)
      # and both give the same text for a single-argument exception.
      self.assertEqual('mbstowcs() 1', str(e))
    else:
      self.fail('Expected failure')

    # wcswidth fails on unprintable character
    try:
      libc.wcswidth("\x01")
    except UnicodeError as e:
      self.assertEqual('wcswidth()', str(e))
    else:
      self.fail('Expected failure')

    self.assertRaises(UnicodeError, libc.wcswidth, "\xfe")
|
305 |
|
306 |
|
if __name__ == '__main__':
  # To simulate the OVM_MAIN patch in pythonrun.c
  # NOTE(review): presumably the locale must be reset before the tests run so
  # that locale-dependent checks see the expected locale -- confirm.
  libc.cpython_reset_locale()
  unittest.main()
|