pyext/libc_test.py

OILS / pyext / libc_test.py View on Github | oilshell.org

310 lines, 173 significant

1	#!/usr/bin/env python2
2	# coding=utf8
3	# Copyright 2016 Andy Chu. All rights reserved.
4	# Licensed under the Apache License, Version 2.0 (the "License");
5	# you may not use this file except in compliance with the License.
6	# You may obtain a copy of the License at
7	#
8	# http://www.apache.org/licenses/LICENSE-2.0
"""
libc_test.py: Tests for libc.py
"""
# The docstring must be the first statement for it to become the module's
# __doc__; a future statement is still allowed to follow it.
from __future__ import print_function

import sys
import unittest

import libc  # module under test

# True when running on macOS.  Used to guard some tests that fail on Darwin.
IS_DARWIN = sys.platform == 'darwin'
20
21	class LibcTest(unittest.TestCase):
22
23	def testFnmatch(self):
24
25	cases = [
26	# (pattern, string, result)
27
28	('', '', 1), # no pattern is valid
29	('a', 'a', 1),
30	('?', 'a', 1),
31
32	# Test escaping of glob operator chars
33	('\\?', '-', 0),
34	('\\?', '?', 1),
35
36	('\\*', '-', 0),
37	('\\', '', 1),
38
39	('\\[', '-', 0),
40	('\\[', '[', 1),
41
42	('\\!', '-', 0),
43	('\\!', '!', 1),
44
45	# What if we also escape extended glob chars?
46	# Extra escaping is OK, so we should ALWAYS escape them.
47	('\\(', '(', 1),
48	('\\(', 'x', 0),
49	('\\(', '\\', 0),
50	('\\(', '\\(', 0),
51
52	('\\\|', '\|', 1),
53	('\\\|', 'x', 0),
54
55	('\\\\', '\\', 1),
56	('\\\\', 'x', 0),
57	('\\\\', '\\extra', 0),
58
59	('\\f', '\\', 0), # no match
60
61	# Hm this is weird, c is not a special character
62	('\\c', 'c', 1),
63	('\\c', '\\c', 0),
64	('\\\\c', '\\c', 1), # the proper way to match
65
66	('c:\\foo', 'c:\\foo', 0),
67	('c:\\foo', 'c:foo', 1),
68
69	('strange]one', 'strange]one', 1),
70
71	# What is another error? Invalid escape is OK?
72	None if IS_DARWIN else ('\\', '\\', 0), # no pattern is valid
73
74	('[[:alpha:]]', 'a', 1),
75	('[^[:alpha:]]', 'a', 0), # negate
76	('[[:alpha:]]', 'aa', 0), # exact match fails
77
78	# Combining char class and a literal character
79	('[[:alpha:]7]', '7', 1),
80	('[[:alpha:]][[:alpha:]]', 'az', 1),
81
82	('[a]', 'a', 1),
83	# Hm [] is treated as a constant string, not an empty char class.
84	# Should we change LooksLikeGlob?
85	('[]', '', 0),
86
87	('[a-z]', 'a', 1),
88	('[a-z]', '-', 0),
89
90	# THIS IS INCONSISTENT WITH REGEX!
91	# Somehow in regexes (at least ERE) GNU libc treats [a\-z] as [a-z].
92	# See below.
93	('[a\-z]', '-', 1),
94	('[a\-z]', 'b', 0),
95
96	# Need double backslash in character class
97	('[\\\\]', '\\', 1),
98
99	# Can you escape ] with \? Yes in fnmatch
100	('[\\]]', '\\', 0),
101	('[\\]]', ']', 1),
102
103
104	None if IS_DARWIN else ('[]', 'a', 0),
105	None if IS_DARWIN else ('[]', '[]', 1),
106
107	('?.c', 'a.c', 1),
108	('?.c', 'aa.c', 0),
109	# mu character
110	('?.c', '\xce\xbc.c', 1),
111	]
112
113	for pat, s, expected in filter(None, cases):
114	actual = libc.fnmatch(pat, s)
115	self.assertEqual(
116	expected, actual, '%r %r -> got %d' % (pat, s, actual))
117
118	def testFnmatchExtglob(self):
119	# NOTE: We always use FNM_EXTMATCH when available
120
121	# With GNU extension.
122	cases = [
123	# One of these
124	('--@(help\|verbose)', '--verbose', 1),
125	('--@(help\|verbose)', '--foo', 0),
126
127	('--*(help\|verbose)', '--verbose', 1),
128	('--*(help\|verbose)', '--', 1),
129	('--*(help\|verbose)', '--helpverbose', 1), # Not what we want
130
131	('--+(help\|verbose)', '--verbose', 1),
132	('--+(help\|verbose)', '--', 0),
133	('--+(help\|verbose)', '--helpverbose', 1), # Not what we want
134
135	('--?(help\|verbose)', '--verbose', 1),
136	('--?(help\|verbose)', '--helpverbose', 0),
137
138	# Neither of these
139	('--!(help\|verbose)', '--verbose', 0),
140
141	# escaping *
142	('@(ab\)', 'ab', 1),
143	('@(ab\*)', 'abc', 0),
144	# escaping ?
145	('@(ab\?)', 'ab?', 1),
146	('@(ab\?)', 'abc', 0),
147
148	# escaping []
149	('@(ab\[\])', 'ab[]', 1),
150	('@(ab\[\])', 'abcd', 0),
151
152	# escaping :
153	('@(ab\:)', 'ab:', 1),
154	('@(ab\:)', 'abc', 0),
155
156	# escaping a is no-op
157	(r'@(\ab)', 'ab', 1),
158	(r'@(\ab)', r'\ab', 0),
159
160	#('@(ab\\|)', 'ab\|', 1), # GNU libc bug? THIS SHOULD WORK
161
162	# There's no way to escape \| in extended glob??? wtf.
163	#('@(ab\\|)', 'ab', 1),
164	#('@(ab\\|)', 'ab\\', 1),
165	#('@(ab\\|)', 'ab\\\|', 1),
166	]
167	for pat, s, expected in cases:
168	actual = libc.fnmatch(pat, s)
169	self.assertEqual(expected, actual,
170	"Matching %s against %s: got %s but expected %s" %
171	(pat, s, actual, expected))
172
173	def testGlob(self):
174	print(libc.glob('*.py'))
175
176	# This will not match anything!
177	print(libc.glob('\\'))
178	# This one will match a file named \
179	print(libc.glob('\\\\'))
180	print(libc.glob('[[:punct:]]'))
181
182	def testRegexMatchError(self):
183	# See core/util_test.py for more tests
184	try:
185	libc.regex_search(r'*', 0, 'abcd', 0)
186	except ValueError as e:
187	print(e)
188	else:
189	self.fail('Expected ValueError')
190
191	def testRegexFirstGroupMatch(self):
192	s='oXooXoooXoX'
193	self.assertEqual(
194	(1, 3),
195	libc.regex_first_group_match('(X.)', s, 0))
196
197	# Match from position 3
198	self.assertEqual(
199	(4, 6),
200	libc.regex_first_group_match('(X.)', s, 3))
201
202	# Match from position 3
203	self.assertEqual(
204	(8, 10),
205	libc.regex_first_group_match('(X.)', s, 6))
206
207	# Syntax Error
208	self.assertRaises(
209	RuntimeError, libc.regex_first_group_match, r'*', 'abcd', 0)
210
211	def testRegexFirstGroupMatchError(self):
212	# Helping to debug issue #291
213	s = ''
214	if 0:
215	# Invalid regex syntax
216	libc.regex_first_group_match("(['+-'])", s, 6)
217
218	def testSpecialCharsInCharClass(self):
219	CASES = [
220	("([a-z]+)", '123abc123', (3, 6)),
221
222	# Uh what the heck, \- means the same thing as -? It's just ignored. At
223	# least in GNU libc.
224
225	# https://stackoverflow.com/questions/28495913/how-do-you-escape-a-hyphen-as-character-range-in-a-posix-regex
226	# The <hyphen> character shall be treated as itself if it occurs first (after an initial '^', if any) or last in the list, or as an ending range point in a range expression
227
228	("([a\-z]+)", '123abc123', (3, 6)),
229
230	# This is an inverted range. TODO: Need to fix the error message.
231	#("([a\-.]+)", '123abc123', None),
232
233	("([\\\\]+)", 'a\\b', (1, 2)),
234
235	# Can you escape ] with \? Yes in fnmatch, but NO here!!!
236	('([\\]])', '\\', None),
237	('([\\]])', ']', None),
238
239	# Weird parsing!!!
240	('([\\]])', '\\]', (0, 2)),
241
242	]
243
244	for pat, s, expected in CASES:
245	result = libc.regex_first_group_match(pat, s, 0)
246	self.assertEqual(expected, result,
247	"FAILED: pat %r s %r result %s" % (pat, s, result))
248
249	def testRealpathFailOnNonexistentDirectory(self):
250	# This behaviour is actually inconsistent with GNU readlink,
251	# but matches behaviour of busybox readlink
252	# (https://github.com/jgunthorpe/busybox)
253	self.assertEqual(None, libc.realpath('_tmp/nonexistent'))
254
255	# Consistent with GNU
256	self.assertEqual(None, libc.realpath('_tmp/nonexistent/supernonexistent'))
257
258	def testPrintTime(self):
259	print('', file=sys.stderr)
260	libc.print_time(0.1, 0.2, 0.3)
261	print('', file=sys.stderr)
262
263	def testGethostname(self):
264	print(libc.gethostname())
265
266	def testGetTerminalWidth(self):
267	try:
268	width = libc.get_terminal_width()
269	except IOError as e:
270	print('error getting terminal width: %s' % e)
271	else:
272	print('width % d' % width)
273
274	def testWcsWidth(self):
275	if not IS_DARWIN:
276	self.assertEqual(1, libc.wcswidth("▶️"))
277	self.assertEqual(28, libc.wcswidth("(osh) ~/.../unchanged/oil ▶️ "))
278
279	mu = u"\u03bc".encode('utf-8')
280	print(repr(mu))
281	print(mu)
282	print(len(mu))
283	self.assertEqual(1, libc.wcswidth(mu))
284
285	self.assertEqual(2, libc.wcswidth("→ "))
286
287	# mbstowcs fails on invalid utf-8
288	try:
289	# first byte of mu
290	libc.wcswidth("\xce")
291	except UnicodeError as e:
292	self.assertEqual('mbstowcs() 1', e.message)
293	else:
294	self.fail('Expected failure')
295
296	# wcswidth fails on unprintable character
297	try:
298	libc.wcswidth("\x01")
299	except UnicodeError as e:
300	self.assertEqual('wcswidth()', e.message)
301	else:
302	self.fail('Expected failure')
303
304	self.assertRaises(UnicodeError, libc.wcswidth, "\xfe")
305
306
if __name__ == '__main__':
    # Call libc.cpython_reset_locale() before running the tests, to simulate
    # the OVM_MAIN patch in pythonrun.c.
    libc.cpython_reset_locale()
    unittest.main()