hb_test_tools.py 5.3 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23
#!/usr/bin/python

import sys, os, re, difflib, unicodedata

class Colors:
	"""Colour palettes used to highlight diff output.

	Each nested palette class exposes the same three string attributes:
	``red`` and ``green`` open a highlighted span and ``end`` closes it.
	"""

	class Null:
		# Plain output: every marker is the empty string.
		red = ''
		green = ''
		end = ''

	class ANSI:
		# Terminal escapes: bold white text on a red / green background.
		red = '\033[41;37;1m'
		green = '\033[42;37;1m'
		end = '\033[m'

	class HTML:
		# Inline-styled <span> elements.
		red = '<span style="color:red">'
		green = '<span style="color:green">'
		end = '</span>'

	@staticmethod
	def _is_tty (out):
		"""Return True if *out* is backed by a terminal file descriptor."""
		try:
			return os.isatty (out.fileno ())
		except (AttributeError, ValueError):
			# In-memory or closed streams have no usable descriptor;
			# treat them as "not a terminal" instead of crashing.
			return False

	@staticmethod
	def Auto (argv = None, out = sys.stdout):
		"""Choose a palette from the command line and the output stream.

		Returns ``(palette, argv)``.  The palette is ``Colors.ANSI`` when
		``--color`` is present in *argv* or *out* is a terminal, and
		``Colors.Null`` otherwise.  One ``--color`` entry, if present, is
		removed from *argv* in place, so a caller passing ``sys.argv`` sees
		the flag consumed.
		"""
		if argv is None:
			# A fresh list per call; a mutable default would be shared.
			argv = []
		forced = "--color" in argv
		if forced:
			# Test and remove on the same list: looking the flag up in
			# sys.argv while removing it from argv breaks as soon as the
			# caller passes any other list.
			argv.remove ("--color")
		if forced or Colors._is_tty (out):
			return Colors.ANSI, argv
		return Colors.Null, argv

	@staticmethod
	def Default (argv = []):
		"""Return the ANSI palette unconditionally; *argv* is not used."""
		return Colors.ANSI

32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86

class FancyDiffer:
	"""Line-by-line differ that highlights the tokens that changed within a line."""

	# Tokenizer: a (possibly empty) run of word characters followed by at
	# most one non-word character.  The class must include A-Z; otherwise
	# every upper-case letter is treated as a separator of its own.
	diff_regex = re.compile (r'([a-zA-Z0-9_]*)([^a-zA-Z0-9_]?)')

	@staticmethod
	def diff_lines (l1, l2, colors=Colors.Null):
		"""Compare two lines token by token.

		Returns a list of strings suitable for ``writelines``:
		``[' ', text, '\\n']`` when the two rendered lines are equal,
		otherwise ``['-', old, '\\n', '+', new, '\\n']`` where tokens found
		only in *l1* are wrapped in ``colors.red`` / ``colors.end`` and tokens
		found only in *l2* in ``colors.green`` / ``colors.end``.  Newlines
		inside the inputs are dropped; each output line ends in one ``'\\n'``.
		"""
		# Put every token on its own line so difflib compares token sequences.
		ss = [FancyDiffer.diff_regex.sub (r'\1\n\2\n', l).splitlines (True) for l in (l1, l2)]
		oo = ["", ""]        # rendered old / new line
		st = [False, False]  # is a coloured span currently open in oo[i]?
		for l in difflib.Differ ().compare (*ss):
			tag, text = l[0], l[2:]
			if tag == '?':
				# Differ's intraline hint rows carry no content.
				continue
			if tag == ' ':
				# Common token: close any open span, then append to both sides.
				for i in range (2):
					if st[i]:
						oo[i] += colors.end
						st[i] = False
				oo = [o + text for o in oo]
				continue
			if tag == '-':
				if not st[0]:
					oo[0] += colors.red
					st[0] = True
				oo[0] += text
				continue
			if tag == '+':
				if not st[1]:
					oo[1] += colors.green
					st[1] = True
				oo[1] += text
		# Close spans still open at the end of the line.
		for i in range (2):
			if st[i]:
				oo[i] += colors.end
				st[i] = False
		# Remove the token separators inserted above (and the original EOL).
		oo = [o.replace ('\n', '') for o in oo]
		if oo[0] == oo[1]:
			return [' ', oo[0], '\n']
		return ['-', oo[0], '\n', '+', oo[1], '\n']

	@staticmethod
	def diff_files (f1, f2, colors=Colors.Null):
		"""Write a highlighted line-by-line diff of two line iterables to stdout.

		Lines are paired positionally.  Equal pairs are written with a
		leading space; differing pairs are rendered by ``diff_lines``.  Once
		one input runs out, the remaining lines of *f1* are written as ``-``
		lines in red and the remaining lines of *f2* as ``+`` lines in green.
		"""
		missing = object ()  # sentinel: that input is exhausted
		it1, it2 = iter (f1), iter (f2)
		# Pull from both iterators by hand: zip() would consume and discard
		# one line of the longer input when the shorter one ends.
		while True:
			l1 = next (it1, missing)
			l2 = next (it2, missing)
			if l1 is missing and l2 is missing:
				break
			if l2 is missing:
				sys.stdout.writelines (["-", colors.red, l1, colors.end])
			elif l1 is missing:
				sys.stdout.writelines (["+", colors.green, l2, colors.end])
			elif l1 == l2:
				sys.stdout.writelines ([" ", l1])
			else:
				sys.stdout.writelines (FancyDiffer.diff_lines (l1, l2, colors))

B
Behdad Esfahbod 已提交
87

88 89 90 91 92 93 94 95 96
class DiffFilters:
	"""Filters that operate on diff-formatted line streams."""

	@staticmethod
	def filter_failures (f):
		"""Copy to stdout the lines of *f* that start with ``-`` or ``+``.

		*f* is any iterable of strings.  Empty strings are skipped rather
		than raising ``IndexError``.
		"""
		for line in f:
			if line.startswith (('-', '+')):
				sys.stdout.write (line)


B
Behdad Esfahbod 已提交
97 98 99 100 101 102 103 104 105
class ShapeFilters:
	"""Filters that operate on shaping-result line streams."""

	@staticmethod
	def filter_failures (f):
		"""Copy to stdout the lines of *f* that start with ``-`` or ``+``.

		*f* is any iterable of strings.  Empty strings are skipped rather
		than raising ``IndexError``.
		"""
		for line in f:
			if line.startswith (('-', '+')):
				sys.stdout.write (line)


106 107 108
class UtilMains:
	"""Command-line drivers that feed ``sys.argv`` entries to a callback.

	Each driver prints a usage message to stdout and exits with status 1
	when no arguments were given.  ``print (x)`` is always called with a
	single parenthesized argument so the code parses identically as a
	Python 2 print statement and as a Python 3 function call.
	"""

	@staticmethod
	def process_multiple_files (callback, mnemonic = "FILE"):
		"""Call ``callback (fileobj)`` for every command-line argument.

		Each argument is opened with ``FileHelpers.open_file_or_stdin``.
		*mnemonic* is the placeholder shown in the usage message.
		"""
		if len (sys.argv) == 1:
			print ("Usage: %s %s..." % (sys.argv[0], mnemonic))
			sys.exit (1)

		for s in sys.argv[1:]:
			f = FileHelpers.open_file_or_stdin (s)
			try:
				callback (f)
			finally:
				# Release the handle we opened, but never close the
				# process-wide stdin stream.
				if f is not sys.stdin:
					f.close ()

	@staticmethod
	def process_multiple_args (callback, mnemonic):
		"""Call ``callback (arg)`` for every command-line argument.

		*mnemonic* is the placeholder shown in the usage message.
		"""
		if len (sys.argv) == 1:
			print ("Usage: %s %s..." % (sys.argv[0], mnemonic))
			sys.exit (1)

		for s in sys.argv[1:]:
			callback (s)

	@staticmethod
	def filter_multiple_strings_or_stdin (callback, mnemonic, \
					      separator = " ", \
					      concat_separator = False):
		"""Transform command-line strings, or stdin lines, through *callback*.

		With ``--stdin`` as the only argument, each line read from stdin
		(including its line terminator) is passed to *callback* and the
		result printed; ``--stdin`` is removed from ``sys.argv``.

		Otherwise each argument is passed to *callback* and the results
		are printed on one line joined by *separator*.  If
		*concat_separator* is not ``False``, the arguments are first joined
		with it and *callback* receives that single string.
		"""
		if len (sys.argv) == 1 or ('--stdin' in sys.argv and len (sys.argv) != 2):
			print ("Usage:\n  %s %s...\nor:\n  %s --stdin" \
			       % (sys.argv[0], mnemonic, sys.argv[0]))
			sys.exit (1)

		if '--stdin' in sys.argv:
			sys.argv.remove ('--stdin')
			# readline () is called explicitly, one line at a time, until
			# it returns an empty result (end of input).
			while True:
				line = sys.stdin.readline ()
				if not line:
					break
				print (callback (line))
		else:
			args = sys.argv[1:]
			if concat_separator is not False:
				args = [concat_separator.join (args)]
			print (separator.join (callback (x) for x in args))


class Unicode:
	"""Conversions between UTF-8 text, ``U+XXXX`` notation and character names.

	The public methods return the interpreter's native ``str`` type:
	UTF-8 encoded bytes on Python 2, text on Python 3.
	"""

	@staticmethod
	def _to_text (s):
		"""Return *s* as text, decoding it as UTF-8 if it is a byte string."""
		if isinstance (s, bytes):
			return s.decode ('utf-8')
		return s

	@staticmethod
	def _chr (cp):
		"""Return the one-character text string for code point *cp*."""
		try:
			return unichr (cp)
		except NameError:
			# Python 3 has no unichr (); chr () already returns text there.
			return chr (cp)

	@staticmethod
	def _native (text):
		"""Return *text* as native ``str`` (UTF-8 encoded where ``str`` is bytes)."""
		if str is bytes:
			return text.encode ('utf-8')
		return text

	@staticmethod
	def decode (s):
		"""Return the code points of *s* as ``<U+XXXX,U+XXXX,...>``."""
		return '<' + ','.join ("U+%04X" % ord (u) for u in Unicode._to_text (s)) + '>'

	@staticmethod
	def encode (s):
		"""Return the string spelled by the hexadecimal code points in *s*.

		The characters ``< + > , \\ u U``, newline and tab, as well as
		``0x`` / ``0X`` prefixes, are treated as separators; every remaining
		space-separated token is parsed as a hexadecimal code point.
		"""
		s = re.sub (r"[<+>,\\uU\n	]", " ", s)
		s = re.sub (r"0[xX]", " ", s)
		return Unicode._native (u''.join (Unicode._chr (int (x, 16)) for x in s.split (' ') if len (x)))

	# Abbreviations substituted for long character names by pretty_name ().
	shorthands = {
		"ZERO WIDTH NON-JOINER": "ZWNJ",
		"ZERO WIDTH JOINER": "ZWJ",
		"NARROW NO-BREAK SPACE": "NNBSP",
		"COMBINING GRAPHEME JOINER": "CGJ",
		"LEFT-TO-RIGHT MARK": "LRM",
		"RIGHT-TO-LEFT MARK": "RLM",
		"LEFT-TO-RIGHT EMBEDDING": "LRE",
		"RIGHT-TO-LEFT EMBEDDING": "RLE",
		"POP DIRECTIONAL FORMATTING": "PDF",
		"LEFT-TO-RIGHT OVERRIDE": "LRO",
		"RIGHT-TO-LEFT OVERRIDE": "RLO",
	}

	@staticmethod
	def pretty_name (u):
		"""Return a short human-readable name for the character *u*.

		Starts from ``unicodedata.name (u)`` and strips everything up to
		" LETTER ", " SIGN " or " COMBINING "; vowel signs become
		``<NAME>-MATRA``, viramas become ``HALANT`` and names listed in
		``shorthands`` are abbreviated.  Returns ``"XXX"`` when the
		character has no name.
		"""
		try:
			s = unicodedata.name (u)
		except ValueError:
			return "XXX"
		s = re.sub (".* LETTER ", "", s)
		s = re.sub (".* VOWEL SIGN (.*)", r"\1-MATRA", s)
		s = re.sub (".* SIGN ", "", s)
		s = re.sub (".* COMBINING ", "", s)
		# The " SIGN " substitution above reduces "<SCRIPT> SIGN VIRAMA" to
		# a bare "VIRAMA", so the prefix before VIRAMA has to be optional.
		if re.match (r"(.* )?VIRAMA", s):
			s = "HALANT"
		if s in Unicode.shorthands:
			s = Unicode.shorthands[s]
		return s

	@staticmethod
	def pretty_names (s):
		"""Return the pretty names of the code points in *s*, joined by `` + ``.

		*s* holds hexadecimal code points separated by commas, spaces or
		newlines, optionally decorated with ``<``, ``>``, ``+``, ``\\``,
		``u`` / ``U`` or ``0x`` / ``0X``.
		"""
		s = re.sub (r"[<+>\\uU]", " ", s)
		s = re.sub (r"0[xX]", " ", s)
		s = [Unicode._chr (int (x, 16)) for x in re.split ('[, \n]', s) if len (x)]
		return Unicode._native (u' + '.join (Unicode.pretty_name (x) for x in s))
200

B
Behdad Esfahbod 已提交
201

202
class FileHelpers:
	"""Helpers for turning command-line file arguments into file objects."""

	@staticmethod
	def open_file_or_stdin (f):
		"""Return ``sys.stdin`` if *f* is ``'-'``, else *f* opened for reading.

		Raises ``IOError`` if the file cannot be opened.  The caller is
		responsible for closing the returned file.
		"""
		if f == '-':
			return sys.stdin
		# open () rather than file (): the latter exists only on Python 2.
		return open (f)
209

210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238

class Manifest:
	"""Expands MANIFEST-described directory trees into lists of file paths."""

	@staticmethod
	def print_to_stdout (s, strict = True):
		"""Print the files reachable from path *s*, one per line.

		A non-directory path is printed as is.  For a directory, its
		``MANIFEST`` file is read and every non-blank entry, taken relative
		to that directory, is expanded recursively.

		If *s* or a directory's ``MANIFEST`` does not exist: with *strict*
		true an error is written to stderr and the process exits with
		status 1; with *strict* false the call returns silently.  Entries
		found inside a ``MANIFEST`` are always expanded with the default
		``strict`` value.
		"""
		if not os.path.exists (s):
			if strict:
				sys.stderr.write ("%s: %s does not exist\n" % (sys.argv[0], s))
				sys.exit (1)
			return

		if not os.path.isdir (s):
			print (s)
			return

		if s[-1] != '/':
			s += "/"
		manifest = s + "MANIFEST"

		# Only opening/reading the MANIFEST is guarded, so I/O errors raised
		# while expanding or printing entries are not misreported as a
		# missing MANIFEST.
		try:
			with open (manifest) as m:
				items = [x.strip () for x in m.readlines ()]
		except IOError:
			if strict:
				sys.stderr.write ("%s: %s does not exist\n" % (sys.argv[0], manifest))
				sys.exit (1)
			return

		for f in items:
			# A blank entry would resolve to this same directory and
			# recurse without end.
			if f:
				Manifest.print_to_stdout (s + f)

239 240
# Nothing is done when the file is executed directly: the guarded body is
# a no-op.
if __name__ == '__main__':
	pass