blob: 702f8cc168cf11f3d083518786206bc69653712c (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
  | 
#!/usr/bin/env python3
# unidump version 0.1.1
# made by ubq323 in the year 2021
# please use this software for GOOD, not for EVIL
import unicodedata
import sys
uniquify = True
arg=""
args = sys.argv[1:]
while len(args) > 0:
	arg = args.pop(0)
	if arg[0] != '-' or arg == "--":
		break
	if arg == "-a":
		uniquify = False
		arg = ""
	if arg == "-h" or arg == "--help":
		print(f"usage: {sys.argv[0]} [-a] [text...]")
		print("\t-a: don't deduplicate input characters")
		print("\tif no text supplied, takes input from stdin")
		sys.exit(0)
s = arg+" ".join(args)
if len(s) == 0:
	s = sys.stdin.read()
def row(c):
	try:
		name = unicodedata.name(c).rjust(50)
	except ValueError:
		name = " "*50
	number = ("U+"+hex(ord(c))[2:].zfill(4)).rjust(7).upper()
	to_c = c
	if c == '\n':
		to_c = ' '
	cat = unicodedata.category(c)
	if cat[0] == "M":
		to_c = chr(0x25cc) + to_c
	return f"{to_c} | {unicodedata.category(c)} | {name} | {number}"
seen = set()
for c in s:
	if uniquify:
		if c in seen:
			continue
		seen.add(c)
	print(row(c))
  |