-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathrun.out
166 lines (162 loc) · 6.75 KB
/
run.out
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
+ export LANG=en_US.UTF-8 LC_ALL=en_US.UTF-8
+ LANG=en_US.UTF-8
+ LC_ALL=en_US.UTF-8
+ date
Thu Dec 16 20:36:18 EST 2021
++ dirname glibc-unicode-sorting/run.sh
+ cd glibc-unicode-sorting
+ pwd
/root/glibc-unicode-sorting
+ which dpkg
which: no dpkg in (/usr/kerberos/sbin:/usr/kerberos/bin:/usr/local/sbin:/usr/local/bin:/sbin:/bin:/usr/sbin:/usr/bin)
+ which rpm
/bin/rpm
+ rpm -qa
+ grep -E '(glibc|langpack)'
glibc-headers-2.5-49.el5_5.7
glibc-2.5-49.el5_5.7
glibc-devel-2.5-49.el5_5.7
glibc-common-2.5-49.el5_5.7
++ curl -s http://169.254.169.254/latest/meta-data/ami-id
+ SOURCE_AMI=ami-eb84ed82
++ cat /etc/issue
+ OS_VERS='Red Hat Enterprise Linux Server release 5.5 (Tikanga)
Kernel \r on an \m'
+ UNICODE_VERS=14
+ which dpkg
which: no dpkg in (/usr/kerberos/sbin:/usr/kerberos/bin:/usr/local/sbin:/usr/local/bin:/sbin:/bin:/usr/sbin:/usr/bin)
+ which rpm
/bin/rpm
++ rpm -q glibc --queryformat '%{version}-%{release}'
+ GLIBC_VERS=2.5-49.el5_5.7
+ '[' -f /etc/os-release ']'
+ '[' -f /etc/system-release ']'
+ '[' -f /etc/system-release-cpe ']'
+ curl -kO https://www.unicode.org/Public/14.0.0/ucd/UnicodeData.txt
% Total % Received % Xferd Average Speed Time Time Time Current
Dload Upload Total Spent Left Speed
0 1853k 0 0 0 0 0 0 --:--:-- --:--:-- --:--:-- 0 25 1853k 25 464k 0 0 1255k 0 0:00:01 --:--:-- 0:00:01 2494k100 1853k 100 1853k 0 0 2939k 0 --:--:-- --:--:-- --:--:-- 4146k
real 0m0.642s
user 0m0.012s
sys 0m0.000s
+ perl '-naF;' -CO '-e
sub pr3 {printf("%s%08x\n",$_[1],$_[0])}
sub pr2 {pr3($_[0],"B".$_[1]."B");pr3($_[0],"D".$_[1]."D");pr3($_[0],$_[1]);pr3($_[0],$_[1]."B");pr3($_[0],$_[1]."BB");pr3($_[0],$_[1]."D");pr3($_[0],$_[1]."DD")}
sub pr {pr2($_[0],$_[1].chr($_[0]));pr2($_[0],$_[1].chr($_[0]).chr($_[0]));pr3($_[0],"1B".chr($_[0])."B");pr3($_[0],"1B-".chr($_[0])."B")}
if(/<control>/){next}; # skip control characters
if($F[2] eq "Cs"){next}; # skip surrogates
if(/ First>/){$fi=hex("0x".$F[0]);next}; # generate blocks
if(/ Last>/){$la=hex("0x".$F[0]);for($fi..$la){pr($_)};next};
pr(hex("0x".$F[0])) # generate individual characters
' UnicodeData.txt
+ split -l500000 - _base-characters
real 0m6.609s
user 0m5.960s
sys 0m0.532s
+ wc _base-charactersaa _base-charactersab _base-charactersac _base-charactersad _base-charactersae _base-charactersaf _base-charactersag _base-charactersah _base-charactersai _base-charactersaj
500000 500090 7453517 _base-charactersaa
500000 500000 7512259 _base-charactersab
500000 500000 8218750 _base-charactersac
500000 500000 8218750 _base-charactersad
500000 500000 8218750 _base-charactersae
500000 500000 8218750 _base-charactersaf
500000 500000 8218750 _base-charactersag
500000 500000 8218750 _base-charactersah
500000 500000 8218750 _base-charactersai
14640 14640 240645 _base-charactersaj
4514640 4514730 72737671 total
+ locale
LANG=en_US.UTF-8
LC_CTYPE="en_US.UTF-8"
LC_NUMERIC="en_US.UTF-8"
LC_TIME="en_US.UTF-8"
LC_COLLATE="en_US.UTF-8"
LC_MONETARY="en_US.UTF-8"
LC_MESSAGES="en_US.UTF-8"
LC_PAPER="en_US.UTF-8"
LC_NAME="en_US.UTF-8"
LC_ADDRESS="en_US.UTF-8"
LC_TELEPHONE="en_US.UTF-8"
LC_MEASUREMENT="en_US.UTF-8"
LC_IDENTIFICATION="en_US.UTF-8"
LC_ALL=en_US.UTF-8
+ date
Thu Dec 16 20:36:28 EST 2021
++ ls -1 _base-charactersaa _base-charactersab _base-charactersac _base-charactersad _base-charactersae _base-charactersaf _base-charactersag _base-charactersah _base-charactersai _base-charactersaj
+ for FILE in '$(ls -1 _base-characters*)'
+ sort _base-charactersaa -o _s_base-charactersaa
+ for FILE in '$(ls -1 _base-characters*)'
+ sort _base-charactersab -o _s_base-charactersab
+ for FILE in '$(ls -1 _base-characters*)'
+ sort _base-charactersac -o _s_base-charactersac
+ for FILE in '$(ls -1 _base-characters*)'
+ sort _base-charactersad -o _s_base-charactersad
+ for FILE in '$(ls -1 _base-characters*)'
+ sort _base-charactersae -o _s_base-charactersae
+ for FILE in '$(ls -1 _base-characters*)'
+ sort _base-charactersaf -o _s_base-charactersaf
+ for FILE in '$(ls -1 _base-characters*)'
+ sort _base-charactersag -o _s_base-charactersag
+ for FILE in '$(ls -1 _base-characters*)'
+ sort _base-charactersah -o _s_base-charactersah
+ for FILE in '$(ls -1 _base-characters*)'
+ sort _base-charactersai -o _s_base-charactersai
+ for FILE in '$(ls -1 _base-characters*)'
+ sort _base-charactersaj -o _s_base-charactersaj
+ jobs
[1] Running sort $FILE -o _s$FILE &
[2] Running sort $FILE -o _s$FILE &
[3] Running sort $FILE -o _s$FILE &
[4] Running sort $FILE -o _s$FILE &
[5] Running sort $FILE -o _s$FILE &
[6] Running sort $FILE -o _s$FILE &
[7] Running sort $FILE -o _s$FILE &
[8] Running sort $FILE -o _s$FILE &
[9]- Running sort $FILE -o _s$FILE &
[10]+ Done sort $FILE -o _s$FILE
+ wait
+ date
Thu Dec 16 20:36:50 EST 2021
+ sort -m _s_base-charactersaa _s_base-charactersab _s_base-charactersac _s_base-charactersad _s_base-charactersae _s_base-charactersaf _s_base-charactersag _s_base-charactersah _s_base-charactersai _s_base-charactersaj -o unicode-14-chars-sorted-glibc-2.5-49.el5_5.7.txt
real 0m1.819s
user 0m1.644s
sys 0m0.164s
+ rm -v _base-charactersaa _base-charactersab _base-charactersac _base-charactersad _base-charactersae _base-charactersaf _base-charactersag _base-charactersah _base-charactersai _base-charactersaj _s_base-charactersaa _s_base-charactersab _s_base-charactersac _s_base-charactersad _s_base-charactersae _s_base-charactersaf _s_base-charactersag _s_base-charactersah _s_base-charactersai _s_base-charactersaj UnicodeData.txt
removed `_base-charactersaa'
removed `_base-charactersab'
removed `_base-charactersac'
removed `_base-charactersad'
removed `_base-charactersae'
removed `_base-charactersaf'
removed `_base-charactersag'
removed `_base-charactersah'
removed `_base-charactersai'
removed `_base-charactersaj'
removed `_s_base-charactersaa'
removed `_s_base-charactersab'
removed `_s_base-charactersac'
removed `_s_base-charactersad'
removed `_s_base-charactersae'
removed `_s_base-charactersaf'
removed `_s_base-charactersag'
removed `_s_base-charactersah'
removed `_s_base-charactersai'
removed `_s_base-charactersaj'
removed `UnicodeData.txt'
+ ls -ltr
total 71136
-rw-r--r-- 1 root root 1794 Dec 16 20:36 run.sh
-rw-r--r-- 1 root root 72737671 Dec 16 20:36 unicode-14-chars-sorted-glibc-2.5-49.el5_5.7.txt
-rw-r--r-- 1 root root 6473 Dec 16 20:36 run.out
+ wc unicode-14-chars-sorted-glibc-2.5-49.el5_5.7.txt
4514640 4514730 72737671 unicode-14-chars-sorted-glibc-2.5-49.el5_5.7.txt
+ echo 1-1
+ echo 11
+ LC_COLLATE=en_US.UTF-8
+ sort
11
1-1
+ date
Thu Dec 16 20:36:56 EST 2021