From e98c955c2c375377f5af889f04dbd4bee947e8a1 Mon Sep 17 00:00:00 2001 From: Mark Shoulson Date: Fri, 2 Dec 2016 09:23:00 -0500 Subject: Added more emoji, including big lists of (raw) new characters from other blocks and unicode 9.0 Also added makefile --- emojitrans2.pl | 11 ++++++++++- 1 file changed, 10 insertions(+), 1 deletion(-) (limited to 'emojitrans2.pl') diff --git a/emojitrans2.pl b/emojitrans2.pl index 3b98ad2..b18fb3a 100755 --- a/emojitrans2.pl +++ b/emojitrans2.pl @@ -1,9 +1,12 @@ #!/usr/bin/perl -p +use feature 'unicode_strings'; +use utf8; BEGIN { binmode(STDOUT, ":utf8"); binmode(STDIN, ":utf8"); %specials = ('%' => 'percent', '-' => 'minus', + '_' => 'underscore', '>' => 'greater', '<' => 'less', ',' => 'comma', @@ -16,17 +19,23 @@ BEGIN { binmode(STDOUT, ":utf8"); '#' => 'numbersign', '@' => 'at', '|' => 'bar', + '`' => 'grave', '~' => 'asciitilde', '^' => 'asciicircum', '(' => 'parenleft', ')' => 'parenright', '[' => 'bracketleft', ']' => 'bracketright', + '{' => 'braceleft', + '}' => 'braceright', "'" => 'apostrophe', '\\' => 'backslash', ':' => 'colon', ';' => 'semicolon', + '=' => 'equal', ' ' => 'space', + '*' => 'asterisk', + '♫' => 'Multi_key', ); sub splitup { @@ -49,7 +58,7 @@ sub splitup { unless (/^#/) { my $hold=$_; s// /; - s({([][[:alnum:] _+:;%@><,.^\$+#()?!/|'\\~-]+)})(splitup($1))e; + s({([][[:alnum:] _+:;%@>=`<,.^\$+#()?!/|'\\~*{}♫-]+)})(splitup($1))e; if (length($1) > 7) { $_=$hold; s/^/### /; -- cgit v1.2.3 From f4456d1b08c6b714d6f9d07363e8d054c659c85c Mon Sep 17 00:00:00 2001 From: Mark Shoulson Date: Sun, 19 Feb 2017 19:33:35 -0500 Subject: Add parens.compose. --- emojitrans2.pl | 3 +- parens.compose | 177 +++++++++++++++++++++++++++++++++++++++++++++++++++++++++ 2 files changed, 179 insertions(+), 1 deletion(-) create mode 100644 parens.compose (limited to 'emojitrans2.pl') diff --git a/emojitrans2.pl b/emojitrans2.pl index b18fb3a..c978b7e 100755 --- a/emojitrans2.pl +++ b/emojitrans2.pl @@ -57,10 +57,11 @@ sub splitup { unless (/^#/) { my $hold=$_; + s///; s// /; s({([][[:alnum:] _+:;%@>=`<,.^\$+#()?!/|'\\~*{}♫-]+)})(splitup($1))e; if (length($1) > 7) { $_=$hold; - s/^/### /; + s/^/### /; } } diff --git a/parens.compose b/parens.compose new file mode 100644 index 0000000..100e79c --- /dev/null +++ b/parens.compose @@ -0,0 +1,177 @@ + <1> : "⑴" U2474 # PARENTHESIZED DIGIT ONE + <2> : "⑵" U2475 # PARENTHESIZED DIGIT TWO + <3> : "⑶" U2476 # PARENTHESIZED DIGIT THREE + <4> : "⑷" U2477 # PARENTHESIZED DIGIT FOUR + <5> : "⑸" U2478 # PARENTHESIZED DIGIT FIVE + <6> : "⑹" U2479 # PARENTHESIZED DIGIT SIX + <7> : "⑺" U247A # PARENTHESIZED DIGIT SEVEN + <8> : "⑻" U247B # PARENTHESIZED DIGIT EIGHT + <9> : "⑼" U247C # PARENTHESIZED DIGIT NINE + <1> <0> : "⑽" U247D # PARENTHESIZED NUMBER TEN + <1> <1> : "⑾" U247E # PARENTHESIZED NUMBER ELEVEN + <1> <2> : "⑿" U247F # PARENTHESIZED NUMBER TWELVE + <1> <3> : "⒀" U2480 # PARENTHESIZED NUMBER THIRTEEN + <1> <4> : "⒁" U2481 # PARENTHESIZED NUMBER FOURTEEN + <1> <5> : "⒂" U2482 # PARENTHESIZED NUMBER FIFTEEN + <1> <6> : "⒃" U2483 # PARENTHESIZED NUMBER SIXTEEN + <1> <7> : "⒄" U2484 # PARENTHESIZED NUMBER SEVENTEEN + <1> <8> : "⒅" U2485 # PARENTHESIZED NUMBER EIGHTEEN + <1> <9> : "⒆" U2486 # PARENTHESIZED NUMBER NINETEEN + <2> <0> : "⒇" U2487 # PARENTHESIZED NUMBER TWENTY + : "⒜" U249C # PARENTHESIZED LATIN SMALL LETTER A + : "⒝" U249D # PARENTHESIZED LATIN SMALL LETTER B + : "⒞" U249E # PARENTHESIZED LATIN SMALL LETTER C + : "⒟" U249F # PARENTHESIZED LATIN SMALL LETTER D + : "⒠" U24A0 # PARENTHESIZED LATIN SMALL LETTER E + : "⒡" U24A1 # PARENTHESIZED LATIN SMALL LETTER F + : "⒢" U24A2 # PARENTHESIZED LATIN SMALL LETTER G + : "⒣" U24A3 # PARENTHESIZED LATIN SMALL LETTER H + : "⒤" U24A4 # PARENTHESIZED LATIN SMALL LETTER I + : "⒥" U24A5 # PARENTHESIZED LATIN SMALL LETTER J + : "⒦" U24A6 # PARENTHESIZED LATIN SMALL LETTER K + : "⒧" U24A7 # PARENTHESIZED LATIN SMALL LETTER L + : "⒨" U24A8 # PARENTHESIZED LATIN SMALL LETTER M + : "⒩" U24A9 # PARENTHESIZED LATIN SMALL LETTER N + : "⒪" U24AA # PARENTHESIZED LATIN SMALL LETTER O +

: "🄟" U1F11F # PARENTHESIZED LATIN CAPITAL LETTER P + : "🄠" U1F120 # PARENTHESIZED LATIN CAPITAL LETTER Q + : "🄡" U1F121 # PARENTHESIZED LATIN CAPITAL LETTER R + : "🄢" U1F122 # PARENTHESIZED LATIN CAPITAL LETTER S + : "🄣" U1F123 # PARENTHESIZED LATIN CAPITAL LETTER T + : "🄤" U1F124 # PARENTHESIZED LATIN CAPITAL LETTER U + : "🄥" U1F125 # PARENTHESIZED LATIN CAPITAL LETTER V + : "🄦" U1F126 # PARENTHESIZED LATIN CAPITAL LETTER W + : "🄧" U1F127 # PARENTHESIZED LATIN CAPITAL LETTER X + : "🄨" U1F128 # PARENTHESIZED LATIN CAPITAL LETTER Y + : "🄩" U1F129 # PARENTHESIZED LATIN CAPITAL LETTER Z + <1> : "⒈" U2488 # DIGIT ONE FULL STOP + <2> : "⒉" U2489 # DIGIT TWO FULL STOP + <3> : "⒊" U248A # DIGIT THREE FULL STOP + <4> : "⒋" U248B # DIGIT FOUR FULL STOP + <5> : "⒌" U248C # DIGIT FIVE FULL STOP + <6> : "⒍" U248D # DIGIT SIX FULL STOP + <7> : "⒎" U248E # DIGIT SEVEN FULL STOP + <8> : "⒏" U248F # DIGIT EIGHT FULL STOP + <9> : "⒐" U2490 # DIGIT NINE FULL STOP + <1> <0> : "⒑" U2491 # NUMBER TEN FULL STOP + <1> <1> : "⒒" U2492 # NUMBER ELEVEN FULL STOP + <1> <2> : "⒓" U2493 # NUMBER TWELVE FULL STOP + <1> <3> : "⒔" U2494 # NUMBER THIRTEEN FULL STOP + <1> <4> : "⒕" U2495 # NUMBER FOURTEEN FULL STOP + <1> <5> : "⒖" U2496 # NUMBER FIFTEEN FULL STOP + <1> <6> : "⒗" U2497 # NUMBER SIXTEEN FULL STOP + <1> <7> : "⒘" U2498 # NUMBER SEVENTEEN FULL STOP + <1> <8> : "⒙" U2499 # NUMBER EIGHTEEN FULL STOP + <1> <9> : "⒚" U249A # NUMBER NINETEEN FULL STOP + <2> <0> : "⒛" U249B # NUMBER TWENTY FULL STOP + <0> : "🄀" U1F100 # DIGIT ZERO FULL STOP + <1> <1> : "⓫" U24EB # NEGATIVE CIRCLED NUMBER ELEVEN + <1> <2> : "⓬" U24EC # NEGATIVE CIRCLED NUMBER TWELVE + <1> <3> : "⓭" U24ED # NEGATIVE CIRCLED NUMBER THIRTEEN + <1> <4> : "⓮" U24EE # NEGATIVE CIRCLED NUMBER FOURTEEN + <1> <5> : "⓯" U24EF # NEGATIVE CIRCLED NUMBER FIFTEEN + <1> <6> : "⓰" U24F0 # NEGATIVE CIRCLED NUMBER SIXTEEN + <1> <7> : "⓱" U24F1 # NEGATIVE CIRCLED NUMBER SEVENTEEN + <1> <8> : "⓲" U24F2 # NEGATIVE CIRCLED NUMBER EIGHTEEN + <1> <9> : "⓳" U24F3 # NEGATIVE CIRCLED NUMBER NINETEEN + <2> <0> : "⓴" U24F4 # NEGATIVE CIRCLED NUMBER TWENTY + <0> : "⓿" U24FF # NEGATIVE CIRCLED DIGIT ZERO + <1> : "❶" U2776 # DINGBAT NEGATIVE CIRCLED DIGIT ONE + <2> : "❷" U2777 # DINGBAT NEGATIVE CIRCLED DIGIT TWO + <3> : "❸" U2778 # DINGBAT NEGATIVE CIRCLED DIGIT THREE + <4> : "❹" U2779 # DINGBAT NEGATIVE CIRCLED DIGIT FOUR + <5> : "❺" U277A # DINGBAT NEGATIVE CIRCLED DIGIT FIVE + <6> : "❻" U277B # DINGBAT NEGATIVE CIRCLED DIGIT SIX + <7> : "❼" U277C # DINGBAT NEGATIVE CIRCLED DIGIT SEVEN + <8> : "❽" U277D # DINGBAT NEGATIVE CIRCLED DIGIT EIGHT + <9> : "❾" U277E # DINGBAT NEGATIVE CIRCLED DIGIT NINE + <1> <0> : "❿" U277F # DINGBAT NEGATIVE CIRCLED NUMBER TEN + : "🅐" U1F150 # NEGATIVE CIRCLED LATIN CAPITAL LETTER A + : "🅑" U1F151 # NEGATIVE CIRCLED LATIN CAPITAL LETTER B + : "🅒" U1F152 # NEGATIVE CIRCLED LATIN CAPITAL LETTER C + : "🅓" U1F153 # NEGATIVE CIRCLED LATIN CAPITAL LETTER D + : "🅔" U1F154 # NEGATIVE CIRCLED LATIN CAPITAL LETTER E + : "🅕" U1F155 # NEGATIVE CIRCLED LATIN CAPITAL LETTER F + : "🅖" U1F156 # NEGATIVE CIRCLED LATIN CAPITAL LETTER G + : "🅗" U1F157 # NEGATIVE CIRCLED LATIN CAPITAL LETTER H + : "🅘" U1F158 # NEGATIVE CIRCLED LATIN CAPITAL LETTER I + : "🅙" U1F159 # NEGATIVE CIRCLED LATIN CAPITAL LETTER J + : "🅚" U1F15A # NEGATIVE CIRCLED LATIN CAPITAL LETTER K + : "🅛" U1F15B # NEGATIVE CIRCLED LATIN CAPITAL LETTER L + : "🅜" U1F15C # NEGATIVE CIRCLED LATIN CAPITAL LETTER M + : "🅝" U1F15D # NEGATIVE CIRCLED LATIN CAPITAL LETTER N + : "🅞" U1F15E # NEGATIVE CIRCLED LATIN CAPITAL LETTER O +

: "🅟" U1F15F # NEGATIVE CIRCLED LATIN CAPITAL LETTER P + : "🅠" U1F160 # NEGATIVE CIRCLED LATIN CAPITAL LETTER Q + : "🅡" U1F161 # NEGATIVE CIRCLED LATIN CAPITAL LETTER R + : "🅢" U1F162 # NEGATIVE CIRCLED LATIN CAPITAL LETTER S + : "🅣" U1F163 # NEGATIVE CIRCLED LATIN CAPITAL LETTER T + : "🅤" U1F164 # NEGATIVE CIRCLED LATIN CAPITAL LETTER U + : "🅥" U1F165 # NEGATIVE CIRCLED LATIN CAPITAL LETTER V + : "🅦" U1F166 # NEGATIVE CIRCLED LATIN CAPITAL LETTER W + : "🅧" U1F167 # NEGATIVE CIRCLED LATIN CAPITAL LETTER X + : "🅨" U1F168 # NEGATIVE CIRCLED LATIN CAPITAL LETTER Y + : "🅩" U1F169 # NEGATIVE CIRCLED LATIN CAPITAL LETTER Z + : "🅰" U1F170 # NEGATIVE SQUARED LATIN CAPITAL LETTER A + : "🅱" U1F171 # NEGATIVE SQUARED LATIN CAPITAL LETTER B + : "🅲" U1F172 # NEGATIVE SQUARED LATIN CAPITAL LETTER C + : "🅳" U1F173 # NEGATIVE SQUARED LATIN CAPITAL LETTER D + : "🅴" U1F174 # NEGATIVE SQUARED LATIN CAPITAL LETTER E + : "🅵" U1F175 # NEGATIVE SQUARED LATIN CAPITAL LETTER F + : "🅶" U1F176 # NEGATIVE SQUARED LATIN CAPITAL LETTER G + : "🅷" U1F177 # NEGATIVE SQUARED LATIN CAPITAL LETTER H + : "🅸" U1F178 # NEGATIVE SQUARED LATIN CAPITAL LETTER I + : "🅹" U1F179 # NEGATIVE SQUARED LATIN CAPITAL LETTER J + : "🅺" U1F17A # NEGATIVE SQUARED LATIN CAPITAL LETTER K + : "🅻" U1F17B # NEGATIVE SQUARED LATIN CAPITAL LETTER L + : "🅼" U1F17C # NEGATIVE SQUARED LATIN CAPITAL LETTER M + : "🅽" U1F17D # NEGATIVE SQUARED LATIN CAPITAL LETTER N + : "🅾" U1F17E # NEGATIVE SQUARED LATIN CAPITAL LETTER O +

: "🅿" U1F17F # NEGATIVE SQUARED LATIN CAPITAL LETTER P + : "🆀" U1F180 # NEGATIVE SQUARED LATIN CAPITAL LETTER Q + : "🆁" U1F181 # NEGATIVE SQUARED LATIN CAPITAL LETTER R + : "🆂" U1F182 # NEGATIVE SQUARED LATIN CAPITAL LETTER S + : "🆃" U1F183 # NEGATIVE SQUARED LATIN CAPITAL LETTER T + : "🆄" U1F184 # NEGATIVE SQUARED LATIN CAPITAL LETTER U + : "🆅" U1F185 # NEGATIVE SQUARED LATIN CAPITAL LETTER V + : "🆆" U1F186 # NEGATIVE SQUARED LATIN CAPITAL LETTER W + : "🆇" U1F187 # NEGATIVE SQUARED LATIN CAPITAL LETTER X + : "🆈" U1F188 # NEGATIVE SQUARED LATIN CAPITAL LETTER Y + : "🆉" U1F189 # NEGATIVE SQUARED LATIN CAPITAL LETTER Z + : "🆏" U1F18F # NEGATIVE SQUARED WC + <1> : "⓵" U24F5 # DOUBLE CIRCLED DIGIT ONE + <2> : "⓶" U24F6 # DOUBLE CIRCLED DIGIT TWO + <3> : "⓷" U24F7 # DOUBLE CIRCLED DIGIT THREE + <4> : "⓸" U24F8 # DOUBLE CIRCLED DIGIT FOUR + <5> : "⓹" U24F9 # DOUBLE CIRCLED DIGIT FIVE + <6> : "⓺" U24FA # DOUBLE CIRCLED DIGIT SIX + <7> : "⓻" U24FB # DOUBLE CIRCLED DIGIT SEVEN + <8> : "⓼" U24FC # DOUBLE CIRCLED DIGIT EIGHT + <9> : "⓽" U24FD # DOUBLE CIRCLED DIGIT NINE + <1> <0> : "⓾" U24FE # DOUBLE CIRCLED NUMBER TEN -- cgit v1.2.3 From 19c513019dcc864c0a039b1e4affe4f6eef21f46 Mon Sep 17 00:00:00 2001 From: Mark Shoulson Date: Wed, 8 Mar 2017 10:31:21 -0500 Subject: Fixed some comments. Added just 2 or 3 new chars. --- dotXCompose | 5 ++++- emojitrans2.pl | 3 ++- modletters-base | 4 ++-- modletters.compose | 5 ++++- 4 files changed, 12 insertions(+), 5 deletions(-) (limited to 'emojitrans2.pl') diff --git a/dotXCompose b/dotXCompose index 0666a4c..2437cbb 100644 --- a/dotXCompose +++ b/dotXCompose @@ -770,6 +770,9 @@ include "%L" : "✉" U2709 # ENVELOPE : "♿" U267F # WHEELCHAIR SYMBOL : "☤" U2624 # CADEUCEUS +## Don't usually do sequences, but exception made for the +## "eyewitness" compound emoji sequence: + : "👁️‍🗨️" # Something different for STAFF OF AESCULAPIUS? <1> : "⚕" U2695 # STAFF OF AESCULAPIUS # 26B0 COFFIN ? @@ -914,9 +917,9 @@ include "%L" : "Ꞌ" UA78B # LATIN CAPITAL LETTER SALTILLO # I'll use capitals for a different double : "ʬ" U02AC # LATIN LETTER BILABIAL PERCUSSIVE +# Also handy for writing urls: http://ʬw.omniglot.com/ # Sorry, I miss having this and hate having to use colon instead: : "ː" U02D0 # MODIFIER LETTER TRIANGULAR COLON -# Also handy for writing urls: http://ʬw.omniglot.com/ # ɣ? ᴥ? Important enough to add? ᴥ is cool just as a "latin" letter. : "ɣ" U0263 # LATIN SMALL LETTER GAMMA # It looks like a ɣ and makes an "o" sorta sound: diff --git a/emojitrans2.pl b/emojitrans2.pl index c978b7e..27ee545 100755 --- a/emojitrans2.pl +++ b/emojitrans2.pl @@ -29,6 +29,7 @@ BEGIN { binmode(STDOUT, ":utf8"); '{' => 'braceleft', '}' => 'braceright', "'" => 'apostrophe', + '"' => 'quotedbl', '\\' => 'backslash', ':' => 'colon', ';' => 'semicolon', @@ -59,7 +60,7 @@ unless (/^#/) { my $hold=$_; s///; s// /; - s({([][[:alnum:] _+:;%@>=`<,.^\$+#()?!/|'\\~*{}♫-]+)})(splitup($1))e; + s({([][[:alnum:] _+:;%@>=`<,.^\$+#()?!/|'"\\~*{}♫-]+)})(splitup($1))e; if (length($1) > 7) { $_=$hold; s/^/### /; diff --git a/modletters-base b/modletters-base index 1945572..d85b5ef 100644 --- a/modletters-base +++ b/modletters-base @@ -468,6 +468,6 @@ #- 1EFD;LATIN SMALL LETTER MIDDLE-WELSH V;Ll;0;L;;;;;N;;;1EFC;;1EFC {!#ww} : "ỽ" U1EFD # LATIN SMALL LETTER MIDDLE-WELSH V #- A78B;LATIN CAPITAL LETTER SALTILLO;Lu;0;L;;;;;N;;;;A78C; - {!#/"} "Ꞌ" # LATIN CAPITAL LETTER SALTILLO + {!#/"} : "Ꞌ" UA78B # LATIN CAPITAL LETTER SALTILLO #- A78C;LATIN SMALL LETTER SALTILLO;Ll;0;L;;;;;N;;;A78B;;A78B - {!#/'} "ꞌ" # LATIN SMALL LETTER SALTILLO + {!#/'} : "ꞌ" UA78C # LATIN SMALL LETTER SALTILLO diff --git a/modletters.compose b/modletters.compose index ea3cf43..caa9e4e 100644 --- a/modletters.compose +++ b/modletters.compose @@ -1,4 +1,3 @@ -### I think this is going to be a private one. ### For davka *letters*, not punctuation that looks like it. ### Mnemonic/signal: <♫>!#, because they are not numbers. ### Maybe #!^ for ones that are just raised letters? Those not as critical. @@ -468,3 +467,7 @@ : "Ỽ" U1EFC # LATIN CAPITAL LETTER MIDDLE-WELSH V #- 1EFD;LATIN SMALL LETTER MIDDLE-WELSH V;Ll;0;L;;;;;N;;;1EFC;;1EFC : "ỽ" U1EFD # LATIN SMALL LETTER MIDDLE-WELSH V +#- A78B;LATIN CAPITAL LETTER SALTILLO;Lu;0;L;;;;;N;;;;A78C; + : "Ꞌ" UA78B # LATIN CAPITAL LETTER SALTILLO +#- A78C;LATIN SMALL LETTER SALTILLO;Ll;0;L;;;;;N;;;A78B;;A78B + : "ꞌ" UA78C # LATIN SMALL LETTER SALTILLO -- cgit v1.2.3

: "⒫" U24AB # PARENTHESIZED LATIN SMALL LETTER P + : "⒬" U24AC # PARENTHESIZED LATIN SMALL LETTER Q + : "⒭" U24AD # PARENTHESIZED LATIN SMALL LETTER R + : "⒮" U24AE # PARENTHESIZED LATIN SMALL LETTER S + : "⒯" U24AF # PARENTHESIZED LATIN SMALL LETTER T + : "⒰" U24B0 # PARENTHESIZED LATIN SMALL LETTER U + : "⒱" U24B1 # PARENTHESIZED LATIN SMALL LETTER V + : "⒲" U24B2 # PARENTHESIZED LATIN SMALL LETTER W + : "⒳" U24B3 # PARENTHESIZED LATIN SMALL LETTER X + : "⒴" U24B4 # PARENTHESIZED LATIN SMALL LETTER Y + : "⒵" U24B5 # PARENTHESIZED LATIN SMALL LETTER Z + : "🄐" U1F110 # PARENTHESIZED LATIN CAPITAL LETTER A + : "🄑" U1F111 # PARENTHESIZED LATIN CAPITAL LETTER B + : "🄒" U1F112 # PARENTHESIZED LATIN CAPITAL LETTER C + : "🄓" U1F113 # PARENTHESIZED LATIN CAPITAL LETTER D + : "🄔" U1F114 # PARENTHESIZED LATIN CAPITAL LETTER E + : "🄕" U1F115 # PARENTHESIZED LATIN CAPITAL LETTER F + : "🄖" U1F116 # PARENTHESIZED LATIN CAPITAL LETTER G + : "🄗" U1F117 # PARENTHESIZED LATIN CAPITAL LETTER H + : "🄘" U1F118 # PARENTHESIZED LATIN CAPITAL LETTER I + : "🄙" U1F119 # PARENTHESIZED LATIN CAPITAL LETTER J + : "🄚" U1F11A # PARENTHESIZED LATIN CAPITAL LETTER K + : "🄛" U1F11B # PARENTHESIZED LATIN CAPITAL LETTER L + : "🄜" U1F11C # PARENTHESIZED LATIN CAPITAL LETTER M + : "🄝" U1F11D # PARENTHESIZED LATIN CAPITAL LETTER N + : "🄞" U1F11E # PARENTHESIZED LATIN CAPITAL LETTER O +