|
|
(未显示2个用户的5个中间版本) |
第1行: |
第1行: |
| {{Dup|Talk:聊天字母}}
| | Chart generator (current version) |
| This adaptable C++ code converts [[聊天字母|ASCII-based alphabet]] to ampersand-encoded [[PUA]].
| |
| There may be bugs. [http://tio.run/##7Vjdb9s2EH/XX8G4WGAjDiyK@kTiAEEfigIbVrTYU@AHhaIdoTLlSnK8rsjfnh15lE05tus2yfawJUDo@/wdj3c8OnyxOOdFKmePj28yMc2lIB8@/v7u4/Vvzptc8mKZCXLJ6ybLy6sup8rlDFjGSBT5FP7UguRTZzQi7@Vi2RAhs5rkkkixKkDLWco6n0mREX6XVoSP3QsyGuVKdUuUf7mJJ2sh@bIUS@HksgFBYVmhgBRCzpo7h5eyBg3QKsT9jReEk/E3x9U/w50LeSXhaETDfwmYeRrYR55PcfE65r6/w9yPUBggGaBlgJYBM0K0DAJcQlwiBezHzlkQBT4bun8KN@G4RLikYA5rGGoyNFxDGWGSDJUDl2mnEQJHBjhC4AiBIwSONHDor1OtvCB@eKudBS76Zrco9FCISH5ohALJSC8sRso3UQVIJtqSTZHyFHDs6h0ztPONootLbMzRG0PzBKNiAKy3iuEkPprQI85YAyemuMxWp3rxKFLcpBrJxHAzXJgRBihELkMqMDsOMZEMvbeRY1VTqC7FxMAZHiAzblpkk2SBS4xC45zh0TPDTQ9tOXIeLkaj609v378nTUk@/HFN@r@Ke1EMrE6fVel/u9NN3XtPNKCmQpXuFweGTj/GXNV0opeQhXZUQZz8HLDV6RZE/AKb0kH6HbfYzklkdXqMvBgbPg4P@9Y@k2462A/uOFkXlzb3jzLXwN5@YRDH3aioNvE7VQ2drv2YNOCNGeNNBbOB7IBkqOrhIcPtrrnxji5@V6X3wu5iLuT/Xfy6wHBHuHyrixUvRRHOCTORXDMnXB9JHBAuXvduZIR4h7vJc7v4n0o1dPFhc7WbWyhXx7kv84wslvVdHx@qdPDNgYdtH16fV3X@lyjVx4FikuauKlf9nkqheY2W96KaFuWqN7hwyIOj3rJgNxlzeqGI4mwMHx4MCC9EWrUoY1e5nIt5LRoAGLpDC0wb37gbP@OTE255WsCDvOl6wojHSBAVjX6n99HP2PNCcnqqvFKgKAsM5SkqjLQRavvASULNUBw1dIHLJpNL6iXIthLhkXqRckFSqZIoebNMm7yUhKfwTaBsyK2Aj4u8SQvYXabTRFSiCO5h2u/9wuE3u@gN4aEAV9AG75yGWv2hDQ1256/jUs/@A3Gxl45rg2fF1c1x4ltp9Hamke4J13@lNNLdafS207gvruCV0kgPpJF64U/nMfx@vPMUvtTO8ywrVOy1@KFknj0nmdGrBLcBPduXURZtJdQw9rlUIxpdoj/8st@1qHtDuKmewNHNcW1Oy1UJwYtpkw7qkqXMMyGbfJqb/wWkvBFVbw265cHbjtqKYVeIOw/RbTdlRQ2HSNuQTTp3h0yPCdn28LyQN56MhWNbrcNiUwjrsyxXkoiqKqt2GJl5Qwd6cKi31zzNZX@grJvqq/KxussL0ecnYy8IMFI@nolGbayPpQcb4pAekwozeVAERdzU/V5bo7h7pcyMss23hhMx43bbzjON36KAAozyt3i/EPUvo21/9PRU4wX7/WKLop6Zczv1GL3koAVHFsJysr5zyNEzFClAa7ffgXkyK9bq9Ah12kJ/X7@4gqzgO@Tc6kY7q7YB7HutbNldUu@AXVu32zF0z3ONvPu4zbjc8m@V0dNycLbxO57Nvbwp0QeeQin38buHfi3NRV2nM3Ez0Z6nuoANb1g3GbSPrrlPq3QB/SVIsypJWs2Wc@j5GkpB39Orsvqcy5nusUo0y0oSF1rs8fFv Try it online!]
| |
|
| |
|
| <pre class="mw-collapsible">#define PROGRAM | | <pre>import sys |
| #include <cstdio>
| | import os.path |
| #include <cstring>
| | import pypinyin |
| #define elif else if | | import xdi8string # all the characters spaced out translated into shidinn |
| // Input ends in newline
| | f=open("wikifile.txt","w",encoding="utf-8") |
| unsigned char c=0; //input
| |
| unsigned char iq[8]; //input queue
| |
| int iql=0; //input queue length
| |
| const int lev[256]={
| |
| 000000,000000,000000,000000, 000000,000000,000000,000000, 000000,000000,000000,000000, 000000,000000,000000,000000, //16
| |
| 000000,000000,000000,000000, 000000,000000,000000,000000, 000000,000000,000000,000000, 000000,000000,000000,000000, //32
| |
| 000040,000041,000042,000000, 000044,000000,000000,000047, 000050,000051,000052,000053, 000054,000055,000056,000057, //48
| |
| +57543,0xe09c,0xe097,0xe09a, 0xe066,0xe067,0xe096,0xe06a, 0xe099,+57503,000072,000073, 000074,000075,000076,000077, //64
| |
| 000000,0xe093,0xe06b,+57550, 0xe03b,0xe092,0xe069,+57546, 0xe03e,+57547,+57538,+57544, 0xe095,+57549,0xe03f,+57542, //80
| |
| +57537,+57545,+57540,+57548, 0xe098,+57539,0xe09b,+57536, +57502,0xe094,+57541,000000, 000000,000000,000000,000002, //96
| |
| 000003,0xe06f,0xe021,0xe06c, 0xe061,0xe091,0xe06d,0xe063, 0xe065,0xe09d,0xe035,0xe054, 0xe060,0xe033,0xe039,0xe090, //112
| |
| 0xe032,0xe036,0xe03d,0xe03c, 0xe062,0xe06e,0xe068,0xe034, 0xe037,0xe038,0xe03a,000000, 000000,000000,000007
| |
| };//ASCII to PUA (Level)
| |
| const int gra[256]={
| |
| 000000,000000,000000,000000, 000000,000000,000000,000000, 000000,000000,000000,000000, 000000,000000,000000,000000, //16
| |
| 000000,000000,000000,000000, 000000,000000,000000,000000, 000000,000000,000000,000000, 000000,000000,000000,000000, //32
| |
| 000000,0xe020,000000,000000, +57637,000000,000000,000000, 000000,000000,000000,000000, 000000,000000,000000,000000, //48
| |
| 000000,000000,000000,000000, 000000,+57590,+57636,000000, +57589,000000,000000,000000, 000000,000000,000000,000000, //64
| |
| 000000,000000,+57598,000000, 000000,000000,000000,000000, 000000,000000,000000,000000, +57634,000000,+57595,+57597, //80
| |
| +57585,+57587,+57586,000000, 000000,000000,000000,+57639, 000000,+57593,000000,000000, 000000,000000,000000,000000, //96
| |
| 000000,+57594,000000,000000, 000000,000000,000000,+57632, 000000,000000,000000,+57588, 000000,+57591,+57640,000000, //112
| |
| +57635,+57599,+57584,+57551, 000000,000000,+57633,+57592, +57596,+57638
| |
| };//ASCII to PUA (Grave)
| |
| const int cen[256]={
| |
| 000000,000000,000000,000000, 000000,000000,000000,000000, 000000,000000,000000,000000, 000000,000000,000000,000000, //16
| |
| 000000,000000,000000,000000, 000000,000000,000000,000000, 000000,000000,000000,000000, 000000,000000,000000,000000, //32
| |
| 000000,000000,000000,000000, 000000,000000,000000,000000, 000000,000000,000000,000000, 000000,000000,0xe00c,000000, //48
| |
| 0xe00a,0xe001,0xe002,0xe003, 0xe004,0xe005,0xe006,0xe007, 0xe008,0xe009,000000,000000, 000000,000000,000000,000000, //64
| |
| 000000,000000,000000,000000, 000000,000000,000000,000000, 000000,000000,000000,000000, 000000,000000,000000,000000, //80
| |
| 000000,000000,000000,000000, 0xe00b
| |
| };
| |
|
| |
|
| void push(char c1){
| | characters=[chr(i) for i in range(0x4e00,0xa000)] |
| if(iql>sizeof(iq)){
| | plaintext=' '.join(chr(n) for n in range(0x4e00,0xa000)) |
| throw("e001 queue overflow");
| | ciphertext=xdi8string.output |
| }
| |
| iq[iql]=c1;
| |
| iql+=1;
| |
| }
| |
|
| |
|
| void clear(char c1=0){
| | b1i45=[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, |
| memset(iq,0,sizeof(iq));
| | 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, |
| iq[0]=c1;
| | 0,(0),0,0,0,0,0,0,0,0,0,0,0,0,0,0, |
| iql=!!c1;
| | 0,44,39,42,22,23,38,26,41,0,0,0,0,0,0,0, |
| }
| | 0,35,27,0,11,34,25,0,14,0,0,0,37,0,15,0, |
| | 0,0,0,0,40,0,43,0,0,36,0,0,0,0,0,0, |
| | 0,31,1,28,17,33,29,19,21,45,5,20,16,3,9,32, |
| | 2,6,13,12,18,30,24,4,7,8,10,0,0,0,0,0,0] |
| | b1i90000=[(((i-1)%9+1) * (10**((i-1)//9))if i!=0 else 0) for i in b1i45] |
|
| |
|
| void print(char c1=0){
| | def b1i45encode(word): |
| if(iql==0){
| | return ' '.join((str(b1i45[ord(q)]) if len(str(b1i45[ord(q)]))>=2 else '0'+str(b1i45[ord(q)])) for q in word) |
| ;
| |
| } elif(iq[0]==226 && iq[1]==135 && iq[2]==167){
| |
| if(iq[4]==96){
| |
| if(gra[iq[3]]<129){
| |
| throw("e002 space and punctuation can not be capitalized"); | |
| }
| |
| printf("%c%c%d;",38,35,gra[iq[3]]-16);
| |
| }
| |
| if(iql==4){
| |
| if(lev[iq[3]]<129){
| |
| throw("e003 space and punctuation can not be capitalized");
| |
| }
| |
| printf("%c%c%d;",38,35,lev[iq[3]]-16);
| |
| }
| |
| } elif(iq[0]==94){
| |
| if(iq[2]==96){
| |
| if(gra[iq[1]]<129){
| |
| throw("e004 space and punctuation can not be capitalized");
| |
| }
| |
| printf("%c%c%d;",38,35,gra[iq[1]]-16);
| |
| }
| |
| if(iql==2){
| |
| if(lev[iq[1]]<129){
| |
| throw("e005 space and punctuation can not be capitalized");
| |
| }
| |
| printf("%c%c%d;",38,35,lev[iq[1]]-16);
| |
| }
| |
| } elif(iq[0]==126){
| |
| if(iq[2]==96){
| |
| if(gra[iq[1]]<129){
| |
| throw("e006 space and punctuation can not be made middle case");
| |
| }
| |
| printf("%c%c%d;",38,35,gra[iq[1]]+16);
| |
| }
| |
| if(iql==2){
| |
| if(lev[iq[1]]<129){
| |
| throw("e007 space and punctuation can not be made middle case");
| |
| }
| |
| printf("%c%c%d;",38,35,lev[iq[1]]+16);
| |
| }
| |
| } elif(iq[0]==37){
| |
| if(iq[2]==37){
| |
| printf("%c%c%d;",38,35,cen[iq[1]]);
| |
| } else {
| |
| printf("%s",iq);
| |
| }
| |
| } elif(iq[1]==96){
| |
| if(gra[iq[0]]<10){
| |
| throw("e010 unidentified character");
| |
| } elif(gra[iq[0]]<127){
| |
| printf("%s",iq);
| |
| } else {
| |
| printf("%c%c%d;",38,35,gra[iq[0]]);
| |
| }
| |
| } elif(iql==1){
| |
| if(lev[iq[0]]<10){
| |
| throw("e011 unidentified character");
| |
| } elif(lev[iq[0]]<127){
| |
| printf("%s",iq);
| |
| } else {
| |
| printf("%c%c%d;",38,35,lev[iq[0]]);
| |
| }
| |
| } else {
| |
| throw("e03f unknown error");
| |
| }
| |
| clear(c1);
| |
| }
| |
|
| |
|
| int main() {
| | def b1i90000sum(word): |
| try{
| | return sum([b1i90000[ord(q)] for q in word]) |
| while(c!=255){
| | |
| c=getchar();
| | plain=plaintext.split() |
| if(c==10){
| | cipher=ciphertext.split() |
| print();
| | |
| puts("");
| | maxlength=0 |
| } elif(c==13){
| | maxlench=[] |
| ;
| | |
| } elif(iql==0){
| | f.write("Do not simply rely on this chart to translate, as this chart did not handle [[talk:希顶日本语#注意多音字|homograph]] properly. The calculation may be incorrect. If so, please fix it.") |
| push(c);
| | |
| } elif(c==226){
| | f.write("{| class=\"wikitable sortable\"\n"); |
| print(c); //Capital sign
| | f.write("! Character !! Unicode decimal !! Stroke count !! han4 yu3 pin1 yin1 !! xdi8 aho !! [[b1i45密码|b1i45]] !! xdi8 aho letter count !! [[希顶解经|Numeral sum]] !! Stress pattern !! Notes\n") |
| } elif(iql==1&&c==135){
| | for p in range(len(plain)): |
| push(c);
| | if(plain[p]!=cipher[p]): |
| } elif(iql==2&&c==167){
| | f.write("|-\n"); |
| push(c);
| | f.write("| "+plain[p]+" || ") |
| } elif(31<c&&c<126&&c!=96){
| | f.write(str(ord(plain[p]))) |
| if(iq[0]==226 && iq[1]==135 && iq[2]==167 && iql==3){
| | f.write(" || || ") |
| push(c);
| | f.write(pypinyin.pinyin(characters[p],style=pypinyin.Style.TONE3,neutral_tone_with_five=True)[0][0]) |
| } elif(iq[0]==94 && iql==1){
| | f.write(" || "+cipher[p]) |
| push(c);
| | f.write(" || "+b1i45encode(cipher[p])) |
| } elif(iq[0]==126 && iql==1){
| | f.write(" || "+str(len(cipher[p]))) |
| push(c);
| | f.write(" || "+str(b1i90000sum(cipher[p])) + "\n") |
| } elif(iql>1&&iq[iql-1]==96){
| | if(maxlength<len(cipher[p])): |
| print(c);
| | maxlench=[p] |
| } elif(31<iq[iql-1]&&iq[iql-1]<126){
| | maxlength=len(cipher[p]) |
| print(c);
| | elif(maxlength<=len(cipher[p])): |
| } else {
| | maxlench+=[p] |
| push(c);
| | f.write("|}") |
| }
| | print(maxlench,maxlength,len(maxlench)) |
| } elif(c==96){
| | |
| push(c);
| | f.close(); |
| } elif(c==94){
| | </pre> |
| print(c);
| |
| } elif(c==126){
| |
| print(c);
| |
| } else {
| |
| push(c);
| |
| }
| |
| }
| |
| print();
| |
| }catch(const char message[]){
| |
| fputs(message,stderr); //Swap the two arguments if not working
| |
| }
| |
| return 0;
| |
| }</pre>
| |
Chart generator (current version)
import sys
import os.path
import pypinyin
import xdi8string # all the characters spaced out translated into shidinn
# Output file that receives the generated wikitext; the statements further
# down in this script write to it and close it.
f = open("wikifile.txt", "w", encoding="utf-8")
# One single-character string for every code point in U+4E00..U+9FFF.
characters = list(map(chr, range(0x4E00, 0xA000)))
# The same characters joined into one space-separated string.
plaintext = ' '.join(characters)
# Presumably the same space-separated sequence after translation by the
# xdi8string module -- NOTE(review): confirm against xdi8string itself.
ciphertext = xdi8string.output
# Characters that carry a b1i45 code, listed so that the character at
# position k (counting from 1) has code k.
_B1I45_LETTERS = "bpmwjqxynzDsrHNldtgkh45vF7BcfuaoeEAYL62T83V1i"
_B1I45_CODES = {
    letter: code for code, letter in enumerate(_B1I45_LETTERS, start=1)
}

# b1i45[n] is the code (1..45) of the character whose code point is n, or 0
# when that character has no code.  The table covers code points 0..128.
b1i45 = [_B1I45_CODES.get(chr(point), 0) for point in range(129)]


def _b1i90000_value(code):
    """Return the b1i90000 value for a b1i45 *code*; code 0 maps to 0.

    Codes are taken in groups of nine: the position inside the group gives a
    digit 1..9 and the group index gives the power of ten, so 1..9 -> 1..9,
    10..18 -> 10..90, and so on up to 37..45 -> 10000..90000.
    """
    if code == 0:
        return 0
    power, digit = divmod(code - 1, 9)
    return (digit + 1) * 10 ** power


# b1i90000[n] is the numeric value of the character whose code point is n,
# derived from its b1i45 code.
b1i90000 = [_b1i90000_value(code) for code in b1i45]
def b1i45encode(word):
    """Return the b1i45 codes of the characters in *word* as text.

    Each character is looked up in the ``b1i45`` table by its code point and
    rendered as a number padded to at least two digits; the numbers are
    separated by single spaces.  A character whose code point lies beyond the
    end of the table raises ``IndexError``.
    """
    codes = (b1i45[ord(letter)] for letter in word)
    return ' '.join(str(code).zfill(2) for code in codes)
def b1i90000sum(word):
    """Return the sum of the ``b1i90000`` values of the characters in *word*.

    Each character is looked up in the ``b1i90000`` table by its code point;
    an empty *word* gives 0.  A character whose code point lies beyond the end
    of the table raises ``IndexError``.
    """
    total = 0
    for letter in word:
        total += b1i90000[ord(letter)]
    return total
# Split both space-separated strings into parallel lists, so that cipher[p]
# is the entry that corresponds to plain[p].
plain = plaintext.split()
cipher = ciphertext.split()
# Longest cipher entry seen so far, and the indices p that reach that length.
maxlength = 0
maxlench = []
try:
    # The notice has to end with a newline: MediaWiki only recognises "{|" as
    # the start of a table when it is the first thing on a line.
    f.write("Do not simply rely on this chart to translate, as this chart did not handle [[talk:希顶日本语#注意多音字|homograph]] properly. The calculation may be incorrect. If so, please fix it.\n")
    f.write("{| class=\"wikitable sortable\"\n")
    f.write("! Character !! Unicode decimal !! Stroke count !! han4 yu3 pin1 yin1 !! xdi8 aho !! [[b1i45密码|b1i45]] !! xdi8 aho letter count !! [[希顶解经|Numeral sum]] !! Stress pattern !! Notes\n")
    for p, char in enumerate(plain):
        code = cipher[p]
        # Entries whose cipher text is identical to the character get no row.
        # NOTE(review): the source lost its indentation; everything down to
        # the length bookkeeping is taken to be nested under this comparison.
        # The row itself must be, because b1i45encode only accepts code
        # points inside its lookup table -- confirm the bookkeeping nesting.
        if char == code:
            continue
        reading = pypinyin.pinyin(
            characters[p],
            style=pypinyin.Style.TONE3,
            neutral_tone_with_five=True,
        )[0][0]
        # One table row, written in a single call.  The cell after the code
        # point (the "Stroke count" column) is intentionally left empty, and
        # the last two header columns get no cell.
        f.write(
            "|-\n| {} || {} || || {} || {} || {} || {} || {}\n".format(
                char,
                ord(char),
                reading,
                code,
                b1i45encode(code),
                len(code),
                b1i90000sum(code),
            )
        )
        # Track every index whose cipher entry has the maximum length.
        if maxlength < len(code):
            maxlench = [p]
            maxlength = len(code)
        elif maxlength == len(code):
            maxlench.append(p)
    f.write("|}")
    # Report the indices of the longest entries, that length, and their count.
    print(maxlench, maxlength, len(maxlench))
finally:
    # Close the output file even when a lookup or write above raises.
    f.close()