% This is the cweb file cefsconv.w of the CJK Package Ver. 4.8.5 16-Oct-2021 % Copyright (C) 1994-2021 Werner Lemberg % % This program is free software; you can redistribute it and/or modify % it under the terms of the GNU General Public License as published by % the Free Software Foundation; either version 2 of the License, or % (at your option) any later version. % % This program is distributed in the hope that it will be useful, % but WITHOUT ANY WARRANTY; without even the implied warranty of % MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the % GNU General Public License for more details. % % You should have received a copy of the GNU General Public License % along with this program in doc/COPYING; if not, write to the Free % Software Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, % MA 02110-1301 USA % To print this CWEB file you should (but not must) use the CWEAVE of the % c2cweb-package (found at the CTAN archives, e.g. ftp.dante.de) and then say % % cweave +a cefsconv.w % % This (fully compatible) CWEAVE can transform CWEB-files with alternative % output rules (look at the position of braces below!) the author (it's me % too :-) prefer. Otherwise this file will be formatted traditionally. \def\title{cefsconv (CJK Version 4.8.5)} \def\topofcontents{ \null\vfill \centerline{\titlefont The {\ttitlefont cefsconv} program} \vskip 20pt \centerline{(CJK Version 4.8.5)} \vfill} \def\botofcontents{ \vfill \noindent Copyright \copyright\ 1996, 1998 by Werner Lemberg \bigskip\noindent Permission is granted to make and distribute verbatim copies of this document provided that the copyright notice and this permission notice are preserved on all copies. \smallskip\noindent Permission is granted to copy and distribute modified versions of this document under the conditions for verbatim copying, provided that the entire resulting derived work is distributed under the terms of a permission notice identical to this one.} \pageno=\contentspagenumber \advance\pageno by 1 \let\maybe=\iftrue \fullpageheight=240mm \pageheight=223mm \pagewidth=158mm \setpage \frenchspacing \noinx \nosecs \nocon @* Function and Use. This small program will convert SJIS encoding with CNS encoded Chinese characters using the {\it Chinese Encoding Framework (CEF)} into a `preprocessed' form. The need of this program arises from the fact that SJIS encoding uses the characters `\.{\\}', `\.{\{}', and `\.{\}}' which have special meanings in \TeX. Use this program as a filter: \hskip 2em \.{cefsconv < input\_file > output\_file} @* The program. In contrast to \.{cefconv} two tasks will be executed: Replacing all occurrences of two byte SJIS encoded characters \.{XY} with \.{\char94 \char94 7fX\char94 \char94 7fZZZ\char94 \char94 7f} (\.{X} and \.{Y} are the first and the second byte of the character; \.{ZZZ} represents the second byte as a decimal number). Replacing CEF macros of the form \.{\&xx-yyzz;} (\.{xx} can be C1--C7 for the CNS planes 1--7, C0 for Big~5 encoding, an encoding CX reserved for IRIZ, a private encoding CY, and U for Unicode encoding; \.{yyzz} is a hexadecimal representation of the code point in this plane) with \medskip \quad\.{\char94 \char94 7f72\char94 \char94 7fXX\char94 \char94 7f% \char94 \char94 7f"0yy\char94 \char94 7f"0zz\char94 \char94 7f}\quad. \medskip \.{XX} is the corresponding CJK encoding of \.{xx}; the number `72' specifies a macro in the file \.{MULEenc.sty} which further processes this representation -- it is necessary to explicitly load this file with \.{\\usepackage}. Additionally we define a \TeX\ macro at the very beginning to signal a preprocessed file. The following code is very simple. No error detection is done because \TeX\ which will see the output of \.{cefsconv} complains loudly if something is wrong. Note that the user-defined character area of SJIS (with the first bytes in the range 0xF0--0xFC) is not supported because it is not portable. @d banner "cefsconv (CJK ver. 4.8.5)" @c #include #include #include @# int main(int argc, char *argv[]) {int ch, i; unsigned char in[16]; unsigned char out[32]; unsigned char *inp, *outp; fprintf(stdout, "\\def\\CNSpreproc{%s}", banner);@# ch = fgetc(stdin);@# while(!feof(stdin)) {if((ch >= 0x81 && ch <= 0x9F) || (ch >= 0xE0 && ch <= 0xEF)) {fprintf(stdout, "\177%c\177", ch);@# ch = fgetc(stdin); if(!feof(stdin)) fprintf(stdout, "%d\177", ch); } else if(ch == '&') /* the macro test is hardcoded to make things simple */ {inp = in; outp = out; *inp = ch; *(++inp) = fgetc(stdin);@# if(*inp == 'C' && !feof(stdin)) {*(++inp) = fgetc(stdin); if(*inp == '0' && !feof(stdin)) {*(outp++) = 'B'; *(outp++) = 'g'; *(outp++) = '5'; } else if(*inp >= '1' && *inp <= '7' && !feof(stdin)) {*(outp++) = 'C'; *(outp++) = 'N'; *(outp++) = 'S'; *(outp++) = *inp; } else if((*inp == 'X' || *inp == 'Y') && !feof(stdin)) {*(outp++) = 'C'; *(outp++) = 'E'; *(outp++) = 'F'; *(outp++) = *inp; } else goto no_macro; } else if(*inp == 'U' && !feof(stdin)) {*(outp++) = 'U'; *(outp++) = 'T'; *(outp++) = 'F'; *(outp++) = '8'; } else goto no_macro;@# *(++inp) = fgetc(stdin); if(*inp != '-' || feof(stdin)) goto no_macro;@# *(outp++) = '\177'; *(outp++) = '\177'; *(outp++) = '\"'; *(outp++) = '0';@# *(++inp) = fgetc(stdin); if(isxdigit(*inp) && *inp < 0x80 && !feof(stdin)) *(outp++) = toupper(*inp); else goto no_macro;@# *(++inp) = fgetc(stdin); if(isxdigit(*inp) && *inp < 0x80 && !feof(stdin)) *(outp++) = toupper(*inp); else goto no_macro;@# *(outp++) = '\177'; *(outp++) = '\"'; *(outp++) = '0';@# *(++inp) = fgetc(stdin); if(isxdigit(*inp) && *inp < 0x80 && !feof(stdin)) *(outp++) = toupper(*inp); else goto no_macro;@# *(++inp) = fgetc(stdin); if(isxdigit(*inp) && *inp < 0x80 && !feof(stdin)) *(outp++) = toupper(*inp); else goto no_macro;@# *(outp++) = '\177'; *outp = '\0';@# *(++inp) = fgetc(stdin); if(*inp != ';' || feof(stdin)) goto no_macro;@# outp = out; fprintf(stdout, "\17772\177"); while(*outp) fputc(*(outp++), stdout);@# ch = fgetc(stdin); continue;@# no_macro: ch = *inp; i = inp - in; inp = in; while(i--) fputc(*(inp++), stdout); continue; } else fputc(ch, stdout);@# ch = fgetc(stdin); } exit(EXIT_SUCCESS); return 0; /* never reached */ }