This is charsets.c in view mode; [Download] [Up]
/* * charsets.c - Character set conversions. * * Written by * Jouko Valta (jopi@stekt.oulu.fi) * * This file is part of VICE, the Versatile Commodore Emulator. * See README for copyright notice. * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program; if not, write to the Free Software * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA * 02111-1307 USA. * */ #include "vice.h" #include <stdio.h> #include <stdlib.h> #include <ctype.h> #include "charsets.h" /* ------------------------------------------------------------------------- */ void petconvstring(char *c, int dir) { char *p = c; switch (dir) { case 0: /* to petscii */ for (; *p; p++) *p = p_topetcii(*p); break; case 1: /* to ascii */ case 2: /* to ascii, convert also screencodes */ --dir; for (; *p; p++) { *p = p_toascii(*p, dir); } } } void unix_filename(char *p) { while(*p) { if (*p == '/') *p= '_'; p++; } } int p_toascii(int c, int cs) { c &= 0xff; switch (c) { case 0x0a: case 0x0d: return (cs ? (c | 0x40) : '\n'); /* Pet screen codes or CR/LF */ case 0x40: case 0x60: return (c); case 0xa0: /* CBM: Shifted Space */ case 0xe0: return (' '); case 0xff: return (0x7e); default: switch (c & 0xe0) { case 0x40: /* 41 - 7E */ case 0x60: return (c ^ 0x20); case 0xc0: /* C0 - DF */ return (c ^ 0x80); case 0x00: /* 01 - 1F */ if (cs && c) /* Pet screen codes */ return (c | 0x40); } /* switch */ } /* switch */ return ((isprint(c) ? c : '.')); } int p_topetcii(int c) { if (c == 0x7e) /* '~' is ASCII for 'pi' */ return (0xff); else if ((c >= 0x5b) && (c <= 0x7e)) return (c ^ 0x20); else if ((c >= 'A') && (c <= 'Z')) /* C0 - DF */ return (c | 0x80); return (c); } /* ------------------------------------------------------------------------- */ /* * Control Codes */ /* * Printer's control code symbols */ char *ctrl1[] = { "", "", "", "", "", "wht", "", "", "dish", "ensh", "\n", "", "\f", "\n", "swlc", "", "", "down", "rvon", "home", "del", "", "", "", "", "", "", "esc", "red", "rght", "grn", "blu" }; char *ctrl2[] = { "", "orng", "", "", "", "F1", "F3", "F5", "F7", "F2", "F4", "F6", "F8", "sret", "swuc", "", "blk", "up", "rvof", "clr", "inst", "brn", "lred", "gry1", "gry2", "lgrn", "lblu", "gry3", "pur", "left", "yel", "cyn" }; char *cbmkeys[] = { "SHIFT-SPACE", "CBM-K", "CBM-I", "CBM-T", "CBM-@", "CBM-G", "CBM-+", "CBM-M", "CBM-POUND", "SHIFT-POUND", "CBM-N", "CBM-Q", "CBM-D", "CBM-Z", "CBM-S", "CBM-P", "CBM-A", "CBM-E", "CBM-R", "CBM-W", "CBM-H", "CBM-J", "CBM-L", "CBM-Y", "CBM-U", "CBM-O", "SHIFT-@", "CBM-F", "CBM-C", "CBM-X", "CBM-V", "CBM-B" }; char *ctrl_to_str(int clean, BYTE c) { static char buf[16]; if (c == 0x0a || c == 0xc || c == 0xd) return (ctrl1[c]); /* The rest of control codes must be skipped when clean is set */ if (!clean) { if ((c < 0x20) && *ctrl1[c]) sprintf(buf, "(%s)", ctrl1[c]); else if (((c & 0x7f) < 0x20) && *ctrl2[c & 0x1f]) sprintf(buf, "(%s)", ctrl2[c & 0x1f]); else sprintf(buf, "($%02x)", c & 0xff); return (buf); } /* !clean */ return (NULL); } char *cbm_to_str(BYTE c) { static char buf[16]; switch (c) { case 0x60: return "(SHIFT-*)"; case 0x7c: return "(CBM--)"; /* Conflicts with Scandinavian Chars */ case 0x7f: return "(CBM-*)"; /* case 0xff: return "(pi)"; */ default: if ((c > 0xa0 && c <= 0xbf) || (c > 0xe0 && c <= 0xfe)) sprintf (buf, "(%s)", cbmkeys[c & 0x1f]); else return (NULL); } /* switch */ return (buf); } /* ------------------------------------------------------------------------- */ /* * Commodore's International character sets */ static char *langnames[] = { /* International Charsets */ "commodore", /* CBM */ "usa", /* US */ "germany", /* GER */ "denmark-1", /* DEN1 */ "france", /* FRA */ "sweden-1", /* SWE1 */ "italy", /* ITA */ "spain", /* SPA */ "denmark-2", /* DEN2 */ "sweden-2", /* SWE2 */ "finland", /* FIN */ "norway", /* NOR */ "england" /* UK */ "commodore-din" /* C-DIN */ }; /* 7-bit */ /* ASCII/ISO 646 family */ static BYTE ASCextens[][11] = { /* graphics/uppercase -- uppercase/lowercase */ { 0x23, 0x24, 0x40, 0x5b,0x5c,0x5d, 0x2b,0x7c,0x7d,0x26 }, /* CBM */ { 0x23, 0x24, 0x40, 0x5b,0x5c,0x5d, 0x7b,0x7c,0x7d,0x7e }, /* US */ { 0x23, 0x24, 0x40, 0x5b,0x5c,0x55, 0x7b,0x7c,0x75,0x7e }, /* GER */ { 0x23, 0x24, 0x40, 0x7b,0x7c,0x7d, 0x5b,0x5c,0x5d,0x7e }, /* DEN1 */ { 0x23, 0x24, 0x40, 0x5b,0x5c,0x5d, 0x7b,0x7c,0x7d,0x7e }, /* FRA */ { 0x23, 0x24, 0x40, 0x7b,0x7c,0x7d, 0x5b,0x5c,0x5d,0x7e }, /* SWE1 */ { 0x23, 0x24, 0x40, 0x5b,0x5c,0x5d, 0x7b,0x7c,0x7d,0x7e }, /* ITA */ { 0x23, 0x24, 0x40, 0x5b,0x5c,0x5d, 0x7b,0x7c,0x7d,0x7e }, /* SPA */ { 0x23, 0x24, 0x40, 0x5b,0x5c,0x5d, 0x7b,0x7c,0x7d,0x7e }, /* DEN2 */ { 0x23, 0x24, 0x40, 0x5b,0x5c,0x5d, 0x7b,0x7c,0x7d,0x7e }, /* SWE2 */ { 0x23, 0x24, 0x40, 0x5b,0x5c,0x5d, 0x7b,0x7c,0x7d,0x7e }, /* UK */ { 0x23, 0x24, 0x40, 0x5b,0x5c,0x5d, 0x2b,0x7c,0x7d,0x26 } /* CBM-DIN */ }; /* 8-bit */ static BYTE ISOextens[][11] = { { 0x23, 0x24, 0x40, 0x5B, 0xA3, 0x5D, 0x2B, 0x7C, 0x7D, 0x26 }, { 0x23, 0x24, 0x40, 0x5B, 0x5C, 0x5D, 0x7B, 0x7C, 0x7D, 0x7E }, { 0x23, 0x24, 0xA7, 0xC4, 0xD6, 0xDC, 0xE4, 0xF6, 0xFC, 0xDF }, { 0x23, 0x24, 0x40, 0xE6, 0xF8, 0xE5, 0xC6, 0xD8, 0xC5, 0x7E }, { 0x23, 0x24, 0xE0, 0xB0, 0xE7, 0xA7, 0xE9, 0xF9, 0xE8, 0x98 }, { 0x23, 0xA4, 0xC9, 0xE4, 0xF6, 0xE5, 0xC4, 0xD6, 0xC5, 0xFC }, { 0x23, 0x24, 0x40, 0xB0, 0x5C, 0xE9, 0xE0, 0xF2, 0xE8, 0xEC }, { 0xA0, 0x24, 0x40, 0xA1, 0xD1, 0xBF, 0x98, 0xF1, 0x7D, 0x7E }, { 0x23, 0x24, 0x40, 0xC6, 0xD8, 0xC5, 0xE6, 0xF8, 0xE6, 0x7E }, { 0x23, 0xA4, 0xC9, 0xC4, 0xD6, 0xC5, 0xE4, 0xF6, 0xE5, 0xFC }, { 0x23, 0x24, 0x40, 0xC4, 0xD6, 0xC5, 0xE4, 0xF6, 0xE5, 0x7E }, { 0x23, 0xA4, 0xC9, 0xC6, 0xD8, 0xC5, 0xE6, 0xF8, 0xE6, 0xFC }, { 0xA3, 0x24, 0x40, 0x5B, 0x5C, 0x5D, 0x7B, 0x7C, 0x7D, 0x7E }, { 0x23, 0x24, 0xA7, 0x5B, 0xA3, 0x5D, 0x2B, 0x7C, 0x7D, 0x26 } }; /* * C64 Uppercase 97-122 (61-7A) and 160-192 (A0-C0) to ASCII */ static BYTE ASCgraphics1[] = { 35,124, 45, 45, 45, 45,124,124, 92, 92, 47, 92, 92, 47, 47, 92, 35, 95, 35,124, 47, 88, 79, 35,124, 35 }; static BYTE ASCgraphics2[] = { 32,124, 35, 45, 45,124, 35,124, 35, 47,124,124, 47, 92, 92, 45, 47, 45, 45,124,124,124,124, 45, 45, 45, 47, 92, 92, 47, 47, 35 }; /* ------------------------------------------------------------------------- */ static BYTE (*extens)[11] = &ASCextens[0]; static BYTE *graphics1 = (BYTE *)ASCgraphics1; static BYTE *graphics2 = (BYTE *)ASCgraphics2; int set_locale(char *localename) { if (!localename && !(localename = getenv("LC_CTYPE")) ) return (-1); if (!strcmp(localename, "Latin1") || !strcmp(localename, "iso_8859_1") || !strcmp(localename, "iso-8859-1")) { extens = ISOextens; graphics1 = (BYTE *)ASCgraphics1; graphics2 = (BYTE *)ASCgraphics2; } else { extens = ASCextens; graphics1 = (BYTE *)ASCgraphics1; graphics2 = (BYTE *)ASCgraphics2; } return (0); } /* * PETSCII to ASCII or 8-bit conversion. Alas, there is not just * one or two conversions, but a complete chaos... * -- and then there are all the various standard sets... */ /* * Convert a national CBM character to its standard * international equivalent. * * Parameters: * lang 0-10 CBM language codes * case 0 lowercase, otherwise uppercase * c byte to convert */ int p_toichar(int lang, int lwcase, BYTE c) { if (lang < 0 || lang > NUM_LANGUAGES) { fprintf (stderr, "Fatal error: language not recognized.\n"); exit (2); } /* Duplicate codes C0 - DF */ if ((c >= 0xc0) && (c <= 0xdf)) /* Same as 96 - 127 */ c ^= 0xa0; else if (c == 255) c = 126; /* CBM-x Graphics Images A0 - BF, E0 - FE */ else if (c >= 0xa0) /* C0 -- FF is handled by now */ c = graphics2[c & 0x1f]; /* @ / Eacute / Section */ #if 0 if (c == 0x40) return (extens1[lang][2]); else if (c == 0x60) { /* Standard mode: vertical bar; all others: left quote (`) */ } #endif /* Alphabetics ... */ if ((c >= 0x41) && (c <= 0x5a)) { if (lwcase) c ^= 0x20; } else if ((c >= 0x5b) && (c <= 0x5d)) { if (!lwcase && (lang == CS_DEN1 || lang == CS_SWE1)) c = extens[lang][c -0x5b + 6]; else c = extens[lang][c -0x58]; } else if ((c >= 0x61) && (c <= 0x7a)) { if (lwcase) c ^= 0x20; else c = graphics1[c -0x61]; } else if ((c >= 0x7b) && (c <= 0x7e)) { c = extens[lang][c -0x7b + 6]; } return (c); } /* ------------------------------------------------------------------------- */ /* * Language name to code. */ int str_to_lang(char *name) { int j, token; char *p, *q; if (!name || !*name) return (-1); for (p = name; *p; p++) { if (isalpha ((int)*p)) *p = tolower(*p); else if (*p == '_' || *p == '/') *p = '-'; } for (token = 0; token < NUM_LANGUAGES; token++) { for (p = langnames[token], q = (char *)name, j = 0; *p && *q && *p == *q; p++, q++, j++); /* found an exact match */ if (j && !*p) { /*fprintf (stderr, "found %s %2x\n", langnames[token], token);*/ return token; } } /* for */ return (-1); }
These are the contents of the former NiCE NeXT User Group NeXTSTEP/OpenStep software archive, currently hosted by Netfuture.ch.