1
Fork 0
mirror of https://git.savannah.gnu.org/git/guile.git synced 2025-04-30 11:50:28 +02:00
guile/libguile/mbstrings.c
Jim Blandy 20e6290e38 C files should #include only the header files they need, not
libguile.h (which #includes all the header files); the pointless
recompilation was wasting my time.
* Makefile.in (all .o dependency lists): Regenerated.
* libguile.h: Don't try to get a definition for size_t here...
* __scm.h: Do it here.
* _scm.h: Since this is the internal libguile header, put things
here that all (or a majority) of the libguile files will want.
Don't #include <libguile.h> here; that generates dependencies on
way too much.  Instead, get "__scm.h", "error.h", "pairs.h",
"list.h", "gc.h", "gsubr.h", "procs.h", "numbers.h", "symbols.h",
"boolean.h", "strings.h", "vectors.h", "root.h", "ports.h", and
"async.h".
* alist.c: Get "eq.h", "list.h", "alist.h".
* append.c: Get "append.h", "list.h".
* arbiters.c: Get "arbiters.h", "smob.h".
* async.c: Get "async.h", "smob.h", "throw.h", "eval.h".
* boolean.c: Get "boolean.h".
* chars.c: Get "chars.h".
* continuations.c: Get "continuations.h", "dynwind.h", "debug.h",
"stackchk.h".
* debug.c: Get "debug.h", "feature.h", "read.h", "strports.h",
"continuations.h", "alist.h", "srcprop.h", "procprop.h", "smob.h",
"genio.h", "throw.h", "eval.h".
* dynwind.c: Get "dynwind.h", "alist.h", "eval.h".
* eq.c: Get "eq.h", "unif.h", "smob.h", "strorder.h",
"stackchk.h".
* error.c: Get "error.h", "throw.h", "genio.h", "pairs.h".
* eval.c: Get "eval.h", "stackchk.h", "srcprop.h", "debug.h",
"hashtab.h", "procprop.h", "markers.h", "smob.h", "throw.h",
"continuations.h", "eq.h", "sequences.h", "alist.h", "append.h",
"debug.h".
* fdsocket.c: Get "fdsocket.h", "unif.h", "filesys.h".
* feature.c: Get "feature.h".
* files.c: Get "files.h".
* filesys.c: Get "filesys.h", "smob.h", "genio.h".
* fports.c: Get "fports.h", "markers.h".
* gc.c: Get "async.h", "unif.h", "smob.h", "weaks.h",
"genio.h", "struct.h", "stackchk.h", "stime.h".
* gdbint.c: Get "gdbint.h", "chars.h", "eval.h", "print.h",
"read.h", "strports.h", "tag.h".
* genio.c: Get "genio.h", "chars.h".
* gsubr.c: Get "gsubr.h", "genio.h".
* hash.c: Get "hash.h", "chars.h".
* hashtab.c: Get "hashtab.h", "eval.h", "hash.h", "alist.h".
* init.c: Get everyone who has an scm_init_mumble function:
"weaks.h", "vports.h", "version.h", "vectors.h", "variable.h",
"unif.h", "throw.h", "tag.h", "symbols.h", "struct.h",
"strports.h", "strorder.h", "strop.h", "strings.h", "stime.h",
"stackchk.h", "srcprop.h", "socket.h", "simpos.h", "sequences.h",
"scmsigs.h", "read.h", "ramap.h", "procs.h", "procprop.h",
"print.h", "posix.h", "ports.h", "pairs.h", "options.h",
"objprop.h", "numbers.h", "mbstrings.h", "mallocs.h", "load.h",
"list.h", "kw.h", "ioext.h", "hashtab.h", "hash.h", "gsubr.h",
"gdbint.h", "gc.h", "fports.h", "filesys.h", "files.h",
"feature.h", "fdsocket.h", "eval.h", "error.h", "eq.h",
"dynwind.h", "debug.h", "continuations.h", "chars.h", "boolean.h",
"async.h", "arbiters.h", "append.h", "alist.h".
* ioext.c: Get "ioext.h", "fports.h".
* kw.c: Get "kw.h", "smob.h", "mbstrings.h", "genio.h".
* list.c: Get "list.h", "eq.h".
* load.c: Get "load.h", "eval.h", "read.h", "fports.h".
* mallocs.c: Get "smob.h", "genio.h".
* markers.c: Get "markers.h".
* mbstrings.c: Get "mbstrings.h", "read.h", "genio.h", "unif.h",
"chars.h".
* numbers.c: Get "unif.h", "genio.h".
* objprop.c: Get "objprop.h", "weaks.h", "alist.h", "hashtab.h".
* options.c: Get "options.h".
* ports.c: Get "ports.h", "vports.h", "strports.h", "fports.h",
"markers.h", "chars.h", "genio.h".
* posix.c: Get "posix.h", "sequences.h", "feature.h", "unif.h",
"read.h", "scmsigs.h", "genio.h", "fports.h".
* print.c: Get "print.h",  "unif.h", "weaks.h", "read.h",
"procprop.h", "eval.h", "smob.h", "mbstrings.h", "genio.h",
"chars.h".
* procprop.c: Get "procprop.h", "eval.h", "alist.h".
* procs.c: Get "procs.h".
* ramap.c: Get "ramap.h", "feature.h", "eval.h", "eq.h",
"chars.h", "smob.h", "unif.h".
* read.c: Get "alist.h", "kw.h", "mbstrings.h", "unif.h",
"eval.h", "genio.h", "chars.h".
* root.c: Get "root.h", "stackchk.h".
* scmsigs.c: Get "scmsigs.h".
* sequences.c: Get "sequences.h".
* simpos.c: Get "simpos.h", "scmsigs.h".
* smob.c: Get "smob.h".
* socket.c: Get "socket.h", "feature.h".
* srcprop.c: Get "srcprop.h", "weaks.h", "hashtab.h", "debug.h",
"alist.h", "smob.h".
* stackchk.c: Get "stackchk.h", "genio.h".
* stime.c: Get "stime.h", "libguile/continuations.h".
* strings.c: Get "strings.h", "chars.h".
* strop.c: Get "strop.h", "chars.h".
* strorder.c: Get "strorder.h", "chars.h".
* strports.c: Get "strports.h", "print.h", "eval.h", "unif.h".
* struct.c: Get "struct.h", "chars.h".
* symbols.c: Get "symbols.h", "mbstrings.h", "alist.h",
"variable.h", "eval.h", "chars.h".
* tag.c: Get "tag.h", "struct.h", "chars.h".
* throw.c: Get "throw.h", "continuations.h", "debug.h",
"dynwind.h", "eval.h", "alist.h", "smob.h", "genio.h".
* unif.c: Get "unif.h", "feature.h", "strop.h", "sequences.h",
"smob.h", "genio.h", "eval.h", "chars.h".
* variable.c: Get "variable.h", "smob.h", "genio.h".
* vectors.c: Get "vectors.h", "eq.h".
* version.c: Get "version.h".
* vports.c: Get "vports.h", "fports.h", "chars.h", "eval.h".
* weaks.c: Get "weaks.h".
1996-09-10 02:26:07 +00:00

573 lines
11 KiB
C
Raw Blame History

This file contains invisible Unicode characters

This file contains invisible Unicode characters that are indistinguishable to humans but may be processed differently by a computer. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

/* Copyright (C) 1995, 1996 Free Software Foundation, Inc.
*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; either version 2, or (at your option)
* any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this software; see the file COPYING. If not, write to
* the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, USA.
*
* As a special exception, the Free Software Foundation gives permission
* for additional uses of the text contained in its release of GUILE.
*
* The exception is that, if you link the GUILE library with other files
* to produce an executable, this does not by itself cause the
* resulting executable to be covered by the GNU General Public License.
* Your use of that executable is in no way restricted on account of
* linking the GUILE library code into it.
*
* This exception does not however invalidate any other reasons why
* the executable file might be covered by the GNU General Public License.
*
* This exception applies only to the code released by the
* Free Software Foundation under the name GUILE. If you copy
* code from other Free Software Foundation releases into a copy of
* GUILE, as the General Public License permits, the exception does
* not apply to the code that you add in this way. To avoid misleading
* anyone as to the status of such modified files, you must delete
* this exception notice from them.
*
* If you write modifications of your own for GUILE, it is your choice
* whether to permit this exception to apply to your modifications.
* If you do not wish that, delete this exception notice.
*/
#include "extchrs.h"
#include <stdio.h>
#include "_scm.h"
#include "chars.h"
#include "unif.h"
#include "genio.h"
#include "read.h"
#include "mbstrings.h"
/* Scheme procedure `multi-byte-string?'.
   Yields SCM_BOOL_T when OBJ satisfies SCM_MB_STRINGP and SCM_BOOL_F
   otherwise.  */
SCM_PROC(s_multi_byte_string_p, "multi-byte-string?", 1, 0, 0, scm_multi_byte_string_p);
#ifdef __STDC__
SCM
scm_multi_byte_string_p (SCM obj)
#else
SCM
scm_multi_byte_string_p (obj)
     SCM obj;
#endif
{
  if (SCM_MB_STRINGP (obj))
    return SCM_BOOL_T;
  return SCM_BOOL_F;
}
/* Predicate on OBJ: yields SCM_BOOL_T when OBJ satisfies
   SCM_REGULAR_STRINGP and SCM_BOOL_F otherwise.  No SCM_PROC
   declaration accompanies this function in this file.  */
#ifdef __STDC__
SCM
scm_regular_string_p (SCM obj)
#else
SCM
scm_regular_string_p (obj)
     SCM obj;
#endif
{
  if (SCM_REGULAR_STRINGP (obj))
    return SCM_BOOL_T;
  return SCM_BOOL_F;
}
/* Scheme procedures `list->multi-byte-string' (one list argument) and
   `multi-byte-string' (rest arguments); both are bound to this function.

   CHRS must be a proper list of characters.  A string of
   length(CHRS) * XMB_CUR_MAX bytes is allocated and retagged as
   scm_tc7_mb_string, every character is encoded into it with xwctomb,
   and the result is finally resized to the number of bytes actually
   used.  A character for which xwctomb reports 0 bytes is counted as
   occupying one byte.  Signals a wrong-type error on argument 1 when
   CHRS is not a proper list, when an element is not a character, or
   when xwctomb reports a negative length.  */
SCM_PROC(s_list_to_multi_byte_string, "list->multi-byte-string", 1, 0, 0, scm_multi_byte_string);
SCM_PROC(s_multi_byte_string, "multi-byte-string", 0, 0, 1, scm_multi_byte_string);
#ifdef __STDC__
SCM
scm_multi_byte_string (SCM chrs)
#else
SCM
scm_multi_byte_string (chrs)
     SCM chrs;
#endif
{
  SCM result;
  char *bytes;
  long budget;
  long nbytes = 0;

  budget = scm_ilength (chrs);
  SCM_ASSERT (budget >= 0, chrs, SCM_ARG1, s_multi_byte_string);

  /* Worst case: every character needs XMB_CUR_MAX bytes.  */
  budget *= XMB_CUR_MAX;
  result = scm_makstr (budget, 0);
  SCM_SETLENGTH (result, SCM_LENGTH (result), scm_tc7_mb_string);
  bytes = SCM_CHARS (result);

  /* Null-buffer call made before encoding starts; presumably resets
     the converter state as wctomb (NULL, 0) does -- confirm against
     extchrs.  */
  xwctomb (0, 0);

  for (; budget != 0 && SCM_NNULLP (chrs); chrs = SCM_CDR (chrs), --budget)
    {
      SCM item = SCM_CAR (chrs);
      int written;

      SCM_ASSERT (SCM_ICHRP (item), chrs, SCM_ARG1, s_multi_byte_string);
      written = xwctomb (bytes + nbytes, SCM_ICHR (item));
      SCM_ASSERT (written >= 0, chrs, SCM_ARG1, s_multi_byte_string);
      nbytes += (written == 0) ? 1 : written;
    }

  return scm_vector_set_length_x (result, SCM_MAKINUM (nbytes));
}
/* Count the characters encoded in the SIZE bytes starting at DATA.

   The buffer is walked with xmblen.  A reported length of 0 is treated
   as a one-byte character; a negative length makes the whole call
   return -1.  Otherwise the number of characters found is returned.  */
#ifdef __STDC__
int
scm_mb_ilength (unsigned char * data, int size)
#else
int
scm_mb_ilength (data, size)
     unsigned char * data;
     int size;
#endif
{
  int offset = 0;
  int count;

  /* Null-buffer call made before scanning; presumably resets the
     converter state as mblen (NULL, 0) does -- confirm against
     extchrs.  */
  xmblen (0, 0);

  for (count = 0; offset < size; ++count)
    {
      int step = xmblen (data + offset, size - offset);

      if (step < 0)
        return -1;
      offset += (step == 0) ? 1 : step;
    }
  return count;
}
/* Scheme procedure `multi-byte-string-length'.
   STR must be a non-immediate object satisfying SCM_ROSTRINGP.
   Returns, as a fixnum, the character count computed by
   scm_mb_ilength over STR's bytes; signals a wrong-type error on
   argument 1 when STR is not such a string or when scm_mb_ilength
   reports a negative count.  */
SCM_PROC(s_multi_byte_string_length, "multi-byte-string-length", 1, 0, 0, scm_multi_byte_string_length);
#ifdef __STDC__
SCM
scm_multi_byte_string_length (SCM str)
#else
SCM
scm_multi_byte_string_length (str)
     SCM str;
#endif
{
  unsigned char * bytes;
  int nbytes;
  int nchars;

  SCM_ASSERT (SCM_NIMP (str) && SCM_ROSTRINGP (str), str, SCM_ARG1, s_multi_byte_string_length);

  bytes = SCM_ROCHARS (str);
  nbytes = SCM_ROLENGTH (str);
  nchars = scm_mb_ilength (bytes, nbytes);

  SCM_ASSERT (nchars >= 0, str, SCM_ARG1, s_multi_byte_string_length);
  return SCM_MAKINUM (nchars);
}
/* Scheme procedure `symbol-multi-byte?'.
   Returns the value stored in SYMBOL's multi-byte flag
   (SCM_SYMBOL_MULTI_BYTE_SCM_STRINGP).

   The flag is only read when SYMBOL is a non-immediate object tagged
   scm_tc7_msymbol, which is the same condition under which
   scm_set_symbol_multi_byte_x writes it.  For anything else
   SCM_BOOL_F is returned instead of reading memory that does not hold
   the flag.  */
SCM_PROC(s_symbol_multi_byte_p, "symbol-multi-byte?", 1, 0, 0, scm_symbol_multi_byte_p);
#ifdef __STDC__
SCM
scm_symbol_multi_byte_p (SCM symbol)
#else
SCM
scm_symbol_multi_byte_p (symbol)
     SCM symbol;
#endif
{
  /* SCM_NIMP first: the type tag may only be inspected on
     non-immediate objects.  */
  if (SCM_NIMP (symbol) && SCM_TYP7 (symbol) == scm_tc7_msymbol)
    return SCM_SYMBOL_MULTI_BYTE_SCM_STRINGP (symbol);
  return SCM_BOOL_F;
}
/* Scheme procedure `set-symbol-multi-byte!'.
   When SYMBOL is a non-immediate object tagged scm_tc7_msymbol, store
   SCM_BOOL_F in its multi-byte flag if VAL is false and SCM_BOOL_T
   otherwise.  Any other SYMBOL is silently left untouched.  Always
   returns SCM_UNSPECIFIED.  */
SCM_PROC(s_set_symbol_multi_byte_x, "set-symbol-multi-byte!", 2, 0, 0, scm_set_symbol_multi_byte_x);
#ifdef __STDC__
SCM
scm_set_symbol_multi_byte_x (SCM symbol, SCM val)
#else
SCM
scm_set_symbol_multi_byte_x (symbol, val)
     SCM symbol;
     SCM val;
#endif
{
  /* SCM_NIMP first: the type tag may only be inspected on
     non-immediate objects, so an immediate argument must not reach
     SCM_TYP7.  */
  if (SCM_NIMP (symbol) && SCM_TYP7 (symbol) == scm_tc7_msymbol)
    {
      SCM_SYMBOL_MULTI_BYTE_SCM_STRINGP(symbol) = (SCM_FALSEP (val)
                                                   ? SCM_BOOL_F
                                                   : SCM_BOOL_T);
    }
  return SCM_UNSPECIFIED;
}
/* Scheme procedure `regular-port?'.
   Yields SCM_BOOL_T when the representation recorded for port P is
   scm_regular_port, SCM_BOOL_F otherwise.  P is not type-checked
   here.  */
SCM_PROC(s_regular_port_p, "regular-port?", 1, 0, 0, scm_regular_port_p);
#ifdef __STDC__
SCM
scm_regular_port_p (SCM p)
#else
SCM
scm_regular_port_p (p)
     SCM p;
#endif
{
  if (SCM_PORT_REPRESENTATION(p) == scm_regular_port)
    return SCM_BOOL_T;
  return SCM_BOOL_F;
}
/* Scheme procedure `regular-port!'.
   Marks port P as using the scm_regular_port representation and
   returns SCM_UNSPECIFIED.  P is not type-checked here.  */
SCM_PROC(s_regular_port_x, "regular-port!", 1, 0, 0, scm_regular_port_x);
#ifdef __STDC__
SCM
scm_regular_port_x (SCM p)
#else
SCM
scm_regular_port_x (p)
     SCM p;
#endif
{
  SCM_PORT_REPRESENTATION(p) = scm_regular_port;

  return SCM_UNSPECIFIED;
}
/* Scheme procedure `multi-byte-port?'.
   Yields SCM_BOOL_T when the representation recorded for port P is
   scm_mb_port, SCM_BOOL_F otherwise.  P is not type-checked here.  */
SCM_PROC(s_multi_byte_port_p, "multi-byte-port?", 1, 0, 0, scm_multi_byte_port_p);
#ifdef __STDC__
SCM
scm_multi_byte_port_p (SCM p)
#else
SCM
scm_multi_byte_port_p (p)
     SCM p;
#endif
{
  if (SCM_PORT_REPRESENTATION(p) == scm_mb_port)
    return SCM_BOOL_T;
  return SCM_BOOL_F;
}
/* Scheme procedure `multi-byte-port!'.
   Marks port P as using the scm_mb_port representation and returns
   SCM_UNSPECIFIED.  P is not type-checked here.  */
SCM_PROC(s_multi_byte_port_x, "multi-byte-port!", 1, 0, 0, scm_multi_byte_port_x);
#ifdef __STDC__
SCM
scm_multi_byte_port_x (SCM p)
#else
SCM
scm_multi_byte_port_x (p)
     SCM p;
#endif
{
  SCM_PORT_REPRESENTATION(p) = scm_mb_port;

  return SCM_UNSPECIFIED;
}
/* Scheme procedure `wide-character-port?'.
   Yields SCM_BOOL_T when the representation recorded for port P is
   scm_wchar_port, SCM_BOOL_F otherwise.  P is not type-checked
   here.  */
SCM_PROC(s_wide_character_port_p, "wide-character-port?", 1, 0, 0, scm_wide_character_port_p);
#ifdef __STDC__
SCM
scm_wide_character_port_p (SCM p)
#else
SCM
scm_wide_character_port_p (p)
     SCM p;
#endif
{
  if (SCM_PORT_REPRESENTATION(p) == scm_wchar_port)
    return SCM_BOOL_T;
  return SCM_BOOL_F;
}
/* Scheme procedure `wide-character-port!'.
   Marks port P as using the scm_wchar_port representation and returns
   SCM_UNSPECIFIED.  P is not type-checked here.  */
SCM_PROC(s_wide_character_port_x, "wide-character-port!", 1, 0, 0, scm_wide_character_port_x);
#ifdef __STDC__
SCM
scm_wide_character_port_x (SCM p)
#else
SCM
scm_wide_character_port_x (p)
     SCM p;
#endif
{
  SCM_PORT_REPRESENTATION(p) = scm_wchar_port;

  return SCM_UNSPECIFIED;
}
/* Print the character code C on PORT.
 *
 * When WRITING is non-zero the two-character prefix "#\\" is emitted
 * first.  What follows depends on SCM_PORT_REPRESENTATION (PORT):
 *
 *  - scm_regular_port: codes below 256 are emitted raw when not
 *    WRITING; when WRITING they are emitted as their scm_charnames
 *    entry (codes <= ' ' that have one), through scm_intprint with
 *    argument 8 (codes above 0177; presumably an octal rendering --
 *    confirm against scm_intprint), or as the character itself.
 *    Codes >= 256 take the `print_octal' path.
 *  - scm_mb_port: C is test-encoded with xwctomb; on failure, or when
 *    XMB_CUR_MAX exceeds the local buffer, control jumps to
 *    `print_octal'; otherwise C (or 0 when the encoding is empty) is
 *    handed to scm_gen_putc.
 *  - scm_wchar_port: C is handed straight to scm_gen_putc.
 *
 * Returns nothing.
 */
#ifdef __STDC__
void
scm_put_wchar (int c, SCM port, int writing)
#else
void
scm_put_wchar (c, port, writing)
int c;
SCM port;
int writing;
#endif
{
if (writing)
scm_gen_puts (scm_regular_string, "#\\", port);
switch (SCM_PORT_REPRESENTATION (port))
{
case scm_regular_port:
{
if (c < 256)
{
if (!writing)
scm_gen_putc ((unsigned char)c, port);
/* NOTE(review): scm_charnames is indexed directly by C here; a
   negative C would index before the table -- confirm callers never
   pass one. */
else if ((c <= ' ') && scm_charnames[c])
scm_gen_puts (scm_regular_string, scm_charnames[c], port);
else if (c > '\177')
scm_intprint (c, 8, port);
else
scm_gen_putc ((int) c, port);
}
else
{
/* Shared fallback: also entered by `goto' from the scm_mb_port case
   below.  When not WRITING a backslash precedes the number; the
   `break' that follows leaves the switch for both entry paths. */
print_octal:
if (!writing)
scm_gen_putc ('\\', port);
scm_intprint (c, 8, port);
}
break;
}
case scm_mb_port:
{
/* buf only receives the trial encoding; its contents are not read
   again in this function. */
char buf[256];
int len;
if (XMB_CUR_MAX > sizeof (buf))
goto print_octal;
len = xwctomb (buf, c);
if (len < 0)
goto print_octal;
if (len == 0)
scm_gen_putc (0, port);
else
scm_gen_putc (c, port);
break;
}
case scm_wchar_port:
{
scm_gen_putc (c, port);
break;
}
}
}
/* Print the multi-byte string EXP on PORT.

   When WRITING is zero the raw bytes are handed to scm_gen_write as a
   scm_mb_string.  When WRITING is non-zero the string is printed
   between double quotes, one decoded character at a time, with a
   backslash inserted before every `"' and `\' character.

   Decoding uses xmbtowc.  A reported length of 0 advances by one byte.
   A negative length (undecodable sequence) makes the offending byte
   itself the character to print; it is taken as an unsigned char so
   that bytes >= 0x80 are not sign-extended into a negative or huge
   character code on platforms where plain char is signed.  */
#ifdef __STDC__
void
scm_print_mb_string (SCM exp, SCM port, int writing)
#else
void
scm_print_mb_string (exp, port, writing)
     SCM exp;
     SCM port;
     int writing;
#endif
{
  if (writing)
    {
      int i;
      int len;
      char * data;

      scm_gen_putc ('\"', port);
      i = 0;
      len = SCM_ROLENGTH (exp);
      data = SCM_ROCHARS (exp);
      while (i < len)
        {
          xwchar_t c;
          int inc;

          inc = xmbtowc (&c, data + i, len - i);
          if (inc == 0)
            inc = 1;
          if (inc < 0)
            {
              /* Undecodable: emit the single byte as-is.  */
              inc = 1;
              c = (unsigned char) data[i];
            }
          i += inc;
          switch (c)
            {
            case '\"':
            case '\\':
              scm_gen_putc ('\\', port);
              /* fall through: the escaped character itself follows */
            default:
              scm_gen_putc (c, port);
            }
        }
      scm_gen_putc ('\"', port);
    }
  else
    scm_gen_write (scm_mb_string, SCM_ROCHARS (exp), SCM_ROLENGTH (exp), port);
}
/* Write the bytes STR[FROM] .. STR[TO - 1] to PORT, one decoded
   character at a time.  Does nothing when FROM >= TO.

   Decoding uses xmbtowc.  When it reports a length <= 0 the single
   byte at the current position is emitted (as an unsigned char) and
   the scan advances by one byte, so the loop always makes progress.  */
#ifdef __STDC__
static void
print_mb_symbol_run (char *str, int from, int to, SCM port)
#else
static void
print_mb_symbol_run (str, from, to, port)
     char *str;
     int from;
     int to;
     SCM port;
#endif
{
  int q;

  q = from;
  while (q < to)
    {
      xwchar_t c;
      int qinc;

      qinc = xmbtowc (&c, str + q, to - q);
      if (qinc <= 0)
        {
          qinc = 1;
          c = (unsigned char) str[q];
        }
      scm_gen_putc (c, port);
      q += qinc;
    }
}

/* Print the multi-byte symbol EXP on PORT.

   The symbol's bytes are scanned character by character with xmbtowc.
   As long as only ordinary characters are seen they are accumulated
   and finally written unchanged.  The first "weird" character --
   a parenthesis (and a bracket under BRACKETS_AS_PARENS), `"', `;',
   white space, a line incrementor, or an undecodable/empty sequence --
   switches to the `#{ ... }#' notation: "#{" is written once, the
   pending run is flushed, and the weird byte is written preceded by a
   backslash.  Once in that notation `\', `}' and `#' are escaped the
   same way.  "}#" closes the output if the notation was opened.

   The pending runs were previously flushed by two inline loops that
   tested and repaired the outer increment instead of their own, so a
   length <= 0 from xmbtowc left the loop position stuck or moving
   backwards; both flushes now go through print_mb_symbol_run.  */
#ifdef __STDC__
void
scm_print_mb_symbol (SCM exp, SCM port)
#else
void
scm_print_mb_symbol (exp, port)
     SCM exp;
     SCM port;
#endif
{
  int pos;          /* start of the run not yet written */
  int end;          /* scan position */
  int len;
  char * str;
  int weird;        /* non-zero once "#{" has been written */
  int maybe_weird;  /* non-zero after a `\' seen before going weird */
  int mw_pos;
  int inc;
  xwchar_t c;

  len = SCM_LENGTH (exp);
  str = SCM_CHARS (exp);
  scm_remember (&exp);
  pos = 0;
  weird = 0;
  maybe_weird = 0;
  mw_pos = 0;
  for (end = pos; end < len; end += inc)
    {
      inc = xmbtowc (&c, str + end, len - end);
      if (inc <= 0)
        {
          /* Undecodable or empty sequence: treat the byte as weird.  */
          inc = 1;
          goto weird_handler;
        }
      switch (c)
        {
#ifdef BRACKETS_AS_PARENS
        case '[':
        case ']':
#endif
        case '(':
        case ')':
        case '\"':
        case ';':
        case SCM_WHITE_SPACES:
        case SCM_LINE_INCREMENTORS:
        weird_handler:
          if (maybe_weird)
            {
              /* Rewind to the position recorded when the first
                 backslash was seen.  */
              end = mw_pos;
              maybe_weird = 0;
            }
          if (!weird)
            {
              scm_gen_write (scm_regular_string, "#{", 2, port);
              weird = 1;
            }
          print_mb_symbol_run (str, pos, end, port);
          {
            char buf[2];
            buf[0] = '\\';
            buf[1] = str[end];
            scm_gen_write (scm_regular_string, buf, 2, port);
          }
          pos = end + 1;
          break;
        case '\\':
          if (weird)
            goto weird_handler;
          if (!maybe_weird)
            {
              maybe_weird = 1;
              /* NOTE(review): this records POS (start of the pending
                 run), not END (where the backslash is) -- behaviour
                 kept as found; confirm it is intended.  */
              mw_pos = pos;
            }
          break;
        case '}':
        case '#':
          if (weird)
            goto weird_handler;
          break;
        default:
          break;
        }
    }
  /* Flush whatever ordinary characters remain after the last escape.  */
  print_mb_symbol_run (str, pos, end, port);
  if (weird)
    scm_gen_write (scm_regular_string, "}#", 2, port);
}
/* Module initialisation for mbstrings.c.
 *
 * The whole body is the textual inclusion of "mbstrings.x".
 * Presumably that file is generated from the SCM_PROC declarations
 * in this file and registers the Scheme procedures they describe --
 * confirm against the build rules that produce the .x files.
 */
#ifdef __STDC__
void
scm_init_mbstrings (void)
#else
void
scm_init_mbstrings ()
#endif
{
#include "mbstrings.x"
}