aboutsummaryrefslogtreecommitdiff
blob: 4351eea39715885fb0afccf96fe35e25505944c6 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
/* Copyright (C) 1996 Free Software Foundation, Inc.
This file is part of the GNU C Library.
Contributed by Ulrich Drepper <drepper@gnu.ai.mit.edu>, 1996.

The GNU C Library is free software; you can redistribute it and/or
modify it under the terms of the GNU Library General Public License as
published by the Free Software Foundation; either version 2 of the
License, or (at your option) any later version.

The GNU C Library is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
Library General Public License for more details.

You should have received a copy of the GNU Library General Public
License along with the GNU C Library; see the file COPYING.LIB.  If
not, write to the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
Boston, MA 02111-1307, USA.  */

#ifdef HAVE_CONFIG_H
# include <config.h>
#endif

#include <assert.h>
#include <stdlib.h>

#include "charset.h"
#include "stringtrans.h"


/* Global variable.  */
enum encoding_method encoding_method = ENC_UCS4;


void *xmalloc (size_t __n);
void *xrealloc (void *__p, size_t __n);


#define ADDC(ch)							      \
  do									      \
    {									      \
      char *cp;								      \
      if (bufact + (encoding_method == ENC_UCS4 ? 4 : 1) >= bufmax)	      \
	{								      \
	  bufmax *= 2;							      \
	  buf = xrealloc (buf, bufmax);					      \
	}								      \
      cp = &buf[bufact];						      \
      if (encode_char (ch, &cp) < 0)					      \
	{								      \
	  free (buf);							      \
	  return NULL;							      \
	}								      \
      bufact = cp - buf;						      \
    }									      \
  while (0)


char *
translate_string (char *str, struct charset_t *charset)
{
  char *buf;
  size_t bufact = 0;
  size_t bufmax = 56;

  buf = (char *) xmalloc (bufmax);

  while (str[0] != '\0')
    {
      char *tp;
      unsigned int value;

      if (str[0] != '<')
	{
	  ADDC (*str++);
	  continue;
	}

      tp = &str[1];
      while (tp[0] != '\0' && tp[0] != '>')
	if (tp[0] == '\\')
	  if (tp[1] != '\0')
	    tp += 2;
	  else
	    ++tp;
	else
	  ++tp;

      if (tp[0] == '\0')
	{
	  free (buf);
	  return NULL;
	}

      value = charset_find_value (charset, str + 1, tp - (str + 1));
      if ((wchar_t) value == ILLEGAL_CHAR_VALUE)
	{
	  free (buf);
	  return NULL;
	}
      else
	/* Encode string using current method.  */
	ADDC (value);

      str = &tp[1];
    }

  ADDC ('\0');

  return buf;
}


int
encode_char (unsigned int value, char **cpp)
{
  switch (encoding_method)
    {
    case ENC_UCS1:
      if (value > 255)
	return -1;
      *(*cpp)++ = (char) value;
      break;

    case ENC_UCS4:
#if __BYTE_ORDER == __BIG_ENDIAN
      *(*cpp)++ = (char) (value >> 24);
      *(*cpp)++ = (char) ((value >> 16) & 0xff);
      *(*cpp)++ = (char) ((value >> 8) & 0xff);
      *(*cpp)++ = (char) (value & 0xff);
#else
      *(*cpp)++ = (char) (value & 0xff);
      *(*cpp)++ = (char) ((value >>= 8) & 0xff);
      *(*cpp)++ = (char) ((value >>= 8) & 0xff);
      *(*cpp)++ = (char) ((value >>= 8) & 0xff);
#endif
      break;

    default:
      return -1;
    }

  return 0;
}