summary refs log tree commit diff
path: root/locale/programs/charset.c
blob: fdacf25328a071d1a93a1d3a93a38ff64c9dfa3b (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
/* Copyright (C) 1996, 1997 Free Software Foundation, Inc.
   This file is part of the GNU C Library.
   Contributed by Ulrich Drepper <drepper@gnu.ai.mit.edu>, 1996.

   The GNU C Library is free software; you can redistribute it and/or
   modify it under the terms of the GNU Library General Public License as
   published by the Free Software Foundation; either version 2 of the
   License, or (at your option) any later version.

   The GNU C Library is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
   Library General Public License for more details.

   You should have received a copy of the GNU Library General Public
   License along with the GNU C Library; see the file COPYING.LIB.  If not,
   write to the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
   Boston, MA 02111-1307, USA.  */

#ifdef HAVE_CONFIG_H
# include <config.h>
#endif

#include <alloca.h>
#include <ctype.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>

#include "error.h"
#include "charset.h"


/* Forward declaration: insert_char is defined at the end of this file
   but is called by the charset_new_* entry points that precede it.  */
static void
insert_char (struct linereader *lr, struct charset_t *cs, int bytes,
	     unsigned int value, const char *from, const char *to);


/* Register a character (or, when TO is not NULL, a range of characters)
   in the charset CS, after checking that the encoding length BYTES lies
   within [CS->mb_cur_min, CS->mb_cur_max].  A length outside that
   interval is reported through LR and nothing is inserted.  */
void
charset_new_char (struct linereader *lr, struct charset_t *cs, int bytes,
		  unsigned int value, const char *from, const char *to)
{
  if (bytes < cs->mb_cur_min)
    {
      lr_error (lr, _("too few bytes in character encoding"));
      return;
    }

  if (bytes > cs->mb_cur_max)
    {
      lr_error (lr, _("too many bytes in character encoding"));
      return;
    }

  /* The length is acceptable; hand over to the common insertion code.  */
  insert_char (lr, cs, bytes, value, from, to);
}


/* Entry point for characters named in <Uxxxx> notation.  All arguments
   are forwarded unchanged to insert_char; unlike charset_new_char, BYTES
   is not checked against CS->mb_cur_min / CS->mb_cur_max here.  */
void
charset_new_unicode (struct linereader *lr, struct charset_t *cs, int bytes,
		     unsigned int value, const char *from, const char *to)
{
  /* For now: <Uxxxx> support may be removed again, so no special
     handling is implemented yet.  */
  insert_char (lr, cs, bytes, value, from, to);
}


/* Look up the character called NAME (LEN bytes long) in the character
   table of CS.  Returns the value stored for that name, or
   ILLEGAL_CHAR_VALUE when find_entry reports failure.  */
unsigned int
charset_find_value (const struct charset_t *cs, const char *name, size_t len)
{
  void *data;

  /* find_entry takes a non-const table, hence the cast.  A non-negative
     return means DATA now holds the value that was stored for NAME.  */
  if (find_entry ((hash_table *) &cs->char_table, name, len, &data) >= 0)
    return (unsigned int) ((unsigned long int) data);

  return ILLEGAL_CHAR_VALUE;
}


/* Parse the NUL-terminated string S as an unsigned decimal number and
   store the result in *RESULT.  Returns 0 on success, or -1 if S is
   empty, contains a character that is not a decimal digit, or denotes
   a value that does not fit into an unsigned int.  */
static int
parse_range_number (const char *s, unsigned int *result)
{
  unsigned int number = 0;

  if (*s == '\0')
    return -1;

  for (; *s != '\0'; ++s)
    {
      unsigned int digit;

      /* The <ctype.h> functions require a value representable as
	 unsigned char; a plain char may be negative.  */
      if (!isdigit ((unsigned char) *s))
	return -1;

      digit = (unsigned int) (*s - '0');

      /* Refuse to wrap around: NUMBER * 10 + DIGIT must stay within the
	 range of unsigned int.  */
      if (number > (~0U - digit) / 10)
	return -1;

      number = number * 10 + digit;
    }

  *result = number;
  return 0;
}


/* Enter one character name, or a range of names, into the character
   table of CS.

   If TO is NULL, the single name FROM is entered with VALUE.

   Otherwise FROM and TO describe a range.  Both names must have the same
   length, share the same prefix and end in the same number of decimal
   digits, and the number in TO must not be smaller than the number in
   FROM.  Every name from FROM to TO is generated (keeping the width of
   the numeric part by zero padding) and entered with consecutive values
   starting at VALUE.

   Problems (malformed range names, inverted range, names rejected by
   insert_entry) are reported through LR.  BYTES is not used here.  */
static void
insert_char (struct linereader *lr, struct charset_t *cs, int bytes,
	     unsigned int value, const char *from, const char *to)
{
  char *buf;
  size_t len1, prefix_len;
  int ndigits;
  unsigned int from_nr, to_nr, cnt;

  if (to == NULL)
    {
      if (insert_entry (&cs->char_table, from, strlen (from),
			(void *) (unsigned long int) value)
	  < 0)
	lr_error (lr, _("duplicate character name `%s'"), from);

      return;
    }

  /* We have a range: the names must have equal prefixes and an equal
     number of trailing digits, where the second number is greater than
     or equal to the first.  */
  len1 = strlen (from);
  if (len1 != strlen (to))
    goto illegal_range;

  /* Find where the trailing digits of FROM begin.  The bound is tested
     before the character is examined so that an all-digit (or empty)
     name never causes a read in front of the string.  */
  prefix_len = len1;
  while (prefix_len > 0 && isdigit ((unsigned char) from[prefix_len - 1]))
    --prefix_len;

  /* There must be at least one digit and the prefixes must agree.  */
  if (prefix_len == len1 || strncmp (from, to, prefix_len) != 0)
    goto illegal_range;

  /* Both numeric parts must consist of digits only and be representable;
     this also rejects a TO whose suffix is not a number at all.  */
  if (parse_range_number (&from[prefix_len], &from_nr) < 0
      || parse_range_number (&to[prefix_len], &to_nr) < 0)
    goto illegal_range;

  if (from_nr > to_nr)
    {
      lr_error (lr, _("upper limit in range is smaller than lower limit"));
      return;
    }

  ndigits = (int) (len1 - prefix_len);

  buf = alloca (len1 + 1);
  memcpy (buf, from, prefix_len);

  /* The loop is left from inside the body: a `cnt <= to_nr' condition
     could never become false when TO_NR is the largest unsigned int.  */
  for (cnt = from_nr; ; ++cnt)
    {
      /* CNT never exceeds TO_NR, so it has at most NDIGITS digits and the
	 generated name has exactly LEN1 characters.  */
      snprintf (&buf[prefix_len], (size_t) ndigits + 1, "%0*u", ndigits, cnt);

      if (insert_entry (&cs->char_table, buf, len1,
			(void *) (unsigned long int) (value + (cnt - from_nr)))
	  < 0)
	lr_error (lr, _("duplicate character name `%s'"), buf);

      if (cnt == to_nr)
	break;
    }

  return;

 illegal_range:
  lr_error (lr, _("illegal names for character range"));
}