summaryrefslogtreecommitdiff
path: root/device/lib/pic14/libc/mbrtowc.c
blob: e62bc04b8677dc1d63e0815519bae584b983382e (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
/*-------------------------------------------------------------------------
   mbrtowc.c - convert a multibyte sequence to a wide character

   Copyright (C) 2016, Philipp Klaus Krause, pkk@spth.de

   Modifications for PIC14 by
   Copyright (C) 2019 Gonzalo Pérez de Olaguer Córdoba <salo@gpoc.es>

   This library is free software; you can redistribute it and/or modify it
   under the terms of the GNU General Public License as published by the
   Free Software Foundation; either version 2, or (at your option) any
   later version.

   This library is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU General Public License for more details.

   You should have received a copy of the GNU General Public License 
   along with this library; see the file COPYING. If not, write to the
   Free Software Foundation, 51 Franklin Street, Fifth Floor, Boston,
   MA 02110-1301, USA.

   As a special exception, if you link this library with other files,
   some of which are compiled with SDCC, to produce an executable,
   this library does not by itself cause the resulting executable to
   be covered by the GNU General Public License. This exception does
   not however invalidate any other reasons why the executable file
   might be covered by the GNU General Public License.
-------------------------------------------------------------------------*/

#include <wchar.h>
#include <errno.h>

/*
 * mbrtowc - restartable conversion of one UTF-8 sequence to a wide character.
 *
 * pwc: where to store the decoded character; may be null to discard it.
 * s:   input bytes; if null, the call behaves as mbrtowc(0, "", 1, ps).
 * n:   maximum number of bytes of s to examine.
 * ps:  conversion state; if null, a function-local static state is used.
 *      Bytes of an unfinished sequence are kept in ps->c[0..2], with a
 *      zero byte marking the end of the saved prefix.
 *
 * Returns:
 *   0           the decoded character is the null wide character,
 *   1..4        number of bytes of s consumed by this call,
 *   (size_t)-2  all n bytes were consumed but the sequence is still incomplete,
 *   (size_t)-1  invalid input (or n == 0); errno is set to EILSEQ.
 */
size_t mbrtowc(wchar_t *restrict pwc, const char *restrict s, size_t n, mbstate_t *restrict ps)
{
	unsigned char first_byte;
	unsigned char seqlen;
	unsigned char mbseq[4];
	wchar_t codepoint;
	unsigned char i, j;
	static mbstate_t sps;

	if(!s)
#if defined(__SDCC_pic14)
		/* try to minimize nested calls */
		{ pwc = 0; s = ""; n = 1; }
#else
		return(mbrtowc(0, "", 1, ps));
#endif
	if(!n)
		goto eilseq;
	if(!ps)
		ps = &sps;

	// Reload the bytes saved by a previous incomplete call.
	// The bound is tested first so that ps->c[3] is never read.
	for(i = 0; i < 3 && ps->c[i]; i++)
		mbseq[i] = ps->c[i];

	// The lead byte comes from the saved state if there is one, else from s.
	seqlen = 1;
	first_byte = i ? mbseq[0] : (unsigned char)*s;

	if(first_byte & 0x80)
	{
		// Count the leading 1 bits: they give the total sequence length.
		while(first_byte & (0x80 >> seqlen))
			seqlen++;
		if(seqlen == 1) // 10xxxxxx is a continuation byte, it cannot start a sequence
			goto eilseq;
		first_byte &= (0xff >> (seqlen + 1)); // Keep only the payload bits
	}

	if(seqlen > 4)
		goto eilseq;

	// Incomplete multibyte character. Written as a subtraction so that a
	// huge n cannot wrap around and be mistaken for a short input.
	if(seqlen > i && n < (size_t)(seqlen - i))
	{
		for(; n--; i++, s++)
		{
			// Every byte but the lead byte must be a continuation byte.
			if(i && ((unsigned char)*s & 0xc0) != 0x80)
			{
				while(i) // Drop the partial sequence: back to the initial state
					ps->c[--i] = 0;
				goto eilseq;
			}
			ps->c[i] = *s;
		}
		return(-2);
	}

	// The sequence will be completed (or rejected) now: reset the state.
	for(j = 0; j < i; j++)
		ps->c[j] = 0;

	// From here on n counts the bytes consumed from s by this call.
	if(i)
		n = 0; // Lead byte was taken from the saved state
	else
	{
		s++; // Lead byte was taken from s: step over it
		i = 1;
		n = 1;
	}

	for(; i < seqlen; i++, n++)
	{
		mbseq[i] = *s++;
		if((mbseq[i] & 0xc0) != 0x80)
			goto eilseq;
	}

	// Assemble the code point: 6 payload bits per continuation byte.
	codepoint = first_byte;
	for(j = 1; j < seqlen; j++)
	{
		codepoint <<= 6;
		codepoint |= (mbseq[j] & 0x3f);
	}

	// Reject overlong encodings and values beyond the Unicode range.
	if((seqlen > 1 && codepoint < 0x80) ||
	   (seqlen > 2 && codepoint < 0x800) ||
	   (seqlen > 3 && codepoint < 0x10000) ||
	   codepoint > 0x10ffff)
		goto eilseq;

	if(codepoint >= 0xd800 && codepoint <= 0xdfff) // UTF-16 surrogate.
		goto eilseq;

	if(pwc)
		*pwc = codepoint;
	return(codepoint ? n : 0); // The null wide character is reported as 0

eilseq:
	errno = EILSEQ;
	return(-1);
}