Context Navigation

str.c@ b06414f

Visit:

lfn serial ticket/834-toolchain-update topic/msim-upgrade topic/simplify-dev-export

Last change on this file since b06414f was b06414f, checked in by Jakub Jermar <jakub@…>, 8 years ago

Use proper sizes for buffers holding conversions from/to UTF-16 LFN's

FAT uses UTF-16 for encoding long file names. HelenOS needs to convert
these strings into and from its native UTF-8 encoding. The size of the
UTF-8 buffer in bytes needs to be at least 4 times the number of
characters in a LFN.

Property mode set to 100644

File size: 44.3 KB

Line
1	/*
2	* Copyright (c) 2005 Martin Decky
3	* Copyright (c) 2008 Jiri Svoboda
4	* Copyright (c) 2011 Martin Sucha
5	* Copyright (c) 2011 Oleg Romanenko
6	* All rights reserved.
7	*
8	* Redistribution and use in source and binary forms, with or without
9	* modification, are permitted provided that the following conditions
10	* are met:
11	*
12	* - Redistributions of source code must retain the above copyright
13	* notice, this list of conditions and the following disclaimer.
14	* - Redistributions in binary form must reproduce the above copyright
15	* notice, this list of conditions and the following disclaimer in the
16	* documentation and/or other materials provided with the distribution.
17	* - The name of the author may not be used to endorse or promote products
18	* derived from this software without specific prior written permission.
19	*
20	* THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
21	* IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
22	* OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
23	* IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
24	* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
25	* NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
26	* DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
27	* THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
28	* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
29	* THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
30	*/
31
32	/** @addtogroup libc
33	* @{
34	*/
35	/** @file
36	*/
37
38	#include <str.h>
39	#include <stdlib.h>
40	#include <stddef.h>
41	#include <assert.h>
42	#include <stdint.h>
43	#include <ctype.h>
44	#include <malloc.h>
45	#include <errno.h>
46	#include <align.h>
47	#include <mem.h>
48
/** Evaluate a condition only when wchar_t is a signed type.
 *
 * If WCHAR_IS_UNSIGNED is defined, the macro expands to true and
 * @a cond is not evaluated; otherwise it expands to @a cond itself.
 */
#ifdef WCHAR_IS_UNSIGNED
#define WCHAR_SIGNED_CHECK(cond)  (true)
#else
#define WCHAR_SIGNED_CHECK(cond)  (cond)
#endif

/** Byte mask consisting of lowest @n bits (out of 8) */
#define LO_MASK_8(n)  ((uint8_t) ((1 << (n)) - 1))

/** Mask consisting of lowest @n bits (out of 32), valid for n in 0..31.
 *
 * The shift is performed on an unsigned 32-bit operand so that it stays
 * well defined for every n below 32 (shifting a signed 1 by 31 is not).
 */
#define LO_MASK_32(n)  ((uint32_t) (((uint32_t) 1 << (n)) - 1))

/** Byte mask consisting of highest @n bits (out of 8).
 *
 * The result of the complement has type int (integer promotion); only
 * its low 8 bits are meaningful.
 */
#define HI_MASK_8(n)  (~LO_MASK_8(8 - (n)))

/** Number of data bits in a UTF-8 continuation byte */
#define CONT_BITS  6
67
68	/** Decode a single character from a string.
69	*
70	* Decode a single character from a string of size @a size. Decoding starts
71	* at @a offset and this offset is moved to the beginning of the next
72	* character. In case of decoding error, offset generally advances at least
73	* by one. However, offset is never moved beyond size.
74	*
75	* @param str String (not necessarily NULL-terminated).
76	* @param offset Byte offset in string where to start decoding.
77	* @param size Size of the string (in bytes).
78	*
79	* @return Value of decoded character, U_SPECIAL on decoding error or
80	* NULL if attempt to decode beyond @a size.
81	*
82	*/
83	wchar_t str_decode(const char str, size_t offset, size_t size)
84	{
85	if (*offset + 1 > size)
86	return 0;
87
88	/* First byte read from string */
89	uint8_t b0 = (uint8_t) str[(*offset)++];
90
91	/* Determine code length */
92
93	unsigned int b0_bits; /* Data bits in first byte */
94	unsigned int cbytes; /* Number of continuation bytes */
95
96	if ((b0 & 0x80) == 0) {
97	/* 0xxxxxxx (Plain ASCII) */
98	b0_bits = 7;
99	cbytes = 0;
100	} else if ((b0 & 0xe0) == 0xc0) {
101	/* 110xxxxx 10xxxxxx */
102	b0_bits = 5;
103	cbytes = 1;
104	} else if ((b0 & 0xf0) == 0xe0) {
105	/* 1110xxxx 10xxxxxx 10xxxxxx */
106	b0_bits = 4;
107	cbytes = 2;
108	} else if ((b0 & 0xf8) == 0xf0) {
109	/* 11110xxx 10xxxxxx 10xxxxxx 10xxxxxx */
110	b0_bits = 3;
111	cbytes = 3;
112	} else {
113	/* 10xxxxxx -- unexpected continuation byte */
114	return U_SPECIAL;
115	}
116
117	if (*offset + cbytes > size)
118	return U_SPECIAL;
119
120	wchar_t ch = b0 & LO_MASK_8(b0_bits);
121
122	/* Decode continuation bytes */
123	while (cbytes > 0) {
124	uint8_t b = (uint8_t) str[(*offset)++];
125
126	/* Must be 10xxxxxx */
127	if ((b & 0xc0) != 0x80)
128	return U_SPECIAL;
129
130	/* Shift data bits to ch */
131	ch = (ch << CONT_BITS) \| (wchar_t) (b & LO_MASK_8(CONT_BITS));
132	cbytes--;
133	}
134
135	return ch;
136	}
137
138	/** Decode a single character from a string to the left.
139	*
140	* Decode a single character from a string of size @a size. Decoding starts
141	* at @a offset and this offset is moved to the beginning of the previous
142	* character. In case of decoding error, offset generally decreases at least
143	* by one. However, offset is never moved before 0.
144	*
145	* @param str String (not necessarily NULL-terminated).
146	* @param offset Byte offset in string where to start decoding.
147	* @param size Size of the string (in bytes).
148	*
149	* @return Value of decoded character, U_SPECIAL on decoding error or
150	* NULL if attempt to decode beyond @a start of str.
151	*
152	*/
153	wchar_t str_decode_reverse(const char str, size_t offset, size_t size)
154	{
155	if (*offset == 0)
156	return 0;
157
158	size_t processed = 0;
159	/* Continue while continuation bytes found */
160	while (*offset > 0 && processed < 4) {
161	uint8_t b = (uint8_t) str[--(*offset)];
162
163	if (processed == 0 && (b & 0x80) == 0) {
164	/* 0xxxxxxx (Plain ASCII) */
165	return b & 0x7f;
166	}
167	else if ((b & 0xe0) == 0xc0 \|\| (b & 0xf0) == 0xe0 \|\|
168	(b & 0xf8) == 0xf0) {
169	/* Start byte */
170	size_t start_offset = *offset;
171	return str_decode(str, &start_offset, size);
172	}
173	else if ((b & 0xc0) != 0x80) {
174	/* Not a continuation byte */
175	return U_SPECIAL;
176	}
177	processed++;
178	}
179	/* Too many continuation bytes */
180	return U_SPECIAL;
181	}
182
183	/** Encode a single character to string representation.
184	*
185	* Encode a single character to string representation (i.e. UTF-8) and store
186	* it into a buffer at @a offset. Encoding starts at @a offset and this offset
187	* is moved to the position where the next character can be written to.
188	*
189	* @param ch Input character.
190	* @param str Output buffer.
191	* @param offset Byte offset where to start writing.
192	* @param size Size of the output buffer (in bytes).
193	*
194	* @return EOK if the character was encoded successfully, EOVERFLOW if there
195	* was not enough space in the output buffer or EINVAL if the character
196	* code was invalid.
197	*/
198	int chr_encode(const wchar_t ch, char str, size_t offset, size_t size)
199	{
200	if (*offset >= size)
201	return EOVERFLOW;
202
203	if (!chr_check(ch))
204	return EINVAL;
205
206	/* Unsigned version of ch (bit operations should only be done
207	on unsigned types). */
208	uint32_t cc = (uint32_t) ch;
209
210	/* Determine how many continuation bytes are needed */
211
212	unsigned int b0_bits; /* Data bits in first byte */
213	unsigned int cbytes; /* Number of continuation bytes */
214
215	if ((cc & ~LO_MASK_32(7)) == 0) {
216	b0_bits = 7;
217	cbytes = 0;
218	} else if ((cc & ~LO_MASK_32(11)) == 0) {
219	b0_bits = 5;
220	cbytes = 1;
221	} else if ((cc & ~LO_MASK_32(16)) == 0) {
222	b0_bits = 4;
223	cbytes = 2;
224	} else if ((cc & ~LO_MASK_32(21)) == 0) {
225	b0_bits = 3;
226	cbytes = 3;
227	} else {
228	/* Codes longer than 21 bits are not supported */
229	return EINVAL;
230	}
231
232	/* Check for available space in buffer */
233	if (*offset + cbytes >= size)
234	return EOVERFLOW;
235
236	/* Encode continuation bytes */
237	unsigned int i;
238	for (i = cbytes; i > 0; i--) {
239	str[*offset + i] = 0x80 \| (cc & LO_MASK_32(CONT_BITS));
240	cc = cc >> CONT_BITS;
241	}
242
243	/* Encode first byte */
244	str[*offset] = (cc & LO_MASK_32(b0_bits)) \| HI_MASK_8(8 - b0_bits - 1);
245
246	/* Advance offset */
247	*offset += cbytes + 1;
248
249	return EOK;
250	}
251
/** Get size of string.
 *
 * Count the bytes occupied by the string @a str, not including the
 * null terminator.
 *
 * @param str String to consider.
 *
 * @return Number of bytes used by the string
 *
 */
size_t str_size(const char *str)
{
	const char *end = str;

	/* Walk to the terminating zero byte */
	while (*end != 0)
		end++;

	return (size_t) (end - str);
}
271
/** Get size of wide string.
 *
 * Compute the number of bytes occupied by the wide string @a str, not
 * including the null terminator.
 *
 * @param str Wide string to consider.
 *
 * @return Number of bytes used by the wide string
 *
 */
size_t wstr_size(const wchar_t *str)
{
	size_t chars = wstr_length(str);

	return chars * sizeof(wchar_t);
}
286
287	/** Get size of string with length limit.
288	*
289	* Get the number of bytes which are used by up to @a max_len first
290	* characters in the string @a str. If @a max_len is greater than
291	* the length of @a str, the entire string is measured (excluding the
292	* NULL-terminator).
293	*
294	* @param str String to consider.
295	* @param max_len Maximum number of characters to measure.
296	*
297	* @return Number of bytes used by the characters.
298	*
299	*/
300	size_t str_lsize(const char *str, size_t max_len)
301	{
302	size_t len = 0;
303	size_t offset = 0;
304
305	while (len < max_len) {
306	if (str_decode(str, &offset, STR_NO_LIMIT) == 0)
307	break;
308
309	len++;
310	}
311
312	return offset;
313	}
314
/** Get size of string with size limit.
 *
 * Get the number of bytes which are used by the string @a str
 * (excluding the NULL-terminator), but no more than @a max_size bytes.
 * At most @a max_size bytes of @a str are read, so the string does not
 * have to be terminated within that range.
 *
 * @param str      String to consider.
 * @param max_size Maximum number of bytes to measure.
 *
 * @return Number of bytes used by the string
 *
 */
size_t str_nsize(const char *str, size_t max_size)
{
	size_t size = 0;

	/* Test the limit first so that str[max_size] is never read */
	while ((size < max_size) && (str[size] != 0))
		size++;

	return size;
}
335
/** Get size of wide string with size limit.
 *
 * Compute the number of bytes occupied by the wide string @a str (not
 * including the null terminator), considering at most @a max_size bytes.
 *
 * @param str      Wide string to consider.
 * @param max_size Maximum number of bytes to measure.
 *
 * @return Number of bytes used by the wide string
 *
 */
size_t wstr_nsize(const wchar_t *str, size_t max_size)
{
	size_t chars = wstr_nlength(str, max_size);

	return chars * sizeof(wchar_t);
}
351
/** Get size of wide string with length limit.
 *
 * Compute the number of bytes occupied by at most @a max_len leading wide
 * characters of @a str. When @a max_len exceeds the length of @a str, the
 * whole wide string is measured (not including the null terminator).
 *
 * @param str     Wide string to consider.
 * @param max_len Maximum number of wide characters to measure.
 *
 * @return Number of bytes used by the wide characters.
 *
 */
size_t wstr_lsize(const wchar_t *str, size_t max_len)
{
	/* Express the character limit as a byte limit for wstr_nlength() */
	size_t byte_limit = max_len * sizeof(wchar_t);
	size_t chars = wstr_nlength(str, byte_limit);

	return chars * sizeof(wchar_t);
}
369
370	/** Get number of characters in a string.
371	*
372	* @param str NULL-terminated string.
373	*
374	* @return Number of characters in string.
375	*
376	*/
377	size_t str_length(const char *str)
378	{
379	size_t len = 0;
380	size_t offset = 0;
381
382	while (str_decode(str, &offset, STR_NO_LIMIT) != 0)
383	len++;
384
385	return len;
386	}
387
/** Get number of characters in a wide string.
 *
 * @param wstr NULL-terminated wide string.
 *
 * @return Number of wide characters preceding the terminator in @a wstr.
 *
 */
size_t wstr_length(const wchar_t *wstr)
{
	size_t idx;

	/* Advance the index up to the terminating zero */
	for (idx = 0; wstr[idx] != 0; idx++)
		;

	return idx;
}
404
/** Get number of characters in a string with size limit.
 *
 * Characters are counted by decoding with str_decode() limited to
 * @a size bytes, until it yields zero.
 *
 * @param str  NULL-terminated string.
 * @param size Maximum number of bytes to consider.
 *
 * @return Number of characters in string.
 *
 */
size_t str_nlength(const char *str, size_t size)
{
	size_t pos = 0;
	size_t count = 0;

	for (;;) {
		if (str_decode(str, &pos, size) == 0)
			return count;

		count++;
	}
}
423
/** Get number of characters in a wide string with size limit.
 *
 * The byte limit @a size is rounded down to a whole number of wide
 * characters before counting.
 *
 * @param str  NULL-terminated wide string.
 * @param size Maximum number of bytes to consider.
 *
 * @return Number of characters in the wide string.
 *
 */
size_t wstr_nlength(const wchar_t *str, size_t size)
{
	const size_t limit = ALIGN_DOWN(size, sizeof(wchar_t));
	size_t count = 0;
	size_t used;

	for (used = 0; used < limit; used += sizeof(wchar_t)) {
		if (str[count] == 0)
			break;

		count++;
	}

	return count;
}
445
/** Get character display width on a character cell display.
 *
 * The current implementation reports one cell for every character.
 *
 * @param ch Character
 * @return Width of character in cells.
 */
size_t chr_width(wchar_t ch)
{
	/* The character value does not influence the result */
	(void) ch;

	return (size_t) 1;
}
455
456	/** Get string display width on a character cell display.
457	*
458	* @param str String
459	* @return Width of string in cells.
460	*/
461	size_t str_width(const char *str)
462	{
463	size_t width = 0;
464	size_t offset = 0;
465	wchar_t ch;
466
467	while ((ch = str_decode(str, &offset, STR_NO_LIMIT)) != 0)
468	width += chr_width(ch);
469
470	return width;
471	}
472
/** Check whether character is plain ASCII.
 *
 * @param ch Character to test.
 *
 * @return True if character is in the range 0..127.
 *
 */
bool ascii_check(wchar_t ch)
{
	/* The lower bound matters only when wchar_t is signed */
	return WCHAR_SIGNED_CHECK(ch >= 0) && (ch <= 127);
}
485
/** Check whether character is valid
 *
 * @param ch Character to test.
 *
 * @return True if character is in the range 0..1114111 (0x10FFFF).
 *
 */
bool chr_check(wchar_t ch)
{
	/* The lower bound matters only when wchar_t is signed */
	return WCHAR_SIGNED_CHECK(ch >= 0) && (ch <= 1114111);
}
498
499	/** Compare two NULL terminated strings.
500	*
501	* Do a char-by-char comparison of two NULL-terminated strings.
502	* The strings are considered equal iff their length is equal
503	* and both strings consist of the same sequence of characters.
504	*
505	* A string S1 is less than another string S2 if it has a character with
506	* lower value at the first character position where the strings differ.
507	* If the strings differ in length, the shorter one is treated as if
508	* padded by characters with a value of zero.
509	*
510	* @param s1 First string to compare.
511	* @param s2 Second string to compare.
512	*
513	* @return 0 if the strings are equal, -1 if the first is less than the second,
514	* 1 if the second is less than the first.
515	*
516	*/
517	int str_cmp(const char s1, const char s2)
518	{
519	wchar_t c1 = 0;
520	wchar_t c2 = 0;
521
522	size_t off1 = 0;
523	size_t off2 = 0;
524
525	while (true) {
526	c1 = str_decode(s1, &off1, STR_NO_LIMIT);
527	c2 = str_decode(s2, &off2, STR_NO_LIMIT);
528
529	if (c1 < c2)
530	return -1;
531
532	if (c1 > c2)
533	return 1;
534
535	if (c1 == 0 \|\| c2 == 0)
536	break;
537	}
538
539	return 0;
540	}
541
542	/** Compare two NULL terminated strings with length limit.
543	*
544	* Do a char-by-char comparison of two NULL-terminated strings.
545	* The strings are considered equal iff
546	* min(str_length(s1), max_len) == min(str_length(s2), max_len)
547	* and both strings consist of the same sequence of characters,
548	* up to max_len characters.
549	*
550	* A string S1 is less than another string S2 if it has a character with
551	* lower value at the first character position where the strings differ.
552	* If the strings differ in length, the shorter one is treated as if
553	* padded by characters with a value of zero. Only the first max_len
554	* characters are considered.
555	*
556	* @param s1 First string to compare.
557	* @param s2 Second string to compare.
558	* @param max_len Maximum number of characters to consider.
559	*
560	* @return 0 if the strings are equal, -1 if the first is less than the second,
561	* 1 if the second is less than the first.
562	*
563	*/
564	int str_lcmp(const char s1, const char s2, size_t max_len)
565	{
566	wchar_t c1 = 0;
567	wchar_t c2 = 0;
568
569	size_t off1 = 0;
570	size_t off2 = 0;
571
572	size_t len = 0;
573
574	while (true) {
575	if (len >= max_len)
576	break;
577
578	c1 = str_decode(s1, &off1, STR_NO_LIMIT);
579	c2 = str_decode(s2, &off2, STR_NO_LIMIT);
580
581	if (c1 < c2)
582	return -1;
583
584	if (c1 > c2)
585	return 1;
586
587	if (c1 == 0 \|\| c2 == 0)
588	break;
589
590	++len;
591	}
592
593	return 0;
594
595	}
596
597	/** Compare two NULL terminated strings in case-insensitive manner.
598	*
599	* Do a char-by-char comparison of two NULL-terminated strings.
600	* The strings are considered equal iff their length is equal
601	* and both strings consist of the same sequence of characters
602	* when converted to lower case.
603	*
604	* A string S1 is less than another string S2 if it has a character with
605	* lower value at the first character position where the strings differ.
606	* If the strings differ in length, the shorter one is treated as if
607	* padded by characters with a value of zero.
608	*
609	* @param s1 First string to compare.
610	* @param s2 Second string to compare.
611	*
612	* @return 0 if the strings are equal, -1 if the first is less than the second,
613	* 1 if the second is less than the first.
614	*
615	*/
616	int str_casecmp(const char s1, const char s2)
617	{
618	wchar_t c1 = 0;
619	wchar_t c2 = 0;
620
621	size_t off1 = 0;
622	size_t off2 = 0;
623
624	while (true) {
625	c1 = tolower(str_decode(s1, &off1, STR_NO_LIMIT));
626	c2 = tolower(str_decode(s2, &off2, STR_NO_LIMIT));
627
628	if (c1 < c2)
629	return -1;
630
631	if (c1 > c2)
632	return 1;
633
634	if (c1 == 0 \|\| c2 == 0)
635	break;
636	}
637
638	return 0;
639	}
640
641	/** Compare two NULL terminated strings with length limit in case-insensitive
642	* manner.
643	*
644	* Do a char-by-char comparison of two NULL-terminated strings.
645	* The strings are considered equal iff
646	* min(str_length(s1), max_len) == min(str_length(s2), max_len)
647	* and both strings consist of the same sequence of characters,
648	* up to max_len characters.
649	*
650	* A string S1 is less than another string S2 if it has a character with
651	* lower value at the first character position where the strings differ.
652	* If the strings differ in length, the shorter one is treated as if
653	* padded by characters with a value of zero. Only the first max_len
654	* characters are considered.
655	*
656	* @param s1 First string to compare.
657	* @param s2 Second string to compare.
658	* @param max_len Maximum number of characters to consider.
659	*
660	* @return 0 if the strings are equal, -1 if the first is less than the second,
661	* 1 if the second is less than the first.
662	*
663	*/
664	int str_lcasecmp(const char s1, const char s2, size_t max_len)
665	{
666	wchar_t c1 = 0;
667	wchar_t c2 = 0;
668
669	size_t off1 = 0;
670	size_t off2 = 0;
671
672	size_t len = 0;
673
674	while (true) {
675	if (len >= max_len)
676	break;
677
678	c1 = tolower(str_decode(s1, &off1, STR_NO_LIMIT));
679	c2 = tolower(str_decode(s2, &off2, STR_NO_LIMIT));
680
681	if (c1 < c2)
682	return -1;
683
684	if (c1 > c2)
685	return 1;
686
687	if (c1 == 0 \|\| c2 == 0)
688	break;
689
690	++len;
691	}
692
693	return 0;
694
695	}
696
697	/** Test whether p is a prefix of s.
698	*
699	* Do a char-by-char comparison of two NULL-terminated strings
700	* and determine if p is a prefix of s.
701	*
702	* @param s The string in which to look
703	* @param p The string to check if it is a prefix of s
704	*
705	* @return true iff p is prefix of s else false
706	*
707	*/
708	bool str_test_prefix(const char s, const char p)
709	{
710	wchar_t c1 = 0;
711	wchar_t c2 = 0;
712
713	size_t off1 = 0;
714	size_t off2 = 0;
715
716	while (true) {
717	c1 = str_decode(s, &off1, STR_NO_LIMIT);
718	c2 = str_decode(p, &off2, STR_NO_LIMIT);
719
720	if (c2 == 0)
721	return true;
722
723	if (c1 != c2)
724	return false;
725
726	if (c1 == 0)
727	break;
728	}
729
730	return false;
731	}
732
733	/** Copy string.
734	*
735	* Copy source string @a src to destination buffer @a dest.
736	* No more than @a size bytes are written. If the size of the output buffer
737	* is at least one byte, the output string will always be well-formed, i.e.
738	* null-terminated and containing only complete characters.
739	*
740	* @param dest Destination buffer.
741	* @param count Size of the destination buffer (must be > 0).
742	* @param src Source string.
743	*
744	*/
745	void str_cpy(char dest, size_t size, const char src)
746	{
747	/* There must be space for a null terminator in the buffer. */
748	assert(size > 0);
749
750	size_t src_off = 0;
751	size_t dest_off = 0;
752
753	wchar_t ch;
754	while ((ch = str_decode(src, &src_off, STR_NO_LIMIT)) != 0) {
755	if (chr_encode(ch, dest, &dest_off, size - 1) != EOK)
756	break;
757	}
758
759	dest[dest_off] = '\0';
760	}
761
762	/** Copy size-limited substring.
763	*
764	* Copy prefix of string @a src of max. size @a size to destination buffer
765	* @a dest. No more than @a size bytes are written. The output string will
766	* always be well-formed, i.e. null-terminated and containing only complete
767	* characters.
768	*
769	* No more than @a n bytes are read from the input string, so it does not
770	* have to be null-terminated.
771	*
772	* @param dest Destination buffer.
773	* @param count Size of the destination buffer (must be > 0).
774	* @param src Source string.
775	* @param n Maximum number of bytes to read from @a src.
776	*
777	*/
778	void str_ncpy(char dest, size_t size, const char src, size_t n)
779	{
780	/* There must be space for a null terminator in the buffer. */
781	assert(size > 0);
782
783	size_t src_off = 0;
784	size_t dest_off = 0;
785
786	wchar_t ch;
787	while ((ch = str_decode(src, &src_off, n)) != 0) {
788	if (chr_encode(ch, dest, &dest_off, size - 1) != EOK)
789	break;
790	}
791
792	dest[dest_off] = '\0';
793	}
794
/** Append one string to another.
 *
 * Append source string @a src to string in destination buffer @a dest.
 * Size of the destination buffer is @a size. If the size of the output buffer
 * is at least one byte, the output string will always be well-formed, i.e.
 * null-terminated and containing only complete characters.
 *
 * Nothing is done when the string already in @a dest occupies @a size
 * bytes or more.
 *
 * @param dest Destination buffer.
 * @param size Size of the destination buffer.
 * @param src  Source string.
 */
void str_append(char *dest, size_t size, const char *src)
{
	size_t dstr_size;

	dstr_size = str_size(dest);
	if (dstr_size >= size)
		return;

	/* Copy over the existing terminator, into the remaining space */
	str_cpy(dest + dstr_size, size - dstr_size, src);
}
816
817	/** Convert space-padded ASCII to string.
818	*
819	* Common legacy text encoding in hardware is 7-bit ASCII fitted into
820	* a fixed-width byte buffer (bit 7 always zero), right-padded with spaces
821	* (ASCII 0x20). Convert space-padded ascii to string representation.
822	*
823	* If the text does not fit into the destination buffer, the function converts
824	* as many characters as possible and returns EOVERFLOW.
825	*
826	* If the text contains non-ASCII bytes (with bit 7 set), the whole string is
827	* converted anyway and invalid characters are replaced with question marks
828	* (U_SPECIAL) and the function returns EIO.
829	*
830	* Regardless of return value upon return @a dest will always be well-formed.
831	*
832	* @param dest Destination buffer
833	* @param size Size of destination buffer
834	* @param src Space-padded ASCII.
835	* @param n Size of the source buffer in bytes.
836	*
837	* @return EOK on success, EOVERFLOW if the text does not fit
838	* destination buffer, EIO if the text contains
839	* non-ASCII bytes.
840	*/
841	int spascii_to_str(char dest, size_t size, const uint8_t src, size_t n)
842	{
843	size_t sidx;
844	size_t didx;
845	size_t dlast;
846	uint8_t byte;
847	int rc;
848	int result;
849
850	/* There must be space for a null terminator in the buffer. */
851	assert(size > 0);
852	result = EOK;
853
854	didx = 0;
855	dlast = 0;
856	for (sidx = 0; sidx < n; ++sidx) {
857	byte = src[sidx];
858	if (!ascii_check(byte)) {
859	byte = U_SPECIAL;
860	result = EIO;
861	}
862
863	rc = chr_encode(byte, dest, &didx, size - 1);
864	if (rc != EOK) {
865	assert(rc == EOVERFLOW);
866	dest[didx] = '\0';
867	return rc;
868	}
869
870	/* Remember dest index after last non-empty character */
871	if (byte != 0x20)
872	dlast = didx;
873	}
874
875	/* Terminate string after last non-empty character */
876	dest[dlast] = '\0';
877	return result;
878	}
879
880	/** Convert wide string to string.
881	*
882	* Convert wide string @a src to string. The output is written to the buffer
883	* specified by @a dest and @a size. @a size must be non-zero and the string
884	* written will always be well-formed.
885	*
886	* @param dest Destination buffer.
887	* @param size Size of the destination buffer.
888	* @param src Source wide string.
889	*/
890	void wstr_to_str(char dest, size_t size, const wchar_t src)
891	{
892	wchar_t ch;
893	size_t src_idx;
894	size_t dest_off;
895
896	/* There must be space for a null terminator in the buffer. */
897	assert(size > 0);
898
899	src_idx = 0;
900	dest_off = 0;
901
902	while ((ch = src[src_idx++]) != 0) {
903	if (chr_encode(ch, dest, &dest_off, size - 1) != EOK)
904	break;
905	}
906
907	dest[dest_off] = '\0';
908	}
909
910	/** Convert UTF16 string to string.
911	*
912	* Convert utf16 string @a src to string. The output is written to the buffer
913	* specified by @a dest and @a size. @a size must be non-zero and the string
914	* written will always be well-formed. Surrogate pairs also supported.
915	*
916	* @param dest Destination buffer.
917	* @param size Size of the destination buffer.
918	* @param src Source utf16 string.
919	*
920	* @return EOK, if success, negative otherwise.
921	*/
922	int utf16_to_str(char dest, size_t size, const uint16_t src)
923	{
924	size_t idx = 0, dest_off = 0;
925	wchar_t ch;
926	int rc = EOK;
927
928	/* There must be space for a null terminator in the buffer. */
929	assert(size > 0);
930
931	while (src[idx]) {
932	if ((src[idx] & 0xfc00) == 0xd800) {
933	if (src[idx + 1] && (src[idx + 1] & 0xfc00) == 0xdc00) {
934	ch = 0x10000;
935	ch += (src[idx] & 0x03FF) << 10;
936	ch += (src[idx + 1] & 0x03FF);
937	idx += 2;
938	}
939	else
940	break;
941	} else {
942	ch = src[idx];
943	idx++;
944	}
945	rc = chr_encode(ch, dest, &dest_off, size - 1);
946	if (rc != EOK)
947	break;
948	}
949	dest[dest_off] = '\0';
950	return rc;
951	}
952
953	/** Convert string to UTF16 string.
954	*
955	* Convert string @a src to utf16 string. The output is written to the buffer
956	* specified by @a dest and @a dlen. @a dlen must be non-zero and the string
957	* written will always be well-formed. Surrogate pairs also supported.
958	*
959	* @param dest Destination buffer.
960	* @param dlen Number of utf16 characters that fit in the destination buffer.
961	* @param src Source string.
962	*
963	* @return EOK, if success, negative otherwise.
964	*/
965	int str_to_utf16(uint16_t dest, size_t dlen, const char src)
966	{
967	int rc = EOK;
968	size_t offset = 0;
969	size_t idx = 0;
970	wchar_t c;
971
972	assert(dlen > 0);
973
974	while ((c = str_decode(src, &offset, STR_NO_LIMIT)) != 0) {
975	if (c > 0x10000) {
976	if (idx + 2 >= dlen - 1) {
977	rc = EOVERFLOW;
978	break;
979	}
980	c = (c - 0x10000);
981	dest[idx] = 0xD800 \| (c >> 10);
982	dest[idx + 1] = 0xDC00 \| (c & 0x3FF);
983	idx++;
984	} else {
985	dest[idx] = c;
986	}
987
988	idx++;
989	if (idx >= dlen - 1) {
990	rc = EOVERFLOW;
991	break;
992	}
993	}
994
995	dest[idx] = '\0';
996	return rc;
997	}
998
999
1000	/** Convert wide string to new string.
1001	*
1002	* Convert wide string @a src to string. Space for the new string is allocated
1003	* on the heap.
1004	*
1005	* @param src Source wide string.
1006	* @return New string.
1007	*/
1008	char wstr_to_astr(const wchar_t src)
1009	{
1010	char dbuf[STR_BOUNDS(1)];
1011	char *str;
1012	wchar_t ch;
1013
1014	size_t src_idx;
1015	size_t dest_off;
1016	size_t dest_size;
1017
1018	/* Compute size of encoded string. */
1019
1020	src_idx = 0;
1021	dest_size = 0;
1022
1023	while ((ch = src[src_idx++]) != 0) {
1024	dest_off = 0;
1025	if (chr_encode(ch, dbuf, &dest_off, STR_BOUNDS(1)) != EOK)
1026	break;
1027	dest_size += dest_off;
1028	}
1029
1030	str = malloc(dest_size + 1);
1031	if (str == NULL)
1032	return NULL;
1033
1034	/* Encode string. */
1035
1036	src_idx = 0;
1037	dest_off = 0;
1038
1039	while ((ch = src[src_idx++]) != 0) {
1040	if (chr_encode(ch, str, &dest_off, dest_size) != EOK)
1041	break;
1042	}
1043
1044	str[dest_size] = '\0';
1045	return str;
1046	}
1047
1048
1049	/** Convert string to wide string.
1050	*
1051	* Convert string @a src to wide string. The output is written to the
1052	* buffer specified by @a dest and @a dlen. @a dlen must be non-zero
1053	* and the wide string written will always be null-terminated.
1054	*
1055	* @param dest Destination buffer.
1056	* @param dlen Length of destination buffer (number of wchars).
1057	* @param src Source string.
1058	*/
1059	void str_to_wstr(wchar_t dest, size_t dlen, const char src)
1060	{
1061	size_t offset;
1062	size_t di;
1063	wchar_t c;
1064
1065	assert(dlen > 0);
1066
1067	offset = 0;
1068	di = 0;
1069
1070	do {
1071	if (di >= dlen - 1)
1072	break;
1073
1074	c = str_decode(src, &offset, STR_NO_LIMIT);
1075	dest[di++] = c;
1076	} while (c != '\0');
1077
1078	dest[dlen - 1] = '\0';
1079	}
1080
/** Convert string to newly allocated wide string.
 *
 * Convert string @a str to wide string. A new wide NULL-terminated
 * string will be allocated on the heap with calloc().
 *
 * @param str Source string.
 *
 * @return New wide string or NULL if the allocation failed.
 */
wchar_t *str_to_awstr(const char *str)
{
	size_t len = str_length(str);

	/* One extra element for the terminator */
	wchar_t *wstr = calloc(len + 1, sizeof(wchar_t));
	if (wstr == NULL)
		return NULL;

	str_to_wstr(wstr, len + 1, str);
	return wstr;
}
1099
1100	/** Find first occurence of character in string.
1101	*
1102	* @param str String to search.
1103	* @param ch Character to look for.
1104	*
1105	* @return Pointer to character in @a str or NULL if not found.
1106	*/
1107	char str_chr(const char str, wchar_t ch)
1108	{
1109	wchar_t acc;
1110	size_t off = 0;
1111	size_t last = 0;
1112
1113	while ((acc = str_decode(str, &off, STR_NO_LIMIT)) != 0) {
1114	if (acc == ch)
1115	return (char *) (str + last);
1116	last = off;
1117	}
1118
1119	return NULL;
1120	}
1121
1122	/** Removes specified trailing characters from a string.
1123	*
1124	* @param str String to remove from.
1125	* @param ch Character to remove.
1126	*/
1127	void str_rtrim(char *str, wchar_t ch)
1128	{
1129	size_t off = 0;
1130	size_t pos = 0;
1131	wchar_t c;
1132	bool update_last_chunk = true;
1133	char *last_chunk = NULL;
1134
1135	while ((c = str_decode(str, &off, STR_NO_LIMIT))) {
1136	if (c != ch) {
1137	update_last_chunk = true;
1138	last_chunk = NULL;
1139	} else if (update_last_chunk) {
1140	update_last_chunk = false;
1141	last_chunk = (str + pos);
1142	}
1143	pos = off;
1144	}
1145
1146	if (last_chunk)
1147	*last_chunk = '\0';
1148	}
1149
1150	/** Removes specified leading characters from a string.
1151	*
1152	* @param str String to remove from.
1153	* @param ch Character to remove.
1154	*/
1155	void str_ltrim(char *str, wchar_t ch)
1156	{
1157	wchar_t acc;
1158	size_t off = 0;
1159	size_t pos = 0;
1160	size_t str_sz = str_size(str);
1161
1162	while ((acc = str_decode(str, &off, STR_NO_LIMIT)) != 0) {
1163	if (acc != ch)
1164	break;
1165	else
1166	pos = off;
1167	}
1168
1169	if (pos > 0) {
1170	memmove(str, &str[pos], str_sz - pos);
1171	pos = str_sz - pos;
1172	str[pos] = '\0';
1173	}
1174	}
1175
1176	/** Find last occurence of character in string.
1177	*
1178	* @param str String to search.
1179	* @param ch Character to look for.
1180	*
1181	* @return Pointer to character in @a str or NULL if not found.
1182	*/
1183	char str_rchr(const char str, wchar_t ch)
1184	{
1185	wchar_t acc;
1186	size_t off = 0;
1187	size_t last = 0;
1188	const char *res = NULL;
1189
1190	while ((acc = str_decode(str, &off, STR_NO_LIMIT)) != 0) {
1191	if (acc == ch)
1192	res = (str + last);
1193	last = off;
1194	}
1195
1196	return (char *) res;
1197	}
1198
/** Insert a wide character into a wide string.
 *
 * Insert a wide character into a wide string at position
 * @a pos. The characters after the position are shifted.
 *
 * @param str     String to insert to.
 * @param ch      Character to insert.
 * @param pos     Character index where to insert.
 * @param max_pos Characters in the buffer.
 *
 * @return True if the insertion was successful, false if the position
 *         is out of bounds or the string already holds @a max_pos
 *         characters.
 *
 */
bool wstr_linsert(wchar_t *str, wchar_t ch, size_t pos, size_t max_pos)
{
	size_t len = wstr_length(str);

	/*
	 * Since pos <= len, requiring len < max_pos also guarantees
	 * pos + 1 <= max_pos. It additionally rejects inserting into
	 * a string that is already full, which would otherwise shift
	 * the terminator beyond the stated capacity.
	 */
	if ((pos > len) || (len >= max_pos))
		return false;

	/* Shift str[pos..len] (terminator included) one slot up. */
	size_t i;
	for (i = len + 1; i > pos; i--)
		str[i] = str[i - 1];

	str[pos] = ch;

	return true;
}
1228
/** Remove a wide character from a wide string.
 *
 * Delete the wide character at index @a pos; everything behind it
 * (including the terminator) moves one slot towards the beginning.
 *
 * @param str String to remove from.
 * @param pos Character index to remove.
 *
 * @return True if the removal was successful, false if the position
 *         is out of bounds.
 *
 */
bool wstr_remove(wchar_t *str, size_t pos)
{
	size_t count = wstr_length(str);

	if (pos < count) {
		size_t dst;

		/* Pull str[pos + 1..count] down by one element. */
		for (dst = pos; dst < count; dst++)
			str[dst] = str[dst + 1];

		return true;
	}

	return false;
}
1254
/** Convert string to a number.
 *
 * Core of strtol and strtoul functions.
 *
 * @param nptr   Pointer to string.
 * @param endptr If not NULL, function stores here pointer to the first
 *               invalid character. If no number was found or the base
 *               is invalid, @a nptr is stored.
 * @param base   Zero or number between 2 and 36 inclusive.
 * @param sgn    Set to 1 if a minus sign was found; left untouched
 *               otherwise, so the caller must initialize it.
 *
 * @return Result of conversion, 0 if no conversion could be performed,
 *         ULONG_MAX if the value does not fit into unsigned long.
 *
 */
static unsigned long
_strtoul(const char *nptr, char **endptr, int base, char *sgn)
{
	unsigned char c;
	unsigned long result = 0;
	unsigned long a, b;
	const char *str = nptr;
	const char *tmpptr;
	bool overflow = false;

	/* <ctype.h> classifiers need a value representable as unsigned char. */
	while (isspace((unsigned char) *str))
		str++;

	if (*str == '-') {
		*sgn = 1;
		++str;
	} else if (*str == '+')
		++str;

	if (base) {
		if ((base < 2) || (base > 36)) {
			/* FIXME: set errno to EINVAL */
			if (endptr)
				*endptr = (char *) nptr;
			return 0;
		}
		if ((base == 16) && (*str == '0') && ((str[1] == 'x') ||
		    (str[1] == 'X'))) {
			str += 2;
		}
	} else {
		base = 10;

		if (*str == '0') {
			base = 8;
			if ((str[1] == 'X') || (str[1] == 'x')) {
				base = 16;
				str += 2;
			}
		}
	}

	tmpptr = str;

	while (*str) {
		/*
		 * Map the character to its digit value; anything that is
		 * not a digit or a letter ends up >= 36 and thus >= base.
		 */
		c = *str;
		c = (c >= 'a' ? c - 'a' + 10 : (c >= 'A' ? c - 'A' + 10 :
		    (c <= '9' ? c - '0' : 0xff)));
		if (c >= base) {
			break;
		}

		if (!overflow) {
			/*
			 * Multiply in two halves (low 8 bits and the rest)
			 * so that an overflow shows up in b instead of
			 * silently wrapping around.
			 */
			a = (result & 0xff) * base + c;
			b = (result >> 8) * base + (a >> 8);

			if (b > (ULONG_MAX >> 8)) {
				/*
				 * Keep consuming digits so that endptr ends
				 * up behind the whole number.
				 */
				/* FIXME: errno = ERANGE */
				overflow = true;
			} else {
				result = (b << 8) + (a & 0xff);
			}
		}

		++str;
	}

	if (str == tmpptr) {
		/*
		 * No number was found => first invalid character is the first
		 * character of the string.
		 */
		/* FIXME: set errno to EINVAL */
		str = nptr;
		result = 0;
	}

	if (endptr)
		*endptr = (char *) str;

	if (nptr == str) {
		/* FIXME: errno = EINVAL */
		return 0;
	}

	return (overflow ? ULONG_MAX : result);
}
1347
/** Convert initial part of string to long int according to given base.
 *
 * The number may begin with an arbitrary number of whitespaces followed by
 * optional sign (`+' or `-'). If the base is 0 or 16, the prefix `0x' may be
 * inserted and the number will be taken as hexadecimal one. If the base is 0
 * and the number begins with a zero, the number will be taken as octal one
 * (as with base 8). Otherwise the base 0 is taken as decimal.
 *
 * @param nptr   Pointer to string.
 * @param endptr If not NULL, function stores here pointer to the first
 *               invalid character.
 * @param base   Zero or number between 2 and 36 inclusive.
 *
 * @return Result of conversion; LONG_MIN or LONG_MAX if the value is
 *         out of the range of long int.
 *
 */
long int strtol(const char *nptr, char **endptr, int base)
{
	char sgn = 0;
	unsigned long number = _strtoul(nptr, endptr, base, &sgn);

	if (number > LONG_MAX) {
		if ((sgn) && (number == (unsigned long) (LONG_MAX) + 1)) {
			/*
			 * The magnitude LONG_MAX + 1 with a minus sign is
			 * exactly LONG_MIN; return it directly instead of
			 * relying on an out-of-range conversion.
			 */
			/* FIXME: set 0 to errno */
			return LONG_MIN;
		}
		/* FIXME: set ERANGE to errno */
		return (sgn ? LONG_MIN : LONG_MAX);
	}

	/* number <= LONG_MAX here, so both conversions are well defined. */
	return (sgn ? -(long) number : (long) number);
}
1379
/** Duplicate string.
 *
 * Allocate a new string with malloc() and copy the characters of the
 * source string into it using str_cpy(). The caller owns the returned
 * buffer and should release it with free().
 *
 * NOTE(review): the previous comment claimed that the allocation cannot
 * fail; the code does check for and report allocation failure. It also
 * stated that the duplicate is always a well-formed null-terminated
 * UTF-8 string that may differ from the source on the byte level --
 * that depends on str_cpy(), confirm there.
 *
 * @param src Source string.
 *
 * @return Duplicate string or NULL if the allocation failed.
 *
 */
char *str_dup(const char *src)
{
	/* Size in bytes including the null terminator. */
	size_t size = str_size(src) + 1;
	char *dest = malloc(size);
	if (dest == NULL)
		return NULL;

	str_cpy(dest, size, src);
	return dest;
}
1406
/** Duplicate string with size limit.
 *
 * Allocate a new string with malloc() and copy up to @a n bytes from
 * the source string into it using str_ncpy(). No more than @a n + 1
 * bytes are allocated; if the size occupied by the source string is
 * smaller than @a n, only that size plus one byte is allocated.
 * The caller owns the returned buffer and should release it with free().
 *
 * NOTE(review): the previous comment claimed that the allocation cannot
 * fail; the code does check for and report allocation failure. It also
 * stated that the duplicate is always a well-formed null-terminated
 * UTF-8 string that may differ from the source on the byte level --
 * that depends on str_ncpy(), confirm there.
 *
 * @param src Source string.
 * @param n   Maximum number of bytes to duplicate.
 *
 * @return Duplicate string or NULL if the allocation failed.
 *
 */
char *str_ndup(const char *src, size_t n)
{
	size_t size = str_size(src);
	if (size > n)
		size = n;

	/* One extra byte for the null terminator. */
	char *dest = malloc(size + 1);
	if (dest == NULL)
		return NULL;

	str_ncpy(dest, size + 1, src, size);
	return dest;
}
1440
/** Convert initial part of string to unsigned long according to given base.
 *
 * The number may begin with an arbitrary number of whitespaces followed by
 * optional sign (`+' or `-'). If the base is 0 or 16, the prefix `0x' may be
 * inserted and the number will be taken as hexadecimal one. If the base is 0
 * and the number begins with a zero, the number will be taken as octal one
 * (as with base 8). Otherwise the base 0 is taken as decimal.
 *
 * @param nptr   Pointer to string.
 * @param endptr If not NULL, function stores here pointer to the first
 *               invalid character.
 * @param base   Zero or number between 2 and 36 inclusive.
 *
 * @return Result of conversion. If a minus sign was present, the value
 *         is negated in unsigned long arithmetic.
 *
 */
unsigned long strtoul(const char *nptr, char **endptr, int base)
{
	char sgn = 0;
	unsigned long number = _strtoul(nptr, endptr, base, &sgn);

	return (sgn ? -number : number);
}
1463
/** Split string by delimiters.
 *
 * The input string is modified: the first delimiter following the
 * token is overwritten with a null terminator.
 *
 * @param s     String to be tokenized. If NULL, NULL is returned.
 * @param delim String with the delimiters.
 * @param next  Variable which will receive the pointer to the
 *              continuation of the string following the first
 *              occurrence of any of the delimiter characters.
 *              May be NULL.
 *
 * @return Pointer to the prefix of @a s before the first
 *         delimiter character. NULL if no such prefix
 *         exists.
 *
 */
char *str_tok(char *s, const char *delim, char **next)
{
	char *start, *end;

	if (!s)
		return NULL;

	size_t len = str_size(s);
	size_t cur;
	size_t tmp;
	wchar_t ch;

	/* Skip over leading delimiters. */
	for (tmp = cur = 0;
	    (ch = str_decode(s, &tmp, len)) && str_chr(delim, ch); /**/)
		cur = tmp;
	start = &s[cur];

	/* Skip over token characters. */
	for (tmp = cur;
	    (ch = str_decode(s, &tmp, len)) && !str_chr(delim, ch); /**/)
		cur = tmp;
	end = &s[cur];

	/*
	 * If a delimiter stopped the scan, continue right behind it;
	 * otherwise the end of the string was reached.
	 */
	if (next)
		*next = (ch ? &s[tmp] : &s[cur]);

	if (start == end)
		return NULL;  /* No more tokens. */

	/* Overwrite delimiter with null terminator. */
	*end = '\0';
	return start;
}
1509
1510	/** Convert string to uint64_t (internal variant).
1511	*
1512	* @param nptr Pointer to string.
1513	* @param endptr Pointer to the first invalid character is stored here.
1514	* @param base Zero or number between 2 and 36 inclusive.
1515	* @param neg Indication of unary minus is stored here.
1516	* @apram result Result of the conversion.
1517	*
1518	* @return EOK if conversion was successful.
1519	*
1520	*/
1521	static int str_uint(const char nptr, char *endptr, unsigned int base,
1522	bool neg, uint64_t result)
1523	{
1524	assert(endptr != NULL);
1525	assert(neg != NULL);
1526	assert(result != NULL);
1527
1528	*neg = false;
1529	const char *str = nptr;
1530
1531	/* Ignore leading whitespace */
1532	while (isspace(*str))
1533	str++;
1534
1535	if (*str == '-') {
1536	*neg = true;
1537	str++;
1538	} else if (*str == '+')
1539	str++;
1540
1541	if (base == 0) {
1542	/* Decode base if not specified */
1543	base = 10;
1544
1545	if (*str == '0') {
1546	base = 8;
1547	str++;
1548
1549	switch (*str) {
1550	case 'b':
1551	case 'B':
1552	base = 2;
1553	str++;
1554	break;
1555	case 'o':
1556	case 'O':
1557	base = 8;
1558	str++;
1559	break;
1560	case 'd':
1561	case 'D':
1562	case 't':
1563	case 'T':
1564	base = 10;
1565	str++;
1566	break;
1567	case 'x':
1568	case 'X':
1569	base = 16;
1570	str++;
1571	break;
1572	default:
1573	str--;
1574	}
1575	}
1576	} else {
1577	/* Check base range */
1578	if ((base < 2) \|\| (base > 36)) {
1579	endptr = (char ) str;
1580	return EINVAL;
1581	}
1582	}
1583
1584	*result = 0;
1585	const char *startstr = str;
1586
1587	while (*str != 0) {
1588	unsigned int digit;
1589
1590	if ((str >= 'a') && (str <= 'z'))
1591	digit = *str - 'a' + 10;
1592	else if ((str >= 'A') && (str <= 'Z'))
1593	digit = *str - 'A' + 10;
1594	else if ((str >= '0') && (str <= '9'))
1595	digit = *str - '0';
1596	else
1597	break;
1598
1599	if (digit >= base)
1600	break;
1601
1602	uint64_t prev = *result;
1603	result = (result) * base + digit;
1604
1605	if (*result < prev) {
1606	/* Overflow */
1607	endptr = (char ) str;
1608	return EOVERFLOW;
1609	}
1610
1611	str++;
1612	}
1613
1614	if (str == startstr) {
1615	/*
1616	* No digits were decoded => first invalid character is
1617	* the first character of the string.
1618	*/
1619	str = nptr;
1620	}
1621
1622	endptr = (char ) str;
1623
1624	if (str == nptr)
1625	return EINVAL;
1626
1627	return EOK;
1628	}
1629
1630	/** Convert string to uint8_t.
1631	*
1632	* @param nptr Pointer to string.
1633	* @param endptr If not NULL, pointer to the first invalid character
1634	* is stored here.
1635	* @param base Zero or number between 2 and 36 inclusive.
1636	* @param strict Do not allow any trailing characters.
1637	* @param result Result of the conversion.
1638	*
1639	* @return EOK if conversion was successful.
1640	*
1641	*/
1642	int str_uint8_t(const char nptr, const char *endptr, unsigned int base,
1643	bool strict, uint8_t *result)
1644	{
1645	assert(result != NULL);
1646
1647	bool neg;
1648	char *lendptr;
1649	uint64_t res;
1650	int ret = str_uint(nptr, &lendptr, base, &neg, &res);
1651
1652	if (endptr != NULL)
1653	endptr = (char ) lendptr;
1654
1655	if (ret != EOK)
1656	return ret;
1657
1658	/* Do not allow negative values */
1659	if (neg)
1660	return EINVAL;
1661
1662	/* Check whether we are at the end of
1663	the string in strict mode */
1664	if ((strict) && (*lendptr != 0))
1665	return EINVAL;
1666
1667	/* Check for overflow */
1668	uint8_t _res = (uint8_t) res;
1669	if (_res != res)
1670	return EOVERFLOW;
1671
1672	*result = _res;
1673
1674	return EOK;
1675	}
1676
1677	/** Convert string to uint16_t.
1678	*
1679	* @param nptr Pointer to string.
1680	* @param endptr If not NULL, pointer to the first invalid character
1681	* is stored here.
1682	* @param base Zero or number between 2 and 36 inclusive.
1683	* @param strict Do not allow any trailing characters.
1684	* @param result Result of the conversion.
1685	*
1686	* @return EOK if conversion was successful.
1687	*
1688	*/
1689	int str_uint16_t(const char nptr, const char *endptr, unsigned int base,
1690	bool strict, uint16_t *result)
1691	{
1692	assert(result != NULL);
1693
1694	bool neg;
1695	char *lendptr;
1696	uint64_t res;
1697	int ret = str_uint(nptr, &lendptr, base, &neg, &res);
1698
1699	if (endptr != NULL)
1700	endptr = (char ) lendptr;
1701
1702	if (ret != EOK)
1703	return ret;
1704
1705	/* Do not allow negative values */
1706	if (neg)
1707	return EINVAL;
1708
1709	/* Check whether we are at the end of
1710	the string in strict mode */
1711	if ((strict) && (*lendptr != 0))
1712	return EINVAL;
1713
1714	/* Check for overflow */
1715	uint16_t _res = (uint16_t) res;
1716	if (_res != res)
1717	return EOVERFLOW;
1718
1719	*result = _res;
1720
1721	return EOK;
1722	}
1723
1724	/** Convert string to uint32_t.
1725	*
1726	* @param nptr Pointer to string.
1727	* @param endptr If not NULL, pointer to the first invalid character
1728	* is stored here.
1729	* @param base Zero or number between 2 and 36 inclusive.
1730	* @param strict Do not allow any trailing characters.
1731	* @param result Result of the conversion.
1732	*
1733	* @return EOK if conversion was successful.
1734	*
1735	*/
1736	int str_uint32_t(const char nptr, const char *endptr, unsigned int base,
1737	bool strict, uint32_t *result)
1738	{
1739	assert(result != NULL);
1740
1741	bool neg;
1742	char *lendptr;
1743	uint64_t res;
1744	int ret = str_uint(nptr, &lendptr, base, &neg, &res);
1745
1746	if (endptr != NULL)
1747	endptr = (char ) lendptr;
1748
1749	if (ret != EOK)
1750	return ret;
1751
1752	/* Do not allow negative values */
1753	if (neg)
1754	return EINVAL;
1755
1756	/* Check whether we are at the end of
1757	the string in strict mode */
1758	if ((strict) && (*lendptr != 0))
1759	return EINVAL;
1760
1761	/* Check for overflow */
1762	uint32_t _res = (uint32_t) res;
1763	if (_res != res)
1764	return EOVERFLOW;
1765
1766	*result = _res;
1767
1768	return EOK;
1769	}
1770
1771	/** Convert string to uint64_t.
1772	*
1773	* @param nptr Pointer to string.
1774	* @param endptr If not NULL, pointer to the first invalid character
1775	* is stored here.
1776	* @param base Zero or number between 2 and 36 inclusive.
1777	* @param strict Do not allow any trailing characters.
1778	* @param result Result of the conversion.
1779	*
1780	* @return EOK if conversion was successful.
1781	*
1782	*/
1783	int str_uint64_t(const char nptr, const char *endptr, unsigned int base,
1784	bool strict, uint64_t *result)
1785	{
1786	assert(result != NULL);
1787
1788	bool neg;
1789	char *lendptr;
1790	int ret = str_uint(nptr, &lendptr, base, &neg, result);
1791
1792	if (endptr != NULL)
1793	endptr = (char ) lendptr;
1794
1795	if (ret != EOK)
1796	return ret;
1797
1798	/* Do not allow negative values */
1799	if (neg)
1800	return EINVAL;
1801
1802	/* Check whether we are at the end of
1803	the string in strict mode */
1804	if ((strict) && (*lendptr != 0))
1805	return EINVAL;
1806
1807	return EOK;
1808	}
1809
1810	/** Convert string to size_t.
1811	*
1812	* @param nptr Pointer to string.
1813	* @param endptr If not NULL, pointer to the first invalid character
1814	* is stored here.
1815	* @param base Zero or number between 2 and 36 inclusive.
1816	* @param strict Do not allow any trailing characters.
1817	* @param result Result of the conversion.
1818	*
1819	* @return EOK if conversion was successful.
1820	*
1821	*/
1822	int str_size_t(const char nptr, const char *endptr, unsigned int base,
1823	bool strict, size_t *result)
1824	{
1825	assert(result != NULL);
1826
1827	bool neg;
1828	char *lendptr;
1829	uint64_t res;
1830	int ret = str_uint(nptr, &lendptr, base, &neg, &res);
1831
1832	if (endptr != NULL)
1833	endptr = (char ) lendptr;
1834
1835	if (ret != EOK)
1836	return ret;
1837
1838	/* Do not allow negative values */
1839	if (neg)
1840	return EINVAL;
1841
1842	/* Check whether we are at the end of
1843	the string in strict mode */
1844	if ((strict) && (*lendptr != 0))
1845	return EINVAL;
1846
1847	/* Check for overflow */
1848	size_t _res = (size_t) res;
1849	if (_res != res)
1850	return EOVERFLOW;
1851
1852	*result = _res;
1853
1854	return EOK;
1855	}
1856
/** Scale a value down and pick a matching decimal (SI) unit prefix.
 *
 * A prefix is used only once the value exceeds 1000 units of that
 * prefix, so the scaled value stays above 1000 whenever a prefix
 * is applied.
 *
 * @param val    Value to scale.
 * @param rv     Scaled value is stored here.
 * @param suffix Prefix letter ('k', 'M', 'G', 'T', 'P', 'E') matching
 *               the divisor, or a space if no scaling took place,
 *               is stored here.
 *
 */
void order_suffix(const uint64_t val, uint64_t *rv, char *suffix)
{
	if (val > UINT64_C(10000000000000000000)) {
		/* 10^18 is exa (the original mislabelled it as 'Z'). */
		*rv = val / UINT64_C(1000000000000000000);
		*suffix = 'E';
	} else if (val > UINT64_C(1000000000000000000)) {
		/* 10^15 is peta (the original mislabelled it as 'E'). */
		*rv = val / UINT64_C(1000000000000000);
		*suffix = 'P';
	} else if (val > UINT64_C(1000000000000000)) {
		*rv = val / UINT64_C(1000000000000);
		*suffix = 'T';
	} else if (val > UINT64_C(1000000000000)) {
		*rv = val / UINT64_C(1000000000);
		*suffix = 'G';
	} else if (val > UINT64_C(1000000000)) {
		*rv = val / UINT64_C(1000000);
		*suffix = 'M';
	} else if (val > UINT64_C(1000000)) {
		*rv = val / UINT64_C(1000);
		*suffix = 'k';
	} else {
		*rv = val;
		*suffix = ' ';
	}
}
1882
/** Scale a byte count down and pick a matching binary (IEC) unit.
 *
 * A unit is used only once the value exceeds 1024 of that unit, so
 * the scaled value stays above 1024 whenever scaling is applied.
 *
 * @param val    Value (in bytes) to scale.
 * @param rv     Scaled value is stored here.
 * @param suffix Pointer to a constant unit string ("KiB", "MiB", "GiB",
 *               "TiB", "PiB" or "B") is stored here.
 * @param fixed  If true, the plain byte unit is returned padded with
 *               a trailing space.
 *
 */
void bin_order_suffix(const uint64_t val, uint64_t *rv, const char **suffix,
    bool fixed)
{
	if (val > UINT64_C(1152921504606846976)) {
		/* 2^50 is pebi (the original mislabelled it as "EiB"). */
		*rv = val / UINT64_C(1125899906842624);
		*suffix = "PiB";
	} else if (val > UINT64_C(1125899906842624)) {
		*rv = val / UINT64_C(1099511627776);
		*suffix = "TiB";
	} else if (val > UINT64_C(1099511627776)) {
		*rv = val / UINT64_C(1073741824);
		*suffix = "GiB";
	} else if (val > UINT64_C(1073741824)) {
		*rv = val / UINT64_C(1048576);
		*suffix = "MiB";
	} else if (val > UINT64_C(1048576)) {
		*rv = val / UINT64_C(1024);
		*suffix = "KiB";
	} else {
		*rv = val;
		/*
		 * NOTE(review): the padded variant is presumably meant to
		 * match the width of the three-character units -- confirm
		 * the intended amount of padding.
		 */
		if (fixed)
			*suffix = "B ";
		else
			*suffix = "B";
	}
}
1909
1910	/** @}
1911	*/

Note: See TracBrowser for help on using the repository browser.

Context Navigation

source: mainline/uspace/lib/c/generic/str.c@ b06414f

Download in other formats: