Context Navigation

source: mainline/kernel/generic/src/lib/str.c@ 13d5639

Visit:

lfn serial ticket/834-toolchain-update topic/msim-upgrade topic/simplify-dev-export

Last change on this file since 13d5639 was 8e893ae, checked in by Martin Decky <martin@…>, 13 years ago
avoid comparison with 0 if the type is unsigned
Property mode set to `100644`
File size: 23.5 KB

Line
1	/*
2	* Copyright (c) 2001-2004 Jakub Jermar
3	* All rights reserved.
4	*
5	* Redistribution and use in source and binary forms, with or without
6	* modification, are permitted provided that the following conditions
7	* are met:
8	*
9	* - Redistributions of source code must retain the above copyright
10	* notice, this list of conditions and the following disclaimer.
11	* - Redistributions in binary form must reproduce the above copyright
12	* notice, this list of conditions and the following disclaimer in the
13	* documentation and/or other materials provided with the distribution.
14	* - The name of the author may not be used to endorse or promote products
15	* derived from this software without specific prior written permission.
16	*
17	* THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
18	* IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
19	* OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
20	* IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
21	* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
22	* NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
23	* DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
24	* THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
25	* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
26	* THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
27	*/
28
29	/** @addtogroup generic
30	* @{
31	*/
32
/**
 * @file
 * @brief String functions.
 *
 * Strings and characters use the Universal Character Set (UCS). The standard
 * strings, called just strings, are encoded in UTF-8. Wide strings (encoded
 * in UTF-32) are supported to a limited degree. A single character is
 * represented as wchar_t.@n
 *
 * Overview of the terminology:@n
 *
 *  Term                  Meaning
 *  --------------------  ----------------------------------------------------
 *  byte                  8 bits stored in uint8_t (unsigned 8 bit integer)
 *
 *  character             UTF-32 encoded Unicode character, stored in wchar_t
 *                        (signed 32 bit integer), code points 0 .. 1114111
 *                        are valid
 *
 *  ASCII character       7 bit encoded ASCII character, stored in char
 *                        (usually signed 8 bit integer), code points 0 .. 127
 *                        are valid
 *
 *  string                UTF-8 encoded NULL-terminated Unicode string, char *
 *
 *  wide string           UTF-32 encoded NULL-terminated Unicode string,
 *                        wchar_t *
 *
 *  [wide] string size    number of BYTES in a [wide] string (excluding
 *                        the NULL-terminator), size_t
 *
 *  [wide] string length  number of CHARACTERS in a [wide] string (excluding
 *                        the NULL-terminator), size_t
 *
 *  [wide] string width   number of display cells on a monospace display taken
 *                        by a [wide] string, size_t
 *
 *
 * Overview of string metrics:@n
 *
 *  Metric  Abbrev.  Type    Meaning
 *  ------  -------  ------  -------------------------------------------------
 *  size    n        size_t  number of BYTES in a string (excluding the
 *                           NULL-terminator)
 *
 *  length  l        size_t  number of CHARACTERS in a string (excluding the
 *                           NULL-terminator)
 *
 *  width   w        size_t  number of display cells on a monospace display
 *                           taken by a string
 *
 *
 * Function naming prefixes:@n
 *
 *  chr_              operate on characters
 *  ascii_            operate on ASCII characters
 *  str_              operate on strings
 *  wstr_             operate on wide strings
 *
 *  [w]str_[n|l|w]    operate on a prefix limited by size, length
 *                    or width
 *
 *
 * A specific character inside a [wide] string can be referred to by:@n
 *
 *  pointer (char *, wchar_t *)
 *  byte offset (size_t)
 *  character index (size_t)
 *
 */
103
104	#include <str.h>
105	#include <print.h>
106	#include <cpu.h>
107	#include <arch/asm.h>
108	#include <arch.h>
109	#include <errno.h>
110	#include <align.h>
111	#include <debug.h>
112	#include <macros.h>
113
/** Evaluate @a cond only if wchar_t is a signed type.
 *
 * When WCHAR_IS_UNSIGNED is defined, a test such as "ch >= 0" is always
 * true, so the macro collapses to true and the comparison is not emitted.
 */
#ifdef WCHAR_IS_UNSIGNED
	#define WCHAR_SIGNED_CHECK(cond)  (true)
#else
	#define WCHAR_SIGNED_CHECK(cond)  (cond)
#endif

/** Byte mask consisting of lowest @a n bits (out of 8), 0 <= n <= 8 */
#define LO_MASK_8(n)  ((uint8_t) ((1U << (n)) - 1))

/** Mask consisting of lowest @a n bits (out of 32), 0 <= n < 32 */
#define LO_MASK_32(n)  ((uint32_t) ((((uint32_t) 1) << (n)) - 1))

/** Byte mask consisting of highest @a n bits (out of 8), 0 <= n <= 8
 *
 * The result is cast back to uint8_t because the complement is computed
 * on the promoted (int) value and would otherwise have all upper bits set.
 */
#define HI_MASK_8(n)  ((uint8_t) ~LO_MASK_8(8 - (n)))

/** Number of data bits in a UTF-8 continuation byte */
#define CONT_BITS  6
132
133	/** Decode a single character from a string.
134	*
135	* Decode a single character from a string of size @a size. Decoding starts
136	* at @a offset and this offset is moved to the beginning of the next
137	* character. In case of decoding error, offset generally advances at least
138	* by one. However, offset is never moved beyond size.
139	*
140	* @param str String (not necessarily NULL-terminated).
141	* @param offset Byte offset in string where to start decoding.
142	* @param size Size of the string (in bytes).
143	*
144	* @return Value of decoded character, U_SPECIAL on decoding error or
145	* NULL if attempt to decode beyond @a size.
146	*
147	*/
148	wchar_t str_decode(const char str, size_t offset, size_t size)
149	{
150	if (*offset + 1 > size)
151	return 0;
152
153	/* First byte read from string */
154	uint8_t b0 = (uint8_t) str[(*offset)++];
155
156	/* Determine code length */
157
158	unsigned int b0_bits; /* Data bits in first byte */
159	unsigned int cbytes; /* Number of continuation bytes */
160
161	if ((b0 & 0x80) == 0) {
162	/* 0xxxxxxx (Plain ASCII) */
163	b0_bits = 7;
164	cbytes = 0;
165	} else if ((b0 & 0xe0) == 0xc0) {
166	/* 110xxxxx 10xxxxxx */
167	b0_bits = 5;
168	cbytes = 1;
169	} else if ((b0 & 0xf0) == 0xe0) {
170	/* 1110xxxx 10xxxxxx 10xxxxxx */
171	b0_bits = 4;
172	cbytes = 2;
173	} else if ((b0 & 0xf8) == 0xf0) {
174	/* 11110xxx 10xxxxxx 10xxxxxx 10xxxxxx */
175	b0_bits = 3;
176	cbytes = 3;
177	} else {
178	/* 10xxxxxx -- unexpected continuation byte */
179	return U_SPECIAL;
180	}
181
182	if (*offset + cbytes > size)
183	return U_SPECIAL;
184
185	wchar_t ch = b0 & LO_MASK_8(b0_bits);
186
187	/* Decode continuation bytes */
188	while (cbytes > 0) {
189	uint8_t b = (uint8_t) str[(*offset)++];
190
191	/* Must be 10xxxxxx */
192	if ((b & 0xc0) != 0x80)
193	return U_SPECIAL;
194
195	/* Shift data bits to ch */
196	ch = (ch << CONT_BITS) \| (wchar_t) (b & LO_MASK_8(CONT_BITS));
197	cbytes--;
198	}
199
200	return ch;
201	}
202
203	/** Encode a single character to string representation.
204	*
205	* Encode a single character to string representation (i.e. UTF-8) and store
206	* it into a buffer at @a offset. Encoding starts at @a offset and this offset
207	* is moved to the position where the next character can be written to.
208	*
209	* @param ch Input character.
210	* @param str Output buffer.
211	* @param offset Byte offset where to start writing.
212	* @param size Size of the output buffer (in bytes).
213	*
214	* @return EOK if the character was encoded successfully, EOVERFLOW if there
215	* was not enough space in the output buffer or EINVAL if the character
216	* code was invalid.
217	*/
218	int chr_encode(const wchar_t ch, char str, size_t offset, size_t size)
219	{
220	if (*offset >= size)
221	return EOVERFLOW;
222
223	if (!chr_check(ch))
224	return EINVAL;
225
226	/* Unsigned version of ch (bit operations should only be done
227	on unsigned types). */
228	uint32_t cc = (uint32_t) ch;
229
230	/* Determine how many continuation bytes are needed */
231
232	unsigned int b0_bits; /* Data bits in first byte */
233	unsigned int cbytes; /* Number of continuation bytes */
234
235	if ((cc & ~LO_MASK_32(7)) == 0) {
236	b0_bits = 7;
237	cbytes = 0;
238	} else if ((cc & ~LO_MASK_32(11)) == 0) {
239	b0_bits = 5;
240	cbytes = 1;
241	} else if ((cc & ~LO_MASK_32(16)) == 0) {
242	b0_bits = 4;
243	cbytes = 2;
244	} else if ((cc & ~LO_MASK_32(21)) == 0) {
245	b0_bits = 3;
246	cbytes = 3;
247	} else {
248	/* Codes longer than 21 bits are not supported */
249	return EINVAL;
250	}
251
252	/* Check for available space in buffer */
253	if (*offset + cbytes >= size)
254	return EOVERFLOW;
255
256	/* Encode continuation bytes */
257	unsigned int i;
258	for (i = cbytes; i > 0; i--) {
259	str[*offset + i] = 0x80 \| (cc & LO_MASK_32(CONT_BITS));
260	cc = cc >> CONT_BITS;
261	}
262
263	/* Encode first byte */
264	str[*offset] = (cc & LO_MASK_32(b0_bits)) \| HI_MASK_8(8 - b0_bits - 1);
265
266	/* Advance offset */
267	*offset += cbytes + 1;
268
269	return EOK;
270	}
271
/** Get size of string.
 *
 * Count the bytes occupied by the string @a str, not counting the
 * terminating null byte.
 *
 * @param str String to consider.
 *
 * @return Number of bytes used by the string.
 *
 */
size_t str_size(const char *str)
{
	const char *end = str;

	/* Walk to the terminator; the distance travelled is the size. */
	while (*end != '\0')
		end++;

	return (size_t) (end - str);
}
291
/** Get size of wide string.
 *
 * Count the bytes occupied by the wide string @a str, not counting the
 * terminating null character.
 *
 * @param str Wide string to consider.
 *
 * @return Number of bytes used by the wide string.
 *
 */
size_t wstr_size(const wchar_t *str)
{
	size_t chars = wstr_length(str);

	return chars * sizeof(wchar_t);
}
306
307	/** Get size of string with length limit.
308	*
309	* Get the number of bytes which are used by up to @a max_len first
310	* characters in the string @a str. If @a max_len is greater than
311	* the length of @a str, the entire string is measured (excluding the
312	* NULL-terminator).
313	*
314	* @param str String to consider.
315	* @param max_len Maximum number of characters to measure.
316	*
317	* @return Number of bytes used by the characters.
318	*
319	*/
320	size_t str_lsize(const char *str, size_t max_len)
321	{
322	size_t len = 0;
323	size_t offset = 0;
324
325	while (len < max_len) {
326	if (str_decode(str, &offset, STR_NO_LIMIT) == 0)
327	break;
328
329	len++;
330	}
331
332	return offset;
333	}
334
/** Get size of wide string with length limit.
 *
 * Get the number of bytes occupied by at most @a max_len leading wide
 * characters of the wide string @a str. If @a max_len exceeds the length
 * of @a str, the entire wide string is measured (excluding the
 * NULL-terminator).
 *
 * @param str     Wide string to consider.
 * @param max_len Maximum number of wide characters to measure.
 *
 * @return Number of bytes used by the wide characters.
 *
 */
size_t wstr_lsize(const wchar_t *str, size_t max_len)
{
	/* Express the character limit as a byte limit for wstr_nlength(). */
	size_t byte_limit = max_len * sizeof(wchar_t);
	size_t chars = wstr_nlength(str, byte_limit);

	return chars * sizeof(wchar_t);
}
352
353	/** Get number of characters in a string.
354	*
355	* @param str NULL-terminated string.
356	*
357	* @return Number of characters in string.
358	*
359	*/
360	size_t str_length(const char *str)
361	{
362	size_t len = 0;
363	size_t offset = 0;
364
365	while (str_decode(str, &offset, STR_NO_LIMIT) != 0)
366	len++;
367
368	return len;
369	}
370
/** Get number of characters in a wide string.
 *
 * @param wstr NULL-terminated wide string.
 *
 * @return Number of characters in @a wstr (excluding the terminator).
 *
 */
size_t wstr_length(const wchar_t *wstr)
{
	const wchar_t *end = wstr;

	/* Walk to the terminator; the distance travelled is the length. */
	while (*end != 0)
		end++;

	return (size_t) (end - wstr);
}
387
/** Get number of characters in a string with size limit.
 *
 * Counting stops when the decoder yields 0, i.e. at the terminator or
 * once @a size bytes have been consumed.
 *
 * @param str  NULL-terminated string.
 * @param size Maximum number of bytes to consider.
 *
 * @return Number of characters in string.
 *
 */
size_t str_nlength(const char *str, size_t size)
{
	size_t pos = 0;
	size_t count;

	for (count = 0; str_decode(str, &pos, size) != 0; count++)
		;

	return count;
}
406
/** Get number of characters in a wide string with size limit.
 *
 * Only whole wide characters that fit into @a size bytes are considered;
 * a trailing partial character is ignored.
 *
 * @param str  NULL-terminated wide string.
 * @param size Maximum number of bytes to consider.
 *
 * @return Number of characters in the wide string.
 *
 */
size_t wstr_nlength(const wchar_t *str, size_t size)
{
	/* Number of complete wide characters that fit into size bytes */
	size_t max_chars = size / sizeof(wchar_t);
	size_t count = 0;

	while ((count < max_chars) && (str[count] != 0))
		count++;

	return count;
}
428
/** Check whether character is plain ASCII.
 *
 * @param ch Character to check.
 *
 * @return True if @a ch lies in the range 0 .. 127.
 *
 */
bool ascii_check(wchar_t ch)
{
	return (WCHAR_SIGNED_CHECK(ch >= 0) && (ch <= 127)) ? true : false;
}
441
/** Check whether character is valid.
 *
 * @param ch Character to check.
 *
 * @return True if @a ch lies in the Unicode code point range
 *         0 .. 1114111.
 *
 */
bool chr_check(wchar_t ch)
{
	return (WCHAR_SIGNED_CHECK(ch >= 0) && (ch <= 1114111)) ? true : false;
}
454
455	/** Compare two NULL terminated strings.
456	*
457	* Do a char-by-char comparison of two NULL-terminated strings.
458	* The strings are considered equal iff they consist of the same
459	* characters on the minimum of their lengths.
460	*
461	* @param s1 First string to compare.
462	* @param s2 Second string to compare.
463	*
464	* @return 0 if the strings are equal, -1 if first is smaller,
465	* 1 if second smaller.
466	*
467	*/
468	int str_cmp(const char s1, const char s2)
469	{
470	wchar_t c1 = 0;
471	wchar_t c2 = 0;
472
473	size_t off1 = 0;
474	size_t off2 = 0;
475
476	while (true) {
477	c1 = str_decode(s1, &off1, STR_NO_LIMIT);
478	c2 = str_decode(s2, &off2, STR_NO_LIMIT);
479
480	if (c1 < c2)
481	return -1;
482
483	if (c1 > c2)
484	return 1;
485
486	if (c1 == 0 \|\| c2 == 0)
487	break;
488	}
489
490	return 0;
491	}
492
493	/** Compare two NULL terminated strings with length limit.
494	*
495	* Do a char-by-char comparison of two NULL-terminated strings.
496	* The strings are considered equal iff they consist of the same
497	* characters on the minimum of their lengths and the length limit.
498	*
499	* @param s1 First string to compare.
500	* @param s2 Second string to compare.
501	* @param max_len Maximum number of characters to consider.
502	*
503	* @return 0 if the strings are equal, -1 if first is smaller,
504	* 1 if second smaller.
505	*
506	*/
507	int str_lcmp(const char s1, const char s2, size_t max_len)
508	{
509	wchar_t c1 = 0;
510	wchar_t c2 = 0;
511
512	size_t off1 = 0;
513	size_t off2 = 0;
514
515	size_t len = 0;
516
517	while (true) {
518	if (len >= max_len)
519	break;
520
521	c1 = str_decode(s1, &off1, STR_NO_LIMIT);
522	c2 = str_decode(s2, &off2, STR_NO_LIMIT);
523
524	if (c1 < c2)
525	return -1;
526
527	if (c1 > c2)
528	return 1;
529
530	if (c1 == 0 \|\| c2 == 0)
531	break;
532
533	++len;
534	}
535
536	return 0;
537
538	}
539
540	/** Copy string.
541	*
542	* Copy source string @a src to destination buffer @a dest.
543	* No more than @a size bytes are written. If the size of the output buffer
544	* is at least one byte, the output string will always be well-formed, i.e.
545	* null-terminated and containing only complete characters.
546	*
547	* @param dest Destination buffer.
548	* @param count Size of the destination buffer (must be > 0).
549	* @param src Source string.
550	*
551	*/
552	void str_cpy(char dest, size_t size, const char src)
553	{
554	/* There must be space for a null terminator in the buffer. */
555	ASSERT(size > 0);
556
557	size_t src_off = 0;
558	size_t dest_off = 0;
559
560	wchar_t ch;
561	while ((ch = str_decode(src, &src_off, STR_NO_LIMIT)) != 0) {
562	if (chr_encode(ch, dest, &dest_off, size - 1) != EOK)
563	break;
564	}
565
566	dest[dest_off] = '\0';
567	}
568
569	/** Copy size-limited substring.
570	*
571	* Copy prefix of string @a src of max. size @a size to destination buffer
572	* @a dest. No more than @a size bytes are written. The output string will
573	* always be well-formed, i.e. null-terminated and containing only complete
574	* characters.
575	*
576	* No more than @a n bytes are read from the input string, so it does not
577	* have to be null-terminated.
578	*
579	* @param dest Destination buffer.
580	* @param count Size of the destination buffer (must be > 0).
581	* @param src Source string.
582	* @param n Maximum number of bytes to read from @a src.
583	*
584	*/
585	void str_ncpy(char dest, size_t size, const char src, size_t n)
586	{
587	/* There must be space for a null terminator in the buffer. */
588	ASSERT(size > 0);
589
590	size_t src_off = 0;
591	size_t dest_off = 0;
592
593	wchar_t ch;
594	while ((ch = str_decode(src, &src_off, n)) != 0) {
595	if (chr_encode(ch, dest, &dest_off, size - 1) != EOK)
596	break;
597	}
598
599	dest[dest_off] = '\0';
600	}
601
602	/** Duplicate string.
603	*
604	* Allocate a new string and copy characters from the source
605	* string into it. The duplicate string is allocated via sleeping
606	* malloc(), thus this function can sleep in no memory conditions.
607	*
608	* The allocation cannot fail and the return value is always
609	* a valid pointer. The duplicate string is always a well-formed
610	* null-terminated UTF-8 string, but it can differ from the source
611	* string on the byte level.
612	*
613	* @param src Source string.
614	*
615	* @return Duplicate string.
616	*
617	*/
618	char str_dup(const char src)
619	{
620	size_t size = str_size(src) + 1;
621	char *dest = malloc(size, 0);
622	ASSERT(dest);
623
624	str_cpy(dest, size, src);
625	return dest;
626	}
627
628	/** Duplicate string with size limit.
629	*
630	* Allocate a new string and copy up to @max_size bytes from the source
631	* string into it. The duplicate string is allocated via sleeping
632	* malloc(), thus this function can sleep in no memory conditions.
633	* No more than @max_size + 1 bytes is allocated, but if the size
634	* occupied by the source string is smaller than @max_size + 1,
635	* less is allocated.
636	*
637	* The allocation cannot fail and the return value is always
638	* a valid pointer. The duplicate string is always a well-formed
639	* null-terminated UTF-8 string, but it can differ from the source
640	* string on the byte level.
641	*
642	* @param src Source string.
643	* @param n Maximum number of bytes to duplicate.
644	*
645	* @return Duplicate string.
646	*
647	*/
648	char str_ndup(const char src, size_t n)
649	{
650	size_t size = str_size(src);
651	if (size > n)
652	size = n;
653
654	char *dest = malloc(size + 1, 0);
655	ASSERT(dest);
656
657	str_ncpy(dest, size + 1, src, size);
658	return dest;
659	}
660
661	/** Convert wide string to string.
662	*
663	* Convert wide string @a src to string. The output is written to the buffer
664	* specified by @a dest and @a size. @a size must be non-zero and the string
665	* written will always be well-formed.
666	*
667	* @param dest Destination buffer.
668	* @param size Size of the destination buffer.
669	* @param src Source wide string.
670	*/
671	void wstr_to_str(char dest, size_t size, const wchar_t src)
672	{
673	wchar_t ch;
674	size_t src_idx;
675	size_t dest_off;
676
677	/* There must be space for a null terminator in the buffer. */
678	ASSERT(size > 0);
679
680	src_idx = 0;
681	dest_off = 0;
682
683	while ((ch = src[src_idx++]) != 0) {
684	if (chr_encode(ch, dest, &dest_off, size - 1) != EOK)
685	break;
686	}
687
688	dest[dest_off] = '\0';
689	}
690
691	/** Find first occurence of character in string.
692	*
693	* @param str String to search.
694	* @param ch Character to look for.
695	*
696	* @return Pointer to character in @a str or NULL if not found.
697	*
698	*/
699	char str_chr(const char str, wchar_t ch)
700	{
701	wchar_t acc;
702	size_t off = 0;
703	size_t last = 0;
704
705	while ((acc = str_decode(str, &off, STR_NO_LIMIT)) != 0) {
706	if (acc == ch)
707	return (char *) (str + last);
708	last = off;
709	}
710
711	return NULL;
712	}
713
/** Insert a wide character into a wide string.
 *
 * Insert a wide character into a wide string at position
 * @a pos. The characters after the position (including the
 * terminator) are shifted by one.
 *
 * @param str     String to insert to.
 * @param ch      Character to insert.
 * @param pos     Character index where to insert.
 * @param max_pos Characters in the buffer. The string is never grown
 *                beyond @a max_pos characters.
 *                NOTE(review): the terminator is written at index
 *                @a max_pos at most, which presumes the buffer has room
 *                for it -- confirm against callers.
 *
 * @return True if the insertion was successful, false if the position
 *         is out of bounds or the string is already full.
 *
 */
bool wstr_linsert(wchar_t *str, wchar_t ch, size_t pos, size_t max_pos)
{
	size_t len = wstr_length(str);

	if ((pos > len) || (pos + 1 > max_pos))
		return false;

	/*
	 * The string grows by one character. Without this check a full
	 * string would be shifted past the end of the buffer whenever
	 * the insert position itself is still in range.
	 */
	if (len + 1 > max_pos)
		return false;

	/*
	 * Shift the tail (terminator first). The condition is written as
	 * i + 1 > pos so that the loop also terminates for pos == 0.
	 */
	size_t i;
	for (i = len; i + 1 > pos; i--)
		str[i + 1] = str[i];

	str[pos] = ch;

	return true;
}
743
/** Remove a wide character from a wide string.
 *
 * Remove the wide character at position @a pos. All characters behind
 * it, including the terminator, are moved one position towards the
 * beginning.
 *
 * @param str String to remove from.
 * @param pos Character index to remove.
 *
 * @return True if the removal was successful, false if the position
 *         is out of bounds.
 *
 */
bool wstr_remove(wchar_t *str, size_t pos)
{
	size_t len = wstr_length(str);

	if (pos >= len)
		return false;

	/* Pull each following character (terminator last) one slot down. */
	wchar_t *cur;
	for (cur = str + pos; cur < str + len; cur++)
		*cur = *(cur + 1);

	return true;
}
769
770	/** Convert string to uint64_t (internal variant).
771	*
772	* @param nptr Pointer to string.
773	* @param endptr Pointer to the first invalid character is stored here.
774	* @param base Zero or number between 2 and 36 inclusive.
775	* @param neg Indication of unary minus is stored here.
776	* @apram result Result of the conversion.
777	*
778	* @return EOK if conversion was successful.
779	*
780	*/
781	static int str_uint(const char nptr, char *endptr, unsigned int base,
782	bool neg, uint64_t result)
783	{
784	ASSERT(endptr != NULL);
785	ASSERT(neg != NULL);
786	ASSERT(result != NULL);
787
788	*neg = false;
789	const char *str = nptr;
790
791	/* Ignore leading whitespace */
792	while (isspace(*str))
793	str++;
794
795	if (*str == '-') {
796	*neg = true;
797	str++;
798	} else if (*str == '+')
799	str++;
800
801	if (base == 0) {
802	/* Decode base if not specified */
803	base = 10;
804
805	if (*str == '0') {
806	base = 8;
807	str++;
808
809	switch (*str) {
810	case 'b':
811	case 'B':
812	base = 2;
813	str++;
814	break;
815	case 'o':
816	case 'O':
817	base = 8;
818	str++;
819	break;
820	case 'd':
821	case 'D':
822	case 't':
823	case 'T':
824	base = 10;
825	str++;
826	break;
827	case 'x':
828	case 'X':
829	base = 16;
830	str++;
831	break;
832	default:
833	str--;
834	}
835	}
836	} else {
837	/* Check base range */
838	if ((base < 2) \|\| (base > 36)) {
839	endptr = (char ) str;
840	return EINVAL;
841	}
842	}
843
844	*result = 0;
845	const char *startstr = str;
846
847	while (*str != 0) {
848	unsigned int digit;
849
850	if ((str >= 'a') && (str <= 'z'))
851	digit = *str - 'a' + 10;
852	else if ((str >= 'A') && (str <= 'Z'))
853	digit = *str - 'A' + 10;
854	else if ((str >= '0') && (str <= '9'))
855	digit = *str - '0';
856	else
857	break;
858
859	if (digit >= base)
860	break;
861
862	uint64_t prev = *result;
863	result = (result) * base + digit;
864
865	if (*result < prev) {
866	/* Overflow */
867	endptr = (char ) str;
868	return EOVERFLOW;
869	}
870
871	str++;
872	}
873
874	if (str == startstr) {
875	/*
876	* No digits were decoded => first invalid character is
877	* the first character of the string.
878	*/
879	str = nptr;
880	}
881
882	endptr = (char ) str;
883
884	if (str == nptr)
885	return EINVAL;
886
887	return EOK;
888	}
889
890	/** Convert string to uint64_t.
891	*
892	* @param nptr Pointer to string.
893	* @param endptr If not NULL, pointer to the first invalid character
894	* is stored here.
895	* @param base Zero or number between 2 and 36 inclusive.
896	* @param strict Do not allow any trailing characters.
897	* @param result Result of the conversion.
898	*
899	* @return EOK if conversion was successful.
900	*
901	*/
902	int str_uint64_t(const char nptr, char *endptr, unsigned int base,
903	bool strict, uint64_t *result)
904	{
905	ASSERT(result != NULL);
906
907	bool neg;
908	char *lendptr;
909	int ret = str_uint(nptr, &lendptr, base, &neg, result);
910
911	if (endptr != NULL)
912	endptr = (char ) lendptr;
913
914	if (ret != EOK)
915	return ret;
916
917	/* Do not allow negative values */
918	if (neg)
919	return EINVAL;
920
921	/* Check whether we are at the end of
922	the string in strict mode */
923	if ((strict) && (*lendptr != 0))
924	return EINVAL;
925
926	return EOK;
927	}
928
/** Scale a value for human-readable output using decimal (SI) prefixes.
 *
 * The value is divided by the largest power of 1000 that still leaves
 * at least four digits before the decimal point and the matching
 * SI prefix letter is reported. Values up to 1000000 are passed through
 * with a blank suffix.
 *
 * @param val    Value to scale.
 * @param rv     Scaled value is stored here.
 * @param suffix SI prefix character ('k', 'M', 'G', 'T', 'P', 'E' or ' ')
 *               is stored here.
 *
 */
void order_suffix(const uint64_t val, uint64_t *rv, char *suffix)
{
	if (val > UINT64_C(10000000000000000000)) {
		/* Divided by 10^18 => exa */
		*rv = val / UINT64_C(1000000000000000000);
		*suffix = 'E';
	} else if (val > UINT64_C(1000000000000000000)) {
		/* Divided by 10^15 => peta */
		*rv = val / UINT64_C(1000000000000000);
		*suffix = 'P';
	} else if (val > UINT64_C(1000000000000000)) {
		/* Divided by 10^12 => tera */
		*rv = val / UINT64_C(1000000000000);
		*suffix = 'T';
	} else if (val > UINT64_C(1000000000000)) {
		/* Divided by 10^9 => giga */
		*rv = val / UINT64_C(1000000000);
		*suffix = 'G';
	} else if (val > UINT64_C(1000000000)) {
		/* Divided by 10^6 => mega */
		*rv = val / UINT64_C(1000000);
		*suffix = 'M';
	} else if (val > UINT64_C(1000000)) {
		/* Divided by 10^3 => kilo */
		*rv = val / UINT64_C(1000);
		*suffix = 'k';
	} else {
		*rv = val;
		*suffix = ' ';
	}
}
954
/** Scale a byte count for human-readable output using binary prefixes.
 *
 * The value is divided by the largest power of 1024 that still leaves
 * a result greater than 1024 and the matching unit string is reported.
 * Values up to 1048576 are passed through in plain bytes.
 *
 * @param val    Value to scale (in bytes).
 * @param rv     Scaled value is stored here.
 * @param suffix Pointer to a constant unit string ("KiB", "MiB", "GiB",
 *               "TiB", "PiB" or bytes) is stored here.
 * @param fixed  If true, the bytes unit is padded with spaces to the
 *               width of the other (three character) units.
 *
 */
void bin_order_suffix(const uint64_t val, uint64_t *rv, const char **suffix,
    bool fixed)
{
	if (val > UINT64_C(1152921504606846976)) {
		/* Divided by 2^50 => pebibytes */
		*rv = val / UINT64_C(1125899906842624);
		*suffix = "PiB";
	} else if (val > UINT64_C(1125899906842624)) {
		/* Divided by 2^40 => tebibytes */
		*rv = val / UINT64_C(1099511627776);
		*suffix = "TiB";
	} else if (val > UINT64_C(1099511627776)) {
		/* Divided by 2^30 => gibibytes */
		*rv = val / UINT64_C(1073741824);
		*suffix = "GiB";
	} else if (val > UINT64_C(1073741824)) {
		/* Divided by 2^20 => mebibytes */
		*rv = val / UINT64_C(1048576);
		*suffix = "MiB";
	} else if (val > UINT64_C(1048576)) {
		/* Divided by 2^10 => kibibytes */
		*rv = val / UINT64_C(1024);
		*suffix = "KiB";
	} else {
		*rv = val;
		if (fixed)
			*suffix = "B  ";
		else
			*suffix = "B";
	}
}
981
982	/** @}
983	*/

Note: See TracBrowser for help on using the repository browser.

Download in other formats: