1 // SPDX-License-Identifier: GPL-2.0-only
2 /* -*- linux-c -*- ------------------------------------------------------- *
3  *
4  *   Copyright (C) 1991, 1992 Linus Torvalds
5  *   Copyright 2007 rPath, Inc. - All Rights Reserved
6  *
7  * ----------------------------------------------------------------------- */
8 
9 /*
10  * Oh, it's a waste of space, but oh-so-yummy for debugging.
11  */
12 
13 #include <linux/stdarg.h>
14 
15 #include <linux/compiler.h>
16 #include <linux/ctype.h>
17 #include <linux/kernel.h>
18 #include <linux/limits.h>
19 #include <linux/string.h>
20 #include <linux/types.h>
21 
22 static
23 int skip_atoi(const char **s)
24 {
25 	int i = 0;
26 
27 	while (isdigit(**s))
28 		i = i * 10 + *((*s)++) - '0';
29 	return i;
30 }
31 
32 /*
33  * put_dec_full4 handles numbers in the range 0 <= r < 10000.
34  * The multiplier 0xccd is round(2^15/10), and the approximation
35  * r/10 == (r * 0xccd) >> 15 is exact for all r < 16389.
36  */
37 static
38 void put_dec_full4(char *end, unsigned int r)
39 {
40 	int i;
41 
42 	for (i = 0; i < 3; i++) {
43 		unsigned int q = (r * 0xccd) >> 15;
44 		*--end = '0' + (r - q * 10);
45 		r = q;
46 	}
47 	*--end = '0' + r;
48 }
49 
50 /* put_dec is copied from lib/vsprintf.c with small modifications */
51 
52 /*
53  * Call put_dec_full4 on x % 10000, return x / 10000.
54  * The approximation x/10000 == (x * 0x346DC5D7) >> 43
55  * holds for all x < 1,128,869,999.  The largest value this
56  * helper will ever be asked to convert is 1,125,520,955.
57  * (second call in the put_dec code, assuming n is all-ones).
58  */
59 static
60 unsigned int put_dec_helper4(char *end, unsigned int x)
61 {
62 	unsigned int q = (x * 0x346DC5D7ULL) >> 43;
63 
64 	put_dec_full4(end, x - q * 10000);
65 	return q;
66 }
67 
68 /* Based on code by Douglas W. Jones found at
69  * <http://www.cs.uiowa.edu/~jones/bcd/decimal.html#sixtyfour>
70  * (with permission from the author).
71  * Performs no 64-bit division and hence should be fast on 32-bit machines.
72  */
73 static
74 char *put_dec(char *end, unsigned long long n)
75 {
76 	unsigned int d3, d2, d1, q, h;
77 	char *p = end;
78 
79 	d1  = ((unsigned int)n >> 16); /* implicit "& 0xffff" */
80 	h   = (n >> 32);
81 	d2  = (h      ) & 0xffff;
82 	d3  = (h >> 16); /* implicit "& 0xffff" */
83 
84 	/* n = 2^48 d3 + 2^32 d2 + 2^16 d1 + d0
85 	     = 281_4749_7671_0656 d3 + 42_9496_7296 d2 + 6_5536 d1 + d0 */
86 	q = 656 * d3 + 7296 * d2 + 5536 * d1 + ((unsigned int)n & 0xffff);
87 	q = put_dec_helper4(p, q);
88 	p -= 4;
89 
90 	q += 7671 * d3 + 9496 * d2 + 6 * d1;
91 	q = put_dec_helper4(p, q);
92 	p -= 4;
93 
94 	q += 4749 * d3 + 42 * d2;
95 	q = put_dec_helper4(p, q);
96 	p -= 4;
97 
98 	q += 281 * d3;
99 	q = put_dec_helper4(p, q);
100 	p -= 4;
101 
102 	put_dec_full4(p, q);
103 	p -= 4;
104 
105 	/* strip off the extra 0's we printed */
106 	while (p < end && *p == '0')
107 		++p;
108 
109 	return p;
110 }
111 
112 static
113 char *number(char *end, unsigned long long num, int base, char locase)
114 {
115 	/*
116 	 * locase = 0 or 0x20. ORing digits or letters with 'locase'
117 	 * produces same digits or (maybe lowercased) letters
118 	 */
119 
120 	/* we are called with base 8, 10 or 16, only, thus don't need "G..."  */
121 	static const char digits[16] = "0123456789ABCDEF"; /* "GHIJKLMNOPQRSTUVWXYZ"; */
122 
123 	switch (base) {
124 	case 10:
125 		if (num != 0)
126 			end = put_dec(end, num);
127 		break;
128 	case 8:
129 		for (; num != 0; num >>= 3)
130 			*--end = '0' + (num & 07);
131 		break;
132 	case 16:
133 		for (; num != 0; num >>= 4)
134 			*--end = digits[num & 0xf] | locase;
135 		break;
136 	default:
137 		unreachable();
138 	}
139 
140 	return end;
141 }
142 
143 #define ZEROPAD	1		/* pad with zero */
144 #define SIGN	2		/* unsigned/signed long */
145 #define PLUS	4		/* show plus */
146 #define SPACE	8		/* space if plus */
147 #define LEFT	16		/* left justified */
148 #define SMALL	32		/* Must be 32 == 0x20 */
149 #define SPECIAL	64		/* 0x */
150 #define WIDE	128		/* UTF-16 string */
151 
152 static
153 int get_flags(const char **fmt)
154 {
155 	int flags = 0;
156 
157 	do {
158 		switch (**fmt) {
159 		case '-':
160 			flags |= LEFT;
161 			break;
162 		case '+':
163 			flags |= PLUS;
164 			break;
165 		case ' ':
166 			flags |= SPACE;
167 			break;
168 		case '#':
169 			flags |= SPECIAL;
170 			break;
171 		case '0':
172 			flags |= ZEROPAD;
173 			break;
174 		default:
175 			return flags;
176 		}
177 		++(*fmt);
178 	} while (1);
179 }
180 
181 static
182 int get_int(const char **fmt, va_list *ap)
183 {
184 	if (isdigit(**fmt))
185 		return skip_atoi(fmt);
186 	if (**fmt == '*') {
187 		++(*fmt);
188 		/* it's the next argument */
189 		return va_arg(*ap, int);
190 	}
191 	return 0;
192 }
193 
194 static
195 unsigned long long get_number(int sign, int qualifier, va_list *ap)
196 {
197 	if (sign) {
198 		switch (qualifier) {
199 		case 'L':
200 			return va_arg(*ap, long long);
201 		case 'l':
202 			return va_arg(*ap, long);
203 		case 'h':
204 			return (short)va_arg(*ap, int);
205 		case 'H':
206 			return (signed char)va_arg(*ap, int);
207 		default:
208 			return va_arg(*ap, int);
209 		};
210 	} else {
211 		switch (qualifier) {
212 		case 'L':
213 			return va_arg(*ap, unsigned long long);
214 		case 'l':
215 			return va_arg(*ap, unsigned long);
216 		case 'h':
217 			return (unsigned short)va_arg(*ap, int);
218 		case 'H':
219 			return (unsigned char)va_arg(*ap, int);
220 		default:
221 			return va_arg(*ap, unsigned int);
222 		}
223 	}
224 }
225 
226 static
227 char get_sign(long long *num, int flags)
228 {
229 	if (!(flags & SIGN))
230 		return 0;
231 	if (*num < 0) {
232 		*num = -(*num);
233 		return '-';
234 	}
235 	if (flags & PLUS)
236 		return '+';
237 	if (flags & SPACE)
238 		return ' ';
239 	return 0;
240 }
241 
242 static
243 size_t utf16s_utf8nlen(const u16 *s16, size_t maxlen)
244 {
245 	size_t len, clen;
246 
247 	for (len = 0; len < maxlen && *s16; len += clen) {
248 		u16 c0 = *s16++;
249 
250 		/* First, get the length for a BMP character */
251 		clen = 1 + (c0 >= 0x80) + (c0 >= 0x800);
252 		if (len + clen > maxlen)
253 			break;
254 		/*
255 		 * If this is a high surrogate, and we're already at maxlen, we
256 		 * can't include the character if it's a valid surrogate pair.
257 		 * Avoid accessing one extra word just to check if it's valid
258 		 * or not.
259 		 */
260 		if ((c0 & 0xfc00) == 0xd800) {
261 			if (len + clen == maxlen)
262 				break;
263 			if ((*s16 & 0xfc00) == 0xdc00) {
264 				++s16;
265 				++clen;
266 			}
267 		}
268 	}
269 
270 	return len;
271 }
272 
273 static
274 u32 utf16_to_utf32(const u16 **s16)
275 {
276 	u16 c0, c1;
277 
278 	c0 = *(*s16)++;
279 	/* not a surrogate */
280 	if ((c0 & 0xf800) != 0xd800)
281 		return c0;
282 	/* invalid: low surrogate instead of high */
283 	if (c0 & 0x0400)
284 		return 0xfffd;
285 	c1 = **s16;
286 	/* invalid: missing low surrogate */
287 	if ((c1 & 0xfc00) != 0xdc00)
288 		return 0xfffd;
289 	/* valid surrogate pair */
290 	++(*s16);
291 	return (0x10000 - (0xd800 << 10) - 0xdc00) + (c0 << 10) + c1;
292 }
293 
294 #define PUTC(c) \
295 do {				\
296 	if (pos < size)		\
297 		buf[pos] = (c);	\
298 	++pos;			\
299 } while (0);
300 
301 int vsnprintf(char *buf, size_t size, const char *fmt, va_list ap)
302 {
303 	/* The maximum space required is to print a 64-bit number in octal */
304 	char tmp[(sizeof(unsigned long long) * 8 + 2) / 3];
305 	char *tmp_end = &tmp[ARRAY_SIZE(tmp)];
306 	long long num;
307 	int base;
308 	const char *s;
309 	size_t len, pos;
310 	char sign;
311 
312 	int flags;		/* flags to number() */
313 
314 	int field_width;	/* width of output field */
315 	int precision;		/* min. # of digits for integers; max
316 				   number of chars for from string */
317 	int qualifier;		/* 'h', 'hh', 'l' or 'll' for integer fields */
318 
319 	va_list args;
320 
321 	/*
322 	 * We want to pass our input va_list to helper functions by reference,
323 	 * but there's an annoying edge case. If va_list was originally passed
324 	 * to us by value, we could just pass &ap down to the helpers. This is
325 	 * the case on, for example, X86_32.
326 	 * However, on X86_64 (and possibly others), va_list is actually a
327 	 * size-1 array containing a structure. Our function parameter ap has
328 	 * decayed from T[1] to T*, and &ap has type T** rather than T(*)[1],
329 	 * which is what will be expected by a function taking a va_list *
330 	 * parameter.
331 	 * One standard way to solve this mess is by creating a copy in a local
332 	 * variable of type va_list and then passing a pointer to that local
333 	 * copy instead, which is what we do here.
334 	 */
335 	va_copy(args, ap);
336 
337 	for (pos = 0; *fmt; ++fmt) {
338 		if (*fmt != '%' || *++fmt == '%') {
339 			PUTC(*fmt);
340 			continue;
341 		}
342 
343 		/* process flags */
344 		flags = get_flags(&fmt);
345 
346 		/* get field width */
347 		field_width = get_int(&fmt, &args);
348 		if (field_width < 0) {
349 			field_width = -field_width;
350 			flags |= LEFT;
351 		}
352 
353 		if (flags & LEFT)
354 			flags &= ~ZEROPAD;
355 
356 		/* get the precision */
357 		precision = -1;
358 		if (*fmt == '.') {
359 			++fmt;
360 			precision = get_int(&fmt, &args);
361 			if (precision >= 0)
362 				flags &= ~ZEROPAD;
363 		}
364 
365 		/* get the conversion qualifier */
366 		qualifier = -1;
367 		if (*fmt == 'h' || *fmt == 'l') {
368 			qualifier = *fmt;
369 			++fmt;
370 			if (qualifier == *fmt) {
371 				qualifier -= 'a'-'A';
372 				++fmt;
373 			}
374 		}
375 
376 		sign = 0;
377 
378 		switch (*fmt) {
379 		case 'c':
380 			flags &= LEFT;
381 			s = tmp;
382 			if (qualifier == 'l') {
383 				((u16 *)tmp)[0] = (u16)va_arg(args, unsigned int);
384 				((u16 *)tmp)[1] = L'\0';
385 				precision = INT_MAX;
386 				goto wstring;
387 			} else {
388 				tmp[0] = (unsigned char)va_arg(args, int);
389 				precision = len = 1;
390 			}
391 			goto output;
392 
393 		case 's':
394 			flags &= LEFT;
395 			if (precision < 0)
396 				precision = INT_MAX;
397 			s = va_arg(args, void *);
398 			if (!s)
399 				s = precision < 6 ? "" : "(null)";
400 			else if (qualifier == 'l') {
401 		wstring:
402 				flags |= WIDE;
403 				precision = len = utf16s_utf8nlen((const u16 *)s, precision);
404 				goto output;
405 			}
406 			precision = len = strnlen(s, precision);
407 			goto output;
408 
409 			/* integer number formats - set up the flags and "break" */
410 		case 'o':
411 			base = 8;
412 			break;
413 
414 		case 'p':
415 			if (precision < 0)
416 				precision = 2 * sizeof(void *);
417 			fallthrough;
418 		case 'x':
419 			flags |= SMALL;
420 			fallthrough;
421 		case 'X':
422 			base = 16;
423 			break;
424 
425 		case 'd':
426 		case 'i':
427 			flags |= SIGN;
428 			fallthrough;
429 		case 'u':
430 			flags &= ~SPECIAL;
431 			base = 10;
432 			break;
433 
434 		default:
435 			/*
436 			 * Bail out if the conversion specifier is invalid.
437 			 * There's probably a typo in the format string and the
438 			 * remaining specifiers are unlikely to match up with
439 			 * the arguments.
440 			 */
441 			goto fail;
442 		}
443 		if (*fmt == 'p') {
444 			num = (unsigned long)va_arg(args, void *);
445 		} else {
446 			num = get_number(flags & SIGN, qualifier, &args);
447 		}
448 
449 		sign = get_sign(&num, flags);
450 		if (sign)
451 			--field_width;
452 
453 		s = number(tmp_end, num, base, flags & SMALL);
454 		len = tmp_end - s;
455 		/* default precision is 1 */
456 		if (precision < 0)
457 			precision = 1;
458 		/* precision is minimum number of digits to print */
459 		if (precision < len)
460 			precision = len;
461 		if (flags & SPECIAL) {
462 			/*
463 			 * For octal, a leading 0 is printed only if necessary,
464 			 * i.e. if it's not already there because of the
465 			 * precision.
466 			 */
467 			if (base == 8 && precision == len)
468 				++precision;
469 			/*
470 			 * For hexadecimal, the leading 0x is skipped if the
471 			 * output is empty, i.e. both the number and the
472 			 * precision are 0.
473 			 */
474 			if (base == 16 && precision > 0)
475 				field_width -= 2;
476 			else
477 				flags &= ~SPECIAL;
478 		}
479 		/*
480 		 * For zero padding, increase the precision to fill the field
481 		 * width.
482 		 */
483 		if ((flags & ZEROPAD) && field_width > precision)
484 			precision = field_width;
485 
486 output:
487 		/* Calculate the padding necessary */
488 		field_width -= precision;
489 		/* Leading padding with ' ' */
490 		if (!(flags & LEFT))
491 			while (field_width-- > 0)
492 				PUTC(' ');
493 		/* sign */
494 		if (sign)
495 			PUTC(sign);
496 		/* 0x/0X for hexadecimal */
497 		if (flags & SPECIAL) {
498 			PUTC('0');
499 			PUTC( 'X' | (flags & SMALL));
500 		}
501 		/* Zero padding and excess precision */
502 		while (precision-- > len)
503 			PUTC('0');
504 		/* Actual output */
505 		if (flags & WIDE) {
506 			const u16 *ws = (const u16 *)s;
507 
508 			while (len-- > 0) {
509 				u32 c32 = utf16_to_utf32(&ws);
510 				u8 *s8;
511 				size_t clen;
512 
513 				if (c32 < 0x80) {
514 					PUTC(c32);
515 					continue;
516 				}
517 
518 				/* Number of trailing octets */
519 				clen = 1 + (c32 >= 0x800) + (c32 >= 0x10000);
520 
521 				len -= clen;
522 				s8 = (u8 *)&buf[pos];
523 
524 				/* Avoid writing partial character */
525 				PUTC('\0');
526 				pos += clen;
527 				if (pos >= size)
528 					continue;
529 
530 				/* Set high bits of leading octet */
531 				*s8 = (0xf00 >> 1) >> clen;
532 				/* Write trailing octets in reverse order */
533 				for (s8 += clen; clen; --clen, c32 >>= 6)
534 					*s8-- = 0x80 | (c32 & 0x3f);
535 				/* Set low bits of leading octet */
536 				*s8 |= c32;
537 			}
538 		} else {
539 			while (len-- > 0)
540 				PUTC(*s++);
541 		}
542 		/* Trailing padding with ' ' */
543 		while (field_width-- > 0)
544 			PUTC(' ');
545 	}
546 fail:
547 	va_end(args);
548 
549 	if (size)
550 		buf[min(pos, size-1)] = '\0';
551 
552 	return pos;
553 }
554 
555 int snprintf(char *buf, size_t size, const char *fmt, ...)
556 {
557 	va_list args;
558 	int i;
559 
560 	va_start(args, fmt);
561 	i = vsnprintf(buf, size, fmt, args);
562 	va_end(args);
563 	return i;
564 }
565