xref: /openbmc/linux/lib/842/842_compress.c (revision 75bf465f0bc33e9b776a46d6a1b9b990f5fb7c37)
1*c942fddfSThomas Gleixner // SPDX-License-Identifier: GPL-2.0-or-later
22da572c9SDan Streetman /*
32da572c9SDan Streetman  * 842 Software Compression
42da572c9SDan Streetman  *
52da572c9SDan Streetman  * Copyright (C) 2015 Dan Streetman, IBM Corp
62da572c9SDan Streetman  *
72da572c9SDan Streetman  * See 842.h for details of the 842 compressed format.
82da572c9SDan Streetman  */
92da572c9SDan Streetman 
102da572c9SDan Streetman #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
112da572c9SDan Streetman #define MODULE_NAME "842_compress"
122da572c9SDan Streetman 
132da572c9SDan Streetman #include <linux/hashtable.h>
142da572c9SDan Streetman 
152da572c9SDan Streetman #include "842.h"
162da572c9SDan Streetman #include "842_debugfs.h"
172da572c9SDan Streetman 
/* "bits" argument handed to DECLARE_HASHTABLE() for the three lookup tables
 * in struct sw842_param (one table each for 8, 4 and 2 byte values)
 */
#define SW842_HASHTABLE8_BITS	(10)
#define SW842_HASHTABLE4_BITS	(11)
#define SW842_HASHTABLE2_BITS	(10)
212da572c9SDan Streetman 
/* By default, we allow compressing input buffers of any length, but we must
 * use the non-standard "short data" template so the decompressor can correctly
 * reproduce the uncompressed data buffer at the right length.  However the
 * hardware 842 decompressor will not recognize the "short data" template, and
 * will fail to decompress any compressed buffer containing it (I have no idea
 * why anyone would want to use software to compress and hardware to decompress
 * but that's beside the point).  This parameter forces the compression
 * function to simply reject any input buffer that isn't a multiple of 8 bytes
 * long, instead of using the "short data" template, so that all compressed
 * buffers produced by this function will be decompressible by the 842 hardware
 * decompressor.  Unless you have a specific need for that, leave this disabled
 * so that any length buffer can be compressed.
 */
static bool sw842_strict;
/* exposed as the "strict" module parameter, mode 0644 */
module_param_named(strict, sw842_strict, bool, 0644);
372da572c9SDan Streetman 
/* Templates the compressor may emit, one row per template.  Columns 0-3 are
 * the ops that together describe one 8 byte input block (add_template()
 * rejects a row whose ops do not add up to 8 bytes); column 4 is the template
 * opcode that add_template() writes to the output stream.
 *
 * process_next() tries the rows in order and uses the first one whose index
 * ops all match, falling back to the last row (8 bytes of literal data).  The
 * trailing comment on each row is the number of parameter bits that row
 * emits; rows are listed in ascending order of that size.
 */
static u8 comp_ops[OPS_MAX][5] = { /* params size in bits */
	{ I8, N0, N0, N0, 0x19 }, /* 8 */
	{ I4, I4, N0, N0, 0x18 }, /* 18 */
	{ I4, I2, I2, N0, 0x17 }, /* 25 */
	{ I2, I2, I4, N0, 0x13 }, /* 25 */
	{ I2, I2, I2, I2, 0x12 }, /* 32 */
	{ I4, I2, D2, N0, 0x16 }, /* 33 */
	{ I4, D2, I2, N0, 0x15 }, /* 33 */
	{ I2, D2, I4, N0, 0x0e }, /* 33 */
	{ D2, I2, I4, N0, 0x09 }, /* 33 */
	{ I2, I2, I2, D2, 0x11 }, /* 40 */
	{ I2, I2, D2, I2, 0x10 }, /* 40 */
	{ I2, D2, I2, I2, 0x0d }, /* 40 */
	{ D2, I2, I2, I2, 0x08 }, /* 40 */
	{ I4, D4, N0, N0, 0x14 }, /* 41 */
	{ D4, I4, N0, N0, 0x04 }, /* 41 */
	{ I2, I2, D4, N0, 0x0f }, /* 48 */
	{ I2, D2, I2, D2, 0x0c }, /* 48 */
	{ I2, D4, I2, N0, 0x0b }, /* 48 */
	{ D2, I2, I2, D2, 0x07 }, /* 48 */
	{ D2, I2, D2, I2, 0x06 }, /* 48 */
	{ D4, I2, I2, N0, 0x03 }, /* 48 */
	{ I2, D2, D4, N0, 0x0a }, /* 56 */
	{ D2, I2, D4, N0, 0x05 }, /* 56 */
	{ D4, I2, D2, N0, 0x02 }, /* 56 */
	{ D4, D2, I2, N0, 0x01 }, /* 56 */
	{ D8, N0, N0, N0, 0x00 }, /* 64 */
};
662da572c9SDan Streetman 
/* hashtable entry that remembers one 8 byte value and the slot it lives in */
struct sw842_hlist_node8 {
	struct hlist_node node;	/* linkage into sw842_param.htable8 */
	u64 data;		/* value last stored by replace_hash() */
	u8 index;		/* position in sw842_param.node8[], set at init */
};
722da572c9SDan Streetman 
/* hashtable entry that remembers one 4 byte value and the slot it lives in */
struct sw842_hlist_node4 {
	struct hlist_node node;	/* linkage into sw842_param.htable4 */
	u32 data;		/* value last stored by replace_hash() */
	u16 index;		/* position in sw842_param.node4[], set at init */
};
782da572c9SDan Streetman 
/* hashtable entry that remembers one 2 byte value and the slot it lives in */
struct sw842_hlist_node2 {
	struct hlist_node node;	/* linkage into sw842_param.htable2 */
	u16 data;		/* value last stored by replace_hash() */
	u8 index;		/* position in sw842_param.node2[], set at init */
};
842da572c9SDan Streetman 
/* special values for sw842_param.indexN[]; a usable index is always >= 0 */
#define INDEX_NOT_FOUND		(-1)	/* find_index() found no match */
#define INDEX_NOT_CHECKED	(-2)	/* no lookup done yet for this block */
872da572c9SDan Streetman 
/* Complete compressor state.  sw842_compress() places this in the working
 * memory supplied by its caller.
 */
struct sw842_param {
	u8 *in;		/* current read position in the input */
	u8 *instart;	/* start of the input buffer */
	u64 ilen;	/* input bytes not yet consumed */
	u8 *out;	/* output byte currently being filled */
	u64 olen;	/* output bytes still available from @out */
	u8 bit;		/* bits already used in *out; add_bits() keeps it < 8 */
	/* the current 8 byte input block, loaded by get_next_data() as one
	 * 8 byte, two 4 byte and four 2 byte big-endian values
	 */
	u64 data8[1];
	u32 data4[2];
	u16 data2[4];
	/* lookup result for each dataN[] value: a node index, or one of the
	 * INDEX_NOT_* values
	 */
	int index8[1];
	int index4[2];
	int index2[4];
	/* value -> node lookup tables, one per value width */
	DECLARE_HASHTABLE(htable8, SW842_HASHTABLE8_BITS);
	DECLARE_HASHTABLE(htable4, SW842_HASHTABLE4_BITS);
	DECLARE_HASHTABLE(htable2, SW842_HASHTABLE2_BITS);
	/* node storage; a node's array position is the index written to the
	 * compressed stream
	 */
	struct sw842_hlist_node8 node8[1 << I8_BITS];
	struct sw842_hlist_node4 node4[1 << I4_BITS];
	struct sw842_hlist_node2 node2[1 << I2_BITS];
};
1082da572c9SDan Streetman 
/* Read the big-endian value of width @b bits located @o bytes past the
 * current input position of @p and convert it to CPU byte order.  The read
 * goes through get_unaligned().  @b is token-pasted, so it must be a literal
 * (16, 32 or 64 in this file).
 */
#define get_input_data(p, o, b)						\
	be##b##_to_cpu(get_unaligned((__be##b *)((p)->in + (o))))
1112da572c9SDan Streetman 
/* Reset the lookup state for value width @b (token-pasted: 8, 4 or 2):
 * initialize htable<b> and, for every entry of node<b>[], record its own
 * array position as its index, zero its data and initialize its list node.
 */
#define init_hashtable_nodes(p, b)	do {			\
	int _i;							\
	hash_init((p)->htable##b);				\
	for (_i = 0; _i < ARRAY_SIZE((p)->node##b); _i++) {	\
		(p)->node##b[_i].index = _i;			\
		(p)->node##b[_i].data = 0;			\
		INIT_HLIST_NODE(&(p)->node##b[_i].node);	\
	}							\
} while (0)
1212da572c9SDan Streetman 
/* Look up (p)->data<b>[n] in htable<b> and store the result in
 * (p)->index<b>[n]: the index of the first node holding an equal value, or
 * INDEX_NOT_FOUND.  Evaluates to true when a match was found.
 *
 * @b is token-pasted and must be a literal 8, 4 or 2.  @p is parenthesized
 * at every use, like in the other macros of this file, so that any pointer
 * expression may be passed.
 */
#define find_index(p, b, n)	({					\
	struct sw842_hlist_node##b *_n;					\
	(p)->index##b[n] = INDEX_NOT_FOUND;				\
	hash_for_each_possible((p)->htable##b, _n, node,		\
			       (p)->data##b[n]) {			\
		if ((p)->data##b[n] == _n->data) {			\
			(p)->index##b[n] = _n->index;			\
			break;						\
		}							\
	}								\
	(p)->index##b[n] >= 0;						\
})
1332da572c9SDan Streetman 
/* Lazy form of find_index(): the hashtable is only searched while
 * (p)->index<b>[n] is still INDEX_NOT_CHECKED; afterwards the stored result
 * is reused.  Evaluates to true when a matching index is available.
 */
#define check_index(p, b, n)			\
	((p)->index##b[n] == INDEX_NOT_CHECKED	\
	 ? find_index(p, b, n)			\
	 : (p)->index##b[n] >= 0)
1382da572c9SDan Streetman 
/* Make node<b>[i + d] remember the current value (p)->data<b>[d]: the node
 * is removed from the hashtable, given the new value and added back under
 * the new key.  Whatever value the node held before is no longer findable.
 * @b is token-pasted and must be a literal 8, 4 or 2.
 */
#define replace_hash(p, b, i, d)	do {				\
	struct sw842_hlist_node##b *_n = &(p)->node##b[(i)+(d)];	\
	hash_del(&_n->node);						\
	_n->data = (p)->data##b[d];					\
	pr_debug("add hash index%x %x pos %x data %lx\n", b,		\
		 (unsigned int)_n->index,				\
		 (unsigned int)((p)->in - (p)->instart),		\
		 (unsigned long)_n->data);				\
	hash_add((p)->htable##b, &_n->node, _n->data);			\
} while (0)
1492da572c9SDan Streetman 
1502da572c9SDan Streetman static u8 bmask[8] = { 0x00, 0x80, 0xc0, 0xe0, 0xf0, 0xf8, 0xfc, 0xfe };
1512da572c9SDan Streetman 
1522da572c9SDan Streetman static int add_bits(struct sw842_param *p, u64 d, u8 n);
1532da572c9SDan Streetman 
__split_add_bits(struct sw842_param * p,u64 d,u8 n,u8 s)1542da572c9SDan Streetman static int __split_add_bits(struct sw842_param *p, u64 d, u8 n, u8 s)
1552da572c9SDan Streetman {
1562da572c9SDan Streetman 	int ret;
1572da572c9SDan Streetman 
1582da572c9SDan Streetman 	if (n <= s)
1592da572c9SDan Streetman 		return -EINVAL;
1602da572c9SDan Streetman 
1612da572c9SDan Streetman 	ret = add_bits(p, d >> s, n - s);
1622da572c9SDan Streetman 	if (ret)
1632da572c9SDan Streetman 		return ret;
1642da572c9SDan Streetman 	return add_bits(p, d & GENMASK_ULL(s - 1, 0), s);
1652da572c9SDan Streetman }
1662da572c9SDan Streetman 
/* Append the low @n bits of @d to the output bit stream, most significant
 * bit first, and advance the output position of @p.
 *
 * Returns 0 on success, -EINVAL if @n is larger than 64, or -ENOSPC if the
 * output buffer cannot hold the bits.
 */
static int add_bits(struct sw842_param *p, u64 d, u8 n)
{
	int used = p->bit;		/* bits already taken in *p->out */
	int bits = used + n;		/* bits in use once d is appended */
	int shift = round_up(bits, 8) - bits; /* spare bits in the last byte */
	u8 *out = p->out;
	u64 keep;

	pr_debug("add %u bits %lx\n", (unsigned char)n, (unsigned long)d);

	if (n > 64)
		return -EINVAL;

	/* The stores below write 1, 2, 4 or 8 bytes.  Split the value when
	 * it would span more than 8 bytes (bits > 64), or when the store
	 * width is larger than the bytes actually needed and would run past
	 * the end of the output buffer.
	 */
	if (bits > 64)
		return __split_add_bits(p, d, n, 32);
	if (p->olen < 8 && bits > 32 && bits <= 56)
		return __split_add_bits(p, d, n, 16);
	if (p->olen < 4 && bits > 16 && bits <= 24)
		return __split_add_bits(p, d, n, 8);

	if (DIV_ROUND_UP(bits, 8) > p->olen)
		return -ENOSPC;

	/* keep what is already in the current byte, left-align the new bits */
	keep = *out & bmask[used];
	d <<= shift;

	/* pick the store by the number of output bytes touched */
	switch (DIV_ROUND_UP(bits, 8)) {
	case 0:
	case 1:
		*out = keep | d;
		break;
	case 2:
		put_unaligned(cpu_to_be16(keep << 8 | d), (__be16 *)out);
		break;
	case 3:
		put_unaligned(cpu_to_be32(keep << 24 | d << 8), (__be32 *)out);
		break;
	case 4:
		put_unaligned(cpu_to_be32(keep << 24 | d), (__be32 *)out);
		break;
	case 5:
		put_unaligned(cpu_to_be64(keep << 56 | d << 24), (__be64 *)out);
		break;
	case 6:
		put_unaligned(cpu_to_be64(keep << 56 | d << 16), (__be64 *)out);
		break;
	case 7:
		put_unaligned(cpu_to_be64(keep << 56 | d << 8), (__be64 *)out);
		break;
	default:
		put_unaligned(cpu_to_be64(keep << 56 | d), (__be64 *)out);
		break;
	}

	/* step over the bytes that are now full; keep the bit remainder */
	p->bit += n;
	if (p->bit >= 8) {
		u8 full = p->bit / 8;

		p->out += full;
		p->olen -= full;
		p->bit %= 8;
	}

	return 0;
}
2212da572c9SDan Streetman 
/* Emit template @c of comp_ops[] for the current 8 byte block: the template
 * opcode followed by one parameter per op, which is either an index found by
 * check_template() or literal data taken from the block.
 *
 * While walking the ops, b counts the bytes of the block described so far.
 * It is used to pick the matching indexN[]/dataN[] slot and to verify that
 * the row is well formed.
 *
 * Returns 0 on success, -EINVAL if @c is out of range or the row in
 * comp_ops[] is malformed, or the error returned by add_bits().
 */
static int add_template(struct sw842_param *p, u8 c)
{
	int ret, i, b = 0;
	u8 *t;
	bool inv = false;

	/* validate the row number before forming a pointer into the table */
	if (c >= OPS_MAX)
		return -EINVAL;

	t = comp_ops[c];

	pr_debug("template %x\n", t[4]);

	ret = add_bits(p, t[4], OP_BITS);
	if (ret)
		return ret;

	for (i = 0; i < 4; i++) {
		pr_debug("op %x\n", t[i]);

		switch (t[i] & OP_AMOUNT) {
		case OP_AMOUNT_8:
			if (b)
				inv = true;
			else if (t[i] & OP_ACTION_INDEX)
				ret = add_bits(p, p->index8[0], I8_BITS);
			else if (t[i] & OP_ACTION_DATA)
				ret = add_bits(p, p->data8[0], 64);
			else
				inv = true;
			break;
		case OP_AMOUNT_4:
			/* 4 data bytes at offset 2 have no data4[] slot, so
			 * they are read straight from the input
			 */
			if (b == 2 && t[i] & OP_ACTION_DATA)
				ret = add_bits(p, get_input_data(p, 2, 32), 32);
			else if (b != 0 && b != 4)
				inv = true;
			else if (t[i] & OP_ACTION_INDEX)
				ret = add_bits(p, p->index4[b >> 2], I4_BITS);
			else if (t[i] & OP_ACTION_DATA)
				ret = add_bits(p, p->data4[b >> 2], 32);
			else
				inv = true;
			break;
		case OP_AMOUNT_2:
			/* an invalid offset must not be used to index
			 * index2[]/data2[], nor emit any bits
			 */
			if (b != 0 && b != 2 && b != 4 && b != 6)
				inv = true;
			else if (t[i] & OP_ACTION_INDEX)
				ret = add_bits(p, p->index2[b >> 1], I2_BITS);
			else if (t[i] & OP_ACTION_DATA)
				ret = add_bits(p, p->data2[b >> 1], 16);
			else
				inv = true;
			break;
		case OP_AMOUNT_0:
			/* a no-op is only valid as filler after all 8 bytes */
			inv = (b != 8) || !(t[i] & OP_ACTION_NOOP);
			break;
		default:
			inv = true;
			break;
		}

		if (ret)
			return ret;

		if (inv) {
			pr_err("Invalid templ %x op %d : %x %x %x %x\n",
			       c, i, t[0], t[1], t[2], t[3]);
			return -EINVAL;
		}

		b += t[i] & OP_AMOUNT;
	}

	if (b != 8) {
		pr_err("Invalid template %x len %x : %x %x %x %x\n",
		       c, b, t[0], t[1], t[2], t[3]);
		return -EINVAL;
	}

	if (sw842_template_counts)
		atomic_inc(&template_count[t[4]]);

	return 0;
}
3042da572c9SDan Streetman 
/* Emit a repeat template.  @r is the 1-based repeat count as counted by the
 * caller; the stream stores it 0-based in REPEAT_BITS bits.
 *
 * Returns 0 on success, -EINVAL if @r is 0 or too large, or the error
 * returned by add_bits().
 */
static int add_repeat_template(struct sw842_param *p, u8 r)
{
	int err;

	if (r == 0)
		return -EINVAL;

	/* repeat param is 0-based */
	r--;
	if (r > REPEAT_BITS_MAX)
		return -EINVAL;

	err = add_bits(p, OP_REPEAT, OP_BITS);
	if (!err)
		err = add_bits(p, r, REPEAT_BITS);
	if (err)
		return err;

	if (sw842_template_counts)
		atomic_inc(&template_repeat_count);

	return 0;
}
3262da572c9SDan Streetman 
/* Emit a short data template: the opcode, the byte count @b and then @b
 * literal bytes taken from the current input position.
 *
 * Returns 0 on success, -EINVAL if @b is 0 or above SHORT_DATA_BITS_MAX, or
 * the error returned by add_bits().
 */
static int add_short_data_template(struct sw842_param *p, u8 b)
{
	const u8 *byte, *stop;
	int err;

	if (b == 0 || b > SHORT_DATA_BITS_MAX)
		return -EINVAL;

	err = add_bits(p, OP_SHORT_DATA, OP_BITS);
	if (err)
		return err;

	err = add_bits(p, b, SHORT_DATA_BITS);
	if (err)
		return err;

	/* add_bits() only moves the output position, so p->in stays put */
	stop = p->in + b;
	for (byte = p->in; byte < stop; byte++) {
		err = add_bits(p, *byte, 8);
		if (err)
			return err;
	}

	if (sw842_template_counts)
		atomic_inc(&template_short_data_count);

	return 0;
}
3532da572c9SDan Streetman 
add_zeros_template(struct sw842_param * p)3542da572c9SDan Streetman static int add_zeros_template(struct sw842_param *p)
3552da572c9SDan Streetman {
3562da572c9SDan Streetman 	int ret = add_bits(p, OP_ZEROS, OP_BITS);
3572da572c9SDan Streetman 
3582da572c9SDan Streetman 	if (ret)
3592da572c9SDan Streetman 		return ret;
3602da572c9SDan Streetman 
3612da572c9SDan Streetman 	if (sw842_template_counts)
3622da572c9SDan Streetman 		atomic_inc(&template_zeros_count);
3632da572c9SDan Streetman 
3642da572c9SDan Streetman 	return 0;
3652da572c9SDan Streetman }
3662da572c9SDan Streetman 
add_end_template(struct sw842_param * p)3672da572c9SDan Streetman static int add_end_template(struct sw842_param *p)
3682da572c9SDan Streetman {
3692da572c9SDan Streetman 	int ret = add_bits(p, OP_END, OP_BITS);
3702da572c9SDan Streetman 
3712da572c9SDan Streetman 	if (ret)
3722da572c9SDan Streetman 		return ret;
3732da572c9SDan Streetman 
3742da572c9SDan Streetman 	if (sw842_template_counts)
3752da572c9SDan Streetman 		atomic_inc(&template_end_count);
3762da572c9SDan Streetman 
3772da572c9SDan Streetman 	return 0;
3782da572c9SDan Streetman }
3792da572c9SDan Streetman 
check_template(struct sw842_param * p,u8 c)3802da572c9SDan Streetman static bool check_template(struct sw842_param *p, u8 c)
3812da572c9SDan Streetman {
3822da572c9SDan Streetman 	u8 *t = comp_ops[c];
3832da572c9SDan Streetman 	int i, match, b = 0;
3842da572c9SDan Streetman 
3852da572c9SDan Streetman 	if (c >= OPS_MAX)
3862da572c9SDan Streetman 		return false;
3872da572c9SDan Streetman 
3882da572c9SDan Streetman 	for (i = 0; i < 4; i++) {
3892da572c9SDan Streetman 		if (t[i] & OP_ACTION_INDEX) {
3902da572c9SDan Streetman 			if (t[i] & OP_AMOUNT_2)
3912da572c9SDan Streetman 				match = check_index(p, 2, b >> 1);
3922da572c9SDan Streetman 			else if (t[i] & OP_AMOUNT_4)
3932da572c9SDan Streetman 				match = check_index(p, 4, b >> 2);
3942da572c9SDan Streetman 			else if (t[i] & OP_AMOUNT_8)
3952da572c9SDan Streetman 				match = check_index(p, 8, 0);
3962da572c9SDan Streetman 			else
3972da572c9SDan Streetman 				return false;
3982da572c9SDan Streetman 			if (!match)
3992da572c9SDan Streetman 				return false;
4002da572c9SDan Streetman 		}
4012da572c9SDan Streetman 
4022da572c9SDan Streetman 		b += t[i] & OP_AMOUNT;
4032da572c9SDan Streetman 	}
4042da572c9SDan Streetman 
4052da572c9SDan Streetman 	return true;
4062da572c9SDan Streetman }
4072da572c9SDan Streetman 
get_next_data(struct sw842_param * p)4082da572c9SDan Streetman static void get_next_data(struct sw842_param *p)
4092da572c9SDan Streetman {
4102da572c9SDan Streetman 	p->data8[0] = get_input_data(p, 0, 64);
4112da572c9SDan Streetman 	p->data4[0] = get_input_data(p, 0, 32);
4122da572c9SDan Streetman 	p->data4[1] = get_input_data(p, 4, 32);
4132da572c9SDan Streetman 	p->data2[0] = get_input_data(p, 0, 16);
4142da572c9SDan Streetman 	p->data2[1] = get_input_data(p, 2, 16);
4152da572c9SDan Streetman 	p->data2[2] = get_input_data(p, 4, 16);
4162da572c9SDan Streetman 	p->data2[3] = get_input_data(p, 6, 16);
4172da572c9SDan Streetman }
4182da572c9SDan Streetman 
4192da572c9SDan Streetman /* update the hashtable entries.
4202da572c9SDan Streetman  * only call this after finding/adding the current template
4212da572c9SDan Streetman  * the dataN fields for the current 8 byte block must be already updated
4222da572c9SDan Streetman  */
update_hashtables(struct sw842_param * p)4232da572c9SDan Streetman static void update_hashtables(struct sw842_param *p)
4242da572c9SDan Streetman {
4252da572c9SDan Streetman 	u64 pos = p->in - p->instart;
4262da572c9SDan Streetman 	u64 n8 = (pos >> 3) % (1 << I8_BITS);
4272da572c9SDan Streetman 	u64 n4 = (pos >> 2) % (1 << I4_BITS);
4282da572c9SDan Streetman 	u64 n2 = (pos >> 1) % (1 << I2_BITS);
4292da572c9SDan Streetman 
4302da572c9SDan Streetman 	replace_hash(p, 8, n8, 0);
4312da572c9SDan Streetman 	replace_hash(p, 4, n4, 0);
4322da572c9SDan Streetman 	replace_hash(p, 4, n4, 1);
4332da572c9SDan Streetman 	replace_hash(p, 2, n2, 0);
4342da572c9SDan Streetman 	replace_hash(p, 2, n2, 1);
4352da572c9SDan Streetman 	replace_hash(p, 2, n2, 2);
4362da572c9SDan Streetman 	replace_hash(p, 2, n2, 3);
4372da572c9SDan Streetman }
4382da572c9SDan Streetman 
4392da572c9SDan Streetman /* find the next template to use, and add it
4402da572c9SDan Streetman  * the p->dataN fields must already be set for the current 8 byte block
4412da572c9SDan Streetman  */
process_next(struct sw842_param * p)4422da572c9SDan Streetman static int process_next(struct sw842_param *p)
4432da572c9SDan Streetman {
4442da572c9SDan Streetman 	int ret, i;
4452da572c9SDan Streetman 
4462da572c9SDan Streetman 	p->index8[0] = INDEX_NOT_CHECKED;
4472da572c9SDan Streetman 	p->index4[0] = INDEX_NOT_CHECKED;
4482da572c9SDan Streetman 	p->index4[1] = INDEX_NOT_CHECKED;
4492da572c9SDan Streetman 	p->index2[0] = INDEX_NOT_CHECKED;
4502da572c9SDan Streetman 	p->index2[1] = INDEX_NOT_CHECKED;
4512da572c9SDan Streetman 	p->index2[2] = INDEX_NOT_CHECKED;
4522da572c9SDan Streetman 	p->index2[3] = INDEX_NOT_CHECKED;
4532da572c9SDan Streetman 
4542da572c9SDan Streetman 	/* check up to OPS_MAX - 1; last op is our fallback */
4552da572c9SDan Streetman 	for (i = 0; i < OPS_MAX - 1; i++) {
4562da572c9SDan Streetman 		if (check_template(p, i))
4572da572c9SDan Streetman 			break;
4582da572c9SDan Streetman 	}
4592da572c9SDan Streetman 
4602da572c9SDan Streetman 	ret = add_template(p, i);
4612da572c9SDan Streetman 	if (ret)
4622da572c9SDan Streetman 		return ret;
4632da572c9SDan Streetman 
4642da572c9SDan Streetman 	return 0;
4652da572c9SDan Streetman }
4662da572c9SDan Streetman 
4672da572c9SDan Streetman /**
4682da572c9SDan Streetman  * sw842_compress
4692da572c9SDan Streetman  *
4702da572c9SDan Streetman  * Compress the uncompressed buffer of length @ilen at @in to the output buffer
4712da572c9SDan Streetman  * @out, using no more than @olen bytes, using the 842 compression format.
4722da572c9SDan Streetman  *
4732da572c9SDan Streetman  * Returns: 0 on success, error on failure.  The @olen parameter
4742da572c9SDan Streetman  * will contain the number of output bytes written on success, or
4752da572c9SDan Streetman  * 0 on error.
4762da572c9SDan Streetman  */
sw842_compress(const u8 * in,unsigned int ilen,u8 * out,unsigned int * olen,void * wmem)4772da572c9SDan Streetman int sw842_compress(const u8 *in, unsigned int ilen,
4782da572c9SDan Streetman 		   u8 *out, unsigned int *olen, void *wmem)
4792da572c9SDan Streetman {
4802da572c9SDan Streetman 	struct sw842_param *p = (struct sw842_param *)wmem;
4812da572c9SDan Streetman 	int ret;
4822da572c9SDan Streetman 	u64 last, next, pad, total;
4832da572c9SDan Streetman 	u8 repeat_count = 0;
484ea0b3984SHaren Myneni 	u32 crc;
4852da572c9SDan Streetman 
4862da572c9SDan Streetman 	BUILD_BUG_ON(sizeof(*p) > SW842_MEM_COMPRESS);
4872da572c9SDan Streetman 
4882da572c9SDan Streetman 	init_hashtable_nodes(p, 8);
4892da572c9SDan Streetman 	init_hashtable_nodes(p, 4);
4902da572c9SDan Streetman 	init_hashtable_nodes(p, 2);
4912da572c9SDan Streetman 
4922da572c9SDan Streetman 	p->in = (u8 *)in;
4932da572c9SDan Streetman 	p->instart = p->in;
4942da572c9SDan Streetman 	p->ilen = ilen;
4952da572c9SDan Streetman 	p->out = out;
4962da572c9SDan Streetman 	p->olen = *olen;
4972da572c9SDan Streetman 	p->bit = 0;
4982da572c9SDan Streetman 
4992da572c9SDan Streetman 	total = p->olen;
5002da572c9SDan Streetman 
5012da572c9SDan Streetman 	*olen = 0;
5022da572c9SDan Streetman 
5032da572c9SDan Streetman 	/* if using strict mode, we can only compress a multiple of 8 */
5042da572c9SDan Streetman 	if (sw842_strict && (ilen % 8)) {
5052da572c9SDan Streetman 		pr_err("Using strict mode, can't compress len %d\n", ilen);
5062da572c9SDan Streetman 		return -EINVAL;
5072da572c9SDan Streetman 	}
5082da572c9SDan Streetman 
5092da572c9SDan Streetman 	/* let's compress at least 8 bytes, mkay? */
5102da572c9SDan Streetman 	if (unlikely(ilen < 8))
5112da572c9SDan Streetman 		goto skip_comp;
5122da572c9SDan Streetman 
5132da572c9SDan Streetman 	/* make initial 'last' different so we don't match the first time */
5142da572c9SDan Streetman 	last = ~get_unaligned((u64 *)p->in);
5152da572c9SDan Streetman 
5162da572c9SDan Streetman 	while (p->ilen > 7) {
5172da572c9SDan Streetman 		next = get_unaligned((u64 *)p->in);
5182da572c9SDan Streetman 
5192da572c9SDan Streetman 		/* must get the next data, as we need to update the hashtable
5202da572c9SDan Streetman 		 * entries with the new data every time
5212da572c9SDan Streetman 		 */
5222da572c9SDan Streetman 		get_next_data(p);
5232da572c9SDan Streetman 
5242da572c9SDan Streetman 		/* we don't care about endianness in last or next;
5252da572c9SDan Streetman 		 * we're just comparing 8 bytes to another 8 bytes,
5262da572c9SDan Streetman 		 * they're both the same endianness
5272da572c9SDan Streetman 		 */
5282da572c9SDan Streetman 		if (next == last) {
5292da572c9SDan Streetman 			/* repeat count bits are 0-based, so we stop at +1 */
5302da572c9SDan Streetman 			if (++repeat_count <= REPEAT_BITS_MAX)
5312da572c9SDan Streetman 				goto repeat;
5322da572c9SDan Streetman 		}
5332da572c9SDan Streetman 		if (repeat_count) {
5342da572c9SDan Streetman 			ret = add_repeat_template(p, repeat_count);
5352da572c9SDan Streetman 			repeat_count = 0;
5362da572c9SDan Streetman 			if (next == last) /* reached max repeat bits */
5372da572c9SDan Streetman 				goto repeat;
5382da572c9SDan Streetman 		}
5392da572c9SDan Streetman 
5402da572c9SDan Streetman 		if (next == 0)
5412da572c9SDan Streetman 			ret = add_zeros_template(p);
5422da572c9SDan Streetman 		else
5432da572c9SDan Streetman 			ret = process_next(p);
5442da572c9SDan Streetman 
5452da572c9SDan Streetman 		if (ret)
5462da572c9SDan Streetman 			return ret;
5472da572c9SDan Streetman 
5482da572c9SDan Streetman repeat:
5492da572c9SDan Streetman 		last = next;
5502da572c9SDan Streetman 		update_hashtables(p);
5512da572c9SDan Streetman 		p->in += 8;
5522da572c9SDan Streetman 		p->ilen -= 8;
5532da572c9SDan Streetman 	}
5542da572c9SDan Streetman 
5552da572c9SDan Streetman 	if (repeat_count) {
5562da572c9SDan Streetman 		ret = add_repeat_template(p, repeat_count);
5572da572c9SDan Streetman 		if (ret)
5582da572c9SDan Streetman 			return ret;
5592da572c9SDan Streetman 	}
5602da572c9SDan Streetman 
5612da572c9SDan Streetman skip_comp:
5622da572c9SDan Streetman 	if (p->ilen > 0) {
5632da572c9SDan Streetman 		ret = add_short_data_template(p, p->ilen);
5642da572c9SDan Streetman 		if (ret)
5652da572c9SDan Streetman 			return ret;
5662da572c9SDan Streetman 
5672da572c9SDan Streetman 		p->in += p->ilen;
5682da572c9SDan Streetman 		p->ilen = 0;
5692da572c9SDan Streetman 	}
5702da572c9SDan Streetman 
5712da572c9SDan Streetman 	ret = add_end_template(p);
5722da572c9SDan Streetman 	if (ret)
5732da572c9SDan Streetman 		return ret;
5742da572c9SDan Streetman 
575ea0b3984SHaren Myneni 	/*
576ea0b3984SHaren Myneni 	 * crc(0:31) is appended to target data starting with the next
577ea0b3984SHaren Myneni 	 * bit after End of stream template.
578ea0b3984SHaren Myneni 	 * nx842 calculates CRC for data in big-endian format. So doing
579ea0b3984SHaren Myneni 	 * same here so that sw842 decompression can be used for both
580ea0b3984SHaren Myneni 	 * compressed data.
581ea0b3984SHaren Myneni 	 */
582ea0b3984SHaren Myneni 	crc = crc32_be(0, in, ilen);
583ea0b3984SHaren Myneni 	ret = add_bits(p, crc, CRC_BITS);
584ea0b3984SHaren Myneni 	if (ret)
585ea0b3984SHaren Myneni 		return ret;
586ea0b3984SHaren Myneni 
5872da572c9SDan Streetman 	if (p->bit) {
5882da572c9SDan Streetman 		p->out++;
5892da572c9SDan Streetman 		p->olen--;
5902da572c9SDan Streetman 		p->bit = 0;
5912da572c9SDan Streetman 	}
5922da572c9SDan Streetman 
5932da572c9SDan Streetman 	/* pad compressed length to multiple of 8 */
5942da572c9SDan Streetman 	pad = (8 - ((total - p->olen) % 8)) % 8;
5952da572c9SDan Streetman 	if (pad) {
5962da572c9SDan Streetman 		if (pad > p->olen) /* we were so close! */
5972da572c9SDan Streetman 			return -ENOSPC;
5982da572c9SDan Streetman 		memset(p->out, 0, pad);
5992da572c9SDan Streetman 		p->out += pad;
6002da572c9SDan Streetman 		p->olen -= pad;
6012da572c9SDan Streetman 	}
6022da572c9SDan Streetman 
6032da572c9SDan Streetman 	if (unlikely((total - p->olen) > UINT_MAX))
6042da572c9SDan Streetman 		return -ENOSPC;
6052da572c9SDan Streetman 
6062da572c9SDan Streetman 	*olen = total - p->olen;
6072da572c9SDan Streetman 
6082da572c9SDan Streetman 	return 0;
6092da572c9SDan Streetman }
6102da572c9SDan Streetman EXPORT_SYMBOL_GPL(sw842_compress);
6112da572c9SDan Streetman 
sw842_init(void)6122da572c9SDan Streetman static int __init sw842_init(void)
6132da572c9SDan Streetman {
6142da572c9SDan Streetman 	if (sw842_template_counts)
6152da572c9SDan Streetman 		sw842_debugfs_create();
6162da572c9SDan Streetman 
6172da572c9SDan Streetman 	return 0;
6182da572c9SDan Streetman }
6192da572c9SDan Streetman module_init(sw842_init);
6202da572c9SDan Streetman 
sw842_exit(void)6212da572c9SDan Streetman static void __exit sw842_exit(void)
6222da572c9SDan Streetman {
6232da572c9SDan Streetman 	if (sw842_template_counts)
6242da572c9SDan Streetman 		sw842_debugfs_remove();
6252da572c9SDan Streetman }
6262da572c9SDan Streetman module_exit(sw842_exit);
6272da572c9SDan Streetman 
6282da572c9SDan Streetman MODULE_LICENSE("GPL");
6292da572c9SDan Streetman MODULE_DESCRIPTION("Software 842 Compressor");
6302da572c9SDan Streetman MODULE_AUTHOR("Dan Streetman <ddstreet@ieee.org>");
631