xref: /linux/drivers/md/bcache/util.c (revision 47344e330eabc1515cbe6061eb337100a3ab6d37)
1 /*
 * random utility code, for bcache but in theory not specific to bcache
3  *
4  * Copyright 2010, 2011 Kent Overstreet <kent.overstreet@gmail.com>
5  * Copyright 2012 Google, Inc.
6  */
7 
8 #include <linux/bio.h>
9 #include <linux/blkdev.h>
10 #include <linux/ctype.h>
11 #include <linux/debugfs.h>
12 #include <linux/module.h>
13 #include <linux/seq_file.h>
14 #include <linux/types.h>
15 #include <linux/sched/clock.h>
16 
17 #include "util.h"
18 
/*
 * Aliases so that STRTO_H() can build the name of the underlying parser by
 * pasting "simple_" in front of the "strtoint"/"strtouint" tokens it is
 * instantiated with.
 */
#define simple_strtoint(c, end, base)	simple_strtol(c, end, base)
#define simple_strtouint(c, end, base)	simple_strtoul(c, end, base)

/*
 * STRTO_H(name, type) - define bch_<name>_h(), which parses a base-10 integer
 * of @type that may carry a human readable size suffix.
 *
 * The generated function:
 *   - parses @cp with simple_<name>() and inspects the first character after
 *     the number, case-insensitively;
 *   - counts one multiplication by 1024 for 'k', two for 'm', and so on up to
 *     six for 'e'; 'z' and 'y' share a case label and both select seven;
 *   - rejects a suffix that is not preceded by any parsed character
 *     (the "e++ == cp" test);
 *   - accepts one trailing newline and rejects any other trailing text;
 *   - range-checks the value before every multiplication by 1024 and fails
 *     rather than overflowing.
 *
 * Returns 0 and stores the value in *@res on success, -EINVAL on any error.
 *
 * NOTE(review): ANYSINT_MAX() is defined outside this file; the second range
 * check is applied to unsigned types as well, which looks like it limits them
 * to the signed range - confirm against its definition.
 * NOTE(review): input with neither digits nor suffix only reaches the
 * '\n' / '\0' labels, so it appears to be accepted - confirm against the
 * behaviour of simple_strto*() on such input.
 */
#define STRTO_H(name, type)					\
int bch_ ## name ## _h(const char *cp, type *res)		\
{								\
	int u = 0;						\
	char *e;						\
	type i = simple_ ## name(cp, &e, 10);			\
								\
	switch (tolower(*e)) {					\
	default:						\
		return -EINVAL;					\
	case 'y':						\
	case 'z':						\
		u++;						\
		/* fall through */				\
	case 'e':						\
		u++;						\
		/* fall through */				\
	case 'p':						\
		u++;						\
		/* fall through */				\
	case 't':						\
		u++;						\
		/* fall through */				\
	case 'g':						\
		u++;						\
		/* fall through */				\
	case 'm':						\
		u++;						\
		/* fall through */				\
	case 'k':						\
		u++;						\
		if (e++ == cp)					\
			return -EINVAL;				\
		/* fall through */				\
	case '\n':						\
	case '\0':						\
		if (*e == '\n')					\
			e++;					\
	}							\
								\
	if (*e)							\
		return -EINVAL;					\
								\
	while (u--) {						\
		if ((type) ~0 > 0 &&				\
		    (type) ~0 / 1024 <= i)			\
			return -EINVAL;				\
		if ((i > 0 && ANYSINT_MAX(type) / 1024 < i) ||	\
		    (i < 0 && -ANYSINT_MAX(type) / 1024 > i))	\
			return -EINVAL;				\
		i *= 1024;					\
	}							\
								\
	*res = i;						\
	return 0;						\
}								\

/* Instantiate bch_strtoint_h(), bch_strtouint_h(), bch_strtoll_h() and bch_strtoull_h(). */
STRTO_H(strtoint, int)
STRTO_H(strtouint, unsigned int)
STRTO_H(strtoll, long long)
STRTO_H(strtoull, unsigned long long)
83 
/**
 * bch_hprint - formats @v to human readable string for sysfs.
 * @buf: the (at least 8 byte) buffer to format the result into.
 * @v: signed 64 bit integer
 *
 * The magnitude of @v is divided by 1024 at least once, and then again for as
 * long as the quotient still has more than three digits.  The remainder of the
 * last division supplies a single digit after the decimal point, and the
 * number of divisions selects the unit character (k, M, G, ...).
 *
 * The longest output is '-', three digits, '.', one digit, one unit character
 * and the terminating null, i.e. 8 bytes.
 *
 * Returns the number of bytes used by format.
 */
ssize_t bch_hprint(char *buf, int64_t v)
{
	static const char units[] = "?kMGTPEZY";
	/*
	 * Take the magnitude in unsigned arithmetic: negating the most
	 * negative int64_t as a signed value would overflow.
	 */
	uint64_t q = v < 0 ? 0 - (uint64_t) v : (uint64_t) v;
	unsigned int rem;
	int u = 0;

	do {
		u++;

		/* Low ten bits are the remainder of the division by 1024. */
		rem = q & 1023;
		q >>= 10;
	} while (q >= 1000);

	return sprintf(buf, "%s%llu.%u%c", v < 0 ? "-" : "",
		       (unsigned long long) q, rem * 10 / 1024, units[u]);
}
122 
123 ssize_t bch_snprint_string_list(char *buf, size_t size, const char * const list[],
124 			    size_t selected)
125 {
126 	char *out = buf;
127 	size_t i;
128 
129 	for (i = 0; list[i]; i++)
130 		out += snprintf(out, buf + size - out,
131 				i == selected ? "[%s] " : "%s ", list[i]);
132 
133 	out[-1] = '\n';
134 	return out - buf;
135 }
136 
137 ssize_t bch_read_string_list(const char *buf, const char * const list[])
138 {
139 	size_t i;
140 	char *s, *d = kstrndup(buf, PAGE_SIZE - 1, GFP_KERNEL);
141 	if (!d)
142 		return -ENOMEM;
143 
144 	s = strim(d);
145 
146 	for (i = 0; list[i]; i++)
147 		if (!strcmp(list[i], s))
148 			break;
149 
150 	kfree(d);
151 
152 	if (!list[i])
153 		return -EINVAL;
154 
155 	return i;
156 }
157 
/*
 * Returns true if the first @n bytes at @p are all zero (trivially true for
 * @n == 0), false as soon as a non-zero byte is found.
 */
bool bch_is_zero(const char *p, size_t n)
{
	while (n--) {
		if (*p++)
			return false;
	}

	return true;
}
167 
/*
 * Parse a textual UUID into 16 raw bytes.
 *
 * @s:    string to parse; hex digits may be interleaved with '-' and ':'
 *        separators, which are skipped.
 * @uuid: 16 byte output buffer; zeroed first, then filled two hex digits per
 *        byte, high nibble first.
 *
 * Parsing stops at the first character that is neither a hex digit nor a
 * separator, or once 32 hex digits have been consumed.  If fewer than 32
 * digits are present the remaining bytes of @uuid stay zero.
 *
 * Returns the number of characters of @s that were consumed.
 */
int bch_parse_uuid(const char *s, char *uuid)
{
	/* Length of the leading run of acceptable characters, computed once. */
	const size_t span = strspn(s, "-0123456789:ABCDEFabcdef");
	size_t i, j;

	memset(uuid, 0, 16);

	for (i = 0, j = 0; i < span && j < 32; i++) {
		/*
		 * Setting bit 5 folds 'A'-'F' onto 'a'-'f'; digits and both
		 * separators already have it set and are left unchanged.
		 */
		unsigned int c = s[i] | 32;
		unsigned int nibble;

		if (c >= '0' && c <= '9')
			nibble = c - '0';
		else if (c >= 'a' && c <= 'f')
			nibble = c - 'a' + 10;
		else
			continue;	/* separator */

		/* Even digit positions fill the high nibble of the byte. */
		if (!(j & 1))
			nibble <<= 4;
		uuid[j++ >> 1] |= nibble;
	}
	return i;
}
195 
196 void bch_time_stats_update(struct time_stats *stats, uint64_t start_time)
197 {
198 	uint64_t now, duration, last;
199 
200 	spin_lock(&stats->lock);
201 
202 	now		= local_clock();
203 	duration	= time_after64(now, start_time)
204 		? now - start_time : 0;
205 	last		= time_after64(now, stats->last)
206 		? now - stats->last : 0;
207 
208 	stats->max_duration = max(stats->max_duration, duration);
209 
210 	if (stats->last) {
211 		ewma_add(stats->average_duration, duration, 8, 8);
212 
213 		if (stats->average_frequency)
214 			ewma_add(stats->average_frequency, last, 8, 8);
215 		else
216 			stats->average_frequency  = last << 8;
217 	} else {
218 		stats->average_duration  = duration << 8;
219 	}
220 
221 	stats->last = now ?: 1;
222 
223 	spin_unlock(&stats->lock);
224 }
225 
226 /**
227  * bch_next_delay() - update ratelimiting statistics and calculate next delay
228  * @d: the struct bch_ratelimit to update
229  * @done: the amount of work done, in arbitrary units
230  *
231  * Increment @d by the amount of work done, and return how long to delay in
232  * jiffies until the next time to do some work.
233  */
234 uint64_t bch_next_delay(struct bch_ratelimit *d, uint64_t done)
235 {
236 	uint64_t now = local_clock();
237 
238 	d->next += div_u64(done * NSEC_PER_SEC, d->rate);
239 
240 	/* Bound the time.  Don't let us fall further than 2 seconds behind
241 	 * (this prevents unnecessary backlog that would make it impossible
242 	 * to catch up).  If we're ahead of the desired writeback rate,
243 	 * don't let us sleep more than 2.5 seconds (so we can notice/respond
244 	 * if the control system tells us to speed up!).
245 	 */
246 	if (time_before64(now + NSEC_PER_SEC * 5LLU / 2LLU, d->next))
247 		d->next = now + NSEC_PER_SEC * 5LLU / 2LLU;
248 
249 	if (time_after64(now - NSEC_PER_SEC * 2, d->next))
250 		d->next = now - NSEC_PER_SEC * 2;
251 
252 	return time_after64(d->next, now)
253 		? div_u64(d->next - now, NSEC_PER_SEC / HZ)
254 		: 0;
255 }
256 
257 /*
258  * Generally it isn't good to access .bi_io_vec and .bi_vcnt directly,
259  * the preferred way is bio_add_page, but in this case, bch_bio_map()
260  * supposes that the bvec table is empty, so it is safe to access
261  * .bi_vcnt & .bi_io_vec in this way even after multipage bvec is
262  * supported.
263  */
264 void bch_bio_map(struct bio *bio, void *base)
265 {
266 	size_t size = bio->bi_iter.bi_size;
267 	struct bio_vec *bv = bio->bi_io_vec;
268 
269 	BUG_ON(!bio->bi_iter.bi_size);
270 	BUG_ON(bio->bi_vcnt);
271 
272 	bv->bv_offset = base ? offset_in_page(base) : 0;
273 	goto start;
274 
275 	for (; size; bio->bi_vcnt++, bv++) {
276 		bv->bv_offset	= 0;
277 start:		bv->bv_len	= min_t(size_t, PAGE_SIZE - bv->bv_offset,
278 					size);
279 		if (base) {
280 			bv->bv_page = is_vmalloc_addr(base)
281 				? vmalloc_to_page(base)
282 				: virt_to_page(base);
283 
284 			base += bv->bv_len;
285 		}
286 
287 		size -= bv->bv_len;
288 	}
289 }
290 
291 /**
292  * bch_bio_alloc_pages - allocates a single page for each bvec in a bio
293  * @bio: bio to allocate pages for
294  * @gfp_mask: flags for allocation
295  *
296  * Allocates pages up to @bio->bi_vcnt.
297  *
298  * Returns 0 on success, -ENOMEM on failure. On failure, any allocated pages are
299  * freed.
300  */
301 int bch_bio_alloc_pages(struct bio *bio, gfp_t gfp_mask)
302 {
303 	int i;
304 	struct bio_vec *bv;
305 
306 	bio_for_each_segment_all(bv, bio, i) {
307 		bv->bv_page = alloc_page(gfp_mask);
308 		if (!bv->bv_page) {
309 			while (--bv >= bio->bi_io_vec)
310 				__free_page(bv->bv_page);
311 			return -ENOMEM;
312 		}
313 	}
314 
315 	return 0;
316 }
317 
/*
 * Portions Copyright (c) 1996-2001, PostgreSQL Global Development Group (Any
 * use permitted, subject to terms of PostgreSQL license; see.)
 *
 * If we have a 64-bit integer type, then a 64-bit CRC looks just like the
 * usual sort of implementation. (See Ross Williams' excellent introduction
 * A PAINLESS GUIDE TO CRC ERROR DETECTION ALGORITHMS, available from
 * ftp://ftp.rocksoft.com/papers/crc_v3.txt or several other net sites.)
 * If we have no working 64-bit type, then fake it with two 32-bit registers.
 *
 * The present implementation is a normal (not "reflected", in Williams'
 * terms) 64-bit CRC, using initial all-ones register contents and a final
 * bit inversion. The chosen polynomial is borrowed from the DLT1 spec
 * (ECMA-182, available from http://www.ecma.ch/ecma1/STAND/ECMA-182.HTM):
 *
 * x^64 + x^62 + x^57 + x^55 + x^54 + x^53 + x^52 + x^47 + x^46 + x^45 +
 * x^40 + x^39 + x^38 + x^37 + x^35 + x^33 + x^32 + x^31 + x^29 + x^27 +
 * x^24 + x^23 + x^22 + x^21 + x^19 + x^17 + x^13 + x^12 + x^10 + x^9 +
 * x^7 + x^4 + x + 1
 */

/*
 * Lookup table for processing one input byte at a time: bch_crc64_update()
 * indexes it with the top byte of the CRC register XORed with the next data
 * byte.  Entry 1 is the polynomial above with the x^64 term left implicit.
 */
static const uint64_t crc_table[256] = {
	0x0000000000000000ULL, 0x42F0E1EBA9EA3693ULL, 0x85E1C3D753D46D26ULL,
	0xC711223CFA3E5BB5ULL, 0x493366450E42ECDFULL, 0x0BC387AEA7A8DA4CULL,
	0xCCD2A5925D9681F9ULL, 0x8E224479F47CB76AULL, 0x9266CC8A1C85D9BEULL,
	0xD0962D61B56FEF2DULL, 0x17870F5D4F51B498ULL, 0x5577EEB6E6BB820BULL,
	0xDB55AACF12C73561ULL, 0x99A54B24BB2D03F2ULL, 0x5EB4691841135847ULL,
	0x1C4488F3E8F96ED4ULL, 0x663D78FF90E185EFULL, 0x24CD9914390BB37CULL,
	0xE3DCBB28C335E8C9ULL, 0xA12C5AC36ADFDE5AULL, 0x2F0E1EBA9EA36930ULL,
	0x6DFEFF5137495FA3ULL, 0xAAEFDD6DCD770416ULL, 0xE81F3C86649D3285ULL,
	0xF45BB4758C645C51ULL, 0xB6AB559E258E6AC2ULL, 0x71BA77A2DFB03177ULL,
	0x334A9649765A07E4ULL, 0xBD68D2308226B08EULL, 0xFF9833DB2BCC861DULL,
	0x388911E7D1F2DDA8ULL, 0x7A79F00C7818EB3BULL, 0xCC7AF1FF21C30BDEULL,
	0x8E8A101488293D4DULL, 0x499B3228721766F8ULL, 0x0B6BD3C3DBFD506BULL,
	0x854997BA2F81E701ULL, 0xC7B97651866BD192ULL, 0x00A8546D7C558A27ULL,
	0x4258B586D5BFBCB4ULL, 0x5E1C3D753D46D260ULL, 0x1CECDC9E94ACE4F3ULL,
	0xDBFDFEA26E92BF46ULL, 0x990D1F49C77889D5ULL, 0x172F5B3033043EBFULL,
	0x55DFBADB9AEE082CULL, 0x92CE98E760D05399ULL, 0xD03E790CC93A650AULL,
	0xAA478900B1228E31ULL, 0xE8B768EB18C8B8A2ULL, 0x2FA64AD7E2F6E317ULL,
	0x6D56AB3C4B1CD584ULL, 0xE374EF45BF6062EEULL, 0xA1840EAE168A547DULL,
	0x66952C92ECB40FC8ULL, 0x2465CD79455E395BULL, 0x3821458AADA7578FULL,
	0x7AD1A461044D611CULL, 0xBDC0865DFE733AA9ULL, 0xFF3067B657990C3AULL,
	0x711223CFA3E5BB50ULL, 0x33E2C2240A0F8DC3ULL, 0xF4F3E018F031D676ULL,
	0xB60301F359DBE0E5ULL, 0xDA050215EA6C212FULL, 0x98F5E3FE438617BCULL,
	0x5FE4C1C2B9B84C09ULL, 0x1D14202910527A9AULL, 0x93366450E42ECDF0ULL,
	0xD1C685BB4DC4FB63ULL, 0x16D7A787B7FAA0D6ULL, 0x5427466C1E109645ULL,
	0x4863CE9FF6E9F891ULL, 0x0A932F745F03CE02ULL, 0xCD820D48A53D95B7ULL,
	0x8F72ECA30CD7A324ULL, 0x0150A8DAF8AB144EULL, 0x43A04931514122DDULL,
	0x84B16B0DAB7F7968ULL, 0xC6418AE602954FFBULL, 0xBC387AEA7A8DA4C0ULL,
	0xFEC89B01D3679253ULL, 0x39D9B93D2959C9E6ULL, 0x7B2958D680B3FF75ULL,
	0xF50B1CAF74CF481FULL, 0xB7FBFD44DD257E8CULL, 0x70EADF78271B2539ULL,
	0x321A3E938EF113AAULL, 0x2E5EB66066087D7EULL, 0x6CAE578BCFE24BEDULL,
	0xABBF75B735DC1058ULL, 0xE94F945C9C3626CBULL, 0x676DD025684A91A1ULL,
	0x259D31CEC1A0A732ULL, 0xE28C13F23B9EFC87ULL, 0xA07CF2199274CA14ULL,
	0x167FF3EACBAF2AF1ULL, 0x548F120162451C62ULL, 0x939E303D987B47D7ULL,
	0xD16ED1D631917144ULL, 0x5F4C95AFC5EDC62EULL, 0x1DBC74446C07F0BDULL,
	0xDAAD56789639AB08ULL, 0x985DB7933FD39D9BULL, 0x84193F60D72AF34FULL,
	0xC6E9DE8B7EC0C5DCULL, 0x01F8FCB784FE9E69ULL, 0x43081D5C2D14A8FAULL,
	0xCD2A5925D9681F90ULL, 0x8FDAB8CE70822903ULL, 0x48CB9AF28ABC72B6ULL,
	0x0A3B7B1923564425ULL, 0x70428B155B4EAF1EULL, 0x32B26AFEF2A4998DULL,
	0xF5A348C2089AC238ULL, 0xB753A929A170F4ABULL, 0x3971ED50550C43C1ULL,
	0x7B810CBBFCE67552ULL, 0xBC902E8706D82EE7ULL, 0xFE60CF6CAF321874ULL,
	0xE224479F47CB76A0ULL, 0xA0D4A674EE214033ULL, 0x67C58448141F1B86ULL,
	0x253565A3BDF52D15ULL, 0xAB1721DA49899A7FULL, 0xE9E7C031E063ACECULL,
	0x2EF6E20D1A5DF759ULL, 0x6C0603E6B3B7C1CAULL, 0xF6FAE5C07D3274CDULL,
	0xB40A042BD4D8425EULL, 0x731B26172EE619EBULL, 0x31EBC7FC870C2F78ULL,
	0xBFC9838573709812ULL, 0xFD39626EDA9AAE81ULL, 0x3A28405220A4F534ULL,
	0x78D8A1B9894EC3A7ULL, 0x649C294A61B7AD73ULL, 0x266CC8A1C85D9BE0ULL,
	0xE17DEA9D3263C055ULL, 0xA38D0B769B89F6C6ULL, 0x2DAF4F0F6FF541ACULL,
	0x6F5FAEE4C61F773FULL, 0xA84E8CD83C212C8AULL, 0xEABE6D3395CB1A19ULL,
	0x90C79D3FEDD3F122ULL, 0xD2377CD44439C7B1ULL, 0x15265EE8BE079C04ULL,
	0x57D6BF0317EDAA97ULL, 0xD9F4FB7AE3911DFDULL, 0x9B041A914A7B2B6EULL,
	0x5C1538ADB04570DBULL, 0x1EE5D94619AF4648ULL, 0x02A151B5F156289CULL,
	0x4051B05E58BC1E0FULL, 0x87409262A28245BAULL, 0xC5B073890B687329ULL,
	0x4B9237F0FF14C443ULL, 0x0962D61B56FEF2D0ULL, 0xCE73F427ACC0A965ULL,
	0x8C8315CC052A9FF6ULL, 0x3A80143F5CF17F13ULL, 0x7870F5D4F51B4980ULL,
	0xBF61D7E80F251235ULL, 0xFD913603A6CF24A6ULL, 0x73B3727A52B393CCULL,
	0x31439391FB59A55FULL, 0xF652B1AD0167FEEAULL, 0xB4A25046A88DC879ULL,
	0xA8E6D8B54074A6ADULL, 0xEA16395EE99E903EULL, 0x2D071B6213A0CB8BULL,
	0x6FF7FA89BA4AFD18ULL, 0xE1D5BEF04E364A72ULL, 0xA3255F1BE7DC7CE1ULL,
	0x64347D271DE22754ULL, 0x26C49CCCB40811C7ULL, 0x5CBD6CC0CC10FAFCULL,
	0x1E4D8D2B65FACC6FULL, 0xD95CAF179FC497DAULL, 0x9BAC4EFC362EA149ULL,
	0x158E0A85C2521623ULL, 0x577EEB6E6BB820B0ULL, 0x906FC95291867B05ULL,
	0xD29F28B9386C4D96ULL, 0xCEDBA04AD0952342ULL, 0x8C2B41A1797F15D1ULL,
	0x4B3A639D83414E64ULL, 0x09CA82762AAB78F7ULL, 0x87E8C60FDED7CF9DULL,
	0xC51827E4773DF90EULL, 0x020905D88D03A2BBULL, 0x40F9E43324E99428ULL,
	0x2CFFE7D5975E55E2ULL, 0x6E0F063E3EB46371ULL, 0xA91E2402C48A38C4ULL,
	0xEBEEC5E96D600E57ULL, 0x65CC8190991CB93DULL, 0x273C607B30F68FAEULL,
	0xE02D4247CAC8D41BULL, 0xA2DDA3AC6322E288ULL, 0xBE992B5F8BDB8C5CULL,
	0xFC69CAB42231BACFULL, 0x3B78E888D80FE17AULL, 0x7988096371E5D7E9ULL,
	0xF7AA4D1A85996083ULL, 0xB55AACF12C735610ULL, 0x724B8ECDD64D0DA5ULL,
	0x30BB6F267FA73B36ULL, 0x4AC29F2A07BFD00DULL, 0x08327EC1AE55E69EULL,
	0xCF235CFD546BBD2BULL, 0x8DD3BD16FD818BB8ULL, 0x03F1F96F09FD3CD2ULL,
	0x41011884A0170A41ULL, 0x86103AB85A2951F4ULL, 0xC4E0DB53F3C36767ULL,
	0xD8A453A01B3A09B3ULL, 0x9A54B24BB2D03F20ULL, 0x5D45907748EE6495ULL,
	0x1FB5719CE1045206ULL, 0x919735E51578E56CULL, 0xD367D40EBC92D3FFULL,
	0x1476F63246AC884AULL, 0x568617D9EF46BED9ULL, 0xE085162AB69D5E3CULL,
	0xA275F7C11F7768AFULL, 0x6564D5FDE549331AULL, 0x279434164CA30589ULL,
	0xA9B6706FB8DFB2E3ULL, 0xEB46918411358470ULL, 0x2C57B3B8EB0BDFC5ULL,
	0x6EA7525342E1E956ULL, 0x72E3DAA0AA188782ULL, 0x30133B4B03F2B111ULL,
	0xF7021977F9CCEAA4ULL, 0xB5F2F89C5026DC37ULL, 0x3BD0BCE5A45A6B5DULL,
	0x79205D0E0DB05DCEULL, 0xBE317F32F78E067BULL, 0xFCC19ED95E6430E8ULL,
	0x86B86ED5267CDBD3ULL, 0xC4488F3E8F96ED40ULL, 0x0359AD0275A8B6F5ULL,
	0x41A94CE9DC428066ULL, 0xCF8B0890283E370CULL, 0x8D7BE97B81D4019FULL,
	0x4A6ACB477BEA5A2AULL, 0x089A2AACD2006CB9ULL, 0x14DEA25F3AF9026DULL,
	0x562E43B4931334FEULL, 0x913F6188692D6F4BULL, 0xD3CF8063C0C759D8ULL,
	0x5DEDC41A34BBEEB2ULL, 0x1F1D25F19D51D821ULL, 0xD80C07CD676F8394ULL,
	0x9AFCE626CE85B507ULL,
};
427 
428 uint64_t bch_crc64_update(uint64_t crc, const void *_data, size_t len)
429 {
430 	const unsigned char *data = _data;
431 
432 	while (len--) {
433 		int i = ((int) (crc >> 56) ^ *data++) & 0xFF;
434 		crc = crc_table[i] ^ (crc << 8);
435 	}
436 
437 	return crc;
438 }
439 
/*
 * Compute the CRC of the @len bytes at @data in one call: the register starts
 * out as all ones, is run through bch_crc64_update(), and is inverted at the
 * end.
 */
uint64_t bch_crc64(const void *data, size_t len)
{
	const uint64_t all_ones = 0xffffffffffffffffULL;

	return all_ones ^ bch_crc64_update(all_ones, data, len);
}
448