Line data Source code
1 : // SPDX-License-Identifier: GPL-3.0-or-later
2 : // Copyright (C) 2015 Andrea Mazzoleni
3 :
4 : #include "portable.h"
5 :
6 : #include "support.h"
7 : #include "state.h"
8 : #include "raid/raid.h"
9 :
10 72727 : void device_name_set(devinfo_t* dev, const char* name, int index)
11 : {
12 72727 : if (index == 0)
13 29146 : pathcpy(dev->name, sizeof(dev->name), name);
14 : else
15 43581 : pathprint(dev->name, sizeof(dev->name), "%s/%d", name, index);
16 72727 : }
17 :
18 : /**
19 : * The following are Failure Rate tables computed from the data that
20 : * BackBlaze made available at:
21 : *
22 : * Reliability Data Set For 41,000 Hard Drives Now Open Source
23 : * https://www.backblaze.com/blog/hard-drive-data-feb2015/
24 : *
25 : * Hard Drive Data Sets
26 : * https://www.backblaze.com/hard-drive-test-data.html
27 : *
28 : * Note that in this data:
29 : * - Disks all passed the load-testing and have made it to production,
30 : * and then Dead On Arrival (DOA) failures are excluded.
31 : * - Disks that are predicted to fail by BackBlaze are removed before
32 : * they really fail, not counting as a failure.
33 : *
34 : * The following tables are computed using the data from 2014-02-14 to
35 : * 2014-12-31 because it's the period when more SMART attributes were gathered.
36 : *
37 : * In this period there are 47322 disks seen, with 1988 removed because failed,
38 : * and with 4121 removed because predicted to fail.
39 : */
40 :
41 : /**
42 : * Number of data points in each table.
43 : */
44 : #define SMART_MEASURES 256
45 :
46 : /*
47 : * Divider for SMART attribute 5
48 : */
49 : static unsigned SMART_5_STEP = 1;
50 :
51 : /*
52 : * Failure rate for 30 days, for a disk
53 : * with SMART attribute 5 at a given value.
54 : */
55 : static double SMART_5_R[SMART_MEASURES] = {
56 : 0.0026, 0.0748, 0.0919, 0.1013, 0.1079,
57 : 0.1137, 0.1194, 0.1235, 0.1301, 0.1398,
58 : 0.1453, 0.1490, 0.1528, 0.1566, 0.1595,
59 : 0.1635, 0.1656, 0.1701, 0.1718, 0.1740,
60 : 0.1762, 0.1787, 0.1808, 0.1833, 0.1858,
61 : 0.1885, 0.1901, 0.1915, 0.1934, 0.1958,
62 : 0.1975, 0.1993, 0.2014, 0.2048, 0.2068,
63 : 0.2088, 0.2109, 0.2120, 0.2137, 0.2160,
64 : 0.2173, 0.2214, 0.2226, 0.2237, 0.2262,
65 : 0.2277, 0.2292, 0.2304, 0.2338, 0.2369,
66 : 0.2381, 0.2396, 0.2411, 0.2427, 0.2445,
67 : 0.2462, 0.2472, 0.2488, 0.2496, 0.2504,
68 : 0.2514, 0.2525, 0.2535, 0.2544, 0.2554,
69 : 0.2571, 0.2583, 0.2601, 0.2622, 0.2631,
70 : 0.2635, 0.2644, 0.2659, 0.2675, 0.2682,
71 : 0.2692, 0.2701, 0.2707, 0.2712, 0.2726,
72 : 0.2745, 0.2767, 0.2778, 0.2784, 0.2800,
73 : 0.2814, 0.2834, 0.2839, 0.2851, 0.2877,
74 : 0.2883, 0.2891, 0.2900, 0.2907, 0.2916,
75 : 0.2934, 0.2950, 0.2969, 0.2975, 0.2983,
76 : 0.2999, 0.3006, 0.3013, 0.3021, 0.3033,
77 : 0.3054, 0.3066, 0.3074, 0.3082, 0.3094,
78 : 0.3106, 0.3112, 0.3120, 0.3137, 0.3141,
79 : 0.3145, 0.3151, 0.3159, 0.3169, 0.3174,
80 : 0.3181, 0.3194, 0.3215, 0.3219, 0.3231,
81 : 0.3234, 0.3237, 0.3242, 0.3255, 0.3270,
82 : 0.3283, 0.3286, 0.3289, 0.3304, 0.3315,
83 : 0.3322, 0.3347, 0.3361, 0.3382, 0.3384,
84 : 0.3395, 0.3398, 0.3401, 0.3405, 0.3411,
85 : 0.3431, 0.3435, 0.3442, 0.3447, 0.3450,
86 : 0.3455, 0.3464, 0.3472, 0.3486, 0.3497,
87 : 0.3501, 0.3509, 0.3517, 0.3531, 0.3535,
88 : 0.3540, 0.3565, 0.3569, 0.3576, 0.3579,
89 : 0.3584, 0.3590, 0.3594, 0.3599, 0.3621,
90 : 0.3627, 0.3642, 0.3649, 0.3655, 0.3658,
91 : 0.3667, 0.3683, 0.3699, 0.3704, 0.3707,
92 : 0.3711, 0.3715, 0.3718, 0.3721, 0.3727,
93 : 0.3740, 0.3744, 0.3748, 0.3753, 0.3756,
94 : 0.3761, 0.3766, 0.3775, 0.3794, 0.3801,
95 : 0.3804, 0.3813, 0.3817, 0.3823, 0.3831,
96 : 0.3847, 0.3875, 0.3881, 0.3886, 0.3890,
97 : 0.3893, 0.3896, 0.3900, 0.3907, 0.3923,
98 : 0.3925, 0.3933, 0.3936, 0.3961, 0.3971,
99 : 0.3981, 0.3989, 0.4007, 0.4012, 0.4018,
100 : 0.4023, 0.4027, 0.4041, 0.4048, 0.4056,
101 : 0.4073, 0.4079, 0.4086, 0.4104, 0.4107,
102 : 0.4109, 0.4112, 0.4118, 0.4133, 0.4139,
103 : 0.4144, 0.4146, 0.4148, 0.4164, 0.4165,
104 : 0.4174, 0.4191, 0.4197, 0.4201, 0.4204,
105 : 0.4210, 0.4213, 0.4216, 0.4221, 0.4231,
106 : 0.4235, 0.4237, 0.4239, 0.4241, 0.4244,
107 : 0.4249,
108 : };
109 :
110 : /*
111 : * Divider for SMART attribute 187
112 : */
113 : static unsigned SMART_187_STEP = 1;
114 :
115 : /*
116 : * Failure rate for 30 days, for a disk
117 : * with SMART attribute 187 at a given value.
118 : */
119 : static double SMART_187_R[SMART_MEASURES] = {
120 : 0.0039, 0.1287, 0.1579, 0.1776, 0.1905,
121 : 0.2013, 0.2226, 0.3263, 0.3612, 0.3869,
122 : 0.4086, 0.4292, 0.4559, 0.5278, 0.5593,
123 : 0.5847, 0.6124, 0.6345, 0.6517, 0.6995,
124 : 0.7308, 0.7541, 0.7814, 0.8122, 0.8306,
125 : 0.8839, 0.9100, 0.9505, 0.9906, 1.0254,
126 : 1.0483, 1.1060, 1.1280, 1.1624, 1.1895,
127 : 1.2138, 1.2452, 1.2864, 1.3120, 1.3369,
128 : 1.3705, 1.3894, 1.4055, 1.4218, 1.4434,
129 : 1.4670, 1.4834, 1.4993, 1.5174, 1.5400,
130 : 1.5572, 1.5689, 1.5808, 1.6198, 1.6346,
131 : 1.6405, 1.6570, 1.6618, 1.6755, 1.6877,
132 : 1.7100, 1.7258, 1.7347, 1.7814, 1.7992,
133 : 1.8126, 1.8225, 1.8269, 1.8341, 1.8463,
134 : 1.8765, 1.8850, 1.9005, 1.9281, 1.9398,
135 : 1.9618, 1.9702, 1.9905, 2.0099, 2.0480,
136 : 2.0565, 2.0611, 2.0709, 2.0846, 2.0895,
137 : 2.0958, 2.1008, 2.1055, 2.1097, 2.1235,
138 : 2.1564, 2.1737, 2.1956, 2.1989, 2.2015,
139 : 2.2148, 2.2355, 2.2769, 2.2940, 2.3045,
140 : 2.3096, 2.3139, 2.3344, 2.3669, 2.3779,
141 : 2.3941, 2.4036, 2.4396, 2.4473, 2.4525,
142 : 2.4656, 2.4762, 2.4787, 2.5672, 2.5732,
143 : 2.5755, 2.5794, 2.5886, 2.6100, 2.6144,
144 : 2.6341, 2.6614, 2.6679, 2.6796, 2.6847,
145 : 2.6872, 2.6910, 2.6934, 2.6995, 2.7110,
146 : 2.7179, 2.7204, 2.7232, 2.7282, 2.7355,
147 : 2.7375, 2.7422, 2.7558, 2.7580, 2.7643,
148 : 2.7767, 2.7770, 2.8016, 2.9292, 2.9294,
149 : 2.9337, 2.9364, 2.9409, 2.9436, 2.9457,
150 : 2.9466, 2.9498, 2.9543, 2.9570, 2.9573,
151 : 2.9663, 2.9708, 2.9833, 2.9859, 2.9895,
152 : 2.9907, 2.9932, 2.9935, 3.0021, 3.0035,
153 : 3.0079, 3.0103, 3.0126, 3.0151, 3.0266,
154 : 3.0288, 3.0320, 3.0330, 3.0343, 3.0373,
155 : 3.0387, 3.0438, 3.0570, 3.0579, 3.0616,
156 : 3.0655, 3.0728, 3.0771, 3.0794, 3.0799,
157 : 3.0812, 3.1769, 3.1805, 3.1819, 3.1860,
158 : 3.1869, 3.2004, 3.2016, 3.2025, 3.2070,
159 : 3.2129, 3.2173, 3.2205, 3.2254, 3.2263,
160 : 3.2300, 3.2413, 3.2543, 3.2580, 3.2595,
161 : 3.2611, 3.2624, 3.2787, 3.2798, 3.2809,
162 : 3.2823, 3.2833, 3.2834, 3.2853, 3.2866,
163 : 3.3332, 3.3580, 3.3595, 3.3625, 3.3631,
164 : 3.3667, 3.3702, 3.3737, 3.3742, 3.3747,
165 : 3.3769, 3.3775, 3.3791, 3.3809, 3.3813,
166 : 3.3814, 3.3822, 3.3827, 3.3828, 3.3833,
167 : 3.3833, 3.3843, 3.3882, 3.3963, 3.4047,
168 : 3.4057, 3.4213, 3.4218, 3.4230, 3.4231,
169 : 3.4240, 3.4262, 3.4283, 3.4283, 3.4288,
170 : 3.4293, 3.4302, 3.4317, 3.4478, 3.4486,
171 : 3.4520,
172 : };
173 :
174 : /*
175 : * Divider for SMART attribute 188
176 : */
177 : static unsigned SMART_188_STEP = 1;
178 :
179 : /*
180 : * Failure rate for 30 days, for a disk
181 : * with SMART attribute 188 at a given value.
182 : */
183 : static double SMART_188_R[SMART_MEASURES] = {
184 : 0.0025, 0.0129, 0.0182, 0.0215, 0.0236,
185 : 0.0257, 0.0279, 0.0308, 0.0341, 0.0382,
186 : 0.0430, 0.0491, 0.0565, 0.0658, 0.0770,
187 : 0.0906, 0.1037, 0.1197, 0.1355, 0.1525,
188 : 0.1686, 0.1864, 0.2011, 0.2157, 0.2281,
189 : 0.2404, 0.2505, 0.2591, 0.2676, 0.2766,
190 : 0.2827, 0.2913, 0.2999, 0.3100, 0.3185,
191 : 0.3298, 0.3361, 0.3446, 0.3506, 0.3665,
192 : 0.3699, 0.3820, 0.3890, 0.4059, 0.4108,
193 : 0.4255, 0.4290, 0.4424, 0.4473, 0.4617,
194 : 0.4667, 0.4770, 0.4829, 0.4977, 0.4997,
195 : 0.5102, 0.5137, 0.5283, 0.5316, 0.5428,
196 : 0.5480, 0.5597, 0.5634, 0.5791, 0.5826,
197 : 0.5929, 0.5945, 0.6025, 0.6102, 0.6175,
198 : 0.6245, 0.6313, 0.6421, 0.6468, 0.6497,
199 : 0.6557, 0.6570, 0.6647, 0.6698, 0.6769,
200 : 0.6849, 0.6884, 0.6925, 0.7025, 0.7073,
201 : 0.7161, 0.7223, 0.7256, 0.7280, 0.7411,
202 : 0.7445, 0.7530, 0.7628, 0.7755, 0.7900,
203 : 0.8006, 0.8050, 0.8098, 0.8132, 0.8192,
204 : 0.8230, 0.8293, 0.8356, 0.8440, 0.8491,
205 : 0.8672, 0.8766, 0.8907, 0.8934, 0.8992,
206 : 0.9062, 0.9111, 0.9209, 0.9290, 0.9329,
207 : 0.9378, 0.9385, 0.9402, 0.9427, 0.9448,
208 : 0.9459, 0.9568, 0.9626, 0.9628, 0.9730,
209 : 0.9765, 0.9797, 0.9825, 0.9873, 0.9902,
210 : 0.9926, 0.9991, 1.0031, 1.0044, 1.0062,
211 : 1.0120, 1.0148, 1.0188, 1.0218, 1.0231,
212 : 1.0249, 1.0277, 1.0335, 1.0355, 1.0417,
213 : 1.0467, 1.0474, 1.0510, 1.0529, 1.0532,
214 : 1.0562, 1.0610, 1.0702, 1.0708, 1.0800,
215 : 1.0804, 1.0845, 1.1120, 1.1191, 1.1225,
216 : 1.1264, 1.1265, 1.1335, 1.1347, 1.1479,
217 : 1.1479, 1.1519, 1.1545, 1.1645, 1.1646,
218 : 1.1647, 1.1649, 1.1678, 1.1713, 1.1723,
219 : 1.1733, 1.1736, 1.1736, 1.1738, 1.1739,
220 : 1.1739, 1.1741, 1.1741, 1.1746, 1.1746,
221 : 1.1748, 1.1750, 1.1760, 1.1794, 1.1854,
222 : 1.1908, 1.1912, 1.1912, 1.1971, 1.2033,
223 : 1.2033, 1.2120, 1.2166, 1.2185, 1.2185,
224 : 1.2189, 1.2211, 1.2226, 1.2234, 1.2320,
225 : 1.2345, 1.2345, 1.2347, 1.2350, 1.2350,
226 : 1.2407, 1.2408, 1.2408, 1.2408, 1.2409,
227 : 1.2460, 1.2518, 1.2519, 1.2519, 1.2519,
228 : 1.2520, 1.2520, 1.2521, 1.2521, 1.2521,
229 : 1.2593, 1.2745, 1.2760, 1.2772, 1.2831,
230 : 1.2833, 1.2890, 1.2906, 1.3166, 1.3201,
231 : 1.3202, 1.3202, 1.3202, 1.3204, 1.3204,
232 : 1.3314, 1.3422, 1.3423, 1.3441, 1.3491,
233 : 1.3583, 1.3602, 1.3606, 1.3636, 1.3650,
234 : 1.3661, 1.3703, 1.3708, 1.3716, 1.3730,
235 : 1.3731,
236 : };
237 :
238 : /*
239 : * Divider for SMART attribute 197
240 : */
241 : static unsigned SMART_197_STEP = 1;
242 :
243 : /*
244 : * Failure rate for 30 days, for a disk
245 : * with SMART attribute 197 at a given value.
246 : */
247 : static double SMART_197_R[SMART_MEASURES] = {
248 : 0.0028, 0.2972, 0.3883, 0.4363, 0.4644,
249 : 0.4813, 0.4948, 0.5051, 0.5499, 0.8535,
250 : 0.8678, 0.8767, 0.8882, 0.8933, 0.9012,
251 : 0.9076, 0.9368, 1.1946, 1.2000, 1.2110,
252 : 1.2177, 1.2305, 1.2385, 1.2447, 1.2699,
253 : 1.4713, 1.4771, 1.4802, 1.4887, 1.5292,
254 : 1.5384, 1.5442, 1.5645, 1.7700, 1.7755,
255 : 1.7778, 1.7899, 1.7912, 1.7991, 1.7998,
256 : 1.8090, 1.9974, 1.9992, 2.0088, 2.0132,
257 : 2.0146, 2.0161, 2.0171, 2.0273, 2.1845,
258 : 2.1866, 2.1877, 2.1900, 2.1922, 2.1944,
259 : 2.1974, 2.2091, 2.3432, 2.3459, 2.3463,
260 : 2.3468, 2.3496, 2.3503, 2.3533, 2.3593,
261 : 2.4604, 2.4606, 2.4609, 2.4612, 2.4620,
262 : 2.4626, 2.4638, 2.4689, 2.5575, 2.5581,
263 : 2.5586, 2.5586, 2.5588, 2.5602, 2.5602,
264 : 2.5648, 2.6769, 2.6769, 2.6769, 2.6794,
265 : 2.6805, 2.6811, 2.6814, 2.6862, 2.7742,
266 : 2.7755, 2.7771, 2.7780, 2.7790, 2.7797,
267 : 2.7807, 2.7871, 2.9466, 2.9478, 2.9492,
268 : 2.9612, 2.9618, 2.9624, 2.9628, 2.9669,
269 : 3.1467, 3.1481, 3.1494, 3.1499, 3.1504,
270 : 3.1507, 3.1509, 3.1532, 3.2675, 3.2681,
271 : 3.2703, 3.2712, 3.2714, 3.2726, 3.2726,
272 : 3.2743, 3.3376, 3.3379, 3.3382, 3.3397,
273 : 3.3403, 3.3410, 3.3410, 3.3429, 3.4052,
274 : 3.4052, 3.4052, 3.4052, 3.4052, 3.4053,
275 : 3.4053, 3.4075, 3.4616, 3.4616, 3.4616,
276 : 3.4616, 3.4616, 3.4616, 3.4620, 3.4634,
277 : 3.4975, 3.4975, 3.4975, 3.4975, 3.4979,
278 : 3.4979, 3.4979, 3.4998, 3.5489, 3.5489,
279 : 3.5489, 3.5489, 3.5489, 3.5493, 3.5497,
280 : 3.5512, 3.5827, 3.5828, 3.5828, 3.5828,
281 : 3.5828, 3.5828, 3.5828, 3.5844, 3.6251,
282 : 3.6251, 3.6251, 3.6267, 3.6267, 3.6271,
283 : 3.6271, 3.6279, 3.6562, 3.6562, 3.6563,
284 : 3.7206, 3.7242, 3.7332, 3.7332, 3.7346,
285 : 3.7548, 3.7548, 3.7553, 3.7576, 3.7581,
286 : 3.7586, 3.7587, 3.7600, 3.7773, 3.7812,
287 : 3.7836, 3.7841, 3.7842, 3.7851, 3.7856,
288 : 3.7876, 3.8890, 3.8890, 3.8890, 3.8890,
289 : 3.8890, 3.8890, 3.8890, 3.8897, 3.9111,
290 : 3.9114, 3.9114, 3.9114, 3.9114, 3.9114,
291 : 3.9114, 3.9126, 3.9440, 3.9440, 3.9440,
292 : 3.9440, 3.9440, 3.9498, 3.9498, 3.9509,
293 : 3.9783, 3.9783, 3.9784, 3.9784, 3.9784,
294 : 3.9784, 4.0012, 4.0019, 4.0406, 4.0413,
295 : 4.0413, 4.0413, 4.0413, 4.0414, 4.0414,
296 : 4.0421, 4.0552, 4.0552, 4.0558, 4.0558,
297 : 4.0558, 4.0558, 4.0558, 4.0563, 4.0753,
298 : 4.0753, 4.0760, 4.1131, 4.1131, 4.1131,
299 : 4.1131,
300 : };
301 :
302 : /*
303 : * Divider for SMART attribute 198
304 : */
305 : static unsigned SMART_198_STEP = 1;
306 :
307 : /*
308 : * Failure rate for 30 days, for a disk
309 : * with SMART attribute 198 at a given value.
310 : */
311 : static double SMART_198_R[SMART_MEASURES] = {
312 : 0.0030, 0.5479, 0.5807, 0.5949, 0.6046,
313 : 0.6086, 0.6139, 0.6224, 0.6639, 1.0308,
314 : 1.0329, 1.0364, 1.0371, 1.0387, 1.0399,
315 : 1.0421, 1.0675, 1.3730, 1.3733, 1.3741,
316 : 1.3741, 1.3752, 1.3794, 1.3800, 1.3985,
317 : 1.6291, 1.6303, 1.6309, 1.6352, 1.6384,
318 : 1.6448, 1.6464, 1.6645, 1.8949, 1.8951,
319 : 1.8962, 1.9073, 1.9073, 1.9152, 1.9161,
320 : 1.9240, 2.1308, 2.1315, 2.1328, 2.1328,
321 : 2.1328, 2.1328, 2.1329, 2.1439, 2.3203,
322 : 2.3205, 2.3205, 2.3205, 2.3205, 2.3205,
323 : 2.3205, 2.3265, 2.4729, 2.4729, 2.4729,
324 : 2.4729, 2.4729, 2.4729, 2.4729, 2.4778,
325 : 2.5900, 2.5900, 2.5901, 2.5901, 2.5901,
326 : 2.5901, 2.5901, 2.5949, 2.6964, 2.6965,
327 : 2.6965, 2.6965, 2.6965, 2.6965, 2.6965,
328 : 2.7010, 2.8328, 2.8328, 2.8328, 2.8329,
329 : 2.8329, 2.8329, 2.8329, 2.8366, 2.9405,
330 : 2.9405, 2.9405, 2.9405, 2.9405, 2.9405,
331 : 2.9405, 2.9442, 3.1344, 3.1344, 3.1346,
332 : 3.1463, 3.1463, 3.1463, 3.1463, 3.1493,
333 : 3.3076, 3.3076, 3.3076, 3.3076, 3.3076,
334 : 3.3077, 3.3077, 3.3097, 3.4456, 3.4456,
335 : 3.4456, 3.4456, 3.4456, 3.4456, 3.4456,
336 : 3.4473, 3.5236, 3.5236, 3.5236, 3.5236,
337 : 3.5236, 3.5236, 3.5236, 3.5249, 3.6004,
338 : 3.6004, 3.6004, 3.6004, 3.6004, 3.6004,
339 : 3.6004, 3.6026, 3.6684, 3.6684, 3.6684,
340 : 3.6684, 3.6684, 3.6684, 3.6684, 3.6697,
341 : 3.7121, 3.7121, 3.7121, 3.7121, 3.7121,
342 : 3.7121, 3.7121, 3.7136, 3.7744, 3.7744,
343 : 3.7744, 3.7744, 3.7744, 3.7745, 3.7745,
344 : 3.7756, 3.8151, 3.8151, 3.8151, 3.8151,
345 : 3.8151, 3.8151, 3.8151, 3.8163, 3.8673,
346 : 3.8673, 3.8673, 3.8673, 3.8673, 3.8673,
347 : 3.8673, 3.8680, 3.9044, 3.9044, 3.9044,
348 : 3.9044, 3.9044, 3.9044, 3.9044, 3.9056,
349 : 3.9297, 3.9297, 3.9297, 3.9297, 3.9297,
350 : 3.9297, 3.9297, 3.9305, 3.9494, 3.9494,
351 : 3.9494, 3.9494, 3.9494, 3.9494, 3.9494,
352 : 3.9514, 4.0725, 4.0725, 4.0725, 4.0725,
353 : 4.0725, 4.0725, 4.0725, 4.0731, 4.0990,
354 : 4.0993, 4.0993, 4.0993, 4.0993, 4.0993,
355 : 4.0993, 4.1004, 4.1385, 4.1385, 4.1385,
356 : 4.1386, 4.1386, 4.1387, 4.1387, 4.1398,
357 : 4.1732, 4.2284, 4.2284, 4.2284, 4.2284,
358 : 4.2284, 4.2284, 4.2290, 4.2781, 4.2781,
359 : 4.2963, 4.2963, 4.2963, 4.2963, 4.2963,
360 : 4.2971, 4.3141, 4.3141, 4.3141, 4.3141,
361 : 4.3141, 4.3141, 4.3141, 4.3146, 4.3393,
362 : 4.3393, 4.3393, 4.3393, 4.3393, 4.3393,
363 : 4.3393,
364 : };
365 :
366 : /**
367 : * Computes the estimated Annual Failure Rate from the specified table.
368 : */
369 350783 : static double smart_afr_value(double* tab, unsigned step, uint64_t value)
370 : {
371 350783 : value /= step;
372 :
373 350783 : if (value >= SMART_MEASURES)
374 0 : value = SMART_MEASURES - 1;
375 :
376 : /* table rates are for a month, so we scale to a year */
377 350783 : return 365.0 / 30.0 * tab[value];
378 : }
379 :
380 : /**
381 : * Computes the estimated Annual Failure Rate of a set of SMART attributes.
382 : *
383 : * We define the Annual Failure Rate as the average number of
384 : * failures you expect in a year from a disk slot:
385 : *
386 : * AFR = 8760/MTBF (Mean Time Between Failures in hours).
387 : *
388 : * Note that this definition is different from the one given
389 : * by Seagate, that defines AFR = 1 - exp(-8760/MTBF), that
390 : * instead represents the probability of a failure in the next
391 : * year.
392 : *
393 : * To combine the different AFR from different SMART attributes,
394 : * we use the maximum rate reported, and we do not sum them,
395 : * because the attributes are not independent.
396 : */
397 72621 : static double smart_afr(devinfo_t* devinfo)
398 : {
399 72621 : double afr = 0;
400 72621 : uint64_t mask32 = 0xffffffffU;
401 72621 : uint64_t mask16 = 0xffffU;
402 72621 : uint64_t* info = devinfo->info;
403 72621 : struct smart_attr* smart = devinfo->smart;
404 :
405 : /* do not estimate for not rotational */
406 72621 : if (info[INFO_ROTATION_RATE] == 0)
407 2 : return 0;
408 :
409 72619 : if (smart[5].raw != SMART_UNASSIGNED) {
410 70188 : double r = smart_afr_value(SMART_5_R, SMART_5_STEP, smart[5].raw & mask32);
411 70188 : if (afr < r)
412 70188 : afr = r;
413 : }
414 :
415 72619 : if (smart[187].raw != SMART_UNASSIGNED) {
416 : /*
417 : * With some disks, only the lower 16 bits are significant
418 : * See: http://web.archive.org/web/20130507072056/http://media.kingston.com/support/downloads/MKP_306_SMART_attribute.pdf
419 : */
420 70155 : double r = smart_afr_value(SMART_187_R, SMART_187_STEP, smart[187].raw & mask16);
421 70155 : if (afr < r)
422 70155 : afr = r;
423 : }
424 :
425 72619 : if (
426 : /**
427 : * Don't check Command_Timeout (188) for Seagate disks.
428 : *
429 : * It's reported by users that for Archive SMR (Shingled Magnetic Recording)
430 : * and IronWolf disks to be a not significant test as
431 : * this value increases too often also on sane disks.
432 : */
433 72619 : strncmp(devinfo->model, "ST", 2) != 0 && smart[188].raw != SMART_UNASSIGNED
434 : ) {
435 : /*
436 : * With Seagate disks, there are three different 16 bits value reported
437 : * the lowest one is the most significant
438 : */
439 70149 : double r = smart_afr_value(SMART_188_R, SMART_188_STEP, smart[188].raw & mask16);
440 70149 : if (afr < r)
441 0 : afr = r;
442 : }
443 :
444 72619 : if (smart[197].raw != SMART_UNASSIGNED) {
445 70103 : double r = smart_afr_value(SMART_197_R, SMART_197_STEP, smart[197].raw & mask32);
446 70103 : if (afr < r)
447 33 : afr = r;
448 : }
449 :
450 72619 : if (smart[198].raw != SMART_UNASSIGNED) {
451 70188 : double r = smart_afr_value(SMART_198_R, SMART_198_STEP, smart[198].raw & mask32);
452 70188 : if (afr < r)
453 33 : afr = r;
454 : }
455 :
456 72619 : return afr;
457 : }
458 :
459 : /**
460 : * Calculates the probability of at least one failure occurring
461 : * within a year using a Poisson distribution.
462 : *
463 : * @param afr The aggregate Annual Failure Rate (lambda).
464 : * @return The probability as a double between 0 and 1.
465 : */
466 70248 : static double poisson_prob_at_least_one_failure(double rate)
467 : {
468 70248 : return 1.0 - exp(-rate);
469 : }
470 :
471 : /**
472 : * Probability of having data loss in a RAID system with the specified ::redundancy
473 : * supposing the specified ::array_failure_rate, and ::replace_rate.
474 : */
475 18 : static double raid_prob_of_one_or_more_failures(double array_failure_rate, double replace_rate, unsigned n, unsigned redundancy)
476 : {
477 : unsigned i;
478 : double MTBF;
479 : double MTTR;
480 : double MTTDL;
481 : double raid_failure_rate;
482 :
483 : /*
484 : * Use the MTTDL model (Mean Time To Data Loss) to estimate the
485 : * failure rate of the array.
486 : *
487 : * See:
488 : * Garth Alan Gibson, "Redundant Disk Arrays: Reliable, Parallel Secondary Storage", 1990
489 : */
490 :
491 : /* avoid division by zero */
492 18 : if (array_failure_rate == 0)
493 0 : return 0;
494 :
495 : /*
496 : * Get the Mean Time Between Failure of a single disk
497 : * from the array failure rate
498 : */
499 18 : MTBF = n / array_failure_rate;
500 :
501 : /*
502 : * Get the Mean Time Between Repair (the time that a failed disk is replaced)
503 : * from the repair rate
504 : */
505 18 : MTTR = 1.0 / replace_rate;
506 :
507 : /* use the approximated MTTDL equation */
508 18 : MTTDL = pow(MTBF, redundancy + 1) / pow(MTTR, redundancy);
509 99 : for (i = 0; i < redundancy + 1; ++i)
510 81 : MTTDL /= n - i;
511 :
512 : /* the raid failure rate is just the inverse of the MTTDL */
513 18 : raid_failure_rate = 1.0 / MTTDL;
514 :
515 : /* probability of at least one RAID failure */
516 18 : return poisson_prob_at_least_one_failure(raid_failure_rate);
517 : }
518 :
519 72624 : static void state_info_log(devinfo_t* devinfo)
520 : {
521 : char esc_buffer[ESC_MAX];
522 :
523 72624 : log_tag("info:%s:%s\n", devinfo->file, devinfo->name);
524 72624 : if (devinfo->serial[0])
525 72624 : log_tag("attr:%s:%s:serial:%s\n", devinfo->file, devinfo->name, esc_tag(devinfo->serial, esc_buffer));
526 72624 : if (devinfo->family[0])
527 72606 : log_tag("attr:%s:%s:family:%s\n", devinfo->file, devinfo->name, esc_tag(devinfo->family, esc_buffer));
528 72624 : if (devinfo->model[0])
529 72624 : log_tag("attr:%s:%s:model:%s\n", devinfo->file, devinfo->name, esc_tag(devinfo->model, esc_buffer));
530 72624 : if (devinfo->interf[0])
531 72612 : log_tag("attr:%s:%s:interface:%s\n", devinfo->file, devinfo->name, esc_tag(devinfo->interf, esc_buffer));
532 72624 : if (devinfo->info[INFO_SIZE] != SMART_UNASSIGNED)
533 72624 : log_tag("attr:%s:%s:size:%" PRIu64 "\n", devinfo->file, devinfo->name, devinfo->info[INFO_SIZE]);
534 72624 : if (devinfo->info[INFO_ROTATION_RATE] != SMART_UNASSIGNED)
535 72624 : log_tag("attr:%s:%s:rotationrate:%" PRIu64 "\n", devinfo->file, devinfo->name, devinfo->info[INFO_ROTATION_RATE]);
536 72624 : }
537 :
538 72624 : static void state_smart_ignore(struct snapraid_state* state, devinfo_t* devinfo)
539 : {
540 : /* clear attributes to ignore */
541 363120 : for (int i = 0; i < SMART_IGNORE_MAX; ++i) {
542 290496 : devinfo->smart[state->smartignore[i]].raw = SMART_UNASSIGNED;
543 290496 : devinfo->smart[devinfo->smartignore[i]].raw = SMART_UNASSIGNED;
544 : }
545 72624 : }
546 :
547 72624 : static void state_smart_log(devinfo_t* devinfo, double afr)
548 : {
549 : unsigned j;
550 :
551 72624 : log_tag("smart:%s:%s\n", devinfo->file, devinfo->name);
552 72624 : if (devinfo->smart[SMART_ERROR_PROTOCOL].raw != SMART_UNASSIGNED)
553 72612 : log_tag("attr:%s:%s:error_protocol:%" PRIu64 "\n", devinfo->file, devinfo->name, devinfo->smart[SMART_ERROR_PROTOCOL].raw);
554 72624 : if (devinfo->smart[SMART_ERROR_MEDIUM].raw != SMART_UNASSIGNED)
555 72570 : log_tag("attr:%s:%s:error_medium:%" PRIu64 "\n", devinfo->file, devinfo->name, devinfo->smart[SMART_ERROR_MEDIUM].raw);
556 72624 : if (devinfo->smart[SMART_WEAR_LEVEL].raw != SMART_UNASSIGNED)
557 72573 : log_tag("attr:%s:%s:wear_level:%" PRIu64 "\n", devinfo->file, devinfo->name, devinfo->smart[SMART_WEAR_LEVEL].raw);
558 72624 : if (devinfo->smart[SMART_FLAGS].raw != SMART_UNASSIGNED)
559 19394 : log_tag("attr:%s:%s:flags:%" PRIu64 ":%" PRIx64 "\n", devinfo->file, devinfo->name, devinfo->smart[SMART_FLAGS].raw, devinfo->smart[SMART_FLAGS].raw);
560 :
561 72624 : if (afr != 0)
562 70188 : log_tag("attr:%s:%s:afr:%g:%g\n", devinfo->file, devinfo->name, afr, poisson_prob_at_least_one_failure(afr));
563 :
564 18664368 : for (j = 0; j < 256; ++j) {
565 18591744 : struct smart_attr* attr = &devinfo->smart[j];
566 18591744 : if (attr->raw != SMART_UNASSIGNED) {
567 17891596 : const char* type = "";;
568 17891596 : const char* updated = "";
569 17891596 : const char* when_failed = "";
570 :
571 17891596 : if (attr->flags & SMART_ATTR_TYPE_PREFAIL)
572 189 : type = "prefail";
573 17891407 : else if (attr->flags & SMART_ATTR_TYPE_OLDAGE)
574 570 : type = "oldage";
575 17891596 : if (attr->flags & SMART_ATTR_UPDATE_ALWAYS)
576 639 : updated = "always";
577 17890957 : else if (attr->flags & SMART_ATTR_UPDATE_OFFLINE)
578 120 : updated = "offline";
579 17891596 : if (attr->flags & SMART_ATTR_WHEN_FAILED_NOW)
580 0 : when_failed = "now";
581 17891596 : else if (attr->flags & SMART_ATTR_WHEN_FAILED_PAST)
582 6 : when_failed = "past";
583 17891590 : else if (attr->flags & SMART_ATTR_WHEN_FAILED_NEVER)
584 753 : when_failed = "never";
585 :
586 17891596 : log_tag("attr:%s:%s:%u:%" PRIu64 ":%" PRIx64 ":%" PRIu64 ":%" PRIu64 ":%" PRIu64 ":%s:%s:%s:%s\n", devinfo->file, devinfo->name, j, attr->raw, attr->raw, attr->norm, attr->worst, attr->thresh, attr->name, type, updated, when_failed);
587 : }
588 : }
589 :
590 72624 : int temp = smart_temp(devinfo);
591 72624 : if (temp >= 0)
592 72612 : log_tag("attr:%s:%s:temperature:%d\n", devinfo->file, devinfo->name, temp);
593 72624 : }
594 :
595 2 : static void state_smart(struct snapraid_state* state, unsigned n, tommy_list* low)
596 : {
597 : tommy_node* i;
598 : unsigned j;
599 : size_t device_pad;
600 : size_t serial_pad;
601 : int have_parent;
602 : double array_failure_rate;
603 : double p_at_least_one_failure;
604 2 : int make_it_fail = 0;
605 2 : uint64_t mask32 = 0xffffffffU;
606 :
607 : /* compute lengths for padding */
608 2 : device_pad = 0;
609 2 : serial_pad = 0;
610 2 : have_parent = 0;
611 46 : for (i = tommy_list_head(low); i != 0; i = i->next) {
612 : size_t len;
613 44 : devinfo_t* devinfo = i->data;
614 :
615 44 : len = strlen(devinfo->file);
616 44 : if (len > device_pad)
617 2 : device_pad = len;
618 :
619 44 : len = strlen(devinfo->serial);
620 44 : if (len > serial_pad)
621 3 : serial_pad = len;
622 :
623 44 : if (devinfo->parent != 0)
624 14 : have_parent = 1;
625 : }
626 :
627 2 : printf("SnapRAID SMART report:\n");
628 2 : printf("\n");
629 2 : printf(" Temp");
630 2 : printf(" Power");
631 2 : printf(" Error");
632 2 : printf(" FP");
633 2 : printf(" Wear");
634 2 : printf(" Size");
635 2 : printf("\n");
636 2 : printf(" C");
637 2 : printf(" OnDays");
638 2 : printf(" Count");
639 2 : printf(" ");
640 2 : printf("Level");
641 2 : printf(" TB");
642 2 : printf(" "); printl("Serial", serial_pad);
643 2 : printf(" "); printl("Device", device_pad);
644 2 : printf(" Disk");
645 2 : printf("\n");
646 : /* |<##################################################################72>|####80>| */
647 2 : printf(" -----------------------------------------------------------------------\n");
648 :
649 2 : array_failure_rate = 0;
650 46 : for (i = tommy_list_head(low); i != 0; i = i->next) {
651 44 : devinfo_t* devinfo = i->data;
652 : double afr;
653 : uint64_t flag;
654 :
655 44 : state_smart_ignore(state, devinfo);
656 :
657 44 : int temp = smart_temp(devinfo);
658 44 : if (temp >= 0)
659 44 : printf("%7d", temp);
660 : else
661 0 : printf(" -");
662 :
663 44 : if (devinfo->smart[SMART_POWER_ON_HOURS].raw != SMART_UNASSIGNED)
664 43 : printf("%7" PRIu64, (devinfo->smart[SMART_POWER_ON_HOURS].raw & mask32) / 24);
665 : else
666 1 : printf(" -");
667 :
668 44 : uint64_t error_count = 0;
669 44 : if (devinfo->smart[SMART_ERROR_PROTOCOL].raw != SMART_UNASSIGNED && devinfo->smart[SMART_ERROR_PROTOCOL].raw != 0)
670 1 : error_count += devinfo->smart[SMART_ERROR_PROTOCOL].raw;
671 44 : if (devinfo->smart[SMART_ERROR_MEDIUM].raw != SMART_UNASSIGNED && devinfo->smart[SMART_ERROR_MEDIUM].raw != 0)
672 0 : error_count += devinfo->smart[SMART_ERROR_MEDIUM].raw;
673 44 : if (devinfo->smart[SMART_FLAGS].raw != SMART_UNASSIGNED)
674 22 : flag = devinfo->smart[SMART_FLAGS].raw;
675 : else
676 22 : flag = 0;
677 :
678 44 : if (flag & SMARTCTL_FLAG_FAIL)
679 1 : printf(" FAIL");
680 43 : else if (flag & SMARTCTL_FLAG_PREFAIL)
681 1 : printf(" PREFAIL");
682 42 : else if (flag & SMARTCTL_FLAG_PREFAIL_LOGGED)
683 3 : printf(" logfail");
684 39 : else if (error_count != 0) {
685 1 : printf("%8" PRIu64, error_count);
686 38 : } else if (flag & SMARTCTL_FLAG_ERROR_LOGGED)
687 1 : printf(" logerr");
688 37 : else if (flag & SMARTCTL_FLAG_SELFERROR_LOGGED)
689 1 : printf(" selferr");
690 : else
691 36 : printf(" -");
692 :
693 : /* if some fail/prefail attribute, make the command to fail */
694 44 : if (flag & (SMARTCTL_FLAG_FAIL | SMARTCTL_FLAG_PREFAIL))
695 2 : make_it_fail = 1;
696 :
697 : /*
698 : * Note that in older smartmontools, like 5.x, rotation rate is not present
699 : * and then it could remain unassigned
700 : */
701 :
702 44 : if (flag & (SMARTCTL_FLAG_UNSUPPORTED | SMARTCTL_FLAG_OPEN)) {
703 : /* if error running smartctl, skip AFR estimation */
704 2 : afr = 0;
705 2 : printf(" n/a");
706 42 : } else if (devinfo->info[INFO_ROTATION_RATE] == 0) {
707 : /* if SSD, skip AFR estimation as data is from not SSD disks */
708 1 : afr = 0;
709 1 : printf(" SSD");
710 : } else {
711 41 : afr = smart_afr(devinfo);
712 :
713 41 : if (afr == 0) {
714 : /* this happens only if no data */
715 1 : printf(" -");
716 : } else {
717 : /* use only the disks in the array */
718 40 : if (devinfo->parent != 0 || !have_parent)
719 40 : array_failure_rate += afr;
720 :
721 40 : printf("%4.0f%%", poisson_prob_at_least_one_failure(afr) * 100);
722 : }
723 : }
724 :
725 44 : if (devinfo->smart[SMART_WEAR_LEVEL].raw != SMART_UNASSIGNED) {
726 31 : printf(" %3" PRIu64 "%%", devinfo->smart[SMART_WEAR_LEVEL].raw);
727 : } else {
728 13 : printf(" -");
729 : }
730 :
731 44 : if (devinfo->info[INFO_SIZE] != SMART_UNASSIGNED)
732 44 : printf(" %4.1f", devinfo->info[INFO_SIZE] / 1E12);
733 : else
734 0 : printf(" -");
735 :
736 44 : printf(" ");
737 44 : if (*devinfo->serial)
738 44 : printl(devinfo->serial, serial_pad);
739 : else
740 0 : printl("-", serial_pad);
741 :
742 44 : printf(" ");
743 44 : if (*devinfo->file)
744 44 : printl(devinfo->file, device_pad);
745 : else
746 0 : printl("-", device_pad);
747 :
748 44 : printf(" ");
749 44 : if (*devinfo->name)
750 44 : printf("%s", devinfo->name);
751 : else
752 0 : printf("-");
753 :
754 44 : printf("\n");
755 :
756 44 : state_info_log(devinfo);
757 44 : state_smart_log(devinfo, afr);
758 : }
759 :
760 2 : printf("\n");
761 :
762 : /* |<##################################################################72>|####80>| */
763 2 : printf("The FP column is the estimated probability (in percentage) that the disk\n");
764 2 : printf("is going to fail in the next year.\n");
765 2 : printf("\n");
766 :
767 : /*
768 : * The probability of one and of at least one failure is computed assuming
769 : * a Poisson distribution with the estimated array failure rate.
770 : */
771 2 : p_at_least_one_failure = poisson_prob_at_least_one_failure(array_failure_rate);
772 :
773 2 : printf("Probability that at least one disk is going to fail in the next year is %.0f%%.\n", p_at_least_one_failure * 100);
774 2 : log_tag("summary:array_failure:%g:%g\n", array_failure_rate, p_at_least_one_failure);
775 :
776 : /* print extra stats only in verbose mode */
777 2 : if (msg_level < MSG_VERBOSE)
778 1 : goto bail;
779 :
780 : /* |<##################################################################72>|####80>| */
781 1 : printf("\n");
782 1 : printf("Probability of data loss in the next year for different parity and\n");
783 1 : printf("combined scrub and repair time:\n");
784 1 : printf("\n");
785 1 : printf(" Parity 1 Week 1 Month 3 Months\n");
786 1 : printf(" -----------------------------------------------------------------------\n");
787 7 : for (j = 0; j < RAID_PARITY_MAX; ++j) {
788 6 : printf("%6u", j + 1);
789 6 : printf(" ");
790 6 : printp(raid_prob_of_one_or_more_failures(array_failure_rate, 365.0 / 7, n, j + 1) * 100, 19);
791 6 : printf(" ");
792 6 : printp(raid_prob_of_one_or_more_failures(array_failure_rate, 365.0 / 30, n, j + 1) * 100, 17);
793 6 : printf(" ");
794 6 : printp(raid_prob_of_one_or_more_failures(array_failure_rate, 365.0 / 90, n, j + 1) * 100, 13);
795 6 : printf("\n");
796 : }
797 :
798 1 : printf("\n");
799 :
800 : /* |<##################################################################72>|####80>| */
801 1 : printf("These values are the probabilities that in the next year you'll have a\n");
802 1 : printf("sequence of failures from which the parity won't be able to recover,\n");
803 1 : printf("assuming that you regularly scrub and repair the array (as needed)\n");
804 1 : printf("within the specified time.\n");
805 :
806 2 : bail:
807 2 : if (make_it_fail) {
808 1 : printf("\n");
809 1 : printf("DANGER! SMART is reporting that one or more disks are FAILING!\n");
810 1 : printf("Please take immediate action!\n");
811 1 : exit(EXIT_FAILURE);
812 : }
813 1 : }
814 :
815 2417 : void state_attr(struct snapraid_state* state, tommy_list* low)
816 : {
817 : tommy_node* i;
818 :
819 : (void)state;
820 :
821 74909 : for (i = tommy_list_head(low); i != 0; i = i->next) {
822 72492 : devinfo_t* devinfo = i->data;
823 :
824 72492 : state_smart_ignore(state, devinfo);
825 :
826 72492 : double afr = smart_afr(devinfo);
827 :
828 72492 : state_info_log(devinfo);
829 72492 : state_smart_log(devinfo, afr);
830 : }
831 2417 : }
832 :
833 4 : static void state_probe_report(struct snapraid_state* state, tommy_list* low)
834 : {
835 : tommy_node* i;
836 : size_t device_pad;
837 :
838 : (void)state;
839 :
840 : /* compute lengths for padding */
841 4 : device_pad = 0;
842 92 : for (i = tommy_list_head(low); i != 0; i = i->next) {
843 : size_t len;
844 88 : devinfo_t* devinfo = i->data;
845 :
846 88 : state_smart_ignore(state, devinfo);
847 :
848 88 : len = strlen(devinfo->file);
849 88 : if (len > device_pad)
850 4 : device_pad = len;
851 :
852 88 : double afr = smart_afr(devinfo);
853 :
854 88 : state_info_log(devinfo);
855 88 : state_smart_log(devinfo, afr);
856 : }
857 :
858 4 : printf("SnapRAID PROBE report:\n");
859 4 : printf("\n");
860 4 : printf(" State ");
861 4 : printf(" ");
862 4 : printl("Device", device_pad);
863 4 : printf(" Disk");
864 4 : printf("\n");
865 : /* |<##################################################################72>|####80>| */
866 4 : printf(" -----------------------------------------------------------------------\n");
867 :
868 92 : for (i = tommy_list_head(low); i != 0; i = i->next) {
869 88 : devinfo_t* devinfo = i->data;
870 :
871 88 : printf(" ");
872 :
873 88 : switch (devinfo->power) {
874 12 : case POWER_STANDBY : printf("StandBy"); break;
875 76 : case POWER_ACTIVE : printf(" Active"); break;
876 0 : default : printf("Unknown"); break;
877 : }
878 :
879 88 : printf(" ");
880 88 : if (*devinfo->file)
881 88 : printl(devinfo->file, device_pad);
882 : else
883 0 : printl("-", device_pad);
884 :
885 88 : printf(" ");
886 88 : if (*devinfo->name)
887 88 : printf("%s", devinfo->name);
888 : else
889 0 : printf("-");
890 :
891 88 : printf("\n");
892 :
893 88 : log_tag("probe:%s:%s:%d\n", devinfo->file, devinfo->name, devinfo->power);
894 : }
895 :
896 4 : printf("\n");
897 4 : }
898 :
899 11 : static void state_stat(struct snapraid_state* state, tommy_list* high)
900 : {
901 : tommy_node* i;
902 :
903 : (void)state;
904 :
905 : /* compute lengths for padding */
906 223 : for (i = tommy_list_head(high); i != 0; i = i->next) {
907 212 : devinfo_t* devinfo = i->data;
908 :
909 : /* print disk access_stat (not split) */
910 212 : if (devinfo->split == 0 && devinfo->access_stat != 0) {
911 104 : if (devinfo->name[0])
912 104 : log_tag("stat:%s:%" PRIu64 "\n", devinfo->name, devinfo->access_stat);
913 : }
914 : }
915 11 : }
916 :
917 2 : static void state_devices(struct snapraid_state* state, tommy_list* low)
918 : {
919 : tommy_node* i;
920 :
921 : (void)state;
922 :
923 46 : for (i = tommy_list_head(low); i != 0; i = i->next) {
924 44 : devinfo_t* devinfo = i->data;
925 44 : devinfo_t* parent = devinfo->parent;
926 :
927 44 : if (parent) {
928 : #ifdef _WIN32
929 : printf("%" PRIu64 "\t%s\t%08" PRIx64 "\t%s\t%s\n", devinfo->device, devinfo->wfile, parent->device, parent->wfile, parent->name);
930 : #else
931 44 : printf("%u:%u\t%s\t%u:%u\t%s\t%s\n", major(devinfo->device), minor(devinfo->device), devinfo->file, major(parent->device), minor(parent->device), parent->file, parent->name);
932 : #endif
933 : }
934 : }
935 2 : }
936 :
937 2419 : int devtest(tommy_list* high, tommy_list* low, int operation)
938 : {
939 : tommy_node* i;
940 : unsigned count;
941 :
942 2419 : if (operation != DEVICE_SMART && operation != DEVICE_PROBE)
943 0 : return -1;
944 :
945 : /* for each device add some fake data */
946 2419 : count = 0;
947 74989 : for (i = tommy_list_head(high); i != 0; i = i->next) {
948 72570 : devinfo_t* devinfo = i->data;
949 : devinfo_t* entry;
950 : int j;
951 :
952 72570 : ++count;
953 :
954 72570 : entry = calloc_nofail(1, sizeof(devinfo_t));
955 :
956 : /* fake device number */
957 72570 : entry->device = tommy_strhash_u32(0, devinfo->name);
958 :
959 72570 : tommy_list_insert_tail(low, &entry->node, entry);
960 :
961 18650490 : for (j = 0; j < 256; ++j) {
962 18577920 : switch (count) {
963 0 : case 0 :
964 0 : entry->smart[j].raw = 0;
965 0 : break;
966 619264 : case 1 :
967 619264 : entry->smart[j].raw = SMART_UNASSIGNED;
968 619264 : break;
969 17958656 : default :
970 17958656 : entry->smart[j].raw = 0;
971 17958656 : break;
972 : }
973 : }
974 :
975 72570 : pathprint(entry->serial, sizeof(entry->serial), "FAKE_%s", devinfo->serial);
976 72570 : pathprint(entry->family, sizeof(entry->family), "FAKE_%s", devinfo->family);
977 72570 : pathprint(entry->model, sizeof(entry->model), "FAKE_%s", devinfo->model);
978 72570 : pathprint(entry->interf, sizeof(entry->interf), "FAKE_%s", devinfo->interf);
979 72570 : pathprint(entry->file, sizeof(entry->file), "FAKE_%s", devinfo->file);
980 72570 : pathcpy(entry->name, sizeof(entry->name), devinfo->name);
981 72570 : entry->info[INFO_SIZE] = count * TERA;
982 72570 : entry->info[INFO_ROTATION_RATE] = 7200;
983 72570 : entry->smart[SMART_ERROR_MEDIUM].raw = 0;
984 72570 : entry->smart[SMART_ERROR_PROTOCOL].raw = 0;
985 72570 : entry->smart[SMART_FLAGS].raw = SMART_UNASSIGNED;
986 72570 : entry->smart[SMART_TEMPERATURE_CELSIUS].raw = 27;
987 :
988 72570 : switch (count) {
989 2419 : case 3 : entry->smart[SMART_ERROR_PROTOCOL].raw = 1; break;
990 2419 : case 4 : entry->smart[SMART_FLAGS].raw = SMARTCTL_FLAG_UNSUPPORTED; break;
991 2419 : case 5 : entry->smart[SMART_FLAGS].raw = SMARTCTL_FLAG_COMMAND; break;
992 2419 : case 6 : entry->smart[SMART_FLAGS].raw = SMARTCTL_FLAG_OPEN; break;
993 2419 : case 7 : entry->smart[SMART_FLAGS].raw = SMARTCTL_FLAG_FAIL; break;
994 2419 : case 8 : entry->smart[SMART_FLAGS].raw = SMARTCTL_FLAG_PREFAIL; break;
995 2419 : case 9 : entry->smart[SMART_FLAGS].raw = SMARTCTL_FLAG_PREFAIL_LOGGED; break;
996 2419 : case 10 : entry->smart[SMART_FLAGS].raw = SMARTCTL_FLAG_ERROR_LOGGED; break;
997 2419 : case 11 : entry->smart[SMART_FLAGS].raw = SMARTCTL_FLAG_SELFERROR_LOGGED; break;
998 : }
999 :
1000 72570 : entry->power = POWER_ACTIVE;
1001 : }
1002 :
1003 2419 : return 0;
1004 : }
1005 :
1006 13 : void state_device(struct snapraid_state* state, int operation, tommy_list* filterlist_disk)
1007 : {
1008 : tommy_node* i;
1009 : unsigned j;
1010 : tommy_list high;
1011 : tommy_list low;
1012 : int ret;
1013 13 : time_t now = time(0);
1014 :
1015 : /* map device if not already done */
1016 13 : if (!state->mapped_device) {
1017 13 : devmap();
1018 13 : state->mapped_device = 1;
1019 : }
1020 :
1021 13 : switch (operation) {
1022 2 : case DEVICE_UP : msg_progress("Spinup...\n"); break;
1023 2 : case DEVICE_DOWN : msg_progress("Spindown...\n"); break;
1024 : }
1025 :
1026 13 : tommy_list_init(&high);
1027 13 : tommy_list_init(&low);
1028 :
1029 : /* for all disks */
1030 119 : for (i = state->disklist; i != 0; i = i->next) {
1031 106 : struct snapraid_disk* disk = i->data;
1032 : devinfo_t* entry;
1033 :
1034 106 : if (filterlist_disk != 0 && filter_path(filterlist_disk, 0, disk->name, 0) != 0)
1035 5 : continue;
1036 :
1037 101 : entry = calloc_nofail(1, sizeof(devinfo_t));
1038 :
1039 101 : entry->device = disk->mount_device;
1040 101 : device_name_set(entry, disk->name, 0);
1041 101 : pathcpy(entry->mount, sizeof(entry->mount), disk->dir);
1042 101 : pathcpy(entry->smartctl, sizeof(entry->smartctl), disk->smartctl);
1043 101 : memcpy(entry->smartignore, disk->smartignore, sizeof(entry->smartignore));
1044 :
1045 101 : tommy_list_insert_tail(&high, &entry->node, entry);
1046 : }
1047 :
1048 : /* for all parities */
1049 63 : for (j = 0; j < state->level; ++j) {
1050 : devinfo_t* entry;
1051 : devinfo_t* split;
1052 : unsigned s;
1053 :
1054 50 : if (filterlist_disk != 0 && filter_path(filterlist_disk, 0, lev_config_name(j), 0) != 0)
1055 5 : continue;
1056 :
1057 183 : for (s = 0; s < state->parity[j].split_mac; ++s) {
1058 138 : entry = calloc_nofail(1, sizeof(devinfo_t));
1059 :
1060 : /* keep track of the first split */
1061 138 : if (s == 0)
1062 45 : split = entry;
1063 : else
1064 93 : entry->split = split;
1065 :
1066 138 : entry->device = state->parity[j].split_map[s].device;
1067 138 : device_name_set(entry, lev_config_name(j), s);
1068 138 : pathcpy(entry->mount, sizeof(entry->mount), state->parity[j].split_map[s].path);
1069 138 : pathcpy(entry->smartctl, sizeof(entry->smartctl), state->parity[j].smartctl);
1070 138 : memcpy(entry->smartignore, state->parity[j].smartignore, sizeof(entry->smartignore));
1071 138 : pathcut(entry->mount); /* remove the parity file */
1072 :
1073 138 : tommy_list_insert_tail(&high, &entry->node, entry);
1074 : }
1075 : }
1076 :
1077 : /* extra disks are never spundown or spunup */
1078 13 : int include_extra = 1;
1079 13 : switch (operation) {
1080 5 : case DEVICE_UP :
1081 : case DEVICE_DOWN :
1082 : case DEVICE_DOWNIFUP :
1083 5 : include_extra = 0;
1084 5 : break;
1085 : }
1086 13 : if (include_extra) {
1087 : /* for all extra disks */
1088 16 : for (i = state->extralist; i != 0; i = i->next) {
1089 8 : struct snapraid_extra* extra = i->data;
1090 : devinfo_t* entry;
1091 :
1092 8 : if (filterlist_disk != 0 && filter_path(filterlist_disk, 0, extra->name, 0) != 0)
1093 0 : continue;
1094 :
1095 8 : entry = calloc_nofail(1, sizeof(devinfo_t));
1096 :
1097 8 : entry->device = extra->device;
1098 8 : device_name_set(entry, extra->name, 0);
1099 8 : pathcpy(entry->mount, sizeof(entry->mount), extra->dir);
1100 8 : pathcpy(entry->smartctl, sizeof(entry->smartctl), extra->smartctl);
1101 8 : memcpy(entry->smartignore, extra->smartignore, sizeof(extra->smartignore));
1102 :
1103 8 : tommy_list_insert_tail(&high, &entry->node, entry);
1104 : }
1105 : }
1106 :
1107 : /* with a GUI always gives time reference */
1108 13 : if (state->opt.gui)
1109 3 : log_tag("unixtime:%" PRIi64 "\n", (int64_t)now);
1110 :
1111 13 : if (state->opt.fake_device) {
1112 3 : ret = devtest(&high, &low, operation);
1113 : } else {
1114 10 : ret = devquery(&high, &low, operation);
1115 : }
1116 :
1117 : /* if the list is empty, it's not supported in this platform */
1118 13 : if (ret == 0 && tommy_list_empty(&low))
1119 0 : ret = -1;
1120 :
1121 13 : if (ret != 0) {
1122 2 : const char* ope = 0;
1123 2 : switch (operation) {
1124 1 : case DEVICE_UP : ope = "Spinup"; break;
1125 1 : case DEVICE_DOWN : ope = "Spindown"; break;
1126 0 : case DEVICE_LIST : ope = "Device listing"; break;
1127 0 : case DEVICE_SMART : ope = "Smart"; break;
1128 0 : case DEVICE_PROBE : ope = "Probe"; break;
1129 0 : case DEVICE_DOWNIFUP : ope = "Spindown"; break;
1130 : }
1131 2 : log_fatal(ESOFT, "%s is unsupported in this platform.\n", ope);
1132 : } else {
1133 11 : state_stat(state, &high);
1134 :
1135 11 : if (operation == DEVICE_SMART)
1136 2 : state_smart(state, state->level + tommy_list_count(&state->disklist), &low);
1137 :
1138 10 : if (operation == DEVICE_PROBE)
1139 4 : state_probe_report(state, &low);
1140 :
1141 10 : if (operation == DEVICE_UP)
1142 1 : state_attr(state, &low);
1143 :
1144 10 : if (operation == DEVICE_LIST)
1145 2 : state_devices(state, &low);
1146 : }
1147 :
1148 12 : tommy_list_foreach(&high, free);
1149 12 : tommy_list_foreach(&low, free);
1150 12 : }
1151 :
|