Deleted Added
full compact
geom_bsd.c (107832) geom_bsd.c (107953)
1/*-
2 * Copyright (c) 2002 Poul-Henning Kamp
3 * Copyright (c) 2002 Networks Associates Technology, Inc.
4 * All rights reserved.
5 *
6 * This software was developed for the FreeBSD Project by Poul-Henning Kamp
7 * and NAI Labs, the Security Research Division of Network Associates, Inc.
8 * under DARPA/SPAWAR contract N66001-01-C-8035 ("CBOSS"), as part of the
9 * DARPA CHATS research program.
10 *
11 * Redistribution and use in source and binary forms, with or without
12 * modification, are permitted provided that the following conditions
13 * are met:
14 * 1. Redistributions of source code must retain the above copyright
15 * notice, this list of conditions and the following disclaimer.
16 * 2. Redistributions in binary form must reproduce the above copyright
17 * notice, this list of conditions and the following disclaimer in the
18 * documentation and/or other materials provided with the distribution.
19 * 3. The names of the authors may not be used to endorse or promote
20 * products derived from this software without specific prior written
21 * permission.
22 *
23 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
24 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
25 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
26 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
27 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
28 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
29 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
30 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
31 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
32 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
33 * SUCH DAMAGE.
34 *
1/*-
2 * Copyright (c) 2002 Poul-Henning Kamp
3 * Copyright (c) 2002 Networks Associates Technology, Inc.
4 * All rights reserved.
5 *
6 * This software was developed for the FreeBSD Project by Poul-Henning Kamp
7 * and NAI Labs, the Security Research Division of Network Associates, Inc.
8 * under DARPA/SPAWAR contract N66001-01-C-8035 ("CBOSS"), as part of the
9 * DARPA CHATS research program.
10 *
11 * Redistribution and use in source and binary forms, with or without
12 * modification, are permitted provided that the following conditions
13 * are met:
14 * 1. Redistributions of source code must retain the above copyright
15 * notice, this list of conditions and the following disclaimer.
16 * 2. Redistributions in binary form must reproduce the above copyright
17 * notice, this list of conditions and the following disclaimer in the
18 * documentation and/or other materials provided with the distribution.
19 * 3. The names of the authors may not be used to endorse or promote
20 * products derived from this software without specific prior written
21 * permission.
22 *
23 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
24 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
25 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
26 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
27 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
28 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
29 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
30 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
31 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
32 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
33 * SUCH DAMAGE.
34 *
35 * $FreeBSD: head/sys/geom/geom_bsd.c 107832 2002-12-13 21:31:13Z phk $
35 * $FreeBSD: head/sys/geom/geom_bsd.c 107953 2002-12-16 22:33:27Z phk $
36 *
37 * This is the method for dealing with BSD disklabels. It has been
38 * extensively (by my standards at least) commented, in the vain hope that
39 * it will server as the source in future copy&paste operations.
40 */
41
42#include <sys/param.h>
43#ifndef _KERNEL
44#include <stdio.h>
45#include <string.h>
46#include <stdlib.h>
47#include <signal.h>
48#include <err.h>
49#else
50#include <sys/systm.h>
51#include <sys/kernel.h>
52#include <sys/conf.h>
53#include <sys/bio.h>
54#include <sys/malloc.h>
55#include <sys/lock.h>
56#include <sys/mutex.h>
57#endif
58#include <sys/stdint.h>
59#include <sys/errno.h>
60#include <sys/disklabel.h>
61#include <geom/geom.h>
62#include <geom/geom_slice.h>
63
64#define BSD_CLASS_NAME "BSD"
65
66#define ALPHA_LABEL_OFFSET 64
67
68/*
69 * Our private data about one instance. All the rest is handled by the
70 * slice code and stored in its softc, so this is just the stuff
71 * specific to BSD disklabels.
72 */
73struct g_bsd_softc {
74 off_t labeloffset;
75 off_t mbroffset;
76 off_t rawoffset;
77 struct disklabel ondisk;
78 struct disklabel inram;
79};
80
81/*
82 * The next 4 functions isolate us from how the compiler lays out and pads
83 * "struct disklabel". We treat what we read from disk as a bytestream and
84 * explicitly convert it into a struct disklabel. This makes us compiler-
85 * endianness- and wordsize- agnostic.
86 * For now we only have little-endian formats to deal with.
87 */
88
89static void
90g_bsd_ledec_partition(u_char *ptr, struct partition *d)
91{
92 d->p_size = g_dec_le4(ptr + 0);
93 d->p_offset = g_dec_le4(ptr + 4);
94 d->p_fsize = g_dec_le4(ptr + 8);
95 d->p_fstype = ptr[12];
96 d->p_frag = ptr[13];
97 d->p_cpg = g_dec_le2(ptr + 14);
98}
99
100static void
101g_bsd_ledec_disklabel(u_char *ptr, struct disklabel *d)
102{
103 int i;
104
105 d->d_magic = g_dec_le4(ptr + 0);
106 d->d_type = g_dec_le2(ptr + 4);
107 d->d_subtype = g_dec_le2(ptr + 6);
108 bcopy(ptr + 8, d->d_typename, 16);
109 bcopy(ptr + 24, d->d_packname, 16);
110 d->d_secsize = g_dec_le4(ptr + 40);
111 d->d_nsectors = g_dec_le4(ptr + 44);
112 d->d_ntracks = g_dec_le4(ptr + 48);
113 d->d_ncylinders = g_dec_le4(ptr + 52);
114 d->d_secpercyl = g_dec_le4(ptr + 56);
115 d->d_secperunit = g_dec_le4(ptr + 60);
116 d->d_sparespertrack = g_dec_le2(ptr + 64);
117 d->d_sparespercyl = g_dec_le2(ptr + 66);
118 d->d_acylinders = g_dec_le4(ptr + 68);
119 d->d_rpm = g_dec_le2(ptr + 72);
120 d->d_interleave = g_dec_le2(ptr + 74);
121 d->d_trackskew = g_dec_le2(ptr + 76);
122 d->d_cylskew = g_dec_le2(ptr + 78);
123 d->d_headswitch = g_dec_le4(ptr + 80);
124 d->d_trkseek = g_dec_le4(ptr + 84);
125 d->d_flags = g_dec_le4(ptr + 88);
126 d->d_drivedata[0] = g_dec_le4(ptr + 92);
127 d->d_drivedata[1] = g_dec_le4(ptr + 96);
128 d->d_drivedata[2] = g_dec_le4(ptr + 100);
129 d->d_drivedata[3] = g_dec_le4(ptr + 104);
130 d->d_drivedata[4] = g_dec_le4(ptr + 108);
131 d->d_spare[0] = g_dec_le4(ptr + 112);
132 d->d_spare[1] = g_dec_le4(ptr + 116);
133 d->d_spare[2] = g_dec_le4(ptr + 120);
134 d->d_spare[3] = g_dec_le4(ptr + 124);
135 d->d_spare[4] = g_dec_le4(ptr + 128);
136 d->d_magic2 = g_dec_le4(ptr + 132);
137 d->d_checksum = g_dec_le2(ptr + 136);
138 d->d_npartitions = g_dec_le2(ptr + 138);
139 d->d_bbsize = g_dec_le4(ptr + 140);
140 d->d_sbsize = g_dec_le4(ptr + 144);
141 for (i = 0; i < MAXPARTITIONS; i++)
142 g_bsd_ledec_partition(ptr + 148 + 16 * i, &d->d_partitions[i]);
143}
144
145static void
146g_bsd_leenc_partition(u_char *ptr, struct partition *d)
147{
148 g_enc_le4(ptr + 0, d->p_size);
149 g_enc_le4(ptr + 4, d->p_offset);
150 g_enc_le4(ptr + 8, d->p_fsize);
151 ptr[12] = d->p_fstype;
152 ptr[13] = d->p_frag;
153 g_enc_le2(ptr + 14, d->p_cpg);
154}
155
156static void
157g_bsd_leenc_disklabel(u_char *ptr, struct disklabel *d)
158{
159 int i;
160
161 g_enc_le4(ptr + 0, d->d_magic);
162 g_enc_le2(ptr + 4, d->d_type);
163 g_enc_le2(ptr + 6, d->d_subtype);
164 bcopy(d->d_typename, ptr + 8, 16);
165 bcopy(d->d_packname, ptr + 24, 16);
166 g_enc_le4(ptr + 40, d->d_secsize);
167 g_enc_le4(ptr + 44, d->d_nsectors);
168 g_enc_le4(ptr + 48, d->d_ntracks);
169 g_enc_le4(ptr + 52, d->d_ncylinders);
170 g_enc_le4(ptr + 56, d->d_secpercyl);
171 g_enc_le4(ptr + 60, d->d_secperunit);
172 g_enc_le2(ptr + 64, d->d_sparespertrack);
173 g_enc_le2(ptr + 66, d->d_sparespercyl);
174 g_enc_le4(ptr + 68, d->d_acylinders);
175 g_enc_le2(ptr + 72, d->d_rpm);
176 g_enc_le2(ptr + 74, d->d_interleave);
177 g_enc_le2(ptr + 76, d->d_trackskew);
178 g_enc_le2(ptr + 78, d->d_cylskew);
179 g_enc_le4(ptr + 80, d->d_headswitch);
180 g_enc_le4(ptr + 84, d->d_trkseek);
181 g_enc_le4(ptr + 88, d->d_flags);
182 g_enc_le4(ptr + 92, d->d_drivedata[0]);
183 g_enc_le4(ptr + 96, d->d_drivedata[1]);
184 g_enc_le4(ptr + 100, d->d_drivedata[2]);
185 g_enc_le4(ptr + 104, d->d_drivedata[3]);
186 g_enc_le4(ptr + 108, d->d_drivedata[4]);
187 g_enc_le4(ptr + 112, d->d_spare[0]);
188 g_enc_le4(ptr + 116, d->d_spare[1]);
189 g_enc_le4(ptr + 120, d->d_spare[2]);
190 g_enc_le4(ptr + 124, d->d_spare[3]);
191 g_enc_le4(ptr + 128, d->d_spare[4]);
192 g_enc_le4(ptr + 132, d->d_magic2);
193 g_enc_le2(ptr + 136, d->d_checksum);
194 g_enc_le2(ptr + 138, d->d_npartitions);
195 g_enc_le4(ptr + 140, d->d_bbsize);
196 g_enc_le4(ptr + 144, d->d_sbsize);
197 for (i = 0; i < MAXPARTITIONS; i++)
198 g_bsd_leenc_partition(ptr + 148 + 16 * i, &d->d_partitions[i]);
199}
200
201static int
202g_bsd_ondisk_size(void)
203{
204 return (148 + 16 * MAXPARTITIONS);
205}
206
207/*
208 * For reasons which were valid and just in their days, FreeBSD/i386 uses
209 * absolute disk-addresses in disklabels. The way it works is that the
210 * p_offset field of all partitions have the first sector number of the
211 * disk slice added to them. This was hidden kernel-magic, userland did
212 * not see these offsets. These two functions subtract and add them
213 * while converting from the "ondisk" to the "inram" labels and vice
214 * versa.
215 */
216static void
217ondisk2inram(struct g_bsd_softc *sc)
218{
219 struct partition *ppp;
220 struct disklabel *dl;
221 int i;
222
223 sc->inram = sc->ondisk;
224 dl = &sc->inram;
225
226 /* Basic sanity-check needed to avoid mistakes. */
227 if (dl->d_magic != DISKMAGIC || dl->d_magic2 != DISKMAGIC)
228 return;
229 if (dl->d_npartitions > MAXPARTITIONS)
230 return;
231
232 sc->rawoffset = dl->d_partitions[RAW_PART].p_offset;
233 for (i = 0; i < dl->d_npartitions; i++) {
234 ppp = &dl->d_partitions[i];
235 if (ppp->p_size != 0 && ppp->p_offset < sc->rawoffset)
236 sc->rawoffset = 0;
237 }
238 if (sc->rawoffset > 0) {
239 for (i = 0; i < dl->d_npartitions; i++) {
240 ppp = &dl->d_partitions[i];
241 if (ppp->p_offset != 0)
242 ppp->p_offset -= sc->rawoffset;
243 }
244 }
245 dl->d_checksum = 0;
246 dl->d_checksum = dkcksum(&sc->inram);
247}
248
249static void
250inram2ondisk(struct g_bsd_softc *sc)
251{
252 struct partition *ppp;
253 int i;
254
255 sc->ondisk = sc->inram;
256 if (sc->mbroffset != 0)
257 sc->rawoffset = sc->mbroffset / sc->inram.d_secsize;
258 if (sc->rawoffset != 0) {
259 for (i = 0; i < sc->inram.d_npartitions; i++) {
260 ppp = &sc->ondisk.d_partitions[i];
261 if (ppp->p_size > 0)
262 ppp->p_offset += sc->rawoffset;
263 else
264 ppp->p_offset = 0;
265 }
266 }
267 sc->ondisk.d_checksum = 0;
268 sc->ondisk.d_checksum = dkcksum(&sc->ondisk);
269}
270
271/*
272 * Check that this looks like a valid disklabel, but be prepared
273 * to get any kind of junk. The checksum must be checked only
274 * after this function returns success to prevent a bogus d_npartitions
275 * value from tripping us up.
276 */
277static int
278g_bsd_checklabel(struct disklabel *dl)
279{
280 struct partition *ppp;
281 int i;
282
283 if (dl->d_magic != DISKMAGIC || dl->d_magic2 != DISKMAGIC)
284 return (EINVAL);
285 /*
286 * If the label specifies more partitions than we can handle
287 * we have to reject it: If people updated the label they would
288 * trash it, and that would break the checksum.
289 */
290 if (dl->d_npartitions > MAXPARTITIONS)
291 return (EINVAL);
292
293 for (i = 0; i < dl->d_npartitions; i++) {
294 ppp = &dl->d_partitions[i];
295 /* Cannot extend past unit. */
296 if (ppp->p_size != 0 &&
297 ppp->p_offset + ppp->p_size > dl->d_secperunit) {
298 return (EINVAL);
299 }
300 }
301 return (0);
302}
303
304/*
305 * Modify our slicer to match proposed disklabel, if possible.
306 * First carry out all the simple checks, then lock topology
307 * and check that no open providers are affected negatively
308 * then carry out all the changes.
309 *
310 * NB: Returns with topology held only if successful return.
311 */
312static int
313g_bsd_modify(struct g_geom *gp, struct disklabel *dl)
314{
315 int i, error;
316 struct partition *ppp;
317 struct g_slicer *gsp;
318 struct g_consumer *cp;
36 *
37 * This is the method for dealing with BSD disklabels. It has been
38 * extensively (by my standards at least) commented, in the vain hope that
39 * it will server as the source in future copy&paste operations.
40 */
41
42#include <sys/param.h>
43#ifndef _KERNEL
44#include <stdio.h>
45#include <string.h>
46#include <stdlib.h>
47#include <signal.h>
48#include <err.h>
49#else
50#include <sys/systm.h>
51#include <sys/kernel.h>
52#include <sys/conf.h>
53#include <sys/bio.h>
54#include <sys/malloc.h>
55#include <sys/lock.h>
56#include <sys/mutex.h>
57#endif
58#include <sys/stdint.h>
59#include <sys/errno.h>
60#include <sys/disklabel.h>
61#include <geom/geom.h>
62#include <geom/geom_slice.h>
63
64#define BSD_CLASS_NAME "BSD"
65
66#define ALPHA_LABEL_OFFSET 64
67
68/*
69 * Our private data about one instance. All the rest is handled by the
70 * slice code and stored in its softc, so this is just the stuff
71 * specific to BSD disklabels.
72 */
73struct g_bsd_softc {
74 off_t labeloffset;
75 off_t mbroffset;
76 off_t rawoffset;
77 struct disklabel ondisk;
78 struct disklabel inram;
79};
80
81/*
82 * The next 4 functions isolate us from how the compiler lays out and pads
83 * "struct disklabel". We treat what we read from disk as a bytestream and
84 * explicitly convert it into a struct disklabel. This makes us compiler-
85 * endianness- and wordsize- agnostic.
86 * For now we only have little-endian formats to deal with.
87 */
88
89static void
90g_bsd_ledec_partition(u_char *ptr, struct partition *d)
91{
92 d->p_size = g_dec_le4(ptr + 0);
93 d->p_offset = g_dec_le4(ptr + 4);
94 d->p_fsize = g_dec_le4(ptr + 8);
95 d->p_fstype = ptr[12];
96 d->p_frag = ptr[13];
97 d->p_cpg = g_dec_le2(ptr + 14);
98}
99
100static void
101g_bsd_ledec_disklabel(u_char *ptr, struct disklabel *d)
102{
103 int i;
104
105 d->d_magic = g_dec_le4(ptr + 0);
106 d->d_type = g_dec_le2(ptr + 4);
107 d->d_subtype = g_dec_le2(ptr + 6);
108 bcopy(ptr + 8, d->d_typename, 16);
109 bcopy(ptr + 24, d->d_packname, 16);
110 d->d_secsize = g_dec_le4(ptr + 40);
111 d->d_nsectors = g_dec_le4(ptr + 44);
112 d->d_ntracks = g_dec_le4(ptr + 48);
113 d->d_ncylinders = g_dec_le4(ptr + 52);
114 d->d_secpercyl = g_dec_le4(ptr + 56);
115 d->d_secperunit = g_dec_le4(ptr + 60);
116 d->d_sparespertrack = g_dec_le2(ptr + 64);
117 d->d_sparespercyl = g_dec_le2(ptr + 66);
118 d->d_acylinders = g_dec_le4(ptr + 68);
119 d->d_rpm = g_dec_le2(ptr + 72);
120 d->d_interleave = g_dec_le2(ptr + 74);
121 d->d_trackskew = g_dec_le2(ptr + 76);
122 d->d_cylskew = g_dec_le2(ptr + 78);
123 d->d_headswitch = g_dec_le4(ptr + 80);
124 d->d_trkseek = g_dec_le4(ptr + 84);
125 d->d_flags = g_dec_le4(ptr + 88);
126 d->d_drivedata[0] = g_dec_le4(ptr + 92);
127 d->d_drivedata[1] = g_dec_le4(ptr + 96);
128 d->d_drivedata[2] = g_dec_le4(ptr + 100);
129 d->d_drivedata[3] = g_dec_le4(ptr + 104);
130 d->d_drivedata[4] = g_dec_le4(ptr + 108);
131 d->d_spare[0] = g_dec_le4(ptr + 112);
132 d->d_spare[1] = g_dec_le4(ptr + 116);
133 d->d_spare[2] = g_dec_le4(ptr + 120);
134 d->d_spare[3] = g_dec_le4(ptr + 124);
135 d->d_spare[4] = g_dec_le4(ptr + 128);
136 d->d_magic2 = g_dec_le4(ptr + 132);
137 d->d_checksum = g_dec_le2(ptr + 136);
138 d->d_npartitions = g_dec_le2(ptr + 138);
139 d->d_bbsize = g_dec_le4(ptr + 140);
140 d->d_sbsize = g_dec_le4(ptr + 144);
141 for (i = 0; i < MAXPARTITIONS; i++)
142 g_bsd_ledec_partition(ptr + 148 + 16 * i, &d->d_partitions[i]);
143}
144
145static void
146g_bsd_leenc_partition(u_char *ptr, struct partition *d)
147{
148 g_enc_le4(ptr + 0, d->p_size);
149 g_enc_le4(ptr + 4, d->p_offset);
150 g_enc_le4(ptr + 8, d->p_fsize);
151 ptr[12] = d->p_fstype;
152 ptr[13] = d->p_frag;
153 g_enc_le2(ptr + 14, d->p_cpg);
154}
155
156static void
157g_bsd_leenc_disklabel(u_char *ptr, struct disklabel *d)
158{
159 int i;
160
161 g_enc_le4(ptr + 0, d->d_magic);
162 g_enc_le2(ptr + 4, d->d_type);
163 g_enc_le2(ptr + 6, d->d_subtype);
164 bcopy(d->d_typename, ptr + 8, 16);
165 bcopy(d->d_packname, ptr + 24, 16);
166 g_enc_le4(ptr + 40, d->d_secsize);
167 g_enc_le4(ptr + 44, d->d_nsectors);
168 g_enc_le4(ptr + 48, d->d_ntracks);
169 g_enc_le4(ptr + 52, d->d_ncylinders);
170 g_enc_le4(ptr + 56, d->d_secpercyl);
171 g_enc_le4(ptr + 60, d->d_secperunit);
172 g_enc_le2(ptr + 64, d->d_sparespertrack);
173 g_enc_le2(ptr + 66, d->d_sparespercyl);
174 g_enc_le4(ptr + 68, d->d_acylinders);
175 g_enc_le2(ptr + 72, d->d_rpm);
176 g_enc_le2(ptr + 74, d->d_interleave);
177 g_enc_le2(ptr + 76, d->d_trackskew);
178 g_enc_le2(ptr + 78, d->d_cylskew);
179 g_enc_le4(ptr + 80, d->d_headswitch);
180 g_enc_le4(ptr + 84, d->d_trkseek);
181 g_enc_le4(ptr + 88, d->d_flags);
182 g_enc_le4(ptr + 92, d->d_drivedata[0]);
183 g_enc_le4(ptr + 96, d->d_drivedata[1]);
184 g_enc_le4(ptr + 100, d->d_drivedata[2]);
185 g_enc_le4(ptr + 104, d->d_drivedata[3]);
186 g_enc_le4(ptr + 108, d->d_drivedata[4]);
187 g_enc_le4(ptr + 112, d->d_spare[0]);
188 g_enc_le4(ptr + 116, d->d_spare[1]);
189 g_enc_le4(ptr + 120, d->d_spare[2]);
190 g_enc_le4(ptr + 124, d->d_spare[3]);
191 g_enc_le4(ptr + 128, d->d_spare[4]);
192 g_enc_le4(ptr + 132, d->d_magic2);
193 g_enc_le2(ptr + 136, d->d_checksum);
194 g_enc_le2(ptr + 138, d->d_npartitions);
195 g_enc_le4(ptr + 140, d->d_bbsize);
196 g_enc_le4(ptr + 144, d->d_sbsize);
197 for (i = 0; i < MAXPARTITIONS; i++)
198 g_bsd_leenc_partition(ptr + 148 + 16 * i, &d->d_partitions[i]);
199}
200
201static int
202g_bsd_ondisk_size(void)
203{
204 return (148 + 16 * MAXPARTITIONS);
205}
206
207/*
208 * For reasons which were valid and just in their days, FreeBSD/i386 uses
209 * absolute disk-addresses in disklabels. The way it works is that the
210 * p_offset field of all partitions have the first sector number of the
211 * disk slice added to them. This was hidden kernel-magic, userland did
212 * not see these offsets. These two functions subtract and add them
213 * while converting from the "ondisk" to the "inram" labels and vice
214 * versa.
215 */
216static void
217ondisk2inram(struct g_bsd_softc *sc)
218{
219 struct partition *ppp;
220 struct disklabel *dl;
221 int i;
222
223 sc->inram = sc->ondisk;
224 dl = &sc->inram;
225
226 /* Basic sanity-check needed to avoid mistakes. */
227 if (dl->d_magic != DISKMAGIC || dl->d_magic2 != DISKMAGIC)
228 return;
229 if (dl->d_npartitions > MAXPARTITIONS)
230 return;
231
232 sc->rawoffset = dl->d_partitions[RAW_PART].p_offset;
233 for (i = 0; i < dl->d_npartitions; i++) {
234 ppp = &dl->d_partitions[i];
235 if (ppp->p_size != 0 && ppp->p_offset < sc->rawoffset)
236 sc->rawoffset = 0;
237 }
238 if (sc->rawoffset > 0) {
239 for (i = 0; i < dl->d_npartitions; i++) {
240 ppp = &dl->d_partitions[i];
241 if (ppp->p_offset != 0)
242 ppp->p_offset -= sc->rawoffset;
243 }
244 }
245 dl->d_checksum = 0;
246 dl->d_checksum = dkcksum(&sc->inram);
247}
248
249static void
250inram2ondisk(struct g_bsd_softc *sc)
251{
252 struct partition *ppp;
253 int i;
254
255 sc->ondisk = sc->inram;
256 if (sc->mbroffset != 0)
257 sc->rawoffset = sc->mbroffset / sc->inram.d_secsize;
258 if (sc->rawoffset != 0) {
259 for (i = 0; i < sc->inram.d_npartitions; i++) {
260 ppp = &sc->ondisk.d_partitions[i];
261 if (ppp->p_size > 0)
262 ppp->p_offset += sc->rawoffset;
263 else
264 ppp->p_offset = 0;
265 }
266 }
267 sc->ondisk.d_checksum = 0;
268 sc->ondisk.d_checksum = dkcksum(&sc->ondisk);
269}
270
271/*
272 * Check that this looks like a valid disklabel, but be prepared
273 * to get any kind of junk. The checksum must be checked only
274 * after this function returns success to prevent a bogus d_npartitions
275 * value from tripping us up.
276 */
277static int
278g_bsd_checklabel(struct disklabel *dl)
279{
280 struct partition *ppp;
281 int i;
282
283 if (dl->d_magic != DISKMAGIC || dl->d_magic2 != DISKMAGIC)
284 return (EINVAL);
285 /*
286 * If the label specifies more partitions than we can handle
287 * we have to reject it: If people updated the label they would
288 * trash it, and that would break the checksum.
289 */
290 if (dl->d_npartitions > MAXPARTITIONS)
291 return (EINVAL);
292
293 for (i = 0; i < dl->d_npartitions; i++) {
294 ppp = &dl->d_partitions[i];
295 /* Cannot extend past unit. */
296 if (ppp->p_size != 0 &&
297 ppp->p_offset + ppp->p_size > dl->d_secperunit) {
298 return (EINVAL);
299 }
300 }
301 return (0);
302}
303
304/*
305 * Modify our slicer to match proposed disklabel, if possible.
306 * First carry out all the simple checks, then lock topology
307 * and check that no open providers are affected negatively
308 * then carry out all the changes.
309 *
310 * NB: Returns with topology held only if successful return.
311 */
312static int
313g_bsd_modify(struct g_geom *gp, struct disklabel *dl)
314{
315 int i, error;
316 struct partition *ppp;
317 struct g_slicer *gsp;
318 struct g_consumer *cp;
319 u_int secsize;
319 u_int secsize, u;
320 off_t mediasize;
321
322 /* Basic check that this is indeed a disklabel. */
323 error = g_bsd_checklabel(dl);
324 if (error)
325 return (error);
326
327 /* Make sure the checksum is OK. */
328 if (dkcksum(dl) != 0)
329 return (EINVAL);
330
331 /* Get dimensions of our device. */
332 cp = LIST_FIRST(&gp->consumer);
333 secsize = cp->provider->sectorsize;
334 mediasize = cp->provider->mediasize;
335
336#ifdef nolonger
337 /*
338 * The raw-partition must start at zero. We do not check that the
339 * size == mediasize because this is overly restrictive. We have
340 * already tested in g_bsd_checklabel() that it is not longer.
341 * XXX: RAW_PART is archaic anyway, and we should drop it.
342 */
343 if (dl->d_partitions[RAW_PART].p_offset != 0)
344 return (EINVAL);
345#endif
346
347#ifdef notyet
348 /*
349 * Indications are that the d_secperunit is not correctly
350 * initialized in many cases, and since we don't need it
351 * for anything, we dont strictly need this test.
352 * Preemptive action to avoid confusing people in disklabel(8)
353 * may be in order.
354 */
355 /* The label cannot claim a larger size than the media. */
356 if ((off_t)dl->d_secperunit * dl->d_secsize > mediasize)
357 return (EINVAL);
358#endif
359
360
361 /* ... or a smaller sector size. */
362 if (dl->d_secsize < secsize)
363 return (EINVAL);
364
365 /* ... or a non-multiple sector size. */
366 if (dl->d_secsize % secsize != 0)
367 return (EINVAL);
368
369 g_topology_lock();
370
371 /* Don't munge open partitions. */
372 gsp = gp->softc;
373 for (i = 0; i < dl->d_npartitions; i++) {
374 ppp = &dl->d_partitions[i];
375
376 error = g_slice_config(gp, i, G_SLICE_CONFIG_CHECK,
377 (off_t)ppp->p_offset * dl->d_secsize,
378 (off_t)ppp->p_size * dl->d_secsize,
379 dl->d_secsize,
380 "%s%c", gp->name, 'a' + i);
381 if (error) {
382 g_topology_unlock();
383 return (error);
384 }
385 }
386
387 /* Look good, go for it... */
320 off_t mediasize;
321
322 /* Basic check that this is indeed a disklabel. */
323 error = g_bsd_checklabel(dl);
324 if (error)
325 return (error);
326
327 /* Make sure the checksum is OK. */
328 if (dkcksum(dl) != 0)
329 return (EINVAL);
330
331 /* Get dimensions of our device. */
332 cp = LIST_FIRST(&gp->consumer);
333 secsize = cp->provider->sectorsize;
334 mediasize = cp->provider->mediasize;
335
336#ifdef nolonger
337 /*
338 * The raw-partition must start at zero. We do not check that the
339 * size == mediasize because this is overly restrictive. We have
340 * already tested in g_bsd_checklabel() that it is not longer.
341 * XXX: RAW_PART is archaic anyway, and we should drop it.
342 */
343 if (dl->d_partitions[RAW_PART].p_offset != 0)
344 return (EINVAL);
345#endif
346
347#ifdef notyet
348 /*
349 * Indications are that the d_secperunit is not correctly
350 * initialized in many cases, and since we don't need it
351 * for anything, we dont strictly need this test.
352 * Preemptive action to avoid confusing people in disklabel(8)
353 * may be in order.
354 */
355 /* The label cannot claim a larger size than the media. */
356 if ((off_t)dl->d_secperunit * dl->d_secsize > mediasize)
357 return (EINVAL);
358#endif
359
360
361 /* ... or a smaller sector size. */
362 if (dl->d_secsize < secsize)
363 return (EINVAL);
364
365 /* ... or a non-multiple sector size. */
366 if (dl->d_secsize % secsize != 0)
367 return (EINVAL);
368
369 g_topology_lock();
370
371 /* Don't munge open partitions. */
372 gsp = gp->softc;
373 for (i = 0; i < dl->d_npartitions; i++) {
374 ppp = &dl->d_partitions[i];
375
376 error = g_slice_config(gp, i, G_SLICE_CONFIG_CHECK,
377 (off_t)ppp->p_offset * dl->d_secsize,
378 (off_t)ppp->p_size * dl->d_secsize,
379 dl->d_secsize,
380 "%s%c", gp->name, 'a' + i);
381 if (error) {
382 g_topology_unlock();
383 return (error);
384 }
385 }
386
387 /* Look good, go for it... */
388 for (i = 0; i < gsp->nslice; i++) {
389 ppp = &dl->d_partitions[i];
390 g_slice_config(gp, i, G_SLICE_CONFIG_SET,
388 for (u = 0; u < gsp->nslice; u++) {
389 ppp = &dl->d_partitions[u];
390 g_slice_config(gp, u, G_SLICE_CONFIG_SET,
391 (off_t)ppp->p_offset * dl->d_secsize,
392 (off_t)ppp->p_size * dl->d_secsize,
393 dl->d_secsize,
391 (off_t)ppp->p_offset * dl->d_secsize,
392 (off_t)ppp->p_size * dl->d_secsize,
393 dl->d_secsize,
394 "%s%c", gp->name, 'a' + i);
394 "%s%c", gp->name, 'a' + u);
395 }
396 return (0);
397}
398
399/*
400 * Calculate a disklabel checksum for a little-endian byte-stream.
401 * We need access to the decoded disklabel because the checksum only
402 * covers the partition data for the first d_npartitions.
403 */
404static int
405g_bsd_lesum(struct disklabel *dl, u_char *p)
406{
407 u_char *pe;
408 uint16_t sum;
409
410 pe = p + 148 + 16 * dl->d_npartitions;
411 sum = 0;
412 while (p < pe) {
413 sum ^= g_dec_le2(p);
414 p += 2;
415 }
416 return (sum);
417}
418
419/*
420 * This is an internal helper function, called multiple times from the taste
421 * function to try to locate a disklabel on the disk. More civilized formats
422 * will not need this, as there is only one possible place on disk to look
423 * for the magic spot.
424 */
425
426static int
427g_bsd_try(struct g_geom *gp, struct g_slicer *gsp, struct g_consumer *cp, int secsize, struct g_bsd_softc *ms, off_t offset)
428{
429 int error;
430 u_char *buf;
431 struct disklabel *dl;
432 off_t secoff;
433
434 /*
435 * We need to read entire aligned sectors, and we assume that the
436 * disklabel does not span sectors, so one sector is enough.
437 */
438 error = 0;
439 secoff = offset % secsize;
440 buf = g_read_data(cp, offset - secoff, secsize, &error);
441 if (buf == NULL || error != 0)
442 return (ENOENT);
443
444 /* Decode into our native format. */
445 dl = &ms->ondisk;
446 g_bsd_ledec_disklabel(buf + secoff, dl);
447
448 ondisk2inram(ms);
449
450 dl = &ms->inram;
451 /* Does it look like a label at all? */
452 if (g_bsd_checklabel(dl))
453 error = ENOENT;
454 /* ... and does the raw data have a good checksum? */
455 if (error == 0 && g_bsd_lesum(dl, buf + secoff) != 0)
456 error = ENOENT;
457
458 /* Remember to free the buffer g_read_data() gave us. */
459 g_free(buf);
460
461 /* If we had a label, record it properly. */
462 if (error == 0) {
463 gsp->frontstuff = 16 * secsize; /* XXX */
464 ms->labeloffset = offset;
465 g_topology_lock();
466 g_slice_conf_hot(gp, 0, offset, g_bsd_ondisk_size());
467 g_topology_unlock();
468 }
469 return (error);
470}
471
472/*
473 * Implement certain ioctls to modify disklabels with. This function
474 * is called by the event handler thread with topology locked as result
475 * of the g_call_me() in g_bsd_start(). It is not necessary to keep
476 * topology locked all the time but make sure to return with topology
477 * locked as well.
478 */
479
480static void
481g_bsd_ioctl(void *arg)
482{
483 struct bio *bp;
484 struct g_geom *gp;
485 struct g_slicer *gsp;
486 struct g_bsd_softc *ms;
487 struct disklabel *dl;
488 struct g_ioctl *gio;
489 struct g_consumer *cp;
490 u_char *buf;
491 off_t secoff;
492 u_int secsize;
493 int error, i;
494 uint64_t sum;
495
496 /* We don't need topology for now. */
497 g_topology_unlock();
498
499 /* Get hold of the interesting bits from the bio. */
500 bp = arg;
501 gp = bp->bio_to->geom;
502 gsp = gp->softc;
503 ms = gsp->softc;
504 gio = (struct g_ioctl *)bp->bio_data;
505
506 /* The disklabel to set is the ioctl argument. */
507 dl = gio->data;
508
509 /* Validate and modify our slice instance to match. */
510 error = g_bsd_modify(gp, dl); /* Picks up topology lock on success. */
511 if (error) {
512 g_topology_lock();
513 g_io_deliver(bp, error);
514 return;
515 }
516 /* Update our copy of the disklabel. */
517 ms->inram = *dl;
518 inram2ondisk(ms);
519
520 if (gio->cmd == DIOCSDINFO) {
521 g_io_deliver(bp, 0);
522 return;
523 }
524 KASSERT(gio->cmd == DIOCWDINFO, ("Unknown ioctl in g_bsd_ioctl"));
525 cp = LIST_FIRST(&gp->consumer);
526 /* Get sector size, we need it to read data. */
527 secsize = cp->provider->sectorsize;
528 secoff = ms->labeloffset % secsize;
529 buf = g_read_data(cp, ms->labeloffset - secoff, secsize, &error);
530 if (buf == NULL || error != 0) {
531 g_io_deliver(bp, error);
532 return;
533 }
534 dl = &ms->ondisk;
535 g_bsd_leenc_disklabel(buf + secoff, dl);
536 if (ms->labeloffset == ALPHA_LABEL_OFFSET) {
537 sum = 0;
538 for (i = 0; i < 63; i++)
539 sum += g_dec_le8(buf + i * 8);
540 g_enc_le8(buf + 504, sum);
541 }
542 error = g_write_data(cp, ms->labeloffset - secoff, buf, secsize);
543 g_free(buf);
544 g_io_deliver(bp, error);
545}
546
547/*
548 * If the user tries to overwrite our disklabel through an open partition
549 * or via a magicwrite config call, we end up here and try to prevent
550 * footshooting as best we can.
551 */
552static void
553g_bsd_hotwrite(void *arg)
554{
555 struct bio *bp;
556 struct g_geom *gp;
557 struct g_slicer *gsp;
558 struct g_slice *gsl;
559 struct g_bsd_softc *ms;
560 struct g_bsd_softc fake;
561 u_char *p;
562 int error;
563
564 bp = arg;
565 gp = bp->bio_to->geom;
566 gsp = gp->softc;
567 ms = gsp->softc;
568 gsl = &gsp->slices[bp->bio_to->index];
395 }
396 return (0);
397}
398
399/*
400 * Calculate a disklabel checksum for a little-endian byte-stream.
401 * We need access to the decoded disklabel because the checksum only
402 * covers the partition data for the first d_npartitions.
403 */
404static int
405g_bsd_lesum(struct disklabel *dl, u_char *p)
406{
407 u_char *pe;
408 uint16_t sum;
409
410 pe = p + 148 + 16 * dl->d_npartitions;
411 sum = 0;
412 while (p < pe) {
413 sum ^= g_dec_le2(p);
414 p += 2;
415 }
416 return (sum);
417}
418
419/*
420 * This is an internal helper function, called multiple times from the taste
421 * function to try to locate a disklabel on the disk. More civilized formats
422 * will not need this, as there is only one possible place on disk to look
423 * for the magic spot.
424 */
425
426static int
427g_bsd_try(struct g_geom *gp, struct g_slicer *gsp, struct g_consumer *cp, int secsize, struct g_bsd_softc *ms, off_t offset)
428{
429 int error;
430 u_char *buf;
431 struct disklabel *dl;
432 off_t secoff;
433
434 /*
435 * We need to read entire aligned sectors, and we assume that the
436 * disklabel does not span sectors, so one sector is enough.
437 */
438 error = 0;
439 secoff = offset % secsize;
440 buf = g_read_data(cp, offset - secoff, secsize, &error);
441 if (buf == NULL || error != 0)
442 return (ENOENT);
443
444 /* Decode into our native format. */
445 dl = &ms->ondisk;
446 g_bsd_ledec_disklabel(buf + secoff, dl);
447
448 ondisk2inram(ms);
449
450 dl = &ms->inram;
451 /* Does it look like a label at all? */
452 if (g_bsd_checklabel(dl))
453 error = ENOENT;
454 /* ... and does the raw data have a good checksum? */
455 if (error == 0 && g_bsd_lesum(dl, buf + secoff) != 0)
456 error = ENOENT;
457
458 /* Remember to free the buffer g_read_data() gave us. */
459 g_free(buf);
460
461 /* If we had a label, record it properly. */
462 if (error == 0) {
463 gsp->frontstuff = 16 * secsize; /* XXX */
464 ms->labeloffset = offset;
465 g_topology_lock();
466 g_slice_conf_hot(gp, 0, offset, g_bsd_ondisk_size());
467 g_topology_unlock();
468 }
469 return (error);
470}
471
472/*
473 * Implement certain ioctls to modify disklabels with. This function
474 * is called by the event handler thread with topology locked as result
475 * of the g_call_me() in g_bsd_start(). It is not necessary to keep
476 * topology locked all the time but make sure to return with topology
477 * locked as well.
478 */
479
480static void
481g_bsd_ioctl(void *arg)
482{
483 struct bio *bp;
484 struct g_geom *gp;
485 struct g_slicer *gsp;
486 struct g_bsd_softc *ms;
487 struct disklabel *dl;
488 struct g_ioctl *gio;
489 struct g_consumer *cp;
490 u_char *buf;
491 off_t secoff;
492 u_int secsize;
493 int error, i;
494 uint64_t sum;
495
496 /* We don't need topology for now. */
497 g_topology_unlock();
498
499 /* Get hold of the interesting bits from the bio. */
500 bp = arg;
501 gp = bp->bio_to->geom;
502 gsp = gp->softc;
503 ms = gsp->softc;
504 gio = (struct g_ioctl *)bp->bio_data;
505
506 /* The disklabel to set is the ioctl argument. */
507 dl = gio->data;
508
509 /* Validate and modify our slice instance to match. */
510 error = g_bsd_modify(gp, dl); /* Picks up topology lock on success. */
511 if (error) {
512 g_topology_lock();
513 g_io_deliver(bp, error);
514 return;
515 }
516 /* Update our copy of the disklabel. */
517 ms->inram = *dl;
518 inram2ondisk(ms);
519
520 if (gio->cmd == DIOCSDINFO) {
521 g_io_deliver(bp, 0);
522 return;
523 }
524 KASSERT(gio->cmd == DIOCWDINFO, ("Unknown ioctl in g_bsd_ioctl"));
525 cp = LIST_FIRST(&gp->consumer);
526 /* Get sector size, we need it to read data. */
527 secsize = cp->provider->sectorsize;
528 secoff = ms->labeloffset % secsize;
529 buf = g_read_data(cp, ms->labeloffset - secoff, secsize, &error);
530 if (buf == NULL || error != 0) {
531 g_io_deliver(bp, error);
532 return;
533 }
534 dl = &ms->ondisk;
535 g_bsd_leenc_disklabel(buf + secoff, dl);
536 if (ms->labeloffset == ALPHA_LABEL_OFFSET) {
537 sum = 0;
538 for (i = 0; i < 63; i++)
539 sum += g_dec_le8(buf + i * 8);
540 g_enc_le8(buf + 504, sum);
541 }
542 error = g_write_data(cp, ms->labeloffset - secoff, buf, secsize);
543 g_free(buf);
544 g_io_deliver(bp, error);
545}
546
547/*
548 * If the user tries to overwrite our disklabel through an open partition
549 * or via a magicwrite config call, we end up here and try to prevent
550 * footshooting as best we can.
551 */
552static void
553g_bsd_hotwrite(void *arg)
554{
555 struct bio *bp;
556 struct g_geom *gp;
557 struct g_slicer *gsp;
558 struct g_slice *gsl;
559 struct g_bsd_softc *ms;
560 struct g_bsd_softc fake;
561 u_char *p;
562 int error;
563
564 bp = arg;
565 gp = bp->bio_to->geom;
566 gsp = gp->softc;
567 ms = gsp->softc;
568 gsl = &gsp->slices[bp->bio_to->index];
569 p = bp->bio_data + ms->labeloffset
569 p = (u_char*)bp->bio_data + ms->labeloffset
570 - (bp->bio_offset + gsl->offset);
571 g_bsd_ledec_disklabel(p, &fake.ondisk);
572
573 ondisk2inram(&fake);
574 if (g_bsd_checklabel(&fake.inram)) {
575 g_io_deliver(bp, EPERM);
576 return;
577 }
578 if (g_bsd_lesum(&fake.ondisk, p) != 0) {
579 g_io_deliver(bp, EPERM);
580 return;
581 }
582 g_topology_unlock();
583 error = g_bsd_modify(gp, &fake.inram); /* May pick up topology. */
584 if (error) {
585 g_io_deliver(bp, EPERM);
586 g_topology_lock();
587 return;
588 }
589 /* Update our copy of the disklabel. */
590 ms->inram = fake.inram;
591 inram2ondisk(ms);
592 g_bsd_leenc_disklabel(p, &ms->ondisk);
593 g_slice_finish_hot(bp);
594}
595
596/*-
597 * This start routine is only called for non-trivial requests, all the
598 * trivial ones are handled autonomously by the slice code.
599 * For requests we handle here, we must call the g_io_deliver() on the
600 * bio, and return non-zero to indicate to the slice code that we did so.
601 * This code executes in the "DOWN" I/O path, this means:
602 * * No sleeping.
603 * * Don't grab the topology lock.
604 * * Don't call biowait, g_getattr(), g_setattr() or g_read_data()
605 */
606
607static int
608g_bsd_start(struct bio *bp)
609{
610 struct g_geom *gp;
611 struct g_bsd_softc *ms;
612 struct g_slicer *gsp;
613 struct g_ioctl *gio;
614 int error;
615
616 gp = bp->bio_to->geom;
617 gsp = gp->softc;
618 ms = gsp->softc;
619 switch(bp->bio_cmd) {
620 case BIO_READ:
621 /* We allow reading of our hot spots */
622 return (0);
623 case BIO_DELETE:
624 /* We do not allow deleting our hot spots */
625 return (EPERM);
626 case BIO_WRITE:
627 g_call_me(g_bsd_hotwrite, bp);
628 return (EJUSTRETURN);
629 case BIO_GETATTR:
630 case BIO_SETATTR:
631 break;
632 default:
633 KASSERT(0 == 1, ("Unknown bio_cmd in g_bsd_start (%d)",
634 bp->bio_cmd));
635 }
636
637 /* We only handle ioctl(2) requests of the right format. */
638 if (strcmp(bp->bio_attribute, "GEOM::ioctl"))
639 return (0);
640 else if (bp->bio_length != sizeof(*gio))
641 return (0);
642
643 /* Get hold of the ioctl parameters. */
644 gio = (struct g_ioctl *)bp->bio_data;
645
646 switch (gio->cmd) {
647 case DIOCGDINFO:
648 /* Return a copy of the disklabel to userland. */
649 bcopy(&ms->inram, gio->data, sizeof(ms->inram));
650 g_io_deliver(bp, 0);
651 return (1);
652 case DIOCSDINFO:
653 case DIOCWDINFO:
654 /*
655 * These we cannot do without the topology lock and some
656 * some I/O requests. Ask the event-handler to schedule
657 * us in a less restricted environment.
658 */
659 error = g_call_me(g_bsd_ioctl, bp);
660 if (error)
661 g_io_deliver(bp, error);
662 /*
663 * We must return non-zero to indicate that we will deal
664 * with this bio, even though we have not done so yet.
665 */
666 return (1);
667 default:
668 return (0);
669 }
670}
671
672/*
673 * Dump configuration information in XML format.
674 * Notice that the function is called once for the geom and once for each
675 * consumer and provider. We let g_slice_dumpconf() do most of the work.
676 */
677static void
570 - (bp->bio_offset + gsl->offset);
571 g_bsd_ledec_disklabel(p, &fake.ondisk);
572
573 ondisk2inram(&fake);
574 if (g_bsd_checklabel(&fake.inram)) {
575 g_io_deliver(bp, EPERM);
576 return;
577 }
578 if (g_bsd_lesum(&fake.ondisk, p) != 0) {
579 g_io_deliver(bp, EPERM);
580 return;
581 }
582 g_topology_unlock();
583 error = g_bsd_modify(gp, &fake.inram); /* May pick up topology. */
584 if (error) {
585 g_io_deliver(bp, EPERM);
586 g_topology_lock();
587 return;
588 }
589 /* Update our copy of the disklabel. */
590 ms->inram = fake.inram;
591 inram2ondisk(ms);
592 g_bsd_leenc_disklabel(p, &ms->ondisk);
593 g_slice_finish_hot(bp);
594}
595
596/*-
597 * This start routine is only called for non-trivial requests, all the
598 * trivial ones are handled autonomously by the slice code.
599 * For requests we handle here, we must call the g_io_deliver() on the
600 * bio, and return non-zero to indicate to the slice code that we did so.
601 * This code executes in the "DOWN" I/O path, this means:
602 * * No sleeping.
603 * * Don't grab the topology lock.
604 * * Don't call biowait, g_getattr(), g_setattr() or g_read_data()
605 */
606
607static int
608g_bsd_start(struct bio *bp)
609{
610 struct g_geom *gp;
611 struct g_bsd_softc *ms;
612 struct g_slicer *gsp;
613 struct g_ioctl *gio;
614 int error;
615
616 gp = bp->bio_to->geom;
617 gsp = gp->softc;
618 ms = gsp->softc;
619 switch(bp->bio_cmd) {
620 case BIO_READ:
621 /* We allow reading of our hot spots */
622 return (0);
623 case BIO_DELETE:
624 /* We do not allow deleting our hot spots */
625 return (EPERM);
626 case BIO_WRITE:
627 g_call_me(g_bsd_hotwrite, bp);
628 return (EJUSTRETURN);
629 case BIO_GETATTR:
630 case BIO_SETATTR:
631 break;
632 default:
633 KASSERT(0 == 1, ("Unknown bio_cmd in g_bsd_start (%d)",
634 bp->bio_cmd));
635 }
636
637 /* We only handle ioctl(2) requests of the right format. */
638 if (strcmp(bp->bio_attribute, "GEOM::ioctl"))
639 return (0);
640 else if (bp->bio_length != sizeof(*gio))
641 return (0);
642
643 /* Get hold of the ioctl parameters. */
644 gio = (struct g_ioctl *)bp->bio_data;
645
646 switch (gio->cmd) {
647 case DIOCGDINFO:
648 /* Return a copy of the disklabel to userland. */
649 bcopy(&ms->inram, gio->data, sizeof(ms->inram));
650 g_io_deliver(bp, 0);
651 return (1);
652 case DIOCSDINFO:
653 case DIOCWDINFO:
654 /*
655 * These we cannot do without the topology lock and some
656 * some I/O requests. Ask the event-handler to schedule
657 * us in a less restricted environment.
658 */
659 error = g_call_me(g_bsd_ioctl, bp);
660 if (error)
661 g_io_deliver(bp, error);
662 /*
663 * We must return non-zero to indicate that we will deal
664 * with this bio, even though we have not done so yet.
665 */
666 return (1);
667 default:
668 return (0);
669 }
670}
671
672/*
673 * Dump configuration information in XML format.
674 * Notice that the function is called once for the geom and once for each
675 * consumer and provider. We let g_slice_dumpconf() do most of the work.
676 */
677static void
678g_bsd_dumpconf(struct sbuf *sb, char *indent, struct g_geom *gp, struct g_consumer *cp, struct g_provider *pp)
678g_bsd_dumpconf(struct sbuf *sb, const char *indent, struct g_geom *gp, struct g_consumer *cp, struct g_provider *pp)
679{
680 struct g_bsd_softc *ms;
681 struct g_slicer *gsp;
682
683 gsp = gp->softc;
684 ms = gsp->softc;
685 g_slice_dumpconf(sb, indent, gp, cp, pp);
686 if (indent != NULL && pp == NULL && cp == NULL) {
687 sbuf_printf(sb, "%s<labeloffset>%jd</labeloffset>\n",
688 indent, (intmax_t)ms->labeloffset);
689 sbuf_printf(sb, "%s<rawoffset>%jd</rawoffset>\n",
690 indent, (intmax_t)ms->rawoffset);
691 sbuf_printf(sb, "%s<mbroffset>%jd</mbroffset>\n",
692 indent, (intmax_t)ms->mbroffset);
693 }
694}
695
696/*
697 * The taste function is called from the event-handler, with the topology
698 * lock already held and a provider to examine. The flags are unused.
699 *
700 * If flags == G_TF_NORMAL, the idea is to take a bite of the provider and
701 * if we find valid, consistent magic on it, build a geom on it.
702 * any magic bits which indicate that we should automatically put a BSD
703 * geom on it.
704 *
705 * There may be cases where the operator would like to put a BSD-geom on
706 * providers which do not meet all of the requirements. This can be done
707 * by instead passing the G_TF_INSIST flag, which will override these
708 * checks.
709 *
710 * The final flags value is G_TF_TRANSPARENT, which instructs the method
711 * to put a geom on top of the provider and configure it to be as transparent
712 * as possible. This is not really relevant to the BSD method and therefore
713 * not implemented here.
714 */
715
716static struct g_geom *
717g_bsd_taste(struct g_class *mp, struct g_provider *pp, int flags)
718{
719 struct g_geom *gp;
720 struct g_consumer *cp;
721 int error, i;
722 struct g_bsd_softc *ms;
723 struct disklabel *dl;
724 u_int secsize;
725 struct g_slicer *gsp;
726
727 g_trace(G_T_TOPOLOGY, "bsd_taste(%s,%s)", mp->name, pp->name);
728 g_topology_assert();
729
730 /* We don't implement transparent inserts. */
731 if (flags == G_TF_TRANSPARENT)
732 return (NULL);
733
734 /*
735 * The BSD-method will not automatically configure itself recursively
736 * Note that it is legal to examine the class-name of our provider,
737 * nothing else should ever be examined inside the provider.
738 */
739 if (flags == G_TF_NORMAL &&
740 !strcmp(pp->geom->class->name, BSD_CLASS_NAME))
741 return (NULL);
742
743 /*
744 * BSD labels are a subclass of the general "slicing" topology so
745 * a lot of the work can be done by the common "slice" code.
746 * Create a geom with space for MAXPARTITIONS providers, one consumer
747 * and a softc structure for us. Specify the provider to attach
748 * the consumer to and our "start" routine for special requests.
749 * The provider is opened with mode (1,0,0) so we can do reads
750 * from it.
751 */
752 gp = g_slice_new(mp, MAXPARTITIONS, pp, &cp, &ms,
753 sizeof(*ms), g_bsd_start);
754 if (gp == NULL)
755 return (NULL);
756
757 /*
758 * Now that we have attached to and opened our provider, we do
759 * not need the topology lock until we change the topology again
760 * next time.
761 */
762 g_topology_unlock();
763
764 /*
765 * Fill in the optional details, in our case we have a dumpconf
766 * routine which the "slice" code should call at the right time
767 */
768 gp->dumpconf = g_bsd_dumpconf;
769
770 /* Get the geom_slicer softc from the geom. */
771 gsp = gp->softc;
772
773 /*
774 * The do...while loop here allows us to have multiple escapes
775 * using a simple "break". This improves code clarity without
776 * ending up in deep nesting and without using goto or come from.
777 */
778 do {
779 /*
780 * If the provider is an MBR we will only auto attach
781 * to type 165 slices in the G_TF_NORMAL case. We will
782 * attach to any other type (BSD was handles above)
783 */
784 error = g_getattr("MBR::type", cp, &i);
785 if (!error) {
786 if (i != 165 && flags == G_TF_NORMAL)
787 break;
788 error = g_getattr("MBR::offset", cp, &ms->mbroffset);
789 if (error)
790 break;
791 }
792
793 /* Same thing if we are inside a PC98 */
794 error = g_getattr("PC98::type", cp, &i);
795 if (!error) {
796 if (i != 0xc494 && flags == G_TF_NORMAL)
797 break;
798 error = g_getattr("PC98::offset", cp, &ms->mbroffset);
799 if (error)
800 break;
801 }
802
803 /* Get sector size, we need it to read data. */
804 secsize = cp->provider->sectorsize;
805 if (secsize < 512)
806 break;
807
808 /* First look for a label at the start of the second sector. */
809 error = g_bsd_try(gp, gsp, cp, secsize, ms, secsize);
810
811 /* Next, look for alpha labels */
812 if (error)
813 error = g_bsd_try(gp, gsp, cp, secsize, ms,
814 ALPHA_LABEL_OFFSET);
815
816 /* If we didn't find a label, punt. */
817 if (error)
818 break;
819
820 /*
821 * Process the found disklabel, and modify our "slice"
822 * instance to match it, if possible.
823 */
824 dl = &ms->inram;
825 error = g_bsd_modify(gp, dl); /* Picks up topology lock. */
826 if (!error)
827 g_topology_unlock();
828 break;
829 } while (0);
830
831 /* Success of failure, we can close our provider now. */
832 g_topology_lock();
833 error = g_access_rel(cp, -1, 0, 0);
834
835 /* If we have configured any providers, return the new geom. */
836 if (gsp->nprovider > 0)
837 return (gp);
838 /*
839 * ...else push the "self-destruct" button, by spoiling our own
840 * consumer. This triggers a call to g_std_spoiled which will
841 * dismantle what was setup.
842 */
843 g_std_spoiled(cp);
844 return (NULL);
845}
846
847/* Finally, register with GEOM infrastructure. */
848static struct g_class g_bsd_class = {
849 BSD_CLASS_NAME,
850 g_bsd_taste,
851 NULL,
852 G_CLASS_INITIALIZER
853};
854
855DECLARE_GEOM_CLASS(g_bsd_class, g_bsd);
679{
680 struct g_bsd_softc *ms;
681 struct g_slicer *gsp;
682
683 gsp = gp->softc;
684 ms = gsp->softc;
685 g_slice_dumpconf(sb, indent, gp, cp, pp);
686 if (indent != NULL && pp == NULL && cp == NULL) {
687 sbuf_printf(sb, "%s<labeloffset>%jd</labeloffset>\n",
688 indent, (intmax_t)ms->labeloffset);
689 sbuf_printf(sb, "%s<rawoffset>%jd</rawoffset>\n",
690 indent, (intmax_t)ms->rawoffset);
691 sbuf_printf(sb, "%s<mbroffset>%jd</mbroffset>\n",
692 indent, (intmax_t)ms->mbroffset);
693 }
694}
695
696/*
697 * The taste function is called from the event-handler, with the topology
698 * lock already held and a provider to examine. The flags are unused.
699 *
700 * If flags == G_TF_NORMAL, the idea is to take a bite of the provider and
701 * if we find valid, consistent magic on it, build a geom on it.
702 * any magic bits which indicate that we should automatically put a BSD
703 * geom on it.
704 *
705 * There may be cases where the operator would like to put a BSD-geom on
706 * providers which do not meet all of the requirements. This can be done
707 * by instead passing the G_TF_INSIST flag, which will override these
708 * checks.
709 *
710 * The final flags value is G_TF_TRANSPARENT, which instructs the method
711 * to put a geom on top of the provider and configure it to be as transparent
712 * as possible. This is not really relevant to the BSD method and therefore
713 * not implemented here.
714 */
715
716static struct g_geom *
717g_bsd_taste(struct g_class *mp, struct g_provider *pp, int flags)
718{
719 struct g_geom *gp;
720 struct g_consumer *cp;
721 int error, i;
722 struct g_bsd_softc *ms;
723 struct disklabel *dl;
724 u_int secsize;
725 struct g_slicer *gsp;
726
727 g_trace(G_T_TOPOLOGY, "bsd_taste(%s,%s)", mp->name, pp->name);
728 g_topology_assert();
729
730 /* We don't implement transparent inserts. */
731 if (flags == G_TF_TRANSPARENT)
732 return (NULL);
733
734 /*
735 * The BSD-method will not automatically configure itself recursively
736 * Note that it is legal to examine the class-name of our provider,
737 * nothing else should ever be examined inside the provider.
738 */
739 if (flags == G_TF_NORMAL &&
740 !strcmp(pp->geom->class->name, BSD_CLASS_NAME))
741 return (NULL);
742
743 /*
744 * BSD labels are a subclass of the general "slicing" topology so
745 * a lot of the work can be done by the common "slice" code.
746 * Create a geom with space for MAXPARTITIONS providers, one consumer
747 * and a softc structure for us. Specify the provider to attach
748 * the consumer to and our "start" routine for special requests.
749 * The provider is opened with mode (1,0,0) so we can do reads
750 * from it.
751 */
752 gp = g_slice_new(mp, MAXPARTITIONS, pp, &cp, &ms,
753 sizeof(*ms), g_bsd_start);
754 if (gp == NULL)
755 return (NULL);
756
757 /*
758 * Now that we have attached to and opened our provider, we do
759 * not need the topology lock until we change the topology again
760 * next time.
761 */
762 g_topology_unlock();
763
764 /*
765 * Fill in the optional details, in our case we have a dumpconf
766 * routine which the "slice" code should call at the right time
767 */
768 gp->dumpconf = g_bsd_dumpconf;
769
770 /* Get the geom_slicer softc from the geom. */
771 gsp = gp->softc;
772
773 /*
774 * The do...while loop here allows us to have multiple escapes
775 * using a simple "break". This improves code clarity without
776 * ending up in deep nesting and without using goto or come from.
777 */
778 do {
779 /*
780 * If the provider is an MBR we will only auto attach
781 * to type 165 slices in the G_TF_NORMAL case. We will
782 * attach to any other type (BSD was handles above)
783 */
784 error = g_getattr("MBR::type", cp, &i);
785 if (!error) {
786 if (i != 165 && flags == G_TF_NORMAL)
787 break;
788 error = g_getattr("MBR::offset", cp, &ms->mbroffset);
789 if (error)
790 break;
791 }
792
793 /* Same thing if we are inside a PC98 */
794 error = g_getattr("PC98::type", cp, &i);
795 if (!error) {
796 if (i != 0xc494 && flags == G_TF_NORMAL)
797 break;
798 error = g_getattr("PC98::offset", cp, &ms->mbroffset);
799 if (error)
800 break;
801 }
802
803 /* Get sector size, we need it to read data. */
804 secsize = cp->provider->sectorsize;
805 if (secsize < 512)
806 break;
807
808 /* First look for a label at the start of the second sector. */
809 error = g_bsd_try(gp, gsp, cp, secsize, ms, secsize);
810
811 /* Next, look for alpha labels */
812 if (error)
813 error = g_bsd_try(gp, gsp, cp, secsize, ms,
814 ALPHA_LABEL_OFFSET);
815
816 /* If we didn't find a label, punt. */
817 if (error)
818 break;
819
820 /*
821 * Process the found disklabel, and modify our "slice"
822 * instance to match it, if possible.
823 */
824 dl = &ms->inram;
825 error = g_bsd_modify(gp, dl); /* Picks up topology lock. */
826 if (!error)
827 g_topology_unlock();
828 break;
829 } while (0);
830
831 /* Success of failure, we can close our provider now. */
832 g_topology_lock();
833 error = g_access_rel(cp, -1, 0, 0);
834
835 /* If we have configured any providers, return the new geom. */
836 if (gsp->nprovider > 0)
837 return (gp);
838 /*
839 * ...else push the "self-destruct" button, by spoiling our own
840 * consumer. This triggers a call to g_std_spoiled which will
841 * dismantle what was setup.
842 */
843 g_std_spoiled(cp);
844 return (NULL);
845}
846
847/* Finally, register with GEOM infrastructure. */
848static struct g_class g_bsd_class = {
849 BSD_CLASS_NAME,
850 g_bsd_taste,
851 NULL,
852 G_CLASS_INITIALIZER
853};
854
855DECLARE_GEOM_CLASS(g_bsd_class, g_bsd);