author | ek110237 |
Wed, 11 Jul 2007 16:37:00 -0700 | |
changeset 4634 | 39bfb9e90d34 |
parent 4603 | c7840c367d00 |
child 4787 | 602d3f97842c |
permissions | -rw-r--r-- |
789 | 1 |
/* |
2 |
* CDDL HEADER START |
|
3 |
* |
|
4 |
* The contents of this file are subject to the terms of the |
|
1544 | 5 |
* Common Development and Distribution License (the "License"). |
6 |
* You may not use this file except in compliance with the License. |
|
789 | 7 |
* |
8 |
* You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE |
|
9 |
* or http://www.opensolaris.org/os/licensing. |
|
10 |
* See the License for the specific language governing permissions |
|
11 |
* and limitations under the License. |
|
12 |
* |
|
13 |
* When distributing Covered Code, include this CDDL HEADER in each |
|
14 |
* file and include the License file at usr/src/OPENSOLARIS.LICENSE. |
|
15 |
* If applicable, add the following below this CDDL HEADER, with the |
|
16 |
* fields enclosed by brackets "[]" replaced with your own identifying |
|
17 |
* information: Portions Copyright [yyyy] [name of copyright owner] |
|
18 |
* |
|
19 |
* CDDL HEADER END |
|
20 |
*/ |
|
21 |
/* |
|
3547
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
22 |
* Copyright 2007 Sun Microsystems, Inc. All rights reserved. |
789 | 23 |
* Use is subject to license terms. |
24 |
*/ |
|
25 |
||
26 |
#pragma ident "%Z%%M% %I% %E% SMI" |
|
27 |
||
4543 | 28 |
#include <sys/cred.h> |
789 | 29 |
#include <sys/zfs_context.h> |
30 |
#include <sys/dmu_objset.h> |
|
31 |
#include <sys/dsl_dir.h> |
|
32 |
#include <sys/dsl_dataset.h> |
|
33 |
#include <sys/dsl_prop.h> |
|
34 |
#include <sys/dsl_pool.h> |
|
2199 | 35 |
#include <sys/dsl_synctask.h> |
4543 | 36 |
#include <sys/dsl_deleg.h> |
789 | 37 |
#include <sys/dnode.h> |
38 |
#include <sys/dbuf.h> |
|
2885 | 39 |
#include <sys/zvol.h> |
789 | 40 |
#include <sys/dmu_tx.h> |
41 |
#include <sys/zio_checksum.h> |
|
42 |
#include <sys/zap.h> |
|
43 |
#include <sys/zil.h> |
|
44 |
#include <sys/dmu_impl.h> |
|
4543 | 45 |
#include <sys/zfs_ioctl.h> |
789 | 46 |
|
47 |
||
48 |
spa_t * |
|
49 |
dmu_objset_spa(objset_t *os) |
|
50 |
{ |
|
51 |
return (os->os->os_spa); |
|
52 |
} |
|
53 |
||
54 |
zilog_t * |
|
55 |
dmu_objset_zil(objset_t *os) |
|
56 |
{ |
|
57 |
return (os->os->os_zil); |
|
58 |
} |
|
59 |
||
60 |
dsl_pool_t * |
|
61 |
dmu_objset_pool(objset_t *os) |
|
62 |
{ |
|
63 |
dsl_dataset_t *ds; |
|
64 |
||
65 |
if ((ds = os->os->os_dsl_dataset) != NULL && ds->ds_dir) |
|
66 |
return (ds->ds_dir->dd_pool); |
|
67 |
else |
|
68 |
return (spa_get_dsl(os->os->os_spa)); |
|
69 |
} |
|
70 |
||
71 |
dsl_dataset_t * |
|
72 |
dmu_objset_ds(objset_t *os) |
|
73 |
{ |
|
74 |
return (os->os->os_dsl_dataset); |
|
75 |
} |
|
76 |
||
77 |
dmu_objset_type_t |
|
78 |
dmu_objset_type(objset_t *os) |
|
79 |
{ |
|
80 |
return (os->os->os_phys->os_type); |
|
81 |
} |
|
82 |
||
83 |
void |
|
84 |
dmu_objset_name(objset_t *os, char *buf) |
|
85 |
{ |
|
86 |
dsl_dataset_name(os->os->os_dsl_dataset, buf); |
|
87 |
} |
|
88 |
||
89 |
uint64_t |
|
90 |
dmu_objset_id(objset_t *os) |
|
91 |
{ |
|
92 |
dsl_dataset_t *ds = os->os->os_dsl_dataset; |
|
93 |
||
94 |
return (ds ? ds->ds_object : 0); |
|
95 |
} |
|
96 |
||
97 |
static void |
|
98 |
checksum_changed_cb(void *arg, uint64_t newval) |
|
99 |
{ |
|
100 |
objset_impl_t *osi = arg; |
|
101 |
||
102 |
/* |
|
103 |
* Inheritance should have been done by now. |
|
104 |
*/ |
|
105 |
ASSERT(newval != ZIO_CHECKSUM_INHERIT); |
|
106 |
||
107 |
osi->os_checksum = zio_checksum_select(newval, ZIO_CHECKSUM_ON_VALUE); |
|
108 |
} |
|
109 |
||
110 |
static void |
|
111 |
compression_changed_cb(void *arg, uint64_t newval) |
|
112 |
{ |
|
113 |
objset_impl_t *osi = arg; |
|
114 |
||
115 |
/* |
|
116 |
* Inheritance and range checking should have been done by now. |
|
117 |
*/ |
|
118 |
ASSERT(newval != ZIO_COMPRESS_INHERIT); |
|
119 |
||
120 |
osi->os_compress = zio_compress_select(newval, ZIO_COMPRESS_ON_VALUE); |
|
121 |
} |
|
122 |
||
3835 | 123 |
static void |
124 |
copies_changed_cb(void *arg, uint64_t newval) |
|
125 |
{ |
|
126 |
objset_impl_t *osi = arg; |
|
127 |
||
128 |
/* |
|
129 |
* Inheritance and range checking should have been done by now. |
|
130 |
*/ |
|
131 |
ASSERT(newval > 0); |
|
132 |
ASSERT(newval <= spa_max_replication(osi->os_spa)); |
|
133 |
||
134 |
osi->os_copies = newval; |
|
135 |
} |
|
136 |
||
789 | 137 |
void |
138 |
dmu_objset_byteswap(void *buf, size_t size) |
|
139 |
{ |
|
140 |
objset_phys_t *osp = buf; |
|
141 |
||
142 |
ASSERT(size == sizeof (objset_phys_t)); |
|
143 |
dnode_byteswap(&osp->os_meta_dnode); |
|
144 |
byteswap_uint64_array(&osp->os_zil_header, sizeof (zil_header_t)); |
|
145 |
osp->os_type = BSWAP_64(osp->os_type); |
|
146 |
} |
|
147 |
||
1544 | 148 |
int |
149 |
dmu_objset_open_impl(spa_t *spa, dsl_dataset_t *ds, blkptr_t *bp, |
|
150 |
objset_impl_t **osip) |
|
789 | 151 |
{ |
152 |
objset_impl_t *winner, *osi; |
|
153 |
int i, err, checksum; |
|
154 |
||
155 |
osi = kmem_zalloc(sizeof (objset_impl_t), KM_SLEEP); |
|
156 |
osi->os.os = osi; |
|
157 |
osi->os_dsl_dataset = ds; |
|
158 |
osi->os_spa = spa; |
|
3547
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
159 |
osi->os_rootbp = bp; |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
160 |
if (!BP_IS_HOLE(osi->os_rootbp)) { |
2391 | 161 |
uint32_t aflags = ARC_WAIT; |
1544 | 162 |
zbookmark_t zb; |
163 |
zb.zb_objset = ds ? ds->ds_object : 0; |
|
164 |
zb.zb_object = 0; |
|
165 |
zb.zb_level = -1; |
|
166 |
zb.zb_blkid = 0; |
|
167 |
||
3547
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
168 |
dprintf_bp(osi->os_rootbp, "reading %s", ""); |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
169 |
err = arc_read(NULL, spa, osi->os_rootbp, |
789 | 170 |
dmu_ot[DMU_OT_OBJSET].ot_byteswap, |
3547
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
171 |
arc_getbuf_func, &osi->os_phys_buf, |
2391 | 172 |
ZIO_PRIORITY_SYNC_READ, ZIO_FLAG_CANFAIL, &aflags, &zb); |
1544 | 173 |
if (err) { |
174 |
kmem_free(osi, sizeof (objset_impl_t)); |
|
175 |
return (err); |
|
176 |
} |
|
3547
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
177 |
osi->os_phys = osi->os_phys_buf->b_data; |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
178 |
arc_release(osi->os_phys_buf, &osi->os_phys_buf); |
789 | 179 |
} else { |
3547
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
180 |
osi->os_phys_buf = arc_buf_alloc(spa, sizeof (objset_phys_t), |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
181 |
&osi->os_phys_buf, ARC_BUFC_METADATA); |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
182 |
osi->os_phys = osi->os_phys_buf->b_data; |
789 | 183 |
bzero(osi->os_phys, sizeof (objset_phys_t)); |
184 |
} |
|
185 |
||
186 |
/* |
|
187 |
* Note: the changed_cb will be called once before the register |
|
188 |
* func returns, thus changing the checksum/compression from the |
|
2082 | 189 |
* default (fletcher2/off). Snapshots don't need to know, and |
190 |
* registering would complicate clone promotion. |
|
789 | 191 |
*/ |
2082 | 192 |
if (ds && ds->ds_phys->ds_num_children == 0) { |
789 | 193 |
err = dsl_prop_register(ds, "checksum", |
194 |
checksum_changed_cb, osi); |
|
1544 | 195 |
if (err == 0) |
196 |
err = dsl_prop_register(ds, "compression", |
|
197 |
compression_changed_cb, osi); |
|
3835 | 198 |
if (err == 0) |
199 |
err = dsl_prop_register(ds, "copies", |
|
200 |
copies_changed_cb, osi); |
|
1544 | 201 |
if (err) { |
3547
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
202 |
VERIFY(arc_buf_remove_ref(osi->os_phys_buf, |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
203 |
&osi->os_phys_buf) == 1); |
1544 | 204 |
kmem_free(osi, sizeof (objset_impl_t)); |
205 |
return (err); |
|
206 |
} |
|
2082 | 207 |
} else if (ds == NULL) { |
789 | 208 |
/* It's the meta-objset. */ |
209 |
osi->os_checksum = ZIO_CHECKSUM_FLETCHER_4; |
|
1544 | 210 |
osi->os_compress = ZIO_COMPRESS_LZJB; |
3835 | 211 |
osi->os_copies = spa_max_replication(spa); |
789 | 212 |
} |
213 |
||
1544 | 214 |
osi->os_zil = zil_alloc(&osi->os, &osi->os_phys->os_zil_header); |
215 |
||
789 | 216 |
/* |
217 |
* Metadata always gets compressed and checksummed. |
|
218 |
* If the data checksum is multi-bit correctable, and it's not |
|
219 |
* a ZBT-style checksum, then it's suitable for metadata as well. |
|
220 |
* Otherwise, the metadata checksum defaults to fletcher4. |
|
221 |
*/ |
|
222 |
checksum = osi->os_checksum; |
|
223 |
||
224 |
if (zio_checksum_table[checksum].ci_correctable && |
|
225 |
!zio_checksum_table[checksum].ci_zbt) |
|
226 |
osi->os_md_checksum = checksum; |
|
227 |
else |
|
228 |
osi->os_md_checksum = ZIO_CHECKSUM_FLETCHER_4; |
|
1544 | 229 |
osi->os_md_compress = ZIO_COMPRESS_LZJB; |
789 | 230 |
|
231 |
for (i = 0; i < TXG_SIZE; i++) { |
|
232 |
list_create(&osi->os_dirty_dnodes[i], sizeof (dnode_t), |
|
233 |
offsetof(dnode_t, dn_dirty_link[i])); |
|
234 |
list_create(&osi->os_free_dnodes[i], sizeof (dnode_t), |
|
235 |
offsetof(dnode_t, dn_dirty_link[i])); |
|
236 |
} |
|
237 |
list_create(&osi->os_dnodes, sizeof (dnode_t), |
|
238 |
offsetof(dnode_t, dn_link)); |
|
239 |
list_create(&osi->os_downgraded_dbufs, sizeof (dmu_buf_impl_t), |
|
240 |
offsetof(dmu_buf_impl_t, db_link)); |
|
241 |
||
2856 | 242 |
mutex_init(&osi->os_lock, NULL, MUTEX_DEFAULT, NULL); |
243 |
mutex_init(&osi->os_obj_lock, NULL, MUTEX_DEFAULT, NULL); |
|
244 |
||
789 | 245 |
osi->os_meta_dnode = dnode_special_open(osi, |
246 |
&osi->os_phys->os_meta_dnode, DMU_META_DNODE_OBJECT); |
|
247 |
||
248 |
if (ds != NULL) { |
|
249 |
winner = dsl_dataset_set_user_ptr(ds, osi, dmu_objset_evict); |
|
250 |
if (winner) { |
|
251 |
dmu_objset_evict(ds, osi); |
|
252 |
osi = winner; |
|
253 |
} |
|
254 |
} |
|
255 |
||
1544 | 256 |
*osip = osi; |
257 |
return (0); |
|
789 | 258 |
} |
259 |
||
260 |
/* called from zpl */ |
|
261 |
int |
|
262 |
dmu_objset_open(const char *name, dmu_objset_type_t type, int mode, |
|
263 |
objset_t **osp) |
|
264 |
{ |
|
265 |
dsl_dataset_t *ds; |
|
266 |
int err; |
|
267 |
objset_t *os; |
|
268 |
objset_impl_t *osi; |
|
269 |
||
270 |
os = kmem_alloc(sizeof (objset_t), KM_SLEEP); |
|
271 |
err = dsl_dataset_open(name, mode, os, &ds); |
|
272 |
if (err) { |
|
273 |
kmem_free(os, sizeof (objset_t)); |
|
274 |
return (err); |
|
275 |
} |
|
276 |
||
277 |
osi = dsl_dataset_get_user_ptr(ds); |
|
278 |
if (osi == NULL) { |
|
1544 | 279 |
err = dmu_objset_open_impl(dsl_dataset_get_spa(ds), |
3547
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
280 |
ds, &ds->ds_phys->ds_bp, &osi); |
1544 | 281 |
if (err) { |
282 |
dsl_dataset_close(ds, mode, os); |
|
283 |
kmem_free(os, sizeof (objset_t)); |
|
284 |
return (err); |
|
285 |
} |
|
789 | 286 |
} |
287 |
||
288 |
os->os = osi; |
|
289 |
os->os_mode = mode; |
|
290 |
||
291 |
if (type != DMU_OST_ANY && type != os->os->os_phys->os_type) { |
|
292 |
dmu_objset_close(os); |
|
293 |
return (EINVAL); |
|
294 |
} |
|
295 |
*osp = os; |
|
296 |
return (0); |
|
297 |
} |
|
298 |
||
299 |
void |
|
300 |
dmu_objset_close(objset_t *os) |
|
301 |
{ |
|
302 |
dsl_dataset_close(os->os->os_dsl_dataset, os->os_mode, os); |
|
303 |
kmem_free(os, sizeof (objset_t)); |
|
304 |
} |
|
305 |
||
1646
b4e43ae19fff
6393443 Remove remaining txg_wait_synced() from zfs unmount path.
perrin
parents:
1596
diff
changeset
|
306 |
int |
b4e43ae19fff
6393443 Remove remaining txg_wait_synced() from zfs unmount path.
perrin
parents:
1596
diff
changeset
|
307 |
dmu_objset_evict_dbufs(objset_t *os, int try) |
1544 | 308 |
{ |
309 |
objset_impl_t *osi = os->os; |
|
310 |
dnode_t *dn; |
|
1596
2e2377ccbf85
6395371 ASSERT in dmu_tx_count_free: blkid + i < dn->dn_phys->dn_nblkptr
ahrens
parents:
1544
diff
changeset
|
311 |
|
2e2377ccbf85
6395371 ASSERT in dmu_tx_count_free: blkid + i < dn->dn_phys->dn_nblkptr
ahrens
parents:
1544
diff
changeset
|
312 |
mutex_enter(&osi->os_lock); |
2e2377ccbf85
6395371 ASSERT in dmu_tx_count_free: blkid + i < dn->dn_phys->dn_nblkptr
ahrens
parents:
1544
diff
changeset
|
313 |
|
2e2377ccbf85
6395371 ASSERT in dmu_tx_count_free: blkid + i < dn->dn_phys->dn_nblkptr
ahrens
parents:
1544
diff
changeset
|
314 |
/* process the mdn last, since the other dnodes have holds on it */ |
2e2377ccbf85
6395371 ASSERT in dmu_tx_count_free: blkid + i < dn->dn_phys->dn_nblkptr
ahrens
parents:
1544
diff
changeset
|
315 |
list_remove(&osi->os_dnodes, osi->os_meta_dnode); |
2e2377ccbf85
6395371 ASSERT in dmu_tx_count_free: blkid + i < dn->dn_phys->dn_nblkptr
ahrens
parents:
1544
diff
changeset
|
316 |
list_insert_tail(&osi->os_dnodes, osi->os_meta_dnode); |
1544 | 317 |
|
318 |
/* |
|
1596
2e2377ccbf85
6395371 ASSERT in dmu_tx_count_free: blkid + i < dn->dn_phys->dn_nblkptr
ahrens
parents:
1544
diff
changeset
|
319 |
* Find the first dnode with holds. We have to do this dance |
2e2377ccbf85
6395371 ASSERT in dmu_tx_count_free: blkid + i < dn->dn_phys->dn_nblkptr
ahrens
parents:
1544
diff
changeset
|
320 |
* because dnode_add_ref() only works if you already have a |
2e2377ccbf85
6395371 ASSERT in dmu_tx_count_free: blkid + i < dn->dn_phys->dn_nblkptr
ahrens
parents:
1544
diff
changeset
|
321 |
* hold. If there are no holds then it has no dbufs so OK to |
2e2377ccbf85
6395371 ASSERT in dmu_tx_count_free: blkid + i < dn->dn_phys->dn_nblkptr
ahrens
parents:
1544
diff
changeset
|
322 |
* skip. |
1544 | 323 |
*/ |
1596
2e2377ccbf85
6395371 ASSERT in dmu_tx_count_free: blkid + i < dn->dn_phys->dn_nblkptr
ahrens
parents:
1544
diff
changeset
|
324 |
for (dn = list_head(&osi->os_dnodes); |
2e2377ccbf85
6395371 ASSERT in dmu_tx_count_free: blkid + i < dn->dn_phys->dn_nblkptr
ahrens
parents:
1544
diff
changeset
|
325 |
dn && refcount_is_zero(&dn->dn_holds); |
2e2377ccbf85
6395371 ASSERT in dmu_tx_count_free: blkid + i < dn->dn_phys->dn_nblkptr
ahrens
parents:
1544
diff
changeset
|
326 |
dn = list_next(&osi->os_dnodes, dn)) |
2e2377ccbf85
6395371 ASSERT in dmu_tx_count_free: blkid + i < dn->dn_phys->dn_nblkptr
ahrens
parents:
1544
diff
changeset
|
327 |
continue; |
2e2377ccbf85
6395371 ASSERT in dmu_tx_count_free: blkid + i < dn->dn_phys->dn_nblkptr
ahrens
parents:
1544
diff
changeset
|
328 |
if (dn) |
2e2377ccbf85
6395371 ASSERT in dmu_tx_count_free: blkid + i < dn->dn_phys->dn_nblkptr
ahrens
parents:
1544
diff
changeset
|
329 |
dnode_add_ref(dn, FTAG); |
2e2377ccbf85
6395371 ASSERT in dmu_tx_count_free: blkid + i < dn->dn_phys->dn_nblkptr
ahrens
parents:
1544
diff
changeset
|
330 |
|
2e2377ccbf85
6395371 ASSERT in dmu_tx_count_free: blkid + i < dn->dn_phys->dn_nblkptr
ahrens
parents:
1544
diff
changeset
|
331 |
while (dn) { |
2e2377ccbf85
6395371 ASSERT in dmu_tx_count_free: blkid + i < dn->dn_phys->dn_nblkptr
ahrens
parents:
1544
diff
changeset
|
332 |
dnode_t *next_dn = dn; |
2e2377ccbf85
6395371 ASSERT in dmu_tx_count_free: blkid + i < dn->dn_phys->dn_nblkptr
ahrens
parents:
1544
diff
changeset
|
333 |
|
2e2377ccbf85
6395371 ASSERT in dmu_tx_count_free: blkid + i < dn->dn_phys->dn_nblkptr
ahrens
parents:
1544
diff
changeset
|
334 |
do { |
2e2377ccbf85
6395371 ASSERT in dmu_tx_count_free: blkid + i < dn->dn_phys->dn_nblkptr
ahrens
parents:
1544
diff
changeset
|
335 |
next_dn = list_next(&osi->os_dnodes, next_dn); |
2e2377ccbf85
6395371 ASSERT in dmu_tx_count_free: blkid + i < dn->dn_phys->dn_nblkptr
ahrens
parents:
1544
diff
changeset
|
336 |
} while (next_dn && refcount_is_zero(&next_dn->dn_holds)); |
2e2377ccbf85
6395371 ASSERT in dmu_tx_count_free: blkid + i < dn->dn_phys->dn_nblkptr
ahrens
parents:
1544
diff
changeset
|
337 |
if (next_dn) |
2e2377ccbf85
6395371 ASSERT in dmu_tx_count_free: blkid + i < dn->dn_phys->dn_nblkptr
ahrens
parents:
1544
diff
changeset
|
338 |
dnode_add_ref(next_dn, FTAG); |
2e2377ccbf85
6395371 ASSERT in dmu_tx_count_free: blkid + i < dn->dn_phys->dn_nblkptr
ahrens
parents:
1544
diff
changeset
|
339 |
|
2e2377ccbf85
6395371 ASSERT in dmu_tx_count_free: blkid + i < dn->dn_phys->dn_nblkptr
ahrens
parents:
1544
diff
changeset
|
340 |
mutex_exit(&osi->os_lock); |
1646
b4e43ae19fff
6393443 Remove remaining txg_wait_synced() from zfs unmount path.
perrin
parents:
1596
diff
changeset
|
341 |
if (dnode_evict_dbufs(dn, try)) { |
b4e43ae19fff
6393443 Remove remaining txg_wait_synced() from zfs unmount path.
perrin
parents:
1596
diff
changeset
|
342 |
dnode_rele(dn, FTAG); |
b4e43ae19fff
6393443 Remove remaining txg_wait_synced() from zfs unmount path.
perrin
parents:
1596
diff
changeset
|
343 |
if (next_dn) |
b4e43ae19fff
6393443 Remove remaining txg_wait_synced() from zfs unmount path.
perrin
parents:
1596
diff
changeset
|
344 |
dnode_rele(next_dn, FTAG); |
b4e43ae19fff
6393443 Remove remaining txg_wait_synced() from zfs unmount path.
perrin
parents:
1596
diff
changeset
|
345 |
return (1); |
b4e43ae19fff
6393443 Remove remaining txg_wait_synced() from zfs unmount path.
perrin
parents:
1596
diff
changeset
|
346 |
} |
1596
2e2377ccbf85
6395371 ASSERT in dmu_tx_count_free: blkid + i < dn->dn_phys->dn_nblkptr
ahrens
parents:
1544
diff
changeset
|
347 |
dnode_rele(dn, FTAG); |
2e2377ccbf85
6395371 ASSERT in dmu_tx_count_free: blkid + i < dn->dn_phys->dn_nblkptr
ahrens
parents:
1544
diff
changeset
|
348 |
mutex_enter(&osi->os_lock); |
2e2377ccbf85
6395371 ASSERT in dmu_tx_count_free: blkid + i < dn->dn_phys->dn_nblkptr
ahrens
parents:
1544
diff
changeset
|
349 |
dn = next_dn; |
1544 | 350 |
} |
351 |
mutex_exit(&osi->os_lock); |
|
1646
b4e43ae19fff
6393443 Remove remaining txg_wait_synced() from zfs unmount path.
perrin
parents:
1596
diff
changeset
|
352 |
return (0); |
1544 | 353 |
} |
354 |
||
355 |
void |
|
789 | 356 |
dmu_objset_evict(dsl_dataset_t *ds, void *arg) |
357 |
{ |
|
358 |
objset_impl_t *osi = arg; |
|
1544 | 359 |
objset_t os; |
2082 | 360 |
int i; |
789 | 361 |
|
362 |
for (i = 0; i < TXG_SIZE; i++) { |
|
363 |
ASSERT(list_head(&osi->os_dirty_dnodes[i]) == NULL); |
|
364 |
ASSERT(list_head(&osi->os_free_dnodes[i]) == NULL); |
|
365 |
} |
|
366 |
||
2082 | 367 |
if (ds && ds->ds_phys->ds_num_children == 0) { |
368 |
VERIFY(0 == dsl_prop_unregister(ds, "checksum", |
|
369 |
checksum_changed_cb, osi)); |
|
370 |
VERIFY(0 == dsl_prop_unregister(ds, "compression", |
|
371 |
compression_changed_cb, osi)); |
|
3835 | 372 |
VERIFY(0 == dsl_prop_unregister(ds, "copies", |
373 |
copies_changed_cb, osi)); |
|
789 | 374 |
} |
375 |
||
1544 | 376 |
/* |
377 |
* We should need only a single pass over the dnode list, since |
|
378 |
* nothing can be added to the list at this point. |
|
379 |
*/ |
|
380 |
os.os = osi; |
|
1646
b4e43ae19fff
6393443 Remove remaining txg_wait_synced() from zfs unmount path.
perrin
parents:
1596
diff
changeset
|
381 |
(void) dmu_objset_evict_dbufs(&os, 0); |
1544 | 382 |
|
789 | 383 |
ASSERT3P(list_head(&osi->os_dnodes), ==, osi->os_meta_dnode); |
384 |
ASSERT3P(list_tail(&osi->os_dnodes), ==, osi->os_meta_dnode); |
|
385 |
ASSERT3P(list_head(&osi->os_meta_dnode->dn_dbufs), ==, NULL); |
|
386 |
||
387 |
dnode_special_close(osi->os_meta_dnode); |
|
388 |
zil_free(osi->os_zil); |
|
389 |
||
3547
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
390 |
VERIFY(arc_buf_remove_ref(osi->os_phys_buf, &osi->os_phys_buf) == 1); |
2856 | 391 |
mutex_destroy(&osi->os_lock); |
392 |
mutex_destroy(&osi->os_obj_lock); |
|
789 | 393 |
kmem_free(osi, sizeof (objset_impl_t)); |
394 |
} |
|
395 |
||
396 |
/* called from dsl for meta-objset */ |
|
397 |
objset_impl_t * |
|
3547
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
398 |
dmu_objset_create_impl(spa_t *spa, dsl_dataset_t *ds, blkptr_t *bp, |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
399 |
dmu_objset_type_t type, dmu_tx_t *tx) |
789 | 400 |
{ |
401 |
objset_impl_t *osi; |
|
402 |
dnode_t *mdn; |
|
403 |
||
404 |
ASSERT(dmu_tx_is_syncing(tx)); |
|
3547
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
405 |
VERIFY(0 == dmu_objset_open_impl(spa, ds, bp, &osi)); |
789 | 406 |
mdn = osi->os_meta_dnode; |
407 |
||
408 |
dnode_allocate(mdn, DMU_OT_DNODE, 1 << DNODE_BLOCK_SHIFT, |
|
409 |
DN_MAX_INDBLKSHIFT, DMU_OT_NONE, 0, tx); |
|
410 |
||
411 |
/* |
|
412 |
* We don't want to have to increase the meta-dnode's nlevels |
|
413 |
* later, because then we could do it in quescing context while |
|
414 |
* we are also accessing it in open context. |
|
415 |
* |
|
416 |
* This precaution is not necessary for the MOS (ds == NULL), |
|
417 |
* because the MOS is only updated in syncing context. |
|
418 |
* This is most fortunate: the MOS is the only objset that |
|
419 |
* needs to be synced multiple times as spa_sync() iterates |
|
420 |
* to convergence, so minimizing its dn_nlevels matters. |
|
421 |
*/ |
|
1544 | 422 |
if (ds != NULL) { |
423 |
int levels = 1; |
|
424 |
||
425 |
/* |
|
426 |
* Determine the number of levels necessary for the meta-dnode |
|
427 |
* to contain DN_MAX_OBJECT dnodes. |
|
428 |
*/ |
|
429 |
while ((uint64_t)mdn->dn_nblkptr << (mdn->dn_datablkshift + |
|
430 |
(levels - 1) * (mdn->dn_indblkshift - SPA_BLKPTRSHIFT)) < |
|
431 |
DN_MAX_OBJECT * sizeof (dnode_phys_t)) |
|
432 |
levels++; |
|
433 |
||
789 | 434 |
mdn->dn_next_nlevels[tx->tx_txg & TXG_MASK] = |
1544 | 435 |
mdn->dn_nlevels = levels; |
436 |
} |
|
789 | 437 |
|
438 |
ASSERT(type != DMU_OST_NONE); |
|
439 |
ASSERT(type != DMU_OST_ANY); |
|
440 |
ASSERT(type < DMU_OST_NUMTYPES); |
|
441 |
osi->os_phys->os_type = type; |
|
442 |
||
443 |
dsl_dataset_dirty(ds, tx); |
|
444 |
||
445 |
return (osi); |
|
446 |
} |
|
447 |
||
448 |
struct oscarg { |
|
4543 | 449 |
void (*userfunc)(objset_t *os, void *arg, cred_t *cr, dmu_tx_t *tx); |
789 | 450 |
void *userarg; |
451 |
dsl_dataset_t *clone_parent; |
|
452 |
const char *lastname; |
|
453 |
dmu_objset_type_t type; |
|
454 |
}; |
|
455 |
||
4543 | 456 |
/*ARGSUSED*/ |
789 | 457 |
static int |
2199 | 458 |
dmu_objset_create_check(void *arg1, void *arg2, dmu_tx_t *tx) |
789 | 459 |
{ |
2199 | 460 |
dsl_dir_t *dd = arg1; |
461 |
struct oscarg *oa = arg2; |
|
462 |
objset_t *mos = dd->dd_pool->dp_meta_objset; |
|
463 |
int err; |
|
464 |
uint64_t ddobj; |
|
465 |
||
466 |
err = zap_lookup(mos, dd->dd_phys->dd_child_dir_zapobj, |
|
467 |
oa->lastname, sizeof (uint64_t), 1, &ddobj); |
|
468 |
if (err != ENOENT) |
|
469 |
return (err ? err : EEXIST); |
|
470 |
||
471 |
if (oa->clone_parent != NULL) { |
|
472 |
/* |
|
473 |
* You can't clone across pools. |
|
474 |
*/ |
|
475 |
if (oa->clone_parent->ds_dir->dd_pool != dd->dd_pool) |
|
476 |
return (EXDEV); |
|
477 |
||
478 |
/* |
|
479 |
* You can only clone snapshots, not the head datasets. |
|
480 |
*/ |
|
481 |
if (oa->clone_parent->ds_phys->ds_num_children == 0) |
|
482 |
return (EINVAL); |
|
483 |
} |
|
4543 | 484 |
|
2199 | 485 |
return (0); |
486 |
} |
|
487 |
||
488 |
static void |
|
4543 | 489 |
dmu_objset_create_sync(void *arg1, void *arg2, cred_t *cr, dmu_tx_t *tx) |
2199 | 490 |
{ |
491 |
dsl_dir_t *dd = arg1; |
|
492 |
struct oscarg *oa = arg2; |
|
789 | 493 |
dsl_dataset_t *ds; |
3547
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
494 |
blkptr_t *bp; |
2199 | 495 |
uint64_t dsobj; |
789 | 496 |
|
497 |
ASSERT(dmu_tx_is_syncing(tx)); |
|
498 |
||
2199 | 499 |
dsobj = dsl_dataset_create_sync(dd, oa->lastname, |
789 | 500 |
oa->clone_parent, tx); |
501 |
||
2199 | 502 |
VERIFY(0 == dsl_dataset_open_obj(dd->dd_pool, dsobj, NULL, |
1544 | 503 |
DS_MODE_STANDARD | DS_MODE_READONLY, FTAG, &ds)); |
3547
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
504 |
bp = dsl_dataset_get_blkptr(ds); |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
505 |
if (BP_IS_HOLE(bp)) { |
789 | 506 |
objset_impl_t *osi; |
507 |
||
508 |
/* This is an empty dmu_objset; not a clone. */ |
|
509 |
osi = dmu_objset_create_impl(dsl_dataset_get_spa(ds), |
|
3547
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
510 |
ds, bp, oa->type, tx); |
789 | 511 |
|
512 |
if (oa->userfunc) |
|
4543 | 513 |
oa->userfunc(&osi->os, oa->userarg, cr, tx); |
789 | 514 |
} |
4543 | 515 |
|
516 |
/* |
|
517 |
* Create create time permission if any? |
|
518 |
*/ |
|
519 |
dsl_deleg_set_create_perms(ds->ds_dir, tx, cr); |
|
520 |
||
521 |
spa_history_internal_log(LOG_DS_CREATE, dd->dd_pool->dp_spa, |
|
522 |
tx, cr, "dataset = %llu", dsobj); |
|
523 |
||
789 | 524 |
dsl_dataset_close(ds, DS_MODE_STANDARD | DS_MODE_READONLY, FTAG); |
525 |
} |
|
526 |
||
527 |
int |
|
528 |
dmu_objset_create(const char *name, dmu_objset_type_t type, |
|
529 |
objset_t *clone_parent, |
|
4543 | 530 |
void (*func)(objset_t *os, void *arg, cred_t *cr, dmu_tx_t *tx), void *arg) |
789 | 531 |
{ |
2199 | 532 |
dsl_dir_t *pdd; |
789 | 533 |
const char *tail; |
534 |
int err = 0; |
|
2199 | 535 |
struct oscarg oa = { 0 }; |
789 | 536 |
|
2199 | 537 |
ASSERT(strchr(name, '@') == NULL); |
538 |
err = dsl_dir_open(name, FTAG, &pdd, &tail); |
|
1544 | 539 |
if (err) |
540 |
return (err); |
|
789 | 541 |
if (tail == NULL) { |
2199 | 542 |
dsl_dir_close(pdd, FTAG); |
789 | 543 |
return (EEXIST); |
544 |
} |
|
545 |
||
546 |
dprintf("name=%s\n", name); |
|
547 |
||
2199 | 548 |
oa.userfunc = func; |
549 |
oa.userarg = arg; |
|
550 |
oa.lastname = tail; |
|
551 |
oa.type = type; |
|
4543 | 552 |
|
2199 | 553 |
if (clone_parent != NULL) { |
789 | 554 |
/* |
2199 | 555 |
* You can't clone to a different type. |
789 | 556 |
*/ |
2199 | 557 |
if (clone_parent->os->os_phys->os_type != type) { |
558 |
dsl_dir_close(pdd, FTAG); |
|
559 |
return (EINVAL); |
|
789 | 560 |
} |
2199 | 561 |
oa.clone_parent = clone_parent->os->os_dsl_dataset; |
789 | 562 |
} |
2199 | 563 |
err = dsl_sync_task_do(pdd->dd_pool, dmu_objset_create_check, |
564 |
dmu_objset_create_sync, pdd, &oa, 5); |
|
565 |
dsl_dir_close(pdd, FTAG); |
|
789 | 566 |
return (err); |
567 |
} |
|
568 |
||
569 |
int |
|
570 |
dmu_objset_destroy(const char *name) |
|
571 |
{ |
|
572 |
objset_t *os; |
|
573 |
int error; |
|
574 |
||
575 |
/* |
|
576 |
* If it looks like we'll be able to destroy it, and there's |
|
577 |
* an unplayed replay log sitting around, destroy the log. |
|
578 |
* It would be nicer to do this in dsl_dataset_destroy_sync(), |
|
579 |
* but the replay log objset is modified in open context. |
|
580 |
*/ |
|
581 |
error = dmu_objset_open(name, DMU_OST_ANY, DS_MODE_EXCLUSIVE, &os); |
|
582 |
if (error == 0) { |
|
1807
35c8b566d7af
6410711 intent log blocks don't get invited to pool parties
bonwick
parents:
1775
diff
changeset
|
583 |
zil_destroy(dmu_objset_zil(os), B_FALSE); |
789 | 584 |
dmu_objset_close(os); |
585 |
} |
|
586 |
||
587 |
return (dsl_dataset_destroy(name)); |
|
588 |
} |
|
589 |
||
590 |
int |
|
591 |
dmu_objset_rollback(const char *name) |
|
592 |
{ |
|
593 |
int err; |
|
594 |
objset_t *os; |
|
595 |
||
2199 | 596 |
err = dmu_objset_open(name, DMU_OST_ANY, |
597 |
DS_MODE_EXCLUSIVE | DS_MODE_INCONSISTENT, &os); |
|
789 | 598 |
if (err == 0) { |
599 |
err = zil_suspend(dmu_objset_zil(os)); |
|
600 |
if (err == 0) |
|
601 |
zil_resume(dmu_objset_zil(os)); |
|
602 |
if (err == 0) { |
|
603 |
/* XXX uncache everything? */ |
|
2199 | 604 |
err = dsl_dataset_rollback(os->os->os_dsl_dataset); |
789 | 605 |
} |
2199 | 606 |
dmu_objset_close(os); |
789 | 607 |
} |
608 |
return (err); |
|
609 |
} |
|
610 |
||
2199 | 611 |
struct snaparg { |
612 |
dsl_sync_task_group_t *dstg; |
|
613 |
char *snapname; |
|
614 |
char failed[MAXPATHLEN]; |
|
4543 | 615 |
boolean_t checkperms; |
2199 | 616 |
}; |
617 |
||
618 |
static int |
|
619 |
dmu_objset_snapshot_one(char *name, void *arg) |
|
620 |
{ |
|
621 |
struct snaparg *sn = arg; |
|
622 |
objset_t *os; |
|
3637
526d8412c163
6402600 administrative actions while doing 'zfs recv' or 'zfs destroy' can cause confusing situation
rm160521
parents:
3547
diff
changeset
|
623 |
dmu_objset_stats_t stat; |
2199 | 624 |
int err; |
625 |
||
626 |
(void) strcpy(sn->failed, name); |
|
627 |
||
4543 | 628 |
/* |
629 |
* Check permissions only when requested. This only applies when |
|
630 |
* doing a recursive snapshot. The permission checks for the starting |
|
631 |
* dataset have already been performed in zfs_secpolicy_snapshot() |
|
632 |
*/ |
|
633 |
if (sn->checkperms == B_TRUE && |
|
634 |
(err = zfs_secpolicy_snapshot_perms(name, CRED()))) |
|
635 |
return (err); |
|
636 |
||
2199 | 637 |
err = dmu_objset_open(name, DMU_OST_ANY, DS_MODE_STANDARD, &os); |
638 |
if (err != 0) |
|
639 |
return (err); |
|
640 |
||
641 |
/* |
|
3637
526d8412c163
6402600 administrative actions while doing 'zfs recv' or 'zfs destroy' can cause confusing situation
rm160521
parents:
3547
diff
changeset
|
642 |
* If the objset is in an inconsistent state, return busy. |
526d8412c163
6402600 administrative actions while doing 'zfs recv' or 'zfs destroy' can cause confusing situation
rm160521
parents:
3547
diff
changeset
|
643 |
*/ |
526d8412c163
6402600 administrative actions while doing 'zfs recv' or 'zfs destroy' can cause confusing situation
rm160521
parents:
3547
diff
changeset
|
644 |
dmu_objset_fast_stat(os, &stat); |
526d8412c163
6402600 administrative actions while doing 'zfs recv' or 'zfs destroy' can cause confusing situation
rm160521
parents:
3547
diff
changeset
|
645 |
if (stat.dds_inconsistent) { |
526d8412c163
6402600 administrative actions while doing 'zfs recv' or 'zfs destroy' can cause confusing situation
rm160521
parents:
3547
diff
changeset
|
646 |
dmu_objset_close(os); |
526d8412c163
6402600 administrative actions while doing 'zfs recv' or 'zfs destroy' can cause confusing situation
rm160521
parents:
3547
diff
changeset
|
647 |
return (EBUSY); |
526d8412c163
6402600 administrative actions while doing 'zfs recv' or 'zfs destroy' can cause confusing situation
rm160521
parents:
3547
diff
changeset
|
648 |
} |
526d8412c163
6402600 administrative actions while doing 'zfs recv' or 'zfs destroy' can cause confusing situation
rm160521
parents:
3547
diff
changeset
|
649 |
|
526d8412c163
6402600 administrative actions while doing 'zfs recv' or 'zfs destroy' can cause confusing situation
rm160521
parents:
3547
diff
changeset
|
650 |
/* |
2199 | 651 |
* NB: we need to wait for all in-flight changes to get to disk, |
652 |
* so that we snapshot those changes. zil_suspend does this as |
|
653 |
* a side effect. |
|
654 |
*/ |
|
655 |
err = zil_suspend(dmu_objset_zil(os)); |
|
656 |
if (err == 0) { |
|
657 |
dsl_sync_task_create(sn->dstg, dsl_dataset_snapshot_check, |
|
658 |
dsl_dataset_snapshot_sync, os, sn->snapname, 3); |
|
3637
526d8412c163
6402600 administrative actions while doing 'zfs recv' or 'zfs destroy' can cause confusing situation
rm160521
parents:
3547
diff
changeset
|
659 |
} else { |
526d8412c163
6402600 administrative actions while doing 'zfs recv' or 'zfs destroy' can cause confusing situation
rm160521
parents:
3547
diff
changeset
|
660 |
dmu_objset_close(os); |
2199 | 661 |
} |
3637
526d8412c163
6402600 administrative actions while doing 'zfs recv' or 'zfs destroy' can cause confusing situation
rm160521
parents:
3547
diff
changeset
|
662 |
|
2199 | 663 |
return (err); |
664 |
} |
|
665 |
||
666 |
int |
|
667 |
dmu_objset_snapshot(char *fsname, char *snapname, boolean_t recursive) |
|
668 |
{ |
|
669 |
dsl_sync_task_t *dst; |
|
670 |
struct snaparg sn = { 0 }; |
|
671 |
spa_t *spa; |
|
672 |
int err; |
|
673 |
||
674 |
(void) strcpy(sn.failed, fsname); |
|
675 |
||
4603
c7840c367d00
6494569 zfs recv -d pool/<doesn't exist> core dumps for top-level filesystem backups
ahrens
parents:
4543
diff
changeset
|
676 |
err = spa_open(fsname, &spa, FTAG); |
2199 | 677 |
if (err) |
678 |
return (err); |
|
679 |
||
680 |
sn.dstg = dsl_sync_task_group_create(spa_get_dsl(spa)); |
|
681 |
sn.snapname = snapname; |
|
682 |
||
2417 | 683 |
if (recursive) { |
4543 | 684 |
sn.checkperms = B_TRUE; |
2417 | 685 |
err = dmu_objset_find(fsname, |
686 |
dmu_objset_snapshot_one, &sn, DS_FIND_CHILDREN); |
|
687 |
} else { |
|
4543 | 688 |
sn.checkperms = B_FALSE; |
2199 | 689 |
err = dmu_objset_snapshot_one(fsname, &sn); |
2417 | 690 |
} |
2199 | 691 |
|
692 |
if (err) |
|
693 |
goto out; |
|
694 |
||
695 |
err = dsl_sync_task_group_wait(sn.dstg); |
|
696 |
||
697 |
for (dst = list_head(&sn.dstg->dstg_tasks); dst; |
|
698 |
dst = list_next(&sn.dstg->dstg_tasks, dst)) { |
|
699 |
objset_t *os = dst->dst_arg1; |
|
700 |
if (dst->dst_err) |
|
701 |
dmu_objset_name(os, sn.failed); |
|
702 |
zil_resume(dmu_objset_zil(os)); |
|
703 |
dmu_objset_close(os); |
|
704 |
} |
|
705 |
out: |
|
706 |
if (err) |
|
707 |
(void) strcpy(fsname, sn.failed); |
|
708 |
dsl_sync_task_group_destroy(sn.dstg); |
|
709 |
spa_close(spa, FTAG); |
|
710 |
return (err); |
|
711 |
} |
|
712 |
||
789 | 713 |
static void |
3547
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
714 |
dmu_objset_sync_dnodes(list_t *list, dmu_tx_t *tx) |
789 | 715 |
{ |
3547
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
716 |
dnode_t *dn; |
789 | 717 |
|
3547
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
718 |
while (dn = list_head(list)) { |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
719 |
ASSERT(dn->dn_object != DMU_META_DNODE_OBJECT); |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
720 |
ASSERT(dn->dn_dbuf->db_data_pending); |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
721 |
/* |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
722 |
* Initialize dn_zio outside dnode_sync() |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
723 |
* to accomodate meta-dnode |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
724 |
*/ |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
725 |
dn->dn_zio = dn->dn_dbuf->db_data_pending->dr_zio; |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
726 |
ASSERT(dn->dn_zio); |
789 | 727 |
|
3547
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
728 |
ASSERT3U(dn->dn_nlevels, <=, DN_MAX_LEVELS); |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
729 |
list_remove(list, dn); |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
730 |
dnode_sync(dn, tx); |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
731 |
} |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
732 |
} |
2981 | 733 |
|
3547
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
734 |
/* ARGSUSED */ |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
735 |
static void |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
736 |
ready(zio_t *zio, arc_buf_t *abuf, void *arg) |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
737 |
{ |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
738 |
objset_impl_t *os = arg; |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
739 |
blkptr_t *bp = os->os_rootbp; |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
740 |
dnode_phys_t *dnp = &os->os_phys->os_meta_dnode; |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
741 |
int i; |
2981 | 742 |
|
3547
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
743 |
/* |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
744 |
* Update rootbp fill count. |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
745 |
*/ |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
746 |
bp->blk_fill = 1; /* count the meta-dnode */ |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
747 |
for (i = 0; i < dnp->dn_nblkptr; i++) |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
748 |
bp->blk_fill += dnp->dn_blkptr[i].blk_fill; |
789 | 749 |
} |
750 |
||
751 |
/* ARGSUSED */ |
|
752 |
static void |
|
753 |
killer(zio_t *zio, arc_buf_t *abuf, void *arg) |
|
754 |
{ |
|
755 |
objset_impl_t *os = arg; |
|
756 |
||
757 |
ASSERT3U(zio->io_error, ==, 0); |
|
758 |
||
759 |
BP_SET_TYPE(zio->io_bp, DMU_OT_OBJSET); |
|
760 |
BP_SET_LEVEL(zio->io_bp, 0); |
|
761 |
||
762 |
if (!DVA_EQUAL(BP_IDENTITY(zio->io_bp), |
|
763 |
BP_IDENTITY(&zio->io_bp_orig))) { |
|
3547
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
764 |
if (zio->io_bp_orig.blk_birth == os->os_synctx->tx_txg) |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
765 |
dsl_dataset_block_kill(os->os_dsl_dataset, |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
766 |
&zio->io_bp_orig, NULL, os->os_synctx); |
789 | 767 |
dsl_dataset_block_born(os->os_dsl_dataset, zio->io_bp, |
768 |
os->os_synctx); |
|
769 |
} |
|
3547
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
770 |
arc_release(os->os_phys_buf, &os->os_phys_buf); |
789 | 771 |
} |
772 |
||
773 |
/* called from dsl */ |
|
774 |
void |
|
3547
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
775 |
dmu_objset_sync(objset_impl_t *os, zio_t *pio, dmu_tx_t *tx) |
789 | 776 |
{ |
777 |
int txgoff; |
|
1544 | 778 |
zbookmark_t zb; |
3547
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
779 |
zio_t *zio; |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
780 |
list_t *list; |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
781 |
dbuf_dirty_record_t *dr; |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
782 |
|
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
783 |
dprintf_ds(os->os_dsl_dataset, "txg=%llu\n", tx->tx_txg); |
789 | 784 |
|
785 |
ASSERT(dmu_tx_is_syncing(tx)); |
|
786 |
/* XXX the write_done callback should really give us the tx... */ |
|
787 |
os->os_synctx = tx; |
|
788 |
||
3882 | 789 |
if (os->os_dsl_dataset == NULL) { |
790 |
/* |
|
791 |
* This is the MOS. If we have upgraded, |
|
792 |
* spa_max_replication() could change, so reset |
|
793 |
* os_copies here. |
|
794 |
*/ |
|
795 |
os->os_copies = spa_max_replication(os->os_spa); |
|
796 |
} |
|
797 |
||
3547
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
798 |
/* |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
799 |
* Create the root block IO |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
800 |
*/ |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
801 |
zb.zb_objset = os->os_dsl_dataset ? os->os_dsl_dataset->ds_object : 0; |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
802 |
zb.zb_object = 0; |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
803 |
zb.zb_level = -1; |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
804 |
zb.zb_blkid = 0; |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
805 |
if (BP_IS_OLDER(os->os_rootbp, tx->tx_txg)) |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
806 |
dsl_dataset_block_kill(os->os_dsl_dataset, |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
807 |
os->os_rootbp, pio, tx); |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
808 |
zio = arc_write(pio, os->os_spa, os->os_md_checksum, |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
809 |
os->os_md_compress, |
3835 | 810 |
dmu_get_replication_level(os, &zb, DMU_OT_OBJSET), |
3547
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
811 |
tx->tx_txg, os->os_rootbp, os->os_phys_buf, ready, killer, os, |
4634
39bfb9e90d34
6437054 vdev_cache wises up: increase DB performance by 16%
ek110237
parents:
4603
diff
changeset
|
812 |
ZIO_PRIORITY_ASYNC_WRITE, ZIO_FLAG_MUSTSUCCEED | ZIO_FLAG_METADATA, |
39bfb9e90d34
6437054 vdev_cache wises up: increase DB performance by 16%
ek110237
parents:
4603
diff
changeset
|
813 |
&zb); |
3547
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
814 |
|
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
815 |
/* |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
816 |
* Sync meta-dnode - the parent IO for the sync is the root block |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
817 |
*/ |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
818 |
os->os_meta_dnode->dn_zio = zio; |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
819 |
dnode_sync(os->os_meta_dnode, tx); |
789 | 820 |
|
821 |
txgoff = tx->tx_txg & TXG_MASK; |
|
822 |
||
3547
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
823 |
dmu_objset_sync_dnodes(&os->os_free_dnodes[txgoff], tx); |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
824 |
dmu_objset_sync_dnodes(&os->os_dirty_dnodes[txgoff], tx); |
789 | 825 |
|
3547
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
826 |
list = &os->os_meta_dnode->dn_dirty_records[txgoff]; |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
827 |
while (dr = list_head(list)) { |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
828 |
ASSERT(dr->dr_dbuf->db_level == 0); |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
829 |
list_remove(list, dr); |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
830 |
if (dr->dr_zio) |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
831 |
zio_nowait(dr->dr_zio); |
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
832 |
} |
789 | 833 |
/* |
834 |
* Free intent log blocks up to this tx. |
|
835 |
*/ |
|
836 |
zil_sync(os->os_zil, tx); |
|
3547
e396e0a440b1
6512391 DMU should leverage ZIO dependencies to achieve greater parallelism
maybee
parents:
3290
diff
changeset
|
837 |
zio_nowait(zio); |
789 | 838 |
} |
839 |
||
840 |
void |
|
2885 | 841 |
dmu_objset_space(objset_t *os, uint64_t *refdbytesp, uint64_t *availbytesp, |
842 |
uint64_t *usedobjsp, uint64_t *availobjsp) |
|
843 |
{ |
|
844 |
dsl_dataset_space(os->os->os_dsl_dataset, refdbytesp, availbytesp, |
|
845 |
usedobjsp, availobjsp); |
|
846 |
} |
|
847 |
||
848 |
uint64_t |
|
849 |
dmu_objset_fsid_guid(objset_t *os) |
|
850 |
{ |
|
851 |
return (dsl_dataset_fsid_guid(os->os->os_dsl_dataset)); |
|
852 |
} |
|
853 |
||
854 |
void |
|
855 |
dmu_objset_fast_stat(objset_t *os, dmu_objset_stats_t *stat) |
|
789 | 856 |
{ |
2885 | 857 |
stat->dds_type = os->os->os_phys->os_type; |
858 |
if (os->os->os_dsl_dataset) |
|
859 |
dsl_dataset_fast_stat(os->os->os_dsl_dataset, stat); |
|
860 |
} |
|
861 |
||
862 |
void |
|
863 |
dmu_objset_stats(objset_t *os, nvlist_t *nv) |
|
864 |
{ |
|
865 |
ASSERT(os->os->os_dsl_dataset || |
|
866 |
os->os->os_phys->os_type == DMU_OST_META); |
|
867 |
||
868 |
if (os->os->os_dsl_dataset != NULL) |
|
869 |
dsl_dataset_stats(os->os->os_dsl_dataset, nv); |
|
870 |
||
871 |
dsl_prop_nvlist_add_uint64(nv, ZFS_PROP_TYPE, |
|
872 |
os->os->os_phys->os_type); |
|
789 | 873 |
} |
874 |
||
875 |
int |
|
876 |
dmu_objset_is_snapshot(objset_t *os) |
|
877 |
{ |
|
878 |
if (os->os->os_dsl_dataset != NULL) |
|
879 |
return (dsl_dataset_is_snapshot(os->os->os_dsl_dataset)); |
|
880 |
else |
|
881 |
return (B_FALSE); |
|
882 |
} |
|
883 |
||
884 |
int |
|
885 |
dmu_snapshot_list_next(objset_t *os, int namelen, char *name, |
|
885
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
886 |
uint64_t *idp, uint64_t *offp) |
789 | 887 |
{ |
888 |
dsl_dataset_t *ds = os->os->os_dsl_dataset; |
|
889 |
zap_cursor_t cursor; |
|
890 |
zap_attribute_t attr; |
|
891 |
||
892 |
if (ds->ds_phys->ds_snapnames_zapobj == 0) |
|
893 |
return (ENOENT); |
|
894 |
||
895 |
zap_cursor_init_serialized(&cursor, |
|
896 |
ds->ds_dir->dd_pool->dp_meta_objset, |
|
897 |
ds->ds_phys->ds_snapnames_zapobj, *offp); |
|
898 |
||
885
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
899 |
if (zap_cursor_retrieve(&cursor, &attr) != 0) { |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
900 |
zap_cursor_fini(&cursor); |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
901 |
return (ENOENT); |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
902 |
} |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
903 |
|
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
904 |
if (strlen(attr.za_name) + 1 > namelen) { |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
905 |
zap_cursor_fini(&cursor); |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
906 |
return (ENAMETOOLONG); |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
907 |
} |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
908 |
|
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
909 |
(void) strcpy(name, attr.za_name); |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
910 |
if (idp) |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
911 |
*idp = attr.za_first_integer; |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
912 |
zap_cursor_advance(&cursor); |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
913 |
*offp = zap_cursor_serialize(&cursor); |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
914 |
zap_cursor_fini(&cursor); |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
915 |
|
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
916 |
return (0); |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
917 |
} |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
918 |
|
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
919 |
int |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
920 |
dmu_dir_list_next(objset_t *os, int namelen, char *name, |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
921 |
uint64_t *idp, uint64_t *offp) |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
922 |
{ |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
923 |
dsl_dir_t *dd = os->os->os_dsl_dataset->ds_dir; |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
924 |
zap_cursor_t cursor; |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
925 |
zap_attribute_t attr; |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
926 |
|
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
927 |
/* there is no next dir on a snapshot! */ |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
928 |
if (os->os->os_dsl_dataset->ds_object != |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
929 |
dd->dd_phys->dd_head_dataset_obj) |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
930 |
return (ENOENT); |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
931 |
|
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
932 |
zap_cursor_init_serialized(&cursor, |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
933 |
dd->dd_pool->dp_meta_objset, |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
934 |
dd->dd_phys->dd_child_dir_zapobj, *offp); |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
935 |
|
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
936 |
if (zap_cursor_retrieve(&cursor, &attr) != 0) { |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
937 |
zap_cursor_fini(&cursor); |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
938 |
return (ENOENT); |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
939 |
} |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
940 |
|
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
941 |
if (strlen(attr.za_name) + 1 > namelen) { |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
942 |
zap_cursor_fini(&cursor); |
789 | 943 |
return (ENAMETOOLONG); |
885
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
944 |
} |
789 | 945 |
|
946 |
(void) strcpy(name, attr.za_name); |
|
885
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
947 |
if (idp) |
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
948 |
*idp = attr.za_first_integer; |
789 | 949 |
zap_cursor_advance(&cursor); |
950 |
*offp = zap_cursor_serialize(&cursor); |
|
885
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
951 |
zap_cursor_fini(&cursor); |
789 | 952 |
|
953 |
return (0); |
|
954 |
} |
|
955 |
||
956 |
/* |
|
957 |
* Find all objsets under name, and for each, call 'func(child_name, arg)'. |
|
958 |
*/ |
|
2199 | 959 |
int |
960 |
dmu_objset_find(char *name, int func(char *, void *), void *arg, int flags) |
|
789 | 961 |
{ |
962 |
dsl_dir_t *dd; |
|
963 |
objset_t *os; |
|
964 |
uint64_t snapobj; |
|
965 |
zap_cursor_t zc; |
|
3978
2dd668007b7a
6533813 recursive snapshotting resulted in a bad stack overflow
mmusante
parents:
3897
diff
changeset
|
966 |
zap_attribute_t *attr; |
789 | 967 |
char *child; |
1544 | 968 |
int do_self, err; |
789 | 969 |
|
1544 | 970 |
err = dsl_dir_open(name, FTAG, &dd, NULL); |
971 |
if (err) |
|
2199 | 972 |
return (err); |
789 | 973 |
|
2199 | 974 |
/* NB: the $MOS dir doesn't have a head dataset */ |
789 | 975 |
do_self = (dd->dd_phys->dd_head_dataset_obj != 0); |
3978
2dd668007b7a
6533813 recursive snapshotting resulted in a bad stack overflow
mmusante
parents:
3897
diff
changeset
|
976 |
attr = kmem_alloc(sizeof (zap_attribute_t), KM_SLEEP); |
789 | 977 |
|
978 |
/* |
|
979 |
* Iterate over all children. |
|
980 |
*/ |
|
2417 | 981 |
if (flags & DS_FIND_CHILDREN) { |
982 |
for (zap_cursor_init(&zc, dd->dd_pool->dp_meta_objset, |
|
983 |
dd->dd_phys->dd_child_dir_zapobj); |
|
3978
2dd668007b7a
6533813 recursive snapshotting resulted in a bad stack overflow
mmusante
parents:
3897
diff
changeset
|
984 |
zap_cursor_retrieve(&zc, attr) == 0; |
2417 | 985 |
(void) zap_cursor_advance(&zc)) { |
3978
2dd668007b7a
6533813 recursive snapshotting resulted in a bad stack overflow
mmusante
parents:
3897
diff
changeset
|
986 |
ASSERT(attr->za_integer_length == sizeof (uint64_t)); |
2dd668007b7a
6533813 recursive snapshotting resulted in a bad stack overflow
mmusante
parents:
3897
diff
changeset
|
987 |
ASSERT(attr->za_num_integers == 1); |
789 | 988 |
|
2417 | 989 |
/* |
990 |
* No separating '/' because parent's name ends in /. |
|
991 |
*/ |
|
992 |
child = kmem_alloc(MAXPATHLEN, KM_SLEEP); |
|
993 |
/* XXX could probably just use name here */ |
|
994 |
dsl_dir_name(dd, child); |
|
995 |
(void) strcat(child, "/"); |
|
3978
2dd668007b7a
6533813 recursive snapshotting resulted in a bad stack overflow
mmusante
parents:
3897
diff
changeset
|
996 |
(void) strcat(child, attr->za_name); |
2417 | 997 |
err = dmu_objset_find(child, func, arg, flags); |
998 |
kmem_free(child, MAXPATHLEN); |
|
999 |
if (err) |
|
1000 |
break; |
|
1001 |
} |
|
1002 |
zap_cursor_fini(&zc); |
|
2199 | 1003 |
|
2417 | 1004 |
if (err) { |
1005 |
dsl_dir_close(dd, FTAG); |
|
3978
2dd668007b7a
6533813 recursive snapshotting resulted in a bad stack overflow
mmusante
parents:
3897
diff
changeset
|
1006 |
kmem_free(attr, sizeof (zap_attribute_t)); |
2417 | 1007 |
return (err); |
1008 |
} |
|
789 | 1009 |
} |
1010 |
||
1011 |
/* |
|
1012 |
* Iterate over all snapshots. |
|
1013 |
*/ |
|
1014 |
if ((flags & DS_FIND_SNAPSHOTS) && |
|
1015 |
dmu_objset_open(name, DMU_OST_ANY, |
|
1016 |
DS_MODE_STANDARD | DS_MODE_READONLY, &os) == 0) { |
|
1017 |
||
1018 |
snapobj = os->os->os_dsl_dataset->ds_phys->ds_snapnames_zapobj; |
|
1019 |
dmu_objset_close(os); |
|
1020 |
||
1021 |
for (zap_cursor_init(&zc, dd->dd_pool->dp_meta_objset, snapobj); |
|
3978
2dd668007b7a
6533813 recursive snapshotting resulted in a bad stack overflow
mmusante
parents:
3897
diff
changeset
|
1022 |
zap_cursor_retrieve(&zc, attr) == 0; |
789 | 1023 |
(void) zap_cursor_advance(&zc)) { |
3978
2dd668007b7a
6533813 recursive snapshotting resulted in a bad stack overflow
mmusante
parents:
3897
diff
changeset
|
1024 |
ASSERT(attr->za_integer_length == sizeof (uint64_t)); |
2dd668007b7a
6533813 recursive snapshotting resulted in a bad stack overflow
mmusante
parents:
3897
diff
changeset
|
1025 |
ASSERT(attr->za_num_integers == 1); |
789 | 1026 |
|
1027 |
child = kmem_alloc(MAXPATHLEN, KM_SLEEP); |
|
1028 |
/* XXX could probably just use name here */ |
|
1029 |
dsl_dir_name(dd, child); |
|
1030 |
(void) strcat(child, "@"); |
|
3978
2dd668007b7a
6533813 recursive snapshotting resulted in a bad stack overflow
mmusante
parents:
3897
diff
changeset
|
1031 |
(void) strcat(child, attr->za_name); |
2199 | 1032 |
err = func(child, arg); |
789 | 1033 |
kmem_free(child, MAXPATHLEN); |
2199 | 1034 |
if (err) |
1035 |
break; |
|
789 | 1036 |
} |
885
d925b21dba78
6347493 tar of 25K empty directory entries in ZFS takes 30+ seconds ...
ahrens
parents:
789
diff
changeset
|
1037 |
zap_cursor_fini(&zc); |
789 | 1038 |
} |
1039 |
||
1040 |
dsl_dir_close(dd, FTAG); |
|
3978
2dd668007b7a
6533813 recursive snapshotting resulted in a bad stack overflow
mmusante
parents:
3897
diff
changeset
|
1041 |
kmem_free(attr, sizeof (zap_attribute_t)); |
789 | 1042 |
|
2199 | 1043 |
if (err) |
1044 |
return (err); |
|
1045 |
||
789 | 1046 |
/* |
1047 |
* Apply to self if appropriate. |
|
1048 |
*/ |
|
1049 |
if (do_self) |
|
2199 | 1050 |
err = func(name, arg); |
1051 |
return (err); |
|
789 | 1052 |
} |