1 #include <linux/ceph/ceph_debug.h>
5 #include "mds_client.h"
14 * get and set the file layout
/*
 * Handler for CEPH_IOC_GET_LAYOUT: report the file's layout to user space.
 *
 * @file: open file whose inode layout is read
 * @arg:  user pointer that receives a struct ceph_ioctl_layout
 *
 * Calls ceph_do_getattr() on the inode with CEPH_STAT_CAP_LAYOUT, fills a
 * local struct ceph_ioctl_layout from ci->i_layout (stripe unit, stripe
 * count, object size, data pool) and hands it to copy_to_user().
 *
 * NOTE(review): the embedded listing numbers jump (19 -> 22, 22 -> 24,
 * 29 -> 36), so the braces, the declaration of err, whatever tests err,
 * and the return statements are not visible in this excerpt. The return
 * values cannot be confirmed from here.
 */
16 static long ceph_ioctl_get_layout(struct file
*file
, void __user
*arg
)
18 struct ceph_inode_info
*ci
= ceph_inode(file_inode(file
));
19 struct ceph_ioctl_layout l
;
22 err
= ceph_do_getattr(file_inode(file
), CEPH_STAT_CAP_LAYOUT
);
24 l
.stripe_unit
= ceph_file_layout_su(ci
->i_layout
);
25 l
.stripe_count
= ceph_file_layout_stripe_count(ci
->i_layout
);
26 l
.object_size
= ceph_file_layout_object_size(ci
->i_layout
);
/* the pool id is converted with le32_to_cpu() before being reported */
27 l
.data_pool
= le32_to_cpu(ci
->i_layout
.fl_pg_pool
);
/* preferred_osd is not read from the inode; it is always reported as -1 */
28 l
.preferred_osd
= (s32
)-1;
29 if (copy_to_user(arg
, &l
, sizeof(l
)))
/*
 * Check a layout before an MDS request is built from it (both set-layout
 * handlers call this before ceph_mdsc_create_request()).
 *
 * @mdsc: MDS client; its mdsmap supplies the list of data pools
 * @l:    layout to check
 *
 * Striping test: the condition fires when object_size or stripe_unit has
 * any bit of ~PAGE_MASK set, or when stripe_unit is non-zero and
 * object_size (cast to unsigned) is not a multiple of stripe_unit (cast to
 * unsigned).
 *
 * Pool test: between mutex_lock() and mutex_unlock() on mdsc->mutex,
 * l->data_pool is compared against each entry of
 * mdsc->mdsmap->m_data_pg_pools[0 .. m_num_data_pg_pools).
 *
 * NOTE(review): the listing numbers jump (37 -> 41, 45 -> 48, 52 -> 56,
 * 56 -> 63). The declaration of i, the action taken when the striping
 * test fires, the action on a pool match, and all return statements are
 * not visible. Confirm the error codes against the full source.
 */
36 static long __validate_layout(struct ceph_mds_client
*mdsc
,
37 struct ceph_ioctl_layout
*l
)
41 /* validate striping parameters */
42 if ((l
->object_size
& ~PAGE_MASK
) ||
43 (l
->stripe_unit
& ~PAGE_MASK
) ||
44 (l
->stripe_unit
!= 0 &&
45 ((unsigned)l
->object_size
% (unsigned)l
->stripe_unit
)))
48 /* make sure it's a valid data pool */
49 mutex_lock(&mdsc
->mutex
);
51 for (i
= 0; i
< mdsc
->mdsmap
->m_num_data_pg_pools
; i
++)
52 if (mdsc
->mdsmap
->m_data_pg_pools
[i
] == l
->data_pool
) {
56 mutex_unlock(&mdsc
->mutex
);
/*
 * Handler for CEPH_IOC_SET_LAYOUT: ask the MDS to change a file's layout.
 *
 * @file: open file whose layout is to be changed
 * @arg:  user pointer to a struct ceph_ioctl_layout with the new values
 *
 * Visible steps:
 *  1. copy the requested layout from user space into l;
 *  2. call ceph_do_getattr() with CEPH_STAT_CAP_LAYOUT;
 *  3. build nl, a zeroed scratch layout. Each of stripe_count,
 *     stripe_unit, object_size and data_pool is assigned once from l and
 *     once from the inode's current ci->i_layout;
 *  4. pass nl to __validate_layout();
 *  5. create a CEPH_MDS_OP_SETLAYOUT request, fill its layout arguments,
 *     submit it with ceph_mdsc_do_request() and drop the reference with
 *     ceph_mdsc_put_request().
 *
 * NOTE(review): the listing numbers jump throughout (70 -> 73, 73 -> 76,
 * every other line in 81..97, 102 -> 106, 106 -> 110, ...). The
 * declaration of err, the conditionals that choose between the two
 * assignments in step 3, the remaining arguments of
 * ceph_mdsc_create_request(), every error check and every return statement
 * are not visible. Presumably step 3 keeps the user's value when it is
 * non-zero and falls back to the current one otherwise; confirm against
 * the full source.
 */
63 static long ceph_ioctl_set_layout(struct file
*file
, void __user
*arg
)
65 struct inode
*inode
= file_inode(file
);
66 struct ceph_mds_client
*mdsc
= ceph_sb_to_client(inode
->i_sb
)->mdsc
;
67 struct ceph_mds_request
*req
;
68 struct ceph_ioctl_layout l
;
69 struct ceph_inode_info
*ci
= ceph_inode(file_inode(file
));
70 struct ceph_ioctl_layout nl
;
73 if (copy_from_user(&l
, arg
, sizeof(l
)))
76 /* validate changed params against current layout */
77 err
= ceph_do_getattr(file_inode(file
), CEPH_STAT_CAP_LAYOUT
);
81 memset(&nl
, 0, sizeof(nl
));
83 nl
.stripe_count
= l
.stripe_count
;
85 nl
.stripe_count
= ceph_file_layout_stripe_count(ci
->i_layout
);
87 nl
.stripe_unit
= l
.stripe_unit
;
89 nl
.stripe_unit
= ceph_file_layout_su(ci
->i_layout
);
91 nl
.object_size
= l
.object_size
;
93 nl
.object_size
= ceph_file_layout_object_size(ci
->i_layout
);
95 nl
.data_pool
= l
.data_pool
;
97 nl
.data_pool
= ceph_file_layout_pg_pool(ci
->i_layout
);
99 /* this is obsolete, and always -1 */
100 nl
.preferred_osd
= le64_to_cpu(-1);
102 err
= __validate_layout(mdsc
, &nl
);
106 req
= ceph_mdsc_create_request(mdsc
, CEPH_MDS_OP_SETLAYOUT
,
110 req
->r_inode
= inode
;
114 req
->r_inode_drop
= CEPH_CAP_FILE_SHARED
| CEPH_CAP_FILE_EXCL
;
/*
 * The request is filled from l (the values as copied from user space),
 * not from nl; nl is only passed to __validate_layout() above.
 */
116 req
->r_args
.setlayout
.layout
.fl_stripe_unit
=
117 cpu_to_le32(l
.stripe_unit
);
118 req
->r_args
.setlayout
.layout
.fl_stripe_count
=
119 cpu_to_le32(l
.stripe_count
);
120 req
->r_args
.setlayout
.layout
.fl_object_size
=
121 cpu_to_le32(l
.object_size
);
122 req
->r_args
.setlayout
.layout
.fl_pg_pool
= cpu_to_le32(l
.data_pool
);
/* NULL is passed as the second argument here; the policy variant passes inode */
124 err
= ceph_mdsc_do_request(mdsc
, NULL
, req
);
125 ceph_mdsc_put_request(req
);
130 * Set a layout policy on a directory inode. All items in the tree
131 * rooted at this inode will inherit this layout on creation
132 * (it does not apply retroactively),
133 * unless a subdirectory has its own layout policy.
/*
 * Handler for CEPH_IOC_SET_LAYOUT_POLICY: send a layout to the MDS with a
 * CEPH_MDS_OP_SETDIRLAYOUT request.
 *
 * @file: open file; its inode becomes req->r_inode
 * @arg:  user pointer to a struct ceph_ioctl_layout
 *
 * Visible steps: copy the layout from user space into l, pass l itself to
 * __validate_layout(), create the request, fill the four layout arguments
 * from l with cpu_to_le32(), submit with ceph_mdsc_do_request() and drop
 * the reference with ceph_mdsc_put_request().
 *
 * NOTE(review): the listing numbers jump (139 -> 141, 144 -> 147,
 * 147 -> 151, 151 -> 156, 156 -> 160, 170 -> 175). The declaration of err,
 * any check on the inode type, the remaining arguments of
 * ceph_mdsc_create_request(), all error checks and the return statements
 * are not visible in this excerpt.
 */
135 static long ceph_ioctl_set_layout_policy (struct file
*file
, void __user
*arg
)
137 struct inode
*inode
= file_inode(file
);
138 struct ceph_mds_request
*req
;
139 struct ceph_ioctl_layout l
;
141 struct ceph_mds_client
*mdsc
= ceph_sb_to_client(inode
->i_sb
)->mdsc
;
143 /* copy and validate */
144 if (copy_from_user(&l
, arg
, sizeof(l
)))
147 err
= __validate_layout(mdsc
, &l
);
151 req
= ceph_mdsc_create_request(mdsc
, CEPH_MDS_OP_SETDIRLAYOUT
,
156 req
->r_inode
= inode
;
160 req
->r_args
.setlayout
.layout
.fl_stripe_unit
=
161 cpu_to_le32(l
.stripe_unit
);
162 req
->r_args
.setlayout
.layout
.fl_stripe_count
=
163 cpu_to_le32(l
.stripe_count
);
164 req
->r_args
.setlayout
.layout
.fl_object_size
=
165 cpu_to_le32(l
.object_size
);
166 req
->r_args
.setlayout
.layout
.fl_pg_pool
=
167 cpu_to_le32(l
.data_pool
);
/* inode is passed as the second argument here; ceph_ioctl_set_layout passes NULL */
169 err
= ceph_mdsc_do_request(mdsc
, inode
, req
);
170 ceph_mdsc_put_request(req
);
175 * Return object name, size/offset information, and location (OSD
176 * number, network address) for a given file offset.
/*
 * Handler for CEPH_IOC_GET_DATALOC: for the file offset supplied in a
 * struct ceph_ioctl_dataloc, fill in the object and OSD fields of that
 * struct and copy it back to user space.
 *
 * @file: open file being queried
 * @arg:  user pointer to a struct ceph_ioctl_dataloc (read, then written)
 *
 * Visible steps:
 *  1. copy dl in from user space;
 *  2. take osdc->map_sem for reading and call
 *     ceph_calc_file_object_mapping() on ci->i_layout to obtain
 *     dl.object_no and dl.object_offset for dl.file_offset;
 *  3. subtract dl.object_offset from dl.file_offset;
 *  4. set dl.object_size and dl.block_size from the layout, and
 *     dl.block_offset to the value do_div() returns for
 *     object_offset / block_size;
 *  5. format dl.object_name as "%llx.%08llx" from ceph_ino(inode) and
 *     dl.object_no;
 *  6. map pool + object name to a placement group with
 *     ceph_oloc_oid_to_pg(), and set dl.osd from ceph_calc_pg_primary();
 *  7. set dl.osd_addr either by memcpy() from the address returned by
 *     ceph_osd_addr() or by zeroing it with memset();
 *  8. release osdc->map_sem and copy dl back to user space.
 *
 * NOTE(review): the listing numbers jump (186 -> 192, 198 -> 201,
 * 201 -> 204, 218 -> 220, 220 -> 224, ...). The declarations of len, tmp,
 * pgid and r, the last argument of ceph_calc_file_object_mapping(), the
 * conditions guarding the three up_read() calls and the memcpy()/memset()
 * choice, and all return statements are not visible. Presumably the first
 * two up_read() calls sit on error paths; confirm against the full source.
 */
178 static long ceph_ioctl_get_dataloc(struct file
*file
, void __user
*arg
)
180 struct ceph_ioctl_dataloc dl
;
181 struct inode
*inode
= file_inode(file
);
182 struct ceph_inode_info
*ci
= ceph_inode(inode
);
183 struct ceph_osd_client
*osdc
=
184 &ceph_sb_to_client(inode
->i_sb
)->client
->osdc
;
185 struct ceph_object_locator oloc
;
186 struct ceph_object_id oid
;
192 /* copy and validate */
193 if (copy_from_user(&dl
, arg
, sizeof(dl
)))
196 down_read(&osdc
->map_sem
);
197 r
= ceph_calc_file_object_mapping(&ci
->i_layout
, dl
.file_offset
, len
,
198 &dl
.object_no
, &dl
.object_offset
,
201 up_read(&osdc
->map_sem
);
/* file_offset is reduced by the offset within the object */
204 dl
.file_offset
-= dl
.object_offset
;
205 dl
.object_size
= ceph_file_layout_object_size(ci
->i_layout
);
206 dl
.block_size
= ceph_file_layout_su(ci
->i_layout
);
208 /* block_offset = object_offset % block_size */
/* do_div() works on a scratch copy (tmp) so dl.object_offset is not passed to it */
209 tmp
= dl
.object_offset
;
210 dl
.block_offset
= do_div(tmp
, dl
.block_size
);
212 snprintf(dl
.object_name
, sizeof(dl
.object_name
), "%llx.%08llx",
213 ceph_ino(inode
), dl
.object_no
);
215 oloc
.pool
= ceph_file_layout_pg_pool(ci
->i_layout
);
216 ceph_oid_set_name(&oid
, dl
.object_name
);
218 r
= ceph_oloc_oid_to_pg(osdc
->osdmap
, &oloc
, &oid
, &pgid
);
220 up_read(&osdc
->map_sem
);
224 dl
.osd
= ceph_calc_pg_primary(osdc
->osdmap
, pgid
);
226 struct ceph_entity_addr
*a
=
227 ceph_osd_addr(osdc
->osdmap
, dl
.osd
);
229 memcpy(&dl
.osd_addr
, &a
->in_addr
, sizeof(dl
.osd_addr
));
231 memset(&dl
.osd_addr
, 0, sizeof(dl
.osd_addr
));
233 up_read(&osdc
->map_sem
);
235 /* send result back to user */
236 if (copy_to_user(arg
, &dl
, sizeof(dl
)))
/*
 * Handler for CEPH_IOC_LAZYIO: mark this open file as lazy.
 *
 * @file: open file; file->private_data is its struct ceph_file_info
 *
 * When CEPH_FILE_MODE_LAZY is not yet set in fi->fmode, the code takes
 * ci->i_ceph_lock, decrements ci->i_nr_by_mode[] for the old fmode, sets
 * the lazy bit, increments ci->i_nr_by_mode[] for the new fmode, and
 * releases the lock. It then logs the change and calls
 * ceph_check_caps(ci, 0, NULL). A second dout() reports "already lazy".
 *
 * NOTE(review): the listing numbers jump (246 -> 248, 254 -> 256,
 * 256 -> 258, 258 -> 263). The line joining the two branches (presumably
 * an else) and the return statement are not visible. The debug strings
 * spell the name "layzio"; they are runtime text and are left unchanged.
 */
242 static long ceph_ioctl_lazyio(struct file
*file
)
244 struct ceph_file_info
*fi
= file
->private_data
;
245 struct inode
*inode
= file_inode(file
);
246 struct ceph_inode_info
*ci
= ceph_inode(inode
);
248 if ((fi
->fmode
& CEPH_FILE_MODE_LAZY
) == 0) {
249 spin_lock(&ci
->i_ceph_lock
);
/* move this file's count from the old-mode slot to the new-mode slot */
250 ci
->i_nr_by_mode
[fi
->fmode
]--;
251 fi
->fmode
|= CEPH_FILE_MODE_LAZY
;
252 ci
->i_nr_by_mode
[fi
->fmode
]++;
253 spin_unlock(&ci
->i_ceph_lock
);
254 dout("ioctl_layzio: file %p marked lazy\n", file
);
256 ceph_check_caps(ci
, 0, NULL
);
258 dout("ioctl_layzio: file %p already lazy\n", file
);
/*
 * Handler for CEPH_IOC_SYNCIO: set CEPH_F_SYNC in the flags of this open
 * file's struct ceph_file_info (file->private_data).
 *
 * @file: open file to flag
 *
 * NOTE(review): the return statement is on a line missing from this
 * listing (numbers jump 267 -> 271).
 */
263 static long ceph_ioctl_syncio(struct file
*file
)
265 struct ceph_file_info
*fi
= file
->private_data
;
267 fi
->flags
|= CEPH_F_SYNC
;
/*
 * ioctl entry point: log the call with dout() and route each CEPH_IOC_*
 * command to its handler.
 *
 * @file: open file the ioctl was issued on
 * @cmd:  ioctl command number
 * @arg:  raw ioctl argument; cast to a user pointer for the handlers that
 *        take one (GET_LAYOUT, SET_LAYOUT, SET_LAYOUT_POLICY, GET_DATALOC).
 *        The LAZYIO and SYNCIO handlers receive only @file.
 *
 * Each visible case returns its handler's result directly.
 *
 * NOTE(review): the switch line, any default/unknown-command handling and
 * the closing lines of the function are not visible in this excerpt.
 */
271 long ceph_ioctl(struct file
*file
, unsigned int cmd
, unsigned long arg
)
273 dout("ioctl file %p cmd %u arg %lu\n", file
, cmd
, arg
);
275 case CEPH_IOC_GET_LAYOUT
:
276 return ceph_ioctl_get_layout(file
, (void __user
*)arg
);
278 case CEPH_IOC_SET_LAYOUT
:
279 return ceph_ioctl_set_layout(file
, (void __user
*)arg
);
281 case CEPH_IOC_SET_LAYOUT_POLICY
:
282 return ceph_ioctl_set_layout_policy(file
, (void __user
*)arg
);
284 case CEPH_IOC_GET_DATALOC
:
285 return ceph_ioctl_get_dataloc(file
, (void __user
*)arg
);
287 case CEPH_IOC_LAZYIO
:
288 return ceph_ioctl_lazyio(file
);
290 case CEPH_IOC_SYNCIO
:
291 return ceph_ioctl_syncio(file
);